From 3ef7527be7724dbaa129d155842ff047dfe414c2 Mon Sep 17 00:00:00 2001 From: ModelHub XC Date: Fri, 12 Jun 2026 22:04:12 +0800 Subject: [PATCH] =?UTF-8?q?=E5=88=9D=E5=A7=8B=E5=8C=96=E9=A1=B9=E7=9B=AE?= =?UTF-8?q?=EF=BC=8C=E7=94=B1ModelHub=20XC=E7=A4=BE=E5=8C=BA=E6=8F=90?= =?UTF-8?q?=E4=BE=9B=E6=A8=A1=E5=9E=8B?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Model: laion/openthoughts-4-code-qwen3-32b-annotated-32k_qwen2.5-1.5B_32k Source: Original Platform --- .gitattributes | 53 + README.md | 61 + added_tokens.json | 24 + all_results.json | 16 + chat_template.jinja | 54 + config.json | 58 + configuration.json | 1 + generation_config.json | 14 + merges.txt | 3 + model.safetensors | 3 + run_summary.json | 12 + special_tokens_map.json | 31 + tokenizer.json | 3 + tokenizer_config.json | 208 + train_results.json | 16 + trainer_log.jsonl | 1521 ++++ trainer_state.json | 16525 ++++++++++++++++++++++++++++++++++++++ training_args.bin | 3 + training_loss.png | Bin 0 -> 48904 bytes vocab.json | 3 + 20 files changed, 18609 insertions(+) create mode 100644 .gitattributes create mode 100644 README.md create mode 100644 added_tokens.json create mode 100644 all_results.json create mode 100644 chat_template.jinja create mode 100644 config.json create mode 100644 configuration.json create mode 100644 generation_config.json create mode 100644 merges.txt create mode 100644 model.safetensors create mode 100644 run_summary.json create mode 100644 special_tokens_map.json create mode 100644 tokenizer.json create mode 100644 tokenizer_config.json create mode 100644 train_results.json create mode 100644 trainer_log.jsonl create mode 100644 trainer_state.json create mode 100644 training_args.bin create mode 100644 training_loss.png create mode 100644 vocab.json diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..506927c --- /dev/null +++ b/.gitattributes @@ -0,0 +1,53 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text + + +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zstandard filter=lfs diff=lfs merge=lfs -text +*.tfevents* filter=lfs diff=lfs merge=lfs -text +*.db* filter=lfs diff=lfs merge=lfs -text +*.ark* filter=lfs diff=lfs merge=lfs -text +**/*ckpt*data* filter=lfs diff=lfs merge=lfs -text +**/*ckpt*.meta filter=lfs diff=lfs merge=lfs -text +**/*ckpt*.index filter=lfs diff=lfs merge=lfs -text + +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.gguf* filter=lfs diff=lfs merge=lfs -text +*.ggml filter=lfs diff=lfs merge=lfs -text +*.llamafile* filter=lfs diff=lfs merge=lfs -text +*.pt2 filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text + +merges.txt filter=lfs diff=lfs merge=lfs -text +model.safetensors filter=lfs diff=lfs merge=lfs -text +tokenizer.json filter=lfs diff=lfs merge=lfs -text +training_args.bin filter=lfs diff=lfs merge=lfs -text +vocab.json filter=lfs diff=lfs merge=lfs -text \ No newline at end of file diff --git a/README.md b/README.md new file mode 100644 index 0000000..eca2ed9 --- /dev/null +++ b/README.md @@ -0,0 +1,61 @@ +--- +library_name: transformers +license: apache-2.0 +base_model: Qwen/Qwen2.5-1.5B-Instruct +tags: +- llama-factory +- full +- generated_from_trainer +model-index: +- name: openthoughts-4-code-qwen3-32b-annotated-32k_qwen2.5-1.5B_32k + results: [] +datasets: +- laion/openthoughts-4-code-qwen3-32b-32k-annotated +--- + + + +# Openthoughts-4-code-qwen3-32b-annotated-32k_qwen2.5-1.5B_32k + +This model is a fine-tuned version of [Qwen/Qwen2.5-1.5B-Instruct](https://huggingface.co/Qwen/Qwen2.5-1.5B-Instruct) on the laion/Qwen3-32B_hero_run_4_code_32k-sharegpt dataset. + +## Model description + +More information needed + +## Intended uses & limitations + +More information needed + +## Training and evaluation data + +More information needed + +## Training procedure + +### Training hyperparameters + +The following hyperparameters were used during training: +- learning_rate: 0.00015 +- train_batch_size: 1 +- eval_batch_size: 8 +- seed: 42 +- distributed_type: multi-GPU +- num_devices: 256 +- total_train_batch_size: 256 +- total_eval_batch_size: 2048 +- optimizer: Use OptimizerNames.ADAMW_TORCH_FUSED with betas=(0.9,0.99) and epsilon=1e-08 and optimizer_args=No additional optimizer arguments +- lr_scheduler_type: cosine +- lr_scheduler_warmup_ratio: 0.1 +- num_epochs: 2.0 + +### Training results + + +### Framework versions + +- Transformers 4.55.0 +- Pytorch 2.7.1+cu128 +- Datasets 3.6.0 +- Tokenizers 0.21.1 \ No newline at end of file diff --git a/added_tokens.json b/added_tokens.json new file mode 100644 index 0000000..482ced4 --- /dev/null +++ b/added_tokens.json @@ -0,0 +1,24 @@ +{ + "": 151658, + "": 151657, + "<|box_end|>": 151649, + "<|box_start|>": 151648, + "<|endoftext|>": 151643, + "<|file_sep|>": 151664, + "<|fim_middle|>": 151660, + "<|fim_pad|>": 151662, + "<|fim_prefix|>": 151659, + "<|fim_suffix|>": 151661, + "<|im_end|>": 151645, + "<|im_start|>": 151644, + "<|image_pad|>": 151655, + "<|object_ref_end|>": 151647, + "<|object_ref_start|>": 151646, + "<|quad_end|>": 151651, + "<|quad_start|>": 151650, + "<|repo_name|>": 151663, + "<|video_pad|>": 151656, + "<|vision_end|>": 151653, + "<|vision_pad|>": 151654, + "<|vision_start|>": 151652 +} diff --git a/all_results.json b/all_results.json new file mode 100644 index 0000000..4e5b86b --- /dev/null +++ b/all_results.json @@ -0,0 +1,16 @@ +{ + "achieved_tflops_per_gpu": 0.005619164353050912, + "achieved_tflops_per_gpu_theoretical": 323.025179674411, + "epoch": 2.0, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6287916302680969, + "mfu_percent": 0.001801014215721446, + "mfu_percent_theoretical": 103.53371143410608, + "total_flos": 2.788441056922829e+16, + "train_loss": 0.21610206831669151, + "train_runtime": 19384.2842, + "train_samples_per_second": 98.968, + "train_steps_per_second": 0.387, + "valid_targets_mean": 15631.9, + "valid_targets_min": 505 +} \ No newline at end of file diff --git a/chat_template.jinja b/chat_template.jinja new file mode 100644 index 0000000..bdf7919 --- /dev/null +++ b/chat_template.jinja @@ -0,0 +1,54 @@ +{%- if tools %} + {{- '<|im_start|>system\n' }} + {%- if messages[0]['role'] == 'system' %} + {{- messages[0]['content'] }} + {%- else %} + {{- 'You are Qwen, created by Alibaba Cloud. You are a helpful assistant.' }} + {%- endif %} + {{- "\n\n# Tools\n\nYou may call one or more functions to assist with the user query.\n\nYou are provided with function signatures within XML tags:\n" }} + {%- for tool in tools %} + {{- "\n" }} + {{- tool | tojson }} + {%- endfor %} + {{- "\n\n\nFor each function call, return a json object with function name and arguments within XML tags:\n\n{\"name\": , \"arguments\": }\n<|im_end|>\n" }} +{%- else %} + {%- if messages[0]['role'] == 'system' %} + {{- '<|im_start|>system\n' + messages[0]['content'] + '<|im_end|>\n' }} + {%- else %} + {{- '<|im_start|>system\nYou are Qwen, created by Alibaba Cloud. You are a helpful assistant.<|im_end|>\n' }} + {%- endif %} +{%- endif %} +{%- for message in messages %} + {%- if (message.role == "user") or (message.role == "system" and not loop.first) or (message.role == "assistant" and not message.tool_calls) %} + {{- '<|im_start|>' + message.role + '\n' + message.content + '<|im_end|>' + '\n' }} + {%- elif message.role == "assistant" %} + {{- '<|im_start|>' + message.role }} + {%- if message.content %} + {{- '\n' + message.content }} + {%- endif %} + {%- for tool_call in message.tool_calls %} + {%- if tool_call.function is defined %} + {%- set tool_call = tool_call.function %} + {%- endif %} + {{- '\n\n{"name": "' }} + {{- tool_call.name }} + {{- '", "arguments": ' }} + {{- tool_call.arguments | tojson }} + {{- '}\n' }} + {%- endfor %} + {{- '<|im_end|>\n' }} + {%- elif message.role == "tool" %} + {%- if (loop.index0 == 0) or (messages[loop.index0 - 1].role != "tool") %} + {{- '<|im_start|>user' }} + {%- endif %} + {{- '\n\n' }} + {{- message.content }} + {{- '\n' }} + {%- if loop.last or (messages[loop.index0 + 1].role != "tool") %} + {{- '<|im_end|>\n' }} + {%- endif %} + {%- endif %} +{%- endfor %} +{%- if add_generation_prompt %} + {{- '<|im_start|>assistant\n' }} +{%- endif %} diff --git a/config.json b/config.json new file mode 100644 index 0000000..5c4811c --- /dev/null +++ b/config.json @@ -0,0 +1,58 @@ +{ + "architectures": [ + "Qwen2ForCausalLM" + ], + "attention_dropout": 0.0, + "bos_token_id": 151643, + "eos_token_id": 151645, + "hidden_act": "silu", + "hidden_size": 1536, + "initializer_range": 0.02, + "intermediate_size": 8960, + "layer_types": [ + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention" + ], + "max_position_embeddings": 32768, + "max_window_layers": 21, + "model_type": "qwen2", + "num_attention_heads": 12, + "num_hidden_layers": 28, + "num_key_value_heads": 2, + "rms_norm_eps": 1e-06, + "rope_scaling": null, + "rope_theta": 1000000.0, + "sliding_window": null, + "tie_word_embeddings": true, + "torch_dtype": "bfloat16", + "transformers_version": "4.55.0", + "use_cache": false, + "use_sliding_window": false, + "vocab_size": 151936 +} diff --git a/configuration.json b/configuration.json new file mode 100644 index 0000000..bbeeda1 --- /dev/null +++ b/configuration.json @@ -0,0 +1 @@ +{"framework": "pytorch", "task": "text-generation", "allow_remote": true} \ No newline at end of file diff --git a/generation_config.json b/generation_config.json new file mode 100644 index 0000000..2aa6d83 --- /dev/null +++ b/generation_config.json @@ -0,0 +1,14 @@ +{ + "bos_token_id": 151643, + "do_sample": true, + "eos_token_id": [ + 151645, + 151643 + ], + "pad_token_id": 151643, + "repetition_penalty": 1.1, + "temperature": 0.7, + "top_k": 20, + "top_p": 0.8, + "transformers_version": "4.55.0" +} diff --git a/merges.txt b/merges.txt new file mode 100644 index 0000000..80c1a19 --- /dev/null +++ b/merges.txt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8831e4f1a044471340f7c0a83d7bd71306a5b867e95fd870f74d0c5308a904d5 +size 1671853 diff --git a/model.safetensors b/model.safetensors new file mode 100644 index 0000000..8c5c82e --- /dev/null +++ b/model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13529be5451d49b8092868d73ea75d8ae6b27b50b0651a1c609f891419e7bf7a +size 3087467144 diff --git a/run_summary.json b/run_summary.json new file mode 100644 index 0000000..fbf9105 --- /dev/null +++ b/run_summary.json @@ -0,0 +1,12 @@ +{ + "agent_name": null, + "training_start": null, + "training_end": null, + "created_by": "DCAgent", + "base_model_name": "/p/scratch/synthlaion/dc-agent-shared/hf_hub/models--Qwen--Qwen2.5-1.5B-Instruct/snapshots/989aa7980e4cf806f80c7fef2b1adb7bc71aa306", + "dataset_name": "laion/Qwen3-32B_hero_run_4_code_32k-sharegpt", + "training_type": "SFT", + "training_parameters": "https://huggingface.co/mlfoundations-dev/Qwen2.5-1.5B-32k-NODES-64-MBS-1-GAS-1-GBS-256_Qwen2-5-1-5B-Instruct/blob/main/config.json", + "wandb_link": null, + "traces_location_s3": null +} \ No newline at end of file diff --git a/special_tokens_map.json b/special_tokens_map.json new file mode 100644 index 0000000..ac23c0a --- /dev/null +++ b/special_tokens_map.json @@ -0,0 +1,31 @@ +{ + "additional_special_tokens": [ + "<|im_start|>", + "<|im_end|>", + "<|object_ref_start|>", + "<|object_ref_end|>", + "<|box_start|>", + "<|box_end|>", + "<|quad_start|>", + "<|quad_end|>", + "<|vision_start|>", + "<|vision_end|>", + "<|vision_pad|>", + "<|image_pad|>", + "<|video_pad|>" + ], + "eos_token": { + "content": "<|im_end|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false + }, + "pad_token": { + "content": "<|endoftext|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false + } +} diff --git a/tokenizer.json b/tokenizer.json new file mode 100644 index 0000000..51ebb3b --- /dev/null +++ b/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c5ae00e602b8860cbd784ba82a8aa14e8feecec692e7076590d014d7b7fdafa +size 11421896 diff --git a/tokenizer_config.json b/tokenizer_config.json new file mode 100644 index 0000000..a406f80 --- /dev/null +++ b/tokenizer_config.json @@ -0,0 +1,208 @@ +{ + "add_bos_token": false, + "add_prefix_space": false, + "added_tokens_decoder": { + "151643": { + "content": "<|endoftext|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151644": { + "content": "<|im_start|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151645": { + "content": "<|im_end|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151646": { + "content": "<|object_ref_start|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151647": { + "content": "<|object_ref_end|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151648": { + "content": "<|box_start|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151649": { + "content": "<|box_end|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151650": { + "content": "<|quad_start|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151651": { + "content": "<|quad_end|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151652": { + "content": "<|vision_start|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151653": { + "content": "<|vision_end|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151654": { + "content": "<|vision_pad|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151655": { + "content": "<|image_pad|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151656": { + "content": "<|video_pad|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151657": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151658": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151659": { + "content": "<|fim_prefix|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151660": { + "content": "<|fim_middle|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151661": { + "content": "<|fim_suffix|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151662": { + "content": "<|fim_pad|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151663": { + "content": "<|repo_name|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151664": { + "content": "<|file_sep|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + } + }, + "additional_special_tokens": [ + "<|im_start|>", + "<|im_end|>", + "<|object_ref_start|>", + "<|object_ref_end|>", + "<|box_start|>", + "<|box_end|>", + "<|quad_start|>", + "<|quad_end|>", + "<|vision_start|>", + "<|vision_end|>", + "<|vision_pad|>", + "<|image_pad|>", + "<|video_pad|>" + ], + "bos_token": null, + "clean_up_tokenization_spaces": false, + "eos_token": "<|im_end|>", + "errors": "replace", + "extra_special_tokens": {}, + "model_max_length": 32768, + "pad_token": "<|endoftext|>", + "padding_side": "right", + "split_special_tokens": false, + "tokenizer_class": "Qwen2Tokenizer", + "unk_token": null +} diff --git a/train_results.json b/train_results.json new file mode 100644 index 0000000..4e5b86b --- /dev/null +++ b/train_results.json @@ -0,0 +1,16 @@ +{ + "achieved_tflops_per_gpu": 0.005619164353050912, + "achieved_tflops_per_gpu_theoretical": 323.025179674411, + "epoch": 2.0, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6287916302680969, + "mfu_percent": 0.001801014215721446, + "mfu_percent_theoretical": 103.53371143410608, + "total_flos": 2.788441056922829e+16, + "train_loss": 0.21610206831669151, + "train_runtime": 19384.2842, + "train_samples_per_second": 98.968, + "train_steps_per_second": 0.387, + "valid_targets_mean": 15631.9, + "valid_targets_min": 505 +} \ No newline at end of file diff --git a/trainer_log.jsonl b/trainer_log.jsonl new file mode 100644 index 0000000..1c2d834 --- /dev/null +++ b/trainer_log.jsonl @@ -0,0 +1,1521 @@ +{"current_steps": 5, "total_steps": 7494, "loss": 0.9535, "lr": 7.999999999999999e-07, "epoch": 0.0013344008540165466, "percentage": 0.07, "elapsed_time": "0:09:54", "remaining_time": "10 days, 7:16:36"} +{"current_steps": 10, "total_steps": 7494, "loss": 0.9367, "lr": 1.8e-06, "epoch": 0.0026688017080330933, "percentage": 0.13, "elapsed_time": "0:10:25", "remaining_time": "5 days, 10:04:15"} +{"current_steps": 15, "total_steps": 7494, "loss": 0.9145, "lr": 2.8e-06, "epoch": 0.0040032025620496394, "percentage": 0.2, "elapsed_time": "0:10:54", "remaining_time": "3 days, 18:38:35"} +{"current_steps": 20, "total_steps": 7494, "loss": 0.9386, "lr": 3.7999999999999996e-06, "epoch": 0.0053376034160661865, "percentage": 0.27, "elapsed_time": "0:11:58", "remaining_time": "3 days, 2:34:07"} +{"current_steps": 25, "total_steps": 7494, "loss": 0.8995, "lr": 4.8e-06, "epoch": 0.006672004270082733, "percentage": 0.33, "elapsed_time": "0:12:25", "remaining_time": "2 days, 13:53:17"} +{"current_steps": 30, "total_steps": 7494, "loss": 0.9114, "lr": 5.7999999999999995e-06, "epoch": 0.008006405124099279, "percentage": 0.4, "elapsed_time": "0:13:26", "remaining_time": "2 days, 7:44:35"} +{"current_steps": 35, "total_steps": 7494, "loss": 0.8679, "lr": 6.8e-06, "epoch": 0.009340805978115827, "percentage": 0.47, "elapsed_time": "0:14:01", "remaining_time": "2 days, 1:49:40"} +{"current_steps": 40, "total_steps": 7494, "loss": 0.8755, "lr": 7.799999999999998e-06, "epoch": 0.010675206832132373, "percentage": 0.53, "elapsed_time": "0:14:52", "remaining_time": "1 day, 22:11:13"} +{"current_steps": 45, "total_steps": 7494, "loss": 0.8423, "lr": 8.799999999999999e-06, "epoch": 0.01200960768614892, "percentage": 0.6, "elapsed_time": "0:15:19", "remaining_time": "1 day, 18:15:56"} +{"current_steps": 50, "total_steps": 7494, "loss": 0.8624, "lr": 9.799999999999998e-06, "epoch": 0.013344008540165465, "percentage": 0.67, "elapsed_time": "0:15:46", "remaining_time": "1 day, 15:07:50"} +{"current_steps": 55, "total_steps": 7494, "loss": 0.8295, "lr": 1.0799999999999998e-05, "epoch": 0.014678409394182012, "percentage": 0.73, "elapsed_time": "0:16:41", "remaining_time": "1 day, 13:38:17"} +{"current_steps": 60, "total_steps": 7494, "loss": 0.8227, "lr": 1.1799999999999999e-05, "epoch": 0.016012810248198558, "percentage": 0.8, "elapsed_time": "0:17:13", "remaining_time": "1 day, 11:33:33"} +{"current_steps": 65, "total_steps": 7494, "loss": 0.8309, "lr": 1.2799999999999998e-05, "epoch": 0.017347211102215106, "percentage": 0.87, "elapsed_time": "0:17:39", "remaining_time": "1 day, 9:37:59"} +{"current_steps": 70, "total_steps": 7494, "loss": 0.8167, "lr": 1.3799999999999998e-05, "epoch": 0.018681611956231654, "percentage": 0.93, "elapsed_time": "0:18:05", "remaining_time": "1 day, 7:58:33"} +{"current_steps": 75, "total_steps": 7494, "loss": 0.7966, "lr": 1.4799999999999999e-05, "epoch": 0.020016012810248198, "percentage": 1.0, "elapsed_time": "0:19:00", "remaining_time": "1 day, 7:20:55"} +{"current_steps": 80, "total_steps": 7494, "loss": 0.799, "lr": 1.5799999999999998e-05, "epoch": 0.021350413664264746, "percentage": 1.07, "elapsed_time": "0:19:26", "remaining_time": "1 day, 6:01:56"} +{"current_steps": 85, "total_steps": 7494, "loss": 0.7965, "lr": 1.68e-05, "epoch": 0.02268481451828129, "percentage": 1.13, "elapsed_time": "0:19:52", "remaining_time": "1 day, 4:52:47"} +{"current_steps": 90, "total_steps": 7494, "loss": 0.7925, "lr": 1.78e-05, "epoch": 0.02401921537229784, "percentage": 1.2, "elapsed_time": "0:20:28", "remaining_time": "1 day, 4:04:57"} +{"current_steps": 95, "total_steps": 7494, "loss": 0.8008, "lr": 1.8799999999999996e-05, "epoch": 0.025353616226314386, "percentage": 1.27, "elapsed_time": "0:21:17", "remaining_time": "1 day, 3:38:18"} +{"current_steps": 5, "total_steps": 7494, "loss": 0.9535, "lr": 7.999999999999999e-07, "epoch": 0.0013344008540165466, "percentage": 0.07, "elapsed_time": "0:09:25", "remaining_time": "9 days, 19:19:25"} +{"current_steps": 10, "total_steps": 7494, "loss": 0.9367, "lr": 1.8e-06, "epoch": 0.0026688017080330933, "percentage": 0.13, "elapsed_time": "0:09:57", "remaining_time": "5 days, 4:14:02"} +{"current_steps": 15, "total_steps": 7494, "loss": 0.9145, "lr": 2.8e-06, "epoch": 0.0040032025620496394, "percentage": 0.2, "elapsed_time": "0:10:26", "remaining_time": "3 days, 14:42:59"} +{"current_steps": 20, "total_steps": 7494, "loss": 0.9386, "lr": 3.7999999999999996e-06, "epoch": 0.0053376034160661865, "percentage": 0.27, "elapsed_time": "0:11:31", "remaining_time": "2 days, 23:44:40"} +{"current_steps": 25, "total_steps": 7494, "loss": 0.8995, "lr": 4.8e-06, "epoch": 0.006672004270082733, "percentage": 0.33, "elapsed_time": "0:11:57", "remaining_time": "2 days, 11:33:53"} +{"current_steps": 30, "total_steps": 7494, "loss": 0.9114, "lr": 5.7999999999999995e-06, "epoch": 0.008006405124099279, "percentage": 0.4, "elapsed_time": "0:12:23", "remaining_time": "2 days, 3:24:50"} +{"current_steps": 35, "total_steps": 7494, "loss": 0.8679, "lr": 6.8e-06, "epoch": 0.009340805978115827, "percentage": 0.47, "elapsed_time": "0:12:57", "remaining_time": "1 day, 22:01:57"} +{"current_steps": 40, "total_steps": 7494, "loss": 0.8752, "lr": 7.799999999999998e-06, "epoch": 0.010675206832132373, "percentage": 0.53, "elapsed_time": "0:13:51", "remaining_time": "1 day, 19:01:19"} +{"current_steps": 45, "total_steps": 7494, "loss": 0.8419, "lr": 8.799999999999999e-06, "epoch": 0.01200960768614892, "percentage": 0.6, "elapsed_time": "0:14:17", "remaining_time": "1 day, 15:25:01"} +{"current_steps": 50, "total_steps": 7494, "loss": 0.8621, "lr": 9.799999999999998e-06, "epoch": 0.013344008540165465, "percentage": 0.67, "elapsed_time": "0:14:43", "remaining_time": "1 day, 12:31:09"} +{"current_steps": 55, "total_steps": 7494, "loss": 0.8292, "lr": 1.0799999999999998e-05, "epoch": 0.014678409394182012, "percentage": 0.73, "elapsed_time": "0:15:39", "remaining_time": "1 day, 11:17:56"} +{"current_steps": 60, "total_steps": 7494, "loss": 0.8224, "lr": 1.1799999999999999e-05, "epoch": 0.016012810248198558, "percentage": 0.8, "elapsed_time": "0:16:10", "remaining_time": "1 day, 9:23:27"} +{"current_steps": 65, "total_steps": 7494, "loss": 0.8305, "lr": 1.2799999999999998e-05, "epoch": 0.017347211102215106, "percentage": 0.87, "elapsed_time": "0:16:36", "remaining_time": "1 day, 7:37:22"} +{"current_steps": 70, "total_steps": 7494, "loss": 0.8164, "lr": 1.3799999999999998e-05, "epoch": 0.018681611956231654, "percentage": 0.93, "elapsed_time": "0:17:01", "remaining_time": "1 day, 6:05:46"} +{"current_steps": 75, "total_steps": 7494, "loss": 0.7964, "lr": 1.4799999999999999e-05, "epoch": 0.020016012810248198, "percentage": 1.0, "elapsed_time": "0:17:58", "remaining_time": "1 day, 5:38:52"} +{"current_steps": 80, "total_steps": 7494, "loss": 0.7989, "lr": 1.5799999999999998e-05, "epoch": 0.021350413664264746, "percentage": 1.07, "elapsed_time": "0:18:24", "remaining_time": "1 day, 4:26:31"} +{"current_steps": 85, "total_steps": 7494, "loss": 0.7965, "lr": 1.68e-05, "epoch": 0.02268481451828129, "percentage": 1.13, "elapsed_time": "0:19:20", "remaining_time": "1 day, 4:05:52"} +{"current_steps": 90, "total_steps": 7494, "loss": 0.7926, "lr": 1.78e-05, "epoch": 0.02401921537229784, "percentage": 1.2, "elapsed_time": "0:21:49", "remaining_time": "1 day, 5:54:57"} +{"current_steps": 95, "total_steps": 7494, "loss": 0.8009, "lr": 1.8799999999999996e-05, "epoch": 0.025353616226314386, "percentage": 1.27, "elapsed_time": "0:22:39", "remaining_time": "1 day, 5:24:22"} +{"current_steps": 100, "total_steps": 7494, "loss": 0.772, "lr": 1.98e-05, "epoch": 0.02668801708033093, "percentage": 1.33, "elapsed_time": "0:23:04", "remaining_time": "1 day, 4:26:33"} +{"current_steps": 105, "total_steps": 7494, "loss": 0.7746, "lr": 2.0799999999999997e-05, "epoch": 0.02802241793434748, "percentage": 1.4, "elapsed_time": "0:23:35", "remaining_time": "1 day, 3:40:40"} +{"current_steps": 110, "total_steps": 7494, "loss": 0.7691, "lr": 2.1799999999999998e-05, "epoch": 0.029356818788364023, "percentage": 1.47, "elapsed_time": "0:24:28", "remaining_time": "1 day, 3:22:58"} +{"current_steps": 115, "total_steps": 7494, "loss": 0.7771, "lr": 2.28e-05, "epoch": 0.03069121964238057, "percentage": 1.53, "elapsed_time": "0:25:01", "remaining_time": "1 day, 2:45:16"} +{"current_steps": 120, "total_steps": 7494, "loss": 0.7815, "lr": 2.38e-05, "epoch": 0.032025620496397116, "percentage": 1.6, "elapsed_time": "0:25:26", "remaining_time": "1 day, 2:03:28"} +{"current_steps": 125, "total_steps": 7494, "loss": 0.7829, "lr": 2.4799999999999996e-05, "epoch": 0.03336002135041367, "percentage": 1.67, "elapsed_time": "0:25:52", "remaining_time": "1 day, 1:25:02"} +{"current_steps": 130, "total_steps": 7494, "loss": 0.7623, "lr": 2.5799999999999997e-05, "epoch": 0.03469442220443021, "percentage": 1.73, "elapsed_time": "0:26:54", "remaining_time": "1 day, 1:23:55"} +{"current_steps": 135, "total_steps": 7494, "loss": 0.7565, "lr": 2.6799999999999998e-05, "epoch": 0.036028823058446756, "percentage": 1.8, "elapsed_time": "0:27:19", "remaining_time": "1 day, 0:49:39"} +{"current_steps": 140, "total_steps": 7494, "loss": 0.7886, "lr": 2.7799999999999995e-05, "epoch": 0.03736322391246331, "percentage": 1.87, "elapsed_time": "0:27:45", "remaining_time": "1 day, 0:17:43"} +{"current_steps": 145, "total_steps": 7494, "loss": 0.7753, "lr": 2.88e-05, "epoch": 0.03869762476647985, "percentage": 1.93, "elapsed_time": "0:28:17", "remaining_time": "23:53:29"} +{"current_steps": 150, "total_steps": 7494, "loss": 0.7661, "lr": 2.9799999999999996e-05, "epoch": 0.040032025620496396, "percentage": 2.0, "elapsed_time": "0:29:54", "remaining_time": "1 day, 0:24:25"} +{"current_steps": 155, "total_steps": 7494, "loss": 0.7708, "lr": 3.0799999999999996e-05, "epoch": 0.04136642647451294, "percentage": 2.07, "elapsed_time": "0:30:20", "remaining_time": "23:56:17"} +{"current_steps": 160, "total_steps": 7494, "loss": 0.7601, "lr": 3.1799999999999994e-05, "epoch": 0.04270082732852949, "percentage": 2.14, "elapsed_time": "0:30:45", "remaining_time": "23:29:50"} +{"current_steps": 165, "total_steps": 7494, "loss": 0.7435, "lr": 3.28e-05, "epoch": 0.044035228182546036, "percentage": 2.2, "elapsed_time": "0:31:35", "remaining_time": "23:23:23"} +{"current_steps": 170, "total_steps": 7494, "loss": 0.7605, "lr": 3.3799999999999995e-05, "epoch": 0.04536962903656258, "percentage": 2.27, "elapsed_time": "0:32:11", "remaining_time": "23:06:41"} +{"current_steps": 175, "total_steps": 7494, "loss": 0.7376, "lr": 3.48e-05, "epoch": 0.04670402989057913, "percentage": 2.34, "elapsed_time": "0:32:36", "remaining_time": "22:44:00"} +{"current_steps": 180, "total_steps": 7494, "loss": 0.7759, "lr": 3.5799999999999996e-05, "epoch": 0.04803843074459568, "percentage": 2.4, "elapsed_time": "0:33:02", "remaining_time": "22:22:24"} +{"current_steps": 185, "total_steps": 7494, "loss": 0.7487, "lr": 3.679999999999999e-05, "epoch": 0.04937283159861222, "percentage": 2.47, "elapsed_time": "0:34:02", "remaining_time": "22:24:46"} +{"current_steps": 190, "total_steps": 7494, "loss": 0.7693, "lr": 3.78e-05, "epoch": 0.05070723245262877, "percentage": 2.54, "elapsed_time": "0:34:28", "remaining_time": "22:05:24"} +{"current_steps": 195, "total_steps": 7494, "loss": 0.7515, "lr": 3.8799999999999994e-05, "epoch": 0.05204163330664532, "percentage": 2.6, "elapsed_time": "0:34:54", "remaining_time": "21:46:22"} +{"current_steps": 200, "total_steps": 7494, "loss": 0.751, "lr": 3.979999999999999e-05, "epoch": 0.05337603416066186, "percentage": 2.67, "elapsed_time": "0:35:23", "remaining_time": "21:30:29"} +{"current_steps": 205, "total_steps": 7494, "loss": 0.7633, "lr": 4.08e-05, "epoch": 0.054710435014678406, "percentage": 2.74, "elapsed_time": "0:36:25", "remaining_time": "21:35:00"} +{"current_steps": 210, "total_steps": 7494, "loss": 0.7607, "lr": 4.18e-05, "epoch": 0.05604483586869496, "percentage": 2.8, "elapsed_time": "0:36:50", "remaining_time": "21:18:09"} +{"current_steps": 205, "total_steps": 7494, "loss": 0.7633, "lr": 4.08e-05, "epoch": 0.054710435014678406, "percentage": 2.74, "elapsed_time": "0:08:19", "remaining_time": "4:56:13"} +{"current_steps": 210, "total_steps": 7494, "loss": 0.7607, "lr": 4.18e-05, "epoch": 0.05604483586869496, "percentage": 2.8, "elapsed_time": "0:08:51", "remaining_time": "5:07:27"} +{"current_steps": 215, "total_steps": 7494, "loss": 0.7494, "lr": 4.28e-05, "epoch": 0.0573792367227115, "percentage": 2.87, "elapsed_time": "0:09:21", "remaining_time": "5:16:34"} +{"current_steps": 220, "total_steps": 7494, "loss": 0.7532, "lr": 4.3799999999999994e-05, "epoch": 0.058713637576728046, "percentage": 2.94, "elapsed_time": "0:10:19", "remaining_time": "5:41:22"} +{"current_steps": 225, "total_steps": 7494, "loss": 0.7452, "lr": 4.48e-05, "epoch": 0.0600480384307446, "percentage": 3.0, "elapsed_time": "0:10:45", "remaining_time": "5:47:49"} +{"current_steps": 230, "total_steps": 7494, "loss": 0.7659, "lr": 4.5799999999999995e-05, "epoch": 0.06138243928476114, "percentage": 3.07, "elapsed_time": "0:11:12", "remaining_time": "5:53:52"} +{"current_steps": 235, "total_steps": 7494, "loss": 0.7531, "lr": 4.68e-05, "epoch": 0.0627168401387777, "percentage": 3.14, "elapsed_time": "0:11:45", "remaining_time": "6:03:10"} +{"current_steps": 240, "total_steps": 7494, "loss": 0.7481, "lr": 4.7799999999999996e-05, "epoch": 0.06405124099279423, "percentage": 3.2, "elapsed_time": "0:12:34", "remaining_time": "6:19:58"} +{"current_steps": 245, "total_steps": 7494, "loss": 0.7361, "lr": 4.8799999999999994e-05, "epoch": 0.06538564184681078, "percentage": 3.27, "elapsed_time": "0:12:59", "remaining_time": "6:24:37"} +{"current_steps": 250, "total_steps": 7494, "loss": 0.7647, "lr": 4.98e-05, "epoch": 0.06672004270082733, "percentage": 3.34, "elapsed_time": "0:13:26", "remaining_time": "6:29:15"} +{"current_steps": 255, "total_steps": 7494, "loss": 0.7516, "lr": 5.0799999999999995e-05, "epoch": 0.06805444355484387, "percentage": 3.4, "elapsed_time": "0:14:20", "remaining_time": "6:47:16"} +{"current_steps": 260, "total_steps": 7494, "loss": 0.7373, "lr": 5.179999999999999e-05, "epoch": 0.06938884440886042, "percentage": 3.47, "elapsed_time": "0:14:48", "remaining_time": "6:52:12"} +{"current_steps": 265, "total_steps": 7494, "loss": 0.7385, "lr": 5.279999999999999e-05, "epoch": 0.07072324526287697, "percentage": 3.54, "elapsed_time": "0:15:14", "remaining_time": "6:55:53"} +{"current_steps": 270, "total_steps": 7494, "loss": 0.7459, "lr": 5.38e-05, "epoch": 0.07205764611689351, "percentage": 3.6, "elapsed_time": "0:15:40", "remaining_time": "6:59:19"} +{"current_steps": 275, "total_steps": 7494, "loss": 0.7382, "lr": 5.48e-05, "epoch": 0.07339204697091006, "percentage": 3.67, "elapsed_time": "0:16:36", "remaining_time": "7:16:08"} +{"current_steps": 280, "total_steps": 7494, "loss": 0.7288, "lr": 5.5799999999999994e-05, "epoch": 0.07472644782492661, "percentage": 3.74, "elapsed_time": "0:17:02", "remaining_time": "7:19:09"} +{"current_steps": 285, "total_steps": 7494, "loss": 0.7388, "lr": 5.679999999999999e-05, "epoch": 0.07606084867894315, "percentage": 3.8, "elapsed_time": "0:17:28", "remaining_time": "7:21:51"} +{"current_steps": 290, "total_steps": 7494, "loss": 0.7289, "lr": 5.78e-05, "epoch": 0.0773952495329597, "percentage": 3.87, "elapsed_time": "0:18:02", "remaining_time": "7:28:12"} +{"current_steps": 295, "total_steps": 7494, "loss": 0.7277, "lr": 5.88e-05, "epoch": 0.07872965038697624, "percentage": 3.94, "elapsed_time": "0:18:51", "remaining_time": "7:40:08"} +{"current_steps": 300, "total_steps": 7494, "loss": 0.7596, "lr": 5.98e-05, "epoch": 0.08006405124099279, "percentage": 4.0, "elapsed_time": "0:19:16", "remaining_time": "7:42:18"} +{"current_steps": 305, "total_steps": 7494, "loss": 0.7345, "lr": 6.0799999999999994e-05, "epoch": 0.08139845209500934, "percentage": 4.07, "elapsed_time": "0:19:51", "remaining_time": "7:47:59"} +{"current_steps": 310, "total_steps": 7494, "loss": 0.7449, "lr": 6.18e-05, "epoch": 0.08273285294902588, "percentage": 4.14, "elapsed_time": "0:20:43", "remaining_time": "8:00:11"} +{"current_steps": 315, "total_steps": 7494, "loss": 0.7299, "lr": 6.28e-05, "epoch": 0.08406725380304243, "percentage": 4.2, "elapsed_time": "0:21:13", "remaining_time": "8:03:44"} +{"current_steps": 320, "total_steps": 7494, "loss": 0.7372, "lr": 6.379999999999999e-05, "epoch": 0.08540165465705898, "percentage": 4.27, "elapsed_time": "0:21:38", "remaining_time": "8:05:19"} +{"current_steps": 325, "total_steps": 7494, "loss": 0.7176, "lr": 6.479999999999999e-05, "epoch": 0.08673605551107552, "percentage": 4.34, "elapsed_time": "0:22:05", "remaining_time": "8:07:07"} +{"current_steps": 330, "total_steps": 7494, "loss": 0.716, "lr": 6.579999999999999e-05, "epoch": 0.08807045636509207, "percentage": 4.4, "elapsed_time": "0:23:02", "remaining_time": "8:20:14"} +{"current_steps": 335, "total_steps": 7494, "loss": 0.725, "lr": 6.68e-05, "epoch": 0.08940485721910862, "percentage": 4.47, "elapsed_time": "0:23:28", "remaining_time": "8:21:32"} +{"current_steps": 340, "total_steps": 7494, "loss": 0.7378, "lr": 6.78e-05, "epoch": 0.09073925807312516, "percentage": 4.54, "elapsed_time": "0:23:53", "remaining_time": "8:22:38"} +{"current_steps": 345, "total_steps": 7494, "loss": 0.7283, "lr": 6.879999999999999e-05, "epoch": 0.09207365892714171, "percentage": 4.6, "elapsed_time": "0:24:26", "remaining_time": "8:26:29"} +{"current_steps": 350, "total_steps": 7494, "loss": 0.7395, "lr": 6.979999999999999e-05, "epoch": 0.09340805978115826, "percentage": 4.67, "elapsed_time": "0:25:18", "remaining_time": "8:36:31"} +{"current_steps": 355, "total_steps": 7494, "loss": 0.7362, "lr": 7.079999999999999e-05, "epoch": 0.0947424606351748, "percentage": 4.74, "elapsed_time": "0:25:43", "remaining_time": "8:37:23"} +{"current_steps": 360, "total_steps": 7494, "loss": 0.7228, "lr": 7.18e-05, "epoch": 0.09607686148919135, "percentage": 4.8, "elapsed_time": "0:26:09", "remaining_time": "8:38:13"} +{"current_steps": 365, "total_steps": 7494, "loss": 0.7336, "lr": 7.28e-05, "epoch": 0.0974112623432079, "percentage": 4.87, "elapsed_time": "0:26:59", "remaining_time": "8:47:15"} +{"current_steps": 370, "total_steps": 7494, "loss": 0.7288, "lr": 7.379999999999999e-05, "epoch": 0.09874566319722444, "percentage": 4.94, "elapsed_time": "0:27:36", "remaining_time": "8:51:27"} +{"current_steps": 375, "total_steps": 7494, "loss": 0.7357, "lr": 7.479999999999999e-05, "epoch": 0.100080064051241, "percentage": 5.0, "elapsed_time": "0:28:01", "remaining_time": "8:51:58"} +{"current_steps": 380, "total_steps": 7494, "loss": 0.7199, "lr": 7.579999999999999e-05, "epoch": 0.10141446490525755, "percentage": 5.07, "elapsed_time": "0:28:26", "remaining_time": "8:52:29"} +{"current_steps": 385, "total_steps": 7494, "loss": 0.7239, "lr": 7.68e-05, "epoch": 0.10274886575927408, "percentage": 5.14, "elapsed_time": "0:29:24", "remaining_time": "9:03:07"} +{"current_steps": 390, "total_steps": 7494, "loss": 0.7299, "lr": 7.780000000000001e-05, "epoch": 0.10408326661329063, "percentage": 5.2, "elapsed_time": "0:29:51", "remaining_time": "9:04:01"} +{"current_steps": 395, "total_steps": 7494, "loss": 0.7177, "lr": 7.879999999999999e-05, "epoch": 0.10541766746730719, "percentage": 5.27, "elapsed_time": "0:30:17", "remaining_time": "9:04:20"} +{"current_steps": 400, "total_steps": 7494, "loss": 0.73, "lr": 7.98e-05, "epoch": 0.10675206832132372, "percentage": 5.34, "elapsed_time": "0:30:45", "remaining_time": "9:05:33"} +{"current_steps": 405, "total_steps": 7494, "loss": 0.7392, "lr": 8.079999999999999e-05, "epoch": 0.10808646917534027, "percentage": 5.4, "elapsed_time": "0:31:50", "remaining_time": "9:17:19"} +{"current_steps": 410, "total_steps": 7494, "loss": 0.7268, "lr": 8.18e-05, "epoch": 0.10942087002935681, "percentage": 5.47, "elapsed_time": "0:32:15", "remaining_time": "9:17:24"} +{"current_steps": 415, "total_steps": 7494, "loss": 0.7005, "lr": 8.28e-05, "epoch": 0.11075527088337336, "percentage": 5.54, "elapsed_time": "0:32:40", "remaining_time": "9:17:30"} +{"current_steps": 420, "total_steps": 7494, "loss": 0.703, "lr": 8.379999999999999e-05, "epoch": 0.11208967173738991, "percentage": 5.6, "elapsed_time": "0:33:25", "remaining_time": "9:22:52"} +{"current_steps": 425, "total_steps": 7494, "loss": 0.715, "lr": 8.48e-05, "epoch": 0.11342407259140645, "percentage": 5.67, "elapsed_time": "0:34:06", "remaining_time": "9:27:21"} +{"current_steps": 430, "total_steps": 7494, "loss": 0.7204, "lr": 8.579999999999998e-05, "epoch": 0.114758473445423, "percentage": 5.74, "elapsed_time": "0:34:31", "remaining_time": "9:27:13"} +{"current_steps": 435, "total_steps": 7494, "loss": 0.7315, "lr": 8.68e-05, "epoch": 0.11609287429943956, "percentage": 5.8, "elapsed_time": "0:34:56", "remaining_time": "9:27:07"} +{"current_steps": 440, "total_steps": 7494, "loss": 0.7176, "lr": 8.779999999999999e-05, "epoch": 0.11742727515345609, "percentage": 5.87, "elapsed_time": "0:35:52", "remaining_time": "9:35:12"} +{"current_steps": 445, "total_steps": 7494, "loss": 0.7136, "lr": 8.879999999999999e-05, "epoch": 0.11876167600747264, "percentage": 5.94, "elapsed_time": "0:36:23", "remaining_time": "9:36:33"} +{"current_steps": 450, "total_steps": 7494, "loss": 0.7237, "lr": 8.98e-05, "epoch": 0.1200960768614892, "percentage": 6.0, "elapsed_time": "0:36:48", "remaining_time": "9:36:17"} +{"current_steps": 455, "total_steps": 7494, "loss": 0.7107, "lr": 9.079999999999998e-05, "epoch": 0.12143047771550573, "percentage": 6.07, "elapsed_time": "0:37:15", "remaining_time": "9:36:24"} +{"current_steps": 460, "total_steps": 7494, "loss": 0.7134, "lr": 9.18e-05, "epoch": 0.12276487856952228, "percentage": 6.14, "elapsed_time": "0:38:14", "remaining_time": "9:44:48"} +{"current_steps": 465, "total_steps": 7494, "loss": 0.7253, "lr": 9.279999999999999e-05, "epoch": 0.12409927942353884, "percentage": 6.2, "elapsed_time": "0:39:14", "remaining_time": "9:53:16"} +{"current_steps": 470, "total_steps": 7494, "loss": 0.7129, "lr": 9.379999999999999e-05, "epoch": 0.1254336802775554, "percentage": 6.27, "elapsed_time": "0:39:40", "remaining_time": "9:52:53"} +{"current_steps": 475, "total_steps": 7494, "loss": 0.734, "lr": 9.479999999999999e-05, "epoch": 0.12676808113157192, "percentage": 6.34, "elapsed_time": "0:40:13", "remaining_time": "9:54:21"} +{"current_steps": 480, "total_steps": 7494, "loss": 0.72, "lr": 9.58e-05, "epoch": 0.12810248198558846, "percentage": 6.41, "elapsed_time": "0:41:07", "remaining_time": "10:00:54"} +{"current_steps": 485, "total_steps": 7494, "loss": 0.7278, "lr": 9.68e-05, "epoch": 0.12943688283960503, "percentage": 6.47, "elapsed_time": "0:41:32", "remaining_time": "10:00:23"} +{"current_steps": 490, "total_steps": 7494, "loss": 0.714, "lr": 9.779999999999999e-05, "epoch": 0.13077128369362157, "percentage": 6.54, "elapsed_time": "0:41:58", "remaining_time": "9:59:54"} +{"current_steps": 495, "total_steps": 7494, "loss": 0.7212, "lr": 9.879999999999999e-05, "epoch": 0.1321056845476381, "percentage": 6.61, "elapsed_time": "0:42:44", "remaining_time": "10:04:25"} +{"current_steps": 500, "total_steps": 7494, "loss": 0.7251, "lr": 9.979999999999999e-05, "epoch": 0.13344008540165467, "percentage": 6.67, "elapsed_time": "0:43:27", "remaining_time": "10:07:51"} +{"current_steps": 505, "total_steps": 7494, "loss": 0.72, "lr": 0.0001008, "epoch": 0.1347744862556712, "percentage": 6.74, "elapsed_time": "0:44:02", "remaining_time": "10:09:28"} +{"current_steps": 510, "total_steps": 7494, "loss": 0.7155, "lr": 0.00010179999999999998, "epoch": 0.13610888710968774, "percentage": 6.81, "elapsed_time": "0:44:27", "remaining_time": "10:08:54"} +{"current_steps": 515, "total_steps": 7494, "loss": 0.7102, "lr": 0.00010279999999999999, "epoch": 0.1374432879637043, "percentage": 6.87, "elapsed_time": "0:45:27", "remaining_time": "10:16:01"} +{"current_steps": 520, "total_steps": 7494, "loss": 0.7049, "lr": 0.00010379999999999999, "epoch": 0.13877768881772085, "percentage": 6.94, "elapsed_time": "0:45:57", "remaining_time": "10:16:23"} +{"current_steps": 525, "total_steps": 7494, "loss": 0.7213, "lr": 0.00010479999999999999, "epoch": 0.14011208967173738, "percentage": 7.01, "elapsed_time": "0:46:22", "remaining_time": "10:15:40"} +{"current_steps": 530, "total_steps": 7494, "loss": 0.7189, "lr": 0.0001058, "epoch": 0.14144649052575395, "percentage": 7.07, "elapsed_time": "0:47:24", "remaining_time": "10:22:56"} +{"current_steps": 535, "total_steps": 7494, "loss": 0.7188, "lr": 0.00010679999999999998, "epoch": 0.14278089137977049, "percentage": 7.14, "elapsed_time": "0:48:21", "remaining_time": "10:28:57"} +{"current_steps": 540, "total_steps": 7494, "loss": 0.7283, "lr": 0.00010779999999999999, "epoch": 0.14411529223378702, "percentage": 7.21, "elapsed_time": "0:48:47", "remaining_time": "10:28:22"} +{"current_steps": 545, "total_steps": 7494, "loss": 0.7178, "lr": 0.0001088, "epoch": 0.1454496930878036, "percentage": 7.27, "elapsed_time": "0:49:13", "remaining_time": "10:27:36"} +{"current_steps": 550, "total_steps": 7494, "loss": 0.7393, "lr": 0.00010979999999999999, "epoch": 0.14678409394182013, "percentage": 7.34, "elapsed_time": "0:49:50", "remaining_time": "10:29:11"} +{"current_steps": 555, "total_steps": 7494, "loss": 0.6967, "lr": 0.0001108, "epoch": 0.14811849479583666, "percentage": 7.41, "elapsed_time": "0:50:39", "remaining_time": "10:33:18"} +{"current_steps": 560, "total_steps": 7494, "loss": 0.7226, "lr": 0.00011179999999999998, "epoch": 0.14945289564985323, "percentage": 7.47, "elapsed_time": "0:51:04", "remaining_time": "10:32:29"} +{"current_steps": 565, "total_steps": 7494, "loss": 0.689, "lr": 0.00011279999999999999, "epoch": 0.15078729650386977, "percentage": 7.54, "elapsed_time": "0:51:30", "remaining_time": "10:31:42"} +{"current_steps": 570, "total_steps": 7494, "loss": 0.7125, "lr": 0.0001138, "epoch": 0.1521216973578863, "percentage": 7.61, "elapsed_time": "0:53:01", "remaining_time": "10:44:05"} +{"current_steps": 575, "total_steps": 7494, "loss": 0.7258, "lr": 0.00011479999999999999, "epoch": 0.15345609821190287, "percentage": 7.67, "elapsed_time": "0:54:17", "remaining_time": "10:53:16"} +{"current_steps": 580, "total_steps": 7494, "loss": 0.7283, "lr": 0.0001158, "epoch": 0.1547904990659194, "percentage": 7.74, "elapsed_time": "0:54:43", "remaining_time": "10:52:17"} +{"current_steps": 585, "total_steps": 7494, "loss": 0.73, "lr": 0.00011679999999999998, "epoch": 0.15612489991993594, "percentage": 7.81, "elapsed_time": "0:55:08", "remaining_time": "10:51:19"} +{"current_steps": 590, "total_steps": 7494, "loss": 0.7309, "lr": 0.00011779999999999999, "epoch": 0.15745930077395248, "percentage": 7.87, "elapsed_time": "0:56:08", "remaining_time": "10:56:55"} +{"current_steps": 595, "total_steps": 7494, "loss": 0.7138, "lr": 0.0001188, "epoch": 0.15879370162796905, "percentage": 7.94, "elapsed_time": "0:56:39", "remaining_time": "10:56:53"} +{"current_steps": 600, "total_steps": 7494, "loss": 0.7085, "lr": 0.00011979999999999998, "epoch": 0.16012810248198558, "percentage": 8.01, "elapsed_time": "0:57:04", "remaining_time": "10:55:47"} +{"current_steps": 605, "total_steps": 7494, "loss": 0.7223, "lr": 0.0001208, "epoch": 0.16146250333600212, "percentage": 8.07, "elapsed_time": "0:57:43", "remaining_time": "10:57:13"} +{"current_steps": 610, "total_steps": 7494, "loss": 0.7157, "lr": 0.00012179999999999999, "epoch": 0.1627969041900187, "percentage": 8.14, "elapsed_time": "0:58:43", "remaining_time": "11:02:39"} +{"current_steps": 615, "total_steps": 7494, "loss": 0.7084, "lr": 0.00012279999999999998, "epoch": 0.16413130504403523, "percentage": 8.21, "elapsed_time": "0:59:10", "remaining_time": "11:01:50"} +{"current_steps": 620, "total_steps": 7494, "loss": 0.7216, "lr": 0.0001238, "epoch": 0.16546570589805176, "percentage": 8.27, "elapsed_time": "0:59:35", "remaining_time": "11:00:44"} +{"current_steps": 625, "total_steps": 7494, "loss": 0.7238, "lr": 0.00012479999999999997, "epoch": 0.16680010675206833, "percentage": 8.34, "elapsed_time": "1:00:13", "remaining_time": "11:01:55"} +{"current_steps": 630, "total_steps": 7494, "loss": 0.715, "lr": 0.0001258, "epoch": 0.16813450760608487, "percentage": 8.41, "elapsed_time": "1:01:05", "remaining_time": "11:05:37"} +{"current_steps": 635, "total_steps": 7494, "loss": 0.7157, "lr": 0.0001268, "epoch": 0.1694689084601014, "percentage": 8.47, "elapsed_time": "1:01:31", "remaining_time": "11:04:36"} +{"current_steps": 640, "total_steps": 7494, "loss": 0.7161, "lr": 0.0001278, "epoch": 0.17080330931411797, "percentage": 8.54, "elapsed_time": "1:02:27", "remaining_time": "11:08:53"} +{"current_steps": 645, "total_steps": 7494, "loss": 0.7069, "lr": 0.0001288, "epoch": 0.1721377101681345, "percentage": 8.61, "elapsed_time": "1:03:15", "remaining_time": "11:11:42"} +{"current_steps": 650, "total_steps": 7494, "loss": 0.7229, "lr": 0.00012979999999999998, "epoch": 0.17347211102215104, "percentage": 8.67, "elapsed_time": "1:03:55", "remaining_time": "11:13:07"} +{"current_steps": 655, "total_steps": 7494, "loss": 0.7222, "lr": 0.00013079999999999998, "epoch": 0.1748065118761676, "percentage": 8.74, "elapsed_time": "1:04:21", "remaining_time": "11:11:58"} +{"current_steps": 660, "total_steps": 7494, "loss": 0.7019, "lr": 0.0001318, "epoch": 0.17614091273018415, "percentage": 8.81, "elapsed_time": "1:04:47", "remaining_time": "11:10:54"} +{"current_steps": 665, "total_steps": 7494, "loss": 0.718, "lr": 0.00013279999999999998, "epoch": 0.17747531358420068, "percentage": 8.87, "elapsed_time": "1:05:43", "remaining_time": "11:14:57"} +{"current_steps": 670, "total_steps": 7494, "loss": 0.7221, "lr": 0.0001338, "epoch": 0.17880971443821725, "percentage": 8.94, "elapsed_time": "1:06:16", "remaining_time": "11:14:57"} +{"current_steps": 675, "total_steps": 7494, "loss": 0.7236, "lr": 0.00013479999999999997, "epoch": 0.1801441152922338, "percentage": 9.01, "elapsed_time": "1:06:41", "remaining_time": "11:13:45"} +{"current_steps": 680, "total_steps": 7494, "loss": 0.7025, "lr": 0.0001358, "epoch": 0.18147851614625032, "percentage": 9.07, "elapsed_time": "1:07:10", "remaining_time": "11:13:10"} +{"current_steps": 685, "total_steps": 7494, "loss": 0.7189, "lr": 0.0001368, "epoch": 0.1828129170002669, "percentage": 9.14, "elapsed_time": "1:08:32", "remaining_time": "11:21:14"} +{"current_steps": 690, "total_steps": 7494, "loss": 0.7047, "lr": 0.0001378, "epoch": 0.18414731785428343, "percentage": 9.21, "elapsed_time": "1:08:58", "remaining_time": "11:20:11"} +{"current_steps": 695, "total_steps": 7494, "loss": 0.7014, "lr": 0.00013879999999999999, "epoch": 0.18548171870829996, "percentage": 9.27, "elapsed_time": "1:09:24", "remaining_time": "11:18:56"} +{"current_steps": 700, "total_steps": 7494, "loss": 0.7104, "lr": 0.00013979999999999998, "epoch": 0.18681611956231653, "percentage": 9.34, "elapsed_time": "1:10:00", "remaining_time": "11:19:24"} +{"current_steps": 705, "total_steps": 7494, "loss": 0.7053, "lr": 0.00014079999999999998, "epoch": 0.18815052041633307, "percentage": 9.41, "elapsed_time": "1:11:02", "remaining_time": "11:24:06"} +{"current_steps": 710, "total_steps": 7494, "loss": 0.7087, "lr": 0.0001418, "epoch": 0.1894849212703496, "percentage": 9.47, "elapsed_time": "1:11:29", "remaining_time": "11:23:02"} +{"current_steps": 715, "total_steps": 7494, "loss": 0.6996, "lr": 0.00014279999999999997, "epoch": 0.19081932212436617, "percentage": 9.54, "elapsed_time": "1:11:54", "remaining_time": "11:21:46"} +{"current_steps": 720, "total_steps": 7494, "loss": 0.6826, "lr": 0.0001438, "epoch": 0.1921537229783827, "percentage": 9.61, "elapsed_time": "1:12:38", "remaining_time": "11:23:30"} +{"current_steps": 725, "total_steps": 7494, "loss": 0.6966, "lr": 0.0001448, "epoch": 0.19348812383239924, "percentage": 9.67, "elapsed_time": "1:13:23", "remaining_time": "11:25:15"} +{"current_steps": 730, "total_steps": 7494, "loss": 0.712, "lr": 0.0001458, "epoch": 0.1948225246864158, "percentage": 9.74, "elapsed_time": "1:13:49", "remaining_time": "11:23:58"} +{"current_steps": 735, "total_steps": 7494, "loss": 0.7071, "lr": 0.0001468, "epoch": 0.19615692554043235, "percentage": 9.81, "elapsed_time": "1:14:14", "remaining_time": "11:22:45"} +{"current_steps": 740, "total_steps": 7494, "loss": 0.7106, "lr": 0.0001478, "epoch": 0.19749132639444889, "percentage": 9.87, "elapsed_time": "1:15:07", "remaining_time": "11:25:36"} +{"current_steps": 745, "total_steps": 7494, "loss": 0.7001, "lr": 0.00014879999999999998, "epoch": 0.19882572724846545, "percentage": 9.94, "elapsed_time": "1:15:41", "remaining_time": "11:25:41"} +{"current_steps": 750, "total_steps": 7494, "loss": 0.7054, "lr": 0.00014979999999999998, "epoch": 0.200160128102482, "percentage": 10.01, "elapsed_time": "1:16:06", "remaining_time": "11:24:25"} +{"current_steps": 755, "total_steps": 7494, "loss": 0.7035, "lr": 0.00014999986979857214, "epoch": 0.20149452895649853, "percentage": 10.07, "elapsed_time": "1:16:34", "remaining_time": "11:23:30"} +{"current_steps": 760, "total_steps": 7494, "loss": 0.7045, "lr": 0.00014999934085604638, "epoch": 0.2028289298105151, "percentage": 10.14, "elapsed_time": "1:17:31", "remaining_time": "11:26:51"} +{"current_steps": 765, "total_steps": 7494, "loss": 0.7057, "lr": 0.00014999840503770068, "epoch": 0.20416333066453163, "percentage": 10.21, "elapsed_time": "1:18:01", "remaining_time": "11:26:18"} +{"current_steps": 770, "total_steps": 7494, "loss": 0.7181, "lr": 0.00014999706234861205, "epoch": 0.20549773151854817, "percentage": 10.27, "elapsed_time": "1:18:26", "remaining_time": "11:25:00"} +{"current_steps": 775, "total_steps": 7494, "loss": 0.7086, "lr": 0.00014999531279606457, "epoch": 0.20683213237256473, "percentage": 10.34, "elapsed_time": "1:18:58", "remaining_time": "11:24:45"} +{"current_steps": 780, "total_steps": 7494, "loss": 0.7147, "lr": 0.00014999315638954965, "epoch": 0.20816653322658127, "percentage": 10.41, "elapsed_time": "1:19:54", "remaining_time": "11:27:51"} +{"current_steps": 785, "total_steps": 7494, "loss": 0.7113, "lr": 0.000149990593140766, "epoch": 0.2095009340805978, "percentage": 10.48, "elapsed_time": "1:20:21", "remaining_time": "11:26:46"} +{"current_steps": 790, "total_steps": 7494, "loss": 0.694, "lr": 0.00014998762306361933, "epoch": 0.21083533493461437, "percentage": 10.54, "elapsed_time": "1:20:46", "remaining_time": "11:25:30"} +{"current_steps": 795, "total_steps": 7494, "loss": 0.7001, "lr": 0.00014998424617422253, "epoch": 0.2121697357886309, "percentage": 10.61, "elapsed_time": "1:21:49", "remaining_time": "11:29:26"} +{"current_steps": 800, "total_steps": 7494, "loss": 0.7014, "lr": 0.00014998046249089538, "epoch": 0.21350413664264745, "percentage": 10.68, "elapsed_time": "1:22:39", "remaining_time": "11:31:41"} +{"current_steps": 805, "total_steps": 7494, "loss": 0.6998, "lr": 0.00014997627203416458, "epoch": 0.214838537496664, "percentage": 10.74, "elapsed_time": "1:23:14", "remaining_time": "11:31:44"} +{"current_steps": 810, "total_steps": 7494, "loss": 0.7013, "lr": 0.00014997167482676366, "epoch": 0.21617293835068055, "percentage": 10.81, "elapsed_time": "1:23:40", "remaining_time": "11:30:27"} +{"current_steps": 815, "total_steps": 7494, "loss": 0.6972, "lr": 0.00014996667089363272, "epoch": 0.2175073392046971, "percentage": 10.88, "elapsed_time": "1:24:30", "remaining_time": "11:32:31"} +{"current_steps": 820, "total_steps": 7494, "loss": 0.7162, "lr": 0.00014996126026191832, "epoch": 0.21884174005871362, "percentage": 10.94, "elapsed_time": "1:25:10", "remaining_time": "11:33:11"} +{"current_steps": 825, "total_steps": 7494, "loss": 0.7122, "lr": 0.00014995544296097355, "epoch": 0.2201761409127302, "percentage": 11.01, "elapsed_time": "1:25:35", "remaining_time": "11:31:53"} +{"current_steps": 830, "total_steps": 7494, "loss": 0.7094, "lr": 0.00014994921902235757, "epoch": 0.22151054176674673, "percentage": 11.08, "elapsed_time": "1:26:01", "remaining_time": "11:30:41"} +{"current_steps": 835, "total_steps": 7494, "loss": 0.6913, "lr": 0.0001499425884798356, "epoch": 0.22284494262076326, "percentage": 11.14, "elapsed_time": "1:26:57", "remaining_time": "11:33:26"} +{"current_steps": 840, "total_steps": 7494, "loss": 0.7015, "lr": 0.00014993555136937872, "epoch": 0.22417934347477983, "percentage": 11.21, "elapsed_time": "1:27:31", "remaining_time": "11:33:19"} +{"current_steps": 845, "total_steps": 7494, "loss": 0.7108, "lr": 0.0001499281077291637, "epoch": 0.22551374432879637, "percentage": 11.28, "elapsed_time": "1:27:56", "remaining_time": "11:32:01"} +{"current_steps": 850, "total_steps": 7494, "loss": 0.7268, "lr": 0.00014992025759957267, "epoch": 0.2268481451828129, "percentage": 11.34, "elapsed_time": "1:28:25", "remaining_time": "11:31:08"} +{"current_steps": 855, "total_steps": 7494, "loss": 0.6981, "lr": 0.0001499120010231931, "epoch": 0.22818254603682947, "percentage": 11.41, "elapsed_time": "1:29:21", "remaining_time": "11:33:48"} +{"current_steps": 860, "total_steps": 7494, "loss": 0.6987, "lr": 0.00014990333804481738, "epoch": 0.229516946890846, "percentage": 11.48, "elapsed_time": "1:29:50", "remaining_time": "11:33:02"} +{"current_steps": 865, "total_steps": 7494, "loss": 0.6985, "lr": 0.00014989426871144266, "epoch": 0.23085134774486255, "percentage": 11.54, "elapsed_time": "1:30:16", "remaining_time": "11:31:47"} +{"current_steps": 870, "total_steps": 7494, "loss": 0.6855, "lr": 0.00014988479307227062, "epoch": 0.2321857485988791, "percentage": 11.61, "elapsed_time": "1:31:14", "remaining_time": "11:34:42"} +{"current_steps": 875, "total_steps": 7494, "loss": 0.7033, "lr": 0.00014987491117870717, "epoch": 0.23352014945289565, "percentage": 11.68, "elapsed_time": "1:32:08", "remaining_time": "11:37:00"} +{"current_steps": 880, "total_steps": 7494, "loss": 0.6884, "lr": 0.00014986462308436214, "epoch": 0.23485455030691219, "percentage": 11.74, "elapsed_time": "1:32:34", "remaining_time": "11:35:50"} +{"current_steps": 885, "total_steps": 7494, "loss": 0.7011, "lr": 0.00014985392884504903, "epoch": 0.23618895116092875, "percentage": 11.81, "elapsed_time": "1:33:00", "remaining_time": "11:34:31"} +{"current_steps": 890, "total_steps": 7494, "loss": 0.698, "lr": 0.00014984282851878477, "epoch": 0.2375233520149453, "percentage": 11.88, "elapsed_time": "1:33:40", "remaining_time": "11:35:06"} +{"current_steps": 895, "total_steps": 7494, "loss": 0.6982, "lr": 0.00014983132216578923, "epoch": 0.23885775286896183, "percentage": 11.94, "elapsed_time": "1:34:30", "remaining_time": "11:36:52"} +{"current_steps": 900, "total_steps": 7494, "loss": 0.6764, "lr": 0.00014981940984848508, "epoch": 0.2401921537229784, "percentage": 12.01, "elapsed_time": "1:34:56", "remaining_time": "11:35:37"} +{"current_steps": 905, "total_steps": 7494, "loss": 0.7052, "lr": 0.00014980709163149732, "epoch": 0.24152655457699493, "percentage": 12.08, "elapsed_time": "1:35:31", "remaining_time": "11:35:27"} +{"current_steps": 910, "total_steps": 7494, "loss": 0.6993, "lr": 0.000149794367581653, "epoch": 0.24286095543101147, "percentage": 12.14, "elapsed_time": "1:36:19", "remaining_time": "11:36:54"} +{"current_steps": 915, "total_steps": 7494, "loss": 0.6879, "lr": 0.00014978123776798082, "epoch": 0.24419535628502803, "percentage": 12.21, "elapsed_time": "1:37:00", "remaining_time": "11:37:27"} +{"current_steps": 920, "total_steps": 7494, "loss": 0.6906, "lr": 0.00014976770226171084, "epoch": 0.24552975713904457, "percentage": 12.28, "elapsed_time": "1:37:25", "remaining_time": "11:36:11"} +{"current_steps": 925, "total_steps": 7494, "loss": 0.6954, "lr": 0.00014975376113627394, "epoch": 0.2468641579930611, "percentage": 12.34, "elapsed_time": "1:37:51", "remaining_time": "11:34:59"} +{"current_steps": 930, "total_steps": 7494, "loss": 0.7149, "lr": 0.00014973941446730154, "epoch": 0.24819855884707767, "percentage": 12.41, "elapsed_time": "1:39:10", "remaining_time": "11:39:55"} +{"current_steps": 935, "total_steps": 7494, "loss": 0.6949, "lr": 0.00014972466233262517, "epoch": 0.2495329597010942, "percentage": 12.48, "elapsed_time": "1:39:45", "remaining_time": "11:39:45"} +{"current_steps": 940, "total_steps": 7494, "loss": 0.7109, "lr": 0.00014970950481227603, "epoch": 0.2508673605551108, "percentage": 12.54, "elapsed_time": "1:40:10", "remaining_time": "11:38:27"} +{"current_steps": 945, "total_steps": 7494, "loss": 0.7029, "lr": 0.00014969394198848456, "epoch": 0.2522017614091273, "percentage": 12.61, "elapsed_time": "1:41:05", "remaining_time": "11:40:33"} +{"current_steps": 950, "total_steps": 7494, "loss": 0.6799, "lr": 0.00014967797394567993, "epoch": 0.25353616226314385, "percentage": 12.68, "elapsed_time": "1:42:04", "remaining_time": "11:43:08"} +{"current_steps": 955, "total_steps": 7494, "loss": 0.6784, "lr": 0.00014966160077048982, "epoch": 0.2548705631171604, "percentage": 12.74, "elapsed_time": "1:42:35", "remaining_time": "11:42:24"} +{"current_steps": 960, "total_steps": 7494, "loss": 0.703, "lr": 0.00014964482255173958, "epoch": 0.2562049639711769, "percentage": 12.81, "elapsed_time": "1:43:00", "remaining_time": "11:41:07"} +{"current_steps": 965, "total_steps": 7494, "loss": 0.7009, "lr": 0.00014962763938045206, "epoch": 0.25753936482519346, "percentage": 12.88, "elapsed_time": "1:43:34", "remaining_time": "11:40:45"} +{"current_steps": 970, "total_steps": 7494, "loss": 0.6866, "lr": 0.00014961005134984693, "epoch": 0.25887376567921005, "percentage": 12.94, "elapsed_time": "1:44:29", "remaining_time": "11:42:46"} +{"current_steps": 975, "total_steps": 7494, "loss": 0.6845, "lr": 0.00014959205855534036, "epoch": 0.2602081665332266, "percentage": 13.01, "elapsed_time": "1:44:57", "remaining_time": "11:41:43"} +{"current_steps": 980, "total_steps": 7494, "loss": 0.6816, "lr": 0.00014957366109454427, "epoch": 0.26154256738724313, "percentage": 13.08, "elapsed_time": "1:45:23", "remaining_time": "11:40:28"} +{"current_steps": 985, "total_steps": 7494, "loss": 0.6959, "lr": 0.00014955485906726596, "epoch": 0.26287696824125967, "percentage": 13.14, "elapsed_time": "1:46:04", "remaining_time": "11:40:54"} +{"current_steps": 990, "total_steps": 7494, "loss": 0.7069, "lr": 0.00014953565257550756, "epoch": 0.2642113690952762, "percentage": 13.21, "elapsed_time": "1:46:56", "remaining_time": "11:42:34"} +{"current_steps": 995, "total_steps": 7494, "loss": 0.6946, "lr": 0.00014951604172346535, "epoch": 0.26554576994929274, "percentage": 13.28, "elapsed_time": "1:47:22", "remaining_time": "11:41:18"} +{"current_steps": 1000, "total_steps": 7494, "loss": 0.7005, "lr": 0.00014949602661752944, "epoch": 0.26688017080330934, "percentage": 13.34, "elapsed_time": "1:47:48", "remaining_time": "11:40:05"} +{"current_steps": 1005, "total_steps": 7494, "loss": 0.6683, "lr": 0.0001494756073662829, "epoch": 0.2682145716573259, "percentage": 13.41, "elapsed_time": "1:48:43", "remaining_time": "11:42:00"} +{"current_steps": 1010, "total_steps": 7494, "loss": 0.69, "lr": 0.00014945478408050135, "epoch": 0.2695489725113424, "percentage": 13.48, "elapsed_time": "1:49:27", "remaining_time": "11:42:44"} +{"current_steps": 1015, "total_steps": 7494, "loss": 0.6932, "lr": 0.00014943355687315239, "epoch": 0.27088337336535895, "percentage": 13.54, "elapsed_time": "1:49:53", "remaining_time": "11:41:26"} +{"current_steps": 1020, "total_steps": 7494, "loss": 0.6833, "lr": 0.0001494119258593948, "epoch": 0.2722177742193755, "percentage": 13.61, "elapsed_time": "1:50:19", "remaining_time": "11:40:16"} +{"current_steps": 1025, "total_steps": 7494, "loss": 0.7083, "lr": 0.00014938989115657815, "epoch": 0.273552175073392, "percentage": 13.68, "elapsed_time": "1:51:11", "remaining_time": "11:41:43"} +{"current_steps": 1030, "total_steps": 7494, "loss": 0.7071, "lr": 0.00014936745288424198, "epoch": 0.2748865759274086, "percentage": 13.74, "elapsed_time": "1:51:49", "remaining_time": "11:41:47"} +{"current_steps": 1035, "total_steps": 7494, "loss": 0.7001, "lr": 0.0001493446111641152, "epoch": 0.27622097678142515, "percentage": 13.81, "elapsed_time": "1:52:15", "remaining_time": "11:40:31"} +{"current_steps": 1040, "total_steps": 7494, "loss": 0.6806, "lr": 0.00014932136612011554, "epoch": 0.2775553776354417, "percentage": 13.88, "elapsed_time": "1:52:43", "remaining_time": "11:39:34"} +{"current_steps": 1045, "total_steps": 7494, "loss": 0.6878, "lr": 0.00014929771787834868, "epoch": 0.27888977848945823, "percentage": 13.94, "elapsed_time": "1:53:39", "remaining_time": "11:41:27"} +{"current_steps": 1050, "total_steps": 7494, "loss": 0.6978, "lr": 0.00014927366656710772, "epoch": 0.28022417934347477, "percentage": 14.01, "elapsed_time": "1:54:11", "remaining_time": "11:40:49"} +{"current_steps": 1055, "total_steps": 7494, "loss": 0.7055, "lr": 0.00014924921231687245, "epoch": 0.2815585801974913, "percentage": 14.08, "elapsed_time": "1:54:37", "remaining_time": "11:39:33"} +{"current_steps": 1060, "total_steps": 7494, "loss": 0.6899, "lr": 0.0001492243552603086, "epoch": 0.2828929810515079, "percentage": 14.14, "elapsed_time": "1:55:09", "remaining_time": "11:38:57"} +{"current_steps": 1065, "total_steps": 7494, "loss": 0.6943, "lr": 0.00014919909553226716, "epoch": 0.28422738190552443, "percentage": 14.21, "elapsed_time": "1:56:02", "remaining_time": "11:40:30"} +{"current_steps": 1070, "total_steps": 7494, "loss": 0.689, "lr": 0.00014917343326978366, "epoch": 0.28556178275954097, "percentage": 14.28, "elapsed_time": "1:56:31", "remaining_time": "11:39:35"} +{"current_steps": 1075, "total_steps": 7494, "loss": 0.6751, "lr": 0.00014914736861207733, "epoch": 0.2868961836135575, "percentage": 14.34, "elapsed_time": "1:56:57", "remaining_time": "11:38:20"} +{"current_steps": 1080, "total_steps": 7494, "loss": 0.6952, "lr": 0.0001491209017005505, "epoch": 0.28823058446757405, "percentage": 14.41, "elapsed_time": "1:57:33", "remaining_time": "11:38:11"} +{"current_steps": 1085, "total_steps": 7494, "loss": 0.6866, "lr": 0.00014909403267878771, "epoch": 0.2895649853215906, "percentage": 14.48, "elapsed_time": "1:58:26", "remaining_time": "11:39:38"} +{"current_steps": 1090, "total_steps": 7494, "loss": 0.7153, "lr": 0.000149066761692555, "epoch": 0.2908993861756072, "percentage": 14.54, "elapsed_time": "1:58:53", "remaining_time": "11:38:28"} +{"current_steps": 1095, "total_steps": 7494, "loss": 0.7205, "lr": 0.00014903908888979904, "epoch": 0.2922337870296237, "percentage": 14.61, "elapsed_time": "1:59:19", "remaining_time": "11:37:16"} +{"current_steps": 1100, "total_steps": 7494, "loss": 0.6987, "lr": 0.00014901101442064637, "epoch": 0.29356818788364025, "percentage": 14.68, "elapsed_time": "2:00:02", "remaining_time": "11:37:43"} +{"current_steps": 1105, "total_steps": 7494, "loss": 0.68, "lr": 0.00014898253843740271, "epoch": 0.2949025887376568, "percentage": 14.75, "elapsed_time": "2:00:57", "remaining_time": "11:39:24"} +{"current_steps": 1110, "total_steps": 7494, "loss": 0.6838, "lr": 0.00014895366109455189, "epoch": 0.2962369895916733, "percentage": 14.81, "elapsed_time": "2:01:23", "remaining_time": "11:38:11"} +{"current_steps": 1115, "total_steps": 7494, "loss": 0.6971, "lr": 0.00014892438254875522, "epoch": 0.29757139044568987, "percentage": 14.88, "elapsed_time": "2:02:23", "remaining_time": "11:40:14"} +{"current_steps": 1120, "total_steps": 7494, "loss": 0.6898, "lr": 0.00014889470295885047, "epoch": 0.29890579129970646, "percentage": 14.95, "elapsed_time": "2:03:15", "remaining_time": "11:41:27"} +{"current_steps": 1125, "total_steps": 7494, "loss": 0.6845, "lr": 0.0001488646224858512, "epoch": 0.300240192153723, "percentage": 15.01, "elapsed_time": "2:03:54", "remaining_time": "11:41:30"} +{"current_steps": 1130, "total_steps": 7494, "loss": 0.6882, "lr": 0.00014883414129294575, "epoch": 0.30157459300773953, "percentage": 15.08, "elapsed_time": "2:04:20", "remaining_time": "11:40:15"} +{"current_steps": 1135, "total_steps": 7494, "loss": 0.6723, "lr": 0.00014880325954549635, "epoch": 0.30290899386175607, "percentage": 15.15, "elapsed_time": "2:04:48", "remaining_time": "11:39:15"} +{"current_steps": 1140, "total_steps": 7494, "loss": 0.6794, "lr": 0.00014877197741103827, "epoch": 0.3042433947157726, "percentage": 15.21, "elapsed_time": "2:05:45", "remaining_time": "11:40:55"} +{"current_steps": 1145, "total_steps": 7494, "loss": 0.6922, "lr": 0.00014874029505927897, "epoch": 0.30557779556978915, "percentage": 15.28, "elapsed_time": "2:06:21", "remaining_time": "11:40:36"} +{"current_steps": 1150, "total_steps": 7494, "loss": 0.7049, "lr": 0.00014870821266209705, "epoch": 0.30691219642380574, "percentage": 15.35, "elapsed_time": "2:06:46", "remaining_time": "11:39:21"} +{"current_steps": 1155, "total_steps": 7494, "loss": 0.7001, "lr": 0.00014867573039354138, "epoch": 0.3082465972778223, "percentage": 15.41, "elapsed_time": "2:07:16", "remaining_time": "11:38:32"} +{"current_steps": 1160, "total_steps": 7494, "loss": 0.7009, "lr": 0.00014864284842983018, "epoch": 0.3095809981318388, "percentage": 15.48, "elapsed_time": "2:08:13", "remaining_time": "11:40:09"} +{"current_steps": 1165, "total_steps": 7494, "loss": 0.6803, "lr": 0.00014860956694935003, "epoch": 0.31091539898585535, "percentage": 15.55, "elapsed_time": "2:08:45", "remaining_time": "11:39:31"} +{"current_steps": 1170, "total_steps": 7494, "loss": 0.6737, "lr": 0.0001485758861326549, "epoch": 0.3122497998398719, "percentage": 15.61, "elapsed_time": "2:09:11", "remaining_time": "11:38:16"} +{"current_steps": 1175, "total_steps": 7494, "loss": 0.6764, "lr": 0.00014854180616246523, "epoch": 0.3135842006938884, "percentage": 15.68, "elapsed_time": "2:10:19", "remaining_time": "11:40:53"} +{"current_steps": 1180, "total_steps": 7494, "loss": 0.6993, "lr": 0.00014850732722366682, "epoch": 0.31491860154790496, "percentage": 15.75, "elapsed_time": "2:11:17", "remaining_time": "11:42:28"} +{"current_steps": 1185, "total_steps": 7494, "loss": 0.6919, "lr": 0.00014847244950330998, "epoch": 0.31625300240192156, "percentage": 15.81, "elapsed_time": "2:11:45", "remaining_time": "11:41:28"} +{"current_steps": 1190, "total_steps": 7494, "loss": 0.697, "lr": 0.00014843717319060833, "epoch": 0.3175874032559381, "percentage": 15.88, "elapsed_time": "2:12:11", "remaining_time": "11:40:19"} +{"current_steps": 1195, "total_steps": 7494, "loss": 0.6903, "lr": 0.00014840149847693794, "epoch": 0.31892180410995463, "percentage": 15.95, "elapsed_time": "2:12:51", "remaining_time": "11:40:16"} +{"current_steps": 1200, "total_steps": 7494, "loss": 0.6804, "lr": 0.00014836542555583628, "epoch": 0.32025620496397117, "percentage": 16.01, "elapsed_time": "2:13:44", "remaining_time": "11:41:27"} +{"current_steps": 1205, "total_steps": 7494, "loss": 0.6931, "lr": 0.000148328954623001, "epoch": 0.3215906058179877, "percentage": 16.08, "elapsed_time": "2:14:19", "remaining_time": "11:41:01"} +{"current_steps": 1210, "total_steps": 7494, "loss": 0.6782, "lr": 0.00014829208587628908, "epoch": 0.32292500667200424, "percentage": 16.15, "elapsed_time": "2:14:44", "remaining_time": "11:39:45"} +{"current_steps": 1215, "total_steps": 7494, "loss": 0.6792, "lr": 0.0001482548195157156, "epoch": 0.32425940752602084, "percentage": 16.21, "elapsed_time": "2:15:55", "remaining_time": "11:42:27"} +{"current_steps": 1220, "total_steps": 7494, "loss": 0.6724, "lr": 0.00014821715574345277, "epoch": 0.3255938083800374, "percentage": 16.28, "elapsed_time": "2:16:43", "remaining_time": "11:43:06"} +{"current_steps": 1225, "total_steps": 7494, "loss": 0.6786, "lr": 0.0001481790947638288, "epoch": 0.3269282092340539, "percentage": 16.35, "elapsed_time": "2:17:08", "remaining_time": "11:41:51"} +{"current_steps": 1230, "total_steps": 7494, "loss": 0.6756, "lr": 0.00014814063678332667, "epoch": 0.32826261008807045, "percentage": 16.41, "elapsed_time": "2:17:35", "remaining_time": "11:40:42"} +{"current_steps": 1235, "total_steps": 7494, "loss": 0.6734, "lr": 0.00014810178201058323, "epoch": 0.329597010942087, "percentage": 16.48, "elapsed_time": "2:18:25", "remaining_time": "11:41:34"} +{"current_steps": 1240, "total_steps": 7494, "loss": 0.674, "lr": 0.00014806253065638786, "epoch": 0.3309314117961035, "percentage": 16.55, "elapsed_time": "2:19:05", "remaining_time": "11:41:30"} +{"current_steps": 1245, "total_steps": 7494, "loss": 0.6727, "lr": 0.00014802288293368148, "epoch": 0.3322658126501201, "percentage": 16.61, "elapsed_time": "2:19:30", "remaining_time": "11:40:15"} +{"current_steps": 1250, "total_steps": 7494, "loss": 0.6853, "lr": 0.0001479828390575553, "epoch": 0.33360021350413666, "percentage": 16.68, "elapsed_time": "2:19:59", "remaining_time": "11:39:15"} +{"current_steps": 1255, "total_steps": 7494, "loss": 0.6826, "lr": 0.00014794239924524968, "epoch": 0.3349346143581532, "percentage": 16.75, "elapsed_time": "2:20:50", "remaining_time": "11:40:09"} +{"current_steps": 1260, "total_steps": 7494, "loss": 0.6851, "lr": 0.00014790156371615303, "epoch": 0.33626901521216973, "percentage": 16.81, "elapsed_time": "2:21:26", "remaining_time": "11:39:45"} +{"current_steps": 1265, "total_steps": 7494, "loss": 0.6656, "lr": 0.00014786033269180044, "epoch": 0.33760341606618627, "percentage": 16.88, "elapsed_time": "2:21:51", "remaining_time": "11:38:32"} +{"current_steps": 1270, "total_steps": 7494, "loss": 0.688, "lr": 0.00014781870639587262, "epoch": 0.3389378169202028, "percentage": 16.95, "elapsed_time": "2:22:21", "remaining_time": "11:37:38"} +{"current_steps": 1275, "total_steps": 7494, "loss": 0.703, "lr": 0.0001477766850541947, "epoch": 0.3402722177742194, "percentage": 17.01, "elapsed_time": "2:23:14", "remaining_time": "11:38:41"} +{"current_steps": 1280, "total_steps": 7494, "loss": 0.6944, "lr": 0.00014773426889473493, "epoch": 0.34160661862823594, "percentage": 17.08, "elapsed_time": "2:23:46", "remaining_time": "11:38:00"} +{"current_steps": 1285, "total_steps": 7494, "loss": 0.7053, "lr": 0.0001476914581476034, "epoch": 0.3429410194822525, "percentage": 17.15, "elapsed_time": "2:24:12", "remaining_time": "11:36:47"} +{"current_steps": 1290, "total_steps": 7494, "loss": 0.6806, "lr": 0.000147648253045051, "epoch": 0.344275420336269, "percentage": 17.21, "elapsed_time": "2:24:48", "remaining_time": "11:36:27"} +{"current_steps": 1295, "total_steps": 7494, "loss": 0.6874, "lr": 0.0001476046538214679, "epoch": 0.34560982119028555, "percentage": 17.28, "elapsed_time": "2:25:46", "remaining_time": "11:37:46"} +{"current_steps": 1300, "total_steps": 7494, "loss": 0.7022, "lr": 0.00014756066071338247, "epoch": 0.3469442220443021, "percentage": 17.35, "elapsed_time": "2:26:14", "remaining_time": "11:36:45"} +{"current_steps": 1305, "total_steps": 7494, "loss": 0.6833, "lr": 0.00014751627395945984, "epoch": 0.3482786228983187, "percentage": 17.41, "elapsed_time": "2:26:49", "remaining_time": "11:36:18"} +{"current_steps": 1310, "total_steps": 7494, "loss": 0.6801, "lr": 0.0001474714938005008, "epoch": 0.3496130237523352, "percentage": 17.48, "elapsed_time": "2:27:30", "remaining_time": "11:36:20"} +{"current_steps": 1315, "total_steps": 7494, "loss": 0.7026, "lr": 0.00014742632047944033, "epoch": 0.35094742460635175, "percentage": 17.55, "elapsed_time": "2:28:22", "remaining_time": "11:37:09"} +{"current_steps": 1320, "total_steps": 7494, "loss": 0.6867, "lr": 0.00014738075424134634, "epoch": 0.3522818254603683, "percentage": 17.61, "elapsed_time": "2:29:13", "remaining_time": "11:37:55"} +{"current_steps": 1325, "total_steps": 7494, "loss": 0.6798, "lr": 0.00014733479533341837, "epoch": 0.35361622631438483, "percentage": 17.68, "elapsed_time": "2:29:39", "remaining_time": "11:36:45"} +{"current_steps": 1330, "total_steps": 7494, "loss": 0.6892, "lr": 0.00014728844400498616, "epoch": 0.35495062716840137, "percentage": 17.75, "elapsed_time": "2:30:25", "remaining_time": "11:37:09"} +{"current_steps": 1335, "total_steps": 7494, "loss": 0.6817, "lr": 0.00014724170050750836, "epoch": 0.35628502802241796, "percentage": 17.81, "elapsed_time": "2:31:11", "remaining_time": "11:37:29"} +{"current_steps": 1340, "total_steps": 7494, "loss": 0.6923, "lr": 0.00014719456509457122, "epoch": 0.3576194288764345, "percentage": 17.88, "elapsed_time": "2:31:37", "remaining_time": "11:36:18"} +{"current_steps": 1345, "total_steps": 7494, "loss": 0.6856, "lr": 0.00014714703802188713, "epoch": 0.35895382973045104, "percentage": 17.95, "elapsed_time": "2:32:03", "remaining_time": "11:35:11"} +{"current_steps": 1350, "total_steps": 7494, "loss": 0.6926, "lr": 0.0001470991195472932, "epoch": 0.3602882305844676, "percentage": 18.01, "elapsed_time": "2:32:54", "remaining_time": "11:35:54"} +{"current_steps": 1355, "total_steps": 7494, "loss": 0.6797, "lr": 0.00014705080993075, "epoch": 0.3616226314384841, "percentage": 18.08, "elapsed_time": "2:33:34", "remaining_time": "11:35:48"} +{"current_steps": 1360, "total_steps": 7494, "loss": 0.6887, "lr": 0.00014700210943433998, "epoch": 0.36295703229250065, "percentage": 18.15, "elapsed_time": "2:34:00", "remaining_time": "11:34:37"} +{"current_steps": 1365, "total_steps": 7494, "loss": 0.6946, "lr": 0.00014695301832226627, "epoch": 0.36429143314651724, "percentage": 18.21, "elapsed_time": "2:34:28", "remaining_time": "11:33:36"} +{"current_steps": 1370, "total_steps": 7494, "loss": 0.6784, "lr": 0.00014690353686085098, "epoch": 0.3656258340005338, "percentage": 18.28, "elapsed_time": "2:35:20", "remaining_time": "11:34:21"} +{"current_steps": 1375, "total_steps": 7494, "loss": 0.6851, "lr": 0.00014685366531853395, "epoch": 0.3669602348545503, "percentage": 18.35, "elapsed_time": "2:35:57", "remaining_time": "11:34:01"} +{"current_steps": 1380, "total_steps": 7494, "loss": 0.6846, "lr": 0.00014680340396587118, "epoch": 0.36829463570856685, "percentage": 18.41, "elapsed_time": "2:36:22", "remaining_time": "11:32:49"} +{"current_steps": 1385, "total_steps": 7494, "loss": 0.6702, "lr": 0.0001467527530755335, "epoch": 0.3696290365625834, "percentage": 18.48, "elapsed_time": "2:37:18", "remaining_time": "11:33:52"} +{"current_steps": 1390, "total_steps": 7494, "loss": 0.6769, "lr": 0.000146701712922305, "epoch": 0.37096343741659993, "percentage": 18.55, "elapsed_time": "2:38:13", "remaining_time": "11:34:47"} +{"current_steps": 1395, "total_steps": 7494, "loss": 0.6821, "lr": 0.00014665028378308138, "epoch": 0.37229783827061647, "percentage": 18.61, "elapsed_time": "2:39:25", "remaining_time": "11:37:00"} +{"current_steps": 1400, "total_steps": 7494, "loss": 0.6841, "lr": 0.00014659846593686885, "epoch": 0.37363223912463306, "percentage": 18.68, "elapsed_time": "2:39:50", "remaining_time": "11:35:47"} +{"current_steps": 1405, "total_steps": 7494, "loss": 0.6889, "lr": 0.0001465462596647822, "epoch": 0.3749666399786496, "percentage": 18.75, "elapsed_time": "2:40:31", "remaining_time": "11:35:41"} +{"current_steps": 1410, "total_steps": 7494, "loss": 0.6584, "lr": 0.0001464936652500435, "epoch": 0.37630104083266613, "percentage": 18.82, "elapsed_time": "2:41:28", "remaining_time": "11:36:45"} +{"current_steps": 1415, "total_steps": 7494, "loss": 0.6749, "lr": 0.0001464406829779806, "epoch": 0.37763544168668267, "percentage": 18.88, "elapsed_time": "2:41:58", "remaining_time": "11:35:50"} +{"current_steps": 1420, "total_steps": 7494, "loss": 0.6687, "lr": 0.0001463873131360254, "epoch": 0.3789698425406992, "percentage": 18.95, "elapsed_time": "2:42:23", "remaining_time": "11:34:38"} +{"current_steps": 1425, "total_steps": 7494, "loss": 0.6747, "lr": 0.0001463335560137124, "epoch": 0.38030424339471575, "percentage": 19.02, "elapsed_time": "2:43:03", "remaining_time": "11:34:25"} +{"current_steps": 1430, "total_steps": 7494, "loss": 0.6746, "lr": 0.00014627941190267717, "epoch": 0.38163864424873234, "percentage": 19.08, "elapsed_time": "2:43:53", "remaining_time": "11:34:58"} +{"current_steps": 1435, "total_steps": 7494, "loss": 0.6876, "lr": 0.00014622488109665468, "epoch": 0.3829730451027489, "percentage": 19.15, "elapsed_time": "2:44:47", "remaining_time": "11:35:46"} +{"current_steps": 1440, "total_steps": 7494, "loss": 0.6794, "lr": 0.0001461699638914777, "epoch": 0.3843074459567654, "percentage": 19.22, "elapsed_time": "2:45:12", "remaining_time": "11:34:35"} +{"current_steps": 1445, "total_steps": 7494, "loss": 0.674, "lr": 0.00014611466058507536, "epoch": 0.38564184681078195, "percentage": 19.28, "elapsed_time": "2:45:56", "remaining_time": "11:34:40"} +{"current_steps": 1450, "total_steps": 7494, "loss": 0.6856, "lr": 0.00014605897147747132, "epoch": 0.3869762476647985, "percentage": 19.35, "elapsed_time": "2:46:46", "remaining_time": "11:35:10"} +{"current_steps": 1455, "total_steps": 7494, "loss": 0.6903, "lr": 0.0001460028968707822, "epoch": 0.388310648518815, "percentage": 19.42, "elapsed_time": "2:47:13", "remaining_time": "11:34:03"} +{"current_steps": 1460, "total_steps": 7494, "loss": 0.676, "lr": 0.0001459464370692161, "epoch": 0.3896450493728316, "percentage": 19.48, "elapsed_time": "2:47:39", "remaining_time": "11:32:54"} +{"current_steps": 1465, "total_steps": 7494, "loss": 0.6781, "lr": 0.0001458895923790707, "epoch": 0.39097945022684816, "percentage": 19.55, "elapsed_time": "2:48:28", "remaining_time": "11:33:19"} +{"current_steps": 1470, "total_steps": 7494, "loss": 0.6753, "lr": 0.0001458323631087318, "epoch": 0.3923138510808647, "percentage": 19.62, "elapsed_time": "2:49:13", "remaining_time": "11:33:27"} +{"current_steps": 1475, "total_steps": 7494, "loss": 0.6575, "lr": 0.00014577474956867155, "epoch": 0.39364825193488123, "percentage": 19.68, "elapsed_time": "2:49:39", "remaining_time": "11:32:18"} +{"current_steps": 1480, "total_steps": 7494, "loss": 0.6844, "lr": 0.00014571675207144676, "epoch": 0.39498265278889777, "percentage": 19.75, "elapsed_time": "2:51:19", "remaining_time": "11:36:12"} +{"current_steps": 1485, "total_steps": 7494, "loss": 0.6888, "lr": 0.00014565837093169728, "epoch": 0.3963170536429143, "percentage": 19.82, "elapsed_time": "2:52:13", "remaining_time": "11:36:53"} +{"current_steps": 1490, "total_steps": 7494, "loss": 0.6885, "lr": 0.00014559960646614418, "epoch": 0.3976514544969309, "percentage": 19.88, "elapsed_time": "2:52:59", "remaining_time": "11:37:04"} +{"current_steps": 1495, "total_steps": 7494, "loss": 0.6761, "lr": 0.00014554045899358814, "epoch": 0.39898585535094744, "percentage": 19.95, "elapsed_time": "2:53:25", "remaining_time": "11:35:55"} +{"current_steps": 1500, "total_steps": 7494, "loss": 0.6789, "lr": 0.00014548092883490772, "epoch": 0.400320256204964, "percentage": 20.02, "elapsed_time": "2:53:55", "remaining_time": "11:34:59"} +{"current_steps": 1505, "total_steps": 7494, "loss": 0.691, "lr": 0.00014542101631305745, "epoch": 0.4016546570589805, "percentage": 20.08, "elapsed_time": "2:54:58", "remaining_time": "11:36:16"} +{"current_steps": 1510, "total_steps": 7494, "loss": 0.6722, "lr": 0.00014536072175306628, "epoch": 0.40298905791299705, "percentage": 20.15, "elapsed_time": "2:55:34", "remaining_time": "11:35:47"} +{"current_steps": 1515, "total_steps": 7494, "loss": 0.6638, "lr": 0.00014530004548203573, "epoch": 0.4043234587670136, "percentage": 20.22, "elapsed_time": "2:56:00", "remaining_time": "11:34:36"} +{"current_steps": 1520, "total_steps": 7494, "loss": 0.6935, "lr": 0.00014523898782913818, "epoch": 0.4056578596210302, "percentage": 20.28, "elapsed_time": "2:56:32", "remaining_time": "11:33:51"} +{"current_steps": 1525, "total_steps": 7494, "loss": 0.679, "lr": 0.00014517754912561496, "epoch": 0.4069922604750467, "percentage": 20.35, "elapsed_time": "2:57:26", "remaining_time": "11:34:33"} +{"current_steps": 1530, "total_steps": 7494, "loss": 0.6636, "lr": 0.00014511572970477457, "epoch": 0.40832666132906326, "percentage": 20.42, "elapsed_time": "2:58:00", "remaining_time": "11:33:52"} +{"current_steps": 1535, "total_steps": 7494, "loss": 0.6777, "lr": 0.00014505352990199107, "epoch": 0.4096610621830798, "percentage": 20.48, "elapsed_time": "2:58:52", "remaining_time": "11:34:24"} +{"current_steps": 1540, "total_steps": 7494, "loss": 0.675, "lr": 0.000144990950054702, "epoch": 0.41099546303709633, "percentage": 20.55, "elapsed_time": "2:59:27", "remaining_time": "11:33:50"} +{"current_steps": 1545, "total_steps": 7494, "loss": 0.6802, "lr": 0.0001449279905024067, "epoch": 0.41232986389111287, "percentage": 20.62, "elapsed_time": "3:00:21", "remaining_time": "11:34:27"} +{"current_steps": 1550, "total_steps": 7494, "loss": 0.6786, "lr": 0.00014486465158666443, "epoch": 0.41366426474512946, "percentage": 20.68, "elapsed_time": "3:01:55", "remaining_time": "11:37:38"} +{"current_steps": 1555, "total_steps": 7494, "loss": 0.6965, "lr": 0.00014480093365109252, "epoch": 0.414998665599146, "percentage": 20.75, "elapsed_time": "3:02:20", "remaining_time": "11:36:26"} +{"current_steps": 1560, "total_steps": 7494, "loss": 0.6732, "lr": 0.00014473683704136454, "epoch": 0.41633306645316254, "percentage": 20.82, "elapsed_time": "3:03:01", "remaining_time": "11:36:11"} +{"current_steps": 1565, "total_steps": 7494, "loss": 0.6729, "lr": 0.0001446723621052083, "epoch": 0.4176674673071791, "percentage": 20.88, "elapsed_time": "3:03:50", "remaining_time": "11:36:30"} +{"current_steps": 1570, "total_steps": 7494, "loss": 0.661, "lr": 0.00014460750919240416, "epoch": 0.4190018681611956, "percentage": 20.95, "elapsed_time": "3:04:18", "remaining_time": "11:35:27"} +{"current_steps": 1575, "total_steps": 7494, "loss": 0.6766, "lr": 0.00014454227865478292, "epoch": 0.42033626901521215, "percentage": 21.02, "elapsed_time": "3:04:44", "remaining_time": "11:34:16"} +{"current_steps": 1580, "total_steps": 7494, "loss": 0.6901, "lr": 0.0001444766708462241, "epoch": 0.42167066986922874, "percentage": 21.08, "elapsed_time": "3:05:30", "remaining_time": "11:34:22"} +{"current_steps": 1585, "total_steps": 7494, "loss": 0.6758, "lr": 0.0001444106861226539, "epoch": 0.4230050707232453, "percentage": 21.15, "elapsed_time": "3:06:18", "remaining_time": "11:34:33"} +{"current_steps": 1590, "total_steps": 7494, "loss": 0.669, "lr": 0.00014434432484204335, "epoch": 0.4243394715772618, "percentage": 21.22, "elapsed_time": "3:06:45", "remaining_time": "11:33:28"} +{"current_steps": 1595, "total_steps": 7494, "loss": 0.673, "lr": 0.0001442775873644062, "epoch": 0.42567387243127836, "percentage": 21.28, "elapsed_time": "3:07:11", "remaining_time": "11:32:20"} +{"current_steps": 1600, "total_steps": 7494, "loss": 0.6803, "lr": 0.00014421047405179725, "epoch": 0.4270082732852949, "percentage": 21.35, "elapsed_time": "3:08:00", "remaining_time": "11:32:33"} +{"current_steps": 1605, "total_steps": 7494, "loss": 0.6798, "lr": 0.00014414298526831012, "epoch": 0.42834267413931143, "percentage": 21.42, "elapsed_time": "3:08:51", "remaining_time": "11:32:58"} +{"current_steps": 1610, "total_steps": 7494, "loss": 0.6844, "lr": 0.00014407512138007547, "epoch": 0.429677074993328, "percentage": 21.48, "elapsed_time": "3:09:18", "remaining_time": "11:31:50"} +{"current_steps": 1615, "total_steps": 7494, "loss": 0.6608, "lr": 0.0001440068827552588, "epoch": 0.43101147584734456, "percentage": 21.55, "elapsed_time": "3:09:45", "remaining_time": "11:30:47"} +{"current_steps": 1620, "total_steps": 7494, "loss": 0.6947, "lr": 0.0001439382697640587, "epoch": 0.4323458767013611, "percentage": 21.62, "elapsed_time": "3:10:36", "remaining_time": "11:31:07"} +{"current_steps": 1625, "total_steps": 7494, "loss": 0.656, "lr": 0.00014386928277870461, "epoch": 0.43368027755537764, "percentage": 21.68, "elapsed_time": "3:11:17", "remaining_time": "11:30:53"} +{"current_steps": 1630, "total_steps": 7494, "loss": 0.6933, "lr": 0.00014379992217345504, "epoch": 0.4350146784093942, "percentage": 21.75, "elapsed_time": "3:11:43", "remaining_time": "11:29:45"} +{"current_steps": 1635, "total_steps": 7494, "loss": 0.6755, "lr": 0.0001437301883245953, "epoch": 0.4363490792634107, "percentage": 21.82, "elapsed_time": "3:12:14", "remaining_time": "11:28:53"} +{"current_steps": 1640, "total_steps": 7494, "loss": 0.6701, "lr": 0.0001436600816104356, "epoch": 0.43768348011742725, "percentage": 21.88, "elapsed_time": "3:13:05", "remaining_time": "11:29:15"} +{"current_steps": 1645, "total_steps": 7494, "loss": 0.6714, "lr": 0.000143589602411309, "epoch": 0.43901788097144384, "percentage": 21.95, "elapsed_time": "3:13:42", "remaining_time": "11:28:45"} +{"current_steps": 1650, "total_steps": 7494, "loss": 0.6682, "lr": 0.00014351875110956927, "epoch": 0.4403522818254604, "percentage": 22.02, "elapsed_time": "3:14:08", "remaining_time": "11:27:35"} +{"current_steps": 1655, "total_steps": 7494, "loss": 0.6872, "lr": 0.00014344752808958887, "epoch": 0.4416866826794769, "percentage": 22.08, "elapsed_time": "3:15:06", "remaining_time": "11:28:20"} +{"current_steps": 1660, "total_steps": 7494, "loss": 0.669, "lr": 0.0001433759337377569, "epoch": 0.44302108353349345, "percentage": 22.15, "elapsed_time": "3:15:57", "remaining_time": "11:28:41"} +{"current_steps": 1665, "total_steps": 7494, "loss": 0.6658, "lr": 0.00014330396844247685, "epoch": 0.44435548438751, "percentage": 22.22, "elapsed_time": "3:16:31", "remaining_time": "11:28:01"} +{"current_steps": 1670, "total_steps": 7494, "loss": 0.6726, "lr": 0.0001432316325941647, "epoch": 0.44568988524152653, "percentage": 22.28, "elapsed_time": "3:16:57", "remaining_time": "11:26:51"} +{"current_steps": 1675, "total_steps": 7494, "loss": 0.6806, "lr": 0.00014315892658524665, "epoch": 0.4470242860955431, "percentage": 22.35, "elapsed_time": "3:17:31", "remaining_time": "11:26:13"} +{"current_steps": 1680, "total_steps": 7494, "loss": 0.6527, "lr": 0.0001430858508101571, "epoch": 0.44835868694955966, "percentage": 22.42, "elapsed_time": "3:18:25", "remaining_time": "11:26:39"} +{"current_steps": 1685, "total_steps": 7494, "loss": 0.6911, "lr": 0.00014301240566533637, "epoch": 0.4496930878035762, "percentage": 22.48, "elapsed_time": "3:18:57", "remaining_time": "11:25:53"} +{"current_steps": 1690, "total_steps": 7494, "loss": 0.6644, "lr": 0.00014293859154922866, "epoch": 0.45102748865759273, "percentage": 22.55, "elapsed_time": "3:19:22", "remaining_time": "11:24:43"} +{"current_steps": 1695, "total_steps": 7494, "loss": 0.6786, "lr": 0.00014286440886227995, "epoch": 0.45236188951160927, "percentage": 22.62, "elapsed_time": "3:20:01", "remaining_time": "11:24:20"} +{"current_steps": 1700, "total_steps": 7494, "loss": 0.6921, "lr": 0.00014278985800693562, "epoch": 0.4536962903656258, "percentage": 22.68, "elapsed_time": "3:20:53", "remaining_time": "11:24:39"} +{"current_steps": 1705, "total_steps": 7494, "loss": 0.6653, "lr": 0.0001427149393876384, "epoch": 0.4550306912196424, "percentage": 22.75, "elapsed_time": "3:21:30", "remaining_time": "11:24:10"} +{"current_steps": 1710, "total_steps": 7494, "loss": 0.6748, "lr": 0.00014263965341082622, "epoch": 0.45636509207365894, "percentage": 22.82, "elapsed_time": "3:21:56", "remaining_time": "11:23:02"} +{"current_steps": 1715, "total_steps": 7494, "loss": 0.6913, "lr": 0.00014256400048492994, "epoch": 0.4576994929276755, "percentage": 22.88, "elapsed_time": "3:22:39", "remaining_time": "11:22:55"} +{"current_steps": 1720, "total_steps": 7494, "loss": 0.652, "lr": 0.00014248798102037106, "epoch": 0.459033893781692, "percentage": 22.95, "elapsed_time": "3:23:28", "remaining_time": "11:23:04"} +{"current_steps": 1725, "total_steps": 7494, "loss": 0.6779, "lr": 0.0001424115954295597, "epoch": 0.46036829463570855, "percentage": 23.02, "elapsed_time": "3:23:56", "remaining_time": "11:22:03"} +{"current_steps": 1730, "total_steps": 7494, "loss": 0.6751, "lr": 0.00014233484412689212, "epoch": 0.4617026954897251, "percentage": 23.09, "elapsed_time": "3:24:22", "remaining_time": "11:20:56"} +{"current_steps": 1735, "total_steps": 7494, "loss": 0.6628, "lr": 0.00014225772752874866, "epoch": 0.4630370963437417, "percentage": 23.15, "elapsed_time": "3:25:10", "remaining_time": "11:21:01"} +{"current_steps": 1740, "total_steps": 7494, "loss": 0.6557, "lr": 0.00014218024605349133, "epoch": 0.4643714971977582, "percentage": 23.22, "elapsed_time": "3:25:55", "remaining_time": "11:20:57"} +{"current_steps": 1745, "total_steps": 7494, "loss": 0.6684, "lr": 0.00014210240012146178, "epoch": 0.46570589805177476, "percentage": 23.29, "elapsed_time": "3:26:22", "remaining_time": "11:19:53"} +{"current_steps": 1750, "total_steps": 7494, "loss": 0.6772, "lr": 0.00014202419015497863, "epoch": 0.4670402989057913, "percentage": 23.35, "elapsed_time": "3:27:26", "remaining_time": "11:20:52"} +{"current_steps": 1755, "total_steps": 7494, "loss": 0.6738, "lr": 0.00014194561657833563, "epoch": 0.46837469975980783, "percentage": 23.42, "elapsed_time": "3:28:16", "remaining_time": "11:21:05"} +{"current_steps": 1760, "total_steps": 7494, "loss": 0.6652, "lr": 0.000141866679817799, "epoch": 0.46970910061382437, "percentage": 23.49, "elapsed_time": "3:28:58", "remaining_time": "11:20:51"} +{"current_steps": 1765, "total_steps": 7494, "loss": 0.6765, "lr": 0.00014178738030160527, "epoch": 0.47104350146784096, "percentage": 23.55, "elapsed_time": "3:29:25", "remaining_time": "11:19:45"} +{"current_steps": 1770, "total_steps": 7494, "loss": 0.6717, "lr": 0.000141707718459959, "epoch": 0.4723779023218575, "percentage": 23.62, "elapsed_time": "3:29:54", "remaining_time": "11:18:48"} +{"current_steps": 1775, "total_steps": 7494, "loss": 0.6519, "lr": 0.00014162769472503032, "epoch": 0.47371230317587404, "percentage": 23.69, "elapsed_time": "3:30:43", "remaining_time": "11:18:57"} +{"current_steps": 1780, "total_steps": 7494, "loss": 0.6537, "lr": 0.00014154730953095274, "epoch": 0.4750467040298906, "percentage": 23.75, "elapsed_time": "3:31:23", "remaining_time": "11:18:35"} +{"current_steps": 1785, "total_steps": 7494, "loss": 0.6809, "lr": 0.0001414665633138206, "epoch": 0.4763811048839071, "percentage": 23.82, "elapsed_time": "3:31:49", "remaining_time": "11:17:27"} +{"current_steps": 1790, "total_steps": 7494, "loss": 0.6836, "lr": 0.00014138545651168683, "epoch": 0.47771550573792365, "percentage": 23.89, "elapsed_time": "3:33:07", "remaining_time": "11:19:08"} +{"current_steps": 1795, "total_steps": 7494, "loss": 0.6641, "lr": 0.00014130398956456062, "epoch": 0.47904990659194024, "percentage": 23.95, "elapsed_time": "3:33:59", "remaining_time": "11:19:25"} +{"current_steps": 1800, "total_steps": 7494, "loss": 0.6713, "lr": 0.00014122216291440496, "epoch": 0.4803843074459568, "percentage": 24.02, "elapsed_time": "3:34:36", "remaining_time": "11:18:51"} +{"current_steps": 1805, "total_steps": 7494, "loss": 0.6783, "lr": 0.00014113997700513422, "epoch": 0.4817187082999733, "percentage": 24.09, "elapsed_time": "3:35:11", "remaining_time": "11:18:14"} +{"current_steps": 1810, "total_steps": 7494, "loss": 0.6494, "lr": 0.00014105743228261174, "epoch": 0.48305310915398986, "percentage": 24.15, "elapsed_time": "3:35:45", "remaining_time": "11:17:33"} +{"current_steps": 1815, "total_steps": 7494, "loss": 0.6816, "lr": 0.00014097452919464748, "epoch": 0.4843875100080064, "percentage": 24.22, "elapsed_time": "3:36:36", "remaining_time": "11:17:44"} +{"current_steps": 1820, "total_steps": 7494, "loss": 0.66, "lr": 0.00014089126819099557, "epoch": 0.48572191086202293, "percentage": 24.29, "elapsed_time": "3:37:09", "remaining_time": "11:17:01"} +{"current_steps": 1825, "total_steps": 7494, "loss": 0.6817, "lr": 0.00014080764972335184, "epoch": 0.4870563117160395, "percentage": 24.35, "elapsed_time": "3:38:11", "remaining_time": "11:17:46"} +{"current_steps": 1830, "total_steps": 7494, "loss": 0.6693, "lr": 0.00014072367424535135, "epoch": 0.48839071257005606, "percentage": 24.42, "elapsed_time": "3:38:49", "remaining_time": "11:17:16"} +{"current_steps": 1835, "total_steps": 7494, "loss": 0.6695, "lr": 0.000140639342212566, "epoch": 0.4897251134240726, "percentage": 24.49, "elapsed_time": "3:39:41", "remaining_time": "11:17:29"} +{"current_steps": 1840, "total_steps": 7494, "loss": 0.6667, "lr": 0.000140554654082502, "epoch": 0.49105951427808914, "percentage": 24.55, "elapsed_time": "3:40:11", "remaining_time": "11:16:37"} +{"current_steps": 1845, "total_steps": 7494, "loss": 0.6849, "lr": 0.0001404696103145975, "epoch": 0.4923939151321057, "percentage": 24.62, "elapsed_time": "3:40:37", "remaining_time": "11:15:30"} +{"current_steps": 1850, "total_steps": 7494, "loss": 0.6609, "lr": 0.0001403842113702198, "epoch": 0.4937283159861222, "percentage": 24.69, "elapsed_time": "3:41:19", "remaining_time": "11:15:14"} +{"current_steps": 1855, "total_steps": 7494, "loss": 0.6801, "lr": 0.00014029845771266325, "epoch": 0.49506271684013875, "percentage": 24.75, "elapsed_time": "3:42:07", "remaining_time": "11:15:14"} +{"current_steps": 1860, "total_steps": 7494, "loss": 0.6827, "lr": 0.00014021234980714648, "epoch": 0.49639711769415534, "percentage": 24.82, "elapsed_time": "3:42:36", "remaining_time": "11:14:18"} +{"current_steps": 1865, "total_steps": 7494, "loss": 0.6815, "lr": 0.00014012588812080992, "epoch": 0.4977315185481719, "percentage": 24.89, "elapsed_time": "3:43:02", "remaining_time": "11:13:11"} +{"current_steps": 1870, "total_steps": 7494, "loss": 0.6667, "lr": 0.00014003907312271319, "epoch": 0.4990659194021884, "percentage": 24.95, "elapsed_time": "3:43:48", "remaining_time": "11:13:06"} +{"current_steps": 1875, "total_steps": 7494, "loss": 0.6664, "lr": 0.0001399519052838329, "epoch": 0.500400320256205, "percentage": 25.02, "elapsed_time": "3:44:37", "remaining_time": "11:13:07"} +{"current_steps": 1880, "total_steps": 7494, "loss": 0.6742, "lr": 0.00013986438507705958, "epoch": 0.5017347211102215, "percentage": 25.09, "elapsed_time": "3:45:39", "remaining_time": "11:13:50"} +{"current_steps": 1885, "total_steps": 7494, "loss": 0.6739, "lr": 0.00013977651297719548, "epoch": 0.503069121964238, "percentage": 25.15, "elapsed_time": "3:46:05", "remaining_time": "11:12:45"} +{"current_steps": 1890, "total_steps": 7494, "loss": 0.6594, "lr": 0.00013968828946095193, "epoch": 0.5044035228182546, "percentage": 25.22, "elapsed_time": "3:46:53", "remaining_time": "11:12:44"} +{"current_steps": 1895, "total_steps": 7494, "loss": 0.6672, "lr": 0.00013959971500694668, "epoch": 0.5057379236722711, "percentage": 25.29, "elapsed_time": "3:47:38", "remaining_time": "11:12:34"} +{"current_steps": 1900, "total_steps": 7494, "loss": 0.67, "lr": 0.00013951079009570132, "epoch": 0.5070723245262877, "percentage": 25.35, "elapsed_time": "3:48:38", "remaining_time": "11:13:11"} +{"current_steps": 1905, "total_steps": 7494, "loss": 0.6659, "lr": 0.00013942151520963868, "epoch": 0.5084067253803043, "percentage": 25.42, "elapsed_time": "3:49:16", "remaining_time": "11:12:39"} +{"current_steps": 1905, "total_steps": 7494, "loss": 0.6659, "lr": 0.00013942151520963868, "epoch": 0.5084067253803043, "percentage": 25.42, "elapsed_time": "0:09:07", "remaining_time": "0:26:46"} +{"current_steps": 1910, "total_steps": 7494, "loss": 0.6738, "lr": 0.00013933189083308031, "epoch": 0.5097411262343208, "percentage": 25.49, "elapsed_time": "0:11:22", "remaining_time": "0:33:16"} +{"current_steps": 1915, "total_steps": 7494, "loss": 0.6608, "lr": 0.00013924191745224364, "epoch": 0.5110755270883374, "percentage": 25.55, "elapsed_time": "0:12:13", "remaining_time": "0:35:38"} +{"current_steps": 1920, "total_steps": 7494, "loss": 0.6848, "lr": 0.00013915159555523957, "epoch": 0.5124099279423538, "percentage": 25.62, "elapsed_time": "0:13:15", "remaining_time": "0:38:29"} +{"current_steps": 1925, "total_steps": 7494, "loss": 0.6524, "lr": 0.00013906092563206968, "epoch": 0.5137443287963704, "percentage": 25.69, "elapsed_time": "0:13:41", "remaining_time": "0:39:37"} +{"current_steps": 1930, "total_steps": 7494, "loss": 0.6795, "lr": 0.00013896990817462363, "epoch": 0.5150787296503869, "percentage": 25.75, "elapsed_time": "0:14:07", "remaining_time": "0:40:43"} +{"current_steps": 1935, "total_steps": 7494, "loss": 0.6714, "lr": 0.00013887854367667645, "epoch": 0.5164131305044035, "percentage": 25.82, "elapsed_time": "0:14:38", "remaining_time": "0:42:04"} +{"current_steps": 1940, "total_steps": 7494, "loss": 0.6747, "lr": 0.00013878683263388587, "epoch": 0.5177475313584201, "percentage": 25.89, "elapsed_time": "0:15:29", "remaining_time": "0:44:20"} +{"current_steps": 1945, "total_steps": 7494, "loss": 0.6727, "lr": 0.00013869477554378972, "epoch": 0.5190819322124366, "percentage": 25.95, "elapsed_time": "0:15:54", "remaining_time": "0:45:24"} +{"current_steps": 1950, "total_steps": 7494, "loss": 0.6532, "lr": 0.00013860237290580306, "epoch": 0.5204163330664532, "percentage": 26.02, "elapsed_time": "0:16:20", "remaining_time": "0:46:26"} +{"current_steps": 1955, "total_steps": 7494, "loss": 0.679, "lr": 0.00013850962522121569, "epoch": 0.5217507339204697, "percentage": 26.09, "elapsed_time": "0:17:14", "remaining_time": "0:48:50"} +{"current_steps": 1960, "total_steps": 7494, "loss": 0.6655, "lr": 0.00013841653299318915, "epoch": 0.5230851347744863, "percentage": 26.15, "elapsed_time": "0:17:42", "remaining_time": "0:49:59"} +{"current_steps": 1965, "total_steps": 7494, "loss": 0.6503, "lr": 0.00013832309672675428, "epoch": 0.5244195356285029, "percentage": 26.22, "elapsed_time": "0:18:07", "remaining_time": "0:51:00"} +{"current_steps": 1970, "total_steps": 7494, "loss": 0.6734, "lr": 0.00013822931692880828, "epoch": 0.5257539364825193, "percentage": 26.29, "elapsed_time": "0:18:33", "remaining_time": "0:52:01"} +{"current_steps": 1975, "total_steps": 7494, "loss": 0.6681, "lr": 0.00013813519410811208, "epoch": 0.5270883373365359, "percentage": 26.35, "elapsed_time": "0:19:31", "remaining_time": "0:54:33"} +{"current_steps": 1980, "total_steps": 7494, "loss": 0.6816, "lr": 0.00013804072877528746, "epoch": 0.5284227381905524, "percentage": 26.42, "elapsed_time": "0:19:56", "remaining_time": "0:55:32"} +{"current_steps": 1985, "total_steps": 7494, "loss": 0.6596, "lr": 0.0001379459214428144, "epoch": 0.529757139044569, "percentage": 26.49, "elapsed_time": "0:20:22", "remaining_time": "0:56:31"} +{"current_steps": 1990, "total_steps": 7494, "loss": 0.6697, "lr": 0.0001378507726250283, "epoch": 0.5310915398985855, "percentage": 26.55, "elapsed_time": "0:20:55", "remaining_time": "0:57:51"} +{"current_steps": 1995, "total_steps": 7494, "loss": 0.6639, "lr": 0.00013775528283811695, "epoch": 0.5324259407526021, "percentage": 26.62, "elapsed_time": "0:21:46", "remaining_time": "1:00:01"} +{"current_steps": 2000, "total_steps": 7494, "loss": 0.6693, "lr": 0.00013765945260011815, "epoch": 0.5337603416066187, "percentage": 26.69, "elapsed_time": "0:22:11", "remaining_time": "1:00:58"} +{"current_steps": 2005, "total_steps": 7494, "loss": 0.6642, "lr": 0.0001375632824309165, "epoch": 0.5350947424606352, "percentage": 26.75, "elapsed_time": "0:22:45", "remaining_time": "1:02:19"} +{"current_steps": 2010, "total_steps": 7494, "loss": 0.6661, "lr": 0.00013746677285224082, "epoch": 0.5364291433146517, "percentage": 26.82, "elapsed_time": "0:23:38", "remaining_time": "1:04:30"} +{"current_steps": 2015, "total_steps": 7494, "loss": 0.658, "lr": 0.00013736992438766123, "epoch": 0.5377635441686682, "percentage": 26.89, "elapsed_time": "0:24:09", "remaining_time": "1:05:41"} +{"current_steps": 2020, "total_steps": 7494, "loss": 0.6595, "lr": 0.00013727273756258633, "epoch": 0.5390979450226848, "percentage": 26.95, "elapsed_time": "0:24:35", "remaining_time": "1:06:37"} +{"current_steps": 2025, "total_steps": 7494, "loss": 0.6584, "lr": 0.00013717521290426034, "epoch": 0.5404323458767014, "percentage": 27.02, "elapsed_time": "0:25:00", "remaining_time": "1:07:31"} +{"current_steps": 2030, "total_steps": 7494, "loss": 0.663, "lr": 0.00013707735094176026, "epoch": 0.5417667467307179, "percentage": 27.09, "elapsed_time": "0:25:56", "remaining_time": "1:09:50"} +{"current_steps": 2035, "total_steps": 7494, "loss": 0.6694, "lr": 0.00013697915220599294, "epoch": 0.5431011475847345, "percentage": 27.16, "elapsed_time": "0:26:22", "remaining_time": "1:10:45"} +{"current_steps": 2040, "total_steps": 7494, "loss": 0.6617, "lr": 0.0001368806172296923, "epoch": 0.544435548438751, "percentage": 27.22, "elapsed_time": "0:26:47", "remaining_time": "1:11:38"} +{"current_steps": 2045, "total_steps": 7494, "loss": 0.6478, "lr": 0.00013678174654741638, "epoch": 0.5457699492927676, "percentage": 27.29, "elapsed_time": "0:27:19", "remaining_time": "1:12:47"} +{"current_steps": 2050, "total_steps": 7494, "loss": 0.6764, "lr": 0.00013668254069554439, "epoch": 0.547104350146784, "percentage": 27.36, "elapsed_time": "0:28:12", "remaining_time": "1:14:54"} +{"current_steps": 2055, "total_steps": 7494, "loss": 0.6746, "lr": 0.00013658300021227387, "epoch": 0.5484387510008006, "percentage": 27.42, "elapsed_time": "0:28:37", "remaining_time": "1:15:46"} +{"current_steps": 2060, "total_steps": 7494, "loss": 0.6497, "lr": 0.00013648312563761784, "epoch": 0.5497731518548172, "percentage": 27.49, "elapsed_time": "0:29:02", "remaining_time": "1:16:37"} +{"current_steps": 2065, "total_steps": 7494, "loss": 0.6569, "lr": 0.0001363829175134017, "epoch": 0.5511075527088337, "percentage": 27.56, "elapsed_time": "0:29:53", "remaining_time": "1:18:35"} +{"current_steps": 2070, "total_steps": 7494, "loss": 0.6684, "lr": 0.00013628237638326038, "epoch": 0.5524419535628503, "percentage": 27.62, "elapsed_time": "0:30:29", "remaining_time": "1:19:54"} +{"current_steps": 2075, "total_steps": 7494, "loss": 0.6607, "lr": 0.0001361815027926354, "epoch": 0.5537763544168668, "percentage": 27.69, "elapsed_time": "0:30:54", "remaining_time": "1:20:43"} +{"current_steps": 2080, "total_steps": 7494, "loss": 0.6572, "lr": 0.00013608029728877195, "epoch": 0.5551107552708834, "percentage": 27.76, "elapsed_time": "0:31:20", "remaining_time": "1:21:33"} +{"current_steps": 2085, "total_steps": 7494, "loss": 0.6703, "lr": 0.00013597876042071574, "epoch": 0.5564451561248999, "percentage": 27.82, "elapsed_time": "0:32:17", "remaining_time": "1:23:46"} +{"current_steps": 2090, "total_steps": 7494, "loss": 0.6631, "lr": 0.00013587689273931032, "epoch": 0.5577795569789165, "percentage": 27.89, "elapsed_time": "0:32:44", "remaining_time": "1:24:39"} +{"current_steps": 2095, "total_steps": 7494, "loss": 0.6818, "lr": 0.00013577469479719376, "epoch": 0.559113957832933, "percentage": 27.96, "elapsed_time": "0:33:09", "remaining_time": "1:25:27"} +{"current_steps": 2100, "total_steps": 7494, "loss": 0.6575, "lr": 0.00013567216714879593, "epoch": 0.5604483586869495, "percentage": 28.02, "elapsed_time": "0:33:37", "remaining_time": "1:26:22"} +{"current_steps": 2105, "total_steps": 7494, "loss": 0.6993, "lr": 0.00013556931035033526, "epoch": 0.5617827595409661, "percentage": 28.09, "elapsed_time": "0:34:46", "remaining_time": "1:29:00"} +{"current_steps": 2110, "total_steps": 7494, "loss": 0.6811, "lr": 0.00013546612495981603, "epoch": 0.5631171603949826, "percentage": 28.16, "elapsed_time": "0:35:11", "remaining_time": "1:29:47"} +{"current_steps": 2115, "total_steps": 7494, "loss": 0.661, "lr": 0.00013536261153702494, "epoch": 0.5644515612489992, "percentage": 28.22, "elapsed_time": "0:35:36", "remaining_time": "1:30:33"} +{"current_steps": 2120, "total_steps": 7494, "loss": 0.6495, "lr": 0.0001352587706435284, "epoch": 0.5657859621030158, "percentage": 28.29, "elapsed_time": "0:36:18", "remaining_time": "1:32:02"} +{"current_steps": 2125, "total_steps": 7494, "loss": 0.6653, "lr": 0.00013515460284266933, "epoch": 0.5671203629570323, "percentage": 28.36, "elapsed_time": "0:37:02", "remaining_time": "1:33:34"} +{"current_steps": 2130, "total_steps": 7494, "loss": 0.6567, "lr": 0.0001350501086995642, "epoch": 0.5684547638110489, "percentage": 28.42, "elapsed_time": "0:37:27", "remaining_time": "1:34:19"} +{"current_steps": 2135, "total_steps": 7494, "loss": 0.6756, "lr": 0.00013494528878109978, "epoch": 0.5697891646650654, "percentage": 28.49, "elapsed_time": "0:37:52", "remaining_time": "1:35:03"} +{"current_steps": 2140, "total_steps": 7494, "loss": 0.6668, "lr": 0.00013484014365593036, "epoch": 0.5711235655190819, "percentage": 28.56, "elapsed_time": "0:38:47", "remaining_time": "1:37:03"} +{"current_steps": 2145, "total_steps": 7494, "loss": 0.6559, "lr": 0.00013473467389447436, "epoch": 0.5724579663730984, "percentage": 28.62, "elapsed_time": "0:39:19", "remaining_time": "1:38:03"} +{"current_steps": 2150, "total_steps": 7494, "loss": 0.6521, "lr": 0.0001346288800689114, "epoch": 0.573792367227115, "percentage": 28.69, "elapsed_time": "0:39:44", "remaining_time": "1:38:47"} +{"current_steps": 2155, "total_steps": 7494, "loss": 0.6762, "lr": 0.00013452276275317926, "epoch": 0.5751267680811316, "percentage": 28.76, "elapsed_time": "0:40:10", "remaining_time": "1:39:31"} +{"current_steps": 2160, "total_steps": 7494, "loss": 0.6537, "lr": 0.00013441632252297054, "epoch": 0.5764611689351481, "percentage": 28.82, "elapsed_time": "0:41:11", "remaining_time": "1:41:42"} +{"current_steps": 2165, "total_steps": 7494, "loss": 0.6663, "lr": 0.0001343095599557297, "epoch": 0.5777955697891647, "percentage": 28.89, "elapsed_time": "0:41:38", "remaining_time": "1:42:29"} +{"current_steps": 2170, "total_steps": 7494, "loss": 0.6739, "lr": 0.00013420247563064998, "epoch": 0.5791299706431812, "percentage": 28.96, "elapsed_time": "0:42:03", "remaining_time": "1:43:10"} +{"current_steps": 2175, "total_steps": 7494, "loss": 0.6695, "lr": 0.0001340950701286701, "epoch": 0.5804643714971978, "percentage": 29.02, "elapsed_time": "0:42:36", "remaining_time": "1:44:12"} +{"current_steps": 2180, "total_steps": 7494, "loss": 0.6705, "lr": 0.0001339873440324712, "epoch": 0.5817987723512144, "percentage": 29.09, "elapsed_time": "0:43:30", "remaining_time": "1:46:03"} +{"current_steps": 2185, "total_steps": 7494, "loss": 0.6558, "lr": 0.00013387929792647366, "epoch": 0.5831331732052308, "percentage": 29.16, "elapsed_time": "0:43:56", "remaining_time": "1:46:45"} +{"current_steps": 2190, "total_steps": 7494, "loss": 0.6719, "lr": 0.00013377093239683396, "epoch": 0.5844675740592474, "percentage": 29.22, "elapsed_time": "0:44:21", "remaining_time": "1:47:26"} +{"current_steps": 2195, "total_steps": 7494, "loss": 0.686, "lr": 0.0001336622480314414, "epoch": 0.5858019749132639, "percentage": 29.29, "elapsed_time": "0:45:09", "remaining_time": "1:49:01"} +{"current_steps": 2200, "total_steps": 7494, "loss": 0.6544, "lr": 0.00013355324541991512, "epoch": 0.5871363757672805, "percentage": 29.36, "elapsed_time": "0:45:49", "remaining_time": "1:50:16"} +{"current_steps": 2205, "total_steps": 7494, "loss": 0.6435, "lr": 0.00013344392515360055, "epoch": 0.588470776621297, "percentage": 29.42, "elapsed_time": "0:46:49", "remaining_time": "1:52:18"} +{"current_steps": 2210, "total_steps": 7494, "loss": 0.6601, "lr": 0.0001333342878255667, "epoch": 0.5898051774753136, "percentage": 29.49, "elapsed_time": "0:47:14", "remaining_time": "1:52:57"} +{"current_steps": 2215, "total_steps": 7494, "loss": 0.6628, "lr": 0.00013322433403060237, "epoch": 0.5911395783293302, "percentage": 29.56, "elapsed_time": "0:48:11", "remaining_time": "1:54:51"} +{"current_steps": 2220, "total_steps": 7494, "loss": 0.6544, "lr": 0.0001331140643652134, "epoch": 0.5924739791833467, "percentage": 29.62, "elapsed_time": "0:48:40", "remaining_time": "1:55:39"} +{"current_steps": 2225, "total_steps": 7494, "loss": 0.6569, "lr": 0.00013300347942761916, "epoch": 0.5938083800373632, "percentage": 29.69, "elapsed_time": "0:49:31", "remaining_time": "1:57:17"} +{"current_steps": 2230, "total_steps": 7494, "loss": 0.6663, "lr": 0.00013289257981774944, "epoch": 0.5951427808913797, "percentage": 29.76, "elapsed_time": "0:49:59", "remaining_time": "1:57:59"} +{"current_steps": 2235, "total_steps": 7494, "loss": 0.6717, "lr": 0.0001327813661372411, "epoch": 0.5964771817453963, "percentage": 29.82, "elapsed_time": "0:51:34", "remaining_time": "2:01:21"} +{"current_steps": 2240, "total_steps": 7494, "loss": 0.6473, "lr": 0.00013266983898943495, "epoch": 0.5978115825994129, "percentage": 29.89, "elapsed_time": "0:53:35", "remaining_time": "2:05:41"} +{"current_steps": 2245, "total_steps": 7494, "loss": 0.6732, "lr": 0.00013255799897937218, "epoch": 0.5991459834534294, "percentage": 29.96, "elapsed_time": "0:55:44", "remaining_time": "2:10:18"} +{"current_steps": 2250, "total_steps": 7494, "loss": 0.6703, "lr": 0.0001324458467137915, "epoch": 0.600480384307446, "percentage": 30.02, "elapsed_time": "0:56:22", "remaining_time": "2:11:23"} +{"current_steps": 2255, "total_steps": 7494, "loss": 0.6554, "lr": 0.00013233338280112548, "epoch": 0.6018147851614625, "percentage": 30.09, "elapsed_time": "0:57:11", "remaining_time": "2:12:52"} +{"current_steps": 2260, "total_steps": 7494, "loss": 0.6673, "lr": 0.00013222060785149744, "epoch": 0.6031491860154791, "percentage": 30.16, "elapsed_time": "0:57:36", "remaining_time": "2:13:25"} +{"current_steps": 2265, "total_steps": 7494, "loss": 0.6774, "lr": 0.00013210752247671813, "epoch": 0.6044835868694955, "percentage": 30.22, "elapsed_time": "0:58:01", "remaining_time": "2:13:58"} +{"current_steps": 2270, "total_steps": 7494, "loss": 0.6598, "lr": 0.00013199412729028226, "epoch": 0.6058179877235121, "percentage": 30.29, "elapsed_time": "0:58:50", "remaining_time": "2:15:24"} +{"current_steps": 2275, "total_steps": 7494, "loss": 0.6705, "lr": 0.00013188042290736542, "epoch": 0.6071523885775287, "percentage": 30.36, "elapsed_time": "0:59:26", "remaining_time": "2:16:22"} +{"current_steps": 2280, "total_steps": 7494, "loss": 0.6441, "lr": 0.00013176640994482056, "epoch": 0.6084867894315452, "percentage": 30.42, "elapsed_time": "1:00:45", "remaining_time": "2:18:56"} +{"current_steps": 2285, "total_steps": 7494, "loss": 0.6681, "lr": 0.00013165208902117466, "epoch": 0.6098211902855618, "percentage": 30.49, "elapsed_time": "1:01:11", "remaining_time": "2:19:29"} +{"current_steps": 2290, "total_steps": 7494, "loss": 0.6626, "lr": 0.0001315374607566254, "epoch": 0.6111555911395783, "percentage": 30.56, "elapsed_time": "1:02:39", "remaining_time": "2:22:23"} +{"current_steps": 2295, "total_steps": 7494, "loss": 0.6702, "lr": 0.0001314225257730379, "epoch": 0.6124899919935949, "percentage": 30.62, "elapsed_time": "1:04:17", "remaining_time": "2:25:37"} +{"current_steps": 2300, "total_steps": 7494, "loss": 0.662, "lr": 0.00013130728469394113, "epoch": 0.6138243928476115, "percentage": 30.69, "elapsed_time": "1:07:40", "remaining_time": "2:32:50"} +{"current_steps": 2305, "total_steps": 7494, "loss": 0.6623, "lr": 0.00013119173814452474, "epoch": 0.615158793701628, "percentage": 30.76, "elapsed_time": "1:09:04", "remaining_time": "2:35:30"} +{"current_steps": 2310, "total_steps": 7494, "loss": 0.6636, "lr": 0.0001310758867516355, "epoch": 0.6164931945556446, "percentage": 30.82, "elapsed_time": "1:10:01", "remaining_time": "2:37:08"} +{"current_steps": 2315, "total_steps": 7494, "loss": 0.6504, "lr": 0.00013095973114377401, "epoch": 0.617827595409661, "percentage": 30.89, "elapsed_time": "1:10:28", "remaining_time": "2:37:39"} +{"current_steps": 2320, "total_steps": 7494, "loss": 0.6712, "lr": 0.00013084327195109127, "epoch": 0.6191619962636776, "percentage": 30.96, "elapsed_time": "1:10:53", "remaining_time": "2:38:06"} +{"current_steps": 2325, "total_steps": 7494, "loss": 0.6776, "lr": 0.0001307265098053852, "epoch": 0.6204963971176941, "percentage": 31.02, "elapsed_time": "1:11:31", "remaining_time": "2:39:00"} +{"current_steps": 2330, "total_steps": 7494, "loss": 0.6592, "lr": 0.00013060944534009727, "epoch": 0.6218307979717107, "percentage": 31.09, "elapsed_time": "1:12:21", "remaining_time": "2:40:22"} +{"current_steps": 2335, "total_steps": 7494, "loss": 0.6713, "lr": 0.00013049207919030913, "epoch": 0.6231651988257273, "percentage": 31.16, "elapsed_time": "1:12:46", "remaining_time": "2:40:47"} +{"current_steps": 2340, "total_steps": 7494, "loss": 0.6717, "lr": 0.000130374411992739, "epoch": 0.6244995996797438, "percentage": 31.22, "elapsed_time": "1:13:12", "remaining_time": "2:41:13"} +{"current_steps": 2345, "total_steps": 7494, "loss": 0.6736, "lr": 0.00013025644438573828, "epoch": 0.6258340005337604, "percentage": 31.29, "elapsed_time": "1:13:57", "remaining_time": "2:42:24"} +{"current_steps": 2350, "total_steps": 7494, "loss": 0.6603, "lr": 0.0001301381770092882, "epoch": 0.6271684013877769, "percentage": 31.36, "elapsed_time": "1:14:39", "remaining_time": "2:43:26"} +{"current_steps": 2355, "total_steps": 7494, "loss": 0.6598, "lr": 0.00013001961050499618, "epoch": 0.6285028022417934, "percentage": 31.43, "elapsed_time": "1:15:05", "remaining_time": "2:43:50"} +{"current_steps": 2360, "total_steps": 7494, "loss": 0.6479, "lr": 0.00012990074551609248, "epoch": 0.6298372030958099, "percentage": 31.49, "elapsed_time": "1:15:30", "remaining_time": "2:44:15"} +{"current_steps": 2365, "total_steps": 7494, "loss": 0.646, "lr": 0.00012978158268742656, "epoch": 0.6311716039498265, "percentage": 31.56, "elapsed_time": "1:16:24", "remaining_time": "2:45:42"} +{"current_steps": 2370, "total_steps": 7494, "loss": 0.6737, "lr": 0.00012966212266546384, "epoch": 0.6325060048038431, "percentage": 31.63, "elapsed_time": "1:16:55", "remaining_time": "2:46:19"} +{"current_steps": 2375, "total_steps": 7494, "loss": 0.677, "lr": 0.0001295423660982819, "epoch": 0.6338404056578596, "percentage": 31.69, "elapsed_time": "1:17:20", "remaining_time": "2:46:42"} +{"current_steps": 2380, "total_steps": 7494, "loss": 0.6729, "lr": 0.00012942231363556717, "epoch": 0.6351748065118762, "percentage": 31.76, "elapsed_time": "1:17:49", "remaining_time": "2:47:13"} +{"current_steps": 2385, "total_steps": 7494, "loss": 0.6387, "lr": 0.00012930196592861123, "epoch": 0.6365092073658927, "percentage": 31.83, "elapsed_time": "1:18:49", "remaining_time": "2:48:52"} +{"current_steps": 2390, "total_steps": 7494, "loss": 0.6617, "lr": 0.0001291813236303075, "epoch": 0.6378436082199093, "percentage": 31.89, "elapsed_time": "1:19:18", "remaining_time": "2:49:21"} +{"current_steps": 2395, "total_steps": 7494, "loss": 0.6613, "lr": 0.0001290603873951475, "epoch": 0.6391780090739259, "percentage": 31.96, "elapsed_time": "1:19:43", "remaining_time": "2:49:44"} +{"current_steps": 2400, "total_steps": 7494, "loss": 0.6552, "lr": 0.0001289391578792174, "epoch": 0.6405124099279423, "percentage": 32.03, "elapsed_time": "1:20:18", "remaining_time": "2:50:26"} +{"current_steps": 2405, "total_steps": 7494, "loss": 0.6609, "lr": 0.0001288176357401944, "epoch": 0.6418468107819589, "percentage": 32.09, "elapsed_time": "1:21:18", "remaining_time": "2:52:02"} +{"current_steps": 2410, "total_steps": 7494, "loss": 0.6621, "lr": 0.00012869582163734327, "epoch": 0.6431812116359754, "percentage": 32.16, "elapsed_time": "1:21:44", "remaining_time": "2:52:25"} +{"current_steps": 2415, "total_steps": 7494, "loss": 0.6459, "lr": 0.00012857371623151265, "epoch": 0.644515612489992, "percentage": 32.23, "elapsed_time": "1:22:09", "remaining_time": "2:52:47"} +{"current_steps": 2420, "total_steps": 7494, "loss": 0.6576, "lr": 0.00012845132018513147, "epoch": 0.6458500133440085, "percentage": 32.29, "elapsed_time": "1:22:54", "remaining_time": "2:53:49"} +{"current_steps": 2425, "total_steps": 7494, "loss": 0.6704, "lr": 0.00012832863416220556, "epoch": 0.6471844141980251, "percentage": 32.36, "elapsed_time": "1:23:37", "remaining_time": "2:54:48"} +{"current_steps": 2430, "total_steps": 7494, "loss": 0.6504, "lr": 0.00012820565882831365, "epoch": 0.6485188150520417, "percentage": 32.43, "elapsed_time": "1:24:03", "remaining_time": "2:55:09"} +{"current_steps": 2435, "total_steps": 7494, "loss": 0.6475, "lr": 0.00012808239485060426, "epoch": 0.6498532159060582, "percentage": 32.49, "elapsed_time": "1:24:28", "remaining_time": "2:55:29"} +{"current_steps": 2440, "total_steps": 7494, "loss": 0.6545, "lr": 0.00012795884289779161, "epoch": 0.6511876167600748, "percentage": 32.56, "elapsed_time": "1:26:09", "remaining_time": "2:58:27"} +{"current_steps": 2445, "total_steps": 7494, "loss": 0.6486, "lr": 0.00012783500364015233, "epoch": 0.6525220176140912, "percentage": 32.63, "elapsed_time": "1:26:46", "remaining_time": "2:59:11"} +{"current_steps": 2450, "total_steps": 7494, "loss": 0.6638, "lr": 0.00012771087774952165, "epoch": 0.6538564184681078, "percentage": 32.69, "elapsed_time": "1:27:11", "remaining_time": "2:59:30"} +{"current_steps": 2455, "total_steps": 7494, "loss": 0.6575, "lr": 0.00012758646589928975, "epoch": 0.6551908193221244, "percentage": 32.76, "elapsed_time": "1:27:37", "remaining_time": "2:59:51"} +{"current_steps": 2460, "total_steps": 7494, "loss": 0.677, "lr": 0.00012746176876439824, "epoch": 0.6565252201761409, "percentage": 32.83, "elapsed_time": "1:29:39", "remaining_time": "3:03:28"} +{"current_steps": 2465, "total_steps": 7494, "loss": 0.6493, "lr": 0.00012733678702133642, "epoch": 0.6578596210301575, "percentage": 32.89, "elapsed_time": "1:31:00", "remaining_time": "3:05:39"} +{"current_steps": 2470, "total_steps": 7494, "loss": 0.6624, "lr": 0.00012721152134813755, "epoch": 0.659194021884174, "percentage": 32.96, "elapsed_time": "1:31:25", "remaining_time": "3:05:58"} +{"current_steps": 2475, "total_steps": 7494, "loss": 0.6568, "lr": 0.00012708597242437524, "epoch": 0.6605284227381906, "percentage": 33.03, "elapsed_time": "1:31:56", "remaining_time": "3:06:26"} +{"current_steps": 2480, "total_steps": 7494, "loss": 0.6717, "lr": 0.00012696014093115974, "epoch": 0.661862823592207, "percentage": 33.09, "elapsed_time": "1:33:19", "remaining_time": "3:08:40"} +{"current_steps": 2485, "total_steps": 7494, "loss": 0.6475, "lr": 0.00012683402755113432, "epoch": 0.6631972244462236, "percentage": 33.16, "elapsed_time": "1:37:11", "remaining_time": "3:15:54"} +{"current_steps": 2490, "total_steps": 7494, "loss": 0.6509, "lr": 0.0001267076329684714, "epoch": 0.6645316253002402, "percentage": 33.23, "elapsed_time": "1:38:23", "remaining_time": "3:17:44"} +{"current_steps": 2495, "total_steps": 7494, "loss": 0.6578, "lr": 0.0001265809578688691, "epoch": 0.6658660261542567, "percentage": 33.29, "elapsed_time": "1:39:02", "remaining_time": "3:18:26"} +{"current_steps": 2500, "total_steps": 7494, "loss": 0.664, "lr": 0.00012645400293954714, "epoch": 0.6672004270082733, "percentage": 33.36, "elapsed_time": "1:41:21", "remaining_time": "3:22:28"} +{"current_steps": 2505, "total_steps": 7494, "loss": 0.6793, "lr": 0.0001263267688692435, "epoch": 0.6685348278622898, "percentage": 33.43, "elapsed_time": "1:42:19", "remaining_time": "3:23:48"} +{"current_steps": 2510, "total_steps": 7494, "loss": 0.6613, "lr": 0.00012619925634821052, "epoch": 0.6698692287163064, "percentage": 33.49, "elapsed_time": "1:42:45", "remaining_time": "3:24:01"} +{"current_steps": 2515, "total_steps": 7494, "loss": 0.6525, "lr": 0.00012607146606821105, "epoch": 0.671203629570323, "percentage": 33.56, "elapsed_time": "1:43:59", "remaining_time": "3:25:52"} +{"current_steps": 2520, "total_steps": 7494, "loss": 0.6644, "lr": 0.00012594339872251483, "epoch": 0.6725380304243395, "percentage": 33.63, "elapsed_time": "1:46:20", "remaining_time": "3:29:54"} +{"current_steps": 2525, "total_steps": 7494, "loss": 0.6616, "lr": 0.00012581505500589474, "epoch": 0.673872431278356, "percentage": 33.69, "elapsed_time": "1:49:26", "remaining_time": "3:35:21"} +{"current_steps": 2530, "total_steps": 7494, "loss": 0.6539, "lr": 0.00012568643561462298, "epoch": 0.6752068321323725, "percentage": 33.76, "elapsed_time": "1:50:59", "remaining_time": "3:37:45"} +{"current_steps": 2535, "total_steps": 7494, "loss": 0.6505, "lr": 0.00012555754124646729, "epoch": 0.6765412329863891, "percentage": 33.83, "elapsed_time": "1:53:06", "remaining_time": "3:41:15"} +{"current_steps": 2540, "total_steps": 7494, "loss": 0.6487, "lr": 0.0001254283726006871, "epoch": 0.6778756338404056, "percentage": 33.89, "elapsed_time": "1:53:40", "remaining_time": "3:41:43"} +{"current_steps": 2545, "total_steps": 7494, "loss": 0.6621, "lr": 0.00012529893037803, "epoch": 0.6792100346944222, "percentage": 33.96, "elapsed_time": "1:54:06", "remaining_time": "3:41:53"} +{"current_steps": 2550, "total_steps": 7494, "loss": 0.6497, "lr": 0.00012516921528072752, "epoch": 0.6805444355484388, "percentage": 34.03, "elapsed_time": "1:55:03", "remaining_time": "3:43:04"} +{"current_steps": 2555, "total_steps": 7494, "loss": 0.679, "lr": 0.00012503922801249172, "epoch": 0.6818788364024553, "percentage": 34.09, "elapsed_time": "1:56:30", "remaining_time": "3:45:12"} +{"current_steps": 2560, "total_steps": 7494, "loss": 0.6606, "lr": 0.00012490896927851118, "epoch": 0.6832132372564719, "percentage": 34.16, "elapsed_time": "1:57:21", "remaining_time": "3:46:12"} +{"current_steps": 2565, "total_steps": 7494, "loss": 0.6505, "lr": 0.0001247784397854471, "epoch": 0.6845476381104884, "percentage": 34.23, "elapsed_time": "1:57:47", "remaining_time": "3:46:20"} +{"current_steps": 2570, "total_steps": 7494, "loss": 0.6612, "lr": 0.0001246476402414297, "epoch": 0.685882038964505, "percentage": 34.29, "elapsed_time": "1:58:21", "remaining_time": "3:46:45"} +{"current_steps": 2575, "total_steps": 7494, "loss": 0.6641, "lr": 0.0001245165713560541, "epoch": 0.6872164398185214, "percentage": 34.36, "elapsed_time": "1:59:15", "remaining_time": "3:47:49"} +{"current_steps": 2580, "total_steps": 7494, "loss": 0.6644, "lr": 0.00012438523384037675, "epoch": 0.688550840672538, "percentage": 34.43, "elapsed_time": "1:59:42", "remaining_time": "3:48:00"} +{"current_steps": 2585, "total_steps": 7494, "loss": 0.6394, "lr": 0.0001242536284069113, "epoch": 0.6898852415265546, "percentage": 34.49, "elapsed_time": "2:00:07", "remaining_time": "3:48:07"} +{"current_steps": 2590, "total_steps": 7494, "loss": 0.6508, "lr": 0.00012412175576962504, "epoch": 0.6912196423805711, "percentage": 34.56, "elapsed_time": "2:00:49", "remaining_time": "3:48:46"} +{"current_steps": 2595, "total_steps": 7494, "loss": 0.6638, "lr": 0.00012398961664393467, "epoch": 0.6925540432345877, "percentage": 34.63, "elapsed_time": "2:02:47", "remaining_time": "3:51:48"} +{"current_steps": 2600, "total_steps": 7494, "loss": 0.6659, "lr": 0.0001238572117467027, "epoch": 0.6938884440886042, "percentage": 34.69, "elapsed_time": "2:03:13", "remaining_time": "3:51:56"} +{"current_steps": 2605, "total_steps": 7494, "loss": 0.6479, "lr": 0.0001237245417962335, "epoch": 0.6952228449426208, "percentage": 34.76, "elapsed_time": "2:04:11", "remaining_time": "3:53:04"} +{"current_steps": 2610, "total_steps": 7494, "loss": 0.6692, "lr": 0.0001235916075122693, "epoch": 0.6965572457966374, "percentage": 34.83, "elapsed_time": "2:06:27", "remaining_time": "3:56:37"} +{"current_steps": 2615, "total_steps": 7494, "loss": 0.6831, "lr": 0.00012345840961598638, "epoch": 0.6978916466506538, "percentage": 34.89, "elapsed_time": "2:09:12", "remaining_time": "4:01:05"} +{"current_steps": 2620, "total_steps": 7494, "loss": 0.6675, "lr": 0.00012332494882999113, "epoch": 0.6992260475046704, "percentage": 34.96, "elapsed_time": "2:10:00", "remaining_time": "4:01:51"} +{"current_steps": 2625, "total_steps": 7494, "loss": 0.6466, "lr": 0.00012319122587831614, "epoch": 0.7005604483586869, "percentage": 35.03, "elapsed_time": "2:10:27", "remaining_time": "4:01:58"} +{"current_steps": 2630, "total_steps": 7494, "loss": 0.6563, "lr": 0.00012305724148641627, "epoch": 0.7018948492127035, "percentage": 35.09, "elapsed_time": "2:11:19", "remaining_time": "4:02:53"} +{"current_steps": 2635, "total_steps": 7494, "loss": 0.6601, "lr": 0.00012292299638116472, "epoch": 0.70322925006672, "percentage": 35.16, "elapsed_time": "2:11:54", "remaining_time": "4:03:15"} +{"current_steps": 2640, "total_steps": 7494, "loss": 0.6451, "lr": 0.00012278849129084902, "epoch": 0.7045636509207366, "percentage": 35.23, "elapsed_time": "2:12:20", "remaining_time": "4:03:19"} +{"current_steps": 2645, "total_steps": 7494, "loss": 0.6629, "lr": 0.00012265372694516714, "epoch": 0.7058980517747532, "percentage": 35.29, "elapsed_time": "2:13:25", "remaining_time": "4:04:36"} +{"current_steps": 2650, "total_steps": 7494, "loss": 0.6626, "lr": 0.00012251870407522364, "epoch": 0.7072324526287697, "percentage": 35.36, "elapsed_time": "2:14:45", "remaining_time": "4:06:19"} +{"current_steps": 2655, "total_steps": 7494, "loss": 0.6458, "lr": 0.00012238342341352546, "epoch": 0.7085668534827863, "percentage": 35.43, "elapsed_time": "2:16:25", "remaining_time": "4:08:39"} +{"current_steps": 2660, "total_steps": 7494, "loss": 0.6685, "lr": 0.00012224788569397806, "epoch": 0.7099012543368027, "percentage": 35.5, "elapsed_time": "2:16:51", "remaining_time": "4:08:42"} +{"current_steps": 2665, "total_steps": 7494, "loss": 0.6707, "lr": 0.0001221120916518816, "epoch": 0.7112356551908193, "percentage": 35.56, "elapsed_time": "2:17:24", "remaining_time": "4:08:59"} +{"current_steps": 2670, "total_steps": 7494, "loss": 0.6371, "lr": 0.0001219760420239267, "epoch": 0.7125700560448359, "percentage": 35.63, "elapsed_time": "2:19:48", "remaining_time": "4:12:35"} +{"current_steps": 2675, "total_steps": 7494, "loss": 0.6376, "lr": 0.00012183973754819051, "epoch": 0.7139044568988524, "percentage": 35.7, "elapsed_time": "2:20:16", "remaining_time": "4:12:42"} +{"current_steps": 2680, "total_steps": 7494, "loss": 0.6458, "lr": 0.00012170317896413284, "epoch": 0.715238857752869, "percentage": 35.76, "elapsed_time": "2:20:41", "remaining_time": "4:12:43"} +{"current_steps": 2685, "total_steps": 7494, "loss": 0.6503, "lr": 0.00012156636701259202, "epoch": 0.7165732586068855, "percentage": 35.83, "elapsed_time": "2:21:41", "remaining_time": "4:13:47"} +{"current_steps": 2690, "total_steps": 7494, "loss": 0.6447, "lr": 0.00012142930243578092, "epoch": 0.7179076594609021, "percentage": 35.9, "elapsed_time": "2:23:42", "remaining_time": "4:16:38"} +{"current_steps": 2695, "total_steps": 7494, "loss": 0.6613, "lr": 0.00012129198597728285, "epoch": 0.7192420603149186, "percentage": 35.96, "elapsed_time": "2:25:10", "remaining_time": "4:18:30"} +{"current_steps": 2700, "total_steps": 7494, "loss": 0.662, "lr": 0.00012115441838204767, "epoch": 0.7205764611689351, "percentage": 36.03, "elapsed_time": "2:25:35", "remaining_time": "4:18:31"} +{"current_steps": 2705, "total_steps": 7494, "loss": 0.6272, "lr": 0.00012101660039638766, "epoch": 0.7219108620229517, "percentage": 36.1, "elapsed_time": "2:26:31", "remaining_time": "4:19:25"} +{"current_steps": 2710, "total_steps": 7494, "loss": 0.6594, "lr": 0.00012087853276797346, "epoch": 0.7232452628769682, "percentage": 36.16, "elapsed_time": "2:27:59", "remaining_time": "4:21:14"} +{"current_steps": 2715, "total_steps": 7494, "loss": 0.6672, "lr": 0.00012074021624583005, "epoch": 0.7245796637309848, "percentage": 36.23, "elapsed_time": "2:29:50", "remaining_time": "4:23:46"} +{"current_steps": 2720, "total_steps": 7494, "loss": 0.6445, "lr": 0.00012060165158033268, "epoch": 0.7259140645850013, "percentage": 36.3, "elapsed_time": "2:32:35", "remaining_time": "4:27:49"} +{"current_steps": 2725, "total_steps": 7494, "loss": 0.6596, "lr": 0.00012046283952320275, "epoch": 0.7272484654390179, "percentage": 36.36, "elapsed_time": "2:33:28", "remaining_time": "4:28:35"} +{"current_steps": 2730, "total_steps": 7494, "loss": 0.641, "lr": 0.00012032378082750382, "epoch": 0.7285828662930345, "percentage": 36.43, "elapsed_time": "2:35:23", "remaining_time": "4:31:10"} +{"current_steps": 2735, "total_steps": 7494, "loss": 0.6664, "lr": 0.00012018447624763748, "epoch": 0.729917267147051, "percentage": 36.5, "elapsed_time": "2:35:49", "remaining_time": "4:31:07"} +{"current_steps": 2740, "total_steps": 7494, "loss": 0.6544, "lr": 0.00012004492653933923, "epoch": 0.7312516680010676, "percentage": 36.56, "elapsed_time": "2:37:07", "remaining_time": "4:32:36"} +{"current_steps": 2745, "total_steps": 7494, "loss": 0.6548, "lr": 0.0001199051324596744, "epoch": 0.732586068855084, "percentage": 36.63, "elapsed_time": "2:39:29", "remaining_time": "4:35:56"} +{"current_steps": 2750, "total_steps": 7494, "loss": 0.6562, "lr": 0.00011976509476703408, "epoch": 0.7339204697091006, "percentage": 36.7, "elapsed_time": "2:40:02", "remaining_time": "4:36:04"} +{"current_steps": 2755, "total_steps": 7494, "loss": 0.6641, "lr": 0.00011962481422113098, "epoch": 0.7352548705631171, "percentage": 36.76, "elapsed_time": "2:40:51", "remaining_time": "4:36:42"} +{"current_steps": 2760, "total_steps": 7494, "loss": 0.6414, "lr": 0.00011948429158299523, "epoch": 0.7365892714171337, "percentage": 36.83, "elapsed_time": "2:41:24", "remaining_time": "4:36:50"} +{"current_steps": 2765, "total_steps": 7494, "loss": 0.6562, "lr": 0.00011934352761497043, "epoch": 0.7379236722711503, "percentage": 36.9, "elapsed_time": "2:42:18", "remaining_time": "4:37:35"} +{"current_steps": 2770, "total_steps": 7494, "loss": 0.654, "lr": 0.00011920252308070936, "epoch": 0.7392580731251668, "percentage": 36.96, "elapsed_time": "2:42:47", "remaining_time": "4:37:36"} +{"current_steps": 2775, "total_steps": 7494, "loss": 0.6794, "lr": 0.00011906127874516985, "epoch": 0.7405924739791834, "percentage": 37.03, "elapsed_time": "2:43:38", "remaining_time": "4:38:17"} +{"current_steps": 2780, "total_steps": 7494, "loss": 0.6482, "lr": 0.00011891979537461069, "epoch": 0.7419268748331999, "percentage": 37.1, "elapsed_time": "2:44:16", "remaining_time": "4:38:34"} +{"current_steps": 2785, "total_steps": 7494, "loss": 0.6588, "lr": 0.00011877807373658751, "epoch": 0.7432612756872164, "percentage": 37.16, "elapsed_time": "2:45:12", "remaining_time": "4:39:19"} +{"current_steps": 2790, "total_steps": 7494, "loss": 0.6355, "lr": 0.00011863611459994845, "epoch": 0.7445956765412329, "percentage": 37.23, "elapsed_time": "2:45:38", "remaining_time": "4:39:17"} +{"current_steps": 2795, "total_steps": 7494, "loss": 0.6563, "lr": 0.00011849391873483016, "epoch": 0.7459300773952495, "percentage": 37.3, "elapsed_time": "2:47:23", "remaining_time": "4:41:25"} +{"current_steps": 2800, "total_steps": 7494, "loss": 0.6423, "lr": 0.00011835148691265355, "epoch": 0.7472644782492661, "percentage": 37.36, "elapsed_time": "2:48:07", "remaining_time": "4:41:50"} +{"current_steps": 2805, "total_steps": 7494, "loss": 0.6584, "lr": 0.00011820881990611963, "epoch": 0.7485988791032826, "percentage": 37.43, "elapsed_time": "2:49:00", "remaining_time": "4:42:31"} +{"current_steps": 2810, "total_steps": 7494, "loss": 0.6543, "lr": 0.00011806591848920521, "epoch": 0.7499332799572992, "percentage": 37.5, "elapsed_time": "2:49:26", "remaining_time": "4:42:25"} +{"current_steps": 2815, "total_steps": 7494, "loss": 0.6698, "lr": 0.00011792278343715892, "epoch": 0.7512676808113157, "percentage": 37.56, "elapsed_time": "2:49:52", "remaining_time": "4:42:20"} +{"current_steps": 2820, "total_steps": 7494, "loss": 0.6507, "lr": 0.00011777941552649674, "epoch": 0.7526020816653323, "percentage": 37.63, "elapsed_time": "2:50:42", "remaining_time": "4:42:56"} +{"current_steps": 2825, "total_steps": 7494, "loss": 0.6689, "lr": 0.00011763581553499803, "epoch": 0.7539364825193489, "percentage": 37.7, "elapsed_time": "2:51:23", "remaining_time": "4:43:15"} +{"current_steps": 2830, "total_steps": 7494, "loss": 0.636, "lr": 0.00011749198424170117, "epoch": 0.7552708833733653, "percentage": 37.76, "elapsed_time": "2:51:48", "remaining_time": "4:43:09"} +{"current_steps": 2835, "total_steps": 7494, "loss": 0.6503, "lr": 0.00011734792242689934, "epoch": 0.7566052842273819, "percentage": 37.83, "elapsed_time": "2:52:15", "remaining_time": "4:43:04"} +{"current_steps": 2840, "total_steps": 7494, "loss": 0.6492, "lr": 0.00011720363087213629, "epoch": 0.7579396850813984, "percentage": 37.9, "elapsed_time": "2:53:15", "remaining_time": "4:43:54"} +{"current_steps": 2845, "total_steps": 7494, "loss": 0.6547, "lr": 0.00011705911036020222, "epoch": 0.759274085935415, "percentage": 37.96, "elapsed_time": "2:53:49", "remaining_time": "4:44:03"} +{"current_steps": 2850, "total_steps": 7494, "loss": 0.6558, "lr": 0.00011691436167512938, "epoch": 0.7606084867894315, "percentage": 38.03, "elapsed_time": "2:58:21", "remaining_time": "4:50:37"} +{"current_steps": 2855, "total_steps": 7494, "loss": 0.6692, "lr": 0.00011676938560218781, "epoch": 0.7619428876434481, "percentage": 38.1, "elapsed_time": "2:59:15", "remaining_time": "4:51:15"} +{"current_steps": 2860, "total_steps": 7494, "loss": 0.6383, "lr": 0.00011662418292788127, "epoch": 0.7632772884974647, "percentage": 38.16, "elapsed_time": "3:00:34", "remaining_time": "4:52:35"} +{"current_steps": 2865, "total_steps": 7494, "loss": 0.6536, "lr": 0.00011647875443994271, "epoch": 0.7646116893514812, "percentage": 38.23, "elapsed_time": "3:01:06", "remaining_time": "4:52:36"} +{"current_steps": 2870, "total_steps": 7494, "loss": 0.654, "lr": 0.00011633310092733027, "epoch": 0.7659460902054978, "percentage": 38.3, "elapsed_time": "3:03:05", "remaining_time": "4:54:59"} +{"current_steps": 2875, "total_steps": 7494, "loss": 0.6469, "lr": 0.00011618722318022273, "epoch": 0.7672804910595142, "percentage": 38.36, "elapsed_time": "3:05:12", "remaining_time": "4:57:33"} +{"current_steps": 2880, "total_steps": 7494, "loss": 0.6591, "lr": 0.00011604112199001546, "epoch": 0.7686148919135308, "percentage": 38.43, "elapsed_time": "3:06:38", "remaining_time": "4:59:01"} +{"current_steps": 2885, "total_steps": 7494, "loss": 0.6747, "lr": 0.00011589479814931598, "epoch": 0.7699492927675474, "percentage": 38.5, "elapsed_time": "3:07:07", "remaining_time": "4:58:56"} +{"current_steps": 2890, "total_steps": 7494, "loss": 0.6484, "lr": 0.0001157482524519397, "epoch": 0.7712836936215639, "percentage": 38.56, "elapsed_time": "3:13:40", "remaining_time": "5:08:32"} +{"current_steps": 2895, "total_steps": 7494, "loss": 0.6631, "lr": 0.00011560148569290558, "epoch": 0.7726180944755805, "percentage": 38.63, "elapsed_time": "3:15:23", "remaining_time": "5:10:23"} +{"current_steps": 2900, "total_steps": 7494, "loss": 0.6525, "lr": 0.00011545449866843194, "epoch": 0.773952495329597, "percentage": 38.7, "elapsed_time": "3:19:40", "remaining_time": "5:16:19"} +{"current_steps": 2905, "total_steps": 7494, "loss": 0.6611, "lr": 0.00011530729217593198, "epoch": 0.7752868961836136, "percentage": 38.76, "elapsed_time": "3:21:40", "remaining_time": "5:18:35"} +{"current_steps": 2910, "total_steps": 7494, "loss": 0.6486, "lr": 0.00011515986701400955, "epoch": 0.77662129703763, "percentage": 38.83, "elapsed_time": "3:22:30", "remaining_time": "5:19:00"} +{"current_steps": 2915, "total_steps": 7494, "loss": 0.6492, "lr": 0.00011501222398245478, "epoch": 0.7779556978916466, "percentage": 38.9, "elapsed_time": "3:23:52", "remaining_time": "5:20:15"} +{"current_steps": 2920, "total_steps": 7494, "loss": 0.6506, "lr": 0.00011486436388223977, "epoch": 0.7792900987456632, "percentage": 38.96, "elapsed_time": "3:24:38", "remaining_time": "5:20:33"} +{"current_steps": 2925, "total_steps": 7494, "loss": 0.6476, "lr": 0.00011471628751551426, "epoch": 0.7806244995996797, "percentage": 39.03, "elapsed_time": "3:26:19", "remaining_time": "5:22:17"} +{"current_steps": 2930, "total_steps": 7494, "loss": 0.6519, "lr": 0.0001145679956856012, "epoch": 0.7819589004536963, "percentage": 39.1, "elapsed_time": "3:28:17", "remaining_time": "5:24:26"} +{"current_steps": 2935, "total_steps": 7494, "loss": 0.641, "lr": 0.00011441948919699249, "epoch": 0.7832933013077128, "percentage": 39.16, "elapsed_time": "3:31:48", "remaining_time": "5:29:00"} +{"current_steps": 2940, "total_steps": 7494, "loss": 0.6586, "lr": 0.00011427076885534445, "epoch": 0.7846277021617294, "percentage": 39.23, "elapsed_time": "3:32:28", "remaining_time": "5:29:07"} +{"current_steps": 2945, "total_steps": 7494, "loss": 0.6717, "lr": 0.00011412183546747374, "epoch": 0.785962103015746, "percentage": 39.3, "elapsed_time": "3:34:17", "remaining_time": "5:30:59"} +{"current_steps": 2950, "total_steps": 7494, "loss": 0.6529, "lr": 0.00011397268984135266, "epoch": 0.7872965038697625, "percentage": 39.36, "elapsed_time": "3:35:19", "remaining_time": "5:31:41"} +{"current_steps": 2955, "total_steps": 7494, "loss": 0.656, "lr": 0.00011382333278610503, "epoch": 0.7886309047237791, "percentage": 39.43, "elapsed_time": "3:36:13", "remaining_time": "5:32:08"} +{"current_steps": 2960, "total_steps": 7494, "loss": 0.6344, "lr": 0.00011367376511200157, "epoch": 0.7899653055777955, "percentage": 39.5, "elapsed_time": "3:36:47", "remaining_time": "5:32:04"} +{"current_steps": 2965, "total_steps": 7494, "loss": 0.6529, "lr": 0.00011352398763045569, "epoch": 0.7912997064318121, "percentage": 39.56, "elapsed_time": "3:37:39", "remaining_time": "5:32:28"} +{"current_steps": 2970, "total_steps": 7494, "loss": 0.6375, "lr": 0.00011337400115401905, "epoch": 0.7926341072858286, "percentage": 39.63, "elapsed_time": "3:38:38", "remaining_time": "5:33:02"} +{"current_steps": 2975, "total_steps": 7494, "loss": 0.6394, "lr": 0.00011322380649637704, "epoch": 0.7939685081398452, "percentage": 39.7, "elapsed_time": "3:39:32", "remaining_time": "5:33:28"} +{"current_steps": 2980, "total_steps": 7494, "loss": 0.6561, "lr": 0.00011307340447234449, "epoch": 0.7953029089938618, "percentage": 39.77, "elapsed_time": "3:40:02", "remaining_time": "5:33:18"} +{"current_steps": 2985, "total_steps": 7494, "loss": 0.6415, "lr": 0.00011292279589786115, "epoch": 0.7966373098478783, "percentage": 39.83, "elapsed_time": "3:40:28", "remaining_time": "5:33:01"} +{"current_steps": 2990, "total_steps": 7494, "loss": 0.6521, "lr": 0.00011277198158998744, "epoch": 0.7979717107018949, "percentage": 39.9, "elapsed_time": "3:43:13", "remaining_time": "5:36:16"} +{"current_steps": 2995, "total_steps": 7494, "loss": 0.6571, "lr": 0.00011262096236689978, "epoch": 0.7993061115559114, "percentage": 39.97, "elapsed_time": "3:44:07", "remaining_time": "5:36:40"} +{"current_steps": 3000, "total_steps": 7494, "loss": 0.6353, "lr": 0.0001124697390478863, "epoch": 0.800640512409928, "percentage": 40.03, "elapsed_time": "3:44:36", "remaining_time": "5:36:27"} +{"current_steps": 3005, "total_steps": 7494, "loss": 0.6576, "lr": 0.00011231831245334238, "epoch": 0.8019749132639445, "percentage": 40.1, "elapsed_time": "3:47:43", "remaining_time": "5:40:10"} +{"current_steps": 3010, "total_steps": 7494, "loss": 0.6382, "lr": 0.00011216668340476618, "epoch": 0.803309314117961, "percentage": 40.17, "elapsed_time": "3:48:58", "remaining_time": "5:41:06"} +{"current_steps": 3015, "total_steps": 7494, "loss": 0.6626, "lr": 0.00011201485272475416, "epoch": 0.8046437149719776, "percentage": 40.23, "elapsed_time": "3:51:42", "remaining_time": "5:44:12"} +{"current_steps": 3020, "total_steps": 7494, "loss": 0.6548, "lr": 0.00011186282123699664, "epoch": 0.8059781158259941, "percentage": 40.3, "elapsed_time": "3:52:33", "remaining_time": "5:44:31"} +{"current_steps": 3025, "total_steps": 7494, "loss": 0.654, "lr": 0.00011171058976627341, "epoch": 0.8073125166800107, "percentage": 40.37, "elapsed_time": "3:53:52", "remaining_time": "5:45:30"} +{"current_steps": 3030, "total_steps": 7494, "loss": 0.6462, "lr": 0.00011155815913844906, "epoch": 0.8086469175340272, "percentage": 40.43, "elapsed_time": "3:56:13", "remaining_time": "5:48:01"} +{"current_steps": 3035, "total_steps": 7494, "loss": 0.6598, "lr": 0.00011140553018046872, "epoch": 0.8099813183880438, "percentage": 40.5, "elapsed_time": "3:58:13", "remaining_time": "5:49:59"} +{"current_steps": 3040, "total_steps": 7494, "loss": 0.6473, "lr": 0.00011125270372035342, "epoch": 0.8113157192420604, "percentage": 40.57, "elapsed_time": "4:00:46", "remaining_time": "5:52:45"} +{"current_steps": 3045, "total_steps": 7494, "loss": 0.6451, "lr": 0.00011109968058719565, "epoch": 0.8126501200960768, "percentage": 40.63, "elapsed_time": "4:01:12", "remaining_time": "5:52:25"} +{"current_steps": 3050, "total_steps": 7494, "loss": 0.6412, "lr": 0.00011094646161115489, "epoch": 0.8139845209500934, "percentage": 40.7, "elapsed_time": "4:02:03", "remaining_time": "5:52:41"} +{"current_steps": 3055, "total_steps": 7494, "loss": 0.6458, "lr": 0.00011079304762345307, "epoch": 0.8153189218041099, "percentage": 40.77, "elapsed_time": "4:02:46", "remaining_time": "5:52:44"} +{"current_steps": 3060, "total_steps": 7494, "loss": 0.6355, "lr": 0.00011063943945637005, "epoch": 0.8166533226581265, "percentage": 40.83, "elapsed_time": "4:03:11", "remaining_time": "5:52:23"} +{"current_steps": 3065, "total_steps": 7494, "loss": 0.6463, "lr": 0.00011048563794323915, "epoch": 0.817987723512143, "percentage": 40.9, "elapsed_time": "4:03:39", "remaining_time": "5:52:05"} +{"current_steps": 3070, "total_steps": 7494, "loss": 0.6508, "lr": 0.00011033164391844259, "epoch": 0.8193221243661596, "percentage": 40.97, "elapsed_time": "4:04:33", "remaining_time": "5:52:25"} +{"current_steps": 3075, "total_steps": 7494, "loss": 0.6507, "lr": 0.00011017745821740696, "epoch": 0.8206565252201762, "percentage": 41.03, "elapsed_time": "4:05:12", "remaining_time": "5:52:22"} +{"current_steps": 3080, "total_steps": 7494, "loss": 0.6611, "lr": 0.00011002308167659877, "epoch": 0.8219909260741927, "percentage": 41.1, "elapsed_time": "4:07:54", "remaining_time": "5:55:16"} +{"current_steps": 3085, "total_steps": 7494, "loss": 0.6627, "lr": 0.00010986851513351976, "epoch": 0.8233253269282093, "percentage": 41.17, "elapsed_time": "4:09:37", "remaining_time": "5:56:46"} +{"current_steps": 3090, "total_steps": 7494, "loss": 0.6897, "lr": 0.00010971375942670251, "epoch": 0.8246597277822257, "percentage": 41.23, "elapsed_time": "4:12:56", "remaining_time": "6:00:29"} +{"current_steps": 3095, "total_steps": 7494, "loss": 0.6474, "lr": 0.00010955881539570581, "epoch": 0.8259941286362423, "percentage": 41.3, "elapsed_time": "4:13:29", "remaining_time": "6:00:17"} +{"current_steps": 3100, "total_steps": 7494, "loss": 0.6332, "lr": 0.00010940368388111008, "epoch": 0.8273285294902589, "percentage": 41.37, "elapsed_time": "4:13:54", "remaining_time": "5:59:53"} +{"current_steps": 3105, "total_steps": 7494, "loss": 0.6519, "lr": 0.00010924836572451287, "epoch": 0.8286629303442754, "percentage": 41.43, "elapsed_time": "4:17:33", "remaining_time": "6:04:03"} +{"current_steps": 3110, "total_steps": 7494, "loss": 0.6529, "lr": 0.00010909286176852432, "epoch": 0.829997331198292, "percentage": 41.5, "elapsed_time": "4:18:27", "remaining_time": "6:04:19"} +{"current_steps": 3115, "total_steps": 7494, "loss": 0.644, "lr": 0.0001089371728567625, "epoch": 0.8313317320523085, "percentage": 41.57, "elapsed_time": "4:18:57", "remaining_time": "6:04:02"} +{"current_steps": 3120, "total_steps": 7494, "loss": 0.6421, "lr": 0.00010878129983384886, "epoch": 0.8326661329063251, "percentage": 41.63, "elapsed_time": "4:19:22", "remaining_time": "6:03:37"} +{"current_steps": 3125, "total_steps": 7494, "loss": 0.6392, "lr": 0.00010862524354540369, "epoch": 0.8340005337603416, "percentage": 41.7, "elapsed_time": "4:21:46", "remaining_time": "6:05:59"} +{"current_steps": 3130, "total_steps": 7494, "loss": 0.6536, "lr": 0.00010846900483804152, "epoch": 0.8353349346143581, "percentage": 41.77, "elapsed_time": "4:25:08", "remaining_time": "6:09:40"} +{"current_steps": 3135, "total_steps": 7494, "loss": 0.6523, "lr": 0.00010831258455936645, "epoch": 0.8366693354683747, "percentage": 41.83, "elapsed_time": "4:26:48", "remaining_time": "6:10:58"} +{"current_steps": 3140, "total_steps": 7494, "loss": 0.653, "lr": 0.00010815598355796771, "epoch": 0.8380037363223912, "percentage": 41.9, "elapsed_time": "4:27:13", "remaining_time": "6:10:32"} +{"current_steps": 3145, "total_steps": 7494, "loss": 0.6595, "lr": 0.0001079992026834149, "epoch": 0.8393381371764078, "percentage": 41.97, "elapsed_time": "4:29:04", "remaining_time": "6:12:04"} +{"current_steps": 3150, "total_steps": 7494, "loss": 0.6499, "lr": 0.00010784224278625345, "epoch": 0.8406725380304243, "percentage": 42.03, "elapsed_time": "4:31:24", "remaining_time": "6:14:17"} +{"current_steps": 3155, "total_steps": 7494, "loss": 0.6392, "lr": 0.00010768510471799996, "epoch": 0.8420069388844409, "percentage": 42.1, "elapsed_time": "4:34:28", "remaining_time": "6:17:29"} +{"current_steps": 3160, "total_steps": 7494, "loss": 0.6496, "lr": 0.00010752778933113774, "epoch": 0.8433413397384575, "percentage": 42.17, "elapsed_time": "4:34:54", "remaining_time": "6:17:02"} +{"current_steps": 3165, "total_steps": 7494, "loss": 0.6658, "lr": 0.00010737029747911191, "epoch": 0.844675740592474, "percentage": 42.23, "elapsed_time": "4:37:07", "remaining_time": "6:19:02"} +{"current_steps": 3170, "total_steps": 7494, "loss": 0.6531, "lr": 0.00010721263001632503, "epoch": 0.8460101414464906, "percentage": 42.3, "elapsed_time": "4:38:11", "remaining_time": "6:19:27"} +{"current_steps": 3175, "total_steps": 7494, "loss": 0.6551, "lr": 0.00010705478779813235, "epoch": 0.847344542300507, "percentage": 42.37, "elapsed_time": "4:38:37", "remaining_time": "6:19:01"} +{"current_steps": 3180, "total_steps": 7494, "loss": 0.6374, "lr": 0.00010689677168083711, "epoch": 0.8486789431545236, "percentage": 42.43, "elapsed_time": "4:39:04", "remaining_time": "6:18:36"} +{"current_steps": 3185, "total_steps": 7494, "loss": 0.6542, "lr": 0.00010673858252168603, "epoch": 0.8500133440085401, "percentage": 42.5, "elapsed_time": "4:39:55", "remaining_time": "6:18:42"} +{"current_steps": 3190, "total_steps": 7494, "loss": 0.6511, "lr": 0.00010658022117886457, "epoch": 0.8513477448625567, "percentage": 42.57, "elapsed_time": "4:40:35", "remaining_time": "6:18:34"} +{"current_steps": 3195, "total_steps": 7494, "loss": 0.6588, "lr": 0.00010642168851149229, "epoch": 0.8526821457165733, "percentage": 42.63, "elapsed_time": "4:41:00", "remaining_time": "6:18:06"} +{"current_steps": 3200, "total_steps": 7494, "loss": 0.6423, "lr": 0.00010626298537961821, "epoch": 0.8540165465705898, "percentage": 42.7, "elapsed_time": "4:41:55", "remaining_time": "6:18:18"} +{"current_steps": 3205, "total_steps": 7494, "loss": 0.6507, "lr": 0.00010610411264421611, "epoch": 0.8553509474246064, "percentage": 42.77, "elapsed_time": "4:44:30", "remaining_time": "6:20:43"} +{"current_steps": 3210, "total_steps": 7494, "loss": 0.6544, "lr": 0.0001059450711671799, "epoch": 0.8566853482786229, "percentage": 42.83, "elapsed_time": "4:46:35", "remaining_time": "6:22:29"} +{"current_steps": 3215, "total_steps": 7494, "loss": 0.6644, "lr": 0.0001057858618113189, "epoch": 0.8580197491326395, "percentage": 42.9, "elapsed_time": "4:47:00", "remaining_time": "6:22:00"} +{"current_steps": 3220, "total_steps": 7494, "loss": 0.6449, "lr": 0.00010562648544035323, "epoch": 0.859354149986656, "percentage": 42.97, "elapsed_time": "4:48:06", "remaining_time": "6:22:24"} +{"current_steps": 3225, "total_steps": 7494, "loss": 0.6254, "lr": 0.00010546694291890902, "epoch": 0.8606885508406725, "percentage": 43.03, "elapsed_time": "4:54:35", "remaining_time": "6:29:56"} +{"current_steps": 3230, "total_steps": 7494, "loss": 0.6544, "lr": 0.00010530723511251382, "epoch": 0.8620229516946891, "percentage": 43.1, "elapsed_time": "4:55:49", "remaining_time": "6:30:31"} +{"current_steps": 3235, "total_steps": 7494, "loss": 0.6468, "lr": 0.0001051473628875918, "epoch": 0.8633573525487056, "percentage": 43.17, "elapsed_time": "4:57:03", "remaining_time": "6:31:05"} +{"current_steps": 3240, "total_steps": 7494, "loss": 0.6601, "lr": 0.00010498732711145918, "epoch": 0.8646917534027222, "percentage": 43.23, "elapsed_time": "4:57:39", "remaining_time": "6:30:48"} +{"current_steps": 3245, "total_steps": 7494, "loss": 0.623, "lr": 0.00010482712865231942, "epoch": 0.8660261542567387, "percentage": 43.3, "elapsed_time": "4:58:29", "remaining_time": "6:30:50"} +{"current_steps": 3250, "total_steps": 7494, "loss": 0.6441, "lr": 0.00010466676837925857, "epoch": 0.8673605551107553, "percentage": 43.37, "elapsed_time": "4:58:58", "remaining_time": "6:30:25"} +{"current_steps": 3255, "total_steps": 7494, "loss": 0.6573, "lr": 0.00010450624716224045, "epoch": 0.8686949559647719, "percentage": 43.43, "elapsed_time": "5:01:15", "remaining_time": "6:32:20"} +{"current_steps": 3260, "total_steps": 7494, "loss": 0.6394, "lr": 0.00010434556587210214, "epoch": 0.8700293568187883, "percentage": 43.5, "elapsed_time": "5:03:06", "remaining_time": "6:33:40"} +{"current_steps": 3265, "total_steps": 7494, "loss": 0.6619, "lr": 0.000104184725380549, "epoch": 0.8713637576728049, "percentage": 43.57, "elapsed_time": "5:04:21", "remaining_time": "6:34:13"} +{"current_steps": 3270, "total_steps": 7494, "loss": 0.6511, "lr": 0.0001040237265601502, "epoch": 0.8726981585268214, "percentage": 43.63, "elapsed_time": "5:04:49", "remaining_time": "6:33:45"} +{"current_steps": 3275, "total_steps": 7494, "loss": 0.6427, "lr": 0.00010386257028433366, "epoch": 0.874032559380838, "percentage": 43.7, "elapsed_time": "5:05:15", "remaining_time": "6:33:14"} +{"current_steps": 3280, "total_steps": 7494, "loss": 0.6424, "lr": 0.00010370125742738173, "epoch": 0.8753669602348545, "percentage": 43.77, "elapsed_time": "5:07:09", "remaining_time": "6:34:37"} +{"current_steps": 3285, "total_steps": 7494, "loss": 0.6662, "lr": 0.00010353978886442605, "epoch": 0.8767013610888711, "percentage": 43.84, "elapsed_time": "5:13:26", "remaining_time": "6:41:36"} +{"current_steps": 3290, "total_steps": 7494, "loss": 0.6708, "lr": 0.00010337816547144308, "epoch": 0.8780357619428877, "percentage": 43.9, "elapsed_time": "5:15:21", "remaining_time": "6:42:58"} +{"current_steps": 3295, "total_steps": 7494, "loss": 0.6547, "lr": 0.00010321638812524917, "epoch": 0.8793701627969042, "percentage": 43.97, "elapsed_time": "5:17:32", "remaining_time": "6:44:39"} +{"current_steps": 3300, "total_steps": 7494, "loss": 0.6414, "lr": 0.00010305445770349593, "epoch": 0.8807045636509208, "percentage": 44.04, "elapsed_time": "5:18:53", "remaining_time": "6:45:17"} +{"current_steps": 3305, "total_steps": 7494, "loss": 0.6448, "lr": 0.00010289237508466536, "epoch": 0.8820389645049372, "percentage": 44.1, "elapsed_time": "5:22:01", "remaining_time": "6:48:09"} +{"current_steps": 3310, "total_steps": 7494, "loss": 0.6388, "lr": 0.00010273014114806517, "epoch": 0.8833733653589538, "percentage": 44.17, "elapsed_time": "5:23:23", "remaining_time": "6:48:46"} +{"current_steps": 3315, "total_steps": 7494, "loss": 0.6527, "lr": 0.000102567756773824, "epoch": 0.8847077662129704, "percentage": 44.24, "elapsed_time": "5:27:13", "remaining_time": "6:52:31"} +{"current_steps": 3320, "total_steps": 7494, "loss": 0.6404, "lr": 0.00010240522284288657, "epoch": 0.8860421670669869, "percentage": 44.3, "elapsed_time": "5:32:03", "remaining_time": "6:57:27"} +{"current_steps": 3325, "total_steps": 7494, "loss": 0.652, "lr": 0.00010224254023700899, "epoch": 0.8873765679210035, "percentage": 44.37, "elapsed_time": "5:35:58", "remaining_time": "7:01:15"} +{"current_steps": 3330, "total_steps": 7494, "loss": 0.6522, "lr": 0.00010207970983875395, "epoch": 0.88871096877502, "percentage": 44.44, "elapsed_time": "5:36:23", "remaining_time": "7:00:38"} +{"current_steps": 3335, "total_steps": 7494, "loss": 0.6484, "lr": 0.00010191673253148589, "epoch": 0.8900453696290366, "percentage": 44.5, "elapsed_time": "5:36:54", "remaining_time": "7:00:08"} +{"current_steps": 3340, "total_steps": 7494, "loss": 0.6506, "lr": 0.00010175360919936623, "epoch": 0.8913797704830531, "percentage": 44.57, "elapsed_time": "5:37:43", "remaining_time": "7:00:02"} +{"current_steps": 3345, "total_steps": 7494, "loss": 0.63, "lr": 0.00010159034072734865, "epoch": 0.8927141713370697, "percentage": 44.64, "elapsed_time": "5:38:19", "remaining_time": "6:59:38"} +{"current_steps": 3350, "total_steps": 7494, "loss": 0.6418, "lr": 0.00010142692800117416, "epoch": 0.8940485721910862, "percentage": 44.7, "elapsed_time": "5:38:44", "remaining_time": "6:59:01"} +{"current_steps": 3355, "total_steps": 7494, "loss": 0.65, "lr": 0.00010126337190736636, "epoch": 0.8953829730451027, "percentage": 44.77, "elapsed_time": "5:39:17", "remaining_time": "6:58:34"} +{"current_steps": 3360, "total_steps": 7494, "loss": 0.6475, "lr": 0.00010109967333322669, "epoch": 0.8967173738991193, "percentage": 44.84, "elapsed_time": "5:40:09", "remaining_time": "6:58:30"} +{"current_steps": 3365, "total_steps": 7494, "loss": 0.6475, "lr": 0.00010093583316682945, "epoch": 0.8980517747531358, "percentage": 44.9, "elapsed_time": "5:40:41", "remaining_time": "6:58:02"} +{"current_steps": 3370, "total_steps": 7494, "loss": 0.6438, "lr": 0.00010077185229701722, "epoch": 0.8993861756071524, "percentage": 44.97, "elapsed_time": "5:41:06", "remaining_time": "6:57:26"} +{"current_steps": 3375, "total_steps": 7494, "loss": 0.6381, "lr": 0.00010060773161339574, "epoch": 0.900720576461169, "percentage": 45.04, "elapsed_time": "5:41:41", "remaining_time": "6:57:00"} +{"current_steps": 3380, "total_steps": 7494, "loss": 0.638, "lr": 0.00010044347200632943, "epoch": 0.9020549773151855, "percentage": 45.1, "elapsed_time": "5:42:33", "remaining_time": "6:56:57"} +{"current_steps": 3385, "total_steps": 7494, "loss": 0.6494, "lr": 0.00010027907436693623, "epoch": 0.9033893781692021, "percentage": 45.17, "elapsed_time": "5:43:04", "remaining_time": "6:56:26"} +{"current_steps": 3390, "total_steps": 7494, "loss": 0.6508, "lr": 0.00010011453958708297, "epoch": 0.9047237790232185, "percentage": 45.24, "elapsed_time": "5:43:29", "remaining_time": "6:55:50"} +{"current_steps": 3395, "total_steps": 7494, "loss": 0.6501, "lr": 9.994986855938047e-05, "epoch": 0.9060581798772351, "percentage": 45.3, "elapsed_time": "5:44:07", "remaining_time": "6:55:29"} +{"current_steps": 3400, "total_steps": 7494, "loss": 0.6419, "lr": 9.978506217717874e-05, "epoch": 0.9073925807312516, "percentage": 45.37, "elapsed_time": "5:44:57", "remaining_time": "6:55:22"} +{"current_steps": 3405, "total_steps": 7494, "loss": 0.6531, "lr": 9.962012133456204e-05, "epoch": 0.9087269815852682, "percentage": 45.44, "elapsed_time": "5:45:35", "remaining_time": "6:55:01"} +{"current_steps": 3410, "total_steps": 7494, "loss": 0.6384, "lr": 9.945504692634409e-05, "epoch": 0.9100613824392848, "percentage": 45.5, "elapsed_time": "5:46:01", "remaining_time": "6:54:24"} +{"current_steps": 3415, "total_steps": 7494, "loss": 0.6405, "lr": 9.928983984806326e-05, "epoch": 0.9113957832933013, "percentage": 45.57, "elapsed_time": "5:46:43", "remaining_time": "6:54:08"} +{"current_steps": 3420, "total_steps": 7494, "loss": 0.6429, "lr": 9.912450099597765e-05, "epoch": 0.9127301841473179, "percentage": 45.64, "elapsed_time": "5:47:29", "remaining_time": "6:53:56"} +{"current_steps": 3425, "total_steps": 7494, "loss": 0.6478, "lr": 9.895903126706019e-05, "epoch": 0.9140645850013344, "percentage": 45.7, "elapsed_time": "5:47:57", "remaining_time": "6:53:23"} +{"current_steps": 3430, "total_steps": 7494, "loss": 0.6342, "lr": 9.879343155899382e-05, "epoch": 0.915398985855351, "percentage": 45.77, "elapsed_time": "5:48:23", "remaining_time": "6:52:47"} +{"current_steps": 3435, "total_steps": 7494, "loss": 0.647, "lr": 9.862770277016676e-05, "epoch": 0.9167333867093675, "percentage": 45.84, "elapsed_time": "5:49:09", "remaining_time": "6:52:35"} +{"current_steps": 3440, "total_steps": 7494, "loss": 0.6416, "lr": 9.846184579966733e-05, "epoch": 0.918067787563384, "percentage": 45.9, "elapsed_time": "5:49:54", "remaining_time": "6:52:22"} +{"current_steps": 3445, "total_steps": 7494, "loss": 0.6507, "lr": 9.829586154727933e-05, "epoch": 0.9194021884174006, "percentage": 45.97, "elapsed_time": "5:50:21", "remaining_time": "6:51:46"} +{"current_steps": 3450, "total_steps": 7494, "loss": 0.6359, "lr": 9.812975091347706e-05, "epoch": 0.9207365892714171, "percentage": 46.04, "elapsed_time": "5:50:48", "remaining_time": "6:51:11"} +{"current_steps": 3455, "total_steps": 7494, "loss": 0.6491, "lr": 9.796351479942047e-05, "epoch": 0.9220709901254337, "percentage": 46.1, "elapsed_time": "5:51:33", "remaining_time": "6:50:59"} +{"current_steps": 3460, "total_steps": 7494, "loss": 0.6463, "lr": 9.779715410695015e-05, "epoch": 0.9234053909794502, "percentage": 46.17, "elapsed_time": "5:52:13", "remaining_time": "6:50:39"} +{"current_steps": 3465, "total_steps": 7494, "loss": 0.6502, "lr": 9.76306697385827e-05, "epoch": 0.9247397918334668, "percentage": 46.24, "elapsed_time": "5:52:40", "remaining_time": "6:50:04"} +{"current_steps": 3470, "total_steps": 7494, "loss": 0.6614, "lr": 9.746406259750552e-05, "epoch": 0.9260741926874834, "percentage": 46.3, "elapsed_time": "5:53:30", "remaining_time": "6:49:57"} +{"current_steps": 3475, "total_steps": 7494, "loss": 0.6312, "lr": 9.729733358757213e-05, "epoch": 0.9274085935414998, "percentage": 46.37, "elapsed_time": "5:54:20", "remaining_time": "6:49:49"} +{"current_steps": 3480, "total_steps": 7494, "loss": 0.644, "lr": 9.713048361329715e-05, "epoch": 0.9287429943955164, "percentage": 46.44, "elapsed_time": "5:54:57", "remaining_time": "6:49:25"} +{"current_steps": 3485, "total_steps": 7494, "loss": 0.6605, "lr": 9.696351357985154e-05, "epoch": 0.9300773952495329, "percentage": 46.5, "elapsed_time": "5:55:23", "remaining_time": "6:48:49"} +{"current_steps": 3490, "total_steps": 7494, "loss": 0.6589, "lr": 9.679642439305744e-05, "epoch": 0.9314117961035495, "percentage": 46.57, "elapsed_time": "5:55:54", "remaining_time": "6:48:19"} +{"current_steps": 3495, "total_steps": 7494, "loss": 0.6379, "lr": 9.662921695938354e-05, "epoch": 0.932746196957566, "percentage": 46.64, "elapsed_time": "5:56:45", "remaining_time": "6:48:12"} +{"current_steps": 3500, "total_steps": 7494, "loss": 0.647, "lr": 9.646189218593992e-05, "epoch": 0.9340805978115826, "percentage": 46.7, "elapsed_time": "5:57:20", "remaining_time": "6:47:46"} +{"current_steps": 3505, "total_steps": 7494, "loss": 0.6566, "lr": 9.629445098047334e-05, "epoch": 0.9354149986655992, "percentage": 46.77, "elapsed_time": "5:57:54", "remaining_time": "6:47:20"} +{"current_steps": 3510, "total_steps": 7494, "loss": 0.6338, "lr": 9.61268942513621e-05, "epoch": 0.9367493995196157, "percentage": 46.84, "elapsed_time": "5:58:28", "remaining_time": "6:46:52"} +{"current_steps": 3515, "total_steps": 7494, "loss": 0.6516, "lr": 9.595922290761128e-05, "epoch": 0.9380838003736323, "percentage": 46.9, "elapsed_time": "5:59:17", "remaining_time": "6:46:42"} +{"current_steps": 3520, "total_steps": 7494, "loss": 0.6287, "lr": 9.579143785884779e-05, "epoch": 0.9394182012276487, "percentage": 46.97, "elapsed_time": "5:59:50", "remaining_time": "6:46:14"} +{"current_steps": 3525, "total_steps": 7494, "loss": 0.655, "lr": 9.562354001531532e-05, "epoch": 0.9407526020816653, "percentage": 47.04, "elapsed_time": "6:00:15", "remaining_time": "6:45:38"} +{"current_steps": 3530, "total_steps": 7494, "loss": 0.6315, "lr": 9.545553028786952e-05, "epoch": 0.9420870029356819, "percentage": 47.1, "elapsed_time": "6:00:51", "remaining_time": "6:45:13"} +{"current_steps": 3535, "total_steps": 7494, "loss": 0.6407, "lr": 9.5287409587973e-05, "epoch": 0.9434214037896984, "percentage": 47.17, "elapsed_time": "6:01:42", "remaining_time": "6:45:05"} +{"current_steps": 3540, "total_steps": 7494, "loss": 0.6391, "lr": 9.511917882769042e-05, "epoch": 0.944755804643715, "percentage": 47.24, "elapsed_time": "6:02:13", "remaining_time": "6:44:34"} +{"current_steps": 3545, "total_steps": 7494, "loss": 0.6486, "lr": 9.495083891968351e-05, "epoch": 0.9460902054977315, "percentage": 47.3, "elapsed_time": "6:03:27", "remaining_time": "6:44:52"} +{"current_steps": 3550, "total_steps": 7494, "loss": 0.6499, "lr": 9.478239077720615e-05, "epoch": 0.9474246063517481, "percentage": 47.37, "elapsed_time": "6:04:06", "remaining_time": "6:44:31"} +{"current_steps": 3555, "total_steps": 7494, "loss": 0.6389, "lr": 9.461383531409937e-05, "epoch": 0.9487590072057646, "percentage": 47.44, "elapsed_time": "6:04:55", "remaining_time": "6:44:21"} +{"current_steps": 3560, "total_steps": 7494, "loss": 0.6482, "lr": 9.444517344478645e-05, "epoch": 0.9500934080597812, "percentage": 47.5, "elapsed_time": "6:05:24", "remaining_time": "6:43:47"} +{"current_steps": 3565, "total_steps": 7494, "loss": 0.6425, "lr": 9.427640608426789e-05, "epoch": 0.9514278089137977, "percentage": 47.57, "elapsed_time": "6:05:49", "remaining_time": "6:43:11"} +{"current_steps": 3570, "total_steps": 7494, "loss": 0.6377, "lr": 9.410753414811654e-05, "epoch": 0.9527622097678142, "percentage": 47.64, "elapsed_time": "6:06:32", "remaining_time": "6:42:53"} +{"current_steps": 3575, "total_steps": 7494, "loss": 0.6687, "lr": 9.393855855247254e-05, "epoch": 0.9540966106218308, "percentage": 47.7, "elapsed_time": "6:07:16", "remaining_time": "6:42:37"} +{"current_steps": 3580, "total_steps": 7494, "loss": 0.6567, "lr": 9.376948021403838e-05, "epoch": 0.9554310114758473, "percentage": 47.77, "elapsed_time": "6:07:45", "remaining_time": "6:42:03"} +{"current_steps": 3585, "total_steps": 7494, "loss": 0.647, "lr": 9.360030005007399e-05, "epoch": 0.9567654123298639, "percentage": 47.84, "elapsed_time": "6:08:10", "remaining_time": "6:41:27"} +{"current_steps": 3590, "total_steps": 7494, "loss": 0.6508, "lr": 9.343101897839169e-05, "epoch": 0.9580998131838805, "percentage": 47.9, "elapsed_time": "6:08:57", "remaining_time": "6:41:14"} +{"current_steps": 3595, "total_steps": 7494, "loss": 0.6292, "lr": 9.326163791735116e-05, "epoch": 0.959434214037897, "percentage": 47.97, "elapsed_time": "6:09:42", "remaining_time": "6:40:58"} +{"current_steps": 3600, "total_steps": 7494, "loss": 0.6457, "lr": 9.309215778585461e-05, "epoch": 0.9607686148919136, "percentage": 48.04, "elapsed_time": "6:10:09", "remaining_time": "6:40:22"} +{"current_steps": 3605, "total_steps": 7494, "loss": 0.6541, "lr": 9.29225795033417e-05, "epoch": 0.96210301574593, "percentage": 48.11, "elapsed_time": "6:10:44", "remaining_time": "6:39:56"} +{"current_steps": 3610, "total_steps": 7494, "loss": 0.6652, "lr": 9.275290398978454e-05, "epoch": 0.9634374165999466, "percentage": 48.17, "elapsed_time": "6:11:32", "remaining_time": "6:39:44"} +{"current_steps": 3615, "total_steps": 7494, "loss": 0.6461, "lr": 9.258313216568273e-05, "epoch": 0.9647718174539631, "percentage": 48.24, "elapsed_time": "6:12:12", "remaining_time": "6:39:23"} +{"current_steps": 3620, "total_steps": 7494, "loss": 0.6539, "lr": 9.241326495205836e-05, "epoch": 0.9661062183079797, "percentage": 48.31, "elapsed_time": "6:12:39", "remaining_time": "6:38:47"} +{"current_steps": 3625, "total_steps": 7494, "loss": 0.6348, "lr": 9.224330327045105e-05, "epoch": 0.9674406191619963, "percentage": 48.37, "elapsed_time": "6:13:07", "remaining_time": "6:38:14"} +{"current_steps": 3630, "total_steps": 7494, "loss": 0.6475, "lr": 9.207324804291285e-05, "epoch": 0.9687750200160128, "percentage": 48.44, "elapsed_time": "6:13:57", "remaining_time": "6:38:03"} +{"current_steps": 3635, "total_steps": 7494, "loss": 0.6444, "lr": 9.190310019200338e-05, "epoch": 0.9701094208700294, "percentage": 48.51, "elapsed_time": "6:14:36", "remaining_time": "6:37:41"} +{"current_steps": 3640, "total_steps": 7494, "loss": 0.6639, "lr": 9.173286064078465e-05, "epoch": 0.9714438217240459, "percentage": 48.57, "elapsed_time": "6:15:02", "remaining_time": "6:37:05"} +{"current_steps": 3645, "total_steps": 7494, "loss": 0.6588, "lr": 9.156253031281625e-05, "epoch": 0.9727782225780625, "percentage": 48.64, "elapsed_time": "6:15:33", "remaining_time": "6:36:34"} +{"current_steps": 3650, "total_steps": 7494, "loss": 0.6547, "lr": 9.139211013215013e-05, "epoch": 0.974112623432079, "percentage": 48.71, "elapsed_time": "6:16:24", "remaining_time": "6:36:25"} +{"current_steps": 3655, "total_steps": 7494, "loss": 0.6503, "lr": 9.122160102332583e-05, "epoch": 0.9754470242860955, "percentage": 48.77, "elapsed_time": "6:16:59", "remaining_time": "6:35:57"} +{"current_steps": 3660, "total_steps": 7494, "loss": 0.6346, "lr": 9.105100391136523e-05, "epoch": 0.9767814251401121, "percentage": 48.84, "elapsed_time": "6:17:24", "remaining_time": "6:35:20"} +{"current_steps": 3665, "total_steps": 7494, "loss": 0.6362, "lr": 9.088031972176764e-05, "epoch": 0.9781158259941286, "percentage": 48.91, "elapsed_time": "6:17:58", "remaining_time": "6:34:53"} +{"current_steps": 3670, "total_steps": 7494, "loss": 0.6569, "lr": 9.070954938050482e-05, "epoch": 0.9794502268481452, "percentage": 48.97, "elapsed_time": "6:19:09", "remaining_time": "6:35:04"} +{"current_steps": 3675, "total_steps": 7494, "loss": 0.6471, "lr": 9.053869381401589e-05, "epoch": 0.9807846277021617, "percentage": 49.04, "elapsed_time": "6:20:15", "remaining_time": "6:35:09"} +{"current_steps": 3680, "total_steps": 7494, "loss": 0.6474, "lr": 9.036775394920228e-05, "epoch": 0.9821190285561783, "percentage": 49.11, "elapsed_time": "6:21:09", "remaining_time": "6:35:01"} +{"current_steps": 3685, "total_steps": 7494, "loss": 0.643, "lr": 9.01967307134228e-05, "epoch": 0.9834534294101949, "percentage": 49.17, "elapsed_time": "6:21:44", "remaining_time": "6:34:35"} +{"current_steps": 3690, "total_steps": 7494, "loss": 0.6352, "lr": 9.00256250344885e-05, "epoch": 0.9847878302642114, "percentage": 49.24, "elapsed_time": "6:22:33", "remaining_time": "6:34:22"} +{"current_steps": 3695, "total_steps": 7494, "loss": 0.6347, "lr": 8.985443784065774e-05, "epoch": 0.9861222311182279, "percentage": 49.31, "elapsed_time": "6:23:04", "remaining_time": "6:33:51"} +{"current_steps": 3700, "total_steps": 7494, "loss": 0.643, "lr": 8.968317006063107e-05, "epoch": 0.9874566319722444, "percentage": 49.37, "elapsed_time": "6:23:29", "remaining_time": "6:33:14"} +{"current_steps": 3705, "total_steps": 7494, "loss": 0.6226, "lr": 8.951182262354624e-05, "epoch": 0.988791032826261, "percentage": 49.44, "elapsed_time": "6:24:19", "remaining_time": "6:33:01"} +{"current_steps": 3710, "total_steps": 7494, "loss": 0.6508, "lr": 8.934039645897316e-05, "epoch": 0.9901254336802775, "percentage": 49.51, "elapsed_time": "6:25:04", "remaining_time": "6:32:45"} +{"current_steps": 3715, "total_steps": 7494, "loss": 0.6598, "lr": 8.916889249690877e-05, "epoch": 0.9914598345342941, "percentage": 49.57, "elapsed_time": "6:25:35", "remaining_time": "6:32:13"} +{"current_steps": 3720, "total_steps": 7494, "loss": 0.6583, "lr": 8.899731166777216e-05, "epoch": 0.9927942353883107, "percentage": 49.64, "elapsed_time": "6:26:00", "remaining_time": "6:31:36"} +{"current_steps": 3725, "total_steps": 7494, "loss": 0.6259, "lr": 8.882565490239935e-05, "epoch": 0.9941286362423272, "percentage": 49.71, "elapsed_time": "6:26:41", "remaining_time": "6:31:15"} +{"current_steps": 3730, "total_steps": 7494, "loss": 0.6402, "lr": 8.865392313203839e-05, "epoch": 0.9954630370963438, "percentage": 49.77, "elapsed_time": "6:27:53", "remaining_time": "6:31:25"} +{"current_steps": 3735, "total_steps": 7494, "loss": 0.6633, "lr": 8.848211728834415e-05, "epoch": 0.9967974379503602, "percentage": 49.84, "elapsed_time": "6:28:21", "remaining_time": "6:30:51"} +{"current_steps": 3740, "total_steps": 7494, "loss": 0.6602, "lr": 8.831023830337348e-05, "epoch": 0.9981318388043768, "percentage": 49.91, "elapsed_time": "6:28:47", "remaining_time": "6:30:14"} +{"current_steps": 3745, "total_steps": 7494, "loss": 0.6247, "lr": 8.813828710957987e-05, "epoch": 0.9994662396583934, "percentage": 49.97, "elapsed_time": "6:29:33", "remaining_time": "6:29:58"} +{"current_steps": 3750, "total_steps": 7494, "loss": 0.6313, "lr": 8.796626463980863e-05, "epoch": 1.00080064051241, "percentage": 50.04, "elapsed_time": "6:30:22", "remaining_time": "6:29:44"} +{"current_steps": 3755, "total_steps": 7494, "loss": 0.6395, "lr": 8.779417182729181e-05, "epoch": 1.0021350413664265, "percentage": 50.11, "elapsed_time": "6:30:51", "remaining_time": "6:29:11"} +{"current_steps": 3760, "total_steps": 7494, "loss": 0.6428, "lr": 8.762200960564295e-05, "epoch": 1.003469442220443, "percentage": 50.17, "elapsed_time": "6:31:20", "remaining_time": "6:28:37"} +{"current_steps": 3765, "total_steps": 7494, "loss": 0.6372, "lr": 8.744977890885218e-05, "epoch": 1.0048038430744595, "percentage": 50.24, "elapsed_time": "6:32:44", "remaining_time": "6:28:58"} +{"current_steps": 3770, "total_steps": 7494, "loss": 0.6441, "lr": 8.727748067128116e-05, "epoch": 1.006138243928476, "percentage": 50.31, "elapsed_time": "6:33:29", "remaining_time": "6:28:41"} +{"current_steps": 3775, "total_steps": 7494, "loss": 0.6408, "lr": 8.71051158276579e-05, "epoch": 1.0074726447824927, "percentage": 50.37, "elapsed_time": "6:33:57", "remaining_time": "6:28:06"} +{"current_steps": 3780, "total_steps": 7494, "loss": 0.6495, "lr": 8.693268531307182e-05, "epoch": 1.0088070456365092, "percentage": 50.44, "elapsed_time": "6:34:25", "remaining_time": "6:27:31"} +{"current_steps": 3785, "total_steps": 7494, "loss": 0.6424, "lr": 8.676019006296851e-05, "epoch": 1.0101414464905258, "percentage": 50.51, "elapsed_time": "6:35:16", "remaining_time": "6:27:20"} +{"current_steps": 3790, "total_steps": 7494, "loss": 0.647, "lr": 8.658763101314484e-05, "epoch": 1.0114758473445422, "percentage": 50.57, "elapsed_time": "6:35:55", "remaining_time": "6:26:56"} +{"current_steps": 3795, "total_steps": 7494, "loss": 0.6323, "lr": 8.64150090997438e-05, "epoch": 1.0128102481985588, "percentage": 50.64, "elapsed_time": "6:36:21", "remaining_time": "6:26:20"} +{"current_steps": 3800, "total_steps": 7494, "loss": 0.6433, "lr": 8.624232525924936e-05, "epoch": 1.0141446490525754, "percentage": 50.71, "elapsed_time": "6:36:53", "remaining_time": "6:25:49"} +{"current_steps": 3805, "total_steps": 7494, "loss": 0.6422, "lr": 8.606958042848145e-05, "epoch": 1.015479049906592, "percentage": 50.77, "elapsed_time": "6:37:53", "remaining_time": "6:25:46"} +{"current_steps": 3810, "total_steps": 7494, "loss": 0.625, "lr": 8.589677554459094e-05, "epoch": 1.0168134507606086, "percentage": 50.84, "elapsed_time": "6:38:32", "remaining_time": "6:25:21"} +{"current_steps": 3815, "total_steps": 7494, "loss": 0.6216, "lr": 8.572391154505444e-05, "epoch": 1.018147851614625, "percentage": 50.91, "elapsed_time": "6:38:58", "remaining_time": "6:24:44"} +{"current_steps": 3820, "total_steps": 7494, "loss": 0.6308, "lr": 8.555098936766927e-05, "epoch": 1.0194822524686415, "percentage": 50.97, "elapsed_time": "6:39:32", "remaining_time": "6:24:16"} +{"current_steps": 3825, "total_steps": 7494, "loss": 0.6519, "lr": 8.537800995054838e-05, "epoch": 1.0208166533226581, "percentage": 51.04, "elapsed_time": "6:40:24", "remaining_time": "6:24:04"} +{"current_steps": 3830, "total_steps": 7494, "loss": 0.6176, "lr": 8.520497423211527e-05, "epoch": 1.0221510541766747, "percentage": 51.11, "elapsed_time": "6:40:59", "remaining_time": "6:23:37"} +{"current_steps": 3835, "total_steps": 7494, "loss": 0.6472, "lr": 8.503188315109881e-05, "epoch": 1.0234854550306913, "percentage": 51.17, "elapsed_time": "6:41:25", "remaining_time": "6:22:59"} +{"current_steps": 3840, "total_steps": 7494, "loss": 0.6325, "lr": 8.485873764652832e-05, "epoch": 1.0248198558847077, "percentage": 51.24, "elapsed_time": "6:42:01", "remaining_time": "6:22:32"} +{"current_steps": 3845, "total_steps": 7494, "loss": 0.6202, "lr": 8.468553865772826e-05, "epoch": 1.0261542567387243, "percentage": 51.31, "elapsed_time": "6:42:49", "remaining_time": "6:22:17"} +{"current_steps": 3850, "total_steps": 7494, "loss": 0.6344, "lr": 8.451228712431332e-05, "epoch": 1.0274886575927409, "percentage": 51.37, "elapsed_time": "6:43:23", "remaining_time": "6:21:48"} +{"current_steps": 3855, "total_steps": 7494, "loss": 0.6433, "lr": 8.433898398618319e-05, "epoch": 1.0288230584467575, "percentage": 51.44, "elapsed_time": "6:43:48", "remaining_time": "6:21:10"} +{"current_steps": 3860, "total_steps": 7494, "loss": 0.6209, "lr": 8.416563018351758e-05, "epoch": 1.0301574593007738, "percentage": 51.51, "elapsed_time": "6:44:27", "remaining_time": "6:20:46"} +{"current_steps": 3865, "total_steps": 7494, "loss": 0.646, "lr": 8.399222665677105e-05, "epoch": 1.0314918601547904, "percentage": 51.57, "elapsed_time": "6:45:14", "remaining_time": "6:20:30"} +{"current_steps": 3870, "total_steps": 7494, "loss": 0.6246, "lr": 8.381877434666784e-05, "epoch": 1.032826261008807, "percentage": 51.64, "elapsed_time": "6:45:46", "remaining_time": "6:19:58"} +{"current_steps": 3875, "total_steps": 7494, "loss": 0.6268, "lr": 8.364527419419696e-05, "epoch": 1.0341606618628236, "percentage": 51.71, "elapsed_time": "6:46:11", "remaining_time": "6:19:21"} +{"current_steps": 3880, "total_steps": 7494, "loss": 0.6366, "lr": 8.347172714060686e-05, "epoch": 1.0354950627168402, "percentage": 51.77, "elapsed_time": "6:46:53", "remaining_time": "6:19:00"} +{"current_steps": 3885, "total_steps": 7494, "loss": 0.6228, "lr": 8.32981341274005e-05, "epoch": 1.0368294635708566, "percentage": 51.84, "elapsed_time": "6:47:44", "remaining_time": "6:18:46"} +{"current_steps": 3890, "total_steps": 7494, "loss": 0.634, "lr": 8.312449609633014e-05, "epoch": 1.0381638644248732, "percentage": 51.91, "elapsed_time": "6:48:13", "remaining_time": "6:18:12"} +{"current_steps": 3895, "total_steps": 7494, "loss": 0.6264, "lr": 8.295081398939227e-05, "epoch": 1.0394982652788898, "percentage": 51.97, "elapsed_time": "6:48:39", "remaining_time": "6:17:36"} +{"current_steps": 3900, "total_steps": 7494, "loss": 0.6278, "lr": 8.277708874882252e-05, "epoch": 1.0408326661329064, "percentage": 52.04, "elapsed_time": "6:49:23", "remaining_time": "6:17:16"} +{"current_steps": 3905, "total_steps": 7494, "loss": 0.6284, "lr": 8.26033213170905e-05, "epoch": 1.042167066986923, "percentage": 52.11, "elapsed_time": "6:50:19", "remaining_time": "6:17:07"} +{"current_steps": 3910, "total_steps": 7494, "loss": 0.6477, "lr": 8.242951263689468e-05, "epoch": 1.0435014678409393, "percentage": 52.18, "elapsed_time": "6:50:48", "remaining_time": "6:16:33"} +{"current_steps": 3915, "total_steps": 7494, "loss": 0.6357, "lr": 8.225566365115738e-05, "epoch": 1.044835868694956, "percentage": 52.24, "elapsed_time": "6:51:14", "remaining_time": "6:15:57"} +{"current_steps": 3920, "total_steps": 7494, "loss": 0.6354, "lr": 8.20817753030195e-05, "epoch": 1.0461702695489725, "percentage": 52.31, "elapsed_time": "6:52:02", "remaining_time": "6:15:40"} +{"current_steps": 3925, "total_steps": 7494, "loss": 0.656, "lr": 8.190784853583554e-05, "epoch": 1.0475046704029891, "percentage": 52.38, "elapsed_time": "6:52:48", "remaining_time": "6:15:21"} +{"current_steps": 3930, "total_steps": 7494, "loss": 0.6417, "lr": 8.17338842931684e-05, "epoch": 1.0488390712570057, "percentage": 52.44, "elapsed_time": "6:53:15", "remaining_time": "6:14:46"} +{"current_steps": 3935, "total_steps": 7494, "loss": 0.6276, "lr": 8.155988351878433e-05, "epoch": 1.050173472111022, "percentage": 52.51, "elapsed_time": "6:53:43", "remaining_time": "6:14:11"} +{"current_steps": 3940, "total_steps": 7494, "loss": 0.6578, "lr": 8.138584715664766e-05, "epoch": 1.0515078729650387, "percentage": 52.58, "elapsed_time": "6:54:57", "remaining_time": "6:14:18"} +{"current_steps": 3945, "total_steps": 7494, "loss": 0.6457, "lr": 8.121177615091591e-05, "epoch": 1.0528422738190553, "percentage": 52.64, "elapsed_time": "6:55:39", "remaining_time": "6:13:55"} +{"current_steps": 3950, "total_steps": 7494, "loss": 0.6341, "lr": 8.103767144593445e-05, "epoch": 1.0541766746730719, "percentage": 52.71, "elapsed_time": "6:56:06", "remaining_time": "6:13:20"} +{"current_steps": 3955, "total_steps": 7494, "loss": 0.628, "lr": 8.086353398623154e-05, "epoch": 1.0555110755270882, "percentage": 52.78, "elapsed_time": "6:57:02", "remaining_time": "6:13:10"} +{"current_steps": 3960, "total_steps": 7494, "loss": 0.6425, "lr": 8.068936471651308e-05, "epoch": 1.0568454763811048, "percentage": 52.84, "elapsed_time": "6:58:14", "remaining_time": "6:13:14"} +{"current_steps": 3965, "total_steps": 7494, "loss": 0.6308, "lr": 8.051516458165759e-05, "epoch": 1.0581798772351214, "percentage": 52.91, "elapsed_time": "6:58:55", "remaining_time": "6:12:51"} +{"current_steps": 3970, "total_steps": 7494, "loss": 0.6433, "lr": 8.0340934526711e-05, "epoch": 1.059514278089138, "percentage": 52.98, "elapsed_time": "6:59:54", "remaining_time": "6:12:43"} +{"current_steps": 3975, "total_steps": 7494, "loss": 0.633, "lr": 8.016667549688157e-05, "epoch": 1.0608486789431546, "percentage": 53.04, "elapsed_time": "7:00:58", "remaining_time": "6:12:40"} +{"current_steps": 3980, "total_steps": 7494, "loss": 0.6357, "lr": 7.999238843753474e-05, "epoch": 1.062183079797171, "percentage": 53.11, "elapsed_time": "7:01:47", "remaining_time": "6:12:24"} +{"current_steps": 3985, "total_steps": 7494, "loss": 0.6644, "lr": 7.981807429418803e-05, "epoch": 1.0635174806511876, "percentage": 53.18, "elapsed_time": "7:04:20", "remaining_time": "6:13:39"} +{"current_steps": 3990, "total_steps": 7494, "loss": 0.6214, "lr": 7.96437340125059e-05, "epoch": 1.0648518815052042, "percentage": 53.24, "elapsed_time": "7:04:46", "remaining_time": "6:13:02"} +{"current_steps": 3995, "total_steps": 7494, "loss": 0.6405, "lr": 7.946936853829458e-05, "epoch": 1.0661862823592207, "percentage": 53.31, "elapsed_time": "7:05:20", "remaining_time": "6:12:31"} +{"current_steps": 4000, "total_steps": 7494, "loss": 0.6363, "lr": 7.929497881749699e-05, "epoch": 1.0675206832132373, "percentage": 53.38, "elapsed_time": "7:06:11", "remaining_time": "6:12:16"} +{"current_steps": 4005, "total_steps": 7494, "loss": 0.648, "lr": 7.912056579618759e-05, "epoch": 1.0688550840672537, "percentage": 53.44, "elapsed_time": "7:06:57", "remaining_time": "6:11:56"} +{"current_steps": 4010, "total_steps": 7494, "loss": 0.6189, "lr": 7.894613042056721e-05, "epoch": 1.0701894849212703, "percentage": 53.51, "elapsed_time": "7:07:22", "remaining_time": "6:11:19"} +{"current_steps": 4015, "total_steps": 7494, "loss": 0.6405, "lr": 7.877167363695805e-05, "epoch": 1.071523885775287, "percentage": 53.58, "elapsed_time": "7:07:59", "remaining_time": "6:10:51"} +{"current_steps": 4020, "total_steps": 7494, "loss": 0.6227, "lr": 7.859719639179834e-05, "epoch": 1.0728582866293035, "percentage": 53.64, "elapsed_time": "7:08:50", "remaining_time": "6:10:35"} +{"current_steps": 4025, "total_steps": 7494, "loss": 0.6403, "lr": 7.842269963163735e-05, "epoch": 1.07419268748332, "percentage": 53.71, "elapsed_time": "7:10:36", "remaining_time": "6:11:07"} +{"current_steps": 4030, "total_steps": 7494, "loss": 0.635, "lr": 7.824818430313028e-05, "epoch": 1.0755270883373365, "percentage": 53.78, "elapsed_time": "7:11:02", "remaining_time": "6:10:30"} +{"current_steps": 4035, "total_steps": 7494, "loss": 0.6517, "lr": 7.807365135303299e-05, "epoch": 1.076861489191353, "percentage": 53.84, "elapsed_time": "7:11:41", "remaining_time": "6:10:04"} +{"current_steps": 4040, "total_steps": 7494, "loss": 0.635, "lr": 7.789910172819693e-05, "epoch": 1.0781958900453696, "percentage": 53.91, "elapsed_time": "7:14:47", "remaining_time": "6:11:43"} +{"current_steps": 4045, "total_steps": 7494, "loss": 0.6592, "lr": 7.772453637556411e-05, "epoch": 1.0795302908993862, "percentage": 53.98, "elapsed_time": "7:16:30", "remaining_time": "6:12:11"} +{"current_steps": 4050, "total_steps": 7494, "loss": 0.6371, "lr": 7.754995624216176e-05, "epoch": 1.0808646917534026, "percentage": 54.04, "elapsed_time": "7:19:08", "remaining_time": "6:13:26"} +{"current_steps": 4055, "total_steps": 7494, "loss": 0.6304, "lr": 7.737536227509734e-05, "epoch": 1.0821990926074192, "percentage": 54.11, "elapsed_time": "7:19:49", "remaining_time": "6:13:01"} +{"current_steps": 4060, "total_steps": 7494, "loss": 0.6645, "lr": 7.720075542155336e-05, "epoch": 1.0835334934614358, "percentage": 54.18, "elapsed_time": "7:20:33", "remaining_time": "6:12:38"} +{"current_steps": 4065, "total_steps": 7494, "loss": 0.6523, "lr": 7.702613662878223e-05, "epoch": 1.0848678943154524, "percentage": 54.24, "elapsed_time": "7:21:06", "remaining_time": "6:12:05"} +{"current_steps": 4070, "total_steps": 7494, "loss": 0.6336, "lr": 7.685150684410114e-05, "epoch": 1.086202295169469, "percentage": 54.31, "elapsed_time": "7:22:44", "remaining_time": "6:12:27"} +{"current_steps": 4075, "total_steps": 7494, "loss": 0.6369, "lr": 7.667686701488688e-05, "epoch": 1.0875366960234856, "percentage": 54.38, "elapsed_time": "7:24:53", "remaining_time": "6:13:16"} +{"current_steps": 4080, "total_steps": 7494, "loss": 0.6425, "lr": 7.650221808857081e-05, "epoch": 1.088871096877502, "percentage": 54.44, "elapsed_time": "7:25:41", "remaining_time": "6:12:56"} +{"current_steps": 4085, "total_steps": 7494, "loss": 0.6231, "lr": 7.632756101263358e-05, "epoch": 1.0902054977315185, "percentage": 54.51, "elapsed_time": "7:29:00", "remaining_time": "6:14:42"} +{"current_steps": 4090, "total_steps": 7494, "loss": 0.6376, "lr": 7.615289673460003e-05, "epoch": 1.0915398985855351, "percentage": 54.58, "elapsed_time": "7:29:53", "remaining_time": "6:14:26"} +{"current_steps": 4095, "total_steps": 7494, "loss": 0.6268, "lr": 7.59782262020341e-05, "epoch": 1.0928742994395517, "percentage": 54.64, "elapsed_time": "7:31:48", "remaining_time": "6:15:00"} +{"current_steps": 4100, "total_steps": 7494, "loss": 0.6381, "lr": 7.580355036253372e-05, "epoch": 1.094208700293568, "percentage": 54.71, "elapsed_time": "7:33:18", "remaining_time": "6:15:14"} +{"current_steps": 4105, "total_steps": 7494, "loss": 0.6436, "lr": 7.562887016372551e-05, "epoch": 1.0955431011475847, "percentage": 54.78, "elapsed_time": "7:33:56", "remaining_time": "6:14:45"} +{"current_steps": 4110, "total_steps": 7494, "loss": 0.6389, "lr": 7.54541865532598e-05, "epoch": 1.0968775020016013, "percentage": 54.84, "elapsed_time": "7:34:24", "remaining_time": "6:14:08"} +{"current_steps": 4115, "total_steps": 7494, "loss": 0.6378, "lr": 7.527950047880543e-05, "epoch": 1.0982119028556179, "percentage": 54.91, "elapsed_time": "7:35:10", "remaining_time": "6:13:45"} +{"current_steps": 4120, "total_steps": 7494, "loss": 0.644, "lr": 7.51048128880446e-05, "epoch": 1.0995463037096345, "percentage": 54.98, "elapsed_time": "7:35:52", "remaining_time": "6:13:20"} +{"current_steps": 4125, "total_steps": 7494, "loss": 0.6383, "lr": 7.493012472866769e-05, "epoch": 1.1008807045636508, "percentage": 55.04, "elapsed_time": "7:36:20", "remaining_time": "6:12:42"} +{"current_steps": 4130, "total_steps": 7494, "loss": 0.6371, "lr": 7.47554369483682e-05, "epoch": 1.1022151054176674, "percentage": 55.11, "elapsed_time": "7:36:50", "remaining_time": "6:12:06"} +{"current_steps": 4135, "total_steps": 7494, "loss": 0.6299, "lr": 7.458075049483762e-05, "epoch": 1.103549506271684, "percentage": 55.18, "elapsed_time": "7:37:39", "remaining_time": "6:11:46"} +{"current_steps": 4140, "total_steps": 7494, "loss": 0.6378, "lr": 7.44060663157602e-05, "epoch": 1.1048839071257006, "percentage": 55.24, "elapsed_time": "7:39:54", "remaining_time": "6:12:35"} +{"current_steps": 4145, "total_steps": 7494, "loss": 0.638, "lr": 7.423138535880779e-05, "epoch": 1.1062183079797172, "percentage": 55.31, "elapsed_time": "7:40:21", "remaining_time": "6:11:57"} +{"current_steps": 4150, "total_steps": 7494, "loss": 0.6476, "lr": 7.405670857163489e-05, "epoch": 1.1075527088337336, "percentage": 55.38, "elapsed_time": "7:40:52", "remaining_time": "6:11:21"} +{"current_steps": 4155, "total_steps": 7494, "loss": 0.6384, "lr": 7.388203690187325e-05, "epoch": 1.1088871096877502, "percentage": 55.44, "elapsed_time": "7:41:41", "remaining_time": "6:11:00"} +{"current_steps": 4160, "total_steps": 7494, "loss": 0.6242, "lr": 7.370737129712695e-05, "epoch": 1.1102215105417668, "percentage": 55.51, "elapsed_time": "7:42:20", "remaining_time": "6:10:32"} +{"current_steps": 4165, "total_steps": 7494, "loss": 0.6458, "lr": 7.353271270496713e-05, "epoch": 1.1115559113957834, "percentage": 55.58, "elapsed_time": "7:42:46", "remaining_time": "6:09:53"} +{"current_steps": 4170, "total_steps": 7494, "loss": 0.6408, "lr": 7.335806207292687e-05, "epoch": 1.1128903122498, "percentage": 55.64, "elapsed_time": "7:43:19", "remaining_time": "6:09:19"} +{"current_steps": 4175, "total_steps": 7494, "loss": 0.6408, "lr": 7.31834203484961e-05, "epoch": 1.1142247131038163, "percentage": 55.71, "elapsed_time": "7:44:07", "remaining_time": "6:08:57"} +{"current_steps": 4180, "total_steps": 7494, "loss": 0.6432, "lr": 7.300878847911642e-05, "epoch": 1.115559113957833, "percentage": 55.78, "elapsed_time": "7:44:44", "remaining_time": "6:08:27"} +{"current_steps": 4185, "total_steps": 7494, "loss": 0.6211, "lr": 7.283416741217595e-05, "epoch": 1.1168935148118495, "percentage": 55.84, "elapsed_time": "7:45:10", "remaining_time": "6:07:48"} +{"current_steps": 4190, "total_steps": 7494, "loss": 0.6513, "lr": 7.26595580950042e-05, "epoch": 1.118227915665866, "percentage": 55.91, "elapsed_time": "7:45:46", "remaining_time": "6:07:17"} +{"current_steps": 4195, "total_steps": 7494, "loss": 0.6189, "lr": 7.248496147486695e-05, "epoch": 1.1195623165198825, "percentage": 55.98, "elapsed_time": "7:46:36", "remaining_time": "6:06:56"} +{"current_steps": 4200, "total_steps": 7494, "loss": 0.6451, "lr": 7.23103784989611e-05, "epoch": 1.120896717373899, "percentage": 56.04, "elapsed_time": "7:47:10", "remaining_time": "6:06:23"} +{"current_steps": 4205, "total_steps": 7494, "loss": 0.6671, "lr": 7.213581011440954e-05, "epoch": 1.1222311182279157, "percentage": 56.11, "elapsed_time": "7:47:44", "remaining_time": "6:05:51"} +{"current_steps": 4210, "total_steps": 7494, "loss": 0.6377, "lr": 7.1961257268256e-05, "epoch": 1.1235655190819323, "percentage": 56.18, "elapsed_time": "7:48:40", "remaining_time": "6:05:35"} +{"current_steps": 4215, "total_steps": 7494, "loss": 0.6286, "lr": 7.178672090745986e-05, "epoch": 1.1248999199359488, "percentage": 56.24, "elapsed_time": "7:50:05", "remaining_time": "6:05:42"} +{"current_steps": 4220, "total_steps": 7494, "loss": 0.6409, "lr": 7.161220197889114e-05, "epoch": 1.1262343207899652, "percentage": 56.31, "elapsed_time": "7:50:39", "remaining_time": "6:05:08"} +{"current_steps": 4225, "total_steps": 7494, "loss": 0.6389, "lr": 7.143770142932524e-05, "epoch": 1.1275687216439818, "percentage": 56.38, "elapsed_time": "7:52:17", "remaining_time": "6:05:25"} +{"current_steps": 4230, "total_steps": 7494, "loss": 0.6336, "lr": 7.126322020543785e-05, "epoch": 1.1289031224979984, "percentage": 56.45, "elapsed_time": "7:52:56", "remaining_time": "6:04:56"} +{"current_steps": 4235, "total_steps": 7494, "loss": 0.6333, "lr": 7.108875925379991e-05, "epoch": 1.130237523352015, "percentage": 56.51, "elapsed_time": "7:53:44", "remaining_time": "6:04:34"} +{"current_steps": 4240, "total_steps": 7494, "loss": 0.6535, "lr": 7.091431952087221e-05, "epoch": 1.1315719242060316, "percentage": 56.58, "elapsed_time": "7:54:17", "remaining_time": "6:03:59"} +{"current_steps": 4245, "total_steps": 7494, "loss": 0.6308, "lr": 7.073990195300058e-05, "epoch": 1.132906325060048, "percentage": 56.65, "elapsed_time": "7:54:42", "remaining_time": "6:03:20"} +{"current_steps": 4250, "total_steps": 7494, "loss": 0.6361, "lr": 7.056550749641056e-05, "epoch": 1.1342407259140646, "percentage": 56.71, "elapsed_time": "7:55:25", "remaining_time": "6:02:53"} +{"current_steps": 4255, "total_steps": 7494, "loss": 0.6367, "lr": 7.039113709720227e-05, "epoch": 1.1355751267680811, "percentage": 56.78, "elapsed_time": "7:56:11", "remaining_time": "6:02:29"} +{"current_steps": 4260, "total_steps": 7494, "loss": 0.6264, "lr": 7.021679170134533e-05, "epoch": 1.1369095276220977, "percentage": 56.85, "elapsed_time": "7:56:43", "remaining_time": "6:01:54"} +{"current_steps": 4265, "total_steps": 7494, "loss": 0.6317, "lr": 7.004247225467381e-05, "epoch": 1.1382439284761143, "percentage": 56.91, "elapsed_time": "7:57:10", "remaining_time": "6:01:16"} +{"current_steps": 4270, "total_steps": 7494, "loss": 0.6356, "lr": 6.986817970288082e-05, "epoch": 1.1395783293301307, "percentage": 56.98, "elapsed_time": "7:57:54", "remaining_time": "6:00:50"} +{"current_steps": 4275, "total_steps": 7494, "loss": 0.6208, "lr": 6.969391499151371e-05, "epoch": 1.1409127301841473, "percentage": 57.05, "elapsed_time": "7:58:41", "remaining_time": "6:00:26"} +{"current_steps": 4280, "total_steps": 7494, "loss": 0.6332, "lr": 6.95196790659688e-05, "epoch": 1.1422471310381639, "percentage": 57.11, "elapsed_time": "7:59:10", "remaining_time": "5:59:49"} +{"current_steps": 4285, "total_steps": 7494, "loss": 0.6453, "lr": 6.934547287148614e-05, "epoch": 1.1435815318921805, "percentage": 57.18, "elapsed_time": "7:59:38", "remaining_time": "5:59:12"} +{"current_steps": 4290, "total_steps": 7494, "loss": 0.6393, "lr": 6.917129735314455e-05, "epoch": 1.1449159327461969, "percentage": 57.25, "elapsed_time": "8:00:22", "remaining_time": "5:58:46"} +{"current_steps": 4295, "total_steps": 7494, "loss": 0.6215, "lr": 6.899715345585649e-05, "epoch": 1.1462503336002134, "percentage": 57.31, "elapsed_time": "8:01:07", "remaining_time": "5:58:21"} +{"current_steps": 4300, "total_steps": 7494, "loss": 0.6413, "lr": 6.882304212436272e-05, "epoch": 1.14758473445423, "percentage": 57.38, "elapsed_time": "8:01:36", "remaining_time": "5:57:44"} +{"current_steps": 4305, "total_steps": 7494, "loss": 0.6659, "lr": 6.864896430322745e-05, "epoch": 1.1489191353082466, "percentage": 57.45, "elapsed_time": "8:02:14", "remaining_time": "5:57:13"} +{"current_steps": 4310, "total_steps": 7494, "loss": 0.6176, "lr": 6.84749209368331e-05, "epoch": 1.1502535361622632, "percentage": 57.51, "elapsed_time": "8:04:16", "remaining_time": "5:57:45"} +{"current_steps": 4315, "total_steps": 7494, "loss": 0.6325, "lr": 6.830091296937509e-05, "epoch": 1.1515879370162796, "percentage": 57.58, "elapsed_time": "8:04:59", "remaining_time": "5:57:18"} +{"current_steps": 4320, "total_steps": 7494, "loss": 0.6368, "lr": 6.812694134485686e-05, "epoch": 1.1529223378702962, "percentage": 57.65, "elapsed_time": "8:05:27", "remaining_time": "5:56:40"} +{"current_steps": 4325, "total_steps": 7494, "loss": 0.6403, "lr": 6.795300700708466e-05, "epoch": 1.1542567387243128, "percentage": 57.71, "elapsed_time": "8:05:57", "remaining_time": "5:56:04"} +{"current_steps": 4330, "total_steps": 7494, "loss": 0.6278, "lr": 6.777911089966245e-05, "epoch": 1.1555911395783294, "percentage": 57.78, "elapsed_time": "8:06:42", "remaining_time": "5:55:38"} +{"current_steps": 4335, "total_steps": 7494, "loss": 0.6498, "lr": 6.760525396598686e-05, "epoch": 1.156925540432346, "percentage": 57.85, "elapsed_time": "8:07:25", "remaining_time": "5:55:11"} +{"current_steps": 4340, "total_steps": 7494, "loss": 0.6239, "lr": 6.74314371492419e-05, "epoch": 1.1582599412863623, "percentage": 57.91, "elapsed_time": "8:07:52", "remaining_time": "5:54:33"} +{"current_steps": 4345, "total_steps": 7494, "loss": 0.6372, "lr": 6.725766139239399e-05, "epoch": 1.159594342140379, "percentage": 57.98, "elapsed_time": "8:08:24", "remaining_time": "5:53:57"} +{"current_steps": 4350, "total_steps": 7494, "loss": 0.6347, "lr": 6.708392763818681e-05, "epoch": 1.1609287429943955, "percentage": 58.05, "elapsed_time": "8:09:09", "remaining_time": "5:53:32"} +{"current_steps": 4355, "total_steps": 7494, "loss": 0.6488, "lr": 6.691023682913616e-05, "epoch": 1.1622631438484121, "percentage": 58.11, "elapsed_time": "8:09:48", "remaining_time": "5:53:02"} +{"current_steps": 4360, "total_steps": 7494, "loss": 0.6301, "lr": 6.673658990752484e-05, "epoch": 1.1635975447024287, "percentage": 58.18, "elapsed_time": "8:11:51", "remaining_time": "5:53:33"} +{"current_steps": 4365, "total_steps": 7494, "loss": 0.6268, "lr": 6.656298781539764e-05, "epoch": 1.164931945556445, "percentage": 58.25, "elapsed_time": "8:12:27", "remaining_time": "5:53:01"} +{"current_steps": 4370, "total_steps": 7494, "loss": 0.6417, "lr": 6.638943149455598e-05, "epoch": 1.1662663464104617, "percentage": 58.31, "elapsed_time": "8:13:58", "remaining_time": "5:53:08"} +{"current_steps": 4375, "total_steps": 7494, "loss": 0.6298, "lr": 6.621592188655314e-05, "epoch": 1.1676007472644783, "percentage": 58.38, "elapsed_time": "8:15:02", "remaining_time": "5:52:55"} +{"current_steps": 4380, "total_steps": 7494, "loss": 0.6266, "lr": 6.604245993268893e-05, "epoch": 1.1689351481184949, "percentage": 58.45, "elapsed_time": "8:15:28", "remaining_time": "5:52:15"} +{"current_steps": 4385, "total_steps": 7494, "loss": 0.635, "lr": 6.586904657400457e-05, "epoch": 1.1702695489725112, "percentage": 58.51, "elapsed_time": "8:16:54", "remaining_time": "5:52:18"} +{"current_steps": 4390, "total_steps": 7494, "loss": 0.6164, "lr": 6.569568275127769e-05, "epoch": 1.1716039498265278, "percentage": 58.58, "elapsed_time": "8:17:43", "remaining_time": "5:51:55"} +{"current_steps": 4395, "total_steps": 7494, "loss": 0.6168, "lr": 6.552236940501725e-05, "epoch": 1.1729383506805444, "percentage": 58.65, "elapsed_time": "8:18:39", "remaining_time": "5:51:37"} +{"current_steps": 4400, "total_steps": 7494, "loss": 0.6199, "lr": 6.534910747545825e-05, "epoch": 1.174272751534561, "percentage": 58.71, "elapsed_time": "8:19:06", "remaining_time": "5:50:57"} +{"current_steps": 4405, "total_steps": 7494, "loss": 0.6488, "lr": 6.517589790255686e-05, "epoch": 1.1756071523885776, "percentage": 58.78, "elapsed_time": "8:19:53", "remaining_time": "5:50:32"} +{"current_steps": 4410, "total_steps": 7494, "loss": 0.6411, "lr": 6.500274162598512e-05, "epoch": 1.1769415532425942, "percentage": 58.85, "elapsed_time": "8:20:45", "remaining_time": "5:50:11"} +{"current_steps": 4415, "total_steps": 7494, "loss": 0.6342, "lr": 6.482963958512599e-05, "epoch": 1.1782759540966106, "percentage": 58.91, "elapsed_time": "8:22:07", "remaining_time": "5:50:10"} +{"current_steps": 4420, "total_steps": 7494, "loss": 0.6277, "lr": 6.465659271906823e-05, "epoch": 1.1796103549506272, "percentage": 58.98, "elapsed_time": "8:22:33", "remaining_time": "5:49:30"} +{"current_steps": 4425, "total_steps": 7494, "loss": 0.6371, "lr": 6.448360196660116e-05, "epoch": 1.1809447558046438, "percentage": 59.05, "elapsed_time": "8:25:25", "remaining_time": "5:50:32"} +{"current_steps": 4430, "total_steps": 7494, "loss": 0.629, "lr": 6.43106682662098e-05, "epoch": 1.1822791566586603, "percentage": 59.11, "elapsed_time": "8:26:13", "remaining_time": "5:50:08"} +{"current_steps": 4435, "total_steps": 7494, "loss": 0.6173, "lr": 6.413779255606961e-05, "epoch": 1.1836135575126767, "percentage": 59.18, "elapsed_time": "8:26:47", "remaining_time": "5:49:33"} +{"current_steps": 4440, "total_steps": 7494, "loss": 0.6455, "lr": 6.396497577404143e-05, "epoch": 1.1849479583666933, "percentage": 59.25, "elapsed_time": "8:27:13", "remaining_time": "5:48:53"} +{"current_steps": 4445, "total_steps": 7494, "loss": 0.6293, "lr": 6.379221885766643e-05, "epoch": 1.18628235922071, "percentage": 59.31, "elapsed_time": "8:27:53", "remaining_time": "5:48:23"} +{"current_steps": 4450, "total_steps": 7494, "loss": 0.6231, "lr": 6.361952274416106e-05, "epoch": 1.1876167600747265, "percentage": 59.38, "elapsed_time": "8:29:51", "remaining_time": "5:48:45"} +{"current_steps": 4455, "total_steps": 7494, "loss": 0.6262, "lr": 6.344688837041177e-05, "epoch": 1.188951160928743, "percentage": 59.45, "elapsed_time": "8:30:23", "remaining_time": "5:48:09"} +{"current_steps": 4460, "total_steps": 7494, "loss": 0.6359, "lr": 6.32743166729702e-05, "epoch": 1.1902855617827595, "percentage": 59.51, "elapsed_time": "8:31:13", "remaining_time": "5:47:46"} +{"current_steps": 4465, "total_steps": 7494, "loss": 0.6485, "lr": 6.310180858804794e-05, "epoch": 1.191619962636776, "percentage": 59.58, "elapsed_time": "8:31:55", "remaining_time": "5:47:17"} +{"current_steps": 4470, "total_steps": 7494, "loss": 0.6412, "lr": 6.292936505151145e-05, "epoch": 1.1929543634907926, "percentage": 59.65, "elapsed_time": "8:32:42", "remaining_time": "5:46:50"} +{"current_steps": 4475, "total_steps": 7494, "loss": 0.6161, "lr": 6.275698699887699e-05, "epoch": 1.1942887643448092, "percentage": 59.71, "elapsed_time": "8:33:12", "remaining_time": "5:46:13"} +{"current_steps": 4480, "total_steps": 7494, "loss": 0.6344, "lr": 6.258467536530565e-05, "epoch": 1.1956231651988256, "percentage": 59.78, "elapsed_time": "8:33:40", "remaining_time": "5:45:34"} +{"current_steps": 4485, "total_steps": 7494, "loss": 0.6354, "lr": 6.241243108559811e-05, "epoch": 1.1969575660528422, "percentage": 59.85, "elapsed_time": "8:34:23", "remaining_time": "5:45:06"} +{"current_steps": 4490, "total_steps": 7494, "loss": 0.6491, "lr": 6.224025509418971e-05, "epoch": 1.1982919669068588, "percentage": 59.91, "elapsed_time": "8:35:09", "remaining_time": "5:44:39"} +{"current_steps": 4495, "total_steps": 7494, "loss": 0.6343, "lr": 6.206814832514525e-05, "epoch": 1.1996263677608754, "percentage": 59.98, "elapsed_time": "8:35:37", "remaining_time": "5:44:01"} +{"current_steps": 4500, "total_steps": 7494, "loss": 0.6299, "lr": 6.189611171215405e-05, "epoch": 1.200960768614892, "percentage": 60.05, "elapsed_time": "8:36:06", "remaining_time": "5:43:23"} +{"current_steps": 4505, "total_steps": 7494, "loss": 0.6394, "lr": 6.172414618852488e-05, "epoch": 1.2022951694689086, "percentage": 60.11, "elapsed_time": "8:36:59", "remaining_time": "5:43:00"} +{"current_steps": 4510, "total_steps": 7494, "loss": 0.6193, "lr": 6.155225268718069e-05, "epoch": 1.203629570322925, "percentage": 60.18, "elapsed_time": "8:37:44", "remaining_time": "5:42:33"} +{"current_steps": 4515, "total_steps": 7494, "loss": 0.6274, "lr": 6.138043214065385e-05, "epoch": 1.2049639711769415, "percentage": 60.25, "elapsed_time": "8:38:11", "remaining_time": "5:41:54"} +{"current_steps": 4520, "total_steps": 7494, "loss": 0.6194, "lr": 6.120868548108093e-05, "epoch": 1.2062983720309581, "percentage": 60.31, "elapsed_time": "8:40:13", "remaining_time": "5:42:17"} +{"current_steps": 4525, "total_steps": 7494, "loss": 0.6327, "lr": 6.103701364019754e-05, "epoch": 1.2076327728849747, "percentage": 60.38, "elapsed_time": "8:41:00", "remaining_time": "5:41:50"} +{"current_steps": 4530, "total_steps": 7494, "loss": 0.6431, "lr": 6.0865417549333536e-05, "epoch": 1.208967173738991, "percentage": 60.45, "elapsed_time": "8:45:10", "remaining_time": "5:43:37"} +{"current_steps": 4535, "total_steps": 7494, "loss": 0.6433, "lr": 6.0693898139407786e-05, "epoch": 1.2103015745930077, "percentage": 60.52, "elapsed_time": "8:45:38", "remaining_time": "5:42:58"} +{"current_steps": 4540, "total_steps": 7494, "loss": 0.6261, "lr": 6.0522456340923085e-05, "epoch": 1.2116359754470243, "percentage": 60.58, "elapsed_time": "8:46:10", "remaining_time": "5:42:21"} +{"current_steps": 4545, "total_steps": 7494, "loss": 0.6203, "lr": 6.0351093083961267e-05, "epoch": 1.2129703763010409, "percentage": 60.65, "elapsed_time": "8:46:57", "remaining_time": "5:41:54"} +{"current_steps": 4550, "total_steps": 7494, "loss": 0.6292, "lr": 6.017980929817807e-05, "epoch": 1.2143047771550575, "percentage": 60.72, "elapsed_time": "8:48:07", "remaining_time": "5:41:42"} +{"current_steps": 4555, "total_steps": 7494, "loss": 0.6325, "lr": 6.000860591279801e-05, "epoch": 1.2156391780090738, "percentage": 60.78, "elapsed_time": "8:49:34", "remaining_time": "5:41:41"} +{"current_steps": 4560, "total_steps": 7494, "loss": 0.6353, "lr": 5.9837483856609527e-05, "epoch": 1.2169735788630904, "percentage": 60.85, "elapsed_time": "8:50:06", "remaining_time": "5:41:05"} +{"current_steps": 4565, "total_steps": 7494, "loss": 0.631, "lr": 5.966644405795982e-05, "epoch": 1.218307979717107, "percentage": 60.92, "elapsed_time": "8:50:55", "remaining_time": "5:40:39"} +{"current_steps": 4570, "total_steps": 7494, "loss": 0.6214, "lr": 5.949548744474978e-05, "epoch": 1.2196423805711236, "percentage": 60.98, "elapsed_time": "8:53:02", "remaining_time": "5:41:03"} +{"current_steps": 4575, "total_steps": 7494, "loss": 0.6387, "lr": 5.9324614944429095e-05, "epoch": 1.22097678142514, "percentage": 61.05, "elapsed_time": "8:53:29", "remaining_time": "5:40:23"} +{"current_steps": 4580, "total_steps": 7494, "loss": 0.6431, "lr": 5.915382748399105e-05, "epoch": 1.2223111822791566, "percentage": 61.12, "elapsed_time": "8:54:04", "remaining_time": "5:39:48"} +{"current_steps": 4585, "total_steps": 7494, "loss": 0.6493, "lr": 5.8983125989967646e-05, "epoch": 1.2236455831331732, "percentage": 61.18, "elapsed_time": "8:54:53", "remaining_time": "5:39:22"} +{"current_steps": 4590, "total_steps": 7494, "loss": 0.6277, "lr": 5.881251138842453e-05, "epoch": 1.2249799839871898, "percentage": 61.25, "elapsed_time": "8:55:29", "remaining_time": "5:38:47"} +{"current_steps": 4595, "total_steps": 7494, "loss": 0.6351, "lr": 5.864198460495585e-05, "epoch": 1.2263143848412064, "percentage": 61.32, "elapsed_time": "8:55:55", "remaining_time": "5:38:07"} +{"current_steps": 4600, "total_steps": 7494, "loss": 0.6319, "lr": 5.847154656467944e-05, "epoch": 1.227648785695223, "percentage": 61.38, "elapsed_time": "8:56:52", "remaining_time": "5:37:45"} +{"current_steps": 4605, "total_steps": 7494, "loss": 0.6267, "lr": 5.830119819223166e-05, "epoch": 1.2289831865492393, "percentage": 61.45, "elapsed_time": "8:58:15", "remaining_time": "5:37:40"} +{"current_steps": 4610, "total_steps": 7494, "loss": 0.6249, "lr": 5.8130940411762406e-05, "epoch": 1.230317587403256, "percentage": 61.52, "elapsed_time": "8:58:49", "remaining_time": "5:37:05"} +{"current_steps": 4615, "total_steps": 7494, "loss": 0.6445, "lr": 5.79607741469301e-05, "epoch": 1.2316519882572725, "percentage": 61.58, "elapsed_time": "8:59:37", "remaining_time": "5:36:38"} +{"current_steps": 4620, "total_steps": 7494, "loss": 0.6387, "lr": 5.779070032089674e-05, "epoch": 1.232986389111289, "percentage": 61.65, "elapsed_time": "9:00:16", "remaining_time": "5:36:05"} +{"current_steps": 4625, "total_steps": 7494, "loss": 0.6263, "lr": 5.762071985632276e-05, "epoch": 1.2343207899653055, "percentage": 61.72, "elapsed_time": "9:01:04", "remaining_time": "5:35:38"} +{"current_steps": 4630, "total_steps": 7494, "loss": 0.6245, "lr": 5.745083367536217e-05, "epoch": 1.235655190819322, "percentage": 61.78, "elapsed_time": "9:01:37", "remaining_time": "5:35:01"} +{"current_steps": 4635, "total_steps": 7494, "loss": 0.6388, "lr": 5.7281042699657465e-05, "epoch": 1.2369895916733387, "percentage": 61.85, "elapsed_time": "9:02:03", "remaining_time": "5:34:21"} +{"current_steps": 4640, "total_steps": 7494, "loss": 0.633, "lr": 5.71113478503346e-05, "epoch": 1.2383239925273553, "percentage": 61.92, "elapsed_time": "9:02:43", "remaining_time": "5:33:49"} +{"current_steps": 4645, "total_steps": 7494, "loss": 0.6361, "lr": 5.694175004799814e-05, "epoch": 1.2396583933813718, "percentage": 61.98, "elapsed_time": "9:03:27", "remaining_time": "5:33:19"} +{"current_steps": 4650, "total_steps": 7494, "loss": 0.6229, "lr": 5.6772250212726025e-05, "epoch": 1.2409927942353882, "percentage": 62.05, "elapsed_time": "9:04:47", "remaining_time": "5:33:11"} +{"current_steps": 4655, "total_steps": 7494, "loss": 0.6241, "lr": 5.660284926406484e-05, "epoch": 1.2423271950894048, "percentage": 62.12, "elapsed_time": "9:05:14", "remaining_time": "5:32:32"} +{"current_steps": 4660, "total_steps": 7494, "loss": 0.6395, "lr": 5.64335481210247e-05, "epoch": 1.2436615959434214, "percentage": 62.18, "elapsed_time": "9:07:47", "remaining_time": "5:33:08"} +{"current_steps": 4665, "total_steps": 7494, "loss": 0.6264, "lr": 5.626434770207414e-05, "epoch": 1.244995996797438, "percentage": 62.25, "elapsed_time": "9:08:57", "remaining_time": "5:32:54"} +{"current_steps": 4670, "total_steps": 7494, "loss": 0.627, "lr": 5.60952489251354e-05, "epoch": 1.2463303976514546, "percentage": 62.32, "elapsed_time": "9:09:49", "remaining_time": "5:32:29"} +{"current_steps": 4675, "total_steps": 7494, "loss": 0.6383, "lr": 5.592625270757928e-05, "epoch": 1.247664798505471, "percentage": 62.38, "elapsed_time": "9:12:14", "remaining_time": "5:33:00"} +{"current_steps": 4680, "total_steps": 7494, "loss": 0.6178, "lr": 5.575735996622011e-05, "epoch": 1.2489991993594876, "percentage": 62.45, "elapsed_time": "9:14:04", "remaining_time": "5:33:09"} +{"current_steps": 4685, "total_steps": 7494, "loss": 0.6328, "lr": 5.558857161731093e-05, "epoch": 1.2503336002135041, "percentage": 62.52, "elapsed_time": "9:14:52", "remaining_time": "5:32:41"} +{"current_steps": 4690, "total_steps": 7494, "loss": 0.6305, "lr": 5.541988857653847e-05, "epoch": 1.2516680010675207, "percentage": 62.58, "elapsed_time": "9:15:22", "remaining_time": "5:32:02"} +{"current_steps": 4695, "total_steps": 7494, "loss": 0.6289, "lr": 5.5251311759018046e-05, "epoch": 1.2530024019215373, "percentage": 62.65, "elapsed_time": "9:16:11", "remaining_time": "5:31:35"} +{"current_steps": 4700, "total_steps": 7494, "loss": 0.6305, "lr": 5.508284207928879e-05, "epoch": 1.2543368027755537, "percentage": 62.72, "elapsed_time": "9:16:55", "remaining_time": "5:31:04"} +{"current_steps": 4705, "total_steps": 7494, "loss": 0.6244, "lr": 5.491448045130865e-05, "epoch": 1.2556712036295703, "percentage": 62.78, "elapsed_time": "9:17:50", "remaining_time": "5:30:40"} +{"current_steps": 4710, "total_steps": 7494, "loss": 0.6192, "lr": 5.4746227788449236e-05, "epoch": 1.257005604483587, "percentage": 62.85, "elapsed_time": "9:18:19", "remaining_time": "5:30:01"} +{"current_steps": 4715, "total_steps": 7494, "loss": 0.633, "lr": 5.457808500349115e-05, "epoch": 1.2583400053376035, "percentage": 62.92, "elapsed_time": "9:18:49", "remaining_time": "5:29:22"} +{"current_steps": 4720, "total_steps": 7494, "loss": 0.6271, "lr": 5.441005300861887e-05, "epoch": 1.2596744061916199, "percentage": 62.98, "elapsed_time": "9:21:33", "remaining_time": "5:30:02"} +{"current_steps": 4725, "total_steps": 7494, "loss": 0.6518, "lr": 5.424213271541578e-05, "epoch": 1.2610088070456364, "percentage": 63.05, "elapsed_time": "9:22:17", "remaining_time": "5:29:31"} +{"current_steps": 4730, "total_steps": 7494, "loss": 0.6266, "lr": 5.4074325034859336e-05, "epoch": 1.262343207899653, "percentage": 63.12, "elapsed_time": "9:22:46", "remaining_time": "5:28:51"} +{"current_steps": 4735, "total_steps": 7494, "loss": 0.641, "lr": 5.390663087731605e-05, "epoch": 1.2636776087536696, "percentage": 63.18, "elapsed_time": "9:23:16", "remaining_time": "5:28:12"} +{"current_steps": 4740, "total_steps": 7494, "loss": 0.6199, "lr": 5.3739051152536506e-05, "epoch": 1.2650120096076862, "percentage": 63.25, "elapsed_time": "9:24:01", "remaining_time": "5:27:42"} +{"current_steps": 4745, "total_steps": 7494, "loss": 0.634, "lr": 5.357158676965059e-05, "epoch": 1.2663464104617028, "percentage": 63.32, "elapsed_time": "9:24:42", "remaining_time": "5:27:09"} +{"current_steps": 4750, "total_steps": 7494, "loss": 0.6364, "lr": 5.3404238637162364e-05, "epoch": 1.2676808113157192, "percentage": 63.38, "elapsed_time": "9:25:10", "remaining_time": "5:26:29"} +{"current_steps": 4755, "total_steps": 7494, "loss": 0.6269, "lr": 5.323700766294526e-05, "epoch": 1.2690152121697358, "percentage": 63.45, "elapsed_time": "9:25:43", "remaining_time": "5:25:52"} +{"current_steps": 4760, "total_steps": 7494, "loss": 0.625, "lr": 5.306989475423712e-05, "epoch": 1.2703496130237524, "percentage": 63.52, "elapsed_time": "9:26:30", "remaining_time": "5:25:22"} +{"current_steps": 4765, "total_steps": 7494, "loss": 0.6395, "lr": 5.2902900817635264e-05, "epoch": 1.2716840138777687, "percentage": 63.58, "elapsed_time": "9:27:08", "remaining_time": "5:24:48"} +{"current_steps": 4770, "total_steps": 7494, "loss": 0.6528, "lr": 5.273602675909159e-05, "epoch": 1.2730184147317853, "percentage": 63.65, "elapsed_time": "9:27:36", "remaining_time": "5:24:08"} +{"current_steps": 4775, "total_steps": 7494, "loss": 0.6384, "lr": 5.256927348390765e-05, "epoch": 1.274352815585802, "percentage": 63.72, "elapsed_time": "9:28:10", "remaining_time": "5:23:31"} +{"current_steps": 4780, "total_steps": 7494, "loss": 0.6329, "lr": 5.24026418967297e-05, "epoch": 1.2756872164398185, "percentage": 63.78, "elapsed_time": "9:28:57", "remaining_time": "5:23:02"} +{"current_steps": 4785, "total_steps": 7494, "loss": 0.6168, "lr": 5.2236132901543895e-05, "epoch": 1.2770216172938351, "percentage": 63.85, "elapsed_time": "9:29:34", "remaining_time": "5:22:27"} +{"current_steps": 4790, "total_steps": 7494, "loss": 0.6283, "lr": 5.2069747401671334e-05, "epoch": 1.2783560181478517, "percentage": 63.92, "elapsed_time": "9:30:01", "remaining_time": "5:21:47"} +{"current_steps": 4795, "total_steps": 7494, "loss": 0.6343, "lr": 5.1903486299763026e-05, "epoch": 1.279690419001868, "percentage": 63.98, "elapsed_time": "9:31:27", "remaining_time": "5:21:39"} +{"current_steps": 4800, "total_steps": 7494, "loss": 0.6427, "lr": 5.173735049779523e-05, "epoch": 1.2810248198558847, "percentage": 64.05, "elapsed_time": "9:32:59", "remaining_time": "5:21:35"} +{"current_steps": 4805, "total_steps": 7494, "loss": 0.6323, "lr": 5.1571340897064454e-05, "epoch": 1.2823592207099013, "percentage": 64.12, "elapsed_time": "9:35:12", "remaining_time": "5:21:54"} +{"current_steps": 4810, "total_steps": 7494, "loss": 0.6201, "lr": 5.140545839818242e-05, "epoch": 1.2836936215639179, "percentage": 64.18, "elapsed_time": "9:35:40", "remaining_time": "5:21:13"} +{"current_steps": 4815, "total_steps": 7494, "loss": 0.6119, "lr": 5.1239703901071506e-05, "epoch": 1.2850280224179342, "percentage": 64.25, "elapsed_time": "9:38:15", "remaining_time": "5:21:44"} +{"current_steps": 4820, "total_steps": 7494, "loss": 0.6274, "lr": 5.1074078304959474e-05, "epoch": 1.2863624232719508, "percentage": 64.32, "elapsed_time": "9:40:00", "remaining_time": "5:21:46"} +{"current_steps": 4825, "total_steps": 7494, "loss": 0.6358, "lr": 5.090858250837495e-05, "epoch": 1.2876968241259674, "percentage": 64.38, "elapsed_time": "9:40:34", "remaining_time": "5:21:09"} +{"current_steps": 4830, "total_steps": 7494, "loss": 0.6267, "lr": 5.0743217409142344e-05, "epoch": 1.289031224979984, "percentage": 64.45, "elapsed_time": "9:41:02", "remaining_time": "5:20:28"} +{"current_steps": 4835, "total_steps": 7494, "loss": 0.6363, "lr": 5.057798390437696e-05, "epoch": 1.2903656258340006, "percentage": 64.52, "elapsed_time": "9:41:38", "remaining_time": "5:19:52"} +{"current_steps": 4840, "total_steps": 7494, "loss": 0.6312, "lr": 5.0412882890480266e-05, "epoch": 1.2917000266880172, "percentage": 64.59, "elapsed_time": "9:42:25", "remaining_time": "5:19:22"} +{"current_steps": 4845, "total_steps": 7494, "loss": 0.6364, "lr": 5.0247915263134984e-05, "epoch": 1.2930344275420336, "percentage": 64.65, "elapsed_time": "9:42:59", "remaining_time": "5:18:45"} +{"current_steps": 4850, "total_steps": 7494, "loss": 0.6501, "lr": 5.0083081917300086e-05, "epoch": 1.2943688283960502, "percentage": 64.72, "elapsed_time": "9:46:15", "remaining_time": "5:19:36"} +{"current_steps": 4855, "total_steps": 7494, "loss": 0.6462, "lr": 4.991838374720618e-05, "epoch": 1.2957032292500668, "percentage": 64.79, "elapsed_time": "9:49:07", "remaining_time": "5:20:13"} +{"current_steps": 4860, "total_steps": 7494, "loss": 0.6126, "lr": 4.975382164635051e-05, "epoch": 1.2970376301040831, "percentage": 64.85, "elapsed_time": "9:49:55", "remaining_time": "5:19:43"} +{"current_steps": 4865, "total_steps": 7494, "loss": 0.6373, "lr": 4.9589396507492044e-05, "epoch": 1.2983720309580997, "percentage": 64.92, "elapsed_time": "9:50:29", "remaining_time": "5:19:05"} +{"current_steps": 4870, "total_steps": 7494, "loss": 0.634, "lr": 4.942510922264686e-05, "epoch": 1.2997064318121163, "percentage": 64.99, "elapsed_time": "9:50:56", "remaining_time": "5:18:24"} +{"current_steps": 4875, "total_steps": 7494, "loss": 0.6265, "lr": 4.926096068308312e-05, "epoch": 1.301040832666133, "percentage": 65.05, "elapsed_time": "9:51:36", "remaining_time": "5:17:49"} +{"current_steps": 4880, "total_steps": 7494, "loss": 0.6388, "lr": 4.90969517793162e-05, "epoch": 1.3023752335201495, "percentage": 65.12, "elapsed_time": "9:52:22", "remaining_time": "5:17:18"} +{"current_steps": 4885, "total_steps": 7494, "loss": 0.6356, "lr": 4.893308340110407e-05, "epoch": 1.303709634374166, "percentage": 65.19, "elapsed_time": "9:52:54", "remaining_time": "5:16:39"} +{"current_steps": 4890, "total_steps": 7494, "loss": 0.6411, "lr": 4.876935643744229e-05, "epoch": 1.3050440352281825, "percentage": 65.25, "elapsed_time": "9:53:49", "remaining_time": "5:16:13"} +{"current_steps": 4895, "total_steps": 7494, "loss": 0.6362, "lr": 4.860577177655922e-05, "epoch": 1.306378436082199, "percentage": 65.32, "elapsed_time": "9:56:09", "remaining_time": "5:16:31"} +{"current_steps": 4900, "total_steps": 7494, "loss": 0.6321, "lr": 4.844233030591122e-05, "epoch": 1.3077128369362157, "percentage": 65.39, "elapsed_time": "9:57:18", "remaining_time": "5:16:12"} +{"current_steps": 4905, "total_steps": 7494, "loss": 0.6428, "lr": 4.827903291217785e-05, "epoch": 1.3090472377902322, "percentage": 65.45, "elapsed_time": "0:06:31", "remaining_time": "0:03:26"} +{"current_steps": 4910, "total_steps": 7494, "loss": 0.6271, "lr": 4.8115880481257066e-05, "epoch": 1.3103816386442486, "percentage": 65.52, "elapsed_time": "0:07:00", "remaining_time": "0:03:41"} +{"current_steps": 4915, "total_steps": 7494, "loss": 0.6139, "lr": 4.795287389826035e-05, "epoch": 1.3117160394982652, "percentage": 65.59, "elapsed_time": "0:07:27", "remaining_time": "0:03:54"} +{"current_steps": 4920, "total_steps": 7494, "loss": 0.6234, "lr": 4.779001404750797e-05, "epoch": 1.3130504403522818, "percentage": 65.65, "elapsed_time": "0:08:27", "remaining_time": "0:04:25"} +{"current_steps": 4925, "total_steps": 7494, "loss": 0.6248, "lr": 4.762730181252415e-05, "epoch": 1.3143848412062984, "percentage": 65.72, "elapsed_time": "0:08:53", "remaining_time": "0:04:38"} +{"current_steps": 4930, "total_steps": 7494, "loss": 0.6481, "lr": 4.746473807603235e-05, "epoch": 1.315719242060315, "percentage": 65.79, "elapsed_time": "0:09:19", "remaining_time": "0:04:50"} +{"current_steps": 4935, "total_steps": 7494, "loss": 0.6273, "lr": 4.730232371995029e-05, "epoch": 1.3170536429143316, "percentage": 65.85, "elapsed_time": "0:09:49", "remaining_time": "0:05:05"} +{"current_steps": 4940, "total_steps": 7494, "loss": 0.6367, "lr": 4.714005962538543e-05, "epoch": 1.318388043768348, "percentage": 65.92, "elapsed_time": "0:10:40", "remaining_time": "0:05:31"} +{"current_steps": 4945, "total_steps": 7494, "loss": 0.63, "lr": 4.6977946672630004e-05, "epoch": 1.3197224446223645, "percentage": 65.99, "elapsed_time": "0:11:05", "remaining_time": "0:05:43"} +{"current_steps": 4950, "total_steps": 7494, "loss": 0.6287, "lr": 4.681598574115622e-05, "epoch": 1.3210568454763811, "percentage": 66.05, "elapsed_time": "0:11:31", "remaining_time": "0:05:55"} +{"current_steps": 4955, "total_steps": 7494, "loss": 0.6276, "lr": 4.665417770961166e-05, "epoch": 1.3223912463303977, "percentage": 66.12, "elapsed_time": "0:12:23", "remaining_time": "0:06:20"} +{"current_steps": 4960, "total_steps": 7494, "loss": 0.6094, "lr": 4.6492523455814415e-05, "epoch": 1.323725647184414, "percentage": 66.19, "elapsed_time": "0:12:53", "remaining_time": "0:06:35"} +{"current_steps": 4965, "total_steps": 7494, "loss": 0.6304, "lr": 4.633102385674821e-05, "epoch": 1.3250600480384307, "percentage": 66.25, "elapsed_time": "0:13:18", "remaining_time": "0:06:46"} +{"current_steps": 4970, "total_steps": 7494, "loss": 0.6144, "lr": 4.616967978855788e-05, "epoch": 1.3263944488924473, "percentage": 66.32, "elapsed_time": "0:13:43", "remaining_time": "0:06:58"} +{"current_steps": 4975, "total_steps": 7494, "loss": 0.6229, "lr": 4.6008492126544476e-05, "epoch": 1.3277288497464639, "percentage": 66.39, "elapsed_time": "0:14:42", "remaining_time": "0:07:26"} +{"current_steps": 4980, "total_steps": 7494, "loss": 0.6172, "lr": 4.584746174516045e-05, "epoch": 1.3290632506004805, "percentage": 66.45, "elapsed_time": "0:15:07", "remaining_time": "0:07:38"} +{"current_steps": 4985, "total_steps": 7494, "loss": 0.6276, "lr": 4.568658951800512e-05, "epoch": 1.330397651454497, "percentage": 66.52, "elapsed_time": "0:15:32", "remaining_time": "0:07:49"} +{"current_steps": 4990, "total_steps": 7494, "loss": 0.6104, "lr": 4.552587631781969e-05, "epoch": 1.3317320523085134, "percentage": 66.59, "elapsed_time": "0:16:05", "remaining_time": "0:08:04"} +{"current_steps": 4995, "total_steps": 7494, "loss": 0.6313, "lr": 4.536532301648271e-05, "epoch": 1.33306645316253, "percentage": 66.65, "elapsed_time": "0:16:58", "remaining_time": "0:08:29"} +{"current_steps": 5000, "total_steps": 7494, "loss": 0.6297, "lr": 4.5204930485005306e-05, "epoch": 1.3344008540165466, "percentage": 66.72, "elapsed_time": "0:17:23", "remaining_time": "0:08:40"} +{"current_steps": 5005, "total_steps": 7494, "loss": 0.6221, "lr": 4.504469959352627e-05, "epoch": 1.335735254870563, "percentage": 66.79, "elapsed_time": "0:17:58", "remaining_time": "0:08:56"} +{"current_steps": 5010, "total_steps": 7494, "loss": 0.6239, "lr": 4.488463121130762e-05, "epoch": 1.3370696557245796, "percentage": 66.85, "elapsed_time": "0:18:53", "remaining_time": "0:09:22"} +{"current_steps": 5015, "total_steps": 7494, "loss": 0.621, "lr": 4.472472620672976e-05, "epoch": 1.3384040565785962, "percentage": 66.92, "elapsed_time": "0:19:22", "remaining_time": "0:09:34"} +{"current_steps": 5020, "total_steps": 7494, "loss": 0.6421, "lr": 4.4564985447286614e-05, "epoch": 1.3397384574326128, "percentage": 66.99, "elapsed_time": "0:19:47", "remaining_time": "0:09:45"} +{"current_steps": 5025, "total_steps": 7494, "loss": 0.6355, "lr": 4.440540979958124e-05, "epoch": 1.3410728582866294, "percentage": 67.05, "elapsed_time": "0:20:12", "remaining_time": "0:09:55"} +{"current_steps": 5030, "total_steps": 7494, "loss": 0.6356, "lr": 4.4246000129320867e-05, "epoch": 1.342407259140646, "percentage": 67.12, "elapsed_time": "0:21:09", "remaining_time": "0:10:21"} +{"current_steps": 5035, "total_steps": 7494, "loss": 0.6303, "lr": 4.408675730131227e-05, "epoch": 1.3437416599946623, "percentage": 67.19, "elapsed_time": "0:21:34", "remaining_time": "0:10:32"} +{"current_steps": 5040, "total_steps": 7494, "loss": 0.6183, "lr": 4.3927682179457144e-05, "epoch": 1.345076060848679, "percentage": 67.25, "elapsed_time": "0:21:59", "remaining_time": "0:10:42"} +{"current_steps": 5045, "total_steps": 7494, "loss": 0.6267, "lr": 4.376877562674737e-05, "epoch": 1.3464104617026955, "percentage": 67.32, "elapsed_time": "0:22:31", "remaining_time": "0:10:56"} +{"current_steps": 5050, "total_steps": 7494, "loss": 0.6469, "lr": 4.3610038505260264e-05, "epoch": 1.347744862556712, "percentage": 67.39, "elapsed_time": "0:23:25", "remaining_time": "0:11:20"} +{"current_steps": 5055, "total_steps": 7494, "loss": 0.6172, "lr": 4.3451471676154035e-05, "epoch": 1.3490792634107285, "percentage": 67.45, "elapsed_time": "0:23:50", "remaining_time": "0:11:30"} +{"current_steps": 5060, "total_steps": 7494, "loss": 0.6398, "lr": 4.329307599966306e-05, "epoch": 1.350413664264745, "percentage": 67.52, "elapsed_time": "0:24:15", "remaining_time": "0:11:40"} +{"current_steps": 5065, "total_steps": 7494, "loss": 0.641, "lr": 4.313485233509309e-05, "epoch": 1.3517480651187617, "percentage": 67.59, "elapsed_time": "0:25:03", "remaining_time": "0:12:01"} +{"current_steps": 5070, "total_steps": 7494, "loss": 0.628, "lr": 4.297680154081686e-05, "epoch": 1.3530824659727783, "percentage": 67.65, "elapsed_time": "0:25:39", "remaining_time": "0:12:16"} +{"current_steps": 5075, "total_steps": 7494, "loss": 0.6307, "lr": 4.2818924474269126e-05, "epoch": 1.3544168668267949, "percentage": 67.72, "elapsed_time": "0:26:04", "remaining_time": "0:12:25"} +{"current_steps": 5080, "total_steps": 7494, "loss": 0.6294, "lr": 4.266122199194226e-05, "epoch": 1.3557512676808114, "percentage": 67.79, "elapsed_time": "0:26:30", "remaining_time": "0:12:35"} +{"current_steps": 5085, "total_steps": 7494, "loss": 0.6314, "lr": 4.250369494938146e-05, "epoch": 1.3570856685348278, "percentage": 67.85, "elapsed_time": "0:27:28", "remaining_time": "0:13:00"} +{"current_steps": 5090, "total_steps": 7494, "loss": 0.6288, "lr": 4.234634420118021e-05, "epoch": 1.3584200693888444, "percentage": 67.92, "elapsed_time": "0:27:54", "remaining_time": "0:13:11"} +{"current_steps": 5095, "total_steps": 7494, "loss": 0.6506, "lr": 4.218917060097547e-05, "epoch": 1.359754470242861, "percentage": 67.99, "elapsed_time": "0:28:19", "remaining_time": "0:13:20"} +{"current_steps": 5100, "total_steps": 7494, "loss": 0.6207, "lr": 4.203217500144326e-05, "epoch": 1.3610888710968774, "percentage": 68.05, "elapsed_time": "0:28:48", "remaining_time": "0:13:31"} +{"current_steps": 5105, "total_steps": 7494, "loss": 0.6311, "lr": 4.187535825429396e-05, "epoch": 1.362423271950894, "percentage": 68.12, "elapsed_time": "0:29:54", "remaining_time": "0:13:59"} +{"current_steps": 5110, "total_steps": 7494, "loss": 0.6431, "lr": 4.171872121026753e-05, "epoch": 1.3637576728049106, "percentage": 68.19, "elapsed_time": "0:30:19", "remaining_time": "0:14:09"} +{"current_steps": 5115, "total_steps": 7494, "loss": 0.6172, "lr": 4.1562264719129165e-05, "epoch": 1.3650920736589272, "percentage": 68.25, "elapsed_time": "0:30:44", "remaining_time": "0:14:18"} +{"current_steps": 5120, "total_steps": 7494, "loss": 0.636, "lr": 4.140598962966447e-05, "epoch": 1.3664264745129437, "percentage": 68.32, "elapsed_time": "0:31:27", "remaining_time": "0:14:34"} +{"current_steps": 5125, "total_steps": 7494, "loss": 0.6253, "lr": 4.124989678967503e-05, "epoch": 1.3677608753669603, "percentage": 68.39, "elapsed_time": "0:32:10", "remaining_time": "0:14:52"} +{"current_steps": 5130, "total_steps": 7494, "loss": 0.6248, "lr": 4.109398704597357e-05, "epoch": 1.3690952762209767, "percentage": 68.45, "elapsed_time": "0:32:35", "remaining_time": "0:15:01"} +{"current_steps": 5135, "total_steps": 7494, "loss": 0.6198, "lr": 4.093826124437962e-05, "epoch": 1.3704296770749933, "percentage": 68.52, "elapsed_time": "0:33:34", "remaining_time": "0:15:25"} +{"current_steps": 5140, "total_steps": 7494, "loss": 0.6279, "lr": 4.078272022971481e-05, "epoch": 1.37176407792901, "percentage": 68.59, "elapsed_time": "0:34:31", "remaining_time": "0:15:48"} +{"current_steps": 5145, "total_steps": 7494, "loss": 0.6272, "lr": 4.06273648457982e-05, "epoch": 1.3730984787830265, "percentage": 68.65, "elapsed_time": "0:35:01", "remaining_time": "0:15:59"} +{"current_steps": 5150, "total_steps": 7494, "loss": 0.6371, "lr": 4.0472195935441904e-05, "epoch": 1.3744328796370429, "percentage": 68.72, "elapsed_time": "0:35:26", "remaining_time": "0:16:07"} +{"current_steps": 5155, "total_steps": 7494, "loss": 0.624, "lr": 4.031721434044635e-05, "epoch": 1.3757672804910595, "percentage": 68.79, "elapsed_time": "0:35:53", "remaining_time": "0:16:16"} +{"current_steps": 5160, "total_steps": 7494, "loss": 0.6139, "lr": 4.016242090159574e-05, "epoch": 1.377101681345076, "percentage": 68.86, "elapsed_time": "0:36:52", "remaining_time": "0:16:40"} +{"current_steps": 5165, "total_steps": 7494, "loss": 0.6104, "lr": 4.0007816458653566e-05, "epoch": 1.3784360821990926, "percentage": 68.92, "elapsed_time": "0:37:18", "remaining_time": "0:16:49"} +{"current_steps": 5170, "total_steps": 7494, "loss": 0.6257, "lr": 3.9853401850358036e-05, "epoch": 1.3797704830531092, "percentage": 68.99, "elapsed_time": "0:37:43", "remaining_time": "0:16:57"} +{"current_steps": 5175, "total_steps": 7494, "loss": 0.6298, "lr": 3.969917791441739e-05, "epoch": 1.3811048839071258, "percentage": 69.06, "elapsed_time": "0:38:19", "remaining_time": "0:17:10"} +{"current_steps": 5180, "total_steps": 7494, "loss": 0.6251, "lr": 3.954514548750553e-05, "epoch": 1.3824392847611422, "percentage": 69.12, "elapsed_time": "0:39:11", "remaining_time": "0:17:30"} +{"current_steps": 5185, "total_steps": 7494, "loss": 0.623, "lr": 3.939130540525746e-05, "epoch": 1.3837736856151588, "percentage": 69.19, "elapsed_time": "0:39:36", "remaining_time": "0:17:38"} +{"current_steps": 5190, "total_steps": 7494, "loss": 0.6362, "lr": 3.923765850226456e-05, "epoch": 1.3851080864691754, "percentage": 69.26, "elapsed_time": "0:40:01", "remaining_time": "0:17:46"} +{"current_steps": 5195, "total_steps": 7494, "loss": 0.6226, "lr": 3.908420561207032e-05, "epoch": 1.3864424873231918, "percentage": 69.32, "elapsed_time": "0:40:47", "remaining_time": "0:18:03"} +{"current_steps": 5200, "total_steps": 7494, "loss": 0.6415, "lr": 3.893094756716569e-05, "epoch": 1.3877768881772083, "percentage": 69.39, "elapsed_time": "0:41:27", "remaining_time": "0:18:17"} +{"current_steps": 5205, "total_steps": 7494, "loss": 0.6279, "lr": 3.87778851989845e-05, "epoch": 1.389111289031225, "percentage": 69.46, "elapsed_time": "0:42:01", "remaining_time": "0:18:29"} +{"current_steps": 5210, "total_steps": 7494, "loss": 0.6235, "lr": 3.862501933789908e-05, "epoch": 1.3904456898852415, "percentage": 69.52, "elapsed_time": "0:42:26", "remaining_time": "0:18:36"} +{"current_steps": 5215, "total_steps": 7494, "loss": 0.643, "lr": 3.847235081321573e-05, "epoch": 1.3917800907392581, "percentage": 69.59, "elapsed_time": "0:43:25", "remaining_time": "0:18:58"} +{"current_steps": 5220, "total_steps": 7494, "loss": 0.614, "lr": 3.831988045317007e-05, "epoch": 1.3931144915932747, "percentage": 69.66, "elapsed_time": "0:43:54", "remaining_time": "0:19:07"} +{"current_steps": 5225, "total_steps": 7494, "loss": 0.6127, "lr": 3.816760908492282e-05, "epoch": 1.394448892447291, "percentage": 69.72, "elapsed_time": "0:44:19", "remaining_time": "0:19:15"} +{"current_steps": 5230, "total_steps": 7494, "loss": 0.6554, "lr": 3.8015537534555e-05, "epoch": 1.3957832933013077, "percentage": 69.79, "elapsed_time": "0:44:49", "remaining_time": "0:19:24"} +{"current_steps": 5235, "total_steps": 7494, "loss": 0.635, "lr": 3.786366662706372e-05, "epoch": 1.3971176941553243, "percentage": 69.86, "elapsed_time": "0:45:49", "remaining_time": "0:19:46"} +{"current_steps": 5240, "total_steps": 7494, "loss": 0.6295, "lr": 3.771199718635758e-05, "epoch": 1.3984520950093409, "percentage": 69.92, "elapsed_time": "0:46:14", "remaining_time": "0:19:53"} +{"current_steps": 5245, "total_steps": 7494, "loss": 0.6258, "lr": 3.756053003525213e-05, "epoch": 1.3997864958633572, "percentage": 69.99, "elapsed_time": "0:47:10", "remaining_time": "0:20:13"} +{"current_steps": 5250, "total_steps": 7494, "loss": 0.6433, "lr": 3.7409265995465577e-05, "epoch": 1.4011208967173738, "percentage": 70.06, "elapsed_time": "0:47:47", "remaining_time": "0:20:25"} +{"current_steps": 5255, "total_steps": 7494, "loss": 0.6332, "lr": 3.725820588761422e-05, "epoch": 1.4024552975713904, "percentage": 70.12, "elapsed_time": "0:48:40", "remaining_time": "0:20:44"} +{"current_steps": 5260, "total_steps": 7494, "loss": 0.6228, "lr": 3.7107350531207944e-05, "epoch": 1.403789698425407, "percentage": 70.19, "elapsed_time": "0:49:04", "remaining_time": "0:20:50"} +{"current_steps": 5265, "total_steps": 7494, "loss": 0.6378, "lr": 3.6956700744645934e-05, "epoch": 1.4051240992794236, "percentage": 70.26, "elapsed_time": "0:49:30", "remaining_time": "0:20:57"} +{"current_steps": 5270, "total_steps": 7494, "loss": 0.63, "lr": 3.6806257345212136e-05, "epoch": 1.4064585001334402, "percentage": 70.32, "elapsed_time": "0:50:19", "remaining_time": "0:21:14"} +{"current_steps": 5275, "total_steps": 7494, "loss": 0.6247, "lr": 3.665602114907075e-05, "epoch": 1.4077929009874566, "percentage": 70.39, "elapsed_time": "0:50:57", "remaining_time": "0:21:26"} +{"current_steps": 5280, "total_steps": 7494, "loss": 0.6138, "lr": 3.650599297126198e-05, "epoch": 1.4091273018414732, "percentage": 70.46, "elapsed_time": "0:51:22", "remaining_time": "0:21:32"} +{"current_steps": 5285, "total_steps": 7494, "loss": 0.6428, "lr": 3.63561736256975e-05, "epoch": 1.4104617026954898, "percentage": 70.52, "elapsed_time": "0:51:47", "remaining_time": "0:21:38"} +{"current_steps": 5290, "total_steps": 7494, "loss": 0.6222, "lr": 3.6206563925156e-05, "epoch": 1.4117961035495064, "percentage": 70.59, "elapsed_time": "0:52:44", "remaining_time": "0:21:58"} +{"current_steps": 5295, "total_steps": 7494, "loss": 0.627, "lr": 3.605716468127889e-05, "epoch": 1.4131305044035227, "percentage": 70.66, "elapsed_time": "0:53:14", "remaining_time": "0:22:06"} +{"current_steps": 5300, "total_steps": 7494, "loss": 0.6345, "lr": 3.590797670456586e-05, "epoch": 1.4144649052575393, "percentage": 70.72, "elapsed_time": "0:53:40", "remaining_time": "0:22:13"} +{"current_steps": 5305, "total_steps": 7494, "loss": 0.6368, "lr": 3.575900080437036e-05, "epoch": 1.415799306111556, "percentage": 70.79, "elapsed_time": "0:54:18", "remaining_time": "0:22:24"} +{"current_steps": 5310, "total_steps": 7494, "loss": 0.6175, "lr": 3.561023778889545e-05, "epoch": 1.4171337069655725, "percentage": 70.86, "elapsed_time": "0:55:15", "remaining_time": "0:22:43"} +{"current_steps": 5315, "total_steps": 7494, "loss": 0.6221, "lr": 3.546168846518915e-05, "epoch": 1.418468107819589, "percentage": 70.92, "elapsed_time": "0:55:40", "remaining_time": "0:22:49"} +{"current_steps": 5320, "total_steps": 7494, "loss": 0.6201, "lr": 3.531335363914027e-05, "epoch": 1.4198025086736055, "percentage": 70.99, "elapsed_time": "0:56:05", "remaining_time": "0:22:55"} +{"current_steps": 5325, "total_steps": 7494, "loss": 0.6347, "lr": 3.516523411547397e-05, "epoch": 1.421136909527622, "percentage": 71.06, "elapsed_time": "0:56:42", "remaining_time": "0:23:05"} +{"current_steps": 5330, "total_steps": 7494, "loss": 0.6259, "lr": 3.5017330697747276e-05, "epoch": 1.4224713103816387, "percentage": 71.12, "elapsed_time": "0:57:33", "remaining_time": "0:23:21"} +{"current_steps": 5335, "total_steps": 7494, "loss": 0.6299, "lr": 3.486964418834495e-05, "epoch": 1.4238057112356552, "percentage": 71.19, "elapsed_time": "0:57:58", "remaining_time": "0:23:27"} +{"current_steps": 5340, "total_steps": 7494, "loss": 0.6272, "lr": 3.472217538847496e-05, "epoch": 1.4251401120896716, "percentage": 71.26, "elapsed_time": "0:58:23", "remaining_time": "0:23:33"} +{"current_steps": 5345, "total_steps": 7494, "loss": 0.6195, "lr": 3.457492509816416e-05, "epoch": 1.4264745129436882, "percentage": 71.32, "elapsed_time": "0:59:08", "remaining_time": "0:23:46"} +{"current_steps": 5350, "total_steps": 7494, "loss": 0.6365, "lr": 3.442789411625402e-05, "epoch": 1.4278089137977048, "percentage": 71.39, "elapsed_time": "0:59:49", "remaining_time": "0:23:58"} +{"current_steps": 5355, "total_steps": 7494, "loss": 0.6354, "lr": 3.428108324039626e-05, "epoch": 1.4291433146517214, "percentage": 71.46, "elapsed_time": "1:00:15", "remaining_time": "0:24:04"} +{"current_steps": 5360, "total_steps": 7494, "loss": 0.6091, "lr": 3.413449326704843e-05, "epoch": 1.430477715505738, "percentage": 71.52, "elapsed_time": "1:00:41", "remaining_time": "0:24:09"} +{"current_steps": 5365, "total_steps": 7494, "loss": 0.6477, "lr": 3.3988124991469764e-05, "epoch": 1.4318121163597546, "percentage": 71.59, "elapsed_time": "1:01:37", "remaining_time": "0:24:27"} +{"current_steps": 5370, "total_steps": 7494, "loss": 0.6156, "lr": 3.384197920771676e-05, "epoch": 1.433146517213771, "percentage": 71.66, "elapsed_time": "1:02:11", "remaining_time": "0:24:35"} +{"current_steps": 5375, "total_steps": 7494, "loss": 0.6454, "lr": 3.36960567086388e-05, "epoch": 1.4344809180677875, "percentage": 71.72, "elapsed_time": "1:02:36", "remaining_time": "0:24:40"} +{"current_steps": 5380, "total_steps": 7494, "loss": 0.6236, "lr": 3.355035828587403e-05, "epoch": 1.4358153189218041, "percentage": 71.79, "elapsed_time": "1:03:04", "remaining_time": "0:24:47"} +{"current_steps": 5385, "total_steps": 7494, "loss": 0.6216, "lr": 3.340488472984493e-05, "epoch": 1.4371497197758207, "percentage": 71.86, "elapsed_time": "1:04:03", "remaining_time": "0:25:05"} +{"current_steps": 5390, "total_steps": 7494, "loss": 0.6291, "lr": 3.3259636829754086e-05, "epoch": 1.438484120629837, "percentage": 71.92, "elapsed_time": "1:04:30", "remaining_time": "0:25:10"} +{"current_steps": 5395, "total_steps": 7494, "loss": 0.6155, "lr": 3.3114615373579827e-05, "epoch": 1.4398185214838537, "percentage": 71.99, "elapsed_time": "1:04:55", "remaining_time": "0:25:15"} +{"current_steps": 5400, "total_steps": 7494, "loss": 0.6366, "lr": 3.296982114807207e-05, "epoch": 1.4411529223378703, "percentage": 72.06, "elapsed_time": "1:05:30", "remaining_time": "0:25:24"} +{"current_steps": 5405, "total_steps": 7494, "loss": 0.6258, "lr": 3.282525493874798e-05, "epoch": 1.4424873231918869, "percentage": 72.12, "elapsed_time": "1:06:31", "remaining_time": "0:25:42"} +{"current_steps": 5410, "total_steps": 7494, "loss": 0.6339, "lr": 3.2680917529887746e-05, "epoch": 1.4438217240459035, "percentage": 72.19, "elapsed_time": "1:06:56", "remaining_time": "0:25:47"} +{"current_steps": 5415, "total_steps": 7494, "loss": 0.6117, "lr": 3.2536809704530206e-05, "epoch": 1.44515612489992, "percentage": 72.26, "elapsed_time": "1:07:21", "remaining_time": "0:25:51"} +{"current_steps": 5420, "total_steps": 7494, "loss": 0.6285, "lr": 3.239293224446879e-05, "epoch": 1.4464905257539364, "percentage": 72.32, "elapsed_time": "1:08:04", "remaining_time": "0:26:03"} +{"current_steps": 5425, "total_steps": 7494, "loss": 0.6161, "lr": 3.224928593024719e-05, "epoch": 1.447824926607953, "percentage": 72.39, "elapsed_time": "1:08:48", "remaining_time": "0:26:14"} +{"current_steps": 5430, "total_steps": 7494, "loss": 0.6377, "lr": 3.210587154115501e-05, "epoch": 1.4491593274619696, "percentage": 72.46, "elapsed_time": "1:09:13", "remaining_time": "0:26:18"} +{"current_steps": 5435, "total_steps": 7494, "loss": 0.629, "lr": 3.196268985522376e-05, "epoch": 1.450493728315986, "percentage": 72.52, "elapsed_time": "1:09:39", "remaining_time": "0:26:23"} +{"current_steps": 5440, "total_steps": 7494, "loss": 0.6189, "lr": 3.1819741649222485e-05, "epoch": 1.4518281291700026, "percentage": 72.59, "elapsed_time": "1:10:34", "remaining_time": "0:26:38"} +{"current_steps": 5445, "total_steps": 7494, "loss": 0.649, "lr": 3.167702769865354e-05, "epoch": 1.4531625300240192, "percentage": 72.66, "elapsed_time": "1:11:10", "remaining_time": "0:26:46"} +{"current_steps": 5450, "total_steps": 7494, "loss": 0.6273, "lr": 3.153454877774849e-05, "epoch": 1.4544969308780358, "percentage": 72.72, "elapsed_time": "1:11:35", "remaining_time": "0:26:50"} +{"current_steps": 5455, "total_steps": 7494, "loss": 0.6218, "lr": 3.139230565946387e-05, "epoch": 1.4558313317320524, "percentage": 72.79, "elapsed_time": "1:12:01", "remaining_time": "0:26:55"} +{"current_steps": 5460, "total_steps": 7494, "loss": 0.6399, "lr": 3.1250299115476874e-05, "epoch": 1.457165732586069, "percentage": 72.86, "elapsed_time": "1:12:58", "remaining_time": "0:27:11"} +{"current_steps": 5465, "total_steps": 7494, "loss": 0.6288, "lr": 3.110852991618135e-05, "epoch": 1.4585001334400853, "percentage": 72.93, "elapsed_time": "1:13:28", "remaining_time": "0:27:16"} +{"current_steps": 5470, "total_steps": 7494, "loss": 0.626, "lr": 3.0966998830683536e-05, "epoch": 1.459834534294102, "percentage": 72.99, "elapsed_time": "1:13:53", "remaining_time": "0:27:20"} +{"current_steps": 5475, "total_steps": 7494, "loss": 0.6222, "lr": 3.082570662679782e-05, "epoch": 1.4611689351481185, "percentage": 73.06, "elapsed_time": "1:14:23", "remaining_time": "0:27:26"} +{"current_steps": 5480, "total_steps": 7494, "loss": 0.6261, "lr": 3.068465407104275e-05, "epoch": 1.4625033360021351, "percentage": 73.13, "elapsed_time": "1:15:18", "remaining_time": "0:27:40"} +{"current_steps": 5485, "total_steps": 7494, "loss": 0.61, "lr": 3.054384192863664e-05, "epoch": 1.4638377368561515, "percentage": 73.19, "elapsed_time": "1:15:44", "remaining_time": "0:27:44"} +{"current_steps": 5490, "total_steps": 7494, "loss": 0.6209, "lr": 3.0403270963493657e-05, "epoch": 1.465172137710168, "percentage": 73.26, "elapsed_time": "1:16:10", "remaining_time": "0:27:48"} +{"current_steps": 5495, "total_steps": 7494, "loss": 0.6313, "lr": 3.026294193821954e-05, "epoch": 1.4665065385641847, "percentage": 73.33, "elapsed_time": "1:16:49", "remaining_time": "0:27:56"} +{"current_steps": 5500, "total_steps": 7494, "loss": 0.6244, "lr": 3.012285561410742e-05, "epoch": 1.4678409394182013, "percentage": 73.39, "elapsed_time": "1:17:40", "remaining_time": "0:28:09"} +{"current_steps": 5505, "total_steps": 7494, "loss": 0.6246, "lr": 2.9983012751133852e-05, "epoch": 1.4691753402722179, "percentage": 73.46, "elapsed_time": "1:18:14", "remaining_time": "0:28:16"} +{"current_steps": 5510, "total_steps": 7494, "loss": 0.6175, "lr": 2.9843414107954588e-05, "epoch": 1.4705097411262344, "percentage": 73.53, "elapsed_time": "1:18:39", "remaining_time": "0:28:19"} +{"current_steps": 5515, "total_steps": 7494, "loss": 0.6382, "lr": 2.9704060441900402e-05, "epoch": 1.4718441419802508, "percentage": 73.59, "elapsed_time": "1:19:25", "remaining_time": "0:28:30"} +{"current_steps": 5520, "total_steps": 7494, "loss": 0.6234, "lr": 2.956495250897311e-05, "epoch": 1.4731785428342674, "percentage": 73.66, "elapsed_time": "1:20:09", "remaining_time": "0:28:39"} +{"current_steps": 5525, "total_steps": 7494, "loss": 0.6013, "lr": 2.9426091063841444e-05, "epoch": 1.474512943688284, "percentage": 73.73, "elapsed_time": "1:20:34", "remaining_time": "0:28:42"} +{"current_steps": 5530, "total_steps": 7494, "loss": 0.6269, "lr": 2.9287476859836817e-05, "epoch": 1.4758473445423004, "percentage": 73.79, "elapsed_time": "1:20:59", "remaining_time": "0:28:45"} +{"current_steps": 5535, "total_steps": 7494, "loss": 0.6364, "lr": 2.9149110648949447e-05, "epoch": 1.477181745396317, "percentage": 73.86, "elapsed_time": "1:21:50", "remaining_time": "0:28:57"} +{"current_steps": 5540, "total_steps": 7494, "loss": 0.6278, "lr": 2.9010993181824158e-05, "epoch": 1.4785161462503336, "percentage": 73.93, "elapsed_time": "1:22:25", "remaining_time": "0:29:04"} +{"current_steps": 5545, "total_steps": 7494, "loss": 0.6263, "lr": 2.8873125207756255e-05, "epoch": 1.4798505471043502, "percentage": 73.99, "elapsed_time": "1:22:50", "remaining_time": "0:29:07"} +{"current_steps": 5550, "total_steps": 7494, "loss": 0.6286, "lr": 2.8735507474687603e-05, "epoch": 1.4811849479583667, "percentage": 74.06, "elapsed_time": "1:23:17", "remaining_time": "0:29:10"} +{"current_steps": 5555, "total_steps": 7494, "loss": 0.6152, "lr": 2.859814072920249e-05, "epoch": 1.4825193488123833, "percentage": 74.13, "elapsed_time": "1:24:16", "remaining_time": "0:29:25"} +{"current_steps": 5560, "total_steps": 7494, "loss": 0.6297, "lr": 2.846102571652352e-05, "epoch": 1.4838537496663997, "percentage": 74.19, "elapsed_time": "1:24:45", "remaining_time": "0:29:29"} +{"current_steps": 5565, "total_steps": 7494, "loss": 0.6269, "lr": 2.8324163180507716e-05, "epoch": 1.4851881505204163, "percentage": 74.26, "elapsed_time": "1:25:10", "remaining_time": "0:29:31"} +{"current_steps": 5570, "total_steps": 7494, "loss": 0.6191, "lr": 2.8187553863642314e-05, "epoch": 1.486522551374433, "percentage": 74.33, "elapsed_time": "1:25:42", "remaining_time": "0:29:36"} +{"current_steps": 5575, "total_steps": 7494, "loss": 0.6375, "lr": 2.8051198507040876e-05, "epoch": 1.4878569522284495, "percentage": 74.39, "elapsed_time": "1:26:39", "remaining_time": "0:29:49"} +{"current_steps": 5580, "total_steps": 7494, "loss": 0.6257, "lr": 2.7915097850439238e-05, "epoch": 1.4891913530824659, "percentage": 74.46, "elapsed_time": "1:27:05", "remaining_time": "0:29:52"} +{"current_steps": 5585, "total_steps": 7494, "loss": 0.622, "lr": 2.7779252632191394e-05, "epoch": 1.4905257539364825, "percentage": 74.53, "elapsed_time": "1:27:30", "remaining_time": "0:29:54"} +{"current_steps": 5590, "total_steps": 7494, "loss": 0.6309, "lr": 2.7643663589265642e-05, "epoch": 1.491860154790499, "percentage": 74.59, "elapsed_time": "1:28:10", "remaining_time": "0:30:02"} +{"current_steps": 5595, "total_steps": 7494, "loss": 0.6368, "lr": 2.750833145724049e-05, "epoch": 1.4931945556445156, "percentage": 74.66, "elapsed_time": "1:29:00", "remaining_time": "0:30:12"} +{"current_steps": 5600, "total_steps": 7494, "loss": 0.6319, "lr": 2.7373256970300663e-05, "epoch": 1.4945289564985322, "percentage": 74.73, "elapsed_time": "1:29:25", "remaining_time": "0:30:14"} +{"current_steps": 5605, "total_steps": 7494, "loss": 0.6427, "lr": 2.7238440861233176e-05, "epoch": 1.4958633573525488, "percentage": 74.79, "elapsed_time": "1:30:00", "remaining_time": "0:30:20"} +{"current_steps": 5610, "total_steps": 7494, "loss": 0.6366, "lr": 2.710388386142335e-05, "epoch": 1.4971977582065652, "percentage": 74.86, "elapsed_time": "1:31:10", "remaining_time": "0:30:37"} +{"current_steps": 5615, "total_steps": 7494, "loss": 0.6328, "lr": 2.6969586700850753e-05, "epoch": 1.4985321590605818, "percentage": 74.93, "elapsed_time": "1:31:52", "remaining_time": "0:30:44"} +{"current_steps": 5620, "total_steps": 7494, "loss": 0.6234, "lr": 2.6835550108085373e-05, "epoch": 1.4998665599145984, "percentage": 74.99, "elapsed_time": "1:32:17", "remaining_time": "0:30:46"} +{"current_steps": 5625, "total_steps": 7494, "loss": 0.6214, "lr": 2.67017748102836e-05, "epoch": 1.5012009607686148, "percentage": 75.06, "elapsed_time": "1:32:44", "remaining_time": "0:30:48"} +{"current_steps": 5630, "total_steps": 7494, "loss": 0.634, "lr": 2.6568261533184233e-05, "epoch": 1.5025353616226313, "percentage": 75.13, "elapsed_time": "1:33:40", "remaining_time": "0:31:00"} +{"current_steps": 5635, "total_steps": 7494, "loss": 0.6228, "lr": 2.643501100110463e-05, "epoch": 1.503869762476648, "percentage": 75.19, "elapsed_time": "1:34:14", "remaining_time": "0:31:05"} +{"current_steps": 5640, "total_steps": 7494, "loss": 0.6309, "lr": 2.6302023936936776e-05, "epoch": 1.5052041633306645, "percentage": 75.26, "elapsed_time": "1:34:39", "remaining_time": "0:31:07"} +{"current_steps": 5645, "total_steps": 7494, "loss": 0.6271, "lr": 2.616930106214323e-05, "epoch": 1.5065385641846811, "percentage": 75.33, "elapsed_time": "1:35:08", "remaining_time": "0:31:09"} +{"current_steps": 5650, "total_steps": 7494, "loss": 0.6201, "lr": 2.6036843096753394e-05, "epoch": 1.5078729650386977, "percentage": 75.39, "elapsed_time": "1:36:05", "remaining_time": "0:31:21"} +{"current_steps": 5655, "total_steps": 7494, "loss": 0.6359, "lr": 2.5904650759359528e-05, "epoch": 1.5092073658927143, "percentage": 75.46, "elapsed_time": "1:36:34", "remaining_time": "0:31:24"} +{"current_steps": 5660, "total_steps": 7494, "loss": 0.6231, "lr": 2.5772724767112753e-05, "epoch": 1.5105417667467307, "percentage": 75.53, "elapsed_time": "1:36:59", "remaining_time": "0:31:25"} +{"current_steps": 5665, "total_steps": 7494, "loss": 0.6435, "lr": 2.564106583571933e-05, "epoch": 1.5118761676007473, "percentage": 75.59, "elapsed_time": "1:37:32", "remaining_time": "0:31:29"} +{"current_steps": 5670, "total_steps": 7494, "loss": 0.6233, "lr": 2.550967467943668e-05, "epoch": 1.5132105684547636, "percentage": 75.66, "elapsed_time": "1:38:26", "remaining_time": "0:31:40"} +{"current_steps": 5675, "total_steps": 7494, "loss": 0.6281, "lr": 2.537855201106955e-05, "epoch": 1.5145449693087802, "percentage": 75.73, "elapsed_time": "1:38:52", "remaining_time": "0:31:41"} +{"current_steps": 5680, "total_steps": 7494, "loss": 0.6366, "lr": 2.5247698541966066e-05, "epoch": 1.5158793701627968, "percentage": 75.79, "elapsed_time": "1:39:17", "remaining_time": "0:31:42"} +{"current_steps": 5685, "total_steps": 7494, "loss": 0.6266, "lr": 2.511711498201397e-05, "epoch": 1.5172137710168134, "percentage": 75.86, "elapsed_time": "1:39:57", "remaining_time": "0:31:48"} +{"current_steps": 5690, "total_steps": 7494, "loss": 0.6259, "lr": 2.4986802039636773e-05, "epoch": 1.51854817187083, "percentage": 75.93, "elapsed_time": "1:40:47", "remaining_time": "0:31:57"} +{"current_steps": 5695, "total_steps": 7494, "loss": 0.6279, "lr": 2.485676042178976e-05, "epoch": 1.5198825727248466, "percentage": 75.99, "elapsed_time": "1:41:13", "remaining_time": "0:31:58"} +{"current_steps": 5700, "total_steps": 7494, "loss": 0.6313, "lr": 2.4726990833956363e-05, "epoch": 1.5212169735788632, "percentage": 76.06, "elapsed_time": "1:41:38", "remaining_time": "0:31:59"} +{"current_steps": 5705, "total_steps": 7494, "loss": 0.6199, "lr": 2.45974939801442e-05, "epoch": 1.5225513744328798, "percentage": 76.13, "elapsed_time": "1:42:35", "remaining_time": "0:32:10"} +{"current_steps": 5710, "total_steps": 7494, "loss": 0.6134, "lr": 2.446827056288131e-05, "epoch": 1.5238857752868962, "percentage": 76.19, "elapsed_time": "1:43:19", "remaining_time": "0:32:16"} +{"current_steps": 5715, "total_steps": 7494, "loss": 0.628, "lr": 2.4339321283212276e-05, "epoch": 1.5252201761409128, "percentage": 76.26, "elapsed_time": "1:43:44", "remaining_time": "0:32:17"} +{"current_steps": 5720, "total_steps": 7494, "loss": 0.6343, "lr": 2.421064684069453e-05, "epoch": 1.5265545769949291, "percentage": 76.33, "elapsed_time": "1:44:10", "remaining_time": "0:32:18"} +{"current_steps": 5725, "total_steps": 7494, "loss": 0.6317, "lr": 2.4082247933394414e-05, "epoch": 1.5278889778489457, "percentage": 76.39, "elapsed_time": "1:45:04", "remaining_time": "0:32:28"} +{"current_steps": 5730, "total_steps": 7494, "loss": 0.6258, "lr": 2.3954125257883558e-05, "epoch": 1.5292233787029623, "percentage": 76.46, "elapsed_time": "1:45:40", "remaining_time": "0:32:31"} +{"current_steps": 5735, "total_steps": 7494, "loss": 0.6268, "lr": 2.382627950923501e-05, "epoch": 1.530557779556979, "percentage": 76.53, "elapsed_time": "1:46:05", "remaining_time": "0:32:32"} +{"current_steps": 5740, "total_steps": 7494, "loss": 0.627, "lr": 2.3698711381019398e-05, "epoch": 1.5318921804109955, "percentage": 76.59, "elapsed_time": "1:46:34", "remaining_time": "0:32:34"} +{"current_steps": 5745, "total_steps": 7494, "loss": 0.6159, "lr": 2.3571421565301315e-05, "epoch": 1.533226581265012, "percentage": 76.66, "elapsed_time": "1:47:32", "remaining_time": "0:32:44"} +{"current_steps": 5750, "total_steps": 7494, "loss": 0.6324, "lr": 2.3444410752635512e-05, "epoch": 1.5345609821190287, "percentage": 76.73, "elapsed_time": "1:48:05", "remaining_time": "0:32:47"} +{"current_steps": 5755, "total_steps": 7494, "loss": 0.6174, "lr": 2.331767963206302e-05, "epoch": 1.535895382973045, "percentage": 76.79, "elapsed_time": "1:48:31", "remaining_time": "0:32:47"} +{"current_steps": 5760, "total_steps": 7494, "loss": 0.6219, "lr": 2.319122889110763e-05, "epoch": 1.5372297838270617, "percentage": 76.86, "elapsed_time": "1:49:02", "remaining_time": "0:32:49"} +{"current_steps": 5765, "total_steps": 7494, "loss": 0.6176, "lr": 2.3065059215772057e-05, "epoch": 1.5385641846810783, "percentage": 76.93, "elapsed_time": "1:49:59", "remaining_time": "0:32:59"} +{"current_steps": 5770, "total_steps": 7494, "loss": 0.6152, "lr": 2.2939171290534127e-05, "epoch": 1.5398985855350946, "percentage": 76.99, "elapsed_time": "1:50:27", "remaining_time": "0:33:00"} +{"current_steps": 5775, "total_steps": 7494, "loss": 0.6249, "lr": 2.281356579834324e-05, "epoch": 1.5412329863891112, "percentage": 77.06, "elapsed_time": "1:50:52", "remaining_time": "0:33:00"} +{"current_steps": 5780, "total_steps": 7494, "loss": 0.6162, "lr": 2.2688243420616573e-05, "epoch": 1.5425673872431278, "percentage": 77.13, "elapsed_time": "1:51:30", "remaining_time": "0:33:04"} +{"current_steps": 5785, "total_steps": 7494, "loss": 0.637, "lr": 2.2563204837235323e-05, "epoch": 1.5439017880971444, "percentage": 77.2, "elapsed_time": "1:52:23", "remaining_time": "0:33:12"} +{"current_steps": 5790, "total_steps": 7494, "loss": 0.6082, "lr": 2.243845072654115e-05, "epoch": 1.545236188951161, "percentage": 77.26, "elapsed_time": "1:52:49", "remaining_time": "0:33:12"} +{"current_steps": 5795, "total_steps": 7494, "loss": 0.6252, "lr": 2.2313981765332464e-05, "epoch": 1.5465705898051776, "percentage": 77.33, "elapsed_time": "1:53:15", "remaining_time": "0:33:12"} +{"current_steps": 5800, "total_steps": 7494, "loss": 0.6246, "lr": 2.2189798628860604e-05, "epoch": 1.5479049906591942, "percentage": 77.4, "elapsed_time": "1:53:59", "remaining_time": "0:33:17"} +{"current_steps": 5805, "total_steps": 7494, "loss": 0.6215, "lr": 2.206590199082642e-05, "epoch": 1.5492393915132106, "percentage": 77.46, "elapsed_time": "1:54:57", "remaining_time": "0:33:26"} +{"current_steps": 5810, "total_steps": 7494, "loss": 0.6246, "lr": 2.194229252337639e-05, "epoch": 1.5505737923672271, "percentage": 77.53, "elapsed_time": "1:55:23", "remaining_time": "0:33:26"} +{"current_steps": 5815, "total_steps": 7494, "loss": 0.6169, "lr": 2.181897089709913e-05, "epoch": 1.5519081932212435, "percentage": 77.6, "elapsed_time": "1:55:49", "remaining_time": "0:33:26"} +{"current_steps": 5820, "total_steps": 7494, "loss": 0.6162, "lr": 2.1695937781021736e-05, "epoch": 1.55324259407526, "percentage": 77.66, "elapsed_time": "1:56:41", "remaining_time": "0:33:33"} +{"current_steps": 5825, "total_steps": 7494, "loss": 0.6212, "lr": 2.1573193842606007e-05, "epoch": 1.5545769949292767, "percentage": 77.73, "elapsed_time": "1:57:21", "remaining_time": "0:33:37"} +{"current_steps": 5830, "total_steps": 7494, "loss": 0.6232, "lr": 2.1450739747745034e-05, "epoch": 1.5559113957832933, "percentage": 77.8, "elapsed_time": "1:57:47", "remaining_time": "0:33:37"} +{"current_steps": 5835, "total_steps": 7494, "loss": 0.6184, "lr": 2.1328576160759486e-05, "epoch": 1.5572457966373099, "percentage": 77.86, "elapsed_time": "1:58:15", "remaining_time": "0:33:37"} +{"current_steps": 5840, "total_steps": 7494, "loss": 0.6477, "lr": 2.1206703744393936e-05, "epoch": 1.5585801974913265, "percentage": 77.93, "elapsed_time": "1:59:10", "remaining_time": "0:33:45"} +{"current_steps": 5845, "total_steps": 7494, "loss": 0.6249, "lr": 2.1085123159813398e-05, "epoch": 1.559914598345343, "percentage": 78.0, "elapsed_time": "1:59:46", "remaining_time": "0:33:47"} +{"current_steps": 5850, "total_steps": 7494, "loss": 0.6153, "lr": 2.0963835066599703e-05, "epoch": 1.5612489991993594, "percentage": 78.06, "elapsed_time": "2:00:12", "remaining_time": "0:33:46"} +{"current_steps": 5855, "total_steps": 7494, "loss": 0.6387, "lr": 2.084284012274781e-05, "epoch": 1.562583400053376, "percentage": 78.13, "elapsed_time": "2:01:09", "remaining_time": "0:33:54"} +{"current_steps": 5860, "total_steps": 7494, "loss": 0.6134, "lr": 2.0722138984662415e-05, "epoch": 1.5639178009073926, "percentage": 78.2, "elapsed_time": "2:02:08", "remaining_time": "0:34:03"} +{"current_steps": 5865, "total_steps": 7494, "loss": 0.6241, "lr": 2.0601732307154283e-05, "epoch": 1.565252201761409, "percentage": 78.26, "elapsed_time": "2:02:40", "remaining_time": "0:34:04"} +{"current_steps": 5870, "total_steps": 7494, "loss": 0.6079, "lr": 2.048162074343665e-05, "epoch": 1.5665866026154256, "percentage": 78.33, "elapsed_time": "2:03:05", "remaining_time": "0:34:03"} +{"current_steps": 5875, "total_steps": 7494, "loss": 0.6194, "lr": 2.036180494512181e-05, "epoch": 1.5679210034694422, "percentage": 78.4, "elapsed_time": "2:03:39", "remaining_time": "0:34:04"} +{"current_steps": 5880, "total_steps": 7494, "loss": 0.6357, "lr": 2.024228556221752e-05, "epoch": 1.5692554043234588, "percentage": 78.46, "elapsed_time": "2:04:36", "remaining_time": "0:34:12"} +{"current_steps": 5885, "total_steps": 7494, "loss": 0.6309, "lr": 2.0123063243123395e-05, "epoch": 1.5705898051774754, "percentage": 78.53, "elapsed_time": "2:05:03", "remaining_time": "0:34:11"} +{"current_steps": 5890, "total_steps": 7494, "loss": 0.6178, "lr": 2.000413863462754e-05, "epoch": 1.571924206031492, "percentage": 78.6, "elapsed_time": "2:05:28", "remaining_time": "0:34:10"} +{"current_steps": 5895, "total_steps": 7494, "loss": 0.6099, "lr": 1.988551238190288e-05, "epoch": 1.5732586068855086, "percentage": 78.66, "elapsed_time": "2:06:09", "remaining_time": "0:34:13"} +{"current_steps": 5900, "total_steps": 7494, "loss": 0.6257, "lr": 1.9767185128503817e-05, "epoch": 1.574593007739525, "percentage": 78.73, "elapsed_time": "2:07:00", "remaining_time": "0:34:18"} +{"current_steps": 5905, "total_steps": 7494, "loss": 0.6298, "lr": 1.9649157516362663e-05, "epoch": 1.5759274085935415, "percentage": 78.8, "elapsed_time": "2:07:35", "remaining_time": "0:34:20"} +{"current_steps": 5910, "total_steps": 7494, "loss": 0.6245, "lr": 1.953143018578607e-05, "epoch": 1.577261809447558, "percentage": 78.86, "elapsed_time": "2:08:01", "remaining_time": "0:34:18"} +{"current_steps": 5915, "total_steps": 7494, "loss": 0.6281, "lr": 1.9414003775451754e-05, "epoch": 1.5785962103015745, "percentage": 78.93, "elapsed_time": "2:08:46", "remaining_time": "0:34:22"} +{"current_steps": 5920, "total_steps": 7494, "loss": 0.6295, "lr": 1.9296878922404868e-05, "epoch": 1.579930611155591, "percentage": 79.0, "elapsed_time": "2:09:32", "remaining_time": "0:34:26"} +{"current_steps": 5925, "total_steps": 7494, "loss": 0.6268, "lr": 1.9180056262054575e-05, "epoch": 1.5812650120096077, "percentage": 79.06, "elapsed_time": "2:09:57", "remaining_time": "0:34:24"} +{"current_steps": 5930, "total_steps": 7494, "loss": 0.6261, "lr": 1.9063536428170682e-05, "epoch": 1.5825994128636243, "percentage": 79.13, "elapsed_time": "2:10:24", "remaining_time": "0:34:23"} +{"current_steps": 5935, "total_steps": 7494, "loss": 0.6265, "lr": 1.8947320052880106e-05, "epoch": 1.5839338137176409, "percentage": 79.2, "elapsed_time": "2:11:12", "remaining_time": "0:34:28"} +{"current_steps": 5940, "total_steps": 7494, "loss": 0.633, "lr": 1.8831407766663513e-05, "epoch": 1.5852682145716575, "percentage": 79.26, "elapsed_time": "2:11:54", "remaining_time": "0:34:30"} +{"current_steps": 5945, "total_steps": 7494, "loss": 0.6283, "lr": 1.8715800198351824e-05, "epoch": 1.5866026154256738, "percentage": 79.33, "elapsed_time": "2:12:19", "remaining_time": "0:34:28"} +{"current_steps": 5950, "total_steps": 7494, "loss": 0.609, "lr": 1.8600497975122877e-05, "epoch": 1.5879370162796904, "percentage": 79.4, "elapsed_time": "2:12:47", "remaining_time": "0:34:27"} +{"current_steps": 5955, "total_steps": 7494, "loss": 0.6252, "lr": 1.8485501722498024e-05, "epoch": 1.589271417133707, "percentage": 79.46, "elapsed_time": "2:13:39", "remaining_time": "0:34:32"} +{"current_steps": 5960, "total_steps": 7494, "loss": 0.6192, "lr": 1.8370812064338624e-05, "epoch": 1.5906058179877234, "percentage": 79.53, "elapsed_time": "2:14:13", "remaining_time": "0:34:32"} +{"current_steps": 5965, "total_steps": 7494, "loss": 0.6184, "lr": 1.8256429622842818e-05, "epoch": 1.59194021884174, "percentage": 79.6, "elapsed_time": "2:14:38", "remaining_time": "0:34:30"} +{"current_steps": 5970, "total_steps": 7494, "loss": 0.6188, "lr": 1.814235501854206e-05, "epoch": 1.5932746196957566, "percentage": 79.66, "elapsed_time": "2:15:09", "remaining_time": "0:34:30"} +{"current_steps": 5975, "total_steps": 7494, "loss": 0.6289, "lr": 1.8028588870297774e-05, "epoch": 1.5946090205497732, "percentage": 79.73, "elapsed_time": "2:16:03", "remaining_time": "0:34:35"} +{"current_steps": 5980, "total_steps": 7494, "loss": 0.6275, "lr": 1.7915131795297956e-05, "epoch": 1.5959434214037898, "percentage": 79.8, "elapsed_time": "2:16:35", "remaining_time": "0:34:34"} +{"current_steps": 5985, "total_steps": 7494, "loss": 0.6195, "lr": 1.7801984409053897e-05, "epoch": 1.5972778222578063, "percentage": 79.86, "elapsed_time": "2:17:00", "remaining_time": "0:34:32"} +{"current_steps": 5990, "total_steps": 7494, "loss": 0.6195, "lr": 1.7689147325396822e-05, "epoch": 1.598612223111823, "percentage": 79.93, "elapsed_time": "2:17:34", "remaining_time": "0:34:32"} +{"current_steps": 5995, "total_steps": 7494, "loss": 0.6315, "lr": 1.757662115647448e-05, "epoch": 1.5999466239658393, "percentage": 80.0, "elapsed_time": "2:18:30", "remaining_time": "0:34:37"} +{"current_steps": 6000, "total_steps": 7494, "loss": 0.6244, "lr": 1.7464406512747964e-05, "epoch": 1.601281024819856, "percentage": 80.06, "elapsed_time": "2:18:59", "remaining_time": "0:34:36"} +{"current_steps": 6005, "total_steps": 7494, "loss": 0.6293, "lr": 1.7352504002988303e-05, "epoch": 1.6026154256738723, "percentage": 80.13, "elapsed_time": "2:19:33", "remaining_time": "0:34:36"} +{"current_steps": 6010, "total_steps": 7494, "loss": 0.64, "lr": 1.7240914234273126e-05, "epoch": 1.6039498265278889, "percentage": 80.2, "elapsed_time": "2:20:13", "remaining_time": "0:34:37"} +{"current_steps": 6015, "total_steps": 7494, "loss": 0.6195, "lr": 1.7129637811983507e-05, "epoch": 1.6052842273819055, "percentage": 80.26, "elapsed_time": "2:21:06", "remaining_time": "0:34:41"} +{"current_steps": 6020, "total_steps": 7494, "loss": 0.6288, "lr": 1.7018675339800557e-05, "epoch": 1.606618628235922, "percentage": 80.33, "elapsed_time": "2:21:33", "remaining_time": "0:34:39"} +{"current_steps": 6025, "total_steps": 7494, "loss": 0.6217, "lr": 1.690802741970217e-05, "epoch": 1.6079530290899386, "percentage": 80.4, "elapsed_time": "2:21:59", "remaining_time": "0:34:37"} +{"current_steps": 6030, "total_steps": 7494, "loss": 0.6146, "lr": 1.6797694651959806e-05, "epoch": 1.6092874299439552, "percentage": 80.46, "elapsed_time": "2:22:45", "remaining_time": "0:34:39"} +{"current_steps": 6035, "total_steps": 7494, "loss": 0.6304, "lr": 1.6687677635135218e-05, "epoch": 1.6106218307979718, "percentage": 80.53, "elapsed_time": "2:23:30", "remaining_time": "0:34:41"} +{"current_steps": 6040, "total_steps": 7494, "loss": 0.631, "lr": 1.657797696607714e-05, "epoch": 1.6119562316519882, "percentage": 80.6, "elapsed_time": "2:23:56", "remaining_time": "0:34:38"} +{"current_steps": 6045, "total_steps": 7494, "loss": 0.6325, "lr": 1.6468593239918136e-05, "epoch": 1.6132906325060048, "percentage": 80.66, "elapsed_time": "2:24:22", "remaining_time": "0:34:36"} +{"current_steps": 6050, "total_steps": 7494, "loss": 0.6177, "lr": 1.635952705007136e-05, "epoch": 1.6146250333600214, "percentage": 80.73, "elapsed_time": "2:25:13", "remaining_time": "0:34:39"} +{"current_steps": 6055, "total_steps": 7494, "loss": 0.6375, "lr": 1.6250778988227248e-05, "epoch": 1.6159594342140378, "percentage": 80.8, "elapsed_time": "2:25:54", "remaining_time": "0:34:40"} +{"current_steps": 6060, "total_steps": 7494, "loss": 0.6128, "lr": 1.614234964435044e-05, "epoch": 1.6172938350680544, "percentage": 80.86, "elapsed_time": "2:26:20", "remaining_time": "0:34:37"} +{"current_steps": 6065, "total_steps": 7494, "loss": 0.6282, "lr": 1.603423960667645e-05, "epoch": 1.618628235922071, "percentage": 80.93, "elapsed_time": "2:26:48", "remaining_time": "0:34:35"} +{"current_steps": 6070, "total_steps": 7494, "loss": 0.6325, "lr": 1.5926449461708577e-05, "epoch": 1.6199626367760875, "percentage": 81.0, "elapsed_time": "2:27:39", "remaining_time": "0:34:38"} +{"current_steps": 6075, "total_steps": 7494, "loss": 0.6296, "lr": 1.581897979421471e-05, "epoch": 1.6212970376301041, "percentage": 81.06, "elapsed_time": "2:28:17", "remaining_time": "0:34:38"} +{"current_steps": 6080, "total_steps": 7494, "loss": 0.6261, "lr": 1.571183118722405e-05, "epoch": 1.6226314384841207, "percentage": 81.13, "elapsed_time": "2:28:42", "remaining_time": "0:34:35"} +{"current_steps": 6085, "total_steps": 7494, "loss": 0.6316, "lr": 1.5605004222024074e-05, "epoch": 1.6239658393381373, "percentage": 81.2, "elapsed_time": "2:29:12", "remaining_time": "0:34:33"} +{"current_steps": 6090, "total_steps": 7494, "loss": 0.6307, "lr": 1.549849947815737e-05, "epoch": 1.6253002401921537, "percentage": 81.27, "elapsed_time": "2:30:07", "remaining_time": "0:34:36"} +{"current_steps": 6095, "total_steps": 7494, "loss": 0.6336, "lr": 1.5392317533418366e-05, "epoch": 1.6266346410461703, "percentage": 81.33, "elapsed_time": "2:30:40", "remaining_time": "0:34:35"} +{"current_steps": 6100, "total_steps": 7494, "loss": 0.6164, "lr": 1.5286458963850363e-05, "epoch": 1.6279690419001867, "percentage": 81.4, "elapsed_time": "2:31:05", "remaining_time": "0:34:31"} +{"current_steps": 6105, "total_steps": 7494, "loss": 0.6209, "lr": 1.5180924343742316e-05, "epoch": 1.6293034427542032, "percentage": 81.47, "elapsed_time": "2:31:48", "remaining_time": "0:34:32"} +{"current_steps": 6110, "total_steps": 7494, "loss": 0.6094, "lr": 1.5075714245625689e-05, "epoch": 1.6306378436082198, "percentage": 81.53, "elapsed_time": "2:32:44", "remaining_time": "0:34:35"} +{"current_steps": 6115, "total_steps": 7494, "loss": 0.6174, "lr": 1.4970829240271448e-05, "epoch": 1.6319722444622364, "percentage": 81.6, "elapsed_time": "2:33:13", "remaining_time": "0:34:33"} +{"current_steps": 6120, "total_steps": 7494, "loss": 0.6557, "lr": 1.4866269896686917e-05, "epoch": 1.633306645316253, "percentage": 81.67, "elapsed_time": "2:33:39", "remaining_time": "0:34:29"} +{"current_steps": 6125, "total_steps": 7494, "loss": 0.6305, "lr": 1.4762036782112624e-05, "epoch": 1.6346410461702696, "percentage": 81.73, "elapsed_time": "2:34:18", "remaining_time": "0:34:29"} +{"current_steps": 6130, "total_steps": 7494, "loss": 0.6189, "lr": 1.465813046201934e-05, "epoch": 1.6359754470242862, "percentage": 81.8, "elapsed_time": "2:35:10", "remaining_time": "0:34:31"} +{"current_steps": 6135, "total_steps": 7494, "loss": 0.621, "lr": 1.4554551500104971e-05, "epoch": 1.6373098478783028, "percentage": 81.87, "elapsed_time": "2:35:38", "remaining_time": "0:34:28"} +{"current_steps": 6140, "total_steps": 7494, "loss": 0.625, "lr": 1.4451300458291401e-05, "epoch": 1.6386442487323192, "percentage": 81.93, "elapsed_time": "2:36:03", "remaining_time": "0:34:24"} +{"current_steps": 6145, "total_steps": 7494, "loss": 0.6175, "lr": 1.4348377896721635e-05, "epoch": 1.6399786495863358, "percentage": 82.0, "elapsed_time": "2:36:46", "remaining_time": "0:34:24"} +{"current_steps": 6150, "total_steps": 7494, "loss": 0.6243, "lr": 1.4245784373756566e-05, "epoch": 1.6413130504403521, "percentage": 82.07, "elapsed_time": "2:37:33", "remaining_time": "0:34:26"} +{"current_steps": 6155, "total_steps": 7494, "loss": 0.6307, "lr": 1.4143520445972078e-05, "epoch": 1.6426474512943687, "percentage": 82.13, "elapsed_time": "2:38:00", "remaining_time": "0:34:22"} +{"current_steps": 6160, "total_steps": 7494, "loss": 0.6298, "lr": 1.4041586668155989e-05, "epoch": 1.6439818521483853, "percentage": 82.2, "elapsed_time": "2:38:26", "remaining_time": "0:34:18"} +{"current_steps": 6165, "total_steps": 7494, "loss": 0.6049, "lr": 1.3939983593304992e-05, "epoch": 1.645316253002402, "percentage": 82.27, "elapsed_time": "2:39:13", "remaining_time": "0:34:19"} +{"current_steps": 6170, "total_steps": 7494, "loss": 0.6239, "lr": 1.3838711772621743e-05, "epoch": 1.6466506538564185, "percentage": 82.33, "elapsed_time": "2:39:56", "remaining_time": "0:34:19"} +{"current_steps": 6175, "total_steps": 7494, "loss": 0.6301, "lr": 1.3737771755511811e-05, "epoch": 1.647985054710435, "percentage": 82.4, "elapsed_time": "2:40:22", "remaining_time": "0:34:15"} +{"current_steps": 6180, "total_steps": 7494, "loss": 0.6179, "lr": 1.3637164089580673e-05, "epoch": 1.6493194555644517, "percentage": 82.47, "elapsed_time": "2:40:49", "remaining_time": "0:34:11"} +{"current_steps": 6185, "total_steps": 7494, "loss": 0.626, "lr": 1.3536889320630841e-05, "epoch": 1.650653856418468, "percentage": 82.53, "elapsed_time": "2:41:38", "remaining_time": "0:34:12"} +{"current_steps": 6190, "total_steps": 7494, "loss": 0.608, "lr": 1.3436947992658814e-05, "epoch": 1.6519882572724847, "percentage": 82.6, "elapsed_time": "2:42:20", "remaining_time": "0:34:11"} +{"current_steps": 6195, "total_steps": 7494, "loss": 0.6236, "lr": 1.3337340647852135e-05, "epoch": 1.6533226581265013, "percentage": 82.67, "elapsed_time": "2:42:45", "remaining_time": "0:34:07"} +{"current_steps": 6200, "total_steps": 7494, "loss": 0.629, "lr": 1.3238067826586491e-05, "epoch": 1.6546570589805176, "percentage": 82.73, "elapsed_time": "2:43:13", "remaining_time": "0:34:03"} +{"current_steps": 6205, "total_steps": 7494, "loss": 0.6255, "lr": 1.3139130067422792e-05, "epoch": 1.6559914598345342, "percentage": 82.8, "elapsed_time": "2:44:14", "remaining_time": "0:34:07"} +{"current_steps": 6210, "total_steps": 7494, "loss": 0.6354, "lr": 1.3040527907104126e-05, "epoch": 1.6573258606885508, "percentage": 82.87, "elapsed_time": "2:44:51", "remaining_time": "0:34:05"} +{"current_steps": 6215, "total_steps": 7494, "loss": 0.6194, "lr": 1.2942261880553012e-05, "epoch": 1.6586602615425674, "percentage": 82.93, "elapsed_time": "2:45:16", "remaining_time": "0:34:00"} +{"current_steps": 6220, "total_steps": 7494, "loss": 0.6166, "lr": 1.2844332520868433e-05, "epoch": 1.659994662396584, "percentage": 83.0, "elapsed_time": "2:45:47", "remaining_time": "0:33:57"} +{"current_steps": 6225, "total_steps": 7494, "loss": 0.6316, "lr": 1.2746740359322857e-05, "epoch": 1.6613290632506006, "percentage": 83.07, "elapsed_time": "2:46:42", "remaining_time": "0:33:58"} +{"current_steps": 6230, "total_steps": 7494, "loss": 0.6315, "lr": 1.2649485925359514e-05, "epoch": 1.6626634641046172, "percentage": 83.13, "elapsed_time": "2:47:15", "remaining_time": "0:33:55"} +{"current_steps": 6235, "total_steps": 7494, "loss": 0.6129, "lr": 1.2552569746589386e-05, "epoch": 1.6639978649586336, "percentage": 83.2, "elapsed_time": "2:47:40", "remaining_time": "0:33:51"} +{"current_steps": 6240, "total_steps": 7494, "loss": 0.6177, "lr": 1.245599234878846e-05, "epoch": 1.6653322658126501, "percentage": 83.27, "elapsed_time": "2:48:14", "remaining_time": "0:33:48"} +{"current_steps": 6245, "total_steps": 7494, "loss": 0.6274, "lr": 1.2359754255894737e-05, "epoch": 1.6666666666666665, "percentage": 83.33, "elapsed_time": "2:49:07", "remaining_time": "0:33:49"} +{"current_steps": 6250, "total_steps": 7494, "loss": 0.6341, "lr": 1.2263855990005527e-05, "epoch": 1.6680010675206831, "percentage": 83.4, "elapsed_time": "2:49:38", "remaining_time": "0:33:45"} +{"current_steps": 6255, "total_steps": 7494, "loss": 0.6287, "lr": 1.2168298071374543e-05, "epoch": 1.6693354683746997, "percentage": 83.47, "elapsed_time": "2:50:03", "remaining_time": "0:33:41"} +{"current_steps": 6260, "total_steps": 7494, "loss": 0.6193, "lr": 1.2073081018409112e-05, "epoch": 1.6706698692287163, "percentage": 83.53, "elapsed_time": "2:50:43", "remaining_time": "0:33:39"} +{"current_steps": 6265, "total_steps": 7494, "loss": 0.6278, "lr": 1.1978205347667303e-05, "epoch": 1.672004270082733, "percentage": 83.6, "elapsed_time": "2:51:35", "remaining_time": "0:33:39"} +{"current_steps": 6270, "total_steps": 7494, "loss": 0.6231, "lr": 1.1883671573855186e-05, "epoch": 1.6733386709367495, "percentage": 83.67, "elapsed_time": "2:52:03", "remaining_time": "0:33:35"} +{"current_steps": 6275, "total_steps": 7494, "loss": 0.6142, "lr": 1.1789480209824064e-05, "epoch": 1.674673071790766, "percentage": 83.73, "elapsed_time": "2:52:29", "remaining_time": "0:33:30"} +{"current_steps": 6280, "total_steps": 7494, "loss": 0.6238, "lr": 1.1695631766567562e-05, "epoch": 1.6760074726447824, "percentage": 83.8, "elapsed_time": "2:53:12", "remaining_time": "0:33:28"} +{"current_steps": 6285, "total_steps": 7494, "loss": 0.6117, "lr": 1.1602126753219005e-05, "epoch": 1.677341873498799, "percentage": 83.87, "elapsed_time": "2:53:59", "remaining_time": "0:33:28"} +{"current_steps": 6290, "total_steps": 7494, "loss": 0.628, "lr": 1.1508965677048585e-05, "epoch": 1.6786762743528156, "percentage": 83.93, "elapsed_time": "2:54:26", "remaining_time": "0:33:23"} +{"current_steps": 6295, "total_steps": 7494, "loss": 0.6156, "lr": 1.1416149043460562e-05, "epoch": 1.680010675206832, "percentage": 84.0, "elapsed_time": "2:54:52", "remaining_time": "0:33:18"} +{"current_steps": 6300, "total_steps": 7494, "loss": 0.644, "lr": 1.132367735599066e-05, "epoch": 1.6813450760608486, "percentage": 84.07, "elapsed_time": "2:55:40", "remaining_time": "0:33:17"} +{"current_steps": 6305, "total_steps": 7494, "loss": 0.6336, "lr": 1.1231551116303162e-05, "epoch": 1.6826794769148652, "percentage": 84.13, "elapsed_time": "2:56:34", "remaining_time": "0:33:17"} +{"current_steps": 6310, "total_steps": 7494, "loss": 0.6193, "lr": 1.1139770824188334e-05, "epoch": 1.6840138777688818, "percentage": 84.2, "elapsed_time": "2:57:00", "remaining_time": "0:33:12"} +{"current_steps": 6315, "total_steps": 7494, "loss": 0.6189, "lr": 1.1048336977559666e-05, "epoch": 1.6853482786228984, "percentage": 84.27, "elapsed_time": "2:57:28", "remaining_time": "0:33:08"} +{"current_steps": 6320, "total_steps": 7494, "loss": 0.6292, "lr": 1.0957250072451084e-05, "epoch": 1.686682679476915, "percentage": 84.33, "elapsed_time": "2:58:18", "remaining_time": "0:33:07"} +{"current_steps": 6325, "total_steps": 7494, "loss": 0.634, "lr": 1.0866510603014411e-05, "epoch": 1.6880170803309316, "percentage": 84.4, "elapsed_time": "2:59:01", "remaining_time": "0:33:05"} +{"current_steps": 6330, "total_steps": 7494, "loss": 0.6304, "lr": 1.0776119061516613e-05, "epoch": 1.689351481184948, "percentage": 84.47, "elapsed_time": "2:59:26", "remaining_time": "0:32:59"} +{"current_steps": 6335, "total_steps": 7494, "loss": 0.6021, "lr": 1.0686075938337055e-05, "epoch": 1.6906858820389645, "percentage": 84.53, "elapsed_time": "2:59:56", "remaining_time": "0:32:55"} +{"current_steps": 6340, "total_steps": 7494, "loss": 0.6366, "lr": 1.0596381721964984e-05, "epoch": 1.692020282892981, "percentage": 84.6, "elapsed_time": "3:00:46", "remaining_time": "0:32:54"} +{"current_steps": 6345, "total_steps": 7494, "loss": 0.6139, "lr": 1.0507036898996787e-05, "epoch": 1.6933546837469975, "percentage": 84.67, "elapsed_time": "3:01:23", "remaining_time": "0:32:50"} +{"current_steps": 6350, "total_steps": 7494, "loss": 0.6214, "lr": 1.0418041954133346e-05, "epoch": 1.694689084601014, "percentage": 84.73, "elapsed_time": "3:01:48", "remaining_time": "0:32:45"} +{"current_steps": 6355, "total_steps": 7494, "loss": 0.6276, "lr": 1.032939737017745e-05, "epoch": 1.6960234854550307, "percentage": 84.8, "elapsed_time": "3:02:19", "remaining_time": "0:32:40"} +{"current_steps": 6360, "total_steps": 7494, "loss": 0.6516, "lr": 1.02411036280312e-05, "epoch": 1.6973578863090473, "percentage": 84.87, "elapsed_time": "3:03:11", "remaining_time": "0:32:39"} +{"current_steps": 6365, "total_steps": 7494, "loss": 0.6237, "lr": 1.0153161206693269e-05, "epoch": 1.6986922871630639, "percentage": 84.93, "elapsed_time": "3:03:45", "remaining_time": "0:32:35"} +{"current_steps": 6370, "total_steps": 7494, "loss": 0.6234, "lr": 1.0065570583256483e-05, "epoch": 1.7000266880170805, "percentage": 85.0, "elapsed_time": "3:04:10", "remaining_time": "0:32:29"} +{"current_steps": 6375, "total_steps": 7494, "loss": 0.6162, "lr": 9.978332232905114e-06, "epoch": 1.7013610888710968, "percentage": 85.07, "elapsed_time": "3:04:45", "remaining_time": "0:32:25"} +{"current_steps": 6380, "total_steps": 7494, "loss": 0.6244, "lr": 9.891446628912286e-06, "epoch": 1.7026954897251134, "percentage": 85.13, "elapsed_time": "3:05:39", "remaining_time": "0:32:24"} +{"current_steps": 6385, "total_steps": 7494, "loss": 0.6195, "lr": 9.804914242637541e-06, "epoch": 1.70402989057913, "percentage": 85.2, "elapsed_time": "3:06:09", "remaining_time": "0:32:20"} +{"current_steps": 6390, "total_steps": 7494, "loss": 0.6184, "lr": 9.718735543524103e-06, "epoch": 1.7053642914331464, "percentage": 85.27, "elapsed_time": "3:06:35", "remaining_time": "0:32:14"} +{"current_steps": 6395, "total_steps": 7494, "loss": 0.6302, "lr": 9.632910999096486e-06, "epoch": 1.706698692287163, "percentage": 85.33, "elapsed_time": "3:07:14", "remaining_time": "0:32:10"} +{"current_steps": 6400, "total_steps": 7494, "loss": 0.6206, "lr": 9.547441074957884e-06, "epoch": 1.7080330931411796, "percentage": 85.4, "elapsed_time": "3:08:02", "remaining_time": "0:32:08"} +{"current_steps": 6405, "total_steps": 7494, "loss": 0.6177, "lr": 9.462326234787621e-06, "epoch": 1.7093674939951962, "percentage": 85.47, "elapsed_time": "3:08:40", "remaining_time": "0:32:04"} +{"current_steps": 6410, "total_steps": 7494, "loss": 0.6341, "lr": 9.377566940338712e-06, "epoch": 1.7107018948492128, "percentage": 85.54, "elapsed_time": "3:09:06", "remaining_time": "0:31:58"} +{"current_steps": 6415, "total_steps": 7494, "loss": 0.6171, "lr": 9.293163651435298e-06, "epoch": 1.7120362957032293, "percentage": 85.6, "elapsed_time": "3:09:49", "remaining_time": "0:31:55"} +{"current_steps": 6420, "total_steps": 7494, "loss": 0.6092, "lr": 9.20911682597015e-06, "epoch": 1.713370696557246, "percentage": 85.67, "elapsed_time": "3:10:37", "remaining_time": "0:31:53"} +{"current_steps": 6425, "total_steps": 7494, "loss": 0.5973, "lr": 9.125426919902231e-06, "epoch": 1.7147050974112623, "percentage": 85.74, "elapsed_time": "3:11:05", "remaining_time": "0:31:47"} +{"current_steps": 6430, "total_steps": 7494, "loss": 0.622, "lr": 9.042094387254212e-06, "epoch": 1.716039498265279, "percentage": 85.8, "elapsed_time": "3:11:31", "remaining_time": "0:31:41"} +{"current_steps": 6435, "total_steps": 7494, "loss": 0.6139, "lr": 8.959119680109918e-06, "epoch": 1.7173738991192953, "percentage": 85.87, "elapsed_time": "3:12:14", "remaining_time": "0:31:38"} +{"current_steps": 6440, "total_steps": 7494, "loss": 0.6222, "lr": 8.876503248612036e-06, "epoch": 1.7187082999733119, "percentage": 85.94, "elapsed_time": "3:13:00", "remaining_time": "0:31:35"} +{"current_steps": 6445, "total_steps": 7494, "loss": 0.6221, "lr": 8.794245540959546e-06, "epoch": 1.7200427008273285, "percentage": 86.0, "elapsed_time": "3:13:26", "remaining_time": "0:31:29"} +{"current_steps": 6450, "total_steps": 7494, "loss": 0.6093, "lr": 8.712347003405304e-06, "epoch": 1.721377101681345, "percentage": 86.07, "elapsed_time": "3:13:54", "remaining_time": "0:31:23"} +{"current_steps": 6455, "total_steps": 7494, "loss": 0.6162, "lr": 8.630808080253701e-06, "epoch": 1.7227115025353616, "percentage": 86.14, "elapsed_time": "3:14:40", "remaining_time": "0:31:20"} +{"current_steps": 6460, "total_steps": 7494, "loss": 0.6194, "lr": 8.549629213858192e-06, "epoch": 1.7240459033893782, "percentage": 86.2, "elapsed_time": "3:15:21", "remaining_time": "0:31:16"} +{"current_steps": 6465, "total_steps": 7494, "loss": 0.629, "lr": 8.468810844618842e-06, "epoch": 1.7253803042433948, "percentage": 86.27, "elapsed_time": "3:15:47", "remaining_time": "0:31:09"} +{"current_steps": 6470, "total_steps": 7494, "loss": 0.6222, "lr": 8.388353410980075e-06, "epoch": 1.7267147050974114, "percentage": 86.34, "elapsed_time": "3:16:16", "remaining_time": "0:31:03"} +{"current_steps": 6475, "total_steps": 7494, "loss": 0.617, "lr": 8.308257349428154e-06, "epoch": 1.7280491059514278, "percentage": 86.4, "elapsed_time": "3:17:05", "remaining_time": "0:31:01"} +{"current_steps": 6480, "total_steps": 7494, "loss": 0.6147, "lr": 8.228523094488928e-06, "epoch": 1.7293835068054444, "percentage": 86.47, "elapsed_time": "3:17:45", "remaining_time": "0:30:56"} +{"current_steps": 6485, "total_steps": 7494, "loss": 0.6319, "lr": 8.149151078725416e-06, "epoch": 1.7307179076594608, "percentage": 86.54, "elapsed_time": "3:18:11", "remaining_time": "0:30:50"} +{"current_steps": 6490, "total_steps": 7494, "loss": 0.6173, "lr": 8.070141732735424e-06, "epoch": 1.7320523085134774, "percentage": 86.6, "elapsed_time": "3:18:42", "remaining_time": "0:30:44"} +{"current_steps": 6495, "total_steps": 7494, "loss": 0.6272, "lr": 7.991495485149294e-06, "epoch": 1.733386709367494, "percentage": 86.67, "elapsed_time": "3:19:33", "remaining_time": "0:30:41"} +{"current_steps": 6500, "total_steps": 7494, "loss": 0.6255, "lr": 7.913212762627539e-06, "epoch": 1.7347211102215105, "percentage": 86.74, "elapsed_time": "3:20:10", "remaining_time": "0:30:36"} +{"current_steps": 6505, "total_steps": 7494, "loss": 0.6234, "lr": 7.835293989858527e-06, "epoch": 1.7360555110755271, "percentage": 86.8, "elapsed_time": "3:20:44", "remaining_time": "0:30:31"} +{"current_steps": 6510, "total_steps": 7494, "loss": 0.6115, "lr": 7.75773958955614e-06, "epoch": 1.7373899119295437, "percentage": 86.87, "elapsed_time": "3:21:18", "remaining_time": "0:30:25"} +{"current_steps": 6515, "total_steps": 7494, "loss": 0.6259, "lr": 7.680549982457553e-06, "epoch": 1.7387243127835603, "percentage": 86.94, "elapsed_time": "3:22:09", "remaining_time": "0:30:22"} +{"current_steps": 6520, "total_steps": 7494, "loss": 0.6347, "lr": 7.6037255873209165e-06, "epoch": 1.7400587136375767, "percentage": 87.0, "elapsed_time": "3:22:42", "remaining_time": "0:30:16"} +{"current_steps": 6525, "total_steps": 7494, "loss": 0.6265, "lr": 7.527266820923089e-06, "epoch": 1.7413931144915933, "percentage": 87.07, "elapsed_time": "3:23:07", "remaining_time": "0:30:09"} +{"current_steps": 6530, "total_steps": 7494, "loss": 0.6227, "lr": 7.45117409805733e-06, "epoch": 1.7427275153456097, "percentage": 87.14, "elapsed_time": "3:23:42", "remaining_time": "0:30:04"} +{"current_steps": 6535, "total_steps": 7494, "loss": 0.6198, "lr": 7.375447831531128e-06, "epoch": 1.7440619161996262, "percentage": 87.2, "elapsed_time": "3:24:30", "remaining_time": "0:30:00"} +{"current_steps": 6540, "total_steps": 7494, "loss": 0.6215, "lr": 7.300088432163945e-06, "epoch": 1.7453963170536428, "percentage": 87.27, "elapsed_time": "3:25:02", "remaining_time": "0:29:54"} +{"current_steps": 6545, "total_steps": 7494, "loss": 0.602, "lr": 7.2250963087849e-06, "epoch": 1.7467307179076594, "percentage": 87.34, "elapsed_time": "3:25:27", "remaining_time": "0:29:47"} +{"current_steps": 6550, "total_steps": 7494, "loss": 0.6276, "lr": 7.1504718682306754e-06, "epoch": 1.748065118761676, "percentage": 87.4, "elapsed_time": "3:26:07", "remaining_time": "0:29:42"} +{"current_steps": 6555, "total_steps": 7494, "loss": 0.6152, "lr": 7.076215515343256e-06, "epoch": 1.7493995196156926, "percentage": 87.47, "elapsed_time": "3:26:59", "remaining_time": "0:29:39"} +{"current_steps": 6560, "total_steps": 7494, "loss": 0.6431, "lr": 7.0023276529676655e-06, "epoch": 1.7507339204697092, "percentage": 87.54, "elapsed_time": "3:27:27", "remaining_time": "0:29:32"} +{"current_steps": 6565, "total_steps": 7494, "loss": 0.6173, "lr": 6.928808681949919e-06, "epoch": 1.7520683213237258, "percentage": 87.6, "elapsed_time": "3:27:53", "remaining_time": "0:29:25"} +{"current_steps": 6570, "total_steps": 7494, "loss": 0.6368, "lr": 6.855659001134739e-06, "epoch": 1.7534027221777422, "percentage": 87.67, "elapsed_time": "3:28:35", "remaining_time": "0:29:20"} +{"current_steps": 6575, "total_steps": 7494, "loss": 0.618, "lr": 6.78287900736342e-06, "epoch": 1.7547371230317588, "percentage": 87.74, "elapsed_time": "3:29:23", "remaining_time": "0:29:16"} +{"current_steps": 6580, "total_steps": 7494, "loss": 0.6122, "lr": 6.710469095471701e-06, "epoch": 1.7560715238857751, "percentage": 87.8, "elapsed_time": "3:29:52", "remaining_time": "0:29:09"} +{"current_steps": 6585, "total_steps": 7494, "loss": 0.6204, "lr": 6.638429658287603e-06, "epoch": 1.7574059247397917, "percentage": 87.87, "elapsed_time": "3:30:19", "remaining_time": "0:29:01"} +{"current_steps": 6590, "total_steps": 7494, "loss": 0.6166, "lr": 6.566761086629285e-06, "epoch": 1.7587403255938083, "percentage": 87.94, "elapsed_time": "3:31:02", "remaining_time": "0:28:56"} +{"current_steps": 6595, "total_steps": 7494, "loss": 0.6269, "lr": 6.495463769302952e-06, "epoch": 1.760074726447825, "percentage": 88.0, "elapsed_time": "3:31:49", "remaining_time": "0:28:52"} +{"current_steps": 6600, "total_steps": 7494, "loss": 0.6302, "lr": 6.424538093100745e-06, "epoch": 1.7614091273018415, "percentage": 88.07, "elapsed_time": "3:32:15", "remaining_time": "0:28:45"} +{"current_steps": 6605, "total_steps": 7494, "loss": 0.6273, "lr": 6.353984442798582e-06, "epoch": 1.762743528155858, "percentage": 88.14, "elapsed_time": "3:32:52", "remaining_time": "0:28:39"} +{"current_steps": 6610, "total_steps": 7494, "loss": 0.6126, "lr": 6.283803201154173e-06, "epoch": 1.7640779290098747, "percentage": 88.2, "elapsed_time": "3:33:37", "remaining_time": "0:28:34"} +{"current_steps": 6615, "total_steps": 7494, "loss": 0.6174, "lr": 6.213994748904866e-06, "epoch": 1.765412329863891, "percentage": 88.27, "elapsed_time": "3:34:22", "remaining_time": "0:28:29"} +{"current_steps": 6620, "total_steps": 7494, "loss": 0.6216, "lr": 6.144559464765605e-06, "epoch": 1.7667467307179077, "percentage": 88.34, "elapsed_time": "3:34:48", "remaining_time": "0:28:21"} +{"current_steps": 6625, "total_steps": 7494, "loss": 0.6267, "lr": 6.075497725426862e-06, "epoch": 1.7680811315719243, "percentage": 88.4, "elapsed_time": "3:35:17", "remaining_time": "0:28:14"} +{"current_steps": 6630, "total_steps": 7494, "loss": 0.6325, "lr": 6.0068099055526505e-06, "epoch": 1.7694155324259406, "percentage": 88.47, "elapsed_time": "3:36:06", "remaining_time": "0:28:09"} +{"current_steps": 6635, "total_steps": 7494, "loss": 0.6277, "lr": 5.938496377778395e-06, "epoch": 1.7707499332799572, "percentage": 88.54, "elapsed_time": "3:36:46", "remaining_time": "0:28:03"} +{"current_steps": 6640, "total_steps": 7494, "loss": 0.6237, "lr": 5.870557512709001e-06, "epoch": 1.7720843341339738, "percentage": 88.6, "elapsed_time": "3:37:12", "remaining_time": "0:27:56"} +{"current_steps": 6645, "total_steps": 7494, "loss": 0.6333, "lr": 5.802993678916773e-06, "epoch": 1.7734187349879904, "percentage": 88.67, "elapsed_time": "3:37:43", "remaining_time": "0:27:49"} +{"current_steps": 6650, "total_steps": 7494, "loss": 0.6253, "lr": 5.7358052429394785e-06, "epoch": 1.774753135842007, "percentage": 88.74, "elapsed_time": "3:38:33", "remaining_time": "0:27:44"} +{"current_steps": 6655, "total_steps": 7494, "loss": 0.6242, "lr": 5.668992569278347e-06, "epoch": 1.7760875366960236, "percentage": 88.8, "elapsed_time": "3:39:10", "remaining_time": "0:27:37"} +{"current_steps": 6660, "total_steps": 7494, "loss": 0.604, "lr": 5.602556020396004e-06, "epoch": 1.7774219375500402, "percentage": 88.87, "elapsed_time": "3:39:36", "remaining_time": "0:27:30"} +{"current_steps": 6665, "total_steps": 7494, "loss": 0.624, "lr": 5.5364959567146514e-06, "epoch": 1.7787563384040566, "percentage": 88.94, "elapsed_time": "3:40:09", "remaining_time": "0:27:23"} +{"current_steps": 6670, "total_steps": 7494, "loss": 0.6278, "lr": 5.470812736614014e-06, "epoch": 1.7800907392580732, "percentage": 89.0, "elapsed_time": "3:41:02", "remaining_time": "0:27:18"} +{"current_steps": 6675, "total_steps": 7494, "loss": 0.62, "lr": 5.405506716429378e-06, "epoch": 1.7814251401120895, "percentage": 89.07, "elapsed_time": "3:41:36", "remaining_time": "0:27:11"} +{"current_steps": 6680, "total_steps": 7494, "loss": 0.6066, "lr": 5.340578250449742e-06, "epoch": 1.7827595409661061, "percentage": 89.14, "elapsed_time": "3:42:01", "remaining_time": "0:27:03"} +{"current_steps": 6685, "total_steps": 7494, "loss": 0.6335, "lr": 5.276027690915868e-06, "epoch": 1.7840939418201227, "percentage": 89.2, "elapsed_time": "3:42:37", "remaining_time": "0:26:56"} +{"current_steps": 6690, "total_steps": 7494, "loss": 0.6329, "lr": 5.211855388018282e-06, "epoch": 1.7854283426741393, "percentage": 89.27, "elapsed_time": "3:43:28", "remaining_time": "0:26:51"} +{"current_steps": 6695, "total_steps": 7494, "loss": 0.6356, "lr": 5.148061689895519e-06, "epoch": 1.786762743528156, "percentage": 89.34, "elapsed_time": "3:44:00", "remaining_time": "0:26:44"} +{"current_steps": 6700, "total_steps": 7494, "loss": 0.6149, "lr": 5.084646942632123e-06, "epoch": 1.7880971443821725, "percentage": 89.4, "elapsed_time": "3:44:27", "remaining_time": "0:26:35"} +{"current_steps": 6705, "total_steps": 7494, "loss": 0.6165, "lr": 5.0216114902567995e-06, "epoch": 1.789431545236189, "percentage": 89.47, "elapsed_time": "3:45:12", "remaining_time": "0:26:30"} +{"current_steps": 6710, "total_steps": 7494, "loss": 0.6132, "lr": 4.9589556747406e-06, "epoch": 1.7907659460902055, "percentage": 89.54, "elapsed_time": "3:46:03", "remaining_time": "0:26:24"} +{"current_steps": 6715, "total_steps": 7494, "loss": 0.6083, "lr": 4.896679835994965e-06, "epoch": 1.792100346944222, "percentage": 89.61, "elapsed_time": "3:46:33", "remaining_time": "0:26:17"} +{"current_steps": 6720, "total_steps": 7494, "loss": 0.606, "lr": 4.834784311869985e-06, "epoch": 1.7934347477982386, "percentage": 89.67, "elapsed_time": "3:47:00", "remaining_time": "0:26:08"} +{"current_steps": 6725, "total_steps": 7494, "loss": 0.6313, "lr": 4.773269438152516e-06, "epoch": 1.794769148652255, "percentage": 89.74, "elapsed_time": "3:47:41", "remaining_time": "0:26:02"} +{"current_steps": 6730, "total_steps": 7494, "loss": 0.6032, "lr": 4.712135548564333e-06, "epoch": 1.7961035495062716, "percentage": 89.81, "elapsed_time": "3:48:29", "remaining_time": "0:25:56"} +{"current_steps": 6735, "total_steps": 7494, "loss": 0.6265, "lr": 4.651382974760382e-06, "epoch": 1.7974379503602882, "percentage": 89.87, "elapsed_time": "3:48:59", "remaining_time": "0:25:48"} +{"current_steps": 6740, "total_steps": 7494, "loss": 0.6138, "lr": 4.591012046326944e-06, "epoch": 1.7987723512143048, "percentage": 89.94, "elapsed_time": "3:49:26", "remaining_time": "0:25:40"} +{"current_steps": 6745, "total_steps": 7494, "loss": 0.6212, "lr": 4.5310230907798285e-06, "epoch": 1.8001067520683214, "percentage": 90.01, "elapsed_time": "3:50:11", "remaining_time": "0:25:33"} +{"current_steps": 6750, "total_steps": 7494, "loss": 0.6148, "lr": 4.471416433562638e-06, "epoch": 1.801441152922338, "percentage": 90.07, "elapsed_time": "3:50:55", "remaining_time": "0:25:27"} +{"current_steps": 6755, "total_steps": 7494, "loss": 0.611, "lr": 4.412192398044997e-06, "epoch": 1.8027755537763546, "percentage": 90.14, "elapsed_time": "3:51:23", "remaining_time": "0:25:18"} +{"current_steps": 6760, "total_steps": 7494, "loss": 0.6223, "lr": 4.353351305520747e-06, "epoch": 1.804109954630371, "percentage": 90.21, "elapsed_time": "3:51:51", "remaining_time": "0:25:10"} +{"current_steps": 6765, "total_steps": 7494, "loss": 0.6358, "lr": 4.2948934752062655e-06, "epoch": 1.8054443554843875, "percentage": 90.27, "elapsed_time": "3:52:37", "remaining_time": "0:25:04"} +{"current_steps": 6770, "total_steps": 7494, "loss": 0.627, "lr": 4.2368192242387355e-06, "epoch": 1.806778756338404, "percentage": 90.34, "elapsed_time": "3:53:21", "remaining_time": "0:24:57"} +{"current_steps": 6775, "total_steps": 7494, "loss": 0.6016, "lr": 4.179128867674348e-06, "epoch": 1.8081131571924205, "percentage": 90.41, "elapsed_time": "3:53:47", "remaining_time": "0:24:48"} +{"current_steps": 6780, "total_steps": 7494, "loss": 0.6237, "lr": 4.121822718486664e-06, "epoch": 1.809447558046437, "percentage": 90.47, "elapsed_time": "3:54:15", "remaining_time": "0:24:40"} +{"current_steps": 6785, "total_steps": 7494, "loss": 0.6359, "lr": 4.064901087564918e-06, "epoch": 1.8107819589004537, "percentage": 90.54, "elapsed_time": "3:55:06", "remaining_time": "0:24:34"} +{"current_steps": 6790, "total_steps": 7494, "loss": 0.6049, "lr": 4.008364283712298e-06, "epoch": 1.8121163597544703, "percentage": 90.61, "elapsed_time": "3:55:46", "remaining_time": "0:24:26"} +{"current_steps": 6795, "total_steps": 7494, "loss": 0.613, "lr": 3.9522126136442515e-06, "epoch": 1.8134507606084869, "percentage": 90.67, "elapsed_time": "3:56:13", "remaining_time": "0:24:17"} +{"current_steps": 6800, "total_steps": 7494, "loss": 0.6174, "lr": 3.896446381986901e-06, "epoch": 1.8147851614625035, "percentage": 90.74, "elapsed_time": "3:56:44", "remaining_time": "0:24:09"} +{"current_steps": 6805, "total_steps": 7494, "loss": 0.6106, "lr": 3.841065891275328e-06, "epoch": 1.8161195623165198, "percentage": 90.81, "elapsed_time": "3:57:41", "remaining_time": "0:24:03"} +{"current_steps": 6810, "total_steps": 7494, "loss": 0.6003, "lr": 3.786071441951918e-06, "epoch": 1.8174539631705364, "percentage": 90.87, "elapsed_time": "3:58:19", "remaining_time": "0:23:56"} +{"current_steps": 6815, "total_steps": 7494, "loss": 0.6287, "lr": 3.7314633323647952e-06, "epoch": 1.818788364024553, "percentage": 90.94, "elapsed_time": "3:58:45", "remaining_time": "0:23:47"} +{"current_steps": 6820, "total_steps": 7494, "loss": 0.6185, "lr": 3.6772418587661474e-06, "epoch": 1.8201227648785694, "percentage": 91.01, "elapsed_time": "3:59:17", "remaining_time": "0:23:38"} +{"current_steps": 6825, "total_steps": 7494, "loss": 0.6392, "lr": 3.623407315310667e-06, "epoch": 1.821457165732586, "percentage": 91.07, "elapsed_time": "4:00:08", "remaining_time": "0:23:32"} +{"current_steps": 6830, "total_steps": 7494, "loss": 0.622, "lr": 3.5699599940538836e-06, "epoch": 1.8227915665866026, "percentage": 91.14, "elapsed_time": "4:00:44", "remaining_time": "0:23:24"} +{"current_steps": 6835, "total_steps": 7494, "loss": 0.6443, "lr": 3.5169001849506496e-06, "epoch": 1.8241259674406192, "percentage": 91.21, "elapsed_time": "4:01:10", "remaining_time": "0:23:15"} +{"current_steps": 6840, "total_steps": 7494, "loss": 0.6246, "lr": 3.4642281758535645e-06, "epoch": 1.8254603682946358, "percentage": 91.27, "elapsed_time": "4:01:45", "remaining_time": "0:23:06"} +{"current_steps": 6845, "total_steps": 7494, "loss": 0.6236, "lr": 3.4119442525113283e-06, "epoch": 1.8267947691486524, "percentage": 91.34, "elapsed_time": "4:02:34", "remaining_time": "0:22:59"} +{"current_steps": 6850, "total_steps": 7494, "loss": 0.6147, "lr": 3.3600486985673163e-06, "epoch": 1.828129170002669, "percentage": 91.41, "elapsed_time": "4:03:08", "remaining_time": "0:22:51"} +{"current_steps": 6855, "total_steps": 7494, "loss": 0.6244, "lr": 3.308541795557948e-06, "epoch": 1.8294635708566853, "percentage": 91.47, "elapsed_time": "4:03:34", "remaining_time": "0:22:42"} +{"current_steps": 6860, "total_steps": 7494, "loss": 0.6201, "lr": 3.2574238229111704e-06, "epoch": 1.830797971710702, "percentage": 91.54, "elapsed_time": "4:04:09", "remaining_time": "0:22:33"} +{"current_steps": 6865, "total_steps": 7494, "loss": 0.6118, "lr": 3.2066950579450024e-06, "epoch": 1.8321323725647183, "percentage": 91.61, "elapsed_time": "4:04:58", "remaining_time": "0:22:26"} +{"current_steps": 6870, "total_steps": 7494, "loss": 0.6076, "lr": 3.156355775865968e-06, "epoch": 1.8334667734187349, "percentage": 91.67, "elapsed_time": "4:05:30", "remaining_time": "0:22:17"} +{"current_steps": 6875, "total_steps": 7494, "loss": 0.6107, "lr": 3.106406249767607e-06, "epoch": 1.8348011742727515, "percentage": 91.74, "elapsed_time": "4:05:56", "remaining_time": "0:22:08"} +{"current_steps": 6880, "total_steps": 7494, "loss": 0.6327, "lr": 3.056846750629041e-06, "epoch": 1.836135575126768, "percentage": 91.81, "elapsed_time": "4:06:35", "remaining_time": "0:22:00"} +{"current_steps": 6885, "total_steps": 7494, "loss": 0.6252, "lr": 3.007677547313436e-06, "epoch": 1.8374699759807847, "percentage": 91.87, "elapsed_time": "4:07:27", "remaining_time": "0:21:53"} +{"current_steps": 6890, "total_steps": 7494, "loss": 0.6258, "lr": 2.958898906566626e-06, "epoch": 1.8388043768348012, "percentage": 91.94, "elapsed_time": "4:07:57", "remaining_time": "0:21:44"} +{"current_steps": 6895, "total_steps": 7494, "loss": 0.6283, "lr": 2.910511093015588e-06, "epoch": 1.8401387776888178, "percentage": 92.01, "elapsed_time": "4:08:24", "remaining_time": "0:21:34"} +{"current_steps": 6900, "total_steps": 7494, "loss": 0.6164, "lr": 2.8625143691670404e-06, "epoch": 1.8414731785428344, "percentage": 92.07, "elapsed_time": "4:09:04", "remaining_time": "0:21:26"} +{"current_steps": 6905, "total_steps": 7494, "loss": 0.6141, "lr": 2.8149089954060287e-06, "epoch": 1.8428075793968508, "percentage": 92.14, "elapsed_time": "4:10:02", "remaining_time": "0:21:19"} +{"current_steps": 6910, "total_steps": 7494, "loss": 0.6416, "lr": 2.767695229994507e-06, "epoch": 1.8441419802508674, "percentage": 92.21, "elapsed_time": "4:10:30", "remaining_time": "0:21:10"} +{"current_steps": 6915, "total_steps": 7494, "loss": 0.6183, "lr": 2.720873329069895e-06, "epoch": 1.8454763811048838, "percentage": 92.27, "elapsed_time": "4:10:58", "remaining_time": "0:21:00"} +{"current_steps": 6920, "total_steps": 7494, "loss": 0.6195, "lr": 2.6744435466437535e-06, "epoch": 1.8468107819589004, "percentage": 92.34, "elapsed_time": "4:11:43", "remaining_time": "0:20:52"} +{"current_steps": 6925, "total_steps": 7494, "loss": 0.6177, "lr": 2.6284061346004055e-06, "epoch": 1.848145182812917, "percentage": 92.41, "elapsed_time": "4:12:29", "remaining_time": "0:20:44"} +{"current_steps": 6930, "total_steps": 7494, "loss": 0.6256, "lr": 2.5827613426954664e-06, "epoch": 1.8494795836669335, "percentage": 92.47, "elapsed_time": "4:12:57", "remaining_time": "0:20:35"} +{"current_steps": 6935, "total_steps": 7494, "loss": 0.6215, "lr": 2.537509418554631e-06, "epoch": 1.8508139845209501, "percentage": 92.54, "elapsed_time": "4:13:26", "remaining_time": "0:20:25"} +{"current_steps": 6940, "total_steps": 7494, "loss": 0.6288, "lr": 2.4926506076722417e-06, "epoch": 1.8521483853749667, "percentage": 92.61, "elapsed_time": "4:14:12", "remaining_time": "0:20:17"} +{"current_steps": 6945, "total_steps": 7494, "loss": 0.6151, "lr": 2.4481851534099707e-06, "epoch": 1.8534827862289833, "percentage": 92.67, "elapsed_time": "4:14:55", "remaining_time": "0:20:09"} +{"current_steps": 6950, "total_steps": 7494, "loss": 0.6321, "lr": 2.404113296995505e-06, "epoch": 1.8548171870829997, "percentage": 92.74, "elapsed_time": "4:15:23", "remaining_time": "0:19:59"} +{"current_steps": 6955, "total_steps": 7494, "loss": 0.6201, "lr": 2.360435277521275e-06, "epoch": 1.8561515879370163, "percentage": 92.81, "elapsed_time": "4:15:52", "remaining_time": "0:19:49"} +{"current_steps": 6960, "total_steps": 7494, "loss": 0.6346, "lr": 2.3171513319430596e-06, "epoch": 1.8574859887910327, "percentage": 92.87, "elapsed_time": "4:16:39", "remaining_time": "0:19:41"} +{"current_steps": 6965, "total_steps": 7494, "loss": 0.6268, "lr": 2.274261695078841e-06, "epoch": 1.8588203896450493, "percentage": 92.94, "elapsed_time": "4:17:20", "remaining_time": "0:19:32"} +{"current_steps": 6970, "total_steps": 7494, "loss": 0.5995, "lr": 2.231766599607371e-06, "epoch": 1.8601547904990658, "percentage": 93.01, "elapsed_time": "4:17:47", "remaining_time": "0:19:22"} +{"current_steps": 6975, "total_steps": 7494, "loss": 0.621, "lr": 2.1896662760670618e-06, "epoch": 1.8614891913530824, "percentage": 93.07, "elapsed_time": "4:18:20", "remaining_time": "0:19:13"} +{"current_steps": 6980, "total_steps": 7494, "loss": 0.6248, "lr": 2.1479609528546328e-06, "epoch": 1.862823592207099, "percentage": 93.14, "elapsed_time": "4:19:07", "remaining_time": "0:19:04"} +{"current_steps": 6985, "total_steps": 7494, "loss": 0.6274, "lr": 2.106650856223899e-06, "epoch": 1.8641579930611156, "percentage": 93.21, "elapsed_time": "4:19:43", "remaining_time": "0:18:55"} +{"current_steps": 6990, "total_steps": 7494, "loss": 0.6138, "lr": 2.0657362102845576e-06, "epoch": 1.8654923939151322, "percentage": 93.27, "elapsed_time": "4:20:10", "remaining_time": "0:18:45"} +{"current_steps": 6995, "total_steps": 7494, "loss": 0.6018, "lr": 2.0252172370009646e-06, "epoch": 1.8668267947691488, "percentage": 93.34, "elapsed_time": "4:20:43", "remaining_time": "0:18:35"} +{"current_steps": 7000, "total_steps": 7494, "loss": 0.6345, "lr": 1.985094156190925e-06, "epoch": 1.8681611956231652, "percentage": 93.41, "elapsed_time": "4:21:31", "remaining_time": "0:18:27"} +{"current_steps": 7005, "total_steps": 7494, "loss": 0.6211, "lr": 1.9453671855244963e-06, "epoch": 1.8694955964771818, "percentage": 93.47, "elapsed_time": "4:22:17", "remaining_time": "0:18:18"} +{"current_steps": 7010, "total_steps": 7494, "loss": 0.6272, "lr": 1.906036540522829e-06, "epoch": 1.8708299973311981, "percentage": 93.54, "elapsed_time": "4:22:44", "remaining_time": "0:18:08"} +{"current_steps": 7015, "total_steps": 7494, "loss": 0.6295, "lr": 1.8671024345569773e-06, "epoch": 1.8721643981852147, "percentage": 93.61, "elapsed_time": "4:23:18", "remaining_time": "0:17:58"} +{"current_steps": 7020, "total_steps": 7494, "loss": 0.6117, "lr": 1.8285650788467415e-06, "epoch": 1.8734987990392313, "percentage": 93.67, "elapsed_time": "4:24:05", "remaining_time": "0:17:49"} +{"current_steps": 7025, "total_steps": 7494, "loss": 0.621, "lr": 1.7904246824595514e-06, "epoch": 1.874833199893248, "percentage": 93.74, "elapsed_time": "4:24:40", "remaining_time": "0:17:40"} +{"current_steps": 7030, "total_steps": 7494, "loss": 0.634, "lr": 1.7526814523092763e-06, "epoch": 1.8761676007472645, "percentage": 93.81, "elapsed_time": "4:25:07", "remaining_time": "0:17:29"} +{"current_steps": 7035, "total_steps": 7494, "loss": 0.6462, "lr": 1.7153355931551592e-06, "epoch": 1.8775020016012811, "percentage": 93.88, "elapsed_time": "4:25:44", "remaining_time": "0:17:20"} +{"current_steps": 7040, "total_steps": 7494, "loss": 0.6337, "lr": 1.678387307600676e-06, "epoch": 1.8788364024552977, "percentage": 93.94, "elapsed_time": "4:26:34", "remaining_time": "0:17:11"} +{"current_steps": 7045, "total_steps": 7494, "loss": 0.6135, "lr": 1.6418367960924271e-06, "epoch": 1.880170803309314, "percentage": 94.01, "elapsed_time": "4:27:06", "remaining_time": "0:17:01"} +{"current_steps": 7050, "total_steps": 7494, "loss": 0.6217, "lr": 1.6056842569190987e-06, "epoch": 1.8815052041633307, "percentage": 94.08, "elapsed_time": "4:27:33", "remaining_time": "0:16:51"} +{"current_steps": 7055, "total_steps": 7494, "loss": 0.6179, "lr": 1.5699298862103276e-06, "epoch": 1.8828396050173473, "percentage": 94.14, "elapsed_time": "4:28:12", "remaining_time": "0:16:41"} +{"current_steps": 7060, "total_steps": 7494, "loss": 0.6301, "lr": 1.5345738779356714e-06, "epoch": 1.8841740058713636, "percentage": 94.21, "elapsed_time": "4:29:01", "remaining_time": "0:16:32"} +{"current_steps": 7065, "total_steps": 7494, "loss": 0.6039, "lr": 1.4996164239035408e-06, "epoch": 1.8855084067253802, "percentage": 94.28, "elapsed_time": "4:29:32", "remaining_time": "0:16:22"} +{"current_steps": 7070, "total_steps": 7494, "loss": 0.6246, "lr": 1.4650577137601843e-06, "epoch": 1.8868428075793968, "percentage": 94.34, "elapsed_time": "4:29:58", "remaining_time": "0:16:11"} +{"current_steps": 7075, "total_steps": 7494, "loss": 0.6202, "lr": 1.4308979349886146e-06, "epoch": 1.8881772084334134, "percentage": 94.41, "elapsed_time": "4:30:39", "remaining_time": "0:16:01"} +{"current_steps": 7080, "total_steps": 7494, "loss": 0.6312, "lr": 1.3971372729076503e-06, "epoch": 1.88951160928743, "percentage": 94.48, "elapsed_time": "4:31:28", "remaining_time": "0:15:52"} +{"current_steps": 7085, "total_steps": 7494, "loss": 0.6266, "lr": 1.3637759106708501e-06, "epoch": 1.8908460101414466, "percentage": 94.54, "elapsed_time": "4:31:57", "remaining_time": "0:15:41"} +{"current_steps": 7090, "total_steps": 7494, "loss": 0.608, "lr": 1.3308140292655645e-06, "epoch": 1.8921804109954632, "percentage": 94.61, "elapsed_time": "4:32:23", "remaining_time": "0:15:31"} +{"current_steps": 7095, "total_steps": 7494, "loss": 0.6046, "lr": 1.2982518075119352e-06, "epoch": 1.8935148118494796, "percentage": 94.68, "elapsed_time": "4:33:08", "remaining_time": "0:15:21"} +{"current_steps": 7100, "total_steps": 7494, "loss": 0.625, "lr": 1.2660894220619139e-06, "epoch": 1.8948492127034962, "percentage": 94.74, "elapsed_time": "4:33:54", "remaining_time": "0:15:12"} +{"current_steps": 7105, "total_steps": 7494, "loss": 0.6265, "lr": 1.2343270473983286e-06, "epoch": 1.8961836135575125, "percentage": 94.81, "elapsed_time": "4:34:31", "remaining_time": "0:15:01"} +{"current_steps": 7110, "total_steps": 7494, "loss": 0.6133, "lr": 1.202964855833935e-06, "epoch": 1.8975180144115291, "percentage": 94.88, "elapsed_time": "4:34:58", "remaining_time": "0:14:51"} +{"current_steps": 7115, "total_steps": 7494, "loss": 0.6281, "lr": 1.1720030175104506e-06, "epoch": 1.8988524152655457, "percentage": 94.94, "elapsed_time": "4:35:40", "remaining_time": "0:14:41"} +{"current_steps": 7120, "total_steps": 7494, "loss": 0.6074, "lr": 1.1414417003976634e-06, "epoch": 1.9001868161195623, "percentage": 95.01, "elapsed_time": "4:36:26", "remaining_time": "0:14:31"} +{"current_steps": 7125, "total_steps": 7494, "loss": 0.6139, "lr": 1.1112810702925163e-06, "epoch": 1.901521216973579, "percentage": 95.08, "elapsed_time": "4:36:53", "remaining_time": "0:14:20"} +{"current_steps": 7130, "total_steps": 7494, "loss": 0.6133, "lr": 1.0815212908181825e-06, "epoch": 1.9028556178275955, "percentage": 95.14, "elapsed_time": "4:37:22", "remaining_time": "0:14:09"} +{"current_steps": 7135, "total_steps": 7494, "loss": 0.624, "lr": 1.0521625234232333e-06, "epoch": 1.904190018681612, "percentage": 95.21, "elapsed_time": "4:38:09", "remaining_time": "0:13:59"} +{"current_steps": 7140, "total_steps": 7494, "loss": 0.6309, "lr": 1.023204927380672e-06, "epoch": 1.9055244195356285, "percentage": 95.28, "elapsed_time": "4:38:51", "remaining_time": "0:13:49"} +{"current_steps": 7145, "total_steps": 7494, "loss": 0.6228, "lr": 9.946486597871672e-07, "epoch": 1.906858820389645, "percentage": 95.34, "elapsed_time": "4:39:18", "remaining_time": "0:13:38"} +{"current_steps": 7150, "total_steps": 7494, "loss": 0.6145, "lr": 9.664938755621632e-07, "epoch": 1.9081932212436616, "percentage": 95.41, "elapsed_time": "4:39:48", "remaining_time": "0:13:27"} +{"current_steps": 7155, "total_steps": 7494, "loss": 0.6189, "lr": 9.387407274469793e-07, "epoch": 1.909527622097678, "percentage": 95.48, "elapsed_time": "4:40:32", "remaining_time": "0:13:17"} +{"current_steps": 7160, "total_steps": 7494, "loss": 0.6156, "lr": 9.113893660041033e-07, "epoch": 1.9108620229516946, "percentage": 95.54, "elapsed_time": "4:41:14", "remaining_time": "0:13:07"} +{"current_steps": 7165, "total_steps": 7494, "loss": 0.6096, "lr": 8.844399396162577e-07, "epoch": 1.9121964238057112, "percentage": 95.61, "elapsed_time": "4:41:42", "remaining_time": "0:12:56"} +{"current_steps": 7170, "total_steps": 7494, "loss": 0.6296, "lr": 8.578925944856596e-07, "epoch": 1.9135308246597278, "percentage": 95.68, "elapsed_time": "4:42:13", "remaining_time": "0:12:45"} +{"current_steps": 7175, "total_steps": 7494, "loss": 0.6045, "lr": 8.317474746332126e-07, "epoch": 1.9148652255137444, "percentage": 95.74, "elapsed_time": "4:43:00", "remaining_time": "0:12:34"} +{"current_steps": 7180, "total_steps": 7494, "loss": 0.6247, "lr": 8.060047218977323e-07, "epoch": 1.916199626367761, "percentage": 95.81, "elapsed_time": "4:43:39", "remaining_time": "0:12:24"} +{"current_steps": 7185, "total_steps": 7494, "loss": 0.6215, "lr": 7.806644759351471e-07, "epoch": 1.9175340272217776, "percentage": 95.88, "elapsed_time": "4:44:06", "remaining_time": "0:12:13"} +{"current_steps": 7190, "total_steps": 7494, "loss": 0.6245, "lr": 7.557268742177908e-07, "epoch": 1.918868428075794, "percentage": 95.94, "elapsed_time": "4:44:38", "remaining_time": "0:12:02"} +{"current_steps": 7195, "total_steps": 7494, "loss": 0.6185, "lr": 7.311920520336106e-07, "epoch": 1.9202028289298105, "percentage": 96.01, "elapsed_time": "4:45:26", "remaining_time": "0:11:51"} +{"current_steps": 7200, "total_steps": 7494, "loss": 0.6197, "lr": 7.070601424854522e-07, "epoch": 1.921537229783827, "percentage": 96.08, "elapsed_time": "4:46:02", "remaining_time": "0:11:40"} +{"current_steps": 7205, "total_steps": 7494, "loss": 0.6259, "lr": 6.833312764903343e-07, "epoch": 1.9228716306378435, "percentage": 96.14, "elapsed_time": "4:46:38", "remaining_time": "0:11:29"} +{"current_steps": 7210, "total_steps": 7494, "loss": 0.6175, "lr": 6.600055827787581e-07, "epoch": 1.92420603149186, "percentage": 96.21, "elapsed_time": "4:47:32", "remaining_time": "0:11:19"} +{"current_steps": 7215, "total_steps": 7494, "loss": 0.643, "lr": 6.370831878939747e-07, "epoch": 1.9255404323458767, "percentage": 96.28, "elapsed_time": "4:48:19", "remaining_time": "0:11:08"} +{"current_steps": 7220, "total_steps": 7494, "loss": 0.6088, "lr": 6.1456421619131e-07, "epoch": 1.9268748331998933, "percentage": 96.34, "elapsed_time": "4:48:53", "remaining_time": "0:10:57"} +{"current_steps": 7225, "total_steps": 7494, "loss": 0.6182, "lr": 5.924487898375158e-07, "epoch": 1.9282092340539099, "percentage": 96.41, "elapsed_time": "4:49:20", "remaining_time": "0:10:46"} +{"current_steps": 7230, "total_steps": 7494, "loss": 0.6333, "lr": 5.707370288100782e-07, "epoch": 1.9295436349079265, "percentage": 96.48, "elapsed_time": "4:49:59", "remaining_time": "0:10:35"} +{"current_steps": 7235, "total_steps": 7494, "loss": 0.6345, "lr": 5.494290508965605e-07, "epoch": 1.9308780357619428, "percentage": 96.54, "elapsed_time": "4:50:46", "remaining_time": "0:10:24"} +{"current_steps": 7240, "total_steps": 7494, "loss": 0.6132, "lr": 5.285249716940026e-07, "epoch": 1.9322124366159594, "percentage": 96.61, "elapsed_time": "4:51:20", "remaining_time": "0:10:13"} +{"current_steps": 7245, "total_steps": 7494, "loss": 0.6271, "lr": 5.080249046082563e-07, "epoch": 1.933546837469976, "percentage": 96.68, "elapsed_time": "4:51:46", "remaining_time": "0:10:01"} +{"current_steps": 7250, "total_steps": 7494, "loss": 0.6356, "lr": 4.879289608533926e-07, "epoch": 1.9348812383239924, "percentage": 96.74, "elapsed_time": "4:52:25", "remaining_time": "0:09:50"} +{"current_steps": 7255, "total_steps": 7494, "loss": 0.6165, "lr": 4.6823724945107e-07, "epoch": 1.936215639178009, "percentage": 96.81, "elapsed_time": "4:53:15", "remaining_time": "0:09:39"} +{"current_steps": 7260, "total_steps": 7494, "loss": 0.6257, "lr": 4.489498772299843e-07, "epoch": 1.9375500400320256, "percentage": 96.88, "elapsed_time": "4:53:46", "remaining_time": "0:09:28"} +{"current_steps": 7265, "total_steps": 7494, "loss": 0.6217, "lr": 4.3006694882526947e-07, "epoch": 1.9388844408860422, "percentage": 96.94, "elapsed_time": "4:54:13", "remaining_time": "0:09:16"} +{"current_steps": 7270, "total_steps": 7494, "loss": 0.622, "lr": 4.115885666779062e-07, "epoch": 1.9402188417400588, "percentage": 97.01, "elapsed_time": "4:54:56", "remaining_time": "0:09:05"} +{"current_steps": 7275, "total_steps": 7494, "loss": 0.6098, "lr": 3.9351483103420566e-07, "epoch": 1.9415532425940754, "percentage": 97.08, "elapsed_time": "4:55:42", "remaining_time": "0:08:54"} +{"current_steps": 7280, "total_steps": 7494, "loss": 0.6148, "lr": 3.758458399452519e-07, "epoch": 1.942887643448092, "percentage": 97.14, "elapsed_time": "4:56:12", "remaining_time": "0:08:42"} +{"current_steps": 7285, "total_steps": 7494, "loss": 0.616, "lr": 3.585816892663351e-07, "epoch": 1.9442220443021083, "percentage": 97.21, "elapsed_time": "4:56:39", "remaining_time": "0:08:30"} +{"current_steps": 7290, "total_steps": 7494, "loss": 0.6255, "lr": 3.4172247265650267e-07, "epoch": 1.945556445156125, "percentage": 97.28, "elapsed_time": "4:57:22", "remaining_time": "0:08:19"} +{"current_steps": 7295, "total_steps": 7494, "loss": 0.6279, "lr": 3.252682815779922e-07, "epoch": 1.9468908460101413, "percentage": 97.34, "elapsed_time": "4:58:08", "remaining_time": "0:08:07"} +{"current_steps": 7300, "total_steps": 7494, "loss": 0.6279, "lr": 3.0921920529574096e-07, "epoch": 1.9482252468641579, "percentage": 97.41, "elapsed_time": "4:58:37", "remaining_time": "0:07:56"} +{"current_steps": 7305, "total_steps": 7494, "loss": 0.6201, "lr": 2.9357533087694397e-07, "epoch": 1.9495596477181745, "percentage": 97.48, "elapsed_time": "4:59:15", "remaining_time": "0:07:44"} +{"current_steps": 7310, "total_steps": 7494, "loss": 0.6179, "lr": 2.7833674319052977e-07, "epoch": 1.950894048572191, "percentage": 97.54, "elapsed_time": "5:00:02", "remaining_time": "0:07:33"} +{"current_steps": 7315, "total_steps": 7494, "loss": 0.6222, "lr": 2.6350352490672746e-07, "epoch": 1.9522284494262077, "percentage": 97.61, "elapsed_time": "5:00:46", "remaining_time": "0:07:21"} +{"current_steps": 7320, "total_steps": 7494, "loss": 0.62, "lr": 2.49075756496625e-07, "epoch": 1.9535628502802243, "percentage": 97.68, "elapsed_time": "5:01:13", "remaining_time": "0:07:09"} +{"current_steps": 7325, "total_steps": 7494, "loss": 0.6365, "lr": 2.3505351623170353e-07, "epoch": 1.9548972511342408, "percentage": 97.74, "elapsed_time": "5:01:44", "remaining_time": "0:06:57"} +{"current_steps": 7330, "total_steps": 7494, "loss": 0.6376, "lr": 2.2143688018343707e-07, "epoch": 1.9562316519882574, "percentage": 97.81, "elapsed_time": "5:02:30", "remaining_time": "0:06:46"} +{"current_steps": 7335, "total_steps": 7494, "loss": 0.6263, "lr": 2.0822592222287659e-07, "epoch": 1.9575660528422738, "percentage": 97.88, "elapsed_time": "5:03:14", "remaining_time": "0:06:34"} +{"current_steps": 7340, "total_steps": 7494, "loss": 0.608, "lr": 1.9542071402024185e-07, "epoch": 1.9589004536962904, "percentage": 97.95, "elapsed_time": "5:03:42", "remaining_time": "0:06:22"} +{"current_steps": 7345, "total_steps": 7494, "loss": 0.6066, "lr": 1.830213250445467e-07, "epoch": 1.9602348545503068, "percentage": 98.01, "elapsed_time": "5:04:14", "remaining_time": "0:06:10"} +{"current_steps": 7350, "total_steps": 7494, "loss": 0.637, "lr": 1.7102782256319115e-07, "epoch": 1.9615692554043234, "percentage": 98.08, "elapsed_time": "5:04:58", "remaining_time": "0:05:58"} +{"current_steps": 7355, "total_steps": 7494, "loss": 0.6364, "lr": 1.5944027164163652e-07, "epoch": 1.96290365625834, "percentage": 98.15, "elapsed_time": "5:05:39", "remaining_time": "0:05:46"} +{"current_steps": 7360, "total_steps": 7494, "loss": 0.6258, "lr": 1.4825873514302257e-07, "epoch": 1.9642380571123566, "percentage": 98.21, "elapsed_time": "5:06:07", "remaining_time": "0:05:34"} +{"current_steps": 7365, "total_steps": 7494, "loss": 0.6263, "lr": 1.3748327372784252e-07, "epoch": 1.9655724579663731, "percentage": 98.28, "elapsed_time": "5:06:40", "remaining_time": "0:05:22"} +{"current_steps": 7370, "total_steps": 7494, "loss": 0.6221, "lr": 1.271139458536019e-07, "epoch": 1.9669068588203897, "percentage": 98.35, "elapsed_time": "5:07:25", "remaining_time": "0:05:10"} +{"current_steps": 7375, "total_steps": 7494, "loss": 0.6198, "lr": 1.1715080777451868e-07, "epoch": 1.9682412596744063, "percentage": 98.41, "elapsed_time": "5:08:03", "remaining_time": "0:04:58"} +{"current_steps": 7380, "total_steps": 7494, "loss": 0.6166, "lr": 1.0759391354119017e-07, "epoch": 1.9695756605284227, "percentage": 98.48, "elapsed_time": "5:08:30", "remaining_time": "0:04:45"} +{"current_steps": 7385, "total_steps": 7494, "loss": 0.6259, "lr": 9.844331500034331e-08, "epoch": 1.9709100613824393, "percentage": 98.55, "elapsed_time": "5:09:04", "remaining_time": "0:04:33"} +{"current_steps": 7390, "total_steps": 7494, "loss": 0.639, "lr": 8.969906179449316e-08, "epoch": 1.9722444622364559, "percentage": 98.61, "elapsed_time": "5:09:51", "remaining_time": "0:04:21"} +{"current_steps": 7395, "total_steps": 7494, "loss": 0.6347, "lr": 8.136120136174318e-08, "epoch": 1.9735788630904723, "percentage": 98.68, "elapsed_time": "5:10:26", "remaining_time": "0:04:09"} +{"current_steps": 7400, "total_steps": 7494, "loss": 0.6383, "lr": 7.342977893546875e-08, "epoch": 1.9749132639444889, "percentage": 98.75, "elapsed_time": "5:10:53", "remaining_time": "0:03:56"} +{"current_steps": 7405, "total_steps": 7494, "loss": 0.6017, "lr": 6.590483754409237e-08, "epoch": 1.9762476647985054, "percentage": 98.81, "elapsed_time": "5:11:38", "remaining_time": "0:03:44"} +{"current_steps": 7410, "total_steps": 7494, "loss": 0.6188, "lr": 5.878641801087547e-08, "epoch": 1.977582065652522, "percentage": 98.88, "elapsed_time": "5:12:26", "remaining_time": "0:03:32"} +{"current_steps": 7415, "total_steps": 7494, "loss": 0.6206, "lr": 5.207455895365198e-08, "epoch": 1.9789164665065386, "percentage": 98.95, "elapsed_time": "5:13:00", "remaining_time": "0:03:20"} +{"current_steps": 7420, "total_steps": 7494, "loss": 0.626, "lr": 4.5769296784653463e-08, "epoch": 1.9802508673605552, "percentage": 99.01, "elapsed_time": "5:13:28", "remaining_time": "0:03:07"} +{"current_steps": 7425, "total_steps": 7494, "loss": 0.6286, "lr": 3.9870665710300954e-08, "epoch": 1.9815852682145718, "percentage": 99.08, "elapsed_time": "5:14:04", "remaining_time": "0:02:55"} +{"current_steps": 7430, "total_steps": 7494, "loss": 0.6227, "lr": 3.437869773101343e-08, "epoch": 1.9829196690685882, "percentage": 99.15, "elapsed_time": "5:14:51", "remaining_time": "0:02:42"} +{"current_steps": 7435, "total_steps": 7494, "loss": 0.6079, "lr": 2.929342264103296e-08, "epoch": 1.9842540699226048, "percentage": 99.21, "elapsed_time": "5:15:26", "remaining_time": "0:02:30"} +{"current_steps": 7440, "total_steps": 7494, "loss": 0.6155, "lr": 2.4614868028274837e-08, "epoch": 1.9855884707766212, "percentage": 99.28, "elapsed_time": "5:16:16", "remaining_time": "0:02:17"} +{"current_steps": 7445, "total_steps": 7494, "loss": 0.6142, "lr": 2.034305927416935e-08, "epoch": 1.9869228716306377, "percentage": 99.35, "elapsed_time": "5:16:55", "remaining_time": "0:02:05"} +{"current_steps": 7450, "total_steps": 7494, "loss": 0.6058, "lr": 1.647801955354522e-08, "epoch": 1.9882572724846543, "percentage": 99.41, "elapsed_time": "5:17:41", "remaining_time": "0:01:52"} +{"current_steps": 7455, "total_steps": 7494, "loss": 0.6146, "lr": 1.301976983445474e-08, "epoch": 1.989591673338671, "percentage": 99.48, "elapsed_time": "5:18:13", "remaining_time": "0:01:39"} +{"current_steps": 7460, "total_steps": 7494, "loss": 0.6428, "lr": 9.968328878115495e-09, "epoch": 1.9909260741926875, "percentage": 99.55, "elapsed_time": "5:18:40", "remaining_time": "0:01:27"} +{"current_steps": 7465, "total_steps": 7494, "loss": 0.6364, "lr": 7.3237132387604646e-09, "epoch": 1.9922604750467041, "percentage": 99.61, "elapsed_time": "5:19:20", "remaining_time": "0:01:14"} +{"current_steps": 7470, "total_steps": 7494, "loss": 0.6105, "lr": 5.0859372635964065e-09, "epoch": 1.9935948759007207, "percentage": 99.68, "elapsed_time": "5:20:06", "remaining_time": "0:01:01"} +{"current_steps": 7475, "total_steps": 7494, "loss": 0.6222, "lr": 3.2550130926789487e-09, "epoch": 1.994929276754737, "percentage": 99.75, "elapsed_time": "5:20:36", "remaining_time": "0:00:48"} +{"current_steps": 7480, "total_steps": 7494, "loss": 0.6224, "lr": 1.8309506588959356e-09, "epoch": 1.9962636776087537, "percentage": 99.81, "elapsed_time": "5:21:04", "remaining_time": "0:00:36"} +{"current_steps": 7485, "total_steps": 7494, "loss": 0.6412, "lr": 8.137576878508578e-10, "epoch": 1.9975980784627703, "percentage": 99.88, "elapsed_time": "5:21:46", "remaining_time": "0:00:23"} +{"current_steps": 7490, "total_steps": 7494, "loss": 0.6171, "lr": 2.0343969787950387e-10, "epoch": 1.9989324793167866, "percentage": 99.95, "elapsed_time": "5:22:30", "remaining_time": "0:00:10"} +{"current_steps": 7494, "total_steps": 7494, "epoch": 2.0, "percentage": 100.0, "elapsed_time": "5:23:01", "remaining_time": "0:00:00"} diff --git a/trainer_state.json b/trainer_state.json new file mode 100644 index 0000000..da45106 --- /dev/null +++ b/trainer_state.json @@ -0,0 +1,16525 @@ +{ + "best_global_step": null, + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 2.0, + "eval_steps": 500, + "global_step": 7494, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.0013344008540165466, + "grad_norm": 1.5823220146867805, + "learning_rate": 7.999999999999999e-07, + "loss": 0.9535, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.9687002301216125, + "step": 5, + "valid_targets_mean": 16998.1, + "valid_targets_min": 545 + }, + { + "epoch": 0.0026688017080330933, + "grad_norm": 1.4613232796627884, + "learning_rate": 1.8e-06, + "loss": 0.9367, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.9529542326927185, + "step": 10, + "valid_targets_mean": 15522.0, + "valid_targets_min": 628 + }, + { + "epoch": 0.0040032025620496394, + "grad_norm": 0.9983532962437741, + "learning_rate": 2.8e-06, + "loss": 0.9145, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.9085040092468262, + "step": 15, + "valid_targets_mean": 16460.8, + "valid_targets_min": 716 + }, + { + "epoch": 0.0053376034160661865, + "grad_norm": 0.6838873648945817, + "learning_rate": 3.7999999999999996e-06, + "loss": 0.9386, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.9313464164733887, + "step": 20, + "valid_targets_mean": 15545.1, + "valid_targets_min": 608 + }, + { + "epoch": 0.006672004270082733, + "grad_norm": 0.692627322161273, + "learning_rate": 4.8e-06, + "loss": 0.8995, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.9295620322227478, + "step": 25, + "valid_targets_mean": 14973.8, + "valid_targets_min": 639 + }, + { + "epoch": 0.008006405124099279, + "grad_norm": 0.49043286997373386, + "learning_rate": 5.7999999999999995e-06, + "loss": 0.9114, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.8984705209732056, + "step": 30, + "valid_targets_mean": 16087.6, + "valid_targets_min": 569 + }, + { + "epoch": 0.009340805978115827, + "grad_norm": 0.3493870125757026, + "learning_rate": 6.8e-06, + "loss": 0.8679, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.863591730594635, + "step": 35, + "valid_targets_mean": 15901.3, + "valid_targets_min": 760 + }, + { + "epoch": 0.010675206832132373, + "grad_norm": 0.28005099953823187, + "learning_rate": 7.799999999999998e-06, + "loss": 0.8752, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.8416589498519897, + "step": 40, + "valid_targets_mean": 17096.1, + "valid_targets_min": 487 + }, + { + "epoch": 0.01200960768614892, + "grad_norm": 0.2633854430730848, + "learning_rate": 8.799999999999999e-06, + "loss": 0.8419, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.8102971315383911, + "step": 45, + "valid_targets_mean": 16528.9, + "valid_targets_min": 664 + }, + { + "epoch": 0.013344008540165465, + "grad_norm": 0.2416755355371708, + "learning_rate": 9.799999999999998e-06, + "loss": 0.8621, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.8548877239227295, + "step": 50, + "valid_targets_mean": 15770.2, + "valid_targets_min": 549 + }, + { + "epoch": 0.014678409394182012, + "grad_norm": 0.22742192850097903, + "learning_rate": 1.0799999999999998e-05, + "loss": 0.8292, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7773482799530029, + "step": 55, + "valid_targets_mean": 16897.5, + "valid_targets_min": 351 + }, + { + "epoch": 0.016012810248198558, + "grad_norm": 0.21185009825474607, + "learning_rate": 1.1799999999999999e-05, + "loss": 0.8224, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.8373425602912903, + "step": 60, + "valid_targets_mean": 15090.8, + "valid_targets_min": 695 + }, + { + "epoch": 0.017347211102215106, + "grad_norm": 0.16530947573341376, + "learning_rate": 1.2799999999999998e-05, + "loss": 0.8305, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.8192263841629028, + "step": 65, + "valid_targets_mean": 16723.2, + "valid_targets_min": 747 + }, + { + "epoch": 0.018681611956231654, + "grad_norm": 0.19595842220841034, + "learning_rate": 1.3799999999999998e-05, + "loss": 0.8164, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.8121230602264404, + "step": 70, + "valid_targets_mean": 15894.8, + "valid_targets_min": 85 + }, + { + "epoch": 0.020016012810248198, + "grad_norm": 0.14895354237962097, + "learning_rate": 1.4799999999999999e-05, + "loss": 0.7964, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7786427736282349, + "step": 75, + "valid_targets_mean": 16543.0, + "valid_targets_min": 375 + }, + { + "epoch": 0.021350413664264746, + "grad_norm": 0.1893637073683363, + "learning_rate": 1.5799999999999998e-05, + "loss": 0.7989, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.8141142129898071, + "step": 80, + "valid_targets_mean": 16467.3, + "valid_targets_min": 271 + }, + { + "epoch": 0.02268481451828129, + "grad_norm": 0.20064348676009006, + "learning_rate": 1.68e-05, + "loss": 0.7965, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7834018468856812, + "step": 85, + "valid_targets_mean": 15867.8, + "valid_targets_min": 566 + }, + { + "epoch": 0.02401921537229784, + "grad_norm": 0.1617554141425518, + "learning_rate": 1.78e-05, + "loss": 0.7926, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7742629051208496, + "step": 90, + "valid_targets_mean": 16098.4, + "valid_targets_min": 834 + }, + { + "epoch": 0.025353616226314386, + "grad_norm": 0.21091252121676837, + "learning_rate": 1.8799999999999996e-05, + "loss": 0.8009, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.8052405714988708, + "step": 95, + "valid_targets_mean": 16067.6, + "valid_targets_min": 517 + }, + { + "epoch": 0.02668801708033093, + "grad_norm": 0.24666835856193395, + "learning_rate": 1.98e-05, + "loss": 0.772, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7658431529998779, + "step": 100, + "valid_targets_mean": 15941.7, + "valid_targets_min": 568 + }, + { + "epoch": 0.02802241793434748, + "grad_norm": 0.23447043514026744, + "learning_rate": 2.0799999999999997e-05, + "loss": 0.7746, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7565805315971375, + "step": 105, + "valid_targets_mean": 16312.7, + "valid_targets_min": 771 + }, + { + "epoch": 0.029356818788364023, + "grad_norm": 0.20646522638524778, + "learning_rate": 2.1799999999999998e-05, + "loss": 0.7691, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7705087661743164, + "step": 110, + "valid_targets_mean": 17673.3, + "valid_targets_min": 408 + }, + { + "epoch": 0.03069121964238057, + "grad_norm": 0.2711537842641349, + "learning_rate": 2.28e-05, + "loss": 0.7771, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7970471382141113, + "step": 115, + "valid_targets_mean": 14606.4, + "valid_targets_min": 603 + }, + { + "epoch": 0.032025620496397116, + "grad_norm": 0.35503609213795806, + "learning_rate": 2.38e-05, + "loss": 0.7815, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.803318977355957, + "step": 120, + "valid_targets_mean": 15105.9, + "valid_targets_min": 360 + }, + { + "epoch": 0.03336002135041367, + "grad_norm": 0.2716354134035751, + "learning_rate": 2.4799999999999996e-05, + "loss": 0.7829, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.799247145652771, + "step": 125, + "valid_targets_mean": 16679.2, + "valid_targets_min": 360 + }, + { + "epoch": 0.03469442220443021, + "grad_norm": 0.3091732932839323, + "learning_rate": 2.5799999999999997e-05, + "loss": 0.7623, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7341678738594055, + "step": 130, + "valid_targets_mean": 16538.3, + "valid_targets_min": 426 + }, + { + "epoch": 0.036028823058446756, + "grad_norm": 0.2635427050582435, + "learning_rate": 2.6799999999999998e-05, + "loss": 0.7565, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7394607067108154, + "step": 135, + "valid_targets_mean": 16406.4, + "valid_targets_min": 688 + }, + { + "epoch": 0.03736322391246331, + "grad_norm": 0.3435518610097947, + "learning_rate": 2.7799999999999995e-05, + "loss": 0.7886, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.8229363560676575, + "step": 140, + "valid_targets_mean": 14519.3, + "valid_targets_min": 284 + }, + { + "epoch": 0.03869762476647985, + "grad_norm": 0.417362036919672, + "learning_rate": 2.88e-05, + "loss": 0.7753, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7946305871009827, + "step": 145, + "valid_targets_mean": 16715.3, + "valid_targets_min": 590 + }, + { + "epoch": 0.040032025620496396, + "grad_norm": 0.35755095831337047, + "learning_rate": 2.9799999999999996e-05, + "loss": 0.7661, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7696456909179688, + "step": 150, + "valid_targets_mean": 17409.9, + "valid_targets_min": 849 + }, + { + "epoch": 0.04136642647451294, + "grad_norm": 0.28011910125099576, + "learning_rate": 3.0799999999999996e-05, + "loss": 0.7708, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7648700475692749, + "step": 155, + "valid_targets_mean": 15438.4, + "valid_targets_min": 356 + }, + { + "epoch": 0.04270082732852949, + "grad_norm": 0.27045959495765237, + "learning_rate": 3.1799999999999994e-05, + "loss": 0.7601, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7666411399841309, + "step": 160, + "valid_targets_mean": 16994.8, + "valid_targets_min": 605 + }, + { + "epoch": 0.044035228182546036, + "grad_norm": 0.33884030644268365, + "learning_rate": 3.28e-05, + "loss": 0.7435, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7470793128013611, + "step": 165, + "valid_targets_mean": 16104.6, + "valid_targets_min": 619 + }, + { + "epoch": 0.04536962903656258, + "grad_norm": 0.3712406411051424, + "learning_rate": 3.3799999999999995e-05, + "loss": 0.7605, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7480790615081787, + "step": 170, + "valid_targets_mean": 16437.9, + "valid_targets_min": 409 + }, + { + "epoch": 0.04670402989057913, + "grad_norm": 0.3460176427784315, + "learning_rate": 3.48e-05, + "loss": 0.7376, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7141637206077576, + "step": 175, + "valid_targets_mean": 16461.9, + "valid_targets_min": 509 + }, + { + "epoch": 0.04803843074459568, + "grad_norm": 0.2596570804564528, + "learning_rate": 3.5799999999999996e-05, + "loss": 0.7759, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7451268434524536, + "step": 180, + "valid_targets_mean": 16862.6, + "valid_targets_min": 727 + }, + { + "epoch": 0.04937283159861222, + "grad_norm": 0.25687426933762886, + "learning_rate": 3.679999999999999e-05, + "loss": 0.7487, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7626557946205139, + "step": 185, + "valid_targets_mean": 16003.7, + "valid_targets_min": 846 + }, + { + "epoch": 0.05070723245262877, + "grad_norm": 0.22447007810160508, + "learning_rate": 3.78e-05, + "loss": 0.7693, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7929567098617554, + "step": 190, + "valid_targets_mean": 14926.7, + "valid_targets_min": 361 + }, + { + "epoch": 0.05204163330664532, + "grad_norm": 0.2391985466160003, + "learning_rate": 3.8799999999999994e-05, + "loss": 0.7515, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.742867112159729, + "step": 195, + "valid_targets_mean": 16102.4, + "valid_targets_min": 97 + }, + { + "epoch": 0.05337603416066186, + "grad_norm": 0.23295188871090147, + "learning_rate": 3.979999999999999e-05, + "loss": 0.751, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7330241203308105, + "step": 200, + "valid_targets_mean": 16928.9, + "valid_targets_min": 122 + }, + { + "epoch": 0.054710435014678406, + "grad_norm": 0.2883432188312913, + "learning_rate": 4.08e-05, + "loss": 0.7633, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7030720114707947, + "step": 205, + "valid_targets_mean": 16557.2, + "valid_targets_min": 537 + }, + { + "epoch": 0.05604483586869496, + "grad_norm": 0.2810220148951038, + "learning_rate": 4.18e-05, + "loss": 0.7607, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7284795045852661, + "step": 210, + "valid_targets_mean": 15676.2, + "valid_targets_min": 713 + }, + { + "epoch": 0.0573792367227115, + "grad_norm": 0.44105767232030274, + "learning_rate": 4.28e-05, + "loss": 0.7494, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6875466108322144, + "step": 215, + "valid_targets_mean": 16369.6, + "valid_targets_min": 546 + }, + { + "epoch": 0.058713637576728046, + "grad_norm": 0.31069975408639855, + "learning_rate": 4.3799999999999994e-05, + "loss": 0.7532, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7670011520385742, + "step": 220, + "valid_targets_mean": 16207.9, + "valid_targets_min": 785 + }, + { + "epoch": 0.0600480384307446, + "grad_norm": 0.38918464319312723, + "learning_rate": 4.48e-05, + "loss": 0.7452, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7355377674102783, + "step": 225, + "valid_targets_mean": 16136.9, + "valid_targets_min": 741 + }, + { + "epoch": 0.06138243928476114, + "grad_norm": 0.39130577028120467, + "learning_rate": 4.5799999999999995e-05, + "loss": 0.7659, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7933982610702515, + "step": 230, + "valid_targets_mean": 14762.8, + "valid_targets_min": 425 + }, + { + "epoch": 0.0627168401387777, + "grad_norm": 0.34250803215849346, + "learning_rate": 4.68e-05, + "loss": 0.7531, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.740280270576477, + "step": 235, + "valid_targets_mean": 15716.9, + "valid_targets_min": 179 + }, + { + "epoch": 0.06405124099279423, + "grad_norm": 0.34271827895918605, + "learning_rate": 4.7799999999999996e-05, + "loss": 0.7481, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7414883375167847, + "step": 240, + "valid_targets_mean": 15428.0, + "valid_targets_min": 471 + }, + { + "epoch": 0.06538564184681078, + "grad_norm": 0.23278045941311432, + "learning_rate": 4.8799999999999994e-05, + "loss": 0.7361, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7401506900787354, + "step": 245, + "valid_targets_mean": 16283.0, + "valid_targets_min": 625 + }, + { + "epoch": 0.06672004270082733, + "grad_norm": 0.27127309559658486, + "learning_rate": 4.98e-05, + "loss": 0.7647, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7441200017929077, + "step": 250, + "valid_targets_mean": 16885.9, + "valid_targets_min": 716 + }, + { + "epoch": 0.06805444355484387, + "grad_norm": 0.481644259210808, + "learning_rate": 5.0799999999999995e-05, + "loss": 0.7516, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7468514442443848, + "step": 255, + "valid_targets_mean": 15019.4, + "valid_targets_min": 672 + }, + { + "epoch": 0.06938884440886042, + "grad_norm": 0.4098831620054727, + "learning_rate": 5.179999999999999e-05, + "loss": 0.7373, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7163417339324951, + "step": 260, + "valid_targets_mean": 16107.3, + "valid_targets_min": 691 + }, + { + "epoch": 0.07072324526287697, + "grad_norm": 0.39289466248174665, + "learning_rate": 5.279999999999999e-05, + "loss": 0.7385, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7264701128005981, + "step": 265, + "valid_targets_mean": 15163.3, + "valid_targets_min": 105 + }, + { + "epoch": 0.07205764611689351, + "grad_norm": 0.36659091377537845, + "learning_rate": 5.38e-05, + "loss": 0.7459, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7142473459243774, + "step": 270, + "valid_targets_mean": 16897.8, + "valid_targets_min": 135 + }, + { + "epoch": 0.07339204697091006, + "grad_norm": 0.29714942560135077, + "learning_rate": 5.48e-05, + "loss": 0.7382, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7210055589675903, + "step": 275, + "valid_targets_mean": 16187.2, + "valid_targets_min": 632 + }, + { + "epoch": 0.07472644782492661, + "grad_norm": 0.25299625938272635, + "learning_rate": 5.5799999999999994e-05, + "loss": 0.7288, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6921160221099854, + "step": 280, + "valid_targets_mean": 15581.8, + "valid_targets_min": 535 + }, + { + "epoch": 0.07606084867894315, + "grad_norm": 0.37119467794678546, + "learning_rate": 5.679999999999999e-05, + "loss": 0.7388, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7240397334098816, + "step": 285, + "valid_targets_mean": 15023.2, + "valid_targets_min": 702 + }, + { + "epoch": 0.0773952495329597, + "grad_norm": 0.3945122893124607, + "learning_rate": 5.78e-05, + "loss": 0.7289, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7283365726470947, + "step": 290, + "valid_targets_mean": 15270.7, + "valid_targets_min": 249 + }, + { + "epoch": 0.07872965038697624, + "grad_norm": 0.377065993532186, + "learning_rate": 5.88e-05, + "loss": 0.7277, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7348593473434448, + "step": 295, + "valid_targets_mean": 16535.4, + "valid_targets_min": 130 + }, + { + "epoch": 0.08006405124099279, + "grad_norm": 0.2580659845527572, + "learning_rate": 5.98e-05, + "loss": 0.7596, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.736121654510498, + "step": 300, + "valid_targets_mean": 15587.4, + "valid_targets_min": 591 + }, + { + "epoch": 0.08139845209500934, + "grad_norm": 0.4376033475371323, + "learning_rate": 6.0799999999999994e-05, + "loss": 0.7345, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7281279563903809, + "step": 305, + "valid_targets_mean": 15663.5, + "valid_targets_min": 684 + }, + { + "epoch": 0.08273285294902588, + "grad_norm": 0.4820258206141076, + "learning_rate": 6.18e-05, + "loss": 0.7449, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7241256237030029, + "step": 310, + "valid_targets_mean": 16960.6, + "valid_targets_min": 744 + }, + { + "epoch": 0.08406725380304243, + "grad_norm": 0.46073068241555637, + "learning_rate": 6.28e-05, + "loss": 0.7299, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7059940695762634, + "step": 315, + "valid_targets_mean": 16698.9, + "valid_targets_min": 628 + }, + { + "epoch": 0.08540165465705898, + "grad_norm": 0.4089341185808167, + "learning_rate": 6.379999999999999e-05, + "loss": 0.7372, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7223199605941772, + "step": 320, + "valid_targets_mean": 15688.4, + "valid_targets_min": 613 + }, + { + "epoch": 0.08673605551107552, + "grad_norm": 0.3223826554928393, + "learning_rate": 6.479999999999999e-05, + "loss": 0.7176, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7099969983100891, + "step": 325, + "valid_targets_mean": 16591.9, + "valid_targets_min": 344 + }, + { + "epoch": 0.08807045636509207, + "grad_norm": 0.40317021543159837, + "learning_rate": 6.579999999999999e-05, + "loss": 0.716, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7116838693618774, + "step": 330, + "valid_targets_mean": 15636.7, + "valid_targets_min": 619 + }, + { + "epoch": 0.08940485721910862, + "grad_norm": 0.3714431977080272, + "learning_rate": 6.68e-05, + "loss": 0.725, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7317278385162354, + "step": 335, + "valid_targets_mean": 17115.1, + "valid_targets_min": 795 + }, + { + "epoch": 0.09073925807312516, + "grad_norm": 0.4525830067727992, + "learning_rate": 6.78e-05, + "loss": 0.7378, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.711759090423584, + "step": 340, + "valid_targets_mean": 16281.7, + "valid_targets_min": 716 + }, + { + "epoch": 0.09207365892714171, + "grad_norm": 0.4673023679344057, + "learning_rate": 6.879999999999999e-05, + "loss": 0.7283, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7156293392181396, + "step": 345, + "valid_targets_mean": 17035.9, + "valid_targets_min": 629 + }, + { + "epoch": 0.09340805978115826, + "grad_norm": 0.6302835443346549, + "learning_rate": 6.979999999999999e-05, + "loss": 0.7395, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7281468510627747, + "step": 350, + "valid_targets_mean": 15777.8, + "valid_targets_min": 612 + }, + { + "epoch": 0.0947424606351748, + "grad_norm": 0.4776181444975064, + "learning_rate": 7.079999999999999e-05, + "loss": 0.7362, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.731685221195221, + "step": 355, + "valid_targets_mean": 16132.8, + "valid_targets_min": 730 + }, + { + "epoch": 0.09607686148919135, + "grad_norm": 0.46366024009522955, + "learning_rate": 7.18e-05, + "loss": 0.7228, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7093417644500732, + "step": 360, + "valid_targets_mean": 17213.5, + "valid_targets_min": 902 + }, + { + "epoch": 0.0974112623432079, + "grad_norm": 0.6669182877606497, + "learning_rate": 7.28e-05, + "loss": 0.7336, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7283340692520142, + "step": 365, + "valid_targets_mean": 16158.5, + "valid_targets_min": 522 + }, + { + "epoch": 0.09874566319722444, + "grad_norm": 0.5530295536238364, + "learning_rate": 7.379999999999999e-05, + "loss": 0.7288, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.730088472366333, + "step": 370, + "valid_targets_mean": 15394.1, + "valid_targets_min": 2 + }, + { + "epoch": 0.100080064051241, + "grad_norm": 0.625459475063553, + "learning_rate": 7.479999999999999e-05, + "loss": 0.7357, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7494319677352905, + "step": 375, + "valid_targets_mean": 15665.5, + "valid_targets_min": 479 + }, + { + "epoch": 0.10141446490525755, + "grad_norm": 0.5768997718865845, + "learning_rate": 7.579999999999999e-05, + "loss": 0.7199, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6803427338600159, + "step": 380, + "valid_targets_mean": 17104.0, + "valid_targets_min": 101 + }, + { + "epoch": 0.10274886575927408, + "grad_norm": 0.4506068757537433, + "learning_rate": 7.68e-05, + "loss": 0.7239, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7258304357528687, + "step": 385, + "valid_targets_mean": 17220.1, + "valid_targets_min": 715 + }, + { + "epoch": 0.10408326661329063, + "grad_norm": 0.47171044726445444, + "learning_rate": 7.780000000000001e-05, + "loss": 0.7299, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7591128349304199, + "step": 390, + "valid_targets_mean": 15987.7, + "valid_targets_min": 679 + }, + { + "epoch": 0.10541766746730719, + "grad_norm": 0.38595337799176016, + "learning_rate": 7.879999999999999e-05, + "loss": 0.7177, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7050427198410034, + "step": 395, + "valid_targets_mean": 15030.2, + "valid_targets_min": 415 + }, + { + "epoch": 0.10675206832132372, + "grad_norm": 1.0374726912615833, + "learning_rate": 7.98e-05, + "loss": 0.73, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7716153264045715, + "step": 400, + "valid_targets_mean": 16188.2, + "valid_targets_min": 660 + }, + { + "epoch": 0.10808646917534027, + "grad_norm": 0.6324192761921746, + "learning_rate": 8.079999999999999e-05, + "loss": 0.7392, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7432792782783508, + "step": 405, + "valid_targets_mean": 15845.6, + "valid_targets_min": 444 + }, + { + "epoch": 0.10942087002935681, + "grad_norm": 0.78537905081529, + "learning_rate": 8.18e-05, + "loss": 0.7268, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7303118109703064, + "step": 410, + "valid_targets_mean": 15707.5, + "valid_targets_min": 541 + }, + { + "epoch": 0.11075527088337336, + "grad_norm": 0.9395811255221675, + "learning_rate": 8.28e-05, + "loss": 0.7005, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7188759446144104, + "step": 415, + "valid_targets_mean": 15624.4, + "valid_targets_min": 678 + }, + { + "epoch": 0.11208967173738991, + "grad_norm": 0.9295266743546321, + "learning_rate": 8.379999999999999e-05, + "loss": 0.703, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7148219347000122, + "step": 420, + "valid_targets_mean": 16225.2, + "valid_targets_min": 458 + }, + { + "epoch": 0.11342407259140645, + "grad_norm": 0.476696559517845, + "learning_rate": 8.48e-05, + "loss": 0.715, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7083289623260498, + "step": 425, + "valid_targets_mean": 15491.8, + "valid_targets_min": 683 + }, + { + "epoch": 0.114758473445423, + "grad_norm": 0.43534945533869385, + "learning_rate": 8.579999999999998e-05, + "loss": 0.7204, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7006481885910034, + "step": 430, + "valid_targets_mean": 17209.7, + "valid_targets_min": 598 + }, + { + "epoch": 0.11609287429943956, + "grad_norm": 0.6609645621259375, + "learning_rate": 8.68e-05, + "loss": 0.7315, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7302699089050293, + "step": 435, + "valid_targets_mean": 14802.1, + "valid_targets_min": 544 + }, + { + "epoch": 0.11742727515345609, + "grad_norm": 0.7199278706441802, + "learning_rate": 8.779999999999999e-05, + "loss": 0.7176, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7259851098060608, + "step": 440, + "valid_targets_mean": 16476.4, + "valid_targets_min": 750 + }, + { + "epoch": 0.11876167600747264, + "grad_norm": 0.4773065968592865, + "learning_rate": 8.879999999999999e-05, + "loss": 0.7136, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7408217191696167, + "step": 445, + "valid_targets_mean": 17142.7, + "valid_targets_min": 478 + }, + { + "epoch": 0.1200960768614892, + "grad_norm": 0.37172351171758483, + "learning_rate": 8.98e-05, + "loss": 0.7237, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7378139495849609, + "step": 450, + "valid_targets_mean": 15218.4, + "valid_targets_min": 462 + }, + { + "epoch": 0.12143047771550573, + "grad_norm": 0.39304827138785564, + "learning_rate": 9.079999999999998e-05, + "loss": 0.7107, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7344069480895996, + "step": 455, + "valid_targets_mean": 16115.3, + "valid_targets_min": 81 + }, + { + "epoch": 0.12276487856952228, + "grad_norm": 0.42542723715742675, + "learning_rate": 9.18e-05, + "loss": 0.7134, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7543541193008423, + "step": 460, + "valid_targets_mean": 14546.4, + "valid_targets_min": 531 + }, + { + "epoch": 0.12409927942353884, + "grad_norm": 0.541397629733599, + "learning_rate": 9.279999999999999e-05, + "loss": 0.7253, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7133990526199341, + "step": 465, + "valid_targets_mean": 16384.3, + "valid_targets_min": 597 + }, + { + "epoch": 0.1254336802775554, + "grad_norm": 0.5822512924496642, + "learning_rate": 9.379999999999999e-05, + "loss": 0.7129, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6963658928871155, + "step": 470, + "valid_targets_mean": 15760.1, + "valid_targets_min": 673 + }, + { + "epoch": 0.12676808113157192, + "grad_norm": 0.5030863279307085, + "learning_rate": 9.479999999999999e-05, + "loss": 0.734, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7287914752960205, + "step": 475, + "valid_targets_mean": 16120.6, + "valid_targets_min": 562 + }, + { + "epoch": 0.12810248198558846, + "grad_norm": 0.4939684474512313, + "learning_rate": 9.58e-05, + "loss": 0.72, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7166863679885864, + "step": 480, + "valid_targets_mean": 15308.1, + "valid_targets_min": 718 + }, + { + "epoch": 0.12943688283960503, + "grad_norm": 1.1934926781005402, + "learning_rate": 9.68e-05, + "loss": 0.7278, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7173789739608765, + "step": 485, + "valid_targets_mean": 15423.5, + "valid_targets_min": 147 + }, + { + "epoch": 0.13077128369362157, + "grad_norm": 0.5255232868822954, + "learning_rate": 9.779999999999999e-05, + "loss": 0.714, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7186357975006104, + "step": 490, + "valid_targets_mean": 16427.6, + "valid_targets_min": 456 + }, + { + "epoch": 0.1321056845476381, + "grad_norm": 0.5484769961875839, + "learning_rate": 9.879999999999999e-05, + "loss": 0.7212, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7366380095481873, + "step": 495, + "valid_targets_mean": 17284.8, + "valid_targets_min": 230 + }, + { + "epoch": 0.13344008540165467, + "grad_norm": 0.5074708333313445, + "learning_rate": 9.979999999999999e-05, + "loss": 0.7251, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7222837209701538, + "step": 500, + "valid_targets_mean": 16145.7, + "valid_targets_min": 453 + }, + { + "epoch": 0.1347744862556712, + "grad_norm": 0.44933138863293226, + "learning_rate": 0.0001008, + "loss": 0.72, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7153065204620361, + "step": 505, + "valid_targets_mean": 16280.8, + "valid_targets_min": 537 + }, + { + "epoch": 0.13610888710968774, + "grad_norm": 0.44505945767105004, + "learning_rate": 0.00010179999999999998, + "loss": 0.7155, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6971901655197144, + "step": 510, + "valid_targets_mean": 17205.7, + "valid_targets_min": 659 + }, + { + "epoch": 0.1374432879637043, + "grad_norm": 0.48703552246931575, + "learning_rate": 0.00010279999999999999, + "loss": 0.7102, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6962928771972656, + "step": 515, + "valid_targets_mean": 15323.8, + "valid_targets_min": 219 + }, + { + "epoch": 0.13877768881772085, + "grad_norm": 0.5239136710241173, + "learning_rate": 0.00010379999999999999, + "loss": 0.7049, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7096296548843384, + "step": 520, + "valid_targets_mean": 17015.6, + "valid_targets_min": 681 + }, + { + "epoch": 0.14011208967173738, + "grad_norm": 0.685550891317315, + "learning_rate": 0.00010479999999999999, + "loss": 0.7213, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7331212162971497, + "step": 525, + "valid_targets_mean": 17924.0, + "valid_targets_min": 510 + }, + { + "epoch": 0.14144649052575395, + "grad_norm": 0.9371855061417276, + "learning_rate": 0.0001058, + "loss": 0.7189, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.756299614906311, + "step": 530, + "valid_targets_mean": 15321.0, + "valid_targets_min": 745 + }, + { + "epoch": 0.14278089137977049, + "grad_norm": 0.5750367848876685, + "learning_rate": 0.00010679999999999998, + "loss": 0.7188, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7179563045501709, + "step": 535, + "valid_targets_mean": 14206.7, + "valid_targets_min": 539 + }, + { + "epoch": 0.14411529223378702, + "grad_norm": 0.5833077589670811, + "learning_rate": 0.00010779999999999999, + "loss": 0.7283, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7211377620697021, + "step": 540, + "valid_targets_mean": 16022.5, + "valid_targets_min": 509 + }, + { + "epoch": 0.1454496930878036, + "grad_norm": 0.7269177019931343, + "learning_rate": 0.0001088, + "loss": 0.7178, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7293734550476074, + "step": 545, + "valid_targets_mean": 15989.6, + "valid_targets_min": 666 + }, + { + "epoch": 0.14678409394182013, + "grad_norm": 0.5334975069811895, + "learning_rate": 0.00010979999999999999, + "loss": 0.7393, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7264102697372437, + "step": 550, + "valid_targets_mean": 15266.4, + "valid_targets_min": 668 + }, + { + "epoch": 0.14811849479583666, + "grad_norm": 0.6250384008635103, + "learning_rate": 0.0001108, + "loss": 0.6967, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6969237923622131, + "step": 555, + "valid_targets_mean": 16026.1, + "valid_targets_min": 621 + }, + { + "epoch": 0.14945289564985323, + "grad_norm": 0.8468842115841293, + "learning_rate": 0.00011179999999999998, + "loss": 0.7226, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7111748456954956, + "step": 560, + "valid_targets_mean": 15614.1, + "valid_targets_min": 486 + }, + { + "epoch": 0.15078729650386977, + "grad_norm": 0.8021724458590994, + "learning_rate": 0.00011279999999999999, + "loss": 0.689, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6887655258178711, + "step": 565, + "valid_targets_mean": 17246.1, + "valid_targets_min": 740 + }, + { + "epoch": 0.1521216973578863, + "grad_norm": 0.6445231347491678, + "learning_rate": 0.0001138, + "loss": 0.7125, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7299594283103943, + "step": 570, + "valid_targets_mean": 15399.9, + "valid_targets_min": 587 + }, + { + "epoch": 0.15345609821190287, + "grad_norm": 0.9632004486100639, + "learning_rate": 0.00011479999999999999, + "loss": 0.7258, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.725225031375885, + "step": 575, + "valid_targets_mean": 16895.6, + "valid_targets_min": 871 + }, + { + "epoch": 0.1547904990659194, + "grad_norm": 0.6125391497023498, + "learning_rate": 0.0001158, + "loss": 0.7283, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7031444907188416, + "step": 580, + "valid_targets_mean": 16781.4, + "valid_targets_min": 365 + }, + { + "epoch": 0.15612489991993594, + "grad_norm": 0.914929177218736, + "learning_rate": 0.00011679999999999998, + "loss": 0.73, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7310180068016052, + "step": 585, + "valid_targets_mean": 14891.6, + "valid_targets_min": 104 + }, + { + "epoch": 0.15745930077395248, + "grad_norm": 0.8814371014768175, + "learning_rate": 0.00011779999999999999, + "loss": 0.7309, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7159960269927979, + "step": 590, + "valid_targets_mean": 14935.1, + "valid_targets_min": 473 + }, + { + "epoch": 0.15879370162796905, + "grad_norm": 0.5975243304153101, + "learning_rate": 0.0001188, + "loss": 0.7138, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7245515584945679, + "step": 595, + "valid_targets_mean": 17035.9, + "valid_targets_min": 727 + }, + { + "epoch": 0.16012810248198558, + "grad_norm": 0.46679873052553167, + "learning_rate": 0.00011979999999999998, + "loss": 0.7085, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6976876258850098, + "step": 600, + "valid_targets_mean": 15646.5, + "valid_targets_min": 459 + }, + { + "epoch": 0.16146250333600212, + "grad_norm": 0.5128674027346761, + "learning_rate": 0.0001208, + "loss": 0.7223, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7510048151016235, + "step": 605, + "valid_targets_mean": 15762.4, + "valid_targets_min": 771 + }, + { + "epoch": 0.1627969041900187, + "grad_norm": 0.5819395696398177, + "learning_rate": 0.00012179999999999999, + "loss": 0.7157, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.657742977142334, + "step": 610, + "valid_targets_mean": 16854.7, + "valid_targets_min": 746 + }, + { + "epoch": 0.16413130504403523, + "grad_norm": 0.5162670382257071, + "learning_rate": 0.00012279999999999998, + "loss": 0.7084, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7006169557571411, + "step": 615, + "valid_targets_mean": 15703.4, + "valid_targets_min": 638 + }, + { + "epoch": 0.16546570589805176, + "grad_norm": 0.6945068724820247, + "learning_rate": 0.0001238, + "loss": 0.7216, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.756109356880188, + "step": 620, + "valid_targets_mean": 15891.4, + "valid_targets_min": 360 + }, + { + "epoch": 0.16680010675206833, + "grad_norm": 0.9642949707242404, + "learning_rate": 0.00012479999999999997, + "loss": 0.7238, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.695439875125885, + "step": 625, + "valid_targets_mean": 17157.8, + "valid_targets_min": 731 + }, + { + "epoch": 0.16813450760608487, + "grad_norm": 0.5833542867382966, + "learning_rate": 0.0001258, + "loss": 0.715, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6990182399749756, + "step": 630, + "valid_targets_mean": 15990.5, + "valid_targets_min": 349 + }, + { + "epoch": 0.1694689084601014, + "grad_norm": 0.7007660146650656, + "learning_rate": 0.0001268, + "loss": 0.7157, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7077897787094116, + "step": 635, + "valid_targets_mean": 15861.1, + "valid_targets_min": 678 + }, + { + "epoch": 0.17080330931411797, + "grad_norm": 0.49195751975639107, + "learning_rate": 0.0001278, + "loss": 0.7161, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6865917444229126, + "step": 640, + "valid_targets_mean": 15295.1, + "valid_targets_min": 469 + }, + { + "epoch": 0.1721377101681345, + "grad_norm": 0.7191679724888371, + "learning_rate": 0.0001288, + "loss": 0.7069, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7064446210861206, + "step": 645, + "valid_targets_mean": 16334.0, + "valid_targets_min": 557 + }, + { + "epoch": 0.17347211102215104, + "grad_norm": 0.5594698481432445, + "learning_rate": 0.00012979999999999998, + "loss": 0.7229, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.708102822303772, + "step": 650, + "valid_targets_mean": 16455.3, + "valid_targets_min": 87 + }, + { + "epoch": 0.1748065118761676, + "grad_norm": 0.735025293283187, + "learning_rate": 0.00013079999999999998, + "loss": 0.7222, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7207574248313904, + "step": 655, + "valid_targets_mean": 16754.3, + "valid_targets_min": 756 + }, + { + "epoch": 0.17614091273018415, + "grad_norm": 0.3958769606977501, + "learning_rate": 0.0001318, + "loss": 0.7019, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6824870109558105, + "step": 660, + "valid_targets_mean": 16950.8, + "valid_targets_min": 823 + }, + { + "epoch": 0.17747531358420068, + "grad_norm": 0.38239059142969134, + "learning_rate": 0.00013279999999999998, + "loss": 0.718, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6917785406112671, + "step": 665, + "valid_targets_mean": 16209.8, + "valid_targets_min": 613 + }, + { + "epoch": 0.17880971443821725, + "grad_norm": 0.5118945312941819, + "learning_rate": 0.0001338, + "loss": 0.7221, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7017595767974854, + "step": 670, + "valid_targets_mean": 15769.2, + "valid_targets_min": 717 + }, + { + "epoch": 0.1801441152922338, + "grad_norm": 0.6464646630845813, + "learning_rate": 0.00013479999999999997, + "loss": 0.7236, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7357965707778931, + "step": 675, + "valid_targets_mean": 16688.3, + "valid_targets_min": 411 + }, + { + "epoch": 0.18147851614625032, + "grad_norm": 0.4239557207049385, + "learning_rate": 0.0001358, + "loss": 0.7025, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6929694414138794, + "step": 680, + "valid_targets_mean": 15849.2, + "valid_targets_min": 360 + }, + { + "epoch": 0.1828129170002669, + "grad_norm": 0.7804567161815549, + "learning_rate": 0.0001368, + "loss": 0.7189, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7219686508178711, + "step": 685, + "valid_targets_mean": 16094.0, + "valid_targets_min": 686 + }, + { + "epoch": 0.18414731785428343, + "grad_norm": 0.5732418331235286, + "learning_rate": 0.0001378, + "loss": 0.7047, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6867932081222534, + "step": 690, + "valid_targets_mean": 15930.7, + "valid_targets_min": 42 + }, + { + "epoch": 0.18548171870829996, + "grad_norm": 0.42458958191005924, + "learning_rate": 0.00013879999999999999, + "loss": 0.7014, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6767255067825317, + "step": 695, + "valid_targets_mean": 15631.3, + "valid_targets_min": 796 + }, + { + "epoch": 0.18681611956231653, + "grad_norm": 0.83041183706765, + "learning_rate": 0.00013979999999999998, + "loss": 0.7104, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7344939112663269, + "step": 700, + "valid_targets_mean": 14661.2, + "valid_targets_min": 220 + }, + { + "epoch": 0.18815052041633307, + "grad_norm": 0.4551116123008287, + "learning_rate": 0.00014079999999999998, + "loss": 0.7053, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6875162720680237, + "step": 705, + "valid_targets_mean": 17108.3, + "valid_targets_min": 429 + }, + { + "epoch": 0.1894849212703496, + "grad_norm": 0.42062013074810284, + "learning_rate": 0.0001418, + "loss": 0.7087, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7142444849014282, + "step": 710, + "valid_targets_mean": 15786.6, + "valid_targets_min": 679 + }, + { + "epoch": 0.19081932212436617, + "grad_norm": 0.6305250919291718, + "learning_rate": 0.00014279999999999997, + "loss": 0.6996, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.690528154373169, + "step": 715, + "valid_targets_mean": 16620.3, + "valid_targets_min": 530 + }, + { + "epoch": 0.1921537229783827, + "grad_norm": 0.49236440297808903, + "learning_rate": 0.0001438, + "loss": 0.6826, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7059494256973267, + "step": 720, + "valid_targets_mean": 15789.3, + "valid_targets_min": 592 + }, + { + "epoch": 0.19348812383239924, + "grad_norm": 1.0246968836811798, + "learning_rate": 0.0001448, + "loss": 0.6966, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7069756984710693, + "step": 725, + "valid_targets_mean": 15479.2, + "valid_targets_min": 694 + }, + { + "epoch": 0.1948225246864158, + "grad_norm": 0.9166310918813874, + "learning_rate": 0.0001458, + "loss": 0.712, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.696449339389801, + "step": 730, + "valid_targets_mean": 17183.2, + "valid_targets_min": 510 + }, + { + "epoch": 0.19615692554043235, + "grad_norm": 1.0363387105812145, + "learning_rate": 0.0001468, + "loss": 0.7071, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7203611135482788, + "step": 735, + "valid_targets_mean": 14946.1, + "valid_targets_min": 577 + }, + { + "epoch": 0.19749132639444889, + "grad_norm": 0.5417483344221564, + "learning_rate": 0.0001478, + "loss": 0.7106, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7111995816230774, + "step": 740, + "valid_targets_mean": 14798.5, + "valid_targets_min": 314 + }, + { + "epoch": 0.19882572724846545, + "grad_norm": 0.777755567926226, + "learning_rate": 0.00014879999999999998, + "loss": 0.7001, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6688179969787598, + "step": 745, + "valid_targets_mean": 15765.6, + "valid_targets_min": 130 + }, + { + "epoch": 0.200160128102482, + "grad_norm": 0.7871992497617583, + "learning_rate": 0.00014979999999999998, + "loss": 0.7054, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7222711443901062, + "step": 750, + "valid_targets_mean": 15587.0, + "valid_targets_min": 142 + }, + { + "epoch": 0.20149452895649853, + "grad_norm": 0.7589612805003493, + "learning_rate": 0.00014999986979857214, + "loss": 0.7035, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7213101387023926, + "step": 755, + "valid_targets_mean": 15475.6, + "valid_targets_min": 3 + }, + { + "epoch": 0.2028289298105151, + "grad_norm": 0.8806420553414223, + "learning_rate": 0.00014999934085604638, + "loss": 0.7045, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.721771240234375, + "step": 760, + "valid_targets_mean": 15470.4, + "valid_targets_min": 469 + }, + { + "epoch": 0.20416333066453163, + "grad_norm": 0.6490469254239379, + "learning_rate": 0.00014999840503770068, + "loss": 0.7057, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6929470300674438, + "step": 765, + "valid_targets_mean": 15379.0, + "valid_targets_min": 429 + }, + { + "epoch": 0.20549773151854817, + "grad_norm": 0.632766163326704, + "learning_rate": 0.00014999706234861205, + "loss": 0.7181, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7145708799362183, + "step": 770, + "valid_targets_mean": 15203.7, + "valid_targets_min": 555 + }, + { + "epoch": 0.20683213237256473, + "grad_norm": 0.7382870047734233, + "learning_rate": 0.00014999531279606457, + "loss": 0.7086, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7060419321060181, + "step": 775, + "valid_targets_mean": 16520.4, + "valid_targets_min": 507 + }, + { + "epoch": 0.20816653322658127, + "grad_norm": 0.9240426936239289, + "learning_rate": 0.00014999315638954965, + "loss": 0.7147, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.709404468536377, + "step": 780, + "valid_targets_mean": 17228.6, + "valid_targets_min": 774 + }, + { + "epoch": 0.2095009340805978, + "grad_norm": 0.8934733650392805, + "learning_rate": 0.000149990593140766, + "loss": 0.7113, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7076325416564941, + "step": 785, + "valid_targets_mean": 16678.5, + "valid_targets_min": 490 + }, + { + "epoch": 0.21083533493461437, + "grad_norm": 0.836599216200632, + "learning_rate": 0.00014998762306361933, + "loss": 0.694, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6929929852485657, + "step": 790, + "valid_targets_mean": 16718.5, + "valid_targets_min": 658 + }, + { + "epoch": 0.2121697357886309, + "grad_norm": 3.5029546430195277, + "learning_rate": 0.00014998424617422253, + "loss": 0.7001, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7014665603637695, + "step": 795, + "valid_targets_mean": 17313.6, + "valid_targets_min": 703 + }, + { + "epoch": 0.21350413664264745, + "grad_norm": 0.5418752118979653, + "learning_rate": 0.00014998046249089538, + "loss": 0.7014, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.688701868057251, + "step": 800, + "valid_targets_mean": 16082.9, + "valid_targets_min": 554 + }, + { + "epoch": 0.214838537496664, + "grad_norm": 0.6706169884495433, + "learning_rate": 0.00014997627203416458, + "loss": 0.6998, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7123109102249146, + "step": 805, + "valid_targets_mean": 15668.5, + "valid_targets_min": 570 + }, + { + "epoch": 0.21617293835068055, + "grad_norm": 0.7159637795497619, + "learning_rate": 0.00014997167482676366, + "loss": 0.7013, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7268193960189819, + "step": 810, + "valid_targets_mean": 14148.5, + "valid_targets_min": 714 + }, + { + "epoch": 0.2175073392046971, + "grad_norm": 0.39213537306358476, + "learning_rate": 0.00014996667089363272, + "loss": 0.6972, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6896648406982422, + "step": 815, + "valid_targets_mean": 15892.1, + "valid_targets_min": 304 + }, + { + "epoch": 0.21884174005871362, + "grad_norm": 0.6142783873448505, + "learning_rate": 0.00014996126026191832, + "loss": 0.7162, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7129541635513306, + "step": 820, + "valid_targets_mean": 16946.2, + "valid_targets_min": 491 + }, + { + "epoch": 0.2201761409127302, + "grad_norm": 0.5260685820283173, + "learning_rate": 0.00014995544296097355, + "loss": 0.7122, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7193052768707275, + "step": 825, + "valid_targets_mean": 14956.7, + "valid_targets_min": 732 + }, + { + "epoch": 0.22151054176674673, + "grad_norm": 0.5686280764452485, + "learning_rate": 0.00014994921902235757, + "loss": 0.7094, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7117457985877991, + "step": 830, + "valid_targets_mean": 15185.0, + "valid_targets_min": 461 + }, + { + "epoch": 0.22284494262076326, + "grad_norm": 0.6755060505696501, + "learning_rate": 0.0001499425884798356, + "loss": 0.6913, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6957063674926758, + "step": 835, + "valid_targets_mean": 15872.1, + "valid_targets_min": 646 + }, + { + "epoch": 0.22417934347477983, + "grad_norm": 0.48553090040615876, + "learning_rate": 0.00014993555136937872, + "loss": 0.7015, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6867814064025879, + "step": 840, + "valid_targets_mean": 16234.7, + "valid_targets_min": 405 + }, + { + "epoch": 0.22551374432879637, + "grad_norm": 0.40569646079083105, + "learning_rate": 0.0001499281077291637, + "loss": 0.7108, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7366761565208435, + "step": 845, + "valid_targets_mean": 15982.0, + "valid_targets_min": 459 + }, + { + "epoch": 0.2268481451828129, + "grad_norm": 1.017546932562299, + "learning_rate": 0.00014992025759957267, + "loss": 0.7268, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7172836065292358, + "step": 850, + "valid_targets_mean": 15778.7, + "valid_targets_min": 669 + }, + { + "epoch": 0.22818254603682947, + "grad_norm": 0.6688766038496526, + "learning_rate": 0.0001499120010231931, + "loss": 0.6981, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.687598705291748, + "step": 855, + "valid_targets_mean": 16142.9, + "valid_targets_min": 528 + }, + { + "epoch": 0.229516946890846, + "grad_norm": 0.6613026228057015, + "learning_rate": 0.00014990333804481738, + "loss": 0.6987, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6992521286010742, + "step": 860, + "valid_targets_mean": 16895.7, + "valid_targets_min": 235 + }, + { + "epoch": 0.23085134774486255, + "grad_norm": 0.8302928138355796, + "learning_rate": 0.00014989426871144266, + "loss": 0.6985, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7034393548965454, + "step": 865, + "valid_targets_mean": 16505.0, + "valid_targets_min": 799 + }, + { + "epoch": 0.2321857485988791, + "grad_norm": 0.7509998803398379, + "learning_rate": 0.00014988479307227062, + "loss": 0.6855, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7085684537887573, + "step": 870, + "valid_targets_mean": 14895.0, + "valid_targets_min": 298 + }, + { + "epoch": 0.23352014945289565, + "grad_norm": 0.6037951591636942, + "learning_rate": 0.00014987491117870717, + "loss": 0.7033, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6840174198150635, + "step": 875, + "valid_targets_mean": 16543.5, + "valid_targets_min": 812 + }, + { + "epoch": 0.23485455030691219, + "grad_norm": 0.5286893064532538, + "learning_rate": 0.00014986462308436214, + "loss": 0.6884, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7020936012268066, + "step": 880, + "valid_targets_mean": 14788.7, + "valid_targets_min": 606 + }, + { + "epoch": 0.23618895116092875, + "grad_norm": 0.480456782545674, + "learning_rate": 0.00014985392884504903, + "loss": 0.7011, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7093113660812378, + "step": 885, + "valid_targets_mean": 15861.4, + "valid_targets_min": 437 + }, + { + "epoch": 0.2375233520149453, + "grad_norm": 0.7679411381978142, + "learning_rate": 0.00014984282851878477, + "loss": 0.698, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7077801823616028, + "step": 890, + "valid_targets_mean": 16783.0, + "valid_targets_min": 509 + }, + { + "epoch": 0.23885775286896183, + "grad_norm": 0.5231140658944428, + "learning_rate": 0.00014983132216578923, + "loss": 0.6982, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6934367418289185, + "step": 895, + "valid_targets_mean": 16316.8, + "valid_targets_min": 551 + }, + { + "epoch": 0.2401921537229784, + "grad_norm": 0.42864022271796487, + "learning_rate": 0.00014981940984848508, + "loss": 0.6764, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6391340494155884, + "step": 900, + "valid_targets_mean": 16328.9, + "valid_targets_min": 621 + }, + { + "epoch": 0.24152655457699493, + "grad_norm": 0.33650902419596107, + "learning_rate": 0.00014980709163149732, + "loss": 0.7052, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7220794558525085, + "step": 905, + "valid_targets_mean": 15666.6, + "valid_targets_min": 513 + }, + { + "epoch": 0.24286095543101147, + "grad_norm": 0.6102385943286962, + "learning_rate": 0.000149794367581653, + "loss": 0.6993, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7103188037872314, + "step": 910, + "valid_targets_mean": 16207.6, + "valid_targets_min": 361 + }, + { + "epoch": 0.24419535628502803, + "grad_norm": 0.6766800650304651, + "learning_rate": 0.00014978123776798082, + "loss": 0.6879, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6693642735481262, + "step": 915, + "valid_targets_mean": 17180.4, + "valid_targets_min": 369 + }, + { + "epoch": 0.24552975713904457, + "grad_norm": 0.5708107933964744, + "learning_rate": 0.00014976770226171084, + "loss": 0.6906, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6481786966323853, + "step": 920, + "valid_targets_mean": 17630.6, + "valid_targets_min": 669 + }, + { + "epoch": 0.2468641579930611, + "grad_norm": 0.45298074962402585, + "learning_rate": 0.00014975376113627394, + "loss": 0.6954, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6705655455589294, + "step": 925, + "valid_targets_mean": 17155.6, + "valid_targets_min": 649 + }, + { + "epoch": 0.24819855884707767, + "grad_norm": 0.6539562997849696, + "learning_rate": 0.00014973941446730154, + "loss": 0.7149, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7168123126029968, + "step": 930, + "valid_targets_mean": 16628.1, + "valid_targets_min": 430 + }, + { + "epoch": 0.2495329597010942, + "grad_norm": 0.5986561836133009, + "learning_rate": 0.00014972466233262517, + "loss": 0.6949, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7100132703781128, + "step": 935, + "valid_targets_mean": 16743.7, + "valid_targets_min": 382 + }, + { + "epoch": 0.2508673605551108, + "grad_norm": 0.5148245538699373, + "learning_rate": 0.00014970950481227603, + "loss": 0.7109, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6915335655212402, + "step": 940, + "valid_targets_mean": 15595.5, + "valid_targets_min": 419 + }, + { + "epoch": 0.2522017614091273, + "grad_norm": 0.786060251192184, + "learning_rate": 0.00014969394198848456, + "loss": 0.7029, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7469134330749512, + "step": 945, + "valid_targets_mean": 14296.9, + "valid_targets_min": 651 + }, + { + "epoch": 0.25353616226314385, + "grad_norm": 0.43995264747649415, + "learning_rate": 0.00014967797394567993, + "loss": 0.6799, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6515603065490723, + "step": 950, + "valid_targets_mean": 16029.6, + "valid_targets_min": 502 + }, + { + "epoch": 0.2548705631171604, + "grad_norm": 0.7666679127339393, + "learning_rate": 0.00014966160077048982, + "loss": 0.6784, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6881482601165771, + "step": 955, + "valid_targets_mean": 16402.8, + "valid_targets_min": 108 + }, + { + "epoch": 0.2562049639711769, + "grad_norm": 0.575233221839231, + "learning_rate": 0.00014964482255173958, + "loss": 0.703, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.680946946144104, + "step": 960, + "valid_targets_mean": 15782.9, + "valid_targets_min": 13 + }, + { + "epoch": 0.25753936482519346, + "grad_norm": 0.4955657079524624, + "learning_rate": 0.00014962763938045206, + "loss": 0.7009, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6926153898239136, + "step": 965, + "valid_targets_mean": 14686.8, + "valid_targets_min": 850 + }, + { + "epoch": 0.25887376567921005, + "grad_norm": 0.6172410048860858, + "learning_rate": 0.00014961005134984693, + "loss": 0.6866, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6675003170967102, + "step": 970, + "valid_targets_mean": 17335.6, + "valid_targets_min": 688 + }, + { + "epoch": 0.2602081665332266, + "grad_norm": 0.5604574782581667, + "learning_rate": 0.00014959205855534036, + "loss": 0.6845, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.705886721611023, + "step": 975, + "valid_targets_mean": 16804.7, + "valid_targets_min": 197 + }, + { + "epoch": 0.26154256738724313, + "grad_norm": 0.5313317151302402, + "learning_rate": 0.00014957366109454427, + "loss": 0.6816, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6733583211898804, + "step": 980, + "valid_targets_mean": 16253.9, + "valid_targets_min": 660 + }, + { + "epoch": 0.26287696824125967, + "grad_norm": 0.43864368887865324, + "learning_rate": 0.00014955485906726596, + "loss": 0.6959, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6941563487052917, + "step": 985, + "valid_targets_mean": 15571.7, + "valid_targets_min": 448 + }, + { + "epoch": 0.2642113690952762, + "grad_norm": 0.5181543388907015, + "learning_rate": 0.00014953565257550756, + "loss": 0.7069, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6880620718002319, + "step": 990, + "valid_targets_mean": 16759.1, + "valid_targets_min": 399 + }, + { + "epoch": 0.26554576994929274, + "grad_norm": 0.7477865809506131, + "learning_rate": 0.00014951604172346535, + "loss": 0.6946, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7352211475372314, + "step": 995, + "valid_targets_mean": 14561.0, + "valid_targets_min": 616 + }, + { + "epoch": 0.26688017080330934, + "grad_norm": 0.6373119718120067, + "learning_rate": 0.00014949602661752944, + "loss": 0.7005, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6938153505325317, + "step": 1000, + "valid_targets_mean": 17262.1, + "valid_targets_min": 484 + }, + { + "epoch": 0.2682145716573259, + "grad_norm": 0.32709542106154893, + "learning_rate": 0.0001494756073662829, + "loss": 0.6683, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6421211957931519, + "step": 1005, + "valid_targets_mean": 16814.7, + "valid_targets_min": 544 + }, + { + "epoch": 0.2695489725113424, + "grad_norm": 0.6698123080687065, + "learning_rate": 0.00014945478408050135, + "loss": 0.69, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6433126926422119, + "step": 1010, + "valid_targets_mean": 17187.6, + "valid_targets_min": 698 + }, + { + "epoch": 0.27088337336535895, + "grad_norm": 0.5130901199029623, + "learning_rate": 0.00014943355687315239, + "loss": 0.6932, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.694229781627655, + "step": 1015, + "valid_targets_mean": 15706.6, + "valid_targets_min": 221 + }, + { + "epoch": 0.2722177742193755, + "grad_norm": 0.5310687957289015, + "learning_rate": 0.0001494119258593948, + "loss": 0.6833, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6675958633422852, + "step": 1020, + "valid_targets_mean": 16197.8, + "valid_targets_min": 647 + }, + { + "epoch": 0.273552175073392, + "grad_norm": 0.6328700461529049, + "learning_rate": 0.00014938989115657815, + "loss": 0.7083, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7138117551803589, + "step": 1025, + "valid_targets_mean": 16780.0, + "valid_targets_min": 457 + }, + { + "epoch": 0.2748865759274086, + "grad_norm": 0.8323618177058604, + "learning_rate": 0.00014936745288424198, + "loss": 0.7071, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7033565044403076, + "step": 1030, + "valid_targets_mean": 16363.2, + "valid_targets_min": 620 + }, + { + "epoch": 0.27622097678142515, + "grad_norm": 0.5615678318349799, + "learning_rate": 0.0001493446111641152, + "loss": 0.7001, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6922980546951294, + "step": 1035, + "valid_targets_mean": 17032.3, + "valid_targets_min": 286 + }, + { + "epoch": 0.2775553776354417, + "grad_norm": 0.9216225408504705, + "learning_rate": 0.00014932136612011554, + "loss": 0.6806, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6632153391838074, + "step": 1040, + "valid_targets_mean": 14829.7, + "valid_targets_min": 313 + }, + { + "epoch": 0.27888977848945823, + "grad_norm": 0.916779484221643, + "learning_rate": 0.00014929771787834868, + "loss": 0.6878, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6791641712188721, + "step": 1045, + "valid_targets_mean": 14985.0, + "valid_targets_min": 708 + }, + { + "epoch": 0.28022417934347477, + "grad_norm": 0.5637979161337277, + "learning_rate": 0.00014927366656710772, + "loss": 0.6978, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6769039630889893, + "step": 1050, + "valid_targets_mean": 16495.8, + "valid_targets_min": 605 + }, + { + "epoch": 0.2815585801974913, + "grad_norm": 0.7200961111808594, + "learning_rate": 0.00014924921231687245, + "loss": 0.7055, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6782281398773193, + "step": 1055, + "valid_targets_mean": 16101.9, + "valid_targets_min": 115 + }, + { + "epoch": 0.2828929810515079, + "grad_norm": 1.0978604253731457, + "learning_rate": 0.0001492243552603086, + "loss": 0.6899, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6719521284103394, + "step": 1060, + "valid_targets_mean": 16325.6, + "valid_targets_min": 619 + }, + { + "epoch": 0.28422738190552443, + "grad_norm": 0.7823473663674503, + "learning_rate": 0.00014919909553226716, + "loss": 0.6943, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.658243715763092, + "step": 1065, + "valid_targets_mean": 17418.4, + "valid_targets_min": 39 + }, + { + "epoch": 0.28556178275954097, + "grad_norm": 0.8215632846087839, + "learning_rate": 0.00014917343326978366, + "loss": 0.689, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6821578145027161, + "step": 1070, + "valid_targets_mean": 16322.2, + "valid_targets_min": 763 + }, + { + "epoch": 0.2868961836135575, + "grad_norm": 0.687488420158643, + "learning_rate": 0.00014914736861207733, + "loss": 0.6751, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6720151901245117, + "step": 1075, + "valid_targets_mean": 16538.7, + "valid_targets_min": 312 + }, + { + "epoch": 0.28823058446757405, + "grad_norm": 0.6210551753687071, + "learning_rate": 0.0001491209017005505, + "loss": 0.6952, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.701689600944519, + "step": 1080, + "valid_targets_mean": 15265.4, + "valid_targets_min": 537 + }, + { + "epoch": 0.2895649853215906, + "grad_norm": 0.919751129443059, + "learning_rate": 0.00014909403267878771, + "loss": 0.6866, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6928168535232544, + "step": 1085, + "valid_targets_mean": 15299.6, + "valid_targets_min": 275 + }, + { + "epoch": 0.2908993861756072, + "grad_norm": 0.6031403591660455, + "learning_rate": 0.000149066761692555, + "loss": 0.7153, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7102971076965332, + "step": 1090, + "valid_targets_mean": 15627.9, + "valid_targets_min": 653 + }, + { + "epoch": 0.2922337870296237, + "grad_norm": 0.6644450276274809, + "learning_rate": 0.00014903908888979904, + "loss": 0.7205, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7056329250335693, + "step": 1095, + "valid_targets_mean": 16785.1, + "valid_targets_min": 567 + }, + { + "epoch": 0.29356818788364025, + "grad_norm": 0.4764608245584093, + "learning_rate": 0.00014901101442064637, + "loss": 0.6987, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6979807615280151, + "step": 1100, + "valid_targets_mean": 16167.7, + "valid_targets_min": 616 + }, + { + "epoch": 0.2949025887376568, + "grad_norm": 0.6014049267424753, + "learning_rate": 0.00014898253843740271, + "loss": 0.68, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6723406314849854, + "step": 1105, + "valid_targets_mean": 16871.1, + "valid_targets_min": 59 + }, + { + "epoch": 0.2962369895916733, + "grad_norm": 0.5448219489623065, + "learning_rate": 0.00014895366109455189, + "loss": 0.6838, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6996907591819763, + "step": 1110, + "valid_targets_mean": 14544.4, + "valid_targets_min": 583 + }, + { + "epoch": 0.29757139044568987, + "grad_norm": 0.5583860198734728, + "learning_rate": 0.00014892438254875522, + "loss": 0.6971, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6966080665588379, + "step": 1115, + "valid_targets_mean": 15939.2, + "valid_targets_min": 506 + }, + { + "epoch": 0.29890579129970646, + "grad_norm": 0.5808714512224714, + "learning_rate": 0.00014889470295885047, + "loss": 0.6898, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7076345682144165, + "step": 1120, + "valid_targets_mean": 15790.9, + "valid_targets_min": 551 + }, + { + "epoch": 0.300240192153723, + "grad_norm": 0.4927279040965231, + "learning_rate": 0.0001488646224858512, + "loss": 0.6845, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7084103226661682, + "step": 1125, + "valid_targets_mean": 16181.6, + "valid_targets_min": 477 + }, + { + "epoch": 0.30157459300773953, + "grad_norm": 0.4612855821814559, + "learning_rate": 0.00014883414129294575, + "loss": 0.6882, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.674759030342102, + "step": 1130, + "valid_targets_mean": 16895.6, + "valid_targets_min": 204 + }, + { + "epoch": 0.30290899386175607, + "grad_norm": 0.46765724289815713, + "learning_rate": 0.00014880325954549635, + "loss": 0.6723, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6812288761138916, + "step": 1135, + "valid_targets_mean": 16409.4, + "valid_targets_min": 538 + }, + { + "epoch": 0.3042433947157726, + "grad_norm": 0.4824982006416931, + "learning_rate": 0.00014877197741103827, + "loss": 0.6794, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6763830184936523, + "step": 1140, + "valid_targets_mean": 16869.7, + "valid_targets_min": 16 + }, + { + "epoch": 0.30557779556978915, + "grad_norm": 0.6549002835261453, + "learning_rate": 0.00014874029505927897, + "loss": 0.6922, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6630896925926208, + "step": 1145, + "valid_targets_mean": 15811.5, + "valid_targets_min": 441 + }, + { + "epoch": 0.30691219642380574, + "grad_norm": 0.4184651103712921, + "learning_rate": 0.00014870821266209705, + "loss": 0.7049, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7090791463851929, + "step": 1150, + "valid_targets_mean": 16379.1, + "valid_targets_min": 337 + }, + { + "epoch": 0.3082465972778223, + "grad_norm": 0.5759381108213268, + "learning_rate": 0.00014867573039354138, + "loss": 0.7001, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6881549954414368, + "step": 1155, + "valid_targets_mean": 16831.0, + "valid_targets_min": 602 + }, + { + "epoch": 0.3095809981318388, + "grad_norm": 0.8376894365561316, + "learning_rate": 0.00014864284842983018, + "loss": 0.7009, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6884739398956299, + "step": 1160, + "valid_targets_mean": 17503.7, + "valid_targets_min": 769 + }, + { + "epoch": 0.31091539898585535, + "grad_norm": 0.616307622715748, + "learning_rate": 0.00014860956694935003, + "loss": 0.6803, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.657461941242218, + "step": 1165, + "valid_targets_mean": 15582.3, + "valid_targets_min": 529 + }, + { + "epoch": 0.3122497998398719, + "grad_norm": 0.6537720899572182, + "learning_rate": 0.0001485758861326549, + "loss": 0.6737, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6778349876403809, + "step": 1170, + "valid_targets_mean": 15389.1, + "valid_targets_min": 209 + }, + { + "epoch": 0.3135842006938884, + "grad_norm": 0.5118272518220445, + "learning_rate": 0.00014854180616246523, + "loss": 0.6764, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6655255556106567, + "step": 1175, + "valid_targets_mean": 14757.1, + "valid_targets_min": 695 + }, + { + "epoch": 0.31491860154790496, + "grad_norm": 0.5785910239800395, + "learning_rate": 0.00014850732722366682, + "loss": 0.6993, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6939231753349304, + "step": 1180, + "valid_targets_mean": 16032.9, + "valid_targets_min": 497 + }, + { + "epoch": 0.31625300240192156, + "grad_norm": 0.6962605965216837, + "learning_rate": 0.00014847244950330998, + "loss": 0.6919, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.672405481338501, + "step": 1185, + "valid_targets_mean": 15897.4, + "valid_targets_min": 658 + }, + { + "epoch": 0.3175874032559381, + "grad_norm": 0.7289269797910964, + "learning_rate": 0.00014843717319060833, + "loss": 0.697, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6860827207565308, + "step": 1190, + "valid_targets_mean": 15977.2, + "valid_targets_min": 591 + }, + { + "epoch": 0.31892180410995463, + "grad_norm": 0.6757648389736319, + "learning_rate": 0.00014840149847693794, + "loss": 0.6903, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6953767538070679, + "step": 1195, + "valid_targets_mean": 16016.2, + "valid_targets_min": 363 + }, + { + "epoch": 0.32025620496397117, + "grad_norm": 0.8798593401470403, + "learning_rate": 0.00014836542555583628, + "loss": 0.6804, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6733475923538208, + "step": 1200, + "valid_targets_mean": 15802.3, + "valid_targets_min": 677 + }, + { + "epoch": 0.3215906058179877, + "grad_norm": 0.5337148157641388, + "learning_rate": 0.000148328954623001, + "loss": 0.6931, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6732375621795654, + "step": 1205, + "valid_targets_mean": 16520.0, + "valid_targets_min": 541 + }, + { + "epoch": 0.32292500667200424, + "grad_norm": 0.46270985298339473, + "learning_rate": 0.00014829208587628908, + "loss": 0.6782, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6778278350830078, + "step": 1210, + "valid_targets_mean": 15218.8, + "valid_targets_min": 410 + }, + { + "epoch": 0.32425940752602084, + "grad_norm": 0.34954154788174924, + "learning_rate": 0.0001482548195157156, + "loss": 0.6792, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7126316428184509, + "step": 1215, + "valid_targets_mean": 14662.9, + "valid_targets_min": 494 + }, + { + "epoch": 0.3255938083800374, + "grad_norm": 0.5194846979114964, + "learning_rate": 0.00014821715574345277, + "loss": 0.6724, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6763893961906433, + "step": 1220, + "valid_targets_mean": 16349.8, + "valid_targets_min": 513 + }, + { + "epoch": 0.3269282092340539, + "grad_norm": 0.7093759511996763, + "learning_rate": 0.0001481790947638288, + "loss": 0.6786, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7101802825927734, + "step": 1225, + "valid_targets_mean": 15322.1, + "valid_targets_min": 693 + }, + { + "epoch": 0.32826261008807045, + "grad_norm": 0.5192161153871548, + "learning_rate": 0.00014814063678332667, + "loss": 0.6756, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6686065793037415, + "step": 1230, + "valid_targets_mean": 16233.2, + "valid_targets_min": 272 + }, + { + "epoch": 0.329597010942087, + "grad_norm": 0.5106099067287116, + "learning_rate": 0.00014810178201058323, + "loss": 0.6734, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6661728620529175, + "step": 1235, + "valid_targets_mean": 15632.0, + "valid_targets_min": 780 + }, + { + "epoch": 0.3309314117961035, + "grad_norm": 0.4881815060864999, + "learning_rate": 0.00014806253065638786, + "loss": 0.674, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6498801112174988, + "step": 1240, + "valid_targets_mean": 17617.5, + "valid_targets_min": 428 + }, + { + "epoch": 0.3322658126501201, + "grad_norm": 0.39268738643883516, + "learning_rate": 0.00014802288293368148, + "loss": 0.6727, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6666196584701538, + "step": 1245, + "valid_targets_mean": 16153.7, + "valid_targets_min": 637 + }, + { + "epoch": 0.33360021350413666, + "grad_norm": 0.45417304392434, + "learning_rate": 0.0001479828390575553, + "loss": 0.6853, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6876928210258484, + "step": 1250, + "valid_targets_mean": 15841.5, + "valid_targets_min": 632 + }, + { + "epoch": 0.3349346143581532, + "grad_norm": 0.5268128840871439, + "learning_rate": 0.00014794239924524968, + "loss": 0.6826, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6616125106811523, + "step": 1255, + "valid_targets_mean": 16973.3, + "valid_targets_min": 465 + }, + { + "epoch": 0.33626901521216973, + "grad_norm": 0.39958555391425904, + "learning_rate": 0.00014790156371615303, + "loss": 0.6851, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6925134062767029, + "step": 1260, + "valid_targets_mean": 16514.4, + "valid_targets_min": 289 + }, + { + "epoch": 0.33760341606618627, + "grad_norm": 0.5516259004118991, + "learning_rate": 0.00014786033269180044, + "loss": 0.6656, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.663733959197998, + "step": 1265, + "valid_targets_mean": 16839.6, + "valid_targets_min": 320 + }, + { + "epoch": 0.3389378169202028, + "grad_norm": 0.5390064885544619, + "learning_rate": 0.00014781870639587262, + "loss": 0.688, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6990649700164795, + "step": 1270, + "valid_targets_mean": 15894.0, + "valid_targets_min": 315 + }, + { + "epoch": 0.3402722177742194, + "grad_norm": 0.5509217844316656, + "learning_rate": 0.0001477766850541947, + "loss": 0.703, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6773085594177246, + "step": 1275, + "valid_targets_mean": 17158.7, + "valid_targets_min": 452 + }, + { + "epoch": 0.34160661862823594, + "grad_norm": 0.4521786173995471, + "learning_rate": 0.00014773426889473493, + "loss": 0.6944, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6869018077850342, + "step": 1280, + "valid_targets_mean": 15783.5, + "valid_targets_min": 352 + }, + { + "epoch": 0.3429410194822525, + "grad_norm": 0.45400640165875983, + "learning_rate": 0.0001476914581476034, + "loss": 0.7053, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6948401927947998, + "step": 1285, + "valid_targets_mean": 16444.6, + "valid_targets_min": 539 + }, + { + "epoch": 0.344275420336269, + "grad_norm": 0.362088704550205, + "learning_rate": 0.000147648253045051, + "loss": 0.6806, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6431831121444702, + "step": 1290, + "valid_targets_mean": 16384.6, + "valid_targets_min": 797 + }, + { + "epoch": 0.34560982119028555, + "grad_norm": 0.48893960485771915, + "learning_rate": 0.0001476046538214679, + "loss": 0.6874, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7072966694831848, + "step": 1295, + "valid_targets_mean": 14666.8, + "valid_targets_min": 152 + }, + { + "epoch": 0.3469442220443021, + "grad_norm": 0.41898598637304735, + "learning_rate": 0.00014756066071338247, + "loss": 0.7022, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7229539155960083, + "step": 1300, + "valid_targets_mean": 15230.1, + "valid_targets_min": 707 + }, + { + "epoch": 0.3482786228983187, + "grad_norm": 0.3188940756358046, + "learning_rate": 0.00014751627395945984, + "loss": 0.6833, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6817530393600464, + "step": 1305, + "valid_targets_mean": 16233.5, + "valid_targets_min": 329 + }, + { + "epoch": 0.3496130237523352, + "grad_norm": 0.4933450593141746, + "learning_rate": 0.0001474714938005008, + "loss": 0.6801, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7076213359832764, + "step": 1310, + "valid_targets_mean": 15680.3, + "valid_targets_min": 603 + }, + { + "epoch": 0.35094742460635175, + "grad_norm": 0.7583732357714017, + "learning_rate": 0.00014742632047944033, + "loss": 0.7026, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7003888487815857, + "step": 1315, + "valid_targets_mean": 15842.3, + "valid_targets_min": 705 + }, + { + "epoch": 0.3522818254603683, + "grad_norm": 0.5317718895846837, + "learning_rate": 0.00014738075424134634, + "loss": 0.6867, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.691694438457489, + "step": 1320, + "valid_targets_mean": 15884.4, + "valid_targets_min": 704 + }, + { + "epoch": 0.35361622631438483, + "grad_norm": 0.3501119585201358, + "learning_rate": 0.00014733479533341837, + "loss": 0.6798, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6872516870498657, + "step": 1325, + "valid_targets_mean": 15958.3, + "valid_targets_min": 372 + }, + { + "epoch": 0.35495062716840137, + "grad_norm": 1.00059795566324, + "learning_rate": 0.00014728844400498616, + "loss": 0.6892, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6725267767906189, + "step": 1330, + "valid_targets_mean": 17093.4, + "valid_targets_min": 768 + }, + { + "epoch": 0.35628502802241796, + "grad_norm": 0.48989419606651297, + "learning_rate": 0.00014724170050750836, + "loss": 0.6817, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6638458967208862, + "step": 1335, + "valid_targets_mean": 16706.3, + "valid_targets_min": 477 + }, + { + "epoch": 0.3576194288764345, + "grad_norm": 0.7494594095135862, + "learning_rate": 0.00014719456509457122, + "loss": 0.6923, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6833698749542236, + "step": 1340, + "valid_targets_mean": 15229.3, + "valid_targets_min": 565 + }, + { + "epoch": 0.35895382973045104, + "grad_norm": 0.37983172533408244, + "learning_rate": 0.00014714703802188713, + "loss": 0.6856, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6993082165718079, + "step": 1345, + "valid_targets_mean": 16149.0, + "valid_targets_min": 650 + }, + { + "epoch": 0.3602882305844676, + "grad_norm": 0.3465469659019351, + "learning_rate": 0.0001470991195472932, + "loss": 0.6926, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6387639045715332, + "step": 1350, + "valid_targets_mean": 17439.2, + "valid_targets_min": 264 + }, + { + "epoch": 0.3616226314384841, + "grad_norm": 0.5631916032503279, + "learning_rate": 0.00014705080993075, + "loss": 0.6797, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6804531812667847, + "step": 1355, + "valid_targets_mean": 16052.1, + "valid_targets_min": 602 + }, + { + "epoch": 0.36295703229250065, + "grad_norm": 0.37277054991570224, + "learning_rate": 0.00014700210943433998, + "loss": 0.6887, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6752945184707642, + "step": 1360, + "valid_targets_mean": 16611.9, + "valid_targets_min": 441 + }, + { + "epoch": 0.36429143314651724, + "grad_norm": 0.3293587026381126, + "learning_rate": 0.00014695301832226627, + "loss": 0.6946, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.674695611000061, + "step": 1365, + "valid_targets_mean": 15535.9, + "valid_targets_min": 382 + }, + { + "epoch": 0.3656258340005338, + "grad_norm": 0.4365531221583474, + "learning_rate": 0.00014690353686085098, + "loss": 0.6784, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6803010702133179, + "step": 1370, + "valid_targets_mean": 15812.1, + "valid_targets_min": 197 + }, + { + "epoch": 0.3669602348545503, + "grad_norm": 0.7908663899399473, + "learning_rate": 0.00014685366531853395, + "loss": 0.6851, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6726727485656738, + "step": 1375, + "valid_targets_mean": 15403.2, + "valid_targets_min": 677 + }, + { + "epoch": 0.36829463570856685, + "grad_norm": 1.3815189102486642, + "learning_rate": 0.00014680340396587118, + "loss": 0.6846, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7047728300094604, + "step": 1380, + "valid_targets_mean": 15841.1, + "valid_targets_min": 567 + }, + { + "epoch": 0.3696290365625834, + "grad_norm": 0.40461431595371766, + "learning_rate": 0.0001467527530755335, + "loss": 0.6702, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6716399192810059, + "step": 1385, + "valid_targets_mean": 16679.5, + "valid_targets_min": 362 + }, + { + "epoch": 0.37096343741659993, + "grad_norm": 0.4068160169676624, + "learning_rate": 0.000146701712922305, + "loss": 0.6769, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.665133535861969, + "step": 1390, + "valid_targets_mean": 16473.8, + "valid_targets_min": 716 + }, + { + "epoch": 0.37229783827061647, + "grad_norm": 0.3550489059286771, + "learning_rate": 0.00014665028378308138, + "loss": 0.6821, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.682301938533783, + "step": 1395, + "valid_targets_mean": 15832.7, + "valid_targets_min": 590 + }, + { + "epoch": 0.37363223912463306, + "grad_norm": 0.4178343093762636, + "learning_rate": 0.00014659846593686885, + "loss": 0.6841, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6964566707611084, + "step": 1400, + "valid_targets_mean": 15847.7, + "valid_targets_min": 470 + }, + { + "epoch": 0.3749666399786496, + "grad_norm": 0.401979565184018, + "learning_rate": 0.0001465462596647822, + "loss": 0.6889, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.677052915096283, + "step": 1405, + "valid_targets_mean": 15447.2, + "valid_targets_min": 785 + }, + { + "epoch": 0.37630104083266613, + "grad_norm": 0.5448181658750829, + "learning_rate": 0.0001464936652500435, + "loss": 0.6584, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6615155339241028, + "step": 1410, + "valid_targets_mean": 16624.9, + "valid_targets_min": 658 + }, + { + "epoch": 0.37763544168668267, + "grad_norm": 0.5579138632655442, + "learning_rate": 0.0001464406829779806, + "loss": 0.6749, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.674919843673706, + "step": 1415, + "valid_targets_mean": 15348.1, + "valid_targets_min": 704 + }, + { + "epoch": 0.3789698425406992, + "grad_norm": 0.39013043281827303, + "learning_rate": 0.0001463873131360254, + "loss": 0.6687, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6693284511566162, + "step": 1420, + "valid_targets_mean": 16909.7, + "valid_targets_min": 660 + }, + { + "epoch": 0.38030424339471575, + "grad_norm": 0.5011272124507244, + "learning_rate": 0.0001463335560137124, + "loss": 0.6747, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6802507042884827, + "step": 1425, + "valid_targets_mean": 16083.5, + "valid_targets_min": 425 + }, + { + "epoch": 0.38163864424873234, + "grad_norm": 0.5017249688669775, + "learning_rate": 0.00014627941190267717, + "loss": 0.6746, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.670562744140625, + "step": 1430, + "valid_targets_mean": 16523.4, + "valid_targets_min": 744 + }, + { + "epoch": 0.3829730451027489, + "grad_norm": 0.4734565806098903, + "learning_rate": 0.00014622488109665468, + "loss": 0.6876, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6966683864593506, + "step": 1435, + "valid_targets_mean": 16505.3, + "valid_targets_min": 559 + }, + { + "epoch": 0.3843074459567654, + "grad_norm": 0.6108752114255883, + "learning_rate": 0.0001461699638914777, + "loss": 0.6794, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6841604709625244, + "step": 1440, + "valid_targets_mean": 15593.2, + "valid_targets_min": 529 + }, + { + "epoch": 0.38564184681078195, + "grad_norm": 0.6424892327231314, + "learning_rate": 0.00014611466058507536, + "loss": 0.674, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6654868125915527, + "step": 1445, + "valid_targets_mean": 15160.8, + "valid_targets_min": 468 + }, + { + "epoch": 0.3869762476647985, + "grad_norm": 0.9055516118079188, + "learning_rate": 0.00014605897147747132, + "loss": 0.6856, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6786572933197021, + "step": 1450, + "valid_targets_mean": 15595.1, + "valid_targets_min": 703 + }, + { + "epoch": 0.388310648518815, + "grad_norm": 0.8543812922261468, + "learning_rate": 0.0001460028968707822, + "loss": 0.6903, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7012844681739807, + "step": 1455, + "valid_targets_mean": 14374.6, + "valid_targets_min": 518 + }, + { + "epoch": 0.3896450493728316, + "grad_norm": 0.8972686658958234, + "learning_rate": 0.0001459464370692161, + "loss": 0.676, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.676931619644165, + "step": 1460, + "valid_targets_mean": 16331.3, + "valid_targets_min": 490 + }, + { + "epoch": 0.39097945022684816, + "grad_norm": 0.7135716327186163, + "learning_rate": 0.0001458895923790707, + "loss": 0.6781, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7019766569137573, + "step": 1465, + "valid_targets_mean": 15569.0, + "valid_targets_min": 520 + }, + { + "epoch": 0.3923138510808647, + "grad_norm": 0.6691202341390122, + "learning_rate": 0.0001458323631087318, + "loss": 0.6753, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6568318009376526, + "step": 1470, + "valid_targets_mean": 16415.5, + "valid_targets_min": 501 + }, + { + "epoch": 0.39364825193488123, + "grad_norm": 0.7612668292031027, + "learning_rate": 0.00014577474956867155, + "loss": 0.6575, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6636608839035034, + "step": 1475, + "valid_targets_mean": 15385.0, + "valid_targets_min": 492 + }, + { + "epoch": 0.39498265278889777, + "grad_norm": 0.6687924429811246, + "learning_rate": 0.00014571675207144676, + "loss": 0.6844, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6870772838592529, + "step": 1480, + "valid_targets_mean": 14585.1, + "valid_targets_min": 676 + }, + { + "epoch": 0.3963170536429143, + "grad_norm": 0.7648107865260791, + "learning_rate": 0.00014565837093169728, + "loss": 0.6888, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6783605813980103, + "step": 1485, + "valid_targets_mean": 16069.2, + "valid_targets_min": 490 + }, + { + "epoch": 0.3976514544969309, + "grad_norm": 0.7509803855864979, + "learning_rate": 0.00014559960646614418, + "loss": 0.6885, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.670478343963623, + "step": 1490, + "valid_targets_mean": 15756.6, + "valid_targets_min": 645 + }, + { + "epoch": 0.39898585535094744, + "grad_norm": 0.5057989841414792, + "learning_rate": 0.00014554045899358814, + "loss": 0.6761, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6895899772644043, + "step": 1495, + "valid_targets_mean": 16583.3, + "valid_targets_min": 696 + }, + { + "epoch": 0.400320256204964, + "grad_norm": 0.7744390589162883, + "learning_rate": 0.00014548092883490772, + "loss": 0.6789, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7109715938568115, + "step": 1500, + "valid_targets_mean": 16087.1, + "valid_targets_min": 352 + }, + { + "epoch": 0.4016546570589805, + "grad_norm": 0.5876072256129112, + "learning_rate": 0.00014542101631305745, + "loss": 0.691, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.69822758436203, + "step": 1505, + "valid_targets_mean": 14998.5, + "valid_targets_min": 520 + }, + { + "epoch": 0.40298905791299705, + "grad_norm": 0.6284258613098378, + "learning_rate": 0.00014536072175306628, + "loss": 0.6722, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6593598127365112, + "step": 1510, + "valid_targets_mean": 15673.6, + "valid_targets_min": 321 + }, + { + "epoch": 0.4043234587670136, + "grad_norm": 0.514432212840916, + "learning_rate": 0.00014530004548203573, + "loss": 0.6638, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6542955040931702, + "step": 1515, + "valid_targets_mean": 15986.3, + "valid_targets_min": 487 + }, + { + "epoch": 0.4056578596210302, + "grad_norm": 0.5934282118071859, + "learning_rate": 0.00014523898782913818, + "loss": 0.6935, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6390407681465149, + "step": 1520, + "valid_targets_mean": 17350.2, + "valid_targets_min": 253 + }, + { + "epoch": 0.4069922604750467, + "grad_norm": 0.4228690202369281, + "learning_rate": 0.00014517754912561496, + "loss": 0.679, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6939337849617004, + "step": 1525, + "valid_targets_mean": 16316.9, + "valid_targets_min": 395 + }, + { + "epoch": 0.40832666132906326, + "grad_norm": 0.33703841726812556, + "learning_rate": 0.00014511572970477457, + "loss": 0.6636, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6497060060501099, + "step": 1530, + "valid_targets_mean": 16643.3, + "valid_targets_min": 484 + }, + { + "epoch": 0.4096610621830798, + "grad_norm": 0.526601768832117, + "learning_rate": 0.00014505352990199107, + "loss": 0.6777, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6721259355545044, + "step": 1535, + "valid_targets_mean": 16599.3, + "valid_targets_min": 562 + }, + { + "epoch": 0.41099546303709633, + "grad_norm": 0.3717319051316816, + "learning_rate": 0.000144990950054702, + "loss": 0.675, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6512713432312012, + "step": 1540, + "valid_targets_mean": 15734.2, + "valid_targets_min": 379 + }, + { + "epoch": 0.41232986389111287, + "grad_norm": 0.3985153443670721, + "learning_rate": 0.0001449279905024067, + "loss": 0.6802, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.680419921875, + "step": 1545, + "valid_targets_mean": 17000.0, + "valid_targets_min": 426 + }, + { + "epoch": 0.41366426474512946, + "grad_norm": 0.5620426536574632, + "learning_rate": 0.00014486465158666443, + "loss": 0.6786, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6959854364395142, + "step": 1550, + "valid_targets_mean": 15257.2, + "valid_targets_min": 462 + }, + { + "epoch": 0.414998665599146, + "grad_norm": 0.5016374460094373, + "learning_rate": 0.00014480093365109252, + "loss": 0.6965, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.681014895439148, + "step": 1555, + "valid_targets_mean": 16161.4, + "valid_targets_min": 82 + }, + { + "epoch": 0.41633306645316254, + "grad_norm": 0.45848828762812643, + "learning_rate": 0.00014473683704136454, + "loss": 0.6732, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6678402423858643, + "step": 1560, + "valid_targets_mean": 15469.2, + "valid_targets_min": 516 + }, + { + "epoch": 0.4176674673071791, + "grad_norm": 0.4510235067643482, + "learning_rate": 0.0001446723621052083, + "loss": 0.6729, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6836432218551636, + "step": 1565, + "valid_targets_mean": 15537.9, + "valid_targets_min": 792 + }, + { + "epoch": 0.4190018681611956, + "grad_norm": 0.2749325178114193, + "learning_rate": 0.00014460750919240416, + "loss": 0.661, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6491097211837769, + "step": 1570, + "valid_targets_mean": 16182.7, + "valid_targets_min": 122 + }, + { + "epoch": 0.42033626901521215, + "grad_norm": 0.4048570514955066, + "learning_rate": 0.00014454227865478292, + "loss": 0.6766, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6953452229499817, + "step": 1575, + "valid_targets_mean": 15749.0, + "valid_targets_min": 589 + }, + { + "epoch": 0.42167066986922874, + "grad_norm": 0.43507105267463514, + "learning_rate": 0.0001444766708462241, + "loss": 0.6901, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6905909776687622, + "step": 1580, + "valid_targets_mean": 15047.8, + "valid_targets_min": 311 + }, + { + "epoch": 0.4230050707232453, + "grad_norm": 0.4023428012328776, + "learning_rate": 0.0001444106861226539, + "loss": 0.6758, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6905125379562378, + "step": 1585, + "valid_targets_mean": 16260.8, + "valid_targets_min": 577 + }, + { + "epoch": 0.4243394715772618, + "grad_norm": 0.32040888502490367, + "learning_rate": 0.00014434432484204335, + "loss": 0.669, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6988633275032043, + "step": 1590, + "valid_targets_mean": 15973.1, + "valid_targets_min": 675 + }, + { + "epoch": 0.42567387243127836, + "grad_norm": 0.36245431872562145, + "learning_rate": 0.0001442775873644062, + "loss": 0.673, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6784532070159912, + "step": 1595, + "valid_targets_mean": 16945.1, + "valid_targets_min": 285 + }, + { + "epoch": 0.4270082732852949, + "grad_norm": 0.7427033015141541, + "learning_rate": 0.00014421047405179725, + "loss": 0.6803, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6956072449684143, + "step": 1600, + "valid_targets_mean": 16470.8, + "valid_targets_min": 118 + }, + { + "epoch": 0.42834267413931143, + "grad_norm": 0.693817834423677, + "learning_rate": 0.00014414298526831012, + "loss": 0.6798, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6564275622367859, + "step": 1605, + "valid_targets_mean": 16161.4, + "valid_targets_min": 515 + }, + { + "epoch": 0.429677074993328, + "grad_norm": 0.5459010546987341, + "learning_rate": 0.00014407512138007547, + "loss": 0.6844, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.674811065196991, + "step": 1610, + "valid_targets_mean": 15652.2, + "valid_targets_min": 475 + }, + { + "epoch": 0.43101147584734456, + "grad_norm": 0.5203042449073534, + "learning_rate": 0.0001440068827552588, + "loss": 0.6608, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6763057708740234, + "step": 1615, + "valid_targets_mean": 15514.4, + "valid_targets_min": 482 + }, + { + "epoch": 0.4323458767013611, + "grad_norm": 0.5675075818567459, + "learning_rate": 0.0001439382697640587, + "loss": 0.6947, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6874855160713196, + "step": 1620, + "valid_targets_mean": 15263.9, + "valid_targets_min": 722 + }, + { + "epoch": 0.43368027755537764, + "grad_norm": 0.5359889737901847, + "learning_rate": 0.00014386928277870461, + "loss": 0.656, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.669428825378418, + "step": 1625, + "valid_targets_mean": 16017.4, + "valid_targets_min": 632 + }, + { + "epoch": 0.4350146784093942, + "grad_norm": 0.5408636943550875, + "learning_rate": 0.00014379992217345504, + "loss": 0.6933, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.659244954586029, + "step": 1630, + "valid_targets_mean": 15961.6, + "valid_targets_min": 616 + }, + { + "epoch": 0.4363490792634107, + "grad_norm": 0.37778085390205296, + "learning_rate": 0.0001437301883245953, + "loss": 0.6755, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6465282440185547, + "step": 1635, + "valid_targets_mean": 16366.9, + "valid_targets_min": 70 + }, + { + "epoch": 0.43768348011742725, + "grad_norm": 0.6428136358402293, + "learning_rate": 0.0001436600816104356, + "loss": 0.6701, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6930896639823914, + "step": 1640, + "valid_targets_mean": 16816.4, + "valid_targets_min": 798 + }, + { + "epoch": 0.43901788097144384, + "grad_norm": 0.485887803251701, + "learning_rate": 0.000143589602411309, + "loss": 0.6714, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6707935929298401, + "step": 1645, + "valid_targets_mean": 15216.7, + "valid_targets_min": 496 + }, + { + "epoch": 0.4403522818254604, + "grad_norm": 0.3717825278137594, + "learning_rate": 0.00014351875110956927, + "loss": 0.6682, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7038379907608032, + "step": 1650, + "valid_targets_mean": 15937.6, + "valid_targets_min": 381 + }, + { + "epoch": 0.4416866826794769, + "grad_norm": 0.4670503910336374, + "learning_rate": 0.00014344752808958887, + "loss": 0.6872, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7037096619606018, + "step": 1655, + "valid_targets_mean": 15996.4, + "valid_targets_min": 715 + }, + { + "epoch": 0.44302108353349345, + "grad_norm": 0.5130492428941893, + "learning_rate": 0.0001433759337377569, + "loss": 0.669, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6803580522537231, + "step": 1660, + "valid_targets_mean": 15066.6, + "valid_targets_min": 436 + }, + { + "epoch": 0.44435548438751, + "grad_norm": 0.42492544340198113, + "learning_rate": 0.00014330396844247685, + "loss": 0.6658, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6324959993362427, + "step": 1665, + "valid_targets_mean": 17875.3, + "valid_targets_min": 415 + }, + { + "epoch": 0.44568988524152653, + "grad_norm": 0.48243381726484286, + "learning_rate": 0.0001432316325941647, + "loss": 0.6726, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6762223243713379, + "step": 1670, + "valid_targets_mean": 15398.0, + "valid_targets_min": 514 + }, + { + "epoch": 0.4470242860955431, + "grad_norm": 0.4262271531125559, + "learning_rate": 0.00014315892658524665, + "loss": 0.6806, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6871470808982849, + "step": 1675, + "valid_targets_mean": 15288.2, + "valid_targets_min": 139 + }, + { + "epoch": 0.44835868694955966, + "grad_norm": 0.4564467834328404, + "learning_rate": 0.0001430858508101571, + "loss": 0.6527, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6515965461730957, + "step": 1680, + "valid_targets_mean": 16011.1, + "valid_targets_min": 482 + }, + { + "epoch": 0.4496930878035762, + "grad_norm": 0.3155919440895114, + "learning_rate": 0.00014301240566533637, + "loss": 0.6911, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6801489591598511, + "step": 1685, + "valid_targets_mean": 16203.3, + "valid_targets_min": 590 + }, + { + "epoch": 0.45102748865759273, + "grad_norm": 0.39341185029050857, + "learning_rate": 0.00014293859154922866, + "loss": 0.6644, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6648285388946533, + "step": 1690, + "valid_targets_mean": 15043.1, + "valid_targets_min": 335 + }, + { + "epoch": 0.45236188951160927, + "grad_norm": 0.5458457405844297, + "learning_rate": 0.00014286440886227995, + "loss": 0.6786, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7056168913841248, + "step": 1695, + "valid_targets_mean": 15284.2, + "valid_targets_min": 389 + }, + { + "epoch": 0.4536962903656258, + "grad_norm": 0.5395188248855505, + "learning_rate": 0.00014278985800693562, + "loss": 0.6921, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6924360990524292, + "step": 1700, + "valid_targets_mean": 16265.5, + "valid_targets_min": 695 + }, + { + "epoch": 0.4550306912196424, + "grad_norm": 0.5110930142156801, + "learning_rate": 0.0001427149393876384, + "loss": 0.6653, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6504957675933838, + "step": 1705, + "valid_targets_mean": 15499.0, + "valid_targets_min": 465 + }, + { + "epoch": 0.45636509207365894, + "grad_norm": 0.38747352375826066, + "learning_rate": 0.00014263965341082622, + "loss": 0.6748, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6646894812583923, + "step": 1710, + "valid_targets_mean": 16010.1, + "valid_targets_min": 778 + }, + { + "epoch": 0.4576994929276755, + "grad_norm": 0.4157399117530123, + "learning_rate": 0.00014256400048492994, + "loss": 0.6913, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.696425199508667, + "step": 1715, + "valid_targets_mean": 16692.4, + "valid_targets_min": 424 + }, + { + "epoch": 0.459033893781692, + "grad_norm": 0.40234560772772643, + "learning_rate": 0.00014248798102037106, + "loss": 0.652, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6323100924491882, + "step": 1720, + "valid_targets_mean": 16598.7, + "valid_targets_min": 506 + }, + { + "epoch": 0.46036829463570855, + "grad_norm": 0.4105686175825738, + "learning_rate": 0.0001424115954295597, + "loss": 0.6779, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6720783710479736, + "step": 1725, + "valid_targets_mean": 15398.2, + "valid_targets_min": 546 + }, + { + "epoch": 0.4617026954897251, + "grad_norm": 0.5288517622927207, + "learning_rate": 0.00014233484412689212, + "loss": 0.6751, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7059606909751892, + "step": 1730, + "valid_targets_mean": 14793.6, + "valid_targets_min": 512 + }, + { + "epoch": 0.4630370963437417, + "grad_norm": 0.4151350926192914, + "learning_rate": 0.00014225772752874866, + "loss": 0.6628, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6483746767044067, + "step": 1735, + "valid_targets_mean": 16105.2, + "valid_targets_min": 520 + }, + { + "epoch": 0.4643714971977582, + "grad_norm": 0.6172763590468829, + "learning_rate": 0.00014218024605349133, + "loss": 0.6557, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6697094440460205, + "step": 1740, + "valid_targets_mean": 16343.8, + "valid_targets_min": 346 + }, + { + "epoch": 0.46570589805177476, + "grad_norm": 0.4928889614387702, + "learning_rate": 0.00014210240012146178, + "loss": 0.6684, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6752841472625732, + "step": 1745, + "valid_targets_mean": 16355.5, + "valid_targets_min": 7 + }, + { + "epoch": 0.4670402989057913, + "grad_norm": 0.5095363864894301, + "learning_rate": 0.00014202419015497863, + "loss": 0.6772, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6391301155090332, + "step": 1750, + "valid_targets_mean": 14801.8, + "valid_targets_min": 595 + }, + { + "epoch": 0.46837469975980783, + "grad_norm": 0.40201996373625287, + "learning_rate": 0.00014194561657833563, + "loss": 0.6738, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.663654625415802, + "step": 1755, + "valid_targets_mean": 15804.3, + "valid_targets_min": 678 + }, + { + "epoch": 0.46970910061382437, + "grad_norm": 0.3900175407918852, + "learning_rate": 0.000141866679817799, + "loss": 0.6652, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6548658609390259, + "step": 1760, + "valid_targets_mean": 16266.0, + "valid_targets_min": 301 + }, + { + "epoch": 0.47104350146784096, + "grad_norm": 0.6979606870040465, + "learning_rate": 0.00014178738030160527, + "loss": 0.6765, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7068432569503784, + "step": 1765, + "valid_targets_mean": 15426.0, + "valid_targets_min": 497 + }, + { + "epoch": 0.4723779023218575, + "grad_norm": 0.43383345904843723, + "learning_rate": 0.000141707718459959, + "loss": 0.6717, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6808011531829834, + "step": 1770, + "valid_targets_mean": 16582.9, + "valid_targets_min": 639 + }, + { + "epoch": 0.47371230317587404, + "grad_norm": 0.45845628788358933, + "learning_rate": 0.00014162769472503032, + "loss": 0.6519, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6384435892105103, + "step": 1775, + "valid_targets_mean": 16704.6, + "valid_targets_min": 470 + }, + { + "epoch": 0.4750467040298906, + "grad_norm": 0.3777800679246702, + "learning_rate": 0.00014154730953095274, + "loss": 0.6537, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6459342241287231, + "step": 1780, + "valid_targets_mean": 16872.8, + "valid_targets_min": 451 + }, + { + "epoch": 0.4763811048839071, + "grad_norm": 0.4286481570503636, + "learning_rate": 0.0001414665633138206, + "loss": 0.6809, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6782388687133789, + "step": 1785, + "valid_targets_mean": 16174.8, + "valid_targets_min": 536 + }, + { + "epoch": 0.47771550573792365, + "grad_norm": 0.4005345889086281, + "learning_rate": 0.00014138545651168683, + "loss": 0.6836, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6628920435905457, + "step": 1790, + "valid_targets_mean": 16390.7, + "valid_targets_min": 16 + }, + { + "epoch": 0.47904990659194024, + "grad_norm": 0.4115589182888216, + "learning_rate": 0.00014130398956456062, + "loss": 0.6641, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6702592968940735, + "step": 1795, + "valid_targets_mean": 16677.2, + "valid_targets_min": 614 + }, + { + "epoch": 0.4803843074459568, + "grad_norm": 0.5386199146943589, + "learning_rate": 0.00014122216291440496, + "loss": 0.6713, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6504049301147461, + "step": 1800, + "valid_targets_mean": 16834.6, + "valid_targets_min": 631 + }, + { + "epoch": 0.4817187082999733, + "grad_norm": 0.43594882378266525, + "learning_rate": 0.00014113997700513422, + "loss": 0.6783, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6663535237312317, + "step": 1805, + "valid_targets_mean": 16627.7, + "valid_targets_min": 390 + }, + { + "epoch": 0.48305310915398986, + "grad_norm": 0.36323537758193364, + "learning_rate": 0.00014105743228261174, + "loss": 0.6494, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6430245637893677, + "step": 1810, + "valid_targets_mean": 15963.8, + "valid_targets_min": 10 + }, + { + "epoch": 0.4843875100080064, + "grad_norm": 0.4816559868698329, + "learning_rate": 0.00014097452919464748, + "loss": 0.6816, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6982545852661133, + "step": 1815, + "valid_targets_mean": 15820.7, + "valid_targets_min": 787 + }, + { + "epoch": 0.48572191086202293, + "grad_norm": 0.637279774432971, + "learning_rate": 0.00014089126819099557, + "loss": 0.66, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6218864917755127, + "step": 1820, + "valid_targets_mean": 15937.6, + "valid_targets_min": 72 + }, + { + "epoch": 0.4870563117160395, + "grad_norm": 0.46051330636380267, + "learning_rate": 0.00014080764972335184, + "loss": 0.6817, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7032638788223267, + "step": 1825, + "valid_targets_mean": 16084.2, + "valid_targets_min": 298 + }, + { + "epoch": 0.48839071257005606, + "grad_norm": 0.4185133479284188, + "learning_rate": 0.00014072367424535135, + "loss": 0.6693, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.661512553691864, + "step": 1830, + "valid_targets_mean": 14985.0, + "valid_targets_min": 703 + }, + { + "epoch": 0.4897251134240726, + "grad_norm": 0.5342467862945137, + "learning_rate": 0.000140639342212566, + "loss": 0.6695, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6464630961418152, + "step": 1835, + "valid_targets_mean": 17390.7, + "valid_targets_min": 577 + }, + { + "epoch": 0.49105951427808914, + "grad_norm": 0.6111007650530857, + "learning_rate": 0.000140554654082502, + "loss": 0.6667, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6647217273712158, + "step": 1840, + "valid_targets_mean": 16947.6, + "valid_targets_min": 787 + }, + { + "epoch": 0.4923939151321057, + "grad_norm": 0.3474028404883341, + "learning_rate": 0.0001404696103145975, + "loss": 0.6849, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6861566305160522, + "step": 1845, + "valid_targets_mean": 15907.7, + "valid_targets_min": 420 + }, + { + "epoch": 0.4937283159861222, + "grad_norm": 0.5451616019461446, + "learning_rate": 0.0001403842113702198, + "loss": 0.6609, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6573194265365601, + "step": 1850, + "valid_targets_mean": 16478.6, + "valid_targets_min": 406 + }, + { + "epoch": 0.49506271684013875, + "grad_norm": 0.7004212131411925, + "learning_rate": 0.00014029845771266325, + "loss": 0.6801, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6477423906326294, + "step": 1855, + "valid_targets_mean": 15260.8, + "valid_targets_min": 697 + }, + { + "epoch": 0.49639711769415534, + "grad_norm": 0.7048434342299513, + "learning_rate": 0.00014021234980714648, + "loss": 0.6827, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6603525876998901, + "step": 1860, + "valid_targets_mean": 15962.9, + "valid_targets_min": 736 + }, + { + "epoch": 0.4977315185481719, + "grad_norm": 0.756775978206065, + "learning_rate": 0.00014012588812080992, + "loss": 0.6815, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6624361276626587, + "step": 1865, + "valid_targets_mean": 16108.6, + "valid_targets_min": 254 + }, + { + "epoch": 0.4990659194021884, + "grad_norm": 0.5783522972899093, + "learning_rate": 0.00014003907312271319, + "loss": 0.6667, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6649295091629028, + "step": 1870, + "valid_targets_mean": 16909.0, + "valid_targets_min": 666 + }, + { + "epoch": 0.500400320256205, + "grad_norm": 0.7832629887077739, + "learning_rate": 0.0001399519052838329, + "loss": 0.6664, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6546527147293091, + "step": 1875, + "valid_targets_mean": 16595.7, + "valid_targets_min": 511 + }, + { + "epoch": 0.5017347211102215, + "grad_norm": 0.939021148548249, + "learning_rate": 0.00013986438507705958, + "loss": 0.6742, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6604918241500854, + "step": 1880, + "valid_targets_mean": 15948.0, + "valid_targets_min": 689 + }, + { + "epoch": 0.503069121964238, + "grad_norm": 0.8662965417826878, + "learning_rate": 0.00013977651297719548, + "loss": 0.6739, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6684395670890808, + "step": 1885, + "valid_targets_mean": 16201.3, + "valid_targets_min": 458 + }, + { + "epoch": 0.5044035228182546, + "grad_norm": 0.9088217892111629, + "learning_rate": 0.00013968828946095193, + "loss": 0.6594, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6788122653961182, + "step": 1890, + "valid_targets_mean": 15575.2, + "valid_targets_min": 439 + }, + { + "epoch": 0.5057379236722711, + "grad_norm": 0.6344513905134873, + "learning_rate": 0.00013959971500694668, + "loss": 0.6672, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6416043043136597, + "step": 1895, + "valid_targets_mean": 15835.0, + "valid_targets_min": 12 + }, + { + "epoch": 0.5070723245262877, + "grad_norm": 0.8336148657488304, + "learning_rate": 0.00013951079009570132, + "loss": 0.67, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6694490909576416, + "step": 1900, + "valid_targets_mean": 16032.9, + "valid_targets_min": 754 + }, + { + "epoch": 0.5084067253803043, + "grad_norm": 0.6260500989696588, + "learning_rate": 0.00013942151520963868, + "loss": 0.6659, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6914685964584351, + "step": 1905, + "valid_targets_mean": 16321.1, + "valid_targets_min": 723 + }, + { + "epoch": 0.5097411262343208, + "grad_norm": 0.7405051356611972, + "learning_rate": 0.00013933189083308031, + "loss": 0.6738, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7031766176223755, + "step": 1910, + "valid_targets_mean": 17288.0, + "valid_targets_min": 281 + }, + { + "epoch": 0.5110755270883374, + "grad_norm": 0.6086327457057731, + "learning_rate": 0.00013924191745224364, + "loss": 0.6608, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6749123334884644, + "step": 1915, + "valid_targets_mean": 15469.2, + "valid_targets_min": 426 + }, + { + "epoch": 0.5124099279423538, + "grad_norm": 0.6877904338270722, + "learning_rate": 0.00013915159555523957, + "loss": 0.6848, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6368306279182434, + "step": 1920, + "valid_targets_mean": 16919.3, + "valid_targets_min": 711 + }, + { + "epoch": 0.5137443287963704, + "grad_norm": 0.47035305733386035, + "learning_rate": 0.00013906092563206968, + "loss": 0.6524, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6483859419822693, + "step": 1925, + "valid_targets_mean": 15656.5, + "valid_targets_min": 498 + }, + { + "epoch": 0.5150787296503869, + "grad_norm": 0.45402330651367906, + "learning_rate": 0.00013896990817462363, + "loss": 0.6795, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7136232256889343, + "step": 1930, + "valid_targets_mean": 16150.9, + "valid_targets_min": 647 + }, + { + "epoch": 0.5164131305044035, + "grad_norm": 0.7824076954450869, + "learning_rate": 0.00013887854367667645, + "loss": 0.6714, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6787303686141968, + "step": 1935, + "valid_targets_mean": 16542.0, + "valid_targets_min": 898 + }, + { + "epoch": 0.5177475313584201, + "grad_norm": 0.5056478751091026, + "learning_rate": 0.00013878683263388587, + "loss": 0.6747, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6699013113975525, + "step": 1940, + "valid_targets_mean": 14940.9, + "valid_targets_min": 250 + }, + { + "epoch": 0.5190819322124366, + "grad_norm": 0.5252915459634886, + "learning_rate": 0.00013869477554378972, + "loss": 0.6727, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6794301271438599, + "step": 1945, + "valid_targets_mean": 14674.8, + "valid_targets_min": 106 + }, + { + "epoch": 0.5204163330664532, + "grad_norm": 0.38122775082529703, + "learning_rate": 0.00013860237290580306, + "loss": 0.6532, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6353006958961487, + "step": 1950, + "valid_targets_mean": 16347.3, + "valid_targets_min": 469 + }, + { + "epoch": 0.5217507339204697, + "grad_norm": 0.4481900683975625, + "learning_rate": 0.00013850962522121569, + "loss": 0.679, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6387051939964294, + "step": 1955, + "valid_targets_mean": 16739.2, + "valid_targets_min": 523 + }, + { + "epoch": 0.5230851347744863, + "grad_norm": 0.3884767558072463, + "learning_rate": 0.00013841653299318915, + "loss": 0.6655, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7000205516815186, + "step": 1960, + "valid_targets_mean": 16349.4, + "valid_targets_min": 844 + }, + { + "epoch": 0.5244195356285029, + "grad_norm": 0.3751791438449631, + "learning_rate": 0.00013832309672675428, + "loss": 0.6503, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6721636652946472, + "step": 1965, + "valid_targets_mean": 15760.5, + "valid_targets_min": 225 + }, + { + "epoch": 0.5257539364825193, + "grad_norm": 0.5018554381804197, + "learning_rate": 0.00013822931692880828, + "loss": 0.6734, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6598831415176392, + "step": 1970, + "valid_targets_mean": 16458.7, + "valid_targets_min": 478 + }, + { + "epoch": 0.5270883373365359, + "grad_norm": 0.43344427993303225, + "learning_rate": 0.00013813519410811208, + "loss": 0.6681, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6558117866516113, + "step": 1975, + "valid_targets_mean": 15469.7, + "valid_targets_min": 99 + }, + { + "epoch": 0.5284227381905524, + "grad_norm": 0.40192550153987733, + "learning_rate": 0.00013804072877528746, + "loss": 0.6816, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6607159376144409, + "step": 1980, + "valid_targets_mean": 16332.3, + "valid_targets_min": 359 + }, + { + "epoch": 0.529757139044569, + "grad_norm": 0.3261496597805123, + "learning_rate": 0.0001379459214428144, + "loss": 0.6596, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6428033113479614, + "step": 1985, + "valid_targets_mean": 15988.9, + "valid_targets_min": 753 + }, + { + "epoch": 0.5310915398985855, + "grad_norm": 0.2827103987399224, + "learning_rate": 0.0001378507726250283, + "loss": 0.6697, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6552940011024475, + "step": 1990, + "valid_targets_mean": 16928.4, + "valid_targets_min": 735 + }, + { + "epoch": 0.5324259407526021, + "grad_norm": 0.4131312586238756, + "learning_rate": 0.00013775528283811695, + "loss": 0.6639, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6279177665710449, + "step": 1995, + "valid_targets_mean": 17712.5, + "valid_targets_min": 554 + }, + { + "epoch": 0.5337603416066187, + "grad_norm": 0.4328575262764605, + "learning_rate": 0.00013765945260011815, + "loss": 0.6693, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6813353300094604, + "step": 2000, + "valid_targets_mean": 15772.1, + "valid_targets_min": 306 + }, + { + "epoch": 0.5350947424606352, + "grad_norm": 0.4303463028986665, + "learning_rate": 0.0001375632824309165, + "loss": 0.6642, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6382510662078857, + "step": 2005, + "valid_targets_mean": 17243.4, + "valid_targets_min": 686 + }, + { + "epoch": 0.5364291433146517, + "grad_norm": 0.31754546536948197, + "learning_rate": 0.00013746677285224082, + "loss": 0.6661, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6832298636436462, + "step": 2010, + "valid_targets_mean": 15342.7, + "valid_targets_min": 448 + }, + { + "epoch": 0.5377635441686682, + "grad_norm": 0.3224539660495597, + "learning_rate": 0.00013736992438766123, + "loss": 0.658, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6509510278701782, + "step": 2015, + "valid_targets_mean": 15682.6, + "valid_targets_min": 20 + }, + { + "epoch": 0.5390979450226848, + "grad_norm": 0.3476987488221845, + "learning_rate": 0.00013727273756258633, + "loss": 0.6595, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6609938144683838, + "step": 2020, + "valid_targets_mean": 16596.7, + "valid_targets_min": 544 + }, + { + "epoch": 0.5404323458767014, + "grad_norm": 0.3341925429496843, + "learning_rate": 0.00013717521290426034, + "loss": 0.6584, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6978187561035156, + "step": 2025, + "valid_targets_mean": 17569.2, + "valid_targets_min": 482 + }, + { + "epoch": 0.5417667467307179, + "grad_norm": 0.31980325681357635, + "learning_rate": 0.00013707735094176026, + "loss": 0.663, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6462590098381042, + "step": 2030, + "valid_targets_mean": 17217.4, + "valid_targets_min": 180 + }, + { + "epoch": 0.5431011475847345, + "grad_norm": 0.504110733594983, + "learning_rate": 0.00013697915220599294, + "loss": 0.6694, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6722946763038635, + "step": 2035, + "valid_targets_mean": 15108.6, + "valid_targets_min": 455 + }, + { + "epoch": 0.544435548438751, + "grad_norm": 0.39427036155645856, + "learning_rate": 0.0001368806172296923, + "loss": 0.6617, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6628670692443848, + "step": 2040, + "valid_targets_mean": 17106.6, + "valid_targets_min": 184 + }, + { + "epoch": 0.5457699492927676, + "grad_norm": 0.3798470884563092, + "learning_rate": 0.00013678174654741638, + "loss": 0.6478, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6374893188476562, + "step": 2045, + "valid_targets_mean": 17227.5, + "valid_targets_min": 517 + }, + { + "epoch": 0.547104350146784, + "grad_norm": 0.3542392713845455, + "learning_rate": 0.00013668254069554439, + "loss": 0.6764, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6546074748039246, + "step": 2050, + "valid_targets_mean": 15193.7, + "valid_targets_min": 578 + }, + { + "epoch": 0.5484387510008006, + "grad_norm": 0.3049919714486412, + "learning_rate": 0.00013658300021227387, + "loss": 0.6746, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6780501008033752, + "step": 2055, + "valid_targets_mean": 16047.9, + "valid_targets_min": 735 + }, + { + "epoch": 0.5497731518548172, + "grad_norm": 0.4094752526440804, + "learning_rate": 0.00013648312563761784, + "loss": 0.6497, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.672895073890686, + "step": 2060, + "valid_targets_mean": 15821.3, + "valid_targets_min": 432 + }, + { + "epoch": 0.5511075527088337, + "grad_norm": 0.2885708539239041, + "learning_rate": 0.0001363829175134017, + "loss": 0.6569, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6362361907958984, + "step": 2065, + "valid_targets_mean": 16060.2, + "valid_targets_min": 249 + }, + { + "epoch": 0.5524419535628503, + "grad_norm": 0.3679911308247253, + "learning_rate": 0.00013628237638326038, + "loss": 0.6684, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6490753889083862, + "step": 2070, + "valid_targets_mean": 16748.8, + "valid_targets_min": 790 + }, + { + "epoch": 0.5537763544168668, + "grad_norm": 0.4534861336884921, + "learning_rate": 0.0001361815027926354, + "loss": 0.6607, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6785265207290649, + "step": 2075, + "valid_targets_mean": 17079.0, + "valid_targets_min": 456 + }, + { + "epoch": 0.5551107552708834, + "grad_norm": 0.44250368563770404, + "learning_rate": 0.00013608029728877195, + "loss": 0.6572, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6550644636154175, + "step": 2080, + "valid_targets_mean": 16177.8, + "valid_targets_min": 441 + }, + { + "epoch": 0.5564451561248999, + "grad_norm": 0.3950264297661988, + "learning_rate": 0.00013597876042071574, + "loss": 0.6703, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6962975263595581, + "step": 2085, + "valid_targets_mean": 14695.6, + "valid_targets_min": 467 + }, + { + "epoch": 0.5577795569789165, + "grad_norm": 0.4343603248782463, + "learning_rate": 0.00013587689273931032, + "loss": 0.6631, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6817919015884399, + "step": 2090, + "valid_targets_mean": 15244.0, + "valid_targets_min": 111 + }, + { + "epoch": 0.559113957832933, + "grad_norm": 0.3778902089930458, + "learning_rate": 0.00013577469479719376, + "loss": 0.6818, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6776700615882874, + "step": 2095, + "valid_targets_mean": 16056.0, + "valid_targets_min": 192 + }, + { + "epoch": 0.5604483586869495, + "grad_norm": 0.4665567574775196, + "learning_rate": 0.00013567216714879593, + "loss": 0.6575, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.634872317314148, + "step": 2100, + "valid_targets_mean": 16989.1, + "valid_targets_min": 501 + }, + { + "epoch": 0.5617827595409661, + "grad_norm": 6.260037404534871, + "learning_rate": 0.00013556931035033526, + "loss": 0.6993, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7710926532745361, + "step": 2105, + "valid_targets_mean": 15841.9, + "valid_targets_min": 95 + }, + { + "epoch": 0.5631171603949826, + "grad_norm": 0.7013102551903544, + "learning_rate": 0.00013546612495981603, + "loss": 0.6811, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6613208055496216, + "step": 2110, + "valid_targets_mean": 15519.8, + "valid_targets_min": 728 + }, + { + "epoch": 0.5644515612489992, + "grad_norm": 0.47711928148353344, + "learning_rate": 0.00013536261153702494, + "loss": 0.661, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.666735053062439, + "step": 2115, + "valid_targets_mean": 15697.4, + "valid_targets_min": 448 + }, + { + "epoch": 0.5657859621030158, + "grad_norm": 0.6530144831314217, + "learning_rate": 0.0001352587706435284, + "loss": 0.6495, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6208878755569458, + "step": 2120, + "valid_targets_mean": 15542.3, + "valid_targets_min": 267 + }, + { + "epoch": 0.5671203629570323, + "grad_norm": 0.4575924813341875, + "learning_rate": 0.00013515460284266933, + "loss": 0.6653, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6797025203704834, + "step": 2125, + "valid_targets_mean": 15705.2, + "valid_targets_min": 406 + }, + { + "epoch": 0.5684547638110489, + "grad_norm": 0.4181593612220908, + "learning_rate": 0.0001350501086995642, + "loss": 0.6567, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6510787606239319, + "step": 2130, + "valid_targets_mean": 16198.4, + "valid_targets_min": 101 + }, + { + "epoch": 0.5697891646650654, + "grad_norm": 0.5909184489265575, + "learning_rate": 0.00013494528878109978, + "loss": 0.6756, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6520047783851624, + "step": 2135, + "valid_targets_mean": 15843.7, + "valid_targets_min": 587 + }, + { + "epoch": 0.5711235655190819, + "grad_norm": 0.6030856727277748, + "learning_rate": 0.00013484014365593036, + "loss": 0.6668, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6336778402328491, + "step": 2140, + "valid_targets_mean": 16958.3, + "valid_targets_min": 472 + }, + { + "epoch": 0.5724579663730984, + "grad_norm": 0.4515248521744553, + "learning_rate": 0.00013473467389447436, + "loss": 0.6559, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6533001661300659, + "step": 2145, + "valid_targets_mean": 15690.6, + "valid_targets_min": 250 + }, + { + "epoch": 0.573792367227115, + "grad_norm": 0.4667994555141797, + "learning_rate": 0.0001346288800689114, + "loss": 0.6521, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6496244668960571, + "step": 2150, + "valid_targets_mean": 15861.7, + "valid_targets_min": 650 + }, + { + "epoch": 0.5751267680811316, + "grad_norm": 0.4435676406772137, + "learning_rate": 0.00013452276275317926, + "loss": 0.6762, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6681039333343506, + "step": 2155, + "valid_targets_mean": 15310.4, + "valid_targets_min": 770 + }, + { + "epoch": 0.5764611689351481, + "grad_norm": 0.36479657444039537, + "learning_rate": 0.00013441632252297054, + "loss": 0.6537, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.627946138381958, + "step": 2160, + "valid_targets_mean": 16752.0, + "valid_targets_min": 144 + }, + { + "epoch": 0.5777955697891647, + "grad_norm": 0.34293032801686635, + "learning_rate": 0.0001343095599557297, + "loss": 0.6663, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6876500844955444, + "step": 2165, + "valid_targets_mean": 15393.2, + "valid_targets_min": 115 + }, + { + "epoch": 0.5791299706431812, + "grad_norm": 0.4076228566130478, + "learning_rate": 0.00013420247563064998, + "loss": 0.6739, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6447117924690247, + "step": 2170, + "valid_targets_mean": 15293.0, + "valid_targets_min": 413 + }, + { + "epoch": 0.5804643714971978, + "grad_norm": 0.44537032041814034, + "learning_rate": 0.0001340950701286701, + "loss": 0.6695, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6437950730323792, + "step": 2175, + "valid_targets_mean": 16650.6, + "valid_targets_min": 448 + }, + { + "epoch": 0.5817987723512144, + "grad_norm": 0.3878069492513395, + "learning_rate": 0.0001339873440324712, + "loss": 0.6705, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6598751544952393, + "step": 2180, + "valid_targets_mean": 15965.4, + "valid_targets_min": 278 + }, + { + "epoch": 0.5831331732052308, + "grad_norm": 0.3411736097320242, + "learning_rate": 0.00013387929792647366, + "loss": 0.6558, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6527872681617737, + "step": 2185, + "valid_targets_mean": 15891.7, + "valid_targets_min": 563 + }, + { + "epoch": 0.5844675740592474, + "grad_norm": 0.3003184033242001, + "learning_rate": 0.00013377093239683396, + "loss": 0.6719, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6643562316894531, + "step": 2190, + "valid_targets_mean": 15842.3, + "valid_targets_min": 554 + }, + { + "epoch": 0.5858019749132639, + "grad_norm": 0.36648446645528304, + "learning_rate": 0.0001336622480314414, + "loss": 0.686, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6981199979782104, + "step": 2195, + "valid_targets_mean": 14542.6, + "valid_targets_min": 118 + }, + { + "epoch": 0.5871363757672805, + "grad_norm": 0.36396613520492294, + "learning_rate": 0.00013355324541991512, + "loss": 0.6544, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.675082266330719, + "step": 2200, + "valid_targets_mean": 15199.7, + "valid_targets_min": 641 + }, + { + "epoch": 0.588470776621297, + "grad_norm": 0.38112202254205735, + "learning_rate": 0.00013344392515360055, + "loss": 0.6435, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6569694876670837, + "step": 2205, + "valid_targets_mean": 15126.9, + "valid_targets_min": 835 + }, + { + "epoch": 0.5898051774753136, + "grad_norm": 0.49269313436468004, + "learning_rate": 0.0001333342878255667, + "loss": 0.6601, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6463513970375061, + "step": 2210, + "valid_targets_mean": 16902.2, + "valid_targets_min": 94 + }, + { + "epoch": 0.5911395783293302, + "grad_norm": 0.44890881586303993, + "learning_rate": 0.00013322433403060237, + "loss": 0.6628, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6854138374328613, + "step": 2215, + "valid_targets_mean": 15081.2, + "valid_targets_min": 620 + }, + { + "epoch": 0.5924739791833467, + "grad_norm": 0.45988820654600676, + "learning_rate": 0.0001331140643652134, + "loss": 0.6544, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6454874277114868, + "step": 2220, + "valid_targets_mean": 16441.7, + "valid_targets_min": 736 + }, + { + "epoch": 0.5938083800373632, + "grad_norm": 0.7093304778268725, + "learning_rate": 0.00013300347942761916, + "loss": 0.6569, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6526100635528564, + "step": 2225, + "valid_targets_mean": 16363.5, + "valid_targets_min": 340 + }, + { + "epoch": 0.5951427808913797, + "grad_norm": 0.3468346631394234, + "learning_rate": 0.00013289257981774944, + "loss": 0.6663, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6592247486114502, + "step": 2230, + "valid_targets_mean": 15972.2, + "valid_targets_min": 895 + }, + { + "epoch": 0.5964771817453963, + "grad_norm": 0.3553442337570315, + "learning_rate": 0.0001327813661372411, + "loss": 0.6717, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6738698482513428, + "step": 2235, + "valid_targets_mean": 15463.1, + "valid_targets_min": 533 + }, + { + "epoch": 0.5978115825994129, + "grad_norm": 0.3838662240074573, + "learning_rate": 0.00013266983898943495, + "loss": 0.6473, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6299634575843811, + "step": 2240, + "valid_targets_mean": 17580.9, + "valid_targets_min": 729 + }, + { + "epoch": 0.5991459834534294, + "grad_norm": 0.3592590789558824, + "learning_rate": 0.00013255799897937218, + "loss": 0.6732, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6780022382736206, + "step": 2245, + "valid_targets_mean": 16846.2, + "valid_targets_min": 602 + }, + { + "epoch": 0.600480384307446, + "grad_norm": 0.44100859110625984, + "learning_rate": 0.0001324458467137915, + "loss": 0.6703, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6987379193305969, + "step": 2250, + "valid_targets_mean": 15482.9, + "valid_targets_min": 588 + }, + { + "epoch": 0.6018147851614625, + "grad_norm": 0.37062644306975717, + "learning_rate": 0.00013233338280112548, + "loss": 0.6554, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6602747440338135, + "step": 2255, + "valid_targets_mean": 17064.1, + "valid_targets_min": 223 + }, + { + "epoch": 0.6031491860154791, + "grad_norm": 0.418849866695498, + "learning_rate": 0.00013222060785149744, + "loss": 0.6673, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6753230094909668, + "step": 2260, + "valid_targets_mean": 15280.1, + "valid_targets_min": 268 + }, + { + "epoch": 0.6044835868694955, + "grad_norm": 0.43917318413874673, + "learning_rate": 0.00013210752247671813, + "loss": 0.6774, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.654193639755249, + "step": 2265, + "valid_targets_mean": 14665.9, + "valid_targets_min": 826 + }, + { + "epoch": 0.6058179877235121, + "grad_norm": 0.40114074662966903, + "learning_rate": 0.00013199412729028226, + "loss": 0.6598, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.668895423412323, + "step": 2270, + "valid_targets_mean": 14357.4, + "valid_targets_min": 562 + }, + { + "epoch": 0.6071523885775287, + "grad_norm": 0.3970227577568205, + "learning_rate": 0.00013188042290736542, + "loss": 0.6705, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6774420738220215, + "step": 2275, + "valid_targets_mean": 16830.2, + "valid_targets_min": 410 + }, + { + "epoch": 0.6084867894315452, + "grad_norm": 0.3764067127859396, + "learning_rate": 0.00013176640994482056, + "loss": 0.6441, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6230798363685608, + "step": 2280, + "valid_targets_mean": 16233.8, + "valid_targets_min": 222 + }, + { + "epoch": 0.6098211902855618, + "grad_norm": 0.40059163154769223, + "learning_rate": 0.00013165208902117466, + "loss": 0.6681, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6714913249015808, + "step": 2285, + "valid_targets_mean": 17469.4, + "valid_targets_min": 785 + }, + { + "epoch": 0.6111555911395783, + "grad_norm": 0.3605557043946584, + "learning_rate": 0.0001315374607566254, + "loss": 0.6626, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6634005308151245, + "step": 2290, + "valid_targets_mean": 16034.4, + "valid_targets_min": 685 + }, + { + "epoch": 0.6124899919935949, + "grad_norm": 0.3240690873923662, + "learning_rate": 0.0001314225257730379, + "loss": 0.6702, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6710679531097412, + "step": 2295, + "valid_targets_mean": 15922.1, + "valid_targets_min": 426 + }, + { + "epoch": 0.6138243928476115, + "grad_norm": 0.45278167405604686, + "learning_rate": 0.00013130728469394113, + "loss": 0.662, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6353721022605896, + "step": 2300, + "valid_targets_mean": 15621.8, + "valid_targets_min": 537 + }, + { + "epoch": 0.615158793701628, + "grad_norm": 0.5261678023296263, + "learning_rate": 0.00013119173814452474, + "loss": 0.6623, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6599146127700806, + "step": 2305, + "valid_targets_mean": 15986.3, + "valid_targets_min": 675 + }, + { + "epoch": 0.6164931945556446, + "grad_norm": 0.3520154885026282, + "learning_rate": 0.0001310758867516355, + "loss": 0.6636, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6420433521270752, + "step": 2310, + "valid_targets_mean": 16249.3, + "valid_targets_min": 947 + }, + { + "epoch": 0.617827595409661, + "grad_norm": 0.3160597821977501, + "learning_rate": 0.00013095973114377401, + "loss": 0.6504, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6603477597236633, + "step": 2315, + "valid_targets_mean": 16349.6, + "valid_targets_min": 685 + }, + { + "epoch": 0.6191619962636776, + "grad_norm": 0.36231419289255584, + "learning_rate": 0.00013084327195109127, + "loss": 0.6712, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6746746301651001, + "step": 2320, + "valid_targets_mean": 14960.1, + "valid_targets_min": 512 + }, + { + "epoch": 0.6204963971176941, + "grad_norm": 0.5203030064565997, + "learning_rate": 0.0001307265098053852, + "loss": 0.6776, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6610316038131714, + "step": 2325, + "valid_targets_mean": 14701.1, + "valid_targets_min": 512 + }, + { + "epoch": 0.6218307979717107, + "grad_norm": 0.4654024359266842, + "learning_rate": 0.00013060944534009727, + "loss": 0.6592, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6650247573852539, + "step": 2330, + "valid_targets_mean": 16131.2, + "valid_targets_min": 613 + }, + { + "epoch": 0.6231651988257273, + "grad_norm": 0.40579144818563323, + "learning_rate": 0.00013049207919030913, + "loss": 0.6713, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7027677297592163, + "step": 2335, + "valid_targets_mean": 15358.5, + "valid_targets_min": 594 + }, + { + "epoch": 0.6244995996797438, + "grad_norm": 0.33738783680985324, + "learning_rate": 0.000130374411992739, + "loss": 0.6717, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6985683441162109, + "step": 2340, + "valid_targets_mean": 15497.9, + "valid_targets_min": 735 + }, + { + "epoch": 0.6258340005337604, + "grad_norm": 0.29967326257870436, + "learning_rate": 0.00013025644438573828, + "loss": 0.6736, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.681916356086731, + "step": 2345, + "valid_targets_mean": 15759.5, + "valid_targets_min": 466 + }, + { + "epoch": 0.6271684013877769, + "grad_norm": 0.3784599680448572, + "learning_rate": 0.0001301381770092882, + "loss": 0.6603, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6813744902610779, + "step": 2350, + "valid_targets_mean": 15277.1, + "valid_targets_min": 668 + }, + { + "epoch": 0.6285028022417934, + "grad_norm": 0.6857152779568253, + "learning_rate": 0.00013001961050499618, + "loss": 0.6598, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7079257965087891, + "step": 2355, + "valid_targets_mean": 14874.0, + "valid_targets_min": 368 + }, + { + "epoch": 0.6298372030958099, + "grad_norm": 0.6008392351197666, + "learning_rate": 0.00012990074551609248, + "loss": 0.6479, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6424392461776733, + "step": 2360, + "valid_targets_mean": 16310.2, + "valid_targets_min": 534 + }, + { + "epoch": 0.6311716039498265, + "grad_norm": 0.5035494087224074, + "learning_rate": 0.00012978158268742656, + "loss": 0.646, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6734390258789062, + "step": 2365, + "valid_targets_mean": 15363.5, + "valid_targets_min": 413 + }, + { + "epoch": 0.6325060048038431, + "grad_norm": 0.8359104728648866, + "learning_rate": 0.00012966212266546384, + "loss": 0.6737, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6907227039337158, + "step": 2370, + "valid_targets_mean": 16321.4, + "valid_targets_min": 454 + }, + { + "epoch": 0.6338404056578596, + "grad_norm": 0.6869329295377531, + "learning_rate": 0.0001295423660982819, + "loss": 0.677, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6277381181716919, + "step": 2375, + "valid_targets_mean": 16251.1, + "valid_targets_min": 424 + }, + { + "epoch": 0.6351748065118762, + "grad_norm": 0.6148555801464882, + "learning_rate": 0.00012942231363556717, + "loss": 0.6729, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.675305962562561, + "step": 2380, + "valid_targets_mean": 15309.9, + "valid_targets_min": 841 + }, + { + "epoch": 0.6365092073658927, + "grad_norm": 0.45415070983770905, + "learning_rate": 0.00012930196592861123, + "loss": 0.6387, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6547595262527466, + "step": 2385, + "valid_targets_mean": 15454.3, + "valid_targets_min": 196 + }, + { + "epoch": 0.6378436082199093, + "grad_norm": 0.442794276566689, + "learning_rate": 0.0001291813236303075, + "loss": 0.6617, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6543595790863037, + "step": 2390, + "valid_targets_mean": 16753.5, + "valid_targets_min": 653 + }, + { + "epoch": 0.6391780090739259, + "grad_norm": 0.5332207438446981, + "learning_rate": 0.0001290603873951475, + "loss": 0.6613, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6456538438796997, + "step": 2395, + "valid_targets_mean": 15616.2, + "valid_targets_min": 316 + }, + { + "epoch": 0.6405124099279423, + "grad_norm": 0.7521918638954632, + "learning_rate": 0.0001289391578792174, + "loss": 0.6552, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6417596340179443, + "step": 2400, + "valid_targets_mean": 15314.5, + "valid_targets_min": 687 + }, + { + "epoch": 0.6418468107819589, + "grad_norm": 0.5277592718542781, + "learning_rate": 0.0001288176357401944, + "loss": 0.6609, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6445276141166687, + "step": 2405, + "valid_targets_mean": 16181.8, + "valid_targets_min": 665 + }, + { + "epoch": 0.6431812116359754, + "grad_norm": 0.5360797058408273, + "learning_rate": 0.00012869582163734327, + "loss": 0.6621, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6326366066932678, + "step": 2410, + "valid_targets_mean": 14843.5, + "valid_targets_min": 677 + }, + { + "epoch": 0.644515612489992, + "grad_norm": 0.5613437487080589, + "learning_rate": 0.00012857371623151265, + "loss": 0.6459, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6261048316955566, + "step": 2415, + "valid_targets_mean": 16203.7, + "valid_targets_min": 424 + }, + { + "epoch": 0.6458500133440085, + "grad_norm": 0.5401174366140299, + "learning_rate": 0.00012845132018513147, + "loss": 0.6576, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6785622835159302, + "step": 2420, + "valid_targets_mean": 15360.1, + "valid_targets_min": 507 + }, + { + "epoch": 0.6471844141980251, + "grad_norm": 0.5523670660311945, + "learning_rate": 0.00012832863416220556, + "loss": 0.6704, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6968633532524109, + "step": 2425, + "valid_targets_mean": 15177.7, + "valid_targets_min": 434 + }, + { + "epoch": 0.6485188150520417, + "grad_norm": 0.6266815221915214, + "learning_rate": 0.00012820565882831365, + "loss": 0.6504, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6593841910362244, + "step": 2430, + "valid_targets_mean": 14721.1, + "valid_targets_min": 547 + }, + { + "epoch": 0.6498532159060582, + "grad_norm": 0.34252486449660074, + "learning_rate": 0.00012808239485060426, + "loss": 0.6475, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6551427841186523, + "step": 2435, + "valid_targets_mean": 16791.4, + "valid_targets_min": 18 + }, + { + "epoch": 0.6511876167600748, + "grad_norm": 0.3777353953835305, + "learning_rate": 0.00012795884289779161, + "loss": 0.6545, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6419693231582642, + "step": 2440, + "valid_targets_mean": 16404.4, + "valid_targets_min": 353 + }, + { + "epoch": 0.6525220176140912, + "grad_norm": 0.45799644108503845, + "learning_rate": 0.00012783500364015233, + "loss": 0.6486, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6675738096237183, + "step": 2445, + "valid_targets_mean": 15019.3, + "valid_targets_min": 486 + }, + { + "epoch": 0.6538564184681078, + "grad_norm": 0.35174570280079337, + "learning_rate": 0.00012771087774952165, + "loss": 0.6638, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6781587600708008, + "step": 2450, + "valid_targets_mean": 16235.8, + "valid_targets_min": 543 + }, + { + "epoch": 0.6551908193221244, + "grad_norm": 0.29804159496964094, + "learning_rate": 0.00012758646589928975, + "loss": 0.6575, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6292779445648193, + "step": 2455, + "valid_targets_mean": 15435.7, + "valid_targets_min": 790 + }, + { + "epoch": 0.6565252201761409, + "grad_norm": 0.3673376413084568, + "learning_rate": 0.00012746176876439824, + "loss": 0.677, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7069848775863647, + "step": 2460, + "valid_targets_mean": 14007.8, + "valid_targets_min": 270 + }, + { + "epoch": 0.6578596210301575, + "grad_norm": 0.36509344991462184, + "learning_rate": 0.00012733678702133642, + "loss": 0.6493, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6549676656723022, + "step": 2465, + "valid_targets_mean": 15895.7, + "valid_targets_min": 323 + }, + { + "epoch": 0.659194021884174, + "grad_norm": 0.429418610209433, + "learning_rate": 0.00012721152134813755, + "loss": 0.6624, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6349632740020752, + "step": 2470, + "valid_targets_mean": 16081.5, + "valid_targets_min": 98 + }, + { + "epoch": 0.6605284227381906, + "grad_norm": 0.7270900153753073, + "learning_rate": 0.00012708597242437524, + "loss": 0.6568, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6852024793624878, + "step": 2475, + "valid_targets_mean": 14263.0, + "valid_targets_min": 270 + }, + { + "epoch": 0.661862823592207, + "grad_norm": 0.7031091414429342, + "learning_rate": 0.00012696014093115974, + "loss": 0.6717, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.665812611579895, + "step": 2480, + "valid_targets_mean": 16887.2, + "valid_targets_min": 215 + }, + { + "epoch": 0.6631972244462236, + "grad_norm": 0.4374642051297583, + "learning_rate": 0.00012683402755113432, + "loss": 0.6475, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6082494258880615, + "step": 2485, + "valid_targets_mean": 16537.8, + "valid_targets_min": 595 + }, + { + "epoch": 0.6645316253002402, + "grad_norm": 0.6477682364856551, + "learning_rate": 0.0001267076329684714, + "loss": 0.6509, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6187378168106079, + "step": 2490, + "valid_targets_mean": 16730.8, + "valid_targets_min": 393 + }, + { + "epoch": 0.6658660261542567, + "grad_norm": 0.38481277870775876, + "learning_rate": 0.0001265809578688691, + "loss": 0.6578, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6274208426475525, + "step": 2495, + "valid_targets_mean": 15341.1, + "valid_targets_min": 484 + }, + { + "epoch": 0.6672004270082733, + "grad_norm": 0.3917460884697377, + "learning_rate": 0.00012645400293954714, + "loss": 0.664, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.663731575012207, + "step": 2500, + "valid_targets_mean": 15888.5, + "valid_targets_min": 612 + }, + { + "epoch": 0.6685348278622898, + "grad_norm": 0.9151888966738665, + "learning_rate": 0.0001263267688692435, + "loss": 0.6793, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6852500438690186, + "step": 2505, + "valid_targets_mean": 15587.5, + "valid_targets_min": 286 + }, + { + "epoch": 0.6698692287163064, + "grad_norm": 0.5979390813822053, + "learning_rate": 0.00012619925634821052, + "loss": 0.6613, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6739305257797241, + "step": 2510, + "valid_targets_mean": 16353.5, + "valid_targets_min": 575 + }, + { + "epoch": 0.671203629570323, + "grad_norm": 0.4449761729311656, + "learning_rate": 0.00012607146606821105, + "loss": 0.6525, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6503389477729797, + "step": 2515, + "valid_targets_mean": 16451.6, + "valid_targets_min": 464 + }, + { + "epoch": 0.6725380304243395, + "grad_norm": 0.49706212546796325, + "learning_rate": 0.00012594339872251483, + "loss": 0.6644, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6610913872718811, + "step": 2520, + "valid_targets_mean": 16268.6, + "valid_targets_min": 415 + }, + { + "epoch": 0.673872431278356, + "grad_norm": 0.5290075839543622, + "learning_rate": 0.00012581505500589474, + "loss": 0.6616, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6627337336540222, + "step": 2525, + "valid_targets_mean": 15314.1, + "valid_targets_min": 590 + }, + { + "epoch": 0.6752068321323725, + "grad_norm": 0.5250059480100745, + "learning_rate": 0.00012568643561462298, + "loss": 0.6539, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6993048787117004, + "step": 2530, + "valid_targets_mean": 16188.7, + "valid_targets_min": 703 + }, + { + "epoch": 0.6765412329863891, + "grad_norm": 0.4750525887774703, + "learning_rate": 0.00012555754124646729, + "loss": 0.6505, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6581923365592957, + "step": 2535, + "valid_targets_mean": 15603.4, + "valid_targets_min": 686 + }, + { + "epoch": 0.6778756338404056, + "grad_norm": 0.3684157475749975, + "learning_rate": 0.0001254283726006871, + "loss": 0.6487, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6634360551834106, + "step": 2540, + "valid_targets_mean": 16575.8, + "valid_targets_min": 387 + }, + { + "epoch": 0.6792100346944222, + "grad_norm": 0.5074329452000185, + "learning_rate": 0.00012529893037803, + "loss": 0.6621, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6525907516479492, + "step": 2545, + "valid_targets_mean": 16449.4, + "valid_targets_min": 407 + }, + { + "epoch": 0.6805444355484388, + "grad_norm": 0.5328389684013507, + "learning_rate": 0.00012516921528072752, + "loss": 0.6497, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6763752698898315, + "step": 2550, + "valid_targets_mean": 16478.6, + "valid_targets_min": 499 + }, + { + "epoch": 0.6818788364024553, + "grad_norm": 0.9065202004121011, + "learning_rate": 0.00012503922801249172, + "loss": 0.679, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6522437334060669, + "step": 2555, + "valid_targets_mean": 16686.2, + "valid_targets_min": 827 + }, + { + "epoch": 0.6832132372564719, + "grad_norm": 0.5445419222694561, + "learning_rate": 0.00012490896927851118, + "loss": 0.6606, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6466104984283447, + "step": 2560, + "valid_targets_mean": 16886.7, + "valid_targets_min": 570 + }, + { + "epoch": 0.6845476381104884, + "grad_norm": 0.709381810114747, + "learning_rate": 0.0001247784397854471, + "loss": 0.6505, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6570961475372314, + "step": 2565, + "valid_targets_mean": 16608.6, + "valid_targets_min": 332 + }, + { + "epoch": 0.685882038964505, + "grad_norm": 0.5686902000812523, + "learning_rate": 0.0001246476402414297, + "loss": 0.6612, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.682182788848877, + "step": 2570, + "valid_targets_mean": 15198.4, + "valid_targets_min": 307 + }, + { + "epoch": 0.6872164398185214, + "grad_norm": 0.6011052255291751, + "learning_rate": 0.0001245165713560541, + "loss": 0.6641, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6695008277893066, + "step": 2575, + "valid_targets_mean": 16134.5, + "valid_targets_min": 447 + }, + { + "epoch": 0.688550840672538, + "grad_norm": 0.5532645790999307, + "learning_rate": 0.00012438523384037675, + "loss": 0.6644, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6632760763168335, + "step": 2580, + "valid_targets_mean": 15272.8, + "valid_targets_min": 571 + }, + { + "epoch": 0.6898852415265546, + "grad_norm": 0.596489328498592, + "learning_rate": 0.0001242536284069113, + "loss": 0.6394, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6107437610626221, + "step": 2585, + "valid_targets_mean": 16331.5, + "valid_targets_min": 160 + }, + { + "epoch": 0.6912196423805711, + "grad_norm": 0.5514444258245582, + "learning_rate": 0.00012412175576962504, + "loss": 0.6508, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6393566727638245, + "step": 2590, + "valid_targets_mean": 16626.9, + "valid_targets_min": 437 + }, + { + "epoch": 0.6925540432345877, + "grad_norm": 0.5190980664614784, + "learning_rate": 0.00012398961664393467, + "loss": 0.6638, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6491864919662476, + "step": 2595, + "valid_targets_mean": 16259.0, + "valid_targets_min": 188 + }, + { + "epoch": 0.6938884440886042, + "grad_norm": 0.34768837243198264, + "learning_rate": 0.0001238572117467027, + "loss": 0.6659, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6843166947364807, + "step": 2600, + "valid_targets_mean": 15492.4, + "valid_targets_min": 240 + }, + { + "epoch": 0.6952228449426208, + "grad_norm": 0.5270278631943136, + "learning_rate": 0.0001237245417962335, + "loss": 0.6479, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6631830930709839, + "step": 2605, + "valid_targets_mean": 16151.7, + "valid_targets_min": 655 + }, + { + "epoch": 0.6965572457966374, + "grad_norm": 0.9404018373354717, + "learning_rate": 0.0001235916075122693, + "loss": 0.6692, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6821975708007812, + "step": 2610, + "valid_targets_mean": 15369.8, + "valid_targets_min": 135 + }, + { + "epoch": 0.6978916466506538, + "grad_norm": 0.7210725325794161, + "learning_rate": 0.00012345840961598638, + "loss": 0.6831, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.663686990737915, + "step": 2615, + "valid_targets_mean": 15961.8, + "valid_targets_min": 589 + }, + { + "epoch": 0.6992260475046704, + "grad_norm": 0.41395719841660517, + "learning_rate": 0.00012332494882999113, + "loss": 0.6675, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6907253265380859, + "step": 2620, + "valid_targets_mean": 15160.7, + "valid_targets_min": 16 + }, + { + "epoch": 0.7005604483586869, + "grad_norm": 0.3569886499787534, + "learning_rate": 0.00012319122587831614, + "loss": 0.6466, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6753599643707275, + "step": 2625, + "valid_targets_mean": 15287.2, + "valid_targets_min": 729 + }, + { + "epoch": 0.7018948492127035, + "grad_norm": 0.29934624084299416, + "learning_rate": 0.00012305724148641627, + "loss": 0.6563, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6501826047897339, + "step": 2630, + "valid_targets_mean": 15727.1, + "valid_targets_min": 583 + }, + { + "epoch": 0.70322925006672, + "grad_norm": 0.318425447077463, + "learning_rate": 0.00012292299638116472, + "loss": 0.6601, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.665668249130249, + "step": 2635, + "valid_targets_mean": 16180.4, + "valid_targets_min": 419 + }, + { + "epoch": 0.7045636509207366, + "grad_norm": 0.32493659582242096, + "learning_rate": 0.00012278849129084902, + "loss": 0.6451, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6409593820571899, + "step": 2640, + "valid_targets_mean": 15696.4, + "valid_targets_min": 707 + }, + { + "epoch": 0.7058980517747532, + "grad_norm": 0.3094955674403719, + "learning_rate": 0.00012265372694516714, + "loss": 0.6629, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.657052218914032, + "step": 2645, + "valid_targets_mean": 15152.1, + "valid_targets_min": 413 + }, + { + "epoch": 0.7072324526287697, + "grad_norm": 0.23050310147089786, + "learning_rate": 0.00012251870407522364, + "loss": 0.6626, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6353529095649719, + "step": 2650, + "valid_targets_mean": 16007.0, + "valid_targets_min": 566 + }, + { + "epoch": 0.7085668534827863, + "grad_norm": 0.2805492113192007, + "learning_rate": 0.00012238342341352546, + "loss": 0.6458, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6158525943756104, + "step": 2655, + "valid_targets_mean": 16036.7, + "valid_targets_min": 463 + }, + { + "epoch": 0.7099012543368027, + "grad_norm": 0.8419236025415093, + "learning_rate": 0.00012224788569397806, + "loss": 0.6685, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6778745055198669, + "step": 2660, + "valid_targets_mean": 15884.4, + "valid_targets_min": 816 + }, + { + "epoch": 0.7112356551908193, + "grad_norm": 0.49950512465543345, + "learning_rate": 0.0001221120916518816, + "loss": 0.6707, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6485254168510437, + "step": 2665, + "valid_targets_mean": 15734.8, + "valid_targets_min": 246 + }, + { + "epoch": 0.7125700560448359, + "grad_norm": 0.3086314975104693, + "learning_rate": 0.0001219760420239267, + "loss": 0.6371, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.640455424785614, + "step": 2670, + "valid_targets_mean": 16773.1, + "valid_targets_min": 530 + }, + { + "epoch": 0.7139044568988524, + "grad_norm": 0.3616813061445184, + "learning_rate": 0.00012183973754819051, + "loss": 0.6376, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6198325157165527, + "step": 2675, + "valid_targets_mean": 16633.2, + "valid_targets_min": 577 + }, + { + "epoch": 0.715238857752869, + "grad_norm": 0.3766222345660372, + "learning_rate": 0.00012170317896413284, + "loss": 0.6458, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6716166734695435, + "step": 2680, + "valid_targets_mean": 15397.1, + "valid_targets_min": 728 + }, + { + "epoch": 0.7165732586068855, + "grad_norm": 0.2916119694175485, + "learning_rate": 0.00012156636701259202, + "loss": 0.6503, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6420208215713501, + "step": 2685, + "valid_targets_mean": 15637.3, + "valid_targets_min": 723 + }, + { + "epoch": 0.7179076594609021, + "grad_norm": 0.2775617851207647, + "learning_rate": 0.00012142930243578092, + "loss": 0.6447, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6339491009712219, + "step": 2690, + "valid_targets_mean": 15479.5, + "valid_targets_min": 771 + }, + { + "epoch": 0.7192420603149186, + "grad_norm": 0.37674025138489925, + "learning_rate": 0.00012129198597728285, + "loss": 0.6613, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6560890674591064, + "step": 2695, + "valid_targets_mean": 14771.5, + "valid_targets_min": 383 + }, + { + "epoch": 0.7205764611689351, + "grad_norm": 0.39622678418107, + "learning_rate": 0.00012115441838204767, + "loss": 0.662, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6819006204605103, + "step": 2700, + "valid_targets_mean": 16697.3, + "valid_targets_min": 519 + }, + { + "epoch": 0.7219108620229517, + "grad_norm": 0.46002020422176004, + "learning_rate": 0.00012101660039638766, + "loss": 0.6272, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6191419363021851, + "step": 2705, + "valid_targets_mean": 15123.1, + "valid_targets_min": 484 + }, + { + "epoch": 0.7232452628769682, + "grad_norm": 0.4054679246957719, + "learning_rate": 0.00012087853276797346, + "loss": 0.6594, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6391434669494629, + "step": 2710, + "valid_targets_mean": 15248.1, + "valid_targets_min": 752 + }, + { + "epoch": 0.7245796637309848, + "grad_norm": 0.4589545493169983, + "learning_rate": 0.00012074021624583005, + "loss": 0.6672, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7053963541984558, + "step": 2715, + "valid_targets_mean": 15634.4, + "valid_targets_min": 322 + }, + { + "epoch": 0.7259140645850013, + "grad_norm": 0.4100508001012324, + "learning_rate": 0.00012060165158033268, + "loss": 0.6445, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6315319538116455, + "step": 2720, + "valid_targets_mean": 16354.7, + "valid_targets_min": 359 + }, + { + "epoch": 0.7272484654390179, + "grad_norm": 0.449503597581273, + "learning_rate": 0.00012046283952320275, + "loss": 0.6596, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6481472253799438, + "step": 2725, + "valid_targets_mean": 17060.3, + "valid_targets_min": 415 + }, + { + "epoch": 0.7285828662930345, + "grad_norm": 0.5521352851054642, + "learning_rate": 0.00012032378082750382, + "loss": 0.641, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6330423355102539, + "step": 2730, + "valid_targets_mean": 15964.4, + "valid_targets_min": 499 + }, + { + "epoch": 0.729917267147051, + "grad_norm": 0.3662763277079348, + "learning_rate": 0.00012018447624763748, + "loss": 0.6664, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6733106374740601, + "step": 2735, + "valid_targets_mean": 15451.8, + "valid_targets_min": 115 + }, + { + "epoch": 0.7312516680010676, + "grad_norm": 0.4442832003030609, + "learning_rate": 0.00012004492653933923, + "loss": 0.6544, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.644192636013031, + "step": 2740, + "valid_targets_mean": 17145.9, + "valid_targets_min": 506 + }, + { + "epoch": 0.732586068855084, + "grad_norm": 0.4146694850471416, + "learning_rate": 0.0001199051324596744, + "loss": 0.6548, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6647549867630005, + "step": 2745, + "valid_targets_mean": 16118.1, + "valid_targets_min": 418 + }, + { + "epoch": 0.7339204697091006, + "grad_norm": 0.4034483397987316, + "learning_rate": 0.00011976509476703408, + "loss": 0.6562, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6489412784576416, + "step": 2750, + "valid_targets_mean": 16238.3, + "valid_targets_min": 480 + }, + { + "epoch": 0.7352548705631171, + "grad_norm": 0.3858704887075872, + "learning_rate": 0.00011962481422113098, + "loss": 0.6641, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6932016611099243, + "step": 2755, + "valid_targets_mean": 16186.4, + "valid_targets_min": 894 + }, + { + "epoch": 0.7365892714171337, + "grad_norm": 0.3708392071660316, + "learning_rate": 0.00011948429158299523, + "loss": 0.6414, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6387462019920349, + "step": 2760, + "valid_targets_mean": 15729.8, + "valid_targets_min": 87 + }, + { + "epoch": 0.7379236722711503, + "grad_norm": 0.32790785396891836, + "learning_rate": 0.00011934352761497043, + "loss": 0.6562, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6276763677597046, + "step": 2765, + "valid_targets_mean": 15110.6, + "valid_targets_min": 682 + }, + { + "epoch": 0.7392580731251668, + "grad_norm": 0.435520809779603, + "learning_rate": 0.00011920252308070936, + "loss": 0.654, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6683900356292725, + "step": 2770, + "valid_targets_mean": 16605.6, + "valid_targets_min": 497 + }, + { + "epoch": 0.7405924739791834, + "grad_norm": 0.429796127636718, + "learning_rate": 0.00011906127874516985, + "loss": 0.6794, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6834566593170166, + "step": 2775, + "valid_targets_mean": 15583.3, + "valid_targets_min": 186 + }, + { + "epoch": 0.7419268748331999, + "grad_norm": 0.5630641955667017, + "learning_rate": 0.00011891979537461069, + "loss": 0.6482, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6598657369613647, + "step": 2780, + "valid_targets_mean": 14949.2, + "valid_targets_min": 487 + }, + { + "epoch": 0.7432612756872164, + "grad_norm": 0.42825593904406456, + "learning_rate": 0.00011877807373658751, + "loss": 0.6588, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6864846348762512, + "step": 2785, + "valid_targets_mean": 15358.7, + "valid_targets_min": 376 + }, + { + "epoch": 0.7445956765412329, + "grad_norm": 0.24764962892304368, + "learning_rate": 0.00011863611459994845, + "loss": 0.6355, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6364130973815918, + "step": 2790, + "valid_targets_mean": 16195.6, + "valid_targets_min": 395 + }, + { + "epoch": 0.7459300773952495, + "grad_norm": 0.3361856535909037, + "learning_rate": 0.00011849391873483016, + "loss": 0.6563, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6433441638946533, + "step": 2795, + "valid_targets_mean": 17315.0, + "valid_targets_min": 751 + }, + { + "epoch": 0.7472644782492661, + "grad_norm": 0.4839633607167184, + "learning_rate": 0.00011835148691265355, + "loss": 0.6423, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6697137355804443, + "step": 2800, + "valid_targets_mean": 15119.5, + "valid_targets_min": 516 + }, + { + "epoch": 0.7485988791032826, + "grad_norm": 0.48866740517865787, + "learning_rate": 0.00011820881990611963, + "loss": 0.6584, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6491275429725647, + "step": 2805, + "valid_targets_mean": 16127.4, + "valid_targets_min": 587 + }, + { + "epoch": 0.7499332799572992, + "grad_norm": 0.4639695977583032, + "learning_rate": 0.00011806591848920521, + "loss": 0.6543, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6611607074737549, + "step": 2810, + "valid_targets_mean": 16535.5, + "valid_targets_min": 665 + }, + { + "epoch": 0.7512676808113157, + "grad_norm": 0.5819254408562657, + "learning_rate": 0.00011792278343715892, + "loss": 0.6698, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6676276922225952, + "step": 2815, + "valid_targets_mean": 15598.1, + "valid_targets_min": 600 + }, + { + "epoch": 0.7526020816653323, + "grad_norm": 0.5386974712188372, + "learning_rate": 0.00011777941552649674, + "loss": 0.6507, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6673504710197449, + "step": 2820, + "valid_targets_mean": 16666.5, + "valid_targets_min": 540 + }, + { + "epoch": 0.7539364825193489, + "grad_norm": 0.5247082569671393, + "learning_rate": 0.00011763581553499803, + "loss": 0.6689, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6670835018157959, + "step": 2825, + "valid_targets_mean": 15185.6, + "valid_targets_min": 509 + }, + { + "epoch": 0.7552708833733653, + "grad_norm": 0.20057356755323014, + "learning_rate": 0.00011749198424170117, + "loss": 0.636, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6377661228179932, + "step": 2830, + "valid_targets_mean": 16080.7, + "valid_targets_min": 275 + }, + { + "epoch": 0.7566052842273819, + "grad_norm": 0.2717189631177877, + "learning_rate": 0.00011734792242689934, + "loss": 0.6503, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6641967296600342, + "step": 2835, + "valid_targets_mean": 16038.2, + "valid_targets_min": 694 + }, + { + "epoch": 0.7579396850813984, + "grad_norm": 0.3539872406346123, + "learning_rate": 0.00011720363087213629, + "loss": 0.6492, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6535997986793518, + "step": 2840, + "valid_targets_mean": 15803.9, + "valid_targets_min": 347 + }, + { + "epoch": 0.759274085935415, + "grad_norm": 0.3060505538467894, + "learning_rate": 0.00011705911036020222, + "loss": 0.6547, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6756272912025452, + "step": 2845, + "valid_targets_mean": 16094.0, + "valid_targets_min": 585 + }, + { + "epoch": 0.7606084867894315, + "grad_norm": 0.32979603532007673, + "learning_rate": 0.00011691436167512938, + "loss": 0.6558, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6754165291786194, + "step": 2850, + "valid_targets_mean": 14935.3, + "valid_targets_min": 421 + }, + { + "epoch": 0.7619428876434481, + "grad_norm": 0.4055952495934608, + "learning_rate": 0.00011676938560218781, + "loss": 0.6692, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6552126407623291, + "step": 2855, + "valid_targets_mean": 15897.4, + "valid_targets_min": 36 + }, + { + "epoch": 0.7632772884974647, + "grad_norm": 0.24961533900790797, + "learning_rate": 0.00011662418292788127, + "loss": 0.6383, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6132807731628418, + "step": 2860, + "valid_targets_mean": 16758.9, + "valid_targets_min": 350 + }, + { + "epoch": 0.7646116893514812, + "grad_norm": 0.2912209439909631, + "learning_rate": 0.00011647875443994271, + "loss": 0.6536, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6957015991210938, + "step": 2865, + "valid_targets_mean": 15787.5, + "valid_targets_min": 428 + }, + { + "epoch": 0.7659460902054978, + "grad_norm": 0.3042265405636786, + "learning_rate": 0.00011633310092733027, + "loss": 0.654, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6923919916152954, + "step": 2870, + "valid_targets_mean": 15682.3, + "valid_targets_min": 87 + }, + { + "epoch": 0.7672804910595142, + "grad_norm": 0.46422609082136285, + "learning_rate": 0.00011618722318022273, + "loss": 0.6469, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6420409679412842, + "step": 2875, + "valid_targets_mean": 16307.2, + "valid_targets_min": 493 + }, + { + "epoch": 0.7686148919135308, + "grad_norm": 0.2866231185689334, + "learning_rate": 0.00011604112199001546, + "loss": 0.6591, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6567983627319336, + "step": 2880, + "valid_targets_mean": 16033.0, + "valid_targets_min": 549 + }, + { + "epoch": 0.7699492927675474, + "grad_norm": 0.29511853808011, + "learning_rate": 0.00011589479814931598, + "loss": 0.6747, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6823477745056152, + "step": 2885, + "valid_targets_mean": 15575.4, + "valid_targets_min": 184 + }, + { + "epoch": 0.7712836936215639, + "grad_norm": 0.28271108085235624, + "learning_rate": 0.0001157482524519397, + "loss": 0.6484, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6464595794677734, + "step": 2890, + "valid_targets_mean": 16116.9, + "valid_targets_min": 439 + }, + { + "epoch": 0.7726180944755805, + "grad_norm": 0.2865267852616057, + "learning_rate": 0.00011560148569290558, + "loss": 0.6631, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6816505789756775, + "step": 2895, + "valid_targets_mean": 15358.4, + "valid_targets_min": 629 + }, + { + "epoch": 0.773952495329597, + "grad_norm": 0.30991511376313186, + "learning_rate": 0.00011545449866843194, + "loss": 0.6525, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.63730788230896, + "step": 2900, + "valid_targets_mean": 15462.2, + "valid_targets_min": 726 + }, + { + "epoch": 0.7752868961836136, + "grad_norm": 0.3893737799601431, + "learning_rate": 0.00011530729217593198, + "loss": 0.6611, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6356149911880493, + "step": 2905, + "valid_targets_mean": 15372.1, + "valid_targets_min": 367 + }, + { + "epoch": 0.77662129703763, + "grad_norm": 0.3726536887518834, + "learning_rate": 0.00011515986701400955, + "loss": 0.6486, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6307750344276428, + "step": 2910, + "valid_targets_mean": 16776.6, + "valid_targets_min": 700 + }, + { + "epoch": 0.7779556978916466, + "grad_norm": 0.5524398950886195, + "learning_rate": 0.00011501222398245478, + "loss": 0.6492, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6876989603042603, + "step": 2915, + "valid_targets_mean": 15650.0, + "valid_targets_min": 493 + }, + { + "epoch": 0.7792900987456632, + "grad_norm": 0.43053436499737224, + "learning_rate": 0.00011486436388223977, + "loss": 0.6506, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6381161212921143, + "step": 2920, + "valid_targets_mean": 15313.3, + "valid_targets_min": 499 + }, + { + "epoch": 0.7806244995996797, + "grad_norm": 0.519345484811449, + "learning_rate": 0.00011471628751551426, + "loss": 0.6476, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6335276365280151, + "step": 2925, + "valid_targets_mean": 16039.5, + "valid_targets_min": 609 + }, + { + "epoch": 0.7819589004536963, + "grad_norm": 0.40279485056898695, + "learning_rate": 0.0001145679956856012, + "loss": 0.6519, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6481651067733765, + "step": 2930, + "valid_targets_mean": 17094.5, + "valid_targets_min": 785 + }, + { + "epoch": 0.7832933013077128, + "grad_norm": 0.3694050878957853, + "learning_rate": 0.00011441948919699249, + "loss": 0.641, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6418542861938477, + "step": 2935, + "valid_targets_mean": 16285.5, + "valid_targets_min": 462 + }, + { + "epoch": 0.7846277021617294, + "grad_norm": 0.4735156964913278, + "learning_rate": 0.00011427076885534445, + "loss": 0.6586, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6383504867553711, + "step": 2940, + "valid_targets_mean": 15567.9, + "valid_targets_min": 306 + }, + { + "epoch": 0.785962103015746, + "grad_norm": 0.3844007153033924, + "learning_rate": 0.00011412183546747374, + "loss": 0.6717, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6902410984039307, + "step": 2945, + "valid_targets_mean": 15343.8, + "valid_targets_min": 105 + }, + { + "epoch": 0.7872965038697625, + "grad_norm": 0.317269590749701, + "learning_rate": 0.00011397268984135266, + "loss": 0.6529, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6304830312728882, + "step": 2950, + "valid_targets_mean": 16103.9, + "valid_targets_min": 386 + }, + { + "epoch": 0.7886309047237791, + "grad_norm": 0.3120496775255097, + "learning_rate": 0.00011382333278610503, + "loss": 0.656, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6566540598869324, + "step": 2955, + "valid_targets_mean": 15891.0, + "valid_targets_min": 415 + }, + { + "epoch": 0.7899653055777955, + "grad_norm": 0.29363407283435133, + "learning_rate": 0.00011367376511200157, + "loss": 0.6344, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6340903043746948, + "step": 2960, + "valid_targets_mean": 15561.6, + "valid_targets_min": 307 + }, + { + "epoch": 0.7912997064318121, + "grad_norm": 0.27145633159261673, + "learning_rate": 0.00011352398763045569, + "loss": 0.6529, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6175417304039001, + "step": 2965, + "valid_targets_mean": 15884.3, + "valid_targets_min": 289 + }, + { + "epoch": 0.7926341072858286, + "grad_norm": 0.3177062342894978, + "learning_rate": 0.00011337400115401905, + "loss": 0.6375, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6519104242324829, + "step": 2970, + "valid_targets_mean": 15654.3, + "valid_targets_min": 731 + }, + { + "epoch": 0.7939685081398452, + "grad_norm": 0.3262337279748586, + "learning_rate": 0.00011322380649637704, + "loss": 0.6394, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6559080481529236, + "step": 2975, + "valid_targets_mean": 16248.6, + "valid_targets_min": 675 + }, + { + "epoch": 0.7953029089938618, + "grad_norm": 0.3231189128287473, + "learning_rate": 0.00011307340447234449, + "loss": 0.6561, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6174107789993286, + "step": 2980, + "valid_targets_mean": 17327.3, + "valid_targets_min": 230 + }, + { + "epoch": 0.7966373098478783, + "grad_norm": 0.2673123843052834, + "learning_rate": 0.00011292279589786115, + "loss": 0.6415, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.674813985824585, + "step": 2985, + "valid_targets_mean": 16437.4, + "valid_targets_min": 691 + }, + { + "epoch": 0.7979717107018949, + "grad_norm": 0.2628610801083876, + "learning_rate": 0.00011277198158998744, + "loss": 0.6521, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6365718841552734, + "step": 2990, + "valid_targets_mean": 16253.4, + "valid_targets_min": 635 + }, + { + "epoch": 0.7993061115559114, + "grad_norm": 0.41550078533066354, + "learning_rate": 0.00011262096236689978, + "loss": 0.6571, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6576251983642578, + "step": 2995, + "valid_targets_mean": 16513.4, + "valid_targets_min": 135 + }, + { + "epoch": 0.800640512409928, + "grad_norm": 0.3088075857567339, + "learning_rate": 0.0001124697390478863, + "loss": 0.6353, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6164828538894653, + "step": 3000, + "valid_targets_mean": 15918.2, + "valid_targets_min": 798 + }, + { + "epoch": 0.8019749132639445, + "grad_norm": 0.25913707294388605, + "learning_rate": 0.00011231831245334238, + "loss": 0.6576, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6322481632232666, + "step": 3005, + "valid_targets_mean": 17183.3, + "valid_targets_min": 903 + }, + { + "epoch": 0.803309314117961, + "grad_norm": 0.2875117928032586, + "learning_rate": 0.00011216668340476618, + "loss": 0.6382, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6693239808082581, + "step": 3010, + "valid_targets_mean": 15421.7, + "valid_targets_min": 342 + }, + { + "epoch": 0.8046437149719776, + "grad_norm": 0.36214125629051713, + "learning_rate": 0.00011201485272475416, + "loss": 0.6626, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.659346342086792, + "step": 3015, + "valid_targets_mean": 15835.4, + "valid_targets_min": 768 + }, + { + "epoch": 0.8059781158259941, + "grad_norm": 0.46775768851706007, + "learning_rate": 0.00011186282123699664, + "loss": 0.6548, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.636502742767334, + "step": 3020, + "valid_targets_mean": 14893.1, + "valid_targets_min": 189 + }, + { + "epoch": 0.8073125166800107, + "grad_norm": 0.2738171869503716, + "learning_rate": 0.00011171058976627341, + "loss": 0.654, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6290814876556396, + "step": 3025, + "valid_targets_mean": 15760.6, + "valid_targets_min": 337 + }, + { + "epoch": 0.8086469175340272, + "grad_norm": 0.3647024223804018, + "learning_rate": 0.00011155815913844906, + "loss": 0.6462, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6478596925735474, + "step": 3030, + "valid_targets_mean": 14951.4, + "valid_targets_min": 413 + }, + { + "epoch": 0.8099813183880438, + "grad_norm": 0.27641270754591074, + "learning_rate": 0.00011140553018046872, + "loss": 0.6598, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6753206849098206, + "step": 3035, + "valid_targets_mean": 14340.4, + "valid_targets_min": 115 + }, + { + "epoch": 0.8113157192420604, + "grad_norm": 0.27104302518571194, + "learning_rate": 0.00011125270372035342, + "loss": 0.6473, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6414433121681213, + "step": 3040, + "valid_targets_mean": 16101.6, + "valid_targets_min": 534 + }, + { + "epoch": 0.8126501200960768, + "grad_norm": 0.24831789534538956, + "learning_rate": 0.00011109968058719565, + "loss": 0.6451, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6589419841766357, + "step": 3045, + "valid_targets_mean": 15459.0, + "valid_targets_min": 64 + }, + { + "epoch": 0.8139845209500934, + "grad_norm": 0.19532136745712955, + "learning_rate": 0.00011094646161115489, + "loss": 0.6412, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6319899559020996, + "step": 3050, + "valid_targets_mean": 16658.7, + "valid_targets_min": 640 + }, + { + "epoch": 0.8153189218041099, + "grad_norm": 0.3916604874994846, + "learning_rate": 0.00011079304762345307, + "loss": 0.6458, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6420038938522339, + "step": 3055, + "valid_targets_mean": 16778.7, + "valid_targets_min": 591 + }, + { + "epoch": 0.8166533226581265, + "grad_norm": 0.37864396364913205, + "learning_rate": 0.00011063943945637005, + "loss": 0.6355, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6372954845428467, + "step": 3060, + "valid_targets_mean": 17428.5, + "valid_targets_min": 380 + }, + { + "epoch": 0.817987723512143, + "grad_norm": 0.3870524602109993, + "learning_rate": 0.00011048563794323915, + "loss": 0.6463, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6788116693496704, + "step": 3065, + "valid_targets_mean": 15602.4, + "valid_targets_min": 797 + }, + { + "epoch": 0.8193221243661596, + "grad_norm": 0.2977983842070513, + "learning_rate": 0.00011033164391844259, + "loss": 0.6508, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6552585363388062, + "step": 3070, + "valid_targets_mean": 15580.0, + "valid_targets_min": 421 + }, + { + "epoch": 0.8206565252201762, + "grad_norm": 0.26537308607076826, + "learning_rate": 0.00011017745821740696, + "loss": 0.6507, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6489561200141907, + "step": 3075, + "valid_targets_mean": 15627.2, + "valid_targets_min": 588 + }, + { + "epoch": 0.8219909260741927, + "grad_norm": 0.3351573792494936, + "learning_rate": 0.00011002308167659877, + "loss": 0.6611, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6333989500999451, + "step": 3080, + "valid_targets_mean": 16951.4, + "valid_targets_min": 129 + }, + { + "epoch": 0.8233253269282093, + "grad_norm": 0.3732147638583794, + "learning_rate": 0.00010986851513351976, + "loss": 0.6627, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6664532423019409, + "step": 3085, + "valid_targets_mean": 15145.9, + "valid_targets_min": 305 + }, + { + "epoch": 0.8246597277822257, + "grad_norm": 0.32793741970703777, + "learning_rate": 0.00010971375942670251, + "loss": 0.6897, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7011292576789856, + "step": 3090, + "valid_targets_mean": 16805.0, + "valid_targets_min": 139 + }, + { + "epoch": 0.8259941286362423, + "grad_norm": 0.37753399308849905, + "learning_rate": 0.00010955881539570581, + "loss": 0.6474, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.661662757396698, + "step": 3095, + "valid_targets_mean": 15650.4, + "valid_targets_min": 527 + }, + { + "epoch": 0.8273285294902589, + "grad_norm": 0.30408206326658377, + "learning_rate": 0.00010940368388111008, + "loss": 0.6332, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6272863745689392, + "step": 3100, + "valid_targets_mean": 15785.5, + "valid_targets_min": 650 + }, + { + "epoch": 0.8286629303442754, + "grad_norm": 0.2528560431432323, + "learning_rate": 0.00010924836572451287, + "loss": 0.6519, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6672605276107788, + "step": 3105, + "valid_targets_mean": 16141.8, + "valid_targets_min": 667 + }, + { + "epoch": 0.829997331198292, + "grad_norm": 0.2883692488906481, + "learning_rate": 0.00010909286176852432, + "loss": 0.6529, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.664074182510376, + "step": 3110, + "valid_targets_mean": 16108.2, + "valid_targets_min": 698 + }, + { + "epoch": 0.8313317320523085, + "grad_norm": 0.253752010702719, + "learning_rate": 0.0001089371728567625, + "loss": 0.644, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6300142407417297, + "step": 3115, + "valid_targets_mean": 16448.3, + "valid_targets_min": 319 + }, + { + "epoch": 0.8326661329063251, + "grad_norm": 0.19621076323735484, + "learning_rate": 0.00010878129983384886, + "loss": 0.6421, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6365523338317871, + "step": 3120, + "valid_targets_mean": 16571.9, + "valid_targets_min": 638 + }, + { + "epoch": 0.8340005337603416, + "grad_norm": 0.31043696213151706, + "learning_rate": 0.00010862524354540369, + "loss": 0.6392, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6390799880027771, + "step": 3125, + "valid_targets_mean": 16295.1, + "valid_targets_min": 482 + }, + { + "epoch": 0.8353349346143581, + "grad_norm": 0.2660416805962427, + "learning_rate": 0.00010846900483804152, + "loss": 0.6536, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6644906997680664, + "step": 3130, + "valid_targets_mean": 16289.7, + "valid_targets_min": 292 + }, + { + "epoch": 0.8366693354683747, + "grad_norm": 0.2860410130544462, + "learning_rate": 0.00010831258455936645, + "loss": 0.6523, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6767973899841309, + "step": 3135, + "valid_targets_mean": 15392.7, + "valid_targets_min": 496 + }, + { + "epoch": 0.8380037363223912, + "grad_norm": 0.5964225786420335, + "learning_rate": 0.00010815598355796771, + "loss": 0.653, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6599225997924805, + "step": 3140, + "valid_targets_mean": 15163.7, + "valid_targets_min": 609 + }, + { + "epoch": 0.8393381371764078, + "grad_norm": 0.40273457380132044, + "learning_rate": 0.0001079992026834149, + "loss": 0.6595, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6746566295623779, + "step": 3145, + "valid_targets_mean": 16054.7, + "valid_targets_min": 643 + }, + { + "epoch": 0.8406725380304243, + "grad_norm": 0.37269235274804263, + "learning_rate": 0.00010784224278625345, + "loss": 0.6499, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6395473480224609, + "step": 3150, + "valid_targets_mean": 16422.7, + "valid_targets_min": 543 + }, + { + "epoch": 0.8420069388844409, + "grad_norm": 0.33447721838177247, + "learning_rate": 0.00010768510471799996, + "loss": 0.6392, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6642786264419556, + "step": 3155, + "valid_targets_mean": 16876.6, + "valid_targets_min": 483 + }, + { + "epoch": 0.8433413397384575, + "grad_norm": 0.2952224423385826, + "learning_rate": 0.00010752778933113774, + "loss": 0.6496, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6484600305557251, + "step": 3160, + "valid_targets_mean": 15536.5, + "valid_targets_min": 615 + }, + { + "epoch": 0.844675740592474, + "grad_norm": 0.3861238288551174, + "learning_rate": 0.00010737029747911191, + "loss": 0.6658, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.643525242805481, + "step": 3165, + "valid_targets_mean": 16309.5, + "valid_targets_min": 774 + }, + { + "epoch": 0.8460101414464906, + "grad_norm": 0.3135056303201646, + "learning_rate": 0.00010721263001632503, + "loss": 0.6531, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6588514447212219, + "step": 3170, + "valid_targets_mean": 16432.4, + "valid_targets_min": 94 + }, + { + "epoch": 0.847344542300507, + "grad_norm": 0.2817059242378593, + "learning_rate": 0.00010705478779813235, + "loss": 0.6551, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.682015061378479, + "step": 3175, + "valid_targets_mean": 15666.3, + "valid_targets_min": 501 + }, + { + "epoch": 0.8486789431545236, + "grad_norm": 0.3975996084790914, + "learning_rate": 0.00010689677168083711, + "loss": 0.6374, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6828092932701111, + "step": 3180, + "valid_targets_mean": 14917.6, + "valid_targets_min": 494 + }, + { + "epoch": 0.8500133440085401, + "grad_norm": 0.3058355653351926, + "learning_rate": 0.00010673858252168603, + "loss": 0.6542, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6468585729598999, + "step": 3185, + "valid_targets_mean": 15833.9, + "valid_targets_min": 428 + }, + { + "epoch": 0.8513477448625567, + "grad_norm": 0.4211216089487226, + "learning_rate": 0.00010658022117886457, + "loss": 0.6511, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6917360424995422, + "step": 3190, + "valid_targets_mean": 16047.0, + "valid_targets_min": 731 + }, + { + "epoch": 0.8526821457165733, + "grad_norm": 0.30431416270371453, + "learning_rate": 0.00010642168851149229, + "loss": 0.6588, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6483701467514038, + "step": 3195, + "valid_targets_mean": 16088.1, + "valid_targets_min": 299 + }, + { + "epoch": 0.8540165465705898, + "grad_norm": 0.37426473290512485, + "learning_rate": 0.00010626298537961821, + "loss": 0.6423, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.663414478302002, + "step": 3200, + "valid_targets_mean": 16697.5, + "valid_targets_min": 684 + }, + { + "epoch": 0.8553509474246064, + "grad_norm": 0.2570405060046422, + "learning_rate": 0.00010610411264421611, + "loss": 0.6507, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6568108797073364, + "step": 3205, + "valid_targets_mean": 16679.7, + "valid_targets_min": 714 + }, + { + "epoch": 0.8566853482786229, + "grad_norm": 0.37474591801273793, + "learning_rate": 0.0001059450711671799, + "loss": 0.6544, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6513127088546753, + "step": 3210, + "valid_targets_mean": 15614.5, + "valid_targets_min": 255 + }, + { + "epoch": 0.8580197491326395, + "grad_norm": 0.3141516713671115, + "learning_rate": 0.0001057858618113189, + "loss": 0.6644, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6733075380325317, + "step": 3215, + "valid_targets_mean": 15210.8, + "valid_targets_min": 740 + }, + { + "epoch": 0.859354149986656, + "grad_norm": 0.2974994549393474, + "learning_rate": 0.00010562648544035323, + "loss": 0.6449, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6401640772819519, + "step": 3220, + "valid_targets_mean": 15541.6, + "valid_targets_min": 391 + }, + { + "epoch": 0.8606885508406725, + "grad_norm": 0.3388673466882177, + "learning_rate": 0.00010546694291890902, + "loss": 0.6254, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6491298675537109, + "step": 3225, + "valid_targets_mean": 14598.7, + "valid_targets_min": 733 + }, + { + "epoch": 0.8620229516946891, + "grad_norm": 0.4371152887391013, + "learning_rate": 0.00010530723511251382, + "loss": 0.6544, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6556539535522461, + "step": 3230, + "valid_targets_mean": 15699.9, + "valid_targets_min": 464 + }, + { + "epoch": 0.8633573525487056, + "grad_norm": 0.5767723282397708, + "learning_rate": 0.0001051473628875918, + "loss": 0.6468, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6518882513046265, + "step": 3235, + "valid_targets_mean": 15763.0, + "valid_targets_min": 340 + }, + { + "epoch": 0.8646917534027222, + "grad_norm": 0.30426789707079194, + "learning_rate": 0.00010498732711145918, + "loss": 0.6601, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6652976274490356, + "step": 3240, + "valid_targets_mean": 15535.9, + "valid_targets_min": 816 + }, + { + "epoch": 0.8660261542567387, + "grad_norm": 0.4130220093019007, + "learning_rate": 0.00010482712865231942, + "loss": 0.623, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6167925596237183, + "step": 3245, + "valid_targets_mean": 16325.2, + "valid_targets_min": 469 + }, + { + "epoch": 0.8673605551107553, + "grad_norm": 0.36276171852808714, + "learning_rate": 0.00010466676837925857, + "loss": 0.6441, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6520528793334961, + "step": 3250, + "valid_targets_mean": 16459.6, + "valid_targets_min": 580 + }, + { + "epoch": 0.8686949559647719, + "grad_norm": 0.4067218367888341, + "learning_rate": 0.00010450624716224045, + "loss": 0.6573, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6417218446731567, + "step": 3255, + "valid_targets_mean": 15986.3, + "valid_targets_min": 705 + }, + { + "epoch": 0.8700293568187883, + "grad_norm": 0.24818738071714427, + "learning_rate": 0.00010434556587210214, + "loss": 0.6394, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.64249587059021, + "step": 3260, + "valid_targets_mean": 17100.3, + "valid_targets_min": 666 + }, + { + "epoch": 0.8713637576728049, + "grad_norm": 0.3850215570427052, + "learning_rate": 0.000104184725380549, + "loss": 0.6619, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6386861801147461, + "step": 3265, + "valid_targets_mean": 16787.6, + "valid_targets_min": 337 + }, + { + "epoch": 0.8726981585268214, + "grad_norm": 0.3584729041483362, + "learning_rate": 0.0001040237265601502, + "loss": 0.6511, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.627690315246582, + "step": 3270, + "valid_targets_mean": 17029.8, + "valid_targets_min": 6 + }, + { + "epoch": 0.874032559380838, + "grad_norm": 0.4339765963953783, + "learning_rate": 0.00010386257028433366, + "loss": 0.6427, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6622530817985535, + "step": 3275, + "valid_targets_mean": 14468.4, + "valid_targets_min": 244 + }, + { + "epoch": 0.8753669602348545, + "grad_norm": 0.2825943811936514, + "learning_rate": 0.00010370125742738173, + "loss": 0.6424, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6384086608886719, + "step": 3280, + "valid_targets_mean": 16163.9, + "valid_targets_min": 534 + }, + { + "epoch": 0.8767013610888711, + "grad_norm": 0.29040496771866525, + "learning_rate": 0.00010353978886442605, + "loss": 0.6662, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6597708463668823, + "step": 3285, + "valid_targets_mean": 15830.2, + "valid_targets_min": 133 + }, + { + "epoch": 0.8780357619428877, + "grad_norm": 0.41728095971133644, + "learning_rate": 0.00010337816547144308, + "loss": 0.6708, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6693861484527588, + "step": 3290, + "valid_targets_mean": 15653.0, + "valid_targets_min": 818 + }, + { + "epoch": 0.8793701627969042, + "grad_norm": 0.3651738291095255, + "learning_rate": 0.00010321638812524917, + "loss": 0.6547, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.659409761428833, + "step": 3295, + "valid_targets_mean": 16814.6, + "valid_targets_min": 362 + }, + { + "epoch": 0.8807045636509208, + "grad_norm": 0.3325618768861608, + "learning_rate": 0.00010305445770349593, + "loss": 0.6414, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6621459722518921, + "step": 3300, + "valid_targets_mean": 16536.9, + "valid_targets_min": 398 + }, + { + "epoch": 0.8820389645049372, + "grad_norm": 0.28918434164279605, + "learning_rate": 0.00010289237508466536, + "loss": 0.6448, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6440975666046143, + "step": 3305, + "valid_targets_mean": 15207.3, + "valid_targets_min": 530 + }, + { + "epoch": 0.8833733653589538, + "grad_norm": 0.4985808542613525, + "learning_rate": 0.00010273014114806517, + "loss": 0.6388, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.642197847366333, + "step": 3310, + "valid_targets_mean": 15152.4, + "valid_targets_min": 568 + }, + { + "epoch": 0.8847077662129704, + "grad_norm": 0.39850878457550165, + "learning_rate": 0.000102567756773824, + "loss": 0.6527, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6053390502929688, + "step": 3315, + "valid_targets_mean": 16184.6, + "valid_targets_min": 689 + }, + { + "epoch": 0.8860421670669869, + "grad_norm": 0.30925451590653463, + "learning_rate": 0.00010240522284288657, + "loss": 0.6404, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6605707406997681, + "step": 3320, + "valid_targets_mean": 14017.9, + "valid_targets_min": 409 + }, + { + "epoch": 0.8873765679210035, + "grad_norm": 0.3691668202190612, + "learning_rate": 0.00010224254023700899, + "loss": 0.652, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6467193961143494, + "step": 3325, + "valid_targets_mean": 16063.3, + "valid_targets_min": 699 + }, + { + "epoch": 0.88871096877502, + "grad_norm": 0.2674717558464169, + "learning_rate": 0.00010207970983875395, + "loss": 0.6522, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6779950857162476, + "step": 3330, + "valid_targets_mean": 15231.2, + "valid_targets_min": 606 + }, + { + "epoch": 0.8900453696290366, + "grad_norm": 0.20038688374080343, + "learning_rate": 0.00010191673253148589, + "loss": 0.6484, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6465331315994263, + "step": 3335, + "valid_targets_mean": 15670.2, + "valid_targets_min": 386 + }, + { + "epoch": 0.8913797704830531, + "grad_norm": 0.28330757770723614, + "learning_rate": 0.00010175360919936623, + "loss": 0.6506, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6360025405883789, + "step": 3340, + "valid_targets_mean": 16725.9, + "valid_targets_min": 459 + }, + { + "epoch": 0.8927141713370697, + "grad_norm": 0.3439479225547816, + "learning_rate": 0.00010159034072734865, + "loss": 0.63, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6294069886207581, + "step": 3345, + "valid_targets_mean": 16449.0, + "valid_targets_min": 376 + }, + { + "epoch": 0.8940485721910862, + "grad_norm": 0.2700394489223394, + "learning_rate": 0.00010142692800117416, + "loss": 0.6418, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6559712886810303, + "step": 3350, + "valid_targets_mean": 16355.4, + "valid_targets_min": 545 + }, + { + "epoch": 0.8953829730451027, + "grad_norm": 0.3290237145673029, + "learning_rate": 0.00010126337190736636, + "loss": 0.65, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6721099615097046, + "step": 3355, + "valid_targets_mean": 15148.3, + "valid_targets_min": 67 + }, + { + "epoch": 0.8967173738991193, + "grad_norm": 0.24940716395634227, + "learning_rate": 0.00010109967333322669, + "loss": 0.6475, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6641243696212769, + "step": 3360, + "valid_targets_mean": 15853.0, + "valid_targets_min": 732 + }, + { + "epoch": 0.8980517747531358, + "grad_norm": 0.3767555898917068, + "learning_rate": 0.00010093583316682945, + "loss": 0.6475, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6830979585647583, + "step": 3365, + "valid_targets_mean": 14323.9, + "valid_targets_min": 512 + }, + { + "epoch": 0.8993861756071524, + "grad_norm": 0.31077570308089764, + "learning_rate": 0.00010077185229701722, + "loss": 0.6438, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6360262632369995, + "step": 3370, + "valid_targets_mean": 15914.6, + "valid_targets_min": 288 + }, + { + "epoch": 0.900720576461169, + "grad_norm": 0.35636066897001256, + "learning_rate": 0.00010060773161339574, + "loss": 0.6381, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6645758152008057, + "step": 3375, + "valid_targets_mean": 15709.9, + "valid_targets_min": 78 + }, + { + "epoch": 0.9020549773151855, + "grad_norm": 0.3168169499045184, + "learning_rate": 0.00010044347200632943, + "loss": 0.638, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6317712664604187, + "step": 3380, + "valid_targets_mean": 15377.5, + "valid_targets_min": 481 + }, + { + "epoch": 0.9033893781692021, + "grad_norm": 0.34833612107690176, + "learning_rate": 0.00010027907436693623, + "loss": 0.6494, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6437000036239624, + "step": 3385, + "valid_targets_mean": 14439.3, + "valid_targets_min": 410 + }, + { + "epoch": 0.9047237790232185, + "grad_norm": 0.22139220732501388, + "learning_rate": 0.00010011453958708297, + "loss": 0.6508, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6224488615989685, + "step": 3390, + "valid_targets_mean": 15715.7, + "valid_targets_min": 498 + }, + { + "epoch": 0.9060581798772351, + "grad_norm": 0.27304939667752415, + "learning_rate": 9.994986855938047e-05, + "loss": 0.6501, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6275122761726379, + "step": 3395, + "valid_targets_mean": 16695.6, + "valid_targets_min": 660 + }, + { + "epoch": 0.9073925807312516, + "grad_norm": 0.22683624420794118, + "learning_rate": 9.978506217717874e-05, + "loss": 0.6419, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6165873408317566, + "step": 3400, + "valid_targets_mean": 16133.7, + "valid_targets_min": 672 + }, + { + "epoch": 0.9087269815852682, + "grad_norm": 0.3781598294210209, + "learning_rate": 9.962012133456204e-05, + "loss": 0.6531, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6441546678543091, + "step": 3405, + "valid_targets_mean": 16254.3, + "valid_targets_min": 364 + }, + { + "epoch": 0.9100613824392848, + "grad_norm": 0.3485691664629273, + "learning_rate": 9.945504692634409e-05, + "loss": 0.6384, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6154640913009644, + "step": 3410, + "valid_targets_mean": 15014.2, + "valid_targets_min": 644 + }, + { + "epoch": 0.9113957832933013, + "grad_norm": 0.2941331404988799, + "learning_rate": 9.928983984806326e-05, + "loss": 0.6405, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6541690826416016, + "step": 3415, + "valid_targets_mean": 16053.0, + "valid_targets_min": 534 + }, + { + "epoch": 0.9127301841473179, + "grad_norm": 0.2940870924679832, + "learning_rate": 9.912450099597765e-05, + "loss": 0.6429, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6771601438522339, + "step": 3420, + "valid_targets_mean": 15410.8, + "valid_targets_min": 701 + }, + { + "epoch": 0.9140645850013344, + "grad_norm": 0.2540267547781181, + "learning_rate": 9.895903126706019e-05, + "loss": 0.6478, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6407514810562134, + "step": 3425, + "valid_targets_mean": 15978.2, + "valid_targets_min": 446 + }, + { + "epoch": 0.915398985855351, + "grad_norm": 0.58827205007206, + "learning_rate": 9.879343155899382e-05, + "loss": 0.6342, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6365908980369568, + "step": 3430, + "valid_targets_mean": 15551.0, + "valid_targets_min": 791 + }, + { + "epoch": 0.9167333867093675, + "grad_norm": 0.48345445350401867, + "learning_rate": 9.862770277016676e-05, + "loss": 0.647, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6549006700515747, + "step": 3435, + "valid_targets_mean": 16312.3, + "valid_targets_min": 712 + }, + { + "epoch": 0.918067787563384, + "grad_norm": 0.6096917662718333, + "learning_rate": 9.846184579966733e-05, + "loss": 0.6416, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6357414126396179, + "step": 3440, + "valid_targets_mean": 16554.4, + "valid_targets_min": 498 + }, + { + "epoch": 0.9194021884174006, + "grad_norm": 0.5175036160963103, + "learning_rate": 9.829586154727933e-05, + "loss": 0.6507, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6284055709838867, + "step": 3445, + "valid_targets_mean": 15700.8, + "valid_targets_min": 839 + }, + { + "epoch": 0.9207365892714171, + "grad_norm": 0.38330154473288014, + "learning_rate": 9.812975091347706e-05, + "loss": 0.6359, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6508110761642456, + "step": 3450, + "valid_targets_mean": 15062.5, + "valid_targets_min": 572 + }, + { + "epoch": 0.9220709901254337, + "grad_norm": 0.4369589415188452, + "learning_rate": 9.796351479942047e-05, + "loss": 0.6491, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6330595016479492, + "step": 3455, + "valid_targets_mean": 16589.2, + "valid_targets_min": 434 + }, + { + "epoch": 0.9234053909794502, + "grad_norm": 0.428584499898361, + "learning_rate": 9.779715410695015e-05, + "loss": 0.6463, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6327037811279297, + "step": 3460, + "valid_targets_mean": 16817.5, + "valid_targets_min": 409 + }, + { + "epoch": 0.9247397918334668, + "grad_norm": 0.5171308232638616, + "learning_rate": 9.76306697385827e-05, + "loss": 0.6502, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6380854845046997, + "step": 3465, + "valid_targets_mean": 16331.6, + "valid_targets_min": 717 + }, + { + "epoch": 0.9260741926874834, + "grad_norm": 0.5943448075228943, + "learning_rate": 9.746406259750552e-05, + "loss": 0.6614, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6656478047370911, + "step": 3470, + "valid_targets_mean": 14692.4, + "valid_targets_min": 570 + }, + { + "epoch": 0.9274085935414998, + "grad_norm": 0.45121493438958316, + "learning_rate": 9.729733358757213e-05, + "loss": 0.6312, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6517891883850098, + "step": 3475, + "valid_targets_mean": 16139.6, + "valid_targets_min": 758 + }, + { + "epoch": 0.9287429943955164, + "grad_norm": 0.2765978957054617, + "learning_rate": 9.713048361329715e-05, + "loss": 0.644, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6355182528495789, + "step": 3480, + "valid_targets_mean": 16863.1, + "valid_targets_min": 403 + }, + { + "epoch": 0.9300773952495329, + "grad_norm": 0.5155652814279078, + "learning_rate": 9.696351357985154e-05, + "loss": 0.6605, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6674410104751587, + "step": 3485, + "valid_targets_mean": 14653.7, + "valid_targets_min": 648 + }, + { + "epoch": 0.9314117961035495, + "grad_norm": 0.5064196677900263, + "learning_rate": 9.679642439305744e-05, + "loss": 0.6589, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6703199148178101, + "step": 3490, + "valid_targets_mean": 16033.6, + "valid_targets_min": 765 + }, + { + "epoch": 0.932746196957566, + "grad_norm": 0.5571820953695459, + "learning_rate": 9.662921695938354e-05, + "loss": 0.6379, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6885676383972168, + "step": 3495, + "valid_targets_mean": 15294.4, + "valid_targets_min": 655 + }, + { + "epoch": 0.9340805978115826, + "grad_norm": 0.39708045174193374, + "learning_rate": 9.646189218593992e-05, + "loss": 0.647, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6267415881156921, + "step": 3500, + "valid_targets_mean": 15537.8, + "valid_targets_min": 449 + }, + { + "epoch": 0.9354149986655992, + "grad_norm": 0.43893302118614175, + "learning_rate": 9.629445098047334e-05, + "loss": 0.6566, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6632278561592102, + "step": 3505, + "valid_targets_mean": 16264.6, + "valid_targets_min": 334 + }, + { + "epoch": 0.9367493995196157, + "grad_norm": 0.38062901384662845, + "learning_rate": 9.61268942513621e-05, + "loss": 0.6338, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6326217651367188, + "step": 3510, + "valid_targets_mean": 14996.4, + "valid_targets_min": 756 + }, + { + "epoch": 0.9380838003736323, + "grad_norm": 0.49266598679797097, + "learning_rate": 9.595922290761128e-05, + "loss": 0.6516, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6653306484222412, + "step": 3515, + "valid_targets_mean": 16628.6, + "valid_targets_min": 624 + }, + { + "epoch": 0.9394182012276487, + "grad_norm": 0.35614289136880733, + "learning_rate": 9.579143785884779e-05, + "loss": 0.6287, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6084467768669128, + "step": 3520, + "valid_targets_mean": 16826.6, + "valid_targets_min": 887 + }, + { + "epoch": 0.9407526020816653, + "grad_norm": 0.37113715768790856, + "learning_rate": 9.562354001531532e-05, + "loss": 0.655, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6197367310523987, + "step": 3525, + "valid_targets_mean": 15503.0, + "valid_targets_min": 351 + }, + { + "epoch": 0.9420870029356819, + "grad_norm": 0.41762638777021666, + "learning_rate": 9.545553028786952e-05, + "loss": 0.6315, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6234275102615356, + "step": 3530, + "valid_targets_mean": 15646.6, + "valid_targets_min": 723 + }, + { + "epoch": 0.9434214037896984, + "grad_norm": 0.44380341857698374, + "learning_rate": 9.5287409587973e-05, + "loss": 0.6407, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6393918395042419, + "step": 3535, + "valid_targets_mean": 15084.2, + "valid_targets_min": 625 + }, + { + "epoch": 0.944755804643715, + "grad_norm": 0.3892234490208754, + "learning_rate": 9.511917882769042e-05, + "loss": 0.6391, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6391283273696899, + "step": 3540, + "valid_targets_mean": 16098.1, + "valid_targets_min": 918 + }, + { + "epoch": 0.9460902054977315, + "grad_norm": 0.43778742220118544, + "learning_rate": 9.495083891968351e-05, + "loss": 0.6486, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6234838962554932, + "step": 3545, + "valid_targets_mean": 15090.8, + "valid_targets_min": 159 + }, + { + "epoch": 0.9474246063517481, + "grad_norm": 0.381850694877453, + "learning_rate": 9.478239077720615e-05, + "loss": 0.6499, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6469874978065491, + "step": 3550, + "valid_targets_mean": 16223.9, + "valid_targets_min": 760 + }, + { + "epoch": 0.9487590072057646, + "grad_norm": 0.41317054151838634, + "learning_rate": 9.461383531409937e-05, + "loss": 0.6389, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6466406583786011, + "step": 3555, + "valid_targets_mean": 16031.7, + "valid_targets_min": 437 + }, + { + "epoch": 0.9500934080597812, + "grad_norm": 0.30576626565173615, + "learning_rate": 9.444517344478645e-05, + "loss": 0.6482, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6074718236923218, + "step": 3560, + "valid_targets_mean": 16289.6, + "valid_targets_min": 584 + }, + { + "epoch": 0.9514278089137977, + "grad_norm": 0.349699953608093, + "learning_rate": 9.427640608426789e-05, + "loss": 0.6425, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6368805170059204, + "step": 3565, + "valid_targets_mean": 16044.6, + "valid_targets_min": 427 + }, + { + "epoch": 0.9527622097678142, + "grad_norm": 0.34546045313356855, + "learning_rate": 9.410753414811654e-05, + "loss": 0.6377, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6125216484069824, + "step": 3570, + "valid_targets_mean": 16506.6, + "valid_targets_min": 648 + }, + { + "epoch": 0.9540966106218308, + "grad_norm": 0.3893315863348032, + "learning_rate": 9.393855855247254e-05, + "loss": 0.6687, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6844526529312134, + "step": 3575, + "valid_targets_mean": 16149.5, + "valid_targets_min": 643 + }, + { + "epoch": 0.9554310114758473, + "grad_norm": 0.2633863843990565, + "learning_rate": 9.376948021403838e-05, + "loss": 0.6567, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6337841749191284, + "step": 3580, + "valid_targets_mean": 16207.8, + "valid_targets_min": 181 + }, + { + "epoch": 0.9567654123298639, + "grad_norm": 0.29692519605292395, + "learning_rate": 9.360030005007399e-05, + "loss": 0.647, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6229900121688843, + "step": 3585, + "valid_targets_mean": 15579.8, + "valid_targets_min": 420 + }, + { + "epoch": 0.9580998131838805, + "grad_norm": 0.2757188736918943, + "learning_rate": 9.343101897839169e-05, + "loss": 0.6508, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6774806976318359, + "step": 3590, + "valid_targets_mean": 15031.3, + "valid_targets_min": 485 + }, + { + "epoch": 0.959434214037897, + "grad_norm": 0.31332494454541954, + "learning_rate": 9.326163791735116e-05, + "loss": 0.6292, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6396254301071167, + "step": 3595, + "valid_targets_mean": 16527.8, + "valid_targets_min": 976 + }, + { + "epoch": 0.9607686148919136, + "grad_norm": 0.36077294744202587, + "learning_rate": 9.309215778585461e-05, + "loss": 0.6457, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6841853857040405, + "step": 3600, + "valid_targets_mean": 16090.1, + "valid_targets_min": 535 + }, + { + "epoch": 0.96210301574593, + "grad_norm": 0.2672498287309418, + "learning_rate": 9.29225795033417e-05, + "loss": 0.6541, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6412582397460938, + "step": 3605, + "valid_targets_mean": 16092.3, + "valid_targets_min": 570 + }, + { + "epoch": 0.9634374165999466, + "grad_norm": 0.2540687238294275, + "learning_rate": 9.275290398978454e-05, + "loss": 0.6652, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6630794405937195, + "step": 3610, + "valid_targets_mean": 14939.0, + "valid_targets_min": 355 + }, + { + "epoch": 0.9647718174539631, + "grad_norm": 0.2131800114252568, + "learning_rate": 9.258313216568273e-05, + "loss": 0.6461, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6630018949508667, + "step": 3615, + "valid_targets_mean": 16149.2, + "valid_targets_min": 510 + }, + { + "epoch": 0.9661062183079797, + "grad_norm": 0.24902095013861963, + "learning_rate": 9.241326495205836e-05, + "loss": 0.6539, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6484121084213257, + "step": 3620, + "valid_targets_mean": 15283.1, + "valid_targets_min": 688 + }, + { + "epoch": 0.9674406191619963, + "grad_norm": 0.2524604516006915, + "learning_rate": 9.224330327045105e-05, + "loss": 0.6348, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6242421269416809, + "step": 3625, + "valid_targets_mean": 15518.7, + "valid_targets_min": 801 + }, + { + "epoch": 0.9687750200160128, + "grad_norm": 0.28238647446499715, + "learning_rate": 9.207324804291285e-05, + "loss": 0.6475, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6292116641998291, + "step": 3630, + "valid_targets_mean": 16086.4, + "valid_targets_min": 513 + }, + { + "epoch": 0.9701094208700294, + "grad_norm": 0.29096513969754145, + "learning_rate": 9.190310019200338e-05, + "loss": 0.6444, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6281774044036865, + "step": 3635, + "valid_targets_mean": 16468.9, + "valid_targets_min": 456 + }, + { + "epoch": 0.9714438217240459, + "grad_norm": 0.2546985499074181, + "learning_rate": 9.173286064078465e-05, + "loss": 0.6639, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6918833255767822, + "step": 3640, + "valid_targets_mean": 15578.0, + "valid_targets_min": 563 + }, + { + "epoch": 0.9727782225780625, + "grad_norm": 0.25499970964039437, + "learning_rate": 9.156253031281625e-05, + "loss": 0.6588, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6605820059776306, + "step": 3645, + "valid_targets_mean": 14916.7, + "valid_targets_min": 757 + }, + { + "epoch": 0.974112623432079, + "grad_norm": 0.3389180129292924, + "learning_rate": 9.139211013215013e-05, + "loss": 0.6547, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6656877398490906, + "step": 3650, + "valid_targets_mean": 15895.6, + "valid_targets_min": 143 + }, + { + "epoch": 0.9754470242860955, + "grad_norm": 0.25053024078219016, + "learning_rate": 9.122160102332583e-05, + "loss": 0.6503, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6228987574577332, + "step": 3655, + "valid_targets_mean": 16149.6, + "valid_targets_min": 221 + }, + { + "epoch": 0.9767814251401121, + "grad_norm": 0.2178268898809574, + "learning_rate": 9.105100391136523e-05, + "loss": 0.6346, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6444330215454102, + "step": 3660, + "valid_targets_mean": 15280.1, + "valid_targets_min": 826 + }, + { + "epoch": 0.9781158259941286, + "grad_norm": 0.27511389097304567, + "learning_rate": 9.088031972176764e-05, + "loss": 0.6362, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6305812001228333, + "step": 3665, + "valid_targets_mean": 16102.7, + "valid_targets_min": 800 + }, + { + "epoch": 0.9794502268481452, + "grad_norm": 0.27125123958326863, + "learning_rate": 9.070954938050482e-05, + "loss": 0.6569, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6606098413467407, + "step": 3670, + "valid_targets_mean": 15203.1, + "valid_targets_min": 332 + }, + { + "epoch": 0.9807846277021617, + "grad_norm": 0.30513794835142677, + "learning_rate": 9.053869381401589e-05, + "loss": 0.6471, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6514785885810852, + "step": 3675, + "valid_targets_mean": 15489.2, + "valid_targets_min": 566 + }, + { + "epoch": 0.9821190285561783, + "grad_norm": 0.2674682260881522, + "learning_rate": 9.036775394920228e-05, + "loss": 0.6474, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6139630079269409, + "step": 3680, + "valid_targets_mean": 17697.0, + "valid_targets_min": 309 + }, + { + "epoch": 0.9834534294101949, + "grad_norm": 0.42011865968688955, + "learning_rate": 9.01967307134228e-05, + "loss": 0.643, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6135485768318176, + "step": 3685, + "valid_targets_mean": 16937.3, + "valid_targets_min": 582 + }, + { + "epoch": 0.9847878302642114, + "grad_norm": 0.25991299262090733, + "learning_rate": 9.00256250344885e-05, + "loss": 0.6352, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6385388970375061, + "step": 3690, + "valid_targets_mean": 17042.7, + "valid_targets_min": 484 + }, + { + "epoch": 0.9861222311182279, + "grad_norm": 0.3094872030920946, + "learning_rate": 8.985443784065774e-05, + "loss": 0.6347, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6620912551879883, + "step": 3695, + "valid_targets_mean": 16172.8, + "valid_targets_min": 437 + }, + { + "epoch": 0.9874566319722444, + "grad_norm": 0.2648905621560967, + "learning_rate": 8.968317006063107e-05, + "loss": 0.643, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6437067985534668, + "step": 3700, + "valid_targets_mean": 15814.3, + "valid_targets_min": 666 + }, + { + "epoch": 0.988791032826261, + "grad_norm": 0.2872339382049347, + "learning_rate": 8.951182262354624e-05, + "loss": 0.6226, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.634140133857727, + "step": 3705, + "valid_targets_mean": 15975.5, + "valid_targets_min": 922 + }, + { + "epoch": 0.9901254336802775, + "grad_norm": 0.22777511656801333, + "learning_rate": 8.934039645897316e-05, + "loss": 0.6508, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6716867685317993, + "step": 3710, + "valid_targets_mean": 16354.8, + "valid_targets_min": 704 + }, + { + "epoch": 0.9914598345342941, + "grad_norm": 0.2817686690598872, + "learning_rate": 8.916889249690877e-05, + "loss": 0.6598, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6462900638580322, + "step": 3715, + "valid_targets_mean": 15771.1, + "valid_targets_min": 120 + }, + { + "epoch": 0.9927942353883107, + "grad_norm": 0.2206326896920367, + "learning_rate": 8.899731166777216e-05, + "loss": 0.6583, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6339864134788513, + "step": 3720, + "valid_targets_mean": 16834.7, + "valid_targets_min": 98 + }, + { + "epoch": 0.9941286362423272, + "grad_norm": 0.5024525222279345, + "learning_rate": 8.882565490239935e-05, + "loss": 0.6259, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6254690885543823, + "step": 3725, + "valid_targets_mean": 15646.8, + "valid_targets_min": 472 + }, + { + "epoch": 0.9954630370963438, + "grad_norm": 0.3856087446468771, + "learning_rate": 8.865392313203839e-05, + "loss": 0.6402, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6251246333122253, + "step": 3730, + "valid_targets_mean": 15004.9, + "valid_targets_min": 630 + }, + { + "epoch": 0.9967974379503602, + "grad_norm": 0.40239943536134476, + "learning_rate": 8.848211728834415e-05, + "loss": 0.6633, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6419751644134521, + "step": 3735, + "valid_targets_mean": 15467.9, + "valid_targets_min": 319 + }, + { + "epoch": 0.9981318388043768, + "grad_norm": 0.31304776164504733, + "learning_rate": 8.831023830337348e-05, + "loss": 0.6602, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6425862312316895, + "step": 3740, + "valid_targets_mean": 14812.8, + "valid_targets_min": 431 + }, + { + "epoch": 0.9994662396583934, + "grad_norm": 0.35589672329273264, + "learning_rate": 8.813828710957987e-05, + "loss": 0.6247, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6540701389312744, + "step": 3745, + "valid_targets_mean": 15883.5, + "valid_targets_min": 492 + }, + { + "epoch": 1.00080064051241, + "grad_norm": 0.26760563380752905, + "learning_rate": 8.796626463980863e-05, + "loss": 0.6313, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6551904678344727, + "step": 3750, + "valid_targets_mean": 17182.7, + "valid_targets_min": 696 + }, + { + "epoch": 1.0021350413664265, + "grad_norm": 0.31015553596849776, + "learning_rate": 8.779417182729181e-05, + "loss": 0.6395, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6176386475563049, + "step": 3755, + "valid_targets_mean": 16216.0, + "valid_targets_min": 610 + }, + { + "epoch": 1.003469442220443, + "grad_norm": 0.19888626057576428, + "learning_rate": 8.762200960564295e-05, + "loss": 0.6428, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6564364433288574, + "step": 3760, + "valid_targets_mean": 16117.9, + "valid_targets_min": 216 + }, + { + "epoch": 1.0048038430744595, + "grad_norm": 0.31576042269966875, + "learning_rate": 8.744977890885218e-05, + "loss": 0.6372, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6488126516342163, + "step": 3765, + "valid_targets_mean": 15915.4, + "valid_targets_min": 796 + }, + { + "epoch": 1.006138243928476, + "grad_norm": 0.37031993459449786, + "learning_rate": 8.727748067128116e-05, + "loss": 0.6441, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6726912260055542, + "step": 3770, + "valid_targets_mean": 14668.3, + "valid_targets_min": 583 + }, + { + "epoch": 1.0074726447824927, + "grad_norm": 0.25852458130057065, + "learning_rate": 8.71051158276579e-05, + "loss": 0.6408, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.630450963973999, + "step": 3775, + "valid_targets_mean": 17935.9, + "valid_targets_min": 563 + }, + { + "epoch": 1.0088070456365092, + "grad_norm": 0.2507167855310047, + "learning_rate": 8.693268531307182e-05, + "loss": 0.6495, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6480845808982849, + "step": 3780, + "valid_targets_mean": 15486.5, + "valid_targets_min": 522 + }, + { + "epoch": 1.0101414464905258, + "grad_norm": 0.25299995341948267, + "learning_rate": 8.676019006296851e-05, + "loss": 0.6424, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6288371086120605, + "step": 3785, + "valid_targets_mean": 16877.4, + "valid_targets_min": 340 + }, + { + "epoch": 1.0114758473445422, + "grad_norm": 0.4671268307313036, + "learning_rate": 8.658763101314484e-05, + "loss": 0.647, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6182825565338135, + "step": 3790, + "valid_targets_mean": 15726.7, + "valid_targets_min": 771 + }, + { + "epoch": 1.0128102481985588, + "grad_norm": 0.4394010424816238, + "learning_rate": 8.64150090997438e-05, + "loss": 0.6323, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6484892964363098, + "step": 3795, + "valid_targets_mean": 15794.6, + "valid_targets_min": 640 + }, + { + "epoch": 1.0141446490525754, + "grad_norm": 0.4487423936581022, + "learning_rate": 8.624232525924936e-05, + "loss": 0.6433, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6359849572181702, + "step": 3800, + "valid_targets_mean": 16178.8, + "valid_targets_min": 679 + }, + { + "epoch": 1.015479049906592, + "grad_norm": 0.41831834818461444, + "learning_rate": 8.606958042848145e-05, + "loss": 0.6422, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6211769580841064, + "step": 3805, + "valid_targets_mean": 16291.6, + "valid_targets_min": 515 + }, + { + "epoch": 1.0168134507606086, + "grad_norm": 0.45389931206375994, + "learning_rate": 8.589677554459094e-05, + "loss": 0.625, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6307047605514526, + "step": 3810, + "valid_targets_mean": 17618.1, + "valid_targets_min": 87 + }, + { + "epoch": 1.018147851614625, + "grad_norm": 0.3268915481818196, + "learning_rate": 8.572391154505444e-05, + "loss": 0.6216, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6273326873779297, + "step": 3815, + "valid_targets_mean": 15623.5, + "valid_targets_min": 779 + }, + { + "epoch": 1.0194822524686415, + "grad_norm": 0.41308299425023076, + "learning_rate": 8.555098936766927e-05, + "loss": 0.6308, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6591796278953552, + "step": 3820, + "valid_targets_mean": 14928.0, + "valid_targets_min": 679 + }, + { + "epoch": 1.0208166533226581, + "grad_norm": 0.44942713175635873, + "learning_rate": 8.537800995054838e-05, + "loss": 0.6519, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6796396374702454, + "step": 3825, + "valid_targets_mean": 15782.7, + "valid_targets_min": 729 + }, + { + "epoch": 1.0221510541766747, + "grad_norm": 0.3653635630100857, + "learning_rate": 8.520497423211527e-05, + "loss": 0.6176, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6224901080131531, + "step": 3830, + "valid_targets_mean": 15665.9, + "valid_targets_min": 110 + }, + { + "epoch": 1.0234854550306913, + "grad_norm": 0.3963653125859711, + "learning_rate": 8.503188315109881e-05, + "loss": 0.6472, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6270386576652527, + "step": 3835, + "valid_targets_mean": 15768.8, + "valid_targets_min": 566 + }, + { + "epoch": 1.0248198558847077, + "grad_norm": 0.45406483483665866, + "learning_rate": 8.485873764652832e-05, + "loss": 0.6325, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6315596103668213, + "step": 3840, + "valid_targets_mean": 16419.9, + "valid_targets_min": 767 + }, + { + "epoch": 1.0261542567387243, + "grad_norm": 0.44474720584480903, + "learning_rate": 8.468553865772826e-05, + "loss": 0.6202, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6255053281784058, + "step": 3845, + "valid_targets_mean": 16084.4, + "valid_targets_min": 503 + }, + { + "epoch": 1.0274886575927409, + "grad_norm": 0.39211860098514184, + "learning_rate": 8.451228712431332e-05, + "loss": 0.6344, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6344472169876099, + "step": 3850, + "valid_targets_mean": 17080.2, + "valid_targets_min": 675 + }, + { + "epoch": 1.0288230584467575, + "grad_norm": 0.39459268154462224, + "learning_rate": 8.433898398618319e-05, + "loss": 0.6433, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6279346942901611, + "step": 3855, + "valid_targets_mean": 15763.7, + "valid_targets_min": 650 + }, + { + "epoch": 1.0301574593007738, + "grad_norm": 0.45597533762198056, + "learning_rate": 8.416563018351758e-05, + "loss": 0.6209, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6651809215545654, + "step": 3860, + "valid_targets_mean": 14995.1, + "valid_targets_min": 506 + }, + { + "epoch": 1.0314918601547904, + "grad_norm": 0.36845803818318634, + "learning_rate": 8.399222665677105e-05, + "loss": 0.646, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6424490213394165, + "step": 3865, + "valid_targets_mean": 16269.7, + "valid_targets_min": 727 + }, + { + "epoch": 1.032826261008807, + "grad_norm": 0.3660998871304325, + "learning_rate": 8.381877434666784e-05, + "loss": 0.6246, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6427116394042969, + "step": 3870, + "valid_targets_mean": 14471.5, + "valid_targets_min": 627 + }, + { + "epoch": 1.0341606618628236, + "grad_norm": 0.35705162926889794, + "learning_rate": 8.364527419419696e-05, + "loss": 0.6268, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6127498149871826, + "step": 3875, + "valid_targets_mean": 15339.7, + "valid_targets_min": 517 + }, + { + "epoch": 1.0354950627168402, + "grad_norm": 0.3976760051887081, + "learning_rate": 8.347172714060686e-05, + "loss": 0.6366, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6624436974525452, + "step": 3880, + "valid_targets_mean": 15717.8, + "valid_targets_min": 432 + }, + { + "epoch": 1.0368294635708566, + "grad_norm": 0.3248289435744747, + "learning_rate": 8.32981341274005e-05, + "loss": 0.6228, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6057945489883423, + "step": 3885, + "valid_targets_mean": 15022.4, + "valid_targets_min": 20 + }, + { + "epoch": 1.0381638644248732, + "grad_norm": 0.3799068194660505, + "learning_rate": 8.312449609633014e-05, + "loss": 0.634, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6380169987678528, + "step": 3890, + "valid_targets_mean": 16899.8, + "valid_targets_min": 629 + }, + { + "epoch": 1.0394982652788898, + "grad_norm": 0.27786217332276264, + "learning_rate": 8.295081398939227e-05, + "loss": 0.6264, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6606595516204834, + "step": 3895, + "valid_targets_mean": 15556.7, + "valid_targets_min": 554 + }, + { + "epoch": 1.0408326661329064, + "grad_norm": 0.3262178393145254, + "learning_rate": 8.277708874882252e-05, + "loss": 0.6278, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.608328104019165, + "step": 3900, + "valid_targets_mean": 16115.2, + "valid_targets_min": 787 + }, + { + "epoch": 1.042167066986923, + "grad_norm": 0.2967558099112656, + "learning_rate": 8.26033213170905e-05, + "loss": 0.6284, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6086621284484863, + "step": 3905, + "valid_targets_mean": 16689.7, + "valid_targets_min": 794 + }, + { + "epoch": 1.0435014678409393, + "grad_norm": 0.18378657045763086, + "learning_rate": 8.242951263689468e-05, + "loss": 0.6477, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6364154815673828, + "step": 3910, + "valid_targets_mean": 16203.4, + "valid_targets_min": 535 + }, + { + "epoch": 1.044835868694956, + "grad_norm": 0.2697854055357981, + "learning_rate": 8.225566365115738e-05, + "loss": 0.6357, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6307680606842041, + "step": 3915, + "valid_targets_mean": 16268.8, + "valid_targets_min": 544 + }, + { + "epoch": 1.0461702695489725, + "grad_norm": 0.32997967067160905, + "learning_rate": 8.20817753030195e-05, + "loss": 0.6354, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6161054372787476, + "step": 3920, + "valid_targets_mean": 16692.8, + "valid_targets_min": 399 + }, + { + "epoch": 1.0475046704029891, + "grad_norm": 0.2630706017357537, + "learning_rate": 8.190784853583554e-05, + "loss": 0.656, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6609646081924438, + "step": 3925, + "valid_targets_mean": 15393.3, + "valid_targets_min": 87 + }, + { + "epoch": 1.0488390712570057, + "grad_norm": 0.25045695026175163, + "learning_rate": 8.17338842931684e-05, + "loss": 0.6417, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6067150235176086, + "step": 3930, + "valid_targets_mean": 17500.9, + "valid_targets_min": 542 + }, + { + "epoch": 1.050173472111022, + "grad_norm": 0.2177517219494181, + "learning_rate": 8.155988351878433e-05, + "loss": 0.6276, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6083317995071411, + "step": 3935, + "valid_targets_mean": 15829.2, + "valid_targets_min": 872 + }, + { + "epoch": 1.0515078729650387, + "grad_norm": 0.3013828015707749, + "learning_rate": 8.138584715664766e-05, + "loss": 0.6578, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6143460273742676, + "step": 3940, + "valid_targets_mean": 15557.4, + "valid_targets_min": 861 + }, + { + "epoch": 1.0528422738190553, + "grad_norm": 0.30390911254139075, + "learning_rate": 8.121177615091591e-05, + "loss": 0.6457, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6318605542182922, + "step": 3945, + "valid_targets_mean": 15857.7, + "valid_targets_min": 36 + }, + { + "epoch": 1.0541766746730719, + "grad_norm": 0.3350524541259267, + "learning_rate": 8.103767144593445e-05, + "loss": 0.6341, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6261539459228516, + "step": 3950, + "valid_targets_mean": 16744.7, + "valid_targets_min": 463 + }, + { + "epoch": 1.0555110755270882, + "grad_norm": 0.30249343171639453, + "learning_rate": 8.086353398623154e-05, + "loss": 0.628, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6331799030303955, + "step": 3955, + "valid_targets_mean": 16559.9, + "valid_targets_min": 620 + }, + { + "epoch": 1.0568454763811048, + "grad_norm": 0.2546085452828038, + "learning_rate": 8.068936471651308e-05, + "loss": 0.6425, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6100320219993591, + "step": 3960, + "valid_targets_mean": 15661.1, + "valid_targets_min": 415 + }, + { + "epoch": 1.0581798772351214, + "grad_norm": 0.2646061268757464, + "learning_rate": 8.051516458165759e-05, + "loss": 0.6308, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6500637531280518, + "step": 3965, + "valid_targets_mean": 15055.7, + "valid_targets_min": 473 + }, + { + "epoch": 1.059514278089138, + "grad_norm": 0.19452961730319374, + "learning_rate": 8.0340934526711e-05, + "loss": 0.6433, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6682567596435547, + "step": 3970, + "valid_targets_mean": 15522.8, + "valid_targets_min": 587 + }, + { + "epoch": 1.0608486789431546, + "grad_norm": 0.2567508331337579, + "learning_rate": 8.016667549688157e-05, + "loss": 0.633, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6242945194244385, + "step": 3975, + "valid_targets_mean": 16522.6, + "valid_targets_min": 489 + }, + { + "epoch": 1.062183079797171, + "grad_norm": 0.21485742918403294, + "learning_rate": 7.999238843753474e-05, + "loss": 0.6357, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6230143308639526, + "step": 3980, + "valid_targets_mean": 15910.7, + "valid_targets_min": 810 + }, + { + "epoch": 1.0635174806511876, + "grad_norm": 0.22484131136152755, + "learning_rate": 7.981807429418803e-05, + "loss": 0.6644, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6617487072944641, + "step": 3985, + "valid_targets_mean": 15697.9, + "valid_targets_min": 621 + }, + { + "epoch": 1.0648518815052042, + "grad_norm": 0.20638645597298313, + "learning_rate": 7.96437340125059e-05, + "loss": 0.6214, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6088519096374512, + "step": 3990, + "valid_targets_mean": 17400.2, + "valid_targets_min": 665 + }, + { + "epoch": 1.0661862823592207, + "grad_norm": 0.27568755648856647, + "learning_rate": 7.946936853829458e-05, + "loss": 0.6405, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6442372798919678, + "step": 3995, + "valid_targets_mean": 16478.1, + "valid_targets_min": 430 + }, + { + "epoch": 1.0675206832132373, + "grad_norm": 0.3198359769041008, + "learning_rate": 7.929497881749699e-05, + "loss": 0.6363, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.630896806716919, + "step": 4000, + "valid_targets_mean": 17061.9, + "valid_targets_min": 775 + }, + { + "epoch": 1.0688550840672537, + "grad_norm": 0.3236960340782802, + "learning_rate": 7.912056579618759e-05, + "loss": 0.648, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6238499879837036, + "step": 4005, + "valid_targets_mean": 16409.8, + "valid_targets_min": 837 + }, + { + "epoch": 1.0701894849212703, + "grad_norm": 0.21317090795425317, + "learning_rate": 7.894613042056721e-05, + "loss": 0.6189, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6377233266830444, + "step": 4010, + "valid_targets_mean": 15927.7, + "valid_targets_min": 583 + }, + { + "epoch": 1.071523885775287, + "grad_norm": 0.3228179754734646, + "learning_rate": 7.877167363695805e-05, + "loss": 0.6405, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6575232148170471, + "step": 4015, + "valid_targets_mean": 15166.5, + "valid_targets_min": 329 + }, + { + "epoch": 1.0728582866293035, + "grad_norm": 0.22502051279544055, + "learning_rate": 7.859719639179834e-05, + "loss": 0.6227, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6041486263275146, + "step": 4020, + "valid_targets_mean": 16201.1, + "valid_targets_min": 364 + }, + { + "epoch": 1.07419268748332, + "grad_norm": 0.19018623600098714, + "learning_rate": 7.842269963163735e-05, + "loss": 0.6403, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.615936279296875, + "step": 4025, + "valid_targets_mean": 17408.3, + "valid_targets_min": 700 + }, + { + "epoch": 1.0755270883373365, + "grad_norm": 0.2633541076294458, + "learning_rate": 7.824818430313028e-05, + "loss": 0.635, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6207270622253418, + "step": 4030, + "valid_targets_mean": 16066.5, + "valid_targets_min": 57 + }, + { + "epoch": 1.076861489191353, + "grad_norm": 0.19894714512203296, + "learning_rate": 7.807365135303299e-05, + "loss": 0.6517, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6607016324996948, + "step": 4035, + "valid_targets_mean": 15828.8, + "valid_targets_min": 604 + }, + { + "epoch": 1.0781958900453696, + "grad_norm": 0.2939348493891375, + "learning_rate": 7.789910172819693e-05, + "loss": 0.635, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6290296316146851, + "step": 4040, + "valid_targets_mean": 16706.2, + "valid_targets_min": 544 + }, + { + "epoch": 1.0795302908993862, + "grad_norm": 0.27275384805874286, + "learning_rate": 7.772453637556411e-05, + "loss": 0.6592, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6724493503570557, + "step": 4045, + "valid_targets_mean": 16034.1, + "valid_targets_min": 249 + }, + { + "epoch": 1.0808646917534026, + "grad_norm": 0.35278405634413196, + "learning_rate": 7.754995624216176e-05, + "loss": 0.6371, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6188097596168518, + "step": 4050, + "valid_targets_mean": 16723.1, + "valid_targets_min": 574 + }, + { + "epoch": 1.0821990926074192, + "grad_norm": 0.26278431869708246, + "learning_rate": 7.737536227509734e-05, + "loss": 0.6304, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6200742721557617, + "step": 4055, + "valid_targets_mean": 15671.6, + "valid_targets_min": 392 + }, + { + "epoch": 1.0835334934614358, + "grad_norm": 0.27084560921646084, + "learning_rate": 7.720075542155336e-05, + "loss": 0.6645, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6747046709060669, + "step": 4060, + "valid_targets_mean": 15743.4, + "valid_targets_min": 786 + }, + { + "epoch": 1.0848678943154524, + "grad_norm": 0.22793996132664027, + "learning_rate": 7.702613662878223e-05, + "loss": 0.6523, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6548327803611755, + "step": 4065, + "valid_targets_mean": 15993.7, + "valid_targets_min": 609 + }, + { + "epoch": 1.086202295169469, + "grad_norm": 0.28041981538949434, + "learning_rate": 7.685150684410114e-05, + "loss": 0.6336, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6257905960083008, + "step": 4070, + "valid_targets_mean": 15352.7, + "valid_targets_min": 682 + }, + { + "epoch": 1.0875366960234856, + "grad_norm": 0.2253117839055684, + "learning_rate": 7.667686701488688e-05, + "loss": 0.6369, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5900462865829468, + "step": 4075, + "valid_targets_mean": 17873.3, + "valid_targets_min": 371 + }, + { + "epoch": 1.088871096877502, + "grad_norm": 0.23298394292558355, + "learning_rate": 7.650221808857081e-05, + "loss": 0.6425, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6310970187187195, + "step": 4080, + "valid_targets_mean": 16328.8, + "valid_targets_min": 548 + }, + { + "epoch": 1.0902054977315185, + "grad_norm": 0.20823478267229803, + "learning_rate": 7.632756101263358e-05, + "loss": 0.6231, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5811946392059326, + "step": 4085, + "valid_targets_mean": 17497.8, + "valid_targets_min": 411 + }, + { + "epoch": 1.0915398985855351, + "grad_norm": 0.28914326624880793, + "learning_rate": 7.615289673460003e-05, + "loss": 0.6376, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6378998756408691, + "step": 4090, + "valid_targets_mean": 14718.8, + "valid_targets_min": 495 + }, + { + "epoch": 1.0928742994395517, + "grad_norm": 0.29919918167845155, + "learning_rate": 7.59782262020341e-05, + "loss": 0.6268, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6432034373283386, + "step": 4095, + "valid_targets_mean": 16114.1, + "valid_targets_min": 308 + }, + { + "epoch": 1.094208700293568, + "grad_norm": 0.18872135872551207, + "learning_rate": 7.580355036253372e-05, + "loss": 0.6381, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6325193643569946, + "step": 4100, + "valid_targets_mean": 14879.7, + "valid_targets_min": 701 + }, + { + "epoch": 1.0955431011475847, + "grad_norm": 0.2170776845688349, + "learning_rate": 7.562887016372551e-05, + "loss": 0.6436, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6410015225410461, + "step": 4105, + "valid_targets_mean": 15726.7, + "valid_targets_min": 561 + }, + { + "epoch": 1.0968775020016013, + "grad_norm": 0.3454607950583436, + "learning_rate": 7.54541865532598e-05, + "loss": 0.6389, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6285821199417114, + "step": 4110, + "valid_targets_mean": 16712.9, + "valid_targets_min": 682 + }, + { + "epoch": 1.0982119028556179, + "grad_norm": 0.256231016783552, + "learning_rate": 7.527950047880543e-05, + "loss": 0.6378, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6538169980049133, + "step": 4115, + "valid_targets_mean": 15445.9, + "valid_targets_min": 477 + }, + { + "epoch": 1.0995463037096345, + "grad_norm": 0.2564298714151834, + "learning_rate": 7.51048128880446e-05, + "loss": 0.644, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6618050336837769, + "step": 4120, + "valid_targets_mean": 14654.4, + "valid_targets_min": 620 + }, + { + "epoch": 1.1008807045636508, + "grad_norm": 0.2391895949624863, + "learning_rate": 7.493012472866769e-05, + "loss": 0.6383, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6317932605743408, + "step": 4125, + "valid_targets_mean": 16660.1, + "valid_targets_min": 627 + }, + { + "epoch": 1.1022151054176674, + "grad_norm": 0.2307958569944933, + "learning_rate": 7.47554369483682e-05, + "loss": 0.6371, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.656184732913971, + "step": 4130, + "valid_targets_mean": 15621.7, + "valid_targets_min": 681 + }, + { + "epoch": 1.103549506271684, + "grad_norm": 0.24380743638684044, + "learning_rate": 7.458075049483762e-05, + "loss": 0.6299, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6304770112037659, + "step": 4135, + "valid_targets_mean": 16798.2, + "valid_targets_min": 458 + }, + { + "epoch": 1.1048839071257006, + "grad_norm": 0.28731780160095854, + "learning_rate": 7.44060663157602e-05, + "loss": 0.6378, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6511474251747131, + "step": 4140, + "valid_targets_mean": 16375.2, + "valid_targets_min": 765 + }, + { + "epoch": 1.1062183079797172, + "grad_norm": 0.2513566937786385, + "learning_rate": 7.423138535880779e-05, + "loss": 0.638, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6225339770317078, + "step": 4145, + "valid_targets_mean": 16275.2, + "valid_targets_min": 395 + }, + { + "epoch": 1.1075527088337336, + "grad_norm": 0.40907374807887503, + "learning_rate": 7.405670857163489e-05, + "loss": 0.6476, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6531241536140442, + "step": 4150, + "valid_targets_mean": 16403.7, + "valid_targets_min": 617 + }, + { + "epoch": 1.1088871096877502, + "grad_norm": 0.41217346744153255, + "learning_rate": 7.388203690187325e-05, + "loss": 0.6384, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6631238460540771, + "step": 4155, + "valid_targets_mean": 14551.2, + "valid_targets_min": 754 + }, + { + "epoch": 1.1102215105417668, + "grad_norm": 0.33374581286984195, + "learning_rate": 7.370737129712695e-05, + "loss": 0.6242, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6131796836853027, + "step": 4160, + "valid_targets_mean": 16204.9, + "valid_targets_min": 666 + }, + { + "epoch": 1.1115559113957834, + "grad_norm": 0.45881666367462687, + "learning_rate": 7.353271270496713e-05, + "loss": 0.6458, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6824424862861633, + "step": 4165, + "valid_targets_mean": 15262.4, + "valid_targets_min": 709 + }, + { + "epoch": 1.1128903122498, + "grad_norm": 0.3249252539125189, + "learning_rate": 7.335806207292687e-05, + "loss": 0.6408, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6273507475852966, + "step": 4170, + "valid_targets_mean": 16026.1, + "valid_targets_min": 831 + }, + { + "epoch": 1.1142247131038163, + "grad_norm": 0.41682632170083284, + "learning_rate": 7.31834203484961e-05, + "loss": 0.6408, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6524085402488708, + "step": 4175, + "valid_targets_mean": 14977.0, + "valid_targets_min": 735 + }, + { + "epoch": 1.115559113957833, + "grad_norm": 0.30109531205332285, + "learning_rate": 7.300878847911642e-05, + "loss": 0.6432, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6498684883117676, + "step": 4180, + "valid_targets_mean": 15246.6, + "valid_targets_min": 278 + }, + { + "epoch": 1.1168935148118495, + "grad_norm": 0.3671309009672698, + "learning_rate": 7.283416741217595e-05, + "loss": 0.6211, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6055911779403687, + "step": 4185, + "valid_targets_mean": 17311.5, + "valid_targets_min": 744 + }, + { + "epoch": 1.118227915665866, + "grad_norm": 0.3153704556403042, + "learning_rate": 7.26595580950042e-05, + "loss": 0.6513, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.687164306640625, + "step": 4190, + "valid_targets_mean": 15870.5, + "valid_targets_min": 859 + }, + { + "epoch": 1.1195623165198825, + "grad_norm": 0.3666269955347262, + "learning_rate": 7.248496147486695e-05, + "loss": 0.6189, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6103506088256836, + "step": 4195, + "valid_targets_mean": 17057.8, + "valid_targets_min": 436 + }, + { + "epoch": 1.120896717373899, + "grad_norm": 0.3438879047175211, + "learning_rate": 7.23103784989611e-05, + "loss": 0.6451, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6561911106109619, + "step": 4200, + "valid_targets_mean": 15884.4, + "valid_targets_min": 729 + }, + { + "epoch": 1.1222311182279157, + "grad_norm": 0.2833414402565143, + "learning_rate": 7.213581011440954e-05, + "loss": 0.6671, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6505024433135986, + "step": 4205, + "valid_targets_mean": 16336.9, + "valid_targets_min": 199 + }, + { + "epoch": 1.1235655190819323, + "grad_norm": 0.34970656377825804, + "learning_rate": 7.1961257268256e-05, + "loss": 0.6377, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6430806517601013, + "step": 4210, + "valid_targets_mean": 14787.7, + "valid_targets_min": 388 + }, + { + "epoch": 1.1248999199359488, + "grad_norm": 0.3823019646687883, + "learning_rate": 7.178672090745986e-05, + "loss": 0.6286, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6347396373748779, + "step": 4215, + "valid_targets_mean": 16203.0, + "valid_targets_min": 602 + }, + { + "epoch": 1.1262343207899652, + "grad_norm": 0.3278569894429977, + "learning_rate": 7.161220197889114e-05, + "loss": 0.6409, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6750344634056091, + "step": 4220, + "valid_targets_mean": 16876.0, + "valid_targets_min": 682 + }, + { + "epoch": 1.1275687216439818, + "grad_norm": 0.3283760936090551, + "learning_rate": 7.143770142932524e-05, + "loss": 0.6389, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6138772964477539, + "step": 4225, + "valid_targets_mean": 17061.0, + "valid_targets_min": 719 + }, + { + "epoch": 1.1289031224979984, + "grad_norm": 0.2751031909904081, + "learning_rate": 7.126322020543785e-05, + "loss": 0.6336, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.62000572681427, + "step": 4230, + "valid_targets_mean": 15323.3, + "valid_targets_min": 595 + }, + { + "epoch": 1.130237523352015, + "grad_norm": 0.3125927012088527, + "learning_rate": 7.108875925379991e-05, + "loss": 0.6333, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6249172687530518, + "step": 4235, + "valid_targets_mean": 14841.3, + "valid_targets_min": 574 + }, + { + "epoch": 1.1315719242060316, + "grad_norm": 0.2353496713324635, + "learning_rate": 7.091431952087221e-05, + "loss": 0.6535, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6486538648605347, + "step": 4240, + "valid_targets_mean": 15914.3, + "valid_targets_min": 604 + }, + { + "epoch": 1.132906325060048, + "grad_norm": 0.28818023845326846, + "learning_rate": 7.073990195300058e-05, + "loss": 0.6308, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.616797685623169, + "step": 4245, + "valid_targets_mean": 15263.0, + "valid_targets_min": 312 + }, + { + "epoch": 1.1342407259140646, + "grad_norm": 0.30990451144746395, + "learning_rate": 7.056550749641056e-05, + "loss": 0.6361, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6597074270248413, + "step": 4250, + "valid_targets_mean": 15883.9, + "valid_targets_min": 721 + }, + { + "epoch": 1.1355751267680811, + "grad_norm": 0.29519057375689733, + "learning_rate": 7.039113709720227e-05, + "loss": 0.6367, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6335593461990356, + "step": 4255, + "valid_targets_mean": 15723.1, + "valid_targets_min": 999 + }, + { + "epoch": 1.1369095276220977, + "grad_norm": 0.23344528739206696, + "learning_rate": 7.021679170134533e-05, + "loss": 0.6264, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6216973662376404, + "step": 4260, + "valid_targets_mean": 16099.4, + "valid_targets_min": 360 + }, + { + "epoch": 1.1382439284761143, + "grad_norm": 0.28822907095570005, + "learning_rate": 7.004247225467381e-05, + "loss": 0.6317, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6207790970802307, + "step": 4265, + "valid_targets_mean": 16510.5, + "valid_targets_min": 613 + }, + { + "epoch": 1.1395783293301307, + "grad_norm": 0.22615557292653501, + "learning_rate": 6.986817970288082e-05, + "loss": 0.6356, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6095227003097534, + "step": 4270, + "valid_targets_mean": 16566.2, + "valid_targets_min": 833 + }, + { + "epoch": 1.1409127301841473, + "grad_norm": 0.2789627702109262, + "learning_rate": 6.969391499151371e-05, + "loss": 0.6208, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.612389326095581, + "step": 4275, + "valid_targets_mean": 15183.5, + "valid_targets_min": 391 + }, + { + "epoch": 1.1422471310381639, + "grad_norm": 0.19826473078863655, + "learning_rate": 6.95196790659688e-05, + "loss": 0.6332, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6624350547790527, + "step": 4280, + "valid_targets_mean": 15083.0, + "valid_targets_min": 711 + }, + { + "epoch": 1.1435815318921805, + "grad_norm": 0.22431913852918883, + "learning_rate": 6.934547287148614e-05, + "loss": 0.6453, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6406052112579346, + "step": 4285, + "valid_targets_mean": 15643.4, + "valid_targets_min": 514 + }, + { + "epoch": 1.1449159327461969, + "grad_norm": 0.16484255463144135, + "learning_rate": 6.917129735314455e-05, + "loss": 0.6393, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6505135297775269, + "step": 4290, + "valid_targets_mean": 15640.7, + "valid_targets_min": 482 + }, + { + "epoch": 1.1462503336002134, + "grad_norm": 0.18808915828082584, + "learning_rate": 6.899715345585649e-05, + "loss": 0.6215, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6421415209770203, + "step": 4295, + "valid_targets_mean": 16454.7, + "valid_targets_min": 303 + }, + { + "epoch": 1.14758473445423, + "grad_norm": 0.20215904565478326, + "learning_rate": 6.882304212436272e-05, + "loss": 0.6413, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6256978511810303, + "step": 4300, + "valid_targets_mean": 16380.1, + "valid_targets_min": 657 + }, + { + "epoch": 1.1489191353082466, + "grad_norm": 0.48019910123488907, + "learning_rate": 6.864896430322745e-05, + "loss": 0.6659, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7197443246841431, + "step": 4305, + "valid_targets_mean": 15080.7, + "valid_targets_min": 751 + }, + { + "epoch": 1.1502535361622632, + "grad_norm": 0.18749183197740524, + "learning_rate": 6.84749209368331e-05, + "loss": 0.6176, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5742081999778748, + "step": 4310, + "valid_targets_mean": 17511.4, + "valid_targets_min": 409 + }, + { + "epoch": 1.1515879370162796, + "grad_norm": 0.2364048097934658, + "learning_rate": 6.830091296937509e-05, + "loss": 0.6325, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6291307806968689, + "step": 4315, + "valid_targets_mean": 15929.1, + "valid_targets_min": 556 + }, + { + "epoch": 1.1529223378702962, + "grad_norm": 0.2601345422541887, + "learning_rate": 6.812694134485686e-05, + "loss": 0.6368, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6046054363250732, + "step": 4320, + "valid_targets_mean": 16293.8, + "valid_targets_min": 387 + }, + { + "epoch": 1.1542567387243128, + "grad_norm": 0.2605636939487043, + "learning_rate": 6.795300700708466e-05, + "loss": 0.6403, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6342687606811523, + "step": 4325, + "valid_targets_mean": 16742.1, + "valid_targets_min": 776 + }, + { + "epoch": 1.1555911395783294, + "grad_norm": 0.2702252161459794, + "learning_rate": 6.777911089966245e-05, + "loss": 0.6278, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6475258469581604, + "step": 4330, + "valid_targets_mean": 15410.6, + "valid_targets_min": 59 + }, + { + "epoch": 1.156925540432346, + "grad_norm": 0.21623367735516652, + "learning_rate": 6.760525396598686e-05, + "loss": 0.6498, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6857297420501709, + "step": 4335, + "valid_targets_mean": 15698.7, + "valid_targets_min": 472 + }, + { + "epoch": 1.1582599412863623, + "grad_norm": 0.2524994678636068, + "learning_rate": 6.74314371492419e-05, + "loss": 0.6239, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.655139684677124, + "step": 4340, + "valid_targets_mean": 15753.3, + "valid_targets_min": 497 + }, + { + "epoch": 1.159594342140379, + "grad_norm": 0.35038263626958716, + "learning_rate": 6.725766139239399e-05, + "loss": 0.6372, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6007696986198425, + "step": 4345, + "valid_targets_mean": 15674.3, + "valid_targets_min": 301 + }, + { + "epoch": 1.1609287429943955, + "grad_norm": 0.27171891513965785, + "learning_rate": 6.708392763818681e-05, + "loss": 0.6347, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6097182035446167, + "step": 4350, + "valid_targets_mean": 15697.2, + "valid_targets_min": 186 + }, + { + "epoch": 1.1622631438484121, + "grad_norm": 0.3963280716536439, + "learning_rate": 6.691023682913616e-05, + "loss": 0.6488, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.665363609790802, + "step": 4355, + "valid_targets_mean": 17297.8, + "valid_targets_min": 362 + }, + { + "epoch": 1.1635975447024287, + "grad_norm": 0.3304867835821895, + "learning_rate": 6.673658990752484e-05, + "loss": 0.6301, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6157478094100952, + "step": 4360, + "valid_targets_mean": 16411.7, + "valid_targets_min": 248 + }, + { + "epoch": 1.164931945556445, + "grad_norm": 0.36259027834719193, + "learning_rate": 6.656298781539764e-05, + "loss": 0.6268, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6261616945266724, + "step": 4365, + "valid_targets_mean": 16823.3, + "valid_targets_min": 129 + }, + { + "epoch": 1.1662663464104617, + "grad_norm": 0.29117128189517166, + "learning_rate": 6.638943149455598e-05, + "loss": 0.6417, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6324571371078491, + "step": 4370, + "valid_targets_mean": 15005.9, + "valid_targets_min": 460 + }, + { + "epoch": 1.1676007472644783, + "grad_norm": 0.2521032334673322, + "learning_rate": 6.621592188655314e-05, + "loss": 0.6298, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6089852452278137, + "step": 4375, + "valid_targets_mean": 15565.0, + "valid_targets_min": 603 + }, + { + "epoch": 1.1689351481184949, + "grad_norm": 0.3063978273693239, + "learning_rate": 6.604245993268893e-05, + "loss": 0.6266, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6192407608032227, + "step": 4380, + "valid_targets_mean": 16533.9, + "valid_targets_min": 731 + }, + { + "epoch": 1.1702695489725112, + "grad_norm": 0.2919718403743578, + "learning_rate": 6.586904657400457e-05, + "loss": 0.635, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6104006171226501, + "step": 4385, + "valid_targets_mean": 15465.3, + "valid_targets_min": 331 + }, + { + "epoch": 1.1716039498265278, + "grad_norm": 0.27954703339928455, + "learning_rate": 6.569568275127769e-05, + "loss": 0.6164, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6153366565704346, + "step": 4390, + "valid_targets_mean": 16239.0, + "valid_targets_min": 875 + }, + { + "epoch": 1.1729383506805444, + "grad_norm": 0.2577231730281383, + "learning_rate": 6.552236940501725e-05, + "loss": 0.6168, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6046464443206787, + "step": 4395, + "valid_targets_mean": 14669.8, + "valid_targets_min": 452 + }, + { + "epoch": 1.174272751534561, + "grad_norm": 0.27404691900004263, + "learning_rate": 6.534910747545825e-05, + "loss": 0.6199, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6306606531143188, + "step": 4400, + "valid_targets_mean": 15363.8, + "valid_targets_min": 528 + }, + { + "epoch": 1.1756071523885776, + "grad_norm": 0.1798445084889397, + "learning_rate": 6.517589790255686e-05, + "loss": 0.6488, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6698160171508789, + "step": 4405, + "valid_targets_mean": 14588.3, + "valid_targets_min": 371 + }, + { + "epoch": 1.1769415532425942, + "grad_norm": 0.30087020212970406, + "learning_rate": 6.500274162598512e-05, + "loss": 0.6411, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6415399312973022, + "step": 4410, + "valid_targets_mean": 15331.5, + "valid_targets_min": 482 + }, + { + "epoch": 1.1782759540966106, + "grad_norm": 0.22891062443425242, + "learning_rate": 6.482963958512599e-05, + "loss": 0.6342, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6426824927330017, + "step": 4415, + "valid_targets_mean": 15908.3, + "valid_targets_min": 726 + }, + { + "epoch": 1.1796103549506272, + "grad_norm": 0.25552739097544924, + "learning_rate": 6.465659271906823e-05, + "loss": 0.6277, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6185193061828613, + "step": 4420, + "valid_targets_mean": 16322.4, + "valid_targets_min": 403 + }, + { + "epoch": 1.1809447558046438, + "grad_norm": 0.25044588493176134, + "learning_rate": 6.448360196660116e-05, + "loss": 0.6371, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6124670505523682, + "step": 4425, + "valid_targets_mean": 16749.6, + "valid_targets_min": 614 + }, + { + "epoch": 1.1822791566586603, + "grad_norm": 0.19454645206623475, + "learning_rate": 6.43106682662098e-05, + "loss": 0.629, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6282304525375366, + "step": 4430, + "valid_targets_mean": 15491.6, + "valid_targets_min": 384 + }, + { + "epoch": 1.1836135575126767, + "grad_norm": 0.2540826353003291, + "learning_rate": 6.413779255606961e-05, + "loss": 0.6173, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6295236349105835, + "step": 4435, + "valid_targets_mean": 15087.2, + "valid_targets_min": 167 + }, + { + "epoch": 1.1849479583666933, + "grad_norm": 0.3649774351284495, + "learning_rate": 6.396497577404143e-05, + "loss": 0.6455, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.64961838722229, + "step": 4440, + "valid_targets_mean": 16165.2, + "valid_targets_min": 584 + }, + { + "epoch": 1.18628235922071, + "grad_norm": 0.3090907649636376, + "learning_rate": 6.379221885766643e-05, + "loss": 0.6293, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6002676486968994, + "step": 4445, + "valid_targets_mean": 16184.6, + "valid_targets_min": 314 + }, + { + "epoch": 1.1876167600747265, + "grad_norm": 0.2670827791758813, + "learning_rate": 6.361952274416106e-05, + "loss": 0.6231, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6144086122512817, + "step": 4450, + "valid_targets_mean": 17209.1, + "valid_targets_min": 611 + }, + { + "epoch": 1.188951160928743, + "grad_norm": 0.2762036773882695, + "learning_rate": 6.344688837041177e-05, + "loss": 0.6262, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.61281418800354, + "step": 4455, + "valid_targets_mean": 18342.9, + "valid_targets_min": 328 + }, + { + "epoch": 1.1902855617827595, + "grad_norm": 0.36065831326273906, + "learning_rate": 6.32743166729702e-05, + "loss": 0.6359, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6284192204475403, + "step": 4460, + "valid_targets_mean": 16182.9, + "valid_targets_min": 297 + }, + { + "epoch": 1.191619962636776, + "grad_norm": 0.23353933817304148, + "learning_rate": 6.310180858804794e-05, + "loss": 0.6485, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6543843150138855, + "step": 4465, + "valid_targets_mean": 15583.2, + "valid_targets_min": 421 + }, + { + "epoch": 1.1929543634907926, + "grad_norm": 0.3570787968656111, + "learning_rate": 6.292936505151145e-05, + "loss": 0.6412, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6564721465110779, + "step": 4470, + "valid_targets_mean": 14519.4, + "valid_targets_min": 535 + }, + { + "epoch": 1.1942887643448092, + "grad_norm": 0.36008419141471126, + "learning_rate": 6.275698699887699e-05, + "loss": 0.6161, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6520239114761353, + "step": 4475, + "valid_targets_mean": 16250.3, + "valid_targets_min": 53 + }, + { + "epoch": 1.1956231651988256, + "grad_norm": 0.3207534581185475, + "learning_rate": 6.258467536530565e-05, + "loss": 0.6344, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6185310482978821, + "step": 4480, + "valid_targets_mean": 15550.9, + "valid_targets_min": 299 + }, + { + "epoch": 1.1969575660528422, + "grad_norm": 0.2775970978135452, + "learning_rate": 6.241243108559811e-05, + "loss": 0.6354, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6161234378814697, + "step": 4485, + "valid_targets_mean": 16199.4, + "valid_targets_min": 491 + }, + { + "epoch": 1.1982919669068588, + "grad_norm": 0.3128052037762757, + "learning_rate": 6.224025509418971e-05, + "loss": 0.6491, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6437747478485107, + "step": 4490, + "valid_targets_mean": 14918.8, + "valid_targets_min": 722 + }, + { + "epoch": 1.1996263677608754, + "grad_norm": 0.3206313524507226, + "learning_rate": 6.206814832514525e-05, + "loss": 0.6343, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6561208963394165, + "step": 4495, + "valid_targets_mean": 15631.4, + "valid_targets_min": 262 + }, + { + "epoch": 1.200960768614892, + "grad_norm": 0.29463076747279565, + "learning_rate": 6.189611171215405e-05, + "loss": 0.6299, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6470526456832886, + "step": 4500, + "valid_targets_mean": 16196.3, + "valid_targets_min": 364 + }, + { + "epoch": 1.2022951694689086, + "grad_norm": 0.21321940478714968, + "learning_rate": 6.172414618852488e-05, + "loss": 0.6394, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6385337114334106, + "step": 4505, + "valid_targets_mean": 17155.1, + "valid_targets_min": 810 + }, + { + "epoch": 1.203629570322925, + "grad_norm": 0.33018462000086, + "learning_rate": 6.155225268718069e-05, + "loss": 0.6193, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6546652913093567, + "step": 4510, + "valid_targets_mean": 15543.9, + "valid_targets_min": 444 + }, + { + "epoch": 1.2049639711769415, + "grad_norm": 0.2191433153569452, + "learning_rate": 6.138043214065385e-05, + "loss": 0.6274, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6190072298049927, + "step": 4515, + "valid_targets_mean": 16248.8, + "valid_targets_min": 522 + }, + { + "epoch": 1.2062983720309581, + "grad_norm": 0.2941732327678985, + "learning_rate": 6.120868548108093e-05, + "loss": 0.6194, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6256512403488159, + "step": 4520, + "valid_targets_mean": 15419.4, + "valid_targets_min": 439 + }, + { + "epoch": 1.2076327728849747, + "grad_norm": 0.27394641869706676, + "learning_rate": 6.103701364019754e-05, + "loss": 0.6327, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.625571608543396, + "step": 4525, + "valid_targets_mean": 16626.2, + "valid_targets_min": 643 + }, + { + "epoch": 1.208967173738991, + "grad_norm": 0.3562152679188747, + "learning_rate": 6.0865417549333536e-05, + "loss": 0.6431, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6560186147689819, + "step": 4530, + "valid_targets_mean": 15384.8, + "valid_targets_min": 538 + }, + { + "epoch": 1.2103015745930077, + "grad_norm": 0.2864401824703139, + "learning_rate": 6.0693898139407786e-05, + "loss": 0.6433, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6474707126617432, + "step": 4535, + "valid_targets_mean": 15037.6, + "valid_targets_min": 725 + }, + { + "epoch": 1.2116359754470243, + "grad_norm": 0.3635249627954564, + "learning_rate": 6.0522456340923085e-05, + "loss": 0.6261, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6389481425285339, + "step": 4540, + "valid_targets_mean": 15964.4, + "valid_targets_min": 150 + }, + { + "epoch": 1.2129703763010409, + "grad_norm": 0.25685540368852067, + "learning_rate": 6.0351093083961267e-05, + "loss": 0.6203, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6290313005447388, + "step": 4545, + "valid_targets_mean": 15779.2, + "valid_targets_min": 26 + }, + { + "epoch": 1.2143047771550575, + "grad_norm": 0.29619248753111965, + "learning_rate": 6.017980929817807e-05, + "loss": 0.6292, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6584930419921875, + "step": 4550, + "valid_targets_mean": 16471.1, + "valid_targets_min": 516 + }, + { + "epoch": 1.2156391780090738, + "grad_norm": 0.28564040063006574, + "learning_rate": 6.000860591279801e-05, + "loss": 0.6325, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6416076421737671, + "step": 4555, + "valid_targets_mean": 14785.7, + "valid_targets_min": 757 + }, + { + "epoch": 1.2169735788630904, + "grad_norm": 0.3510476897469252, + "learning_rate": 5.9837483856609527e-05, + "loss": 0.6353, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6294372081756592, + "step": 4560, + "valid_targets_mean": 16263.0, + "valid_targets_min": 549 + }, + { + "epoch": 1.218307979717107, + "grad_norm": 0.3394073281836747, + "learning_rate": 5.966644405795982e-05, + "loss": 0.631, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6662023067474365, + "step": 4565, + "valid_targets_mean": 16064.6, + "valid_targets_min": 613 + }, + { + "epoch": 1.2196423805711236, + "grad_norm": 0.30884667299242735, + "learning_rate": 5.949548744474978e-05, + "loss": 0.6214, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6019168496131897, + "step": 4570, + "valid_targets_mean": 15504.7, + "valid_targets_min": 693 + }, + { + "epoch": 1.22097678142514, + "grad_norm": 0.26457608857420895, + "learning_rate": 5.9324614944429095e-05, + "loss": 0.6387, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6279822587966919, + "step": 4575, + "valid_targets_mean": 15599.3, + "valid_targets_min": 585 + }, + { + "epoch": 1.2223111822791566, + "grad_norm": 0.2621594312135588, + "learning_rate": 5.915382748399105e-05, + "loss": 0.6431, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.625961184501648, + "step": 4580, + "valid_targets_mean": 16323.6, + "valid_targets_min": 504 + }, + { + "epoch": 1.2236455831331732, + "grad_norm": 0.28013919204235443, + "learning_rate": 5.8983125989967646e-05, + "loss": 0.6493, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6862317323684692, + "step": 4585, + "valid_targets_mean": 16439.2, + "valid_targets_min": 223 + }, + { + "epoch": 1.2249799839871898, + "grad_norm": 0.2811201149430358, + "learning_rate": 5.881251138842453e-05, + "loss": 0.6277, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5923159122467041, + "step": 4590, + "valid_targets_mean": 16460.1, + "valid_targets_min": 553 + }, + { + "epoch": 1.2263143848412064, + "grad_norm": 0.22967843281129904, + "learning_rate": 5.864198460495585e-05, + "loss": 0.6351, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6291022300720215, + "step": 4595, + "valid_targets_mean": 15312.0, + "valid_targets_min": 356 + }, + { + "epoch": 1.227648785695223, + "grad_norm": 0.23520044247290123, + "learning_rate": 5.847154656467944e-05, + "loss": 0.6319, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6028156280517578, + "step": 4600, + "valid_targets_mean": 16651.4, + "valid_targets_min": 355 + }, + { + "epoch": 1.2289831865492393, + "grad_norm": 0.26946665323032615, + "learning_rate": 5.830119819223166e-05, + "loss": 0.6267, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6300636529922485, + "step": 4605, + "valid_targets_mean": 16018.6, + "valid_targets_min": 570 + }, + { + "epoch": 1.230317587403256, + "grad_norm": 0.32477605566846685, + "learning_rate": 5.8130940411762406e-05, + "loss": 0.6249, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6440907716751099, + "step": 4610, + "valid_targets_mean": 17033.9, + "valid_targets_min": 473 + }, + { + "epoch": 1.2316519882572725, + "grad_norm": 0.23081030208781445, + "learning_rate": 5.79607741469301e-05, + "loss": 0.6445, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6172423958778381, + "step": 4615, + "valid_targets_mean": 16389.6, + "valid_targets_min": 675 + }, + { + "epoch": 1.232986389111289, + "grad_norm": 0.31649508316647457, + "learning_rate": 5.779070032089674e-05, + "loss": 0.6387, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6402013301849365, + "step": 4620, + "valid_targets_mean": 15918.7, + "valid_targets_min": 293 + }, + { + "epoch": 1.2343207899653055, + "grad_norm": 0.19452765805479708, + "learning_rate": 5.762071985632276e-05, + "loss": 0.6263, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6300052404403687, + "step": 4625, + "valid_targets_mean": 16835.9, + "valid_targets_min": 520 + }, + { + "epoch": 1.235655190819322, + "grad_norm": 0.2823409706822507, + "learning_rate": 5.745083367536217e-05, + "loss": 0.6245, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.620025634765625, + "step": 4630, + "valid_targets_mean": 15694.7, + "valid_targets_min": 427 + }, + { + "epoch": 1.2369895916733387, + "grad_norm": 0.26476187073764795, + "learning_rate": 5.7281042699657465e-05, + "loss": 0.6388, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6380904912948608, + "step": 4635, + "valid_targets_mean": 16004.7, + "valid_targets_min": 740 + }, + { + "epoch": 1.2383239925273553, + "grad_norm": 0.3134755420445105, + "learning_rate": 5.71113478503346e-05, + "loss": 0.633, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6498226523399353, + "step": 4640, + "valid_targets_mean": 16175.9, + "valid_targets_min": 27 + }, + { + "epoch": 1.2396583933813718, + "grad_norm": 0.20770097652952002, + "learning_rate": 5.694175004799814e-05, + "loss": 0.6361, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6252698302268982, + "step": 4645, + "valid_targets_mean": 16053.2, + "valid_targets_min": 558 + }, + { + "epoch": 1.2409927942353882, + "grad_norm": 0.3212021535054955, + "learning_rate": 5.6772250212726025e-05, + "loss": 0.6229, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6281235218048096, + "step": 4650, + "valid_targets_mean": 14775.4, + "valid_targets_min": 564 + }, + { + "epoch": 1.2423271950894048, + "grad_norm": 0.2152007420515824, + "learning_rate": 5.660284926406484e-05, + "loss": 0.6241, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6370538473129272, + "step": 4655, + "valid_targets_mean": 16842.9, + "valid_targets_min": 675 + }, + { + "epoch": 1.2436615959434214, + "grad_norm": 0.31336835020726617, + "learning_rate": 5.64335481210247e-05, + "loss": 0.6395, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6438559293746948, + "step": 4660, + "valid_targets_mean": 17387.4, + "valid_targets_min": 505 + }, + { + "epoch": 1.244995996797438, + "grad_norm": 0.23760951337333752, + "learning_rate": 5.626434770207414e-05, + "loss": 0.6264, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6267757415771484, + "step": 4665, + "valid_targets_mean": 16263.9, + "valid_targets_min": 318 + }, + { + "epoch": 1.2463303976514546, + "grad_norm": 0.23155203486515635, + "learning_rate": 5.60952489251354e-05, + "loss": 0.627, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6151365041732788, + "step": 4670, + "valid_targets_mean": 17165.5, + "valid_targets_min": 39 + }, + { + "epoch": 1.247664798505471, + "grad_norm": 0.22217206648146606, + "learning_rate": 5.592625270757928e-05, + "loss": 0.6383, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6513705253601074, + "step": 4675, + "valid_targets_mean": 14673.6, + "valid_targets_min": 571 + }, + { + "epoch": 1.2489991993594876, + "grad_norm": 0.22140652238088304, + "learning_rate": 5.575735996622011e-05, + "loss": 0.6178, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6008556485176086, + "step": 4680, + "valid_targets_mean": 17656.0, + "valid_targets_min": 297 + }, + { + "epoch": 1.2503336002135041, + "grad_norm": 0.19959940963850556, + "learning_rate": 5.558857161731093e-05, + "loss": 0.6328, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6737499833106995, + "step": 4685, + "valid_targets_mean": 15595.3, + "valid_targets_min": 326 + }, + { + "epoch": 1.2516680010675207, + "grad_norm": 0.2504724859467704, + "learning_rate": 5.541988857653847e-05, + "loss": 0.6305, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6380608081817627, + "step": 4690, + "valid_targets_mean": 15766.5, + "valid_targets_min": 691 + }, + { + "epoch": 1.2530024019215373, + "grad_norm": 0.2672212181599046, + "learning_rate": 5.5251311759018046e-05, + "loss": 0.6289, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6470935344696045, + "step": 4695, + "valid_targets_mean": 15265.7, + "valid_targets_min": 574 + }, + { + "epoch": 1.2543368027755537, + "grad_norm": 0.17364708553119368, + "learning_rate": 5.508284207928879e-05, + "loss": 0.6305, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6420101523399353, + "step": 4700, + "valid_targets_mean": 15472.1, + "valid_targets_min": 29 + }, + { + "epoch": 1.2556712036295703, + "grad_norm": 0.1975931861065749, + "learning_rate": 5.491448045130865e-05, + "loss": 0.6244, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6059800386428833, + "step": 4705, + "valid_targets_mean": 17265.4, + "valid_targets_min": 334 + }, + { + "epoch": 1.257005604483587, + "grad_norm": 0.19654584278709405, + "learning_rate": 5.4746227788449236e-05, + "loss": 0.6192, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5940755605697632, + "step": 4710, + "valid_targets_mean": 17243.3, + "valid_targets_min": 264 + }, + { + "epoch": 1.2583400053376035, + "grad_norm": 0.17652417356658778, + "learning_rate": 5.457808500349115e-05, + "loss": 0.633, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6395894289016724, + "step": 4715, + "valid_targets_mean": 15693.4, + "valid_targets_min": 282 + }, + { + "epoch": 1.2596744061916199, + "grad_norm": 0.21081149707273059, + "learning_rate": 5.441005300861887e-05, + "loss": 0.6271, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.645363986492157, + "step": 4720, + "valid_targets_mean": 15345.9, + "valid_targets_min": 354 + }, + { + "epoch": 1.2610088070456364, + "grad_norm": 0.21219622352906828, + "learning_rate": 5.424213271541578e-05, + "loss": 0.6518, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6449532508850098, + "step": 4725, + "valid_targets_mean": 16548.9, + "valid_targets_min": 749 + }, + { + "epoch": 1.262343207899653, + "grad_norm": 0.20776927168613465, + "learning_rate": 5.4074325034859336e-05, + "loss": 0.6266, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6154712438583374, + "step": 4730, + "valid_targets_mean": 15414.3, + "valid_targets_min": 383 + }, + { + "epoch": 1.2636776087536696, + "grad_norm": 0.14797261024718483, + "learning_rate": 5.390663087731605e-05, + "loss": 0.641, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6244392395019531, + "step": 4735, + "valid_targets_mean": 16484.8, + "valid_targets_min": 982 + }, + { + "epoch": 1.2650120096076862, + "grad_norm": 0.23990355060984186, + "learning_rate": 5.3739051152536506e-05, + "loss": 0.6199, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6142117977142334, + "step": 4740, + "valid_targets_mean": 16228.0, + "valid_targets_min": 56 + }, + { + "epoch": 1.2663464104617028, + "grad_norm": 0.22640906977866915, + "learning_rate": 5.357158676965059e-05, + "loss": 0.634, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6549844741821289, + "step": 4745, + "valid_targets_mean": 16698.5, + "valid_targets_min": 865 + }, + { + "epoch": 1.2676808113157192, + "grad_norm": 0.2735033998795201, + "learning_rate": 5.3404238637162364e-05, + "loss": 0.6364, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6428447961807251, + "step": 4750, + "valid_targets_mean": 16238.8, + "valid_targets_min": 118 + }, + { + "epoch": 1.2690152121697358, + "grad_norm": 0.2462400805867784, + "learning_rate": 5.323700766294526e-05, + "loss": 0.6269, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6167312264442444, + "step": 4755, + "valid_targets_mean": 15054.7, + "valid_targets_min": 369 + }, + { + "epoch": 1.2703496130237524, + "grad_norm": 0.18587242356920117, + "learning_rate": 5.306989475423712e-05, + "loss": 0.625, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6305737495422363, + "step": 4760, + "valid_targets_mean": 16805.6, + "valid_targets_min": 671 + }, + { + "epoch": 1.2716840138777687, + "grad_norm": 0.2021984168637943, + "learning_rate": 5.2902900817635264e-05, + "loss": 0.6395, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6341131925582886, + "step": 4765, + "valid_targets_mean": 14891.0, + "valid_targets_min": 403 + }, + { + "epoch": 1.2730184147317853, + "grad_norm": 0.1721371921090052, + "learning_rate": 5.273602675909159e-05, + "loss": 0.6528, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6565139293670654, + "step": 4770, + "valid_targets_mean": 16145.6, + "valid_targets_min": 579 + }, + { + "epoch": 1.274352815585802, + "grad_norm": 0.1607326214209887, + "learning_rate": 5.256927348390765e-05, + "loss": 0.6384, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6334860920906067, + "step": 4775, + "valid_targets_mean": 16294.3, + "valid_targets_min": 230 + }, + { + "epoch": 1.2756872164398185, + "grad_norm": 0.16235131734879868, + "learning_rate": 5.24026418967297e-05, + "loss": 0.6329, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6610786318778992, + "step": 4780, + "valid_targets_mean": 15935.6, + "valid_targets_min": 289 + }, + { + "epoch": 1.2770216172938351, + "grad_norm": 0.16419031382936092, + "learning_rate": 5.2236132901543895e-05, + "loss": 0.6168, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6397436261177063, + "step": 4785, + "valid_targets_mean": 15607.6, + "valid_targets_min": 237 + }, + { + "epoch": 1.2783560181478517, + "grad_norm": 0.1987148988456433, + "learning_rate": 5.2069747401671334e-05, + "loss": 0.6283, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6338160037994385, + "step": 4790, + "valid_targets_mean": 15817.7, + "valid_targets_min": 420 + }, + { + "epoch": 1.279690419001868, + "grad_norm": 0.17343024441593377, + "learning_rate": 5.1903486299763026e-05, + "loss": 0.6343, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.607448935508728, + "step": 4795, + "valid_targets_mean": 16366.8, + "valid_targets_min": 624 + }, + { + "epoch": 1.2810248198558847, + "grad_norm": 0.16366990841190826, + "learning_rate": 5.173735049779523e-05, + "loss": 0.6427, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.623712956905365, + "step": 4800, + "valid_targets_mean": 16776.7, + "valid_targets_min": 567 + }, + { + "epoch": 1.2823592207099013, + "grad_norm": 0.19917720907875183, + "learning_rate": 5.1571340897064454e-05, + "loss": 0.6323, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6857748627662659, + "step": 4805, + "valid_targets_mean": 14956.1, + "valid_targets_min": 433 + }, + { + "epoch": 1.2836936215639179, + "grad_norm": 0.3813637628640378, + "learning_rate": 5.140545839818242e-05, + "loss": 0.6201, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.605983316898346, + "step": 4810, + "valid_targets_mean": 16493.7, + "valid_targets_min": 573 + }, + { + "epoch": 1.2850280224179342, + "grad_norm": 0.18836472575490848, + "learning_rate": 5.1239703901071506e-05, + "loss": 0.6119, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6219553351402283, + "step": 4815, + "valid_targets_mean": 16133.3, + "valid_targets_min": 569 + }, + { + "epoch": 1.2863624232719508, + "grad_norm": 0.1893647179336856, + "learning_rate": 5.1074078304959474e-05, + "loss": 0.6274, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6246172785758972, + "step": 4820, + "valid_targets_mean": 15314.3, + "valid_targets_min": 596 + }, + { + "epoch": 1.2876968241259674, + "grad_norm": 0.1584138984615297, + "learning_rate": 5.090858250837495e-05, + "loss": 0.6358, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6141932606697083, + "step": 4825, + "valid_targets_mean": 15665.5, + "valid_targets_min": 686 + }, + { + "epoch": 1.289031224979984, + "grad_norm": 0.18886991213724974, + "learning_rate": 5.0743217409142344e-05, + "loss": 0.6267, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5984083414077759, + "step": 4830, + "valid_targets_mean": 17682.3, + "valid_targets_min": 565 + }, + { + "epoch": 1.2903656258340006, + "grad_norm": 0.1787055361455221, + "learning_rate": 5.057798390437696e-05, + "loss": 0.6363, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6204890012741089, + "step": 4835, + "valid_targets_mean": 17329.2, + "valid_targets_min": 527 + }, + { + "epoch": 1.2917000266880172, + "grad_norm": 0.2697400634607623, + "learning_rate": 5.0412882890480266e-05, + "loss": 0.6312, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6120416522026062, + "step": 4840, + "valid_targets_mean": 16662.8, + "valid_targets_min": 381 + }, + { + "epoch": 1.2930344275420336, + "grad_norm": 0.18808204647018414, + "learning_rate": 5.0247915263134984e-05, + "loss": 0.6364, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6301390528678894, + "step": 4845, + "valid_targets_mean": 16133.6, + "valid_targets_min": 535 + }, + { + "epoch": 1.2943688283960502, + "grad_norm": 0.18255274583932535, + "learning_rate": 5.0083081917300086e-05, + "loss": 0.6501, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6858794689178467, + "step": 4850, + "valid_targets_mean": 16014.1, + "valid_targets_min": 561 + }, + { + "epoch": 1.2957032292500668, + "grad_norm": 0.1655884067769675, + "learning_rate": 4.991838374720618e-05, + "loss": 0.6462, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6166006326675415, + "step": 4855, + "valid_targets_mean": 15985.5, + "valid_targets_min": 419 + }, + { + "epoch": 1.2970376301040831, + "grad_norm": 0.17322275617538, + "learning_rate": 4.975382164635051e-05, + "loss": 0.6126, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6046770215034485, + "step": 4860, + "valid_targets_mean": 15465.7, + "valid_targets_min": 465 + }, + { + "epoch": 1.2983720309580997, + "grad_norm": 0.15974272488697086, + "learning_rate": 4.9589396507492044e-05, + "loss": 0.6373, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6578046083450317, + "step": 4865, + "valid_targets_mean": 16058.8, + "valid_targets_min": 577 + }, + { + "epoch": 1.2997064318121163, + "grad_norm": 0.18475723438811187, + "learning_rate": 4.942510922264686e-05, + "loss": 0.634, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5904414057731628, + "step": 4870, + "valid_targets_mean": 16700.1, + "valid_targets_min": 724 + }, + { + "epoch": 1.301040832666133, + "grad_norm": 0.1698843941112048, + "learning_rate": 4.926096068308312e-05, + "loss": 0.6265, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6341725587844849, + "step": 4875, + "valid_targets_mean": 15507.0, + "valid_targets_min": 234 + }, + { + "epoch": 1.3023752335201495, + "grad_norm": 0.14543667801391244, + "learning_rate": 4.90969517793162e-05, + "loss": 0.6388, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6560980081558228, + "step": 4880, + "valid_targets_mean": 16731.6, + "valid_targets_min": 460 + }, + { + "epoch": 1.303709634374166, + "grad_norm": 0.14532183493811077, + "learning_rate": 4.893308340110407e-05, + "loss": 0.6356, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6323143243789673, + "step": 4885, + "valid_targets_mean": 15907.5, + "valid_targets_min": 668 + }, + { + "epoch": 1.3050440352281825, + "grad_norm": 0.2876475131773128, + "learning_rate": 4.876935643744229e-05, + "loss": 0.6411, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6975796818733215, + "step": 4890, + "valid_targets_mean": 15803.8, + "valid_targets_min": 517 + }, + { + "epoch": 1.306378436082199, + "grad_norm": 0.2102077296249055, + "learning_rate": 4.860577177655922e-05, + "loss": 0.6362, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6357290148735046, + "step": 4895, + "valid_targets_mean": 16207.7, + "valid_targets_min": 642 + }, + { + "epoch": 1.3077128369362157, + "grad_norm": 0.18759868555822456, + "learning_rate": 4.844233030591122e-05, + "loss": 0.6321, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6458548307418823, + "step": 4900, + "valid_targets_mean": 16728.7, + "valid_targets_min": 603 + }, + { + "epoch": 1.3090472377902322, + "grad_norm": 0.18943513623219738, + "learning_rate": 4.827903291217785e-05, + "loss": 0.6428, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6549099087715149, + "step": 4905, + "valid_targets_mean": 16717.1, + "valid_targets_min": 926 + }, + { + "epoch": 1.3103816386442486, + "grad_norm": 0.14584218135147162, + "learning_rate": 4.8115880481257066e-05, + "loss": 0.6271, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.604077935218811, + "step": 4910, + "valid_targets_mean": 16537.5, + "valid_targets_min": 801 + }, + { + "epoch": 1.3117160394982652, + "grad_norm": 0.15614884433868975, + "learning_rate": 4.795287389826035e-05, + "loss": 0.6139, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6058860421180725, + "step": 4915, + "valid_targets_mean": 15564.1, + "valid_targets_min": 560 + }, + { + "epoch": 1.3130504403522818, + "grad_norm": 0.19647445810549968, + "learning_rate": 4.779001404750797e-05, + "loss": 0.6234, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6127307415008545, + "step": 4920, + "valid_targets_mean": 16563.2, + "valid_targets_min": 562 + }, + { + "epoch": 1.3143848412062984, + "grad_norm": 0.15351376101927297, + "learning_rate": 4.762730181252415e-05, + "loss": 0.6248, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6400808095932007, + "step": 4925, + "valid_targets_mean": 15953.7, + "valid_targets_min": 25 + }, + { + "epoch": 1.315719242060315, + "grad_norm": 0.19129910797630822, + "learning_rate": 4.746473807603235e-05, + "loss": 0.6481, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6250849962234497, + "step": 4930, + "valid_targets_mean": 15565.2, + "valid_targets_min": 687 + }, + { + "epoch": 1.3170536429143316, + "grad_norm": 0.24069633672786006, + "learning_rate": 4.730232371995029e-05, + "loss": 0.6273, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6520248651504517, + "step": 4935, + "valid_targets_mean": 16213.8, + "valid_targets_min": 787 + }, + { + "epoch": 1.318388043768348, + "grad_norm": 0.206513608573115, + "learning_rate": 4.714005962538543e-05, + "loss": 0.6367, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.634706974029541, + "step": 4940, + "valid_targets_mean": 17679.6, + "valid_targets_min": 464 + }, + { + "epoch": 1.3197224446223645, + "grad_norm": 0.24134880808451342, + "learning_rate": 4.6977946672630004e-05, + "loss": 0.63, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.607745885848999, + "step": 4945, + "valid_targets_mean": 17591.5, + "valid_targets_min": 564 + }, + { + "epoch": 1.3210568454763811, + "grad_norm": 0.1801320898077436, + "learning_rate": 4.681598574115622e-05, + "loss": 0.6287, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6350492835044861, + "step": 4950, + "valid_targets_mean": 16330.3, + "valid_targets_min": 887 + }, + { + "epoch": 1.3223912463303977, + "grad_norm": 0.1738518510160165, + "learning_rate": 4.665417770961166e-05, + "loss": 0.6276, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6333613395690918, + "step": 4955, + "valid_targets_mean": 15356.5, + "valid_targets_min": 419 + }, + { + "epoch": 1.323725647184414, + "grad_norm": 0.15642467135401047, + "learning_rate": 4.6492523455814415e-05, + "loss": 0.6094, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5787743330001831, + "step": 4960, + "valid_targets_mean": 15801.2, + "valid_targets_min": 466 + }, + { + "epoch": 1.3250600480384307, + "grad_norm": 0.149988243905769, + "learning_rate": 4.633102385674821e-05, + "loss": 0.6304, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6080968379974365, + "step": 4965, + "valid_targets_mean": 16495.6, + "valid_targets_min": 123 + }, + { + "epoch": 1.3263944488924473, + "grad_norm": 0.1564258726734769, + "learning_rate": 4.616967978855788e-05, + "loss": 0.6144, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6178469657897949, + "step": 4970, + "valid_targets_mean": 15740.2, + "valid_targets_min": 598 + }, + { + "epoch": 1.3277288497464639, + "grad_norm": 0.15096598858177918, + "learning_rate": 4.6008492126544476e-05, + "loss": 0.6229, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6312127113342285, + "step": 4975, + "valid_targets_mean": 15290.4, + "valid_targets_min": 466 + }, + { + "epoch": 1.3290632506004805, + "grad_norm": 0.16745460403329684, + "learning_rate": 4.584746174516045e-05, + "loss": 0.6172, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5870546102523804, + "step": 4980, + "valid_targets_mean": 17124.3, + "valid_targets_min": 428 + }, + { + "epoch": 1.330397651454497, + "grad_norm": 0.1986477705300295, + "learning_rate": 4.568658951800512e-05, + "loss": 0.6276, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6241950988769531, + "step": 4985, + "valid_targets_mean": 14701.8, + "valid_targets_min": 381 + }, + { + "epoch": 1.3317320523085134, + "grad_norm": 0.2503093418138642, + "learning_rate": 4.552587631781969e-05, + "loss": 0.6104, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6214447617530823, + "step": 4990, + "valid_targets_mean": 17417.6, + "valid_targets_min": 231 + }, + { + "epoch": 1.33306645316253, + "grad_norm": 0.16628560708840986, + "learning_rate": 4.536532301648271e-05, + "loss": 0.6313, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6199056506156921, + "step": 4995, + "valid_targets_mean": 16565.2, + "valid_targets_min": 571 + }, + { + "epoch": 1.3344008540165466, + "grad_norm": 0.25358311504745584, + "learning_rate": 4.5204930485005306e-05, + "loss": 0.6297, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6275741457939148, + "step": 5000, + "valid_targets_mean": 16034.8, + "valid_targets_min": 438 + }, + { + "epoch": 1.335735254870563, + "grad_norm": 0.22096396426353762, + "learning_rate": 4.504469959352627e-05, + "loss": 0.6221, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6337085366249084, + "step": 5005, + "valid_targets_mean": 15851.9, + "valid_targets_min": 553 + }, + { + "epoch": 1.3370696557245796, + "grad_norm": 0.17905523831113826, + "learning_rate": 4.488463121130762e-05, + "loss": 0.6239, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6013862490653992, + "step": 5010, + "valid_targets_mean": 16295.4, + "valid_targets_min": 199 + }, + { + "epoch": 1.3384040565785962, + "grad_norm": 0.18892903740727368, + "learning_rate": 4.472472620672976e-05, + "loss": 0.621, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6233558654785156, + "step": 5015, + "valid_targets_mean": 14884.6, + "valid_targets_min": 656 + }, + { + "epoch": 1.3397384574326128, + "grad_norm": 0.1960202408759845, + "learning_rate": 4.4564985447286614e-05, + "loss": 0.6421, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6817205548286438, + "step": 5020, + "valid_targets_mean": 13823.1, + "valid_targets_min": 721 + }, + { + "epoch": 1.3410728582866294, + "grad_norm": 0.16756027953019842, + "learning_rate": 4.440540979958124e-05, + "loss": 0.6355, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6471720337867737, + "step": 5025, + "valid_targets_mean": 15493.6, + "valid_targets_min": 561 + }, + { + "epoch": 1.342407259140646, + "grad_norm": 0.17529206291663108, + "learning_rate": 4.4246000129320867e-05, + "loss": 0.6356, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6711809635162354, + "step": 5030, + "valid_targets_mean": 14982.9, + "valid_targets_min": 562 + }, + { + "epoch": 1.3437416599946623, + "grad_norm": 0.19955952977785812, + "learning_rate": 4.408675730131227e-05, + "loss": 0.6303, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6456050872802734, + "step": 5035, + "valid_targets_mean": 15447.3, + "valid_targets_min": 157 + }, + { + "epoch": 1.345076060848679, + "grad_norm": 0.16163297867636223, + "learning_rate": 4.3927682179457144e-05, + "loss": 0.6183, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6260631084442139, + "step": 5040, + "valid_targets_mean": 15513.2, + "valid_targets_min": 445 + }, + { + "epoch": 1.3464104617026955, + "grad_norm": 0.18520629633766658, + "learning_rate": 4.376877562674737e-05, + "loss": 0.6267, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6137248277664185, + "step": 5045, + "valid_targets_mean": 16198.9, + "valid_targets_min": 520 + }, + { + "epoch": 1.347744862556712, + "grad_norm": 0.2500265725529047, + "learning_rate": 4.3610038505260264e-05, + "loss": 0.6469, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6569816470146179, + "step": 5050, + "valid_targets_mean": 15119.1, + "valid_targets_min": 639 + }, + { + "epoch": 1.3490792634107285, + "grad_norm": 0.1694413784545287, + "learning_rate": 4.3451471676154035e-05, + "loss": 0.6172, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6165503263473511, + "step": 5055, + "valid_targets_mean": 17920.4, + "valid_targets_min": 563 + }, + { + "epoch": 1.350413664264745, + "grad_norm": 0.15935104068927747, + "learning_rate": 4.329307599966306e-05, + "loss": 0.6398, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6341271996498108, + "step": 5060, + "valid_targets_mean": 16518.5, + "valid_targets_min": 255 + }, + { + "epoch": 1.3517480651187617, + "grad_norm": 0.20247588720231224, + "learning_rate": 4.313485233509309e-05, + "loss": 0.641, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6382253170013428, + "step": 5065, + "valid_targets_mean": 14843.2, + "valid_targets_min": 147 + }, + { + "epoch": 1.3530824659727783, + "grad_norm": 0.17668341881020452, + "learning_rate": 4.297680154081686e-05, + "loss": 0.628, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6434556245803833, + "step": 5070, + "valid_targets_mean": 16067.9, + "valid_targets_min": 598 + }, + { + "epoch": 1.3544168668267949, + "grad_norm": 0.23015809453586503, + "learning_rate": 4.2818924474269126e-05, + "loss": 0.6307, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6627788543701172, + "step": 5075, + "valid_targets_mean": 15679.1, + "valid_targets_min": 478 + }, + { + "epoch": 1.3557512676808114, + "grad_norm": 0.19363015963806815, + "learning_rate": 4.266122199194226e-05, + "loss": 0.6294, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6344991326332092, + "step": 5080, + "valid_targets_mean": 15946.4, + "valid_targets_min": 384 + }, + { + "epoch": 1.3570856685348278, + "grad_norm": 0.1696018155620583, + "learning_rate": 4.250369494938146e-05, + "loss": 0.6314, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6520615816116333, + "step": 5085, + "valid_targets_mean": 14841.5, + "valid_targets_min": 787 + }, + { + "epoch": 1.3584200693888444, + "grad_norm": 0.16023070867785383, + "learning_rate": 4.234634420118021e-05, + "loss": 0.6288, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6024264097213745, + "step": 5090, + "valid_targets_mean": 16656.5, + "valid_targets_min": 142 + }, + { + "epoch": 1.359754470242861, + "grad_norm": 0.27425959242038045, + "learning_rate": 4.218917060097547e-05, + "loss": 0.6506, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6734393835067749, + "step": 5095, + "valid_targets_mean": 13772.1, + "valid_targets_min": 486 + }, + { + "epoch": 1.3610888710968774, + "grad_norm": 0.2609294240114705, + "learning_rate": 4.203217500144326e-05, + "loss": 0.6207, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6329338550567627, + "step": 5100, + "valid_targets_mean": 15875.0, + "valid_targets_min": 608 + }, + { + "epoch": 1.362423271950894, + "grad_norm": 0.21382203340370412, + "learning_rate": 4.187535825429396e-05, + "loss": 0.6311, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6623399257659912, + "step": 5105, + "valid_targets_mean": 15016.3, + "valid_targets_min": 542 + }, + { + "epoch": 1.3637576728049106, + "grad_norm": 0.186234246475179, + "learning_rate": 4.171872121026753e-05, + "loss": 0.6431, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6502887010574341, + "step": 5110, + "valid_targets_mean": 15757.6, + "valid_targets_min": 477 + }, + { + "epoch": 1.3650920736589272, + "grad_norm": 0.14765918505153394, + "learning_rate": 4.1562264719129165e-05, + "loss": 0.6172, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5981555581092834, + "step": 5115, + "valid_targets_mean": 17159.0, + "valid_targets_min": 387 + }, + { + "epoch": 1.3664264745129437, + "grad_norm": 0.17270382952270566, + "learning_rate": 4.140598962966447e-05, + "loss": 0.636, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6030063033103943, + "step": 5120, + "valid_targets_mean": 16237.5, + "valid_targets_min": 94 + }, + { + "epoch": 1.3677608753669603, + "grad_norm": 0.16978609229491592, + "learning_rate": 4.124989678967503e-05, + "loss": 0.6253, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6567881107330322, + "step": 5125, + "valid_targets_mean": 14794.4, + "valid_targets_min": 419 + }, + { + "epoch": 1.3690952762209767, + "grad_norm": 0.14802313718879107, + "learning_rate": 4.109398704597357e-05, + "loss": 0.6248, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6337324976921082, + "step": 5130, + "valid_targets_mean": 14994.8, + "valid_targets_min": 778 + }, + { + "epoch": 1.3704296770749933, + "grad_norm": 0.14832414023378732, + "learning_rate": 4.093826124437962e-05, + "loss": 0.6198, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6228146553039551, + "step": 5135, + "valid_targets_mean": 16929.2, + "valid_targets_min": 353 + }, + { + "epoch": 1.37176407792901, + "grad_norm": 0.14911468961970115, + "learning_rate": 4.078272022971481e-05, + "loss": 0.6279, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6165578961372375, + "step": 5140, + "valid_targets_mean": 15223.8, + "valid_targets_min": 502 + }, + { + "epoch": 1.3730984787830265, + "grad_norm": 0.1296469390132913, + "learning_rate": 4.06273648457982e-05, + "loss": 0.6272, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6289052367210388, + "step": 5145, + "valid_targets_mean": 16206.2, + "valid_targets_min": 373 + }, + { + "epoch": 1.3744328796370429, + "grad_norm": 0.20771349174880657, + "learning_rate": 4.0472195935441904e-05, + "loss": 0.6371, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.635810375213623, + "step": 5150, + "valid_targets_mean": 15276.2, + "valid_targets_min": 526 + }, + { + "epoch": 1.3757672804910595, + "grad_norm": 0.1426689571733511, + "learning_rate": 4.031721434044635e-05, + "loss": 0.624, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6031745076179504, + "step": 5155, + "valid_targets_mean": 16678.9, + "valid_targets_min": 890 + }, + { + "epoch": 1.377101681345076, + "grad_norm": 0.1736397062698139, + "learning_rate": 4.016242090159574e-05, + "loss": 0.6139, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6417535543441772, + "step": 5160, + "valid_targets_mean": 14546.7, + "valid_targets_min": 99 + }, + { + "epoch": 1.3784360821990926, + "grad_norm": 0.15597388264000142, + "learning_rate": 4.0007816458653566e-05, + "loss": 0.6104, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5856055617332458, + "step": 5165, + "valid_targets_mean": 15726.9, + "valid_targets_min": 85 + }, + { + "epoch": 1.3797704830531092, + "grad_norm": 0.15334672011634948, + "learning_rate": 3.9853401850358036e-05, + "loss": 0.6257, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6129058003425598, + "step": 5170, + "valid_targets_mean": 17155.0, + "valid_targets_min": 727 + }, + { + "epoch": 1.3811048839071258, + "grad_norm": 0.1631981195786689, + "learning_rate": 3.969917791441739e-05, + "loss": 0.6298, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6201703548431396, + "step": 5175, + "valid_targets_mean": 16696.0, + "valid_targets_min": 411 + }, + { + "epoch": 1.3824392847611422, + "grad_norm": 0.15249718456766068, + "learning_rate": 3.954514548750553e-05, + "loss": 0.6251, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6350277662277222, + "step": 5180, + "valid_targets_mean": 15671.8, + "valid_targets_min": 627 + }, + { + "epoch": 1.3837736856151588, + "grad_norm": 0.13970025285922955, + "learning_rate": 3.939130540525746e-05, + "loss": 0.623, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5961894989013672, + "step": 5185, + "valid_targets_mean": 16183.0, + "valid_targets_min": 614 + }, + { + "epoch": 1.3851080864691754, + "grad_norm": 0.16541443655951255, + "learning_rate": 3.923765850226456e-05, + "loss": 0.6362, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.605224609375, + "step": 5190, + "valid_targets_mean": 15942.9, + "valid_targets_min": 617 + }, + { + "epoch": 1.3864424873231918, + "grad_norm": 0.20505065015451213, + "learning_rate": 3.908420561207032e-05, + "loss": 0.6226, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6064752340316772, + "step": 5195, + "valid_targets_mean": 16724.2, + "valid_targets_min": 237 + }, + { + "epoch": 1.3877768881772083, + "grad_norm": 0.1625840801923186, + "learning_rate": 3.893094756716569e-05, + "loss": 0.6415, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6216104030609131, + "step": 5200, + "valid_targets_mean": 15669.0, + "valid_targets_min": 750 + }, + { + "epoch": 1.389111289031225, + "grad_norm": 0.15262810603720672, + "learning_rate": 3.87778851989845e-05, + "loss": 0.6279, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6247696876525879, + "step": 5205, + "valid_targets_mean": 15331.0, + "valid_targets_min": 541 + }, + { + "epoch": 1.3904456898852415, + "grad_norm": 0.17970027336562808, + "learning_rate": 3.862501933789908e-05, + "loss": 0.6235, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6287873387336731, + "step": 5210, + "valid_targets_mean": 15491.3, + "valid_targets_min": 359 + }, + { + "epoch": 1.3917800907392581, + "grad_norm": 0.17621270663724736, + "learning_rate": 3.847235081321573e-05, + "loss": 0.643, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6243505477905273, + "step": 5215, + "valid_targets_mean": 15494.3, + "valid_targets_min": 566 + }, + { + "epoch": 1.3931144915932747, + "grad_norm": 0.1434464905938825, + "learning_rate": 3.831988045317007e-05, + "loss": 0.614, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6041746139526367, + "step": 5220, + "valid_targets_mean": 17664.0, + "valid_targets_min": 301 + }, + { + "epoch": 1.394448892447291, + "grad_norm": 0.15414481962946985, + "learning_rate": 3.816760908492282e-05, + "loss": 0.6127, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6363335847854614, + "step": 5225, + "valid_targets_mean": 15424.6, + "valid_targets_min": 577 + }, + { + "epoch": 1.3957832933013077, + "grad_norm": 0.12673670646454216, + "learning_rate": 3.8015537534555e-05, + "loss": 0.6554, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6517373323440552, + "step": 5230, + "valid_targets_mean": 15626.9, + "valid_targets_min": 595 + }, + { + "epoch": 1.3971176941553243, + "grad_norm": 0.15606926008374739, + "learning_rate": 3.786366662706372e-05, + "loss": 0.635, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6305726766586304, + "step": 5235, + "valid_targets_mean": 15393.1, + "valid_targets_min": 637 + }, + { + "epoch": 1.3984520950093409, + "grad_norm": 0.17304182022885428, + "learning_rate": 3.771199718635758e-05, + "loss": 0.6295, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6062044501304626, + "step": 5240, + "valid_targets_mean": 15592.8, + "valid_targets_min": 123 + }, + { + "epoch": 1.3997864958633572, + "grad_norm": 0.14937846564123805, + "learning_rate": 3.756053003525213e-05, + "loss": 0.6258, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5961400270462036, + "step": 5245, + "valid_targets_mean": 17602.9, + "valid_targets_min": 391 + }, + { + "epoch": 1.4011208967173738, + "grad_norm": 0.14330067972015584, + "learning_rate": 3.7409265995465577e-05, + "loss": 0.6433, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.636821985244751, + "step": 5250, + "valid_targets_mean": 15189.9, + "valid_targets_min": 572 + }, + { + "epoch": 1.4024552975713904, + "grad_norm": 0.15326204532333548, + "learning_rate": 3.725820588761422e-05, + "loss": 0.6332, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6448045969009399, + "step": 5255, + "valid_targets_mean": 15761.1, + "valid_targets_min": 496 + }, + { + "epoch": 1.403789698425407, + "grad_norm": 0.1911081730773287, + "learning_rate": 3.7107350531207944e-05, + "loss": 0.6228, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6157747507095337, + "step": 5260, + "valid_targets_mean": 16320.1, + "valid_targets_min": 122 + }, + { + "epoch": 1.4051240992794236, + "grad_norm": 0.15975441609751267, + "learning_rate": 3.6956700744645934e-05, + "loss": 0.6378, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.664246141910553, + "step": 5265, + "valid_targets_mean": 15061.1, + "valid_targets_min": 344 + }, + { + "epoch": 1.4064585001334402, + "grad_norm": 0.17030194394230258, + "learning_rate": 3.6806257345212136e-05, + "loss": 0.63, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6642188429832458, + "step": 5270, + "valid_targets_mean": 15093.4, + "valid_targets_min": 434 + }, + { + "epoch": 1.4077929009874566, + "grad_norm": 0.2071399958210783, + "learning_rate": 3.665602114907075e-05, + "loss": 0.6247, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6460654735565186, + "step": 5275, + "valid_targets_mean": 15851.9, + "valid_targets_min": 153 + }, + { + "epoch": 1.4091273018414732, + "grad_norm": 0.20186223724820232, + "learning_rate": 3.650599297126198e-05, + "loss": 0.6138, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6479173898696899, + "step": 5280, + "valid_targets_mean": 15088.5, + "valid_targets_min": 853 + }, + { + "epoch": 1.4104617026954898, + "grad_norm": 0.1715220156560148, + "learning_rate": 3.63561736256975e-05, + "loss": 0.6428, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6402706503868103, + "step": 5285, + "valid_targets_mean": 16333.2, + "valid_targets_min": 329 + }, + { + "epoch": 1.4117961035495064, + "grad_norm": 0.18866956062784462, + "learning_rate": 3.6206563925156e-05, + "loss": 0.6222, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6222355365753174, + "step": 5290, + "valid_targets_mean": 15949.2, + "valid_targets_min": 395 + }, + { + "epoch": 1.4131305044035227, + "grad_norm": 0.1692810813069157, + "learning_rate": 3.605716468127889e-05, + "loss": 0.627, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6255773305892944, + "step": 5295, + "valid_targets_mean": 15020.3, + "valid_targets_min": 577 + }, + { + "epoch": 1.4144649052575393, + "grad_norm": 0.1761368719849253, + "learning_rate": 3.590797670456586e-05, + "loss": 0.6345, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6473125219345093, + "step": 5300, + "valid_targets_mean": 15610.2, + "valid_targets_min": 339 + }, + { + "epoch": 1.415799306111556, + "grad_norm": 0.15287688398886665, + "learning_rate": 3.575900080437036e-05, + "loss": 0.6368, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6090598702430725, + "step": 5305, + "valid_targets_mean": 17042.0, + "valid_targets_min": 698 + }, + { + "epoch": 1.4171337069655725, + "grad_norm": 0.20294069550913238, + "learning_rate": 3.561023778889545e-05, + "loss": 0.6175, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6067546010017395, + "step": 5310, + "valid_targets_mean": 16089.0, + "valid_targets_min": 434 + }, + { + "epoch": 1.418468107819589, + "grad_norm": 0.17411375489959932, + "learning_rate": 3.546168846518915e-05, + "loss": 0.6221, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6281801462173462, + "step": 5315, + "valid_targets_mean": 16322.3, + "valid_targets_min": 672 + }, + { + "epoch": 1.4198025086736055, + "grad_norm": 0.1992434771552196, + "learning_rate": 3.531335363914027e-05, + "loss": 0.6201, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.652416467666626, + "step": 5320, + "valid_targets_mean": 15787.6, + "valid_targets_min": 704 + }, + { + "epoch": 1.421136909527622, + "grad_norm": 0.2804856175246008, + "learning_rate": 3.516523411547397e-05, + "loss": 0.6347, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.601277232170105, + "step": 5325, + "valid_targets_mean": 15735.6, + "valid_targets_min": 448 + }, + { + "epoch": 1.4224713103816387, + "grad_norm": 0.2331782119792056, + "learning_rate": 3.5017330697747276e-05, + "loss": 0.6259, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6436649560928345, + "step": 5330, + "valid_targets_mean": 15940.2, + "valid_targets_min": 318 + }, + { + "epoch": 1.4238057112356552, + "grad_norm": 0.20092372413155127, + "learning_rate": 3.486964418834495e-05, + "loss": 0.6299, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6183117628097534, + "step": 5335, + "valid_targets_mean": 14376.1, + "valid_targets_min": 28 + }, + { + "epoch": 1.4251401120896716, + "grad_norm": 0.18482644972327308, + "learning_rate": 3.472217538847496e-05, + "loss": 0.6272, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6374001502990723, + "step": 5340, + "valid_targets_mean": 16009.2, + "valid_targets_min": 531 + }, + { + "epoch": 1.4264745129436882, + "grad_norm": 0.18657467619893198, + "learning_rate": 3.457492509816416e-05, + "loss": 0.6195, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5956864953041077, + "step": 5345, + "valid_targets_mean": 15606.7, + "valid_targets_min": 693 + }, + { + "epoch": 1.4278089137977048, + "grad_norm": 0.17376513299379437, + "learning_rate": 3.442789411625402e-05, + "loss": 0.6365, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6099961996078491, + "step": 5350, + "valid_targets_mean": 15835.6, + "valid_targets_min": 466 + }, + { + "epoch": 1.4291433146517214, + "grad_norm": 0.16282284195478497, + "learning_rate": 3.428108324039626e-05, + "loss": 0.6354, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.623703122138977, + "step": 5355, + "valid_targets_mean": 17537.7, + "valid_targets_min": 684 + }, + { + "epoch": 1.430477715505738, + "grad_norm": 0.15783998047918987, + "learning_rate": 3.413449326704843e-05, + "loss": 0.6091, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5866317749023438, + "step": 5360, + "valid_targets_mean": 16450.6, + "valid_targets_min": 485 + }, + { + "epoch": 1.4318121163597546, + "grad_norm": 0.16225480021708807, + "learning_rate": 3.3988124991469764e-05, + "loss": 0.6477, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6615272760391235, + "step": 5365, + "valid_targets_mean": 15123.1, + "valid_targets_min": 353 + }, + { + "epoch": 1.433146517213771, + "grad_norm": 0.1319022511747964, + "learning_rate": 3.384197920771676e-05, + "loss": 0.6156, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.585268497467041, + "step": 5370, + "valid_targets_mean": 18510.1, + "valid_targets_min": 500 + }, + { + "epoch": 1.4344809180677875, + "grad_norm": 0.22534083880885686, + "learning_rate": 3.36960567086388e-05, + "loss": 0.6454, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6688559651374817, + "step": 5375, + "valid_targets_mean": 15660.4, + "valid_targets_min": 522 + }, + { + "epoch": 1.4358153189218041, + "grad_norm": 0.1504794415732279, + "learning_rate": 3.355035828587403e-05, + "loss": 0.6236, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6434562802314758, + "step": 5380, + "valid_targets_mean": 15358.2, + "valid_targets_min": 403 + }, + { + "epoch": 1.4371497197758207, + "grad_norm": 0.14914466776523827, + "learning_rate": 3.340488472984493e-05, + "loss": 0.6216, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6424883604049683, + "step": 5385, + "valid_targets_mean": 15463.3, + "valid_targets_min": 167 + }, + { + "epoch": 1.438484120629837, + "grad_norm": 0.17701115124674544, + "learning_rate": 3.3259636829754086e-05, + "loss": 0.6291, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6274256706237793, + "step": 5390, + "valid_targets_mean": 15954.8, + "valid_targets_min": 490 + }, + { + "epoch": 1.4398185214838537, + "grad_norm": 0.16413150057095138, + "learning_rate": 3.3114615373579827e-05, + "loss": 0.6155, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6335543990135193, + "step": 5395, + "valid_targets_mean": 16068.7, + "valid_targets_min": 439 + }, + { + "epoch": 1.4411529223378703, + "grad_norm": 0.20083715478632508, + "learning_rate": 3.296982114807207e-05, + "loss": 0.6366, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6472524404525757, + "step": 5400, + "valid_targets_mean": 15599.1, + "valid_targets_min": 549 + }, + { + "epoch": 1.4424873231918869, + "grad_norm": 0.18175668651315993, + "learning_rate": 3.282525493874798e-05, + "loss": 0.6258, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6218005418777466, + "step": 5405, + "valid_targets_mean": 15867.5, + "valid_targets_min": 385 + }, + { + "epoch": 1.4438217240459035, + "grad_norm": 0.15353302359402962, + "learning_rate": 3.2680917529887746e-05, + "loss": 0.6339, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6132454872131348, + "step": 5410, + "valid_targets_mean": 17124.1, + "valid_targets_min": 722 + }, + { + "epoch": 1.44515612489992, + "grad_norm": 0.16417620846628184, + "learning_rate": 3.2536809704530206e-05, + "loss": 0.6117, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6290859580039978, + "step": 5415, + "valid_targets_mean": 16340.5, + "valid_targets_min": 379 + }, + { + "epoch": 1.4464905257539364, + "grad_norm": 0.17678199877547868, + "learning_rate": 3.239293224446879e-05, + "loss": 0.6285, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6204519271850586, + "step": 5420, + "valid_targets_mean": 16516.2, + "valid_targets_min": 672 + }, + { + "epoch": 1.447824926607953, + "grad_norm": 0.1742844233875428, + "learning_rate": 3.224928593024719e-05, + "loss": 0.6161, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6010374426841736, + "step": 5425, + "valid_targets_mean": 16831.8, + "valid_targets_min": 297 + }, + { + "epoch": 1.4491593274619696, + "grad_norm": 0.13521384271171266, + "learning_rate": 3.210587154115501e-05, + "loss": 0.6377, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6182513236999512, + "step": 5430, + "valid_targets_mean": 16220.3, + "valid_targets_min": 704 + }, + { + "epoch": 1.450493728315986, + "grad_norm": 0.1358185671226795, + "learning_rate": 3.196268985522376e-05, + "loss": 0.629, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6077415943145752, + "step": 5435, + "valid_targets_mean": 15695.3, + "valid_targets_min": 613 + }, + { + "epoch": 1.4518281291700026, + "grad_norm": 0.1711167885783527, + "learning_rate": 3.1819741649222485e-05, + "loss": 0.6189, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.624676525592804, + "step": 5440, + "valid_targets_mean": 15729.9, + "valid_targets_min": 295 + }, + { + "epoch": 1.4531625300240192, + "grad_norm": 0.12948194931451742, + "learning_rate": 3.167702769865354e-05, + "loss": 0.649, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6523416638374329, + "step": 5445, + "valid_targets_mean": 16590.8, + "valid_targets_min": 445 + }, + { + "epoch": 1.4544969308780358, + "grad_norm": 0.12902218339041557, + "learning_rate": 3.153454877774849e-05, + "loss": 0.6273, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6242078542709351, + "step": 5450, + "valid_targets_mean": 16365.0, + "valid_targets_min": 355 + }, + { + "epoch": 1.4558313317320524, + "grad_norm": 0.1432691221891138, + "learning_rate": 3.139230565946387e-05, + "loss": 0.6218, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6167353987693787, + "step": 5455, + "valid_targets_mean": 15632.9, + "valid_targets_min": 722 + }, + { + "epoch": 1.457165732586069, + "grad_norm": 0.1276182225412851, + "learning_rate": 3.1250299115476874e-05, + "loss": 0.6399, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6298602223396301, + "step": 5460, + "valid_targets_mean": 15770.1, + "valid_targets_min": 692 + }, + { + "epoch": 1.4585001334400853, + "grad_norm": 0.13430459310454113, + "learning_rate": 3.110852991618135e-05, + "loss": 0.6288, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6262118816375732, + "step": 5465, + "valid_targets_mean": 15365.5, + "valid_targets_min": 529 + }, + { + "epoch": 1.459834534294102, + "grad_norm": 0.1599431741046989, + "learning_rate": 3.0966998830683536e-05, + "loss": 0.626, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6742227673530579, + "step": 5470, + "valid_targets_mean": 15713.1, + "valid_targets_min": 282 + }, + { + "epoch": 1.4611689351481185, + "grad_norm": 0.15944593752909758, + "learning_rate": 3.082570662679782e-05, + "loss": 0.6222, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6399157047271729, + "step": 5475, + "valid_targets_mean": 15939.1, + "valid_targets_min": 364 + }, + { + "epoch": 1.4625033360021351, + "grad_norm": 0.15541531945278628, + "learning_rate": 3.068465407104275e-05, + "loss": 0.6261, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6311227679252625, + "step": 5480, + "valid_targets_mean": 16185.3, + "valid_targets_min": 492 + }, + { + "epoch": 1.4638377368561515, + "grad_norm": 0.14751704087209916, + "learning_rate": 3.054384192863664e-05, + "loss": 0.61, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6270675659179688, + "step": 5485, + "valid_targets_mean": 15642.4, + "valid_targets_min": 419 + }, + { + "epoch": 1.465172137710168, + "grad_norm": 0.15132906174249833, + "learning_rate": 3.0403270963493657e-05, + "loss": 0.6209, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6355879306793213, + "step": 5490, + "valid_targets_mean": 15252.9, + "valid_targets_min": 334 + }, + { + "epoch": 1.4665065385641847, + "grad_norm": 0.16247058056010277, + "learning_rate": 3.026294193821954e-05, + "loss": 0.6313, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6449081897735596, + "step": 5495, + "valid_targets_mean": 14411.7, + "valid_targets_min": 679 + }, + { + "epoch": 1.4678409394182013, + "grad_norm": 0.13192412620555163, + "learning_rate": 3.012285561410742e-05, + "loss": 0.6244, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6533715724945068, + "step": 5500, + "valid_targets_mean": 16055.3, + "valid_targets_min": 584 + }, + { + "epoch": 1.4691753402722179, + "grad_norm": 0.15751341118940315, + "learning_rate": 2.9983012751133852e-05, + "loss": 0.6246, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6110358238220215, + "step": 5505, + "valid_targets_mean": 16525.5, + "valid_targets_min": 519 + }, + { + "epoch": 1.4705097411262344, + "grad_norm": 0.1393812435209019, + "learning_rate": 2.9843414107954588e-05, + "loss": 0.6175, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.600792646408081, + "step": 5510, + "valid_targets_mean": 17548.1, + "valid_targets_min": 385 + }, + { + "epoch": 1.4718441419802508, + "grad_norm": 0.19223152973983335, + "learning_rate": 2.9704060441900402e-05, + "loss": 0.6382, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6561647653579712, + "step": 5515, + "valid_targets_mean": 15718.0, + "valid_targets_min": 624 + }, + { + "epoch": 1.4731785428342674, + "grad_norm": 0.17235258312296173, + "learning_rate": 2.956495250897311e-05, + "loss": 0.6234, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6213047504425049, + "step": 5520, + "valid_targets_mean": 15810.1, + "valid_targets_min": 570 + }, + { + "epoch": 1.474512943688284, + "grad_norm": 0.13984398266172365, + "learning_rate": 2.9426091063841444e-05, + "loss": 0.6013, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.622529149055481, + "step": 5525, + "valid_targets_mean": 16110.9, + "valid_targets_min": 645 + }, + { + "epoch": 1.4758473445423004, + "grad_norm": 0.23048960361106072, + "learning_rate": 2.9287476859836817e-05, + "loss": 0.6269, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6269211769104004, + "step": 5530, + "valid_targets_mean": 15144.9, + "valid_targets_min": 756 + }, + { + "epoch": 1.477181745396317, + "grad_norm": 0.15808842147469523, + "learning_rate": 2.9149110648949447e-05, + "loss": 0.6364, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6489793658256531, + "step": 5535, + "valid_targets_mean": 15504.8, + "valid_targets_min": 497 + }, + { + "epoch": 1.4785161462503336, + "grad_norm": 0.1773982287753316, + "learning_rate": 2.9010993181824158e-05, + "loss": 0.6278, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6429401636123657, + "step": 5540, + "valid_targets_mean": 17764.1, + "valid_targets_min": 720 + }, + { + "epoch": 1.4798505471043502, + "grad_norm": 0.15296864635389418, + "learning_rate": 2.8873125207756255e-05, + "loss": 0.6263, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6262995004653931, + "step": 5545, + "valid_targets_mean": 15969.9, + "valid_targets_min": 500 + }, + { + "epoch": 1.4811849479583667, + "grad_norm": 0.16954670356160156, + "learning_rate": 2.8735507474687603e-05, + "loss": 0.6286, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5944501161575317, + "step": 5550, + "valid_targets_mean": 16193.0, + "valid_targets_min": 155 + }, + { + "epoch": 1.4825193488123833, + "grad_norm": 0.1733352867343545, + "learning_rate": 2.859814072920249e-05, + "loss": 0.6152, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5982875823974609, + "step": 5555, + "valid_targets_mean": 16719.0, + "valid_targets_min": 549 + }, + { + "epoch": 1.4838537496663997, + "grad_norm": 0.1474432157642333, + "learning_rate": 2.846102571652352e-05, + "loss": 0.6297, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6284036636352539, + "step": 5560, + "valid_targets_mean": 15888.5, + "valid_targets_min": 549 + }, + { + "epoch": 1.4851881505204163, + "grad_norm": 0.1547180714905254, + "learning_rate": 2.8324163180507716e-05, + "loss": 0.6269, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.606930673122406, + "step": 5565, + "valid_targets_mean": 16781.9, + "valid_targets_min": 133 + }, + { + "epoch": 1.486522551374433, + "grad_norm": 0.1544643190284509, + "learning_rate": 2.8187553863642314e-05, + "loss": 0.6191, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6283329725265503, + "step": 5570, + "valid_targets_mean": 16809.4, + "valid_targets_min": 62 + }, + { + "epoch": 1.4878569522284495, + "grad_norm": 0.13276430690247742, + "learning_rate": 2.8051198507040876e-05, + "loss": 0.6375, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6261632442474365, + "step": 5575, + "valid_targets_mean": 16062.8, + "valid_targets_min": 684 + }, + { + "epoch": 1.4891913530824659, + "grad_norm": 0.1433474702905804, + "learning_rate": 2.7915097850439238e-05, + "loss": 0.6257, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.633348822593689, + "step": 5580, + "valid_targets_mean": 17175.4, + "valid_targets_min": 497 + }, + { + "epoch": 1.4905257539364825, + "grad_norm": 0.16163825754953928, + "learning_rate": 2.7779252632191394e-05, + "loss": 0.622, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6284037828445435, + "step": 5585, + "valid_targets_mean": 16106.5, + "valid_targets_min": 128 + }, + { + "epoch": 1.491860154790499, + "grad_norm": 0.1398100737015759, + "learning_rate": 2.7643663589265642e-05, + "loss": 0.6309, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6473536491394043, + "step": 5590, + "valid_targets_mean": 15708.0, + "valid_targets_min": 331 + }, + { + "epoch": 1.4931945556445156, + "grad_norm": 0.14418286876980943, + "learning_rate": 2.750833145724049e-05, + "loss": 0.6368, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6269103288650513, + "step": 5595, + "valid_targets_mean": 16005.2, + "valid_targets_min": 595 + }, + { + "epoch": 1.4945289564985322, + "grad_norm": 0.13891282326030407, + "learning_rate": 2.7373256970300663e-05, + "loss": 0.6319, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6326860785484314, + "step": 5600, + "valid_targets_mean": 15055.2, + "valid_targets_min": 139 + }, + { + "epoch": 1.4958633573525488, + "grad_norm": 0.1493646883274745, + "learning_rate": 2.7238440861233176e-05, + "loss": 0.6427, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6493257284164429, + "step": 5605, + "valid_targets_mean": 15705.0, + "valid_targets_min": 642 + }, + { + "epoch": 1.4971977582065652, + "grad_norm": 0.1431354744300022, + "learning_rate": 2.710388386142335e-05, + "loss": 0.6366, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6588246822357178, + "step": 5610, + "valid_targets_mean": 16106.0, + "valid_targets_min": 739 + }, + { + "epoch": 1.4985321590605818, + "grad_norm": 0.15838659749919395, + "learning_rate": 2.6969586700850753e-05, + "loss": 0.6328, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6347640752792358, + "step": 5615, + "valid_targets_mean": 16459.5, + "valid_targets_min": 944 + }, + { + "epoch": 1.4998665599145984, + "grad_norm": 0.14202052693469316, + "learning_rate": 2.6835550108085373e-05, + "loss": 0.6234, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6258725523948669, + "step": 5620, + "valid_targets_mean": 15989.1, + "valid_targets_min": 614 + }, + { + "epoch": 1.5012009607686148, + "grad_norm": 0.1439483870521881, + "learning_rate": 2.67017748102836e-05, + "loss": 0.6214, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6074327230453491, + "step": 5625, + "valid_targets_mean": 16374.8, + "valid_targets_min": 116 + }, + { + "epoch": 1.5025353616226313, + "grad_norm": 0.15289582914743377, + "learning_rate": 2.6568261533184233e-05, + "loss": 0.634, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6085629463195801, + "step": 5630, + "valid_targets_mean": 16198.2, + "valid_targets_min": 674 + }, + { + "epoch": 1.503869762476648, + "grad_norm": 0.14157557834741372, + "learning_rate": 2.643501100110463e-05, + "loss": 0.6228, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.602777361869812, + "step": 5635, + "valid_targets_mean": 15891.9, + "valid_targets_min": 449 + }, + { + "epoch": 1.5052041633306645, + "grad_norm": 0.14813942268202115, + "learning_rate": 2.6302023936936776e-05, + "loss": 0.6309, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6272621154785156, + "step": 5640, + "valid_targets_mean": 15252.1, + "valid_targets_min": 275 + }, + { + "epoch": 1.5065385641846811, + "grad_norm": 0.12366778416433712, + "learning_rate": 2.616930106214323e-05, + "loss": 0.6271, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6292228698730469, + "step": 5645, + "valid_targets_mean": 14449.2, + "valid_targets_min": 634 + }, + { + "epoch": 1.5078729650386977, + "grad_norm": 0.13723249797592718, + "learning_rate": 2.6036843096753394e-05, + "loss": 0.6201, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6192312836647034, + "step": 5650, + "valid_targets_mean": 16084.3, + "valid_targets_min": 295 + }, + { + "epoch": 1.5092073658927143, + "grad_norm": 0.14013442644306484, + "learning_rate": 2.5904650759359528e-05, + "loss": 0.6359, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6109635233879089, + "step": 5655, + "valid_targets_mean": 15055.7, + "valid_targets_min": 434 + }, + { + "epoch": 1.5105417667467307, + "grad_norm": 0.16452772456933798, + "learning_rate": 2.5772724767112753e-05, + "loss": 0.6231, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6206374764442444, + "step": 5660, + "valid_targets_mean": 14545.7, + "valid_targets_min": 308 + }, + { + "epoch": 1.5118761676007473, + "grad_norm": 0.12885976269120666, + "learning_rate": 2.564106583571933e-05, + "loss": 0.6435, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6476463079452515, + "step": 5665, + "valid_targets_mean": 14707.1, + "valid_targets_min": 564 + }, + { + "epoch": 1.5132105684547636, + "grad_norm": 0.14333944608867255, + "learning_rate": 2.550967467943668e-05, + "loss": 0.6233, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5939033627510071, + "step": 5670, + "valid_targets_mean": 16372.6, + "valid_targets_min": 297 + }, + { + "epoch": 1.5145449693087802, + "grad_norm": 0.14271168882303076, + "learning_rate": 2.537855201106955e-05, + "loss": 0.6281, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6289101839065552, + "step": 5675, + "valid_targets_mean": 17221.4, + "valid_targets_min": 478 + }, + { + "epoch": 1.5158793701627968, + "grad_norm": 0.12587353338371615, + "learning_rate": 2.5247698541966066e-05, + "loss": 0.6366, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6356736421585083, + "step": 5680, + "valid_targets_mean": 15807.4, + "valid_targets_min": 568 + }, + { + "epoch": 1.5172137710168134, + "grad_norm": 0.135942169633523, + "learning_rate": 2.511711498201397e-05, + "loss": 0.6266, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6369425058364868, + "step": 5685, + "valid_targets_mean": 16512.2, + "valid_targets_min": 764 + }, + { + "epoch": 1.51854817187083, + "grad_norm": 0.1300809788916359, + "learning_rate": 2.4986802039636773e-05, + "loss": 0.6259, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5703003406524658, + "step": 5690, + "valid_targets_mean": 16038.2, + "valid_targets_min": 100 + }, + { + "epoch": 1.5198825727248466, + "grad_norm": 0.13972459116404298, + "learning_rate": 2.485676042178976e-05, + "loss": 0.6279, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6317213773727417, + "step": 5695, + "valid_targets_mean": 15872.5, + "valid_targets_min": 742 + }, + { + "epoch": 1.5212169735788632, + "grad_norm": 0.13552004006518586, + "learning_rate": 2.4726990833956363e-05, + "loss": 0.6313, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6211484670639038, + "step": 5700, + "valid_targets_mean": 14656.1, + "valid_targets_min": 465 + }, + { + "epoch": 1.5225513744328798, + "grad_norm": 0.14386227146441763, + "learning_rate": 2.45974939801442e-05, + "loss": 0.6199, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5977884531021118, + "step": 5705, + "valid_targets_mean": 16085.2, + "valid_targets_min": 615 + }, + { + "epoch": 1.5238857752868962, + "grad_norm": 0.14276055446610306, + "learning_rate": 2.446827056288131e-05, + "loss": 0.6134, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6355063915252686, + "step": 5710, + "valid_targets_mean": 16763.1, + "valid_targets_min": 570 + }, + { + "epoch": 1.5252201761409128, + "grad_norm": 0.1579645574450176, + "learning_rate": 2.4339321283212276e-05, + "loss": 0.628, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.639201283454895, + "step": 5715, + "valid_targets_mean": 15428.9, + "valid_targets_min": 767 + }, + { + "epoch": 1.5265545769949291, + "grad_norm": 0.143331740428986, + "learning_rate": 2.421064684069453e-05, + "loss": 0.6343, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6173781752586365, + "step": 5720, + "valid_targets_mean": 16842.1, + "valid_targets_min": 721 + }, + { + "epoch": 1.5278889778489457, + "grad_norm": 0.1473926456593145, + "learning_rate": 2.4082247933394414e-05, + "loss": 0.6317, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6531630754470825, + "step": 5725, + "valid_targets_mean": 15427.3, + "valid_targets_min": 380 + }, + { + "epoch": 1.5292233787029623, + "grad_norm": 0.12416220263906289, + "learning_rate": 2.3954125257883558e-05, + "loss": 0.6258, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5931440591812134, + "step": 5730, + "valid_targets_mean": 16346.6, + "valid_targets_min": 779 + }, + { + "epoch": 1.530557779556979, + "grad_norm": 0.14830788556227337, + "learning_rate": 2.382627950923501e-05, + "loss": 0.6268, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6504865884780884, + "step": 5735, + "valid_targets_mean": 15952.8, + "valid_targets_min": 401 + }, + { + "epoch": 1.5318921804109955, + "grad_norm": 0.12532641548964424, + "learning_rate": 2.3698711381019398e-05, + "loss": 0.627, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6455780863761902, + "step": 5740, + "valid_targets_mean": 15303.9, + "valid_targets_min": 348 + }, + { + "epoch": 1.533226581265012, + "grad_norm": 0.13403566036637113, + "learning_rate": 2.3571421565301315e-05, + "loss": 0.6159, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6332656145095825, + "step": 5745, + "valid_targets_mean": 16482.3, + "valid_targets_min": 137 + }, + { + "epoch": 1.5345609821190287, + "grad_norm": 0.12054379160148655, + "learning_rate": 2.3444410752635512e-05, + "loss": 0.6324, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6107887029647827, + "step": 5750, + "valid_targets_mean": 15134.1, + "valid_targets_min": 633 + }, + { + "epoch": 1.535895382973045, + "grad_norm": 0.1230026498193065, + "learning_rate": 2.331767963206302e-05, + "loss": 0.6174, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6055983304977417, + "step": 5755, + "valid_targets_mean": 15497.7, + "valid_targets_min": 31 + }, + { + "epoch": 1.5372297838270617, + "grad_norm": 0.11103447026365328, + "learning_rate": 2.319122889110763e-05, + "loss": 0.6219, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.597805917263031, + "step": 5760, + "valid_targets_mean": 16754.6, + "valid_targets_min": 384 + }, + { + "epoch": 1.5385641846810783, + "grad_norm": 0.12465669790762561, + "learning_rate": 2.3065059215772057e-05, + "loss": 0.6176, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6329092383384705, + "step": 5765, + "valid_targets_mean": 16111.2, + "valid_targets_min": 561 + }, + { + "epoch": 1.5398985855350946, + "grad_norm": 0.12713411167158647, + "learning_rate": 2.2939171290534127e-05, + "loss": 0.6152, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6023916006088257, + "step": 5770, + "valid_targets_mean": 15803.7, + "valid_targets_min": 506 + }, + { + "epoch": 1.5412329863891112, + "grad_norm": 0.15179356801369148, + "learning_rate": 2.281356579834324e-05, + "loss": 0.6249, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6431618332862854, + "step": 5775, + "valid_targets_mean": 16487.9, + "valid_targets_min": 307 + }, + { + "epoch": 1.5425673872431278, + "grad_norm": 0.1691329261460599, + "learning_rate": 2.2688243420616573e-05, + "loss": 0.6162, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6375676393508911, + "step": 5780, + "valid_targets_mean": 14028.1, + "valid_targets_min": 623 + }, + { + "epoch": 1.5439017880971444, + "grad_norm": 0.12370458237505477, + "learning_rate": 2.2563204837235323e-05, + "loss": 0.637, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.660173237323761, + "step": 5785, + "valid_targets_mean": 16358.3, + "valid_targets_min": 723 + }, + { + "epoch": 1.545236188951161, + "grad_norm": 0.13657774631918929, + "learning_rate": 2.243845072654115e-05, + "loss": 0.6082, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6270567178726196, + "step": 5790, + "valid_targets_mean": 15915.3, + "valid_targets_min": 320 + }, + { + "epoch": 1.5465705898051776, + "grad_norm": 0.12029933244132973, + "learning_rate": 2.2313981765332464e-05, + "loss": 0.6252, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6249598264694214, + "step": 5795, + "valid_targets_mean": 15742.1, + "valid_targets_min": 478 + }, + { + "epoch": 1.5479049906591942, + "grad_norm": 0.14750127845581507, + "learning_rate": 2.2189798628860604e-05, + "loss": 0.6246, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6229920387268066, + "step": 5800, + "valid_targets_mean": 15027.0, + "valid_targets_min": 863 + }, + { + "epoch": 1.5492393915132106, + "grad_norm": 0.13344401129734557, + "learning_rate": 2.206590199082642e-05, + "loss": 0.6215, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5828033089637756, + "step": 5805, + "valid_targets_mean": 16073.2, + "valid_targets_min": 299 + }, + { + "epoch": 1.5505737923672271, + "grad_norm": 0.13797418177317824, + "learning_rate": 2.194229252337639e-05, + "loss": 0.6246, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.627313494682312, + "step": 5810, + "valid_targets_mean": 15657.3, + "valid_targets_min": 134 + }, + { + "epoch": 1.5519081932212435, + "grad_norm": 0.1307355779013856, + "learning_rate": 2.181897089709913e-05, + "loss": 0.6169, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6516543626785278, + "step": 5815, + "valid_targets_mean": 16195.4, + "valid_targets_min": 213 + }, + { + "epoch": 1.55324259407526, + "grad_norm": 4.503023293741496, + "learning_rate": 2.1695937781021736e-05, + "loss": 0.6162, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6091921925544739, + "step": 5820, + "valid_targets_mean": 17610.6, + "valid_targets_min": 357 + }, + { + "epoch": 1.5545769949292767, + "grad_norm": 0.11458451257446015, + "learning_rate": 2.1573193842606007e-05, + "loss": 0.6212, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6066598296165466, + "step": 5825, + "valid_targets_mean": 15284.7, + "valid_targets_min": 431 + }, + { + "epoch": 1.5559113957832933, + "grad_norm": 0.1322682207343315, + "learning_rate": 2.1450739747745034e-05, + "loss": 0.6232, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.631981611251831, + "step": 5830, + "valid_targets_mean": 15703.0, + "valid_targets_min": 452 + }, + { + "epoch": 1.5572457966373099, + "grad_norm": 0.13382475468535615, + "learning_rate": 2.1328576160759486e-05, + "loss": 0.6184, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.608359694480896, + "step": 5835, + "valid_targets_mean": 15746.4, + "valid_targets_min": 440 + }, + { + "epoch": 1.5585801974913265, + "grad_norm": 0.13395960709287713, + "learning_rate": 2.1206703744393936e-05, + "loss": 0.6477, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6912551522254944, + "step": 5840, + "valid_targets_mean": 15902.0, + "valid_targets_min": 332 + }, + { + "epoch": 1.559914598345343, + "grad_norm": 0.14083845588341448, + "learning_rate": 2.1085123159813398e-05, + "loss": 0.6249, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6276473999023438, + "step": 5845, + "valid_targets_mean": 15508.2, + "valid_targets_min": 632 + }, + { + "epoch": 1.5612489991993594, + "grad_norm": 0.12300532252725843, + "learning_rate": 2.0963835066599703e-05, + "loss": 0.6153, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6046478748321533, + "step": 5850, + "valid_targets_mean": 16468.6, + "valid_targets_min": 481 + }, + { + "epoch": 1.562583400053376, + "grad_norm": 0.16509827475279112, + "learning_rate": 2.084284012274781e-05, + "loss": 0.6387, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6476929783821106, + "step": 5855, + "valid_targets_mean": 15581.5, + "valid_targets_min": 649 + }, + { + "epoch": 1.5639178009073926, + "grad_norm": 0.11987186265018815, + "learning_rate": 2.0722138984662415e-05, + "loss": 0.6134, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5942327380180359, + "step": 5860, + "valid_targets_mean": 15606.3, + "valid_targets_min": 720 + }, + { + "epoch": 1.565252201761409, + "grad_norm": 0.11365970803386147, + "learning_rate": 2.0601732307154283e-05, + "loss": 0.6241, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6330580711364746, + "step": 5865, + "valid_targets_mean": 16879.3, + "valid_targets_min": 767 + }, + { + "epoch": 1.5665866026154256, + "grad_norm": 0.11422402035884933, + "learning_rate": 2.048162074343665e-05, + "loss": 0.6079, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6077611446380615, + "step": 5870, + "valid_targets_mean": 15804.7, + "valid_targets_min": 529 + }, + { + "epoch": 1.5679210034694422, + "grad_norm": 0.13577381742940237, + "learning_rate": 2.036180494512181e-05, + "loss": 0.6194, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.605219304561615, + "step": 5875, + "valid_targets_mean": 15895.9, + "valid_targets_min": 668 + }, + { + "epoch": 1.5692554043234588, + "grad_norm": 0.12183516763109287, + "learning_rate": 2.024228556221752e-05, + "loss": 0.6357, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6044329404830933, + "step": 5880, + "valid_targets_mean": 16786.0, + "valid_targets_min": 657 + }, + { + "epoch": 1.5705898051774754, + "grad_norm": 0.11449228550751389, + "learning_rate": 2.0123063243123395e-05, + "loss": 0.6309, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6163490414619446, + "step": 5885, + "valid_targets_mean": 16912.6, + "valid_targets_min": 419 + }, + { + "epoch": 1.571924206031492, + "grad_norm": 0.12515999124031796, + "learning_rate": 2.000413863462754e-05, + "loss": 0.6178, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6148951053619385, + "step": 5890, + "valid_targets_mean": 17588.8, + "valid_targets_min": 360 + }, + { + "epoch": 1.5732586068855086, + "grad_norm": 0.142567993474962, + "learning_rate": 1.988551238190288e-05, + "loss": 0.6099, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5837486982345581, + "step": 5895, + "valid_targets_mean": 15626.2, + "valid_targets_min": 160 + }, + { + "epoch": 1.574593007739525, + "grad_norm": 0.13447486127424788, + "learning_rate": 1.9767185128503817e-05, + "loss": 0.6257, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6562528610229492, + "step": 5900, + "valid_targets_mean": 16196.6, + "valid_targets_min": 685 + }, + { + "epoch": 1.5759274085935415, + "grad_norm": 0.14137687867755716, + "learning_rate": 1.9649157516362663e-05, + "loss": 0.6298, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5984712839126587, + "step": 5905, + "valid_targets_mean": 17495.9, + "valid_targets_min": 290 + }, + { + "epoch": 1.577261809447558, + "grad_norm": 0.1667576470540979, + "learning_rate": 1.953143018578607e-05, + "loss": 0.6245, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6378732919692993, + "step": 5910, + "valid_targets_mean": 15191.1, + "valid_targets_min": 425 + }, + { + "epoch": 1.5785962103015745, + "grad_norm": 0.12107450822688537, + "learning_rate": 1.9414003775451754e-05, + "loss": 0.6281, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6455228328704834, + "step": 5915, + "valid_targets_mean": 15451.3, + "valid_targets_min": 586 + }, + { + "epoch": 1.579930611155591, + "grad_norm": 0.110173869196171, + "learning_rate": 1.9296878922404868e-05, + "loss": 0.6295, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6453032493591309, + "step": 5920, + "valid_targets_mean": 15667.5, + "valid_targets_min": 620 + }, + { + "epoch": 1.5812650120096077, + "grad_norm": 0.1599541540200817, + "learning_rate": 1.9180056262054575e-05, + "loss": 0.6268, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6145048141479492, + "step": 5925, + "valid_targets_mean": 16622.8, + "valid_targets_min": 649 + }, + { + "epoch": 1.5825994128636243, + "grad_norm": 0.13096133851618708, + "learning_rate": 1.9063536428170682e-05, + "loss": 0.6261, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6367355585098267, + "step": 5930, + "valid_targets_mean": 15805.8, + "valid_targets_min": 303 + }, + { + "epoch": 1.5839338137176409, + "grad_norm": 0.13026012485411959, + "learning_rate": 1.8947320052880106e-05, + "loss": 0.6265, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6729874610900879, + "step": 5935, + "valid_targets_mean": 14871.8, + "valid_targets_min": 623 + }, + { + "epoch": 1.5852682145716575, + "grad_norm": 0.14375365982896932, + "learning_rate": 1.8831407766663513e-05, + "loss": 0.633, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6526641249656677, + "step": 5940, + "valid_targets_mean": 16618.8, + "valid_targets_min": 205 + }, + { + "epoch": 1.5866026154256738, + "grad_norm": 0.13475996262830925, + "learning_rate": 1.8715800198351824e-05, + "loss": 0.6283, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6065152287483215, + "step": 5945, + "valid_targets_mean": 15873.9, + "valid_targets_min": 308 + }, + { + "epoch": 1.5879370162796904, + "grad_norm": 0.11567212712524262, + "learning_rate": 1.8600497975122877e-05, + "loss": 0.609, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6047914028167725, + "step": 5950, + "valid_targets_mean": 15512.6, + "valid_targets_min": 593 + }, + { + "epoch": 1.589271417133707, + "grad_norm": 0.11457752537575618, + "learning_rate": 1.8485501722498024e-05, + "loss": 0.6252, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6193585395812988, + "step": 5955, + "valid_targets_mean": 15587.5, + "valid_targets_min": 615 + }, + { + "epoch": 1.5906058179877234, + "grad_norm": 0.11153565821354677, + "learning_rate": 1.8370812064338624e-05, + "loss": 0.6192, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6255379915237427, + "step": 5960, + "valid_targets_mean": 17222.9, + "valid_targets_min": 537 + }, + { + "epoch": 1.59194021884174, + "grad_norm": 0.13306138930387013, + "learning_rate": 1.8256429622842818e-05, + "loss": 0.6184, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6517558693885803, + "step": 5965, + "valid_targets_mean": 16220.2, + "valid_targets_min": 464 + }, + { + "epoch": 1.5932746196957566, + "grad_norm": 0.1232840132144764, + "learning_rate": 1.814235501854206e-05, + "loss": 0.6188, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6157183647155762, + "step": 5970, + "valid_targets_mean": 16222.9, + "valid_targets_min": 430 + }, + { + "epoch": 1.5946090205497732, + "grad_norm": 0.1297889203000817, + "learning_rate": 1.8028588870297774e-05, + "loss": 0.6289, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6302587985992432, + "step": 5975, + "valid_targets_mean": 14871.2, + "valid_targets_min": 530 + }, + { + "epoch": 1.5959434214037898, + "grad_norm": 0.12199596817565361, + "learning_rate": 1.7915131795297956e-05, + "loss": 0.6275, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6188775897026062, + "step": 5980, + "valid_targets_mean": 17172.1, + "valid_targets_min": 576 + }, + { + "epoch": 1.5972778222578063, + "grad_norm": 0.10827901865386277, + "learning_rate": 1.7801984409053897e-05, + "loss": 0.6195, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6051005125045776, + "step": 5985, + "valid_targets_mean": 16912.6, + "valid_targets_min": 593 + }, + { + "epoch": 1.598612223111823, + "grad_norm": 0.1317375536272242, + "learning_rate": 1.7689147325396822e-05, + "loss": 0.6195, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6553663015365601, + "step": 5990, + "valid_targets_mean": 15914.1, + "valid_targets_min": 388 + }, + { + "epoch": 1.5999466239658393, + "grad_norm": 0.1552078070629989, + "learning_rate": 1.757662115647448e-05, + "loss": 0.6315, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6441587209701538, + "step": 5995, + "valid_targets_mean": 15740.9, + "valid_targets_min": 490 + }, + { + "epoch": 1.601281024819856, + "grad_norm": 0.11280524840766815, + "learning_rate": 1.7464406512747964e-05, + "loss": 0.6244, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6006412506103516, + "step": 6000, + "valid_targets_mean": 15848.0, + "valid_targets_min": 441 + }, + { + "epoch": 1.6026154256738723, + "grad_norm": 0.12471678249023585, + "learning_rate": 1.7352504002988303e-05, + "loss": 0.6293, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6565764546394348, + "step": 6005, + "valid_targets_mean": 14849.7, + "valid_targets_min": 320 + }, + { + "epoch": 1.6039498265278889, + "grad_norm": 0.1302767791335395, + "learning_rate": 1.7240914234273126e-05, + "loss": 0.64, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6389578580856323, + "step": 6010, + "valid_targets_mean": 16321.4, + "valid_targets_min": 460 + }, + { + "epoch": 1.6052842273819055, + "grad_norm": 0.1418301646406482, + "learning_rate": 1.7129637811983507e-05, + "loss": 0.6195, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6155678033828735, + "step": 6015, + "valid_targets_mean": 15113.6, + "valid_targets_min": 233 + }, + { + "epoch": 1.606618628235922, + "grad_norm": 0.12063202066398034, + "learning_rate": 1.7018675339800557e-05, + "loss": 0.6288, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6044756174087524, + "step": 6020, + "valid_targets_mean": 16629.7, + "valid_targets_min": 533 + }, + { + "epoch": 1.6079530290899386, + "grad_norm": 0.11807271642364235, + "learning_rate": 1.690802741970217e-05, + "loss": 0.6217, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5868763327598572, + "step": 6025, + "valid_targets_mean": 16365.8, + "valid_targets_min": 529 + }, + { + "epoch": 1.6092874299439552, + "grad_norm": 0.12548250813804548, + "learning_rate": 1.6797694651959806e-05, + "loss": 0.6146, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6389151811599731, + "step": 6030, + "valid_targets_mean": 16226.5, + "valid_targets_min": 410 + }, + { + "epoch": 1.6106218307979718, + "grad_norm": 0.1155585728721283, + "learning_rate": 1.6687677635135218e-05, + "loss": 0.6304, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6380968689918518, + "step": 6035, + "valid_targets_mean": 14740.4, + "valid_targets_min": 394 + }, + { + "epoch": 1.6119562316519882, + "grad_norm": 0.10679030044235797, + "learning_rate": 1.657797696607714e-05, + "loss": 0.631, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6434690356254578, + "step": 6040, + "valid_targets_mean": 15633.7, + "valid_targets_min": 551 + }, + { + "epoch": 1.6132906325060048, + "grad_norm": 0.1318356171263497, + "learning_rate": 1.6468593239918136e-05, + "loss": 0.6325, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6549495458602905, + "step": 6045, + "valid_targets_mean": 15992.0, + "valid_targets_min": 189 + }, + { + "epoch": 1.6146250333600214, + "grad_norm": 0.12706740457026952, + "learning_rate": 1.635952705007136e-05, + "loss": 0.6177, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6158535480499268, + "step": 6050, + "valid_targets_mean": 17493.1, + "valid_targets_min": 415 + }, + { + "epoch": 1.6159594342140378, + "grad_norm": 0.11346395785230665, + "learning_rate": 1.6250778988227248e-05, + "loss": 0.6375, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6460615396499634, + "step": 6055, + "valid_targets_mean": 16660.3, + "valid_targets_min": 616 + }, + { + "epoch": 1.6172938350680544, + "grad_norm": 0.10806654813730997, + "learning_rate": 1.614234964435044e-05, + "loss": 0.6128, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.620269238948822, + "step": 6060, + "valid_targets_mean": 17277.5, + "valid_targets_min": 605 + }, + { + "epoch": 1.618628235922071, + "grad_norm": 0.11771772078819821, + "learning_rate": 1.603423960667645e-05, + "loss": 0.6282, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6567904949188232, + "step": 6065, + "valid_targets_mean": 16147.1, + "valid_targets_min": 682 + }, + { + "epoch": 1.6199626367760875, + "grad_norm": 0.11055707030855468, + "learning_rate": 1.5926449461708577e-05, + "loss": 0.6325, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6463902592658997, + "step": 6070, + "valid_targets_mean": 16450.0, + "valid_targets_min": 653 + }, + { + "epoch": 1.6212970376301041, + "grad_norm": 0.12058597331639832, + "learning_rate": 1.581897979421471e-05, + "loss": 0.6296, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6483221650123596, + "step": 6075, + "valid_targets_mean": 15915.4, + "valid_targets_min": 859 + }, + { + "epoch": 1.6226314384841207, + "grad_norm": 0.11426474258314467, + "learning_rate": 1.571183118722405e-05, + "loss": 0.6261, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.623265266418457, + "step": 6080, + "valid_targets_mean": 15442.9, + "valid_targets_min": 365 + }, + { + "epoch": 1.6239658393381373, + "grad_norm": 0.1167146873257186, + "learning_rate": 1.5605004222024074e-05, + "loss": 0.6316, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6657377481460571, + "step": 6085, + "valid_targets_mean": 15991.5, + "valid_targets_min": 110 + }, + { + "epoch": 1.6253002401921537, + "grad_norm": 0.13662401295294158, + "learning_rate": 1.549849947815737e-05, + "loss": 0.6307, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6083266735076904, + "step": 6090, + "valid_targets_mean": 15308.7, + "valid_targets_min": 698 + }, + { + "epoch": 1.6266346410461703, + "grad_norm": 0.12981339267319347, + "learning_rate": 1.5392317533418366e-05, + "loss": 0.6336, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6244166493415833, + "step": 6095, + "valid_targets_mean": 16245.6, + "valid_targets_min": 522 + }, + { + "epoch": 1.6279690419001867, + "grad_norm": 0.11868066092095313, + "learning_rate": 1.5286458963850363e-05, + "loss": 0.6164, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6081252098083496, + "step": 6100, + "valid_targets_mean": 15854.4, + "valid_targets_min": 666 + }, + { + "epoch": 1.6293034427542032, + "grad_norm": 0.09876253127857607, + "learning_rate": 1.5180924343742316e-05, + "loss": 0.6209, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6011303067207336, + "step": 6105, + "valid_targets_mean": 16851.0, + "valid_targets_min": 548 + }, + { + "epoch": 1.6306378436082198, + "grad_norm": 0.1075861225035157, + "learning_rate": 1.5075714245625689e-05, + "loss": 0.6094, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6410889029502869, + "step": 6110, + "valid_targets_mean": 15197.6, + "valid_targets_min": 427 + }, + { + "epoch": 1.6319722444622364, + "grad_norm": 0.10809641783904705, + "learning_rate": 1.4970829240271448e-05, + "loss": 0.6174, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6171035766601562, + "step": 6115, + "valid_targets_mean": 16254.8, + "valid_targets_min": 600 + }, + { + "epoch": 1.633306645316253, + "grad_norm": 0.11734497353593293, + "learning_rate": 1.4866269896686917e-05, + "loss": 0.6557, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6341985464096069, + "step": 6120, + "valid_targets_mean": 16048.5, + "valid_targets_min": 375 + }, + { + "epoch": 1.6346410461702696, + "grad_norm": 0.11884394081671218, + "learning_rate": 1.4762036782112624e-05, + "loss": 0.6305, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.629259467124939, + "step": 6125, + "valid_targets_mean": 16594.1, + "valid_targets_min": 732 + }, + { + "epoch": 1.6359754470242862, + "grad_norm": 0.12452586757341529, + "learning_rate": 1.465813046201934e-05, + "loss": 0.6189, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5998879671096802, + "step": 6130, + "valid_targets_mean": 16457.3, + "valid_targets_min": 528 + }, + { + "epoch": 1.6373098478783028, + "grad_norm": 0.11193146868364372, + "learning_rate": 1.4554551500104971e-05, + "loss": 0.621, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6431502103805542, + "step": 6135, + "valid_targets_mean": 16036.7, + "valid_targets_min": 689 + }, + { + "epoch": 1.6386442487323192, + "grad_norm": 0.11208089126063975, + "learning_rate": 1.4451300458291401e-05, + "loss": 0.625, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6364864706993103, + "step": 6140, + "valid_targets_mean": 16052.0, + "valid_targets_min": 691 + }, + { + "epoch": 1.6399786495863358, + "grad_norm": 0.11237804561337364, + "learning_rate": 1.4348377896721635e-05, + "loss": 0.6175, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6063425540924072, + "step": 6145, + "valid_targets_mean": 16655.0, + "valid_targets_min": 663 + }, + { + "epoch": 1.6413130504403521, + "grad_norm": 0.12681529743407421, + "learning_rate": 1.4245784373756566e-05, + "loss": 0.6243, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6388323307037354, + "step": 6150, + "valid_targets_mean": 14902.1, + "valid_targets_min": 391 + }, + { + "epoch": 1.6426474512943687, + "grad_norm": 0.10827991259037892, + "learning_rate": 1.4143520445972078e-05, + "loss": 0.6307, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6546180844306946, + "step": 6155, + "valid_targets_mean": 15754.9, + "valid_targets_min": 574 + }, + { + "epoch": 1.6439818521483853, + "grad_norm": 0.11328509104388595, + "learning_rate": 1.4041586668155989e-05, + "loss": 0.6298, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6234450340270996, + "step": 6160, + "valid_targets_mean": 16188.8, + "valid_targets_min": 495 + }, + { + "epoch": 1.645316253002402, + "grad_norm": 0.11256147696959475, + "learning_rate": 1.3939983593304992e-05, + "loss": 0.6049, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5933871865272522, + "step": 6165, + "valid_targets_mean": 16867.5, + "valid_targets_min": 434 + }, + { + "epoch": 1.6466506538564185, + "grad_norm": 0.11122460509970357, + "learning_rate": 1.3838711772621743e-05, + "loss": 0.6239, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5979670882225037, + "step": 6170, + "valid_targets_mean": 15328.9, + "valid_targets_min": 561 + }, + { + "epoch": 1.647985054710435, + "grad_norm": 0.1113993401924013, + "learning_rate": 1.3737771755511811e-05, + "loss": 0.6301, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5980991721153259, + "step": 6175, + "valid_targets_mean": 15607.7, + "valid_targets_min": 19 + }, + { + "epoch": 1.6493194555644517, + "grad_norm": 0.09801233009419923, + "learning_rate": 1.3637164089580673e-05, + "loss": 0.6179, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.582968533039093, + "step": 6180, + "valid_targets_mean": 17630.9, + "valid_targets_min": 199 + }, + { + "epoch": 1.650653856418468, + "grad_norm": 0.1087711592160608, + "learning_rate": 1.3536889320630841e-05, + "loss": 0.626, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6532264947891235, + "step": 6185, + "valid_targets_mean": 16123.4, + "valid_targets_min": 702 + }, + { + "epoch": 1.6519882572724847, + "grad_norm": 0.11184043267681884, + "learning_rate": 1.3436947992658814e-05, + "loss": 0.608, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6151658892631531, + "step": 6190, + "valid_targets_mean": 16591.8, + "valid_targets_min": 613 + }, + { + "epoch": 1.6533226581265013, + "grad_norm": 0.11221188634828733, + "learning_rate": 1.3337340647852135e-05, + "loss": 0.6236, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6335886716842651, + "step": 6195, + "valid_targets_mean": 15858.9, + "valid_targets_min": 646 + }, + { + "epoch": 1.6546570589805176, + "grad_norm": 0.10263641797224998, + "learning_rate": 1.3238067826586491e-05, + "loss": 0.629, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.626166582107544, + "step": 6200, + "valid_targets_mean": 15845.0, + "valid_targets_min": 494 + }, + { + "epoch": 1.6559914598345342, + "grad_norm": 0.1338534198225952, + "learning_rate": 1.3139130067422792e-05, + "loss": 0.6255, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6296816468238831, + "step": 6205, + "valid_targets_mean": 16170.1, + "valid_targets_min": 529 + }, + { + "epoch": 1.6573258606885508, + "grad_norm": 0.12010717720533998, + "learning_rate": 1.3040527907104126e-05, + "loss": 0.6354, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6044759750366211, + "step": 6210, + "valid_targets_mean": 17815.8, + "valid_targets_min": 614 + }, + { + "epoch": 1.6586602615425674, + "grad_norm": 0.12918287791024774, + "learning_rate": 1.2942261880553012e-05, + "loss": 0.6194, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6262900829315186, + "step": 6215, + "valid_targets_mean": 16474.6, + "valid_targets_min": 677 + }, + { + "epoch": 1.659994662396584, + "grad_norm": 0.132575982276469, + "learning_rate": 1.2844332520868433e-05, + "loss": 0.6166, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5894056558609009, + "step": 6220, + "valid_targets_mean": 15954.4, + "valid_targets_min": 688 + }, + { + "epoch": 1.6613290632506006, + "grad_norm": 0.1321503283916604, + "learning_rate": 1.2746740359322857e-05, + "loss": 0.6316, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6472313404083252, + "step": 6225, + "valid_targets_mean": 13889.1, + "valid_targets_min": 259 + }, + { + "epoch": 1.6626634641046172, + "grad_norm": 0.11477171567083412, + "learning_rate": 1.2649485925359514e-05, + "loss": 0.6315, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6197164058685303, + "step": 6230, + "valid_targets_mean": 15947.2, + "valid_targets_min": 783 + }, + { + "epoch": 1.6639978649586336, + "grad_norm": 0.12877855557649734, + "learning_rate": 1.2552569746589386e-05, + "loss": 0.6129, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6343130469322205, + "step": 6235, + "valid_targets_mean": 15370.8, + "valid_targets_min": 465 + }, + { + "epoch": 1.6653322658126501, + "grad_norm": 0.09600522815823713, + "learning_rate": 1.245599234878846e-05, + "loss": 0.6177, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6135959029197693, + "step": 6240, + "valid_targets_mean": 15830.2, + "valid_targets_min": 542 + }, + { + "epoch": 1.6666666666666665, + "grad_norm": 0.11616223212883085, + "learning_rate": 1.2359754255894737e-05, + "loss": 0.6274, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.639473557472229, + "step": 6245, + "valid_targets_mean": 16264.7, + "valid_targets_min": 333 + }, + { + "epoch": 1.6680010675206831, + "grad_norm": 0.11963674310921693, + "learning_rate": 1.2263855990005527e-05, + "loss": 0.6341, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6277503967285156, + "step": 6250, + "valid_targets_mean": 16285.1, + "valid_targets_min": 764 + }, + { + "epoch": 1.6693354683746997, + "grad_norm": 0.11062418716806117, + "learning_rate": 1.2168298071374543e-05, + "loss": 0.6287, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6286278367042542, + "step": 6255, + "valid_targets_mean": 16346.8, + "valid_targets_min": 515 + }, + { + "epoch": 1.6706698692287163, + "grad_norm": 0.10960058347069801, + "learning_rate": 1.2073081018409112e-05, + "loss": 0.6193, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6018089652061462, + "step": 6260, + "valid_targets_mean": 16467.2, + "valid_targets_min": 309 + }, + { + "epoch": 1.672004270082733, + "grad_norm": 0.10255118898034118, + "learning_rate": 1.1978205347667303e-05, + "loss": 0.6278, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6391971707344055, + "step": 6265, + "valid_targets_mean": 16542.4, + "valid_targets_min": 535 + }, + { + "epoch": 1.6733386709367495, + "grad_norm": 0.10248278837455822, + "learning_rate": 1.1883671573855186e-05, + "loss": 0.6231, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6175813674926758, + "step": 6270, + "valid_targets_mean": 16722.9, + "valid_targets_min": 698 + }, + { + "epoch": 1.674673071790766, + "grad_norm": 0.10176928928958952, + "learning_rate": 1.1789480209824064e-05, + "loss": 0.6142, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5902460813522339, + "step": 6275, + "valid_targets_mean": 16472.0, + "valid_targets_min": 323 + }, + { + "epoch": 1.6760074726447824, + "grad_norm": 0.1087183247378677, + "learning_rate": 1.1695631766567562e-05, + "loss": 0.6238, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5925770401954651, + "step": 6280, + "valid_targets_mean": 17731.5, + "valid_targets_min": 623 + }, + { + "epoch": 1.677341873498799, + "grad_norm": 0.10441887834481199, + "learning_rate": 1.1602126753219005e-05, + "loss": 0.6117, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6068078875541687, + "step": 6285, + "valid_targets_mean": 15705.7, + "valid_targets_min": 167 + }, + { + "epoch": 1.6786762743528156, + "grad_norm": 0.1111444887936262, + "learning_rate": 1.1508965677048585e-05, + "loss": 0.628, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6204681396484375, + "step": 6290, + "valid_targets_mean": 15415.0, + "valid_targets_min": 258 + }, + { + "epoch": 1.680010675206832, + "grad_norm": 0.11846573698079757, + "learning_rate": 1.1416149043460562e-05, + "loss": 0.6156, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6317400336265564, + "step": 6295, + "valid_targets_mean": 15837.8, + "valid_targets_min": 436 + }, + { + "epoch": 1.6813450760608486, + "grad_norm": 0.10428763462278852, + "learning_rate": 1.132367735599066e-05, + "loss": 0.644, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6342741250991821, + "step": 6300, + "valid_targets_mean": 16270.4, + "valid_targets_min": 201 + }, + { + "epoch": 1.6826794769148652, + "grad_norm": 0.11537287186352241, + "learning_rate": 1.1231551116303162e-05, + "loss": 0.6336, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6315730810165405, + "step": 6305, + "valid_targets_mean": 15533.6, + "valid_targets_min": 463 + }, + { + "epoch": 1.6840138777688818, + "grad_norm": 0.11791504517126551, + "learning_rate": 1.1139770824188334e-05, + "loss": 0.6193, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6582194566726685, + "step": 6310, + "valid_targets_mean": 16453.3, + "valid_targets_min": 563 + }, + { + "epoch": 1.6853482786228984, + "grad_norm": 0.11369935640753852, + "learning_rate": 1.1048336977559666e-05, + "loss": 0.6189, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6206117868423462, + "step": 6315, + "valid_targets_mean": 16782.0, + "valid_targets_min": 638 + }, + { + "epoch": 1.686682679476915, + "grad_norm": 0.1105370783701265, + "learning_rate": 1.0957250072451084e-05, + "loss": 0.6292, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6181900501251221, + "step": 6320, + "valid_targets_mean": 15370.0, + "valid_targets_min": 543 + }, + { + "epoch": 1.6880170803309316, + "grad_norm": 0.11493760168455935, + "learning_rate": 1.0866510603014411e-05, + "loss": 0.634, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6352699995040894, + "step": 6325, + "valid_targets_mean": 16530.7, + "valid_targets_min": 657 + }, + { + "epoch": 1.689351481184948, + "grad_norm": 0.11362010503965773, + "learning_rate": 1.0776119061516613e-05, + "loss": 0.6304, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6385295987129211, + "step": 6330, + "valid_targets_mean": 16278.2, + "valid_targets_min": 647 + }, + { + "epoch": 1.6906858820389645, + "grad_norm": 0.09896105840122521, + "learning_rate": 1.0686075938337055e-05, + "loss": 0.6021, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5819606184959412, + "step": 6335, + "valid_targets_mean": 16842.0, + "valid_targets_min": 595 + }, + { + "epoch": 1.692020282892981, + "grad_norm": 0.11475399800879332, + "learning_rate": 1.0596381721964984e-05, + "loss": 0.6366, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.652917742729187, + "step": 6340, + "valid_targets_mean": 14536.0, + "valid_targets_min": 560 + }, + { + "epoch": 1.6933546837469975, + "grad_norm": 0.10134623003905739, + "learning_rate": 1.0507036898996787e-05, + "loss": 0.6139, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6215161681175232, + "step": 6345, + "valid_targets_mean": 16243.6, + "valid_targets_min": 651 + }, + { + "epoch": 1.694689084601014, + "grad_norm": 0.09588119258250771, + "learning_rate": 1.0418041954133346e-05, + "loss": 0.6214, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5866297483444214, + "step": 6350, + "valid_targets_mean": 15628.8, + "valid_targets_min": 290 + }, + { + "epoch": 1.6960234854550307, + "grad_norm": 0.09986891287447414, + "learning_rate": 1.032939737017745e-05, + "loss": 0.6276, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.610047459602356, + "step": 6355, + "valid_targets_mean": 15860.2, + "valid_targets_min": 355 + }, + { + "epoch": 1.6973578863090473, + "grad_norm": 0.11484316617515455, + "learning_rate": 1.02411036280312e-05, + "loss": 0.6516, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6614749431610107, + "step": 6360, + "valid_targets_mean": 15743.5, + "valid_targets_min": 542 + }, + { + "epoch": 1.6986922871630639, + "grad_norm": 0.10913443246250537, + "learning_rate": 1.0153161206693269e-05, + "loss": 0.6237, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5896070003509521, + "step": 6365, + "valid_targets_mean": 15874.9, + "valid_targets_min": 700 + }, + { + "epoch": 1.7000266880170805, + "grad_norm": 0.11212393578471182, + "learning_rate": 1.0065570583256483e-05, + "loss": 0.6234, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6237644553184509, + "step": 6370, + "valid_targets_mean": 16417.2, + "valid_targets_min": 684 + }, + { + "epoch": 1.7013610888710968, + "grad_norm": 0.1169098281301673, + "learning_rate": 9.978332232905114e-06, + "loss": 0.6162, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6001089811325073, + "step": 6375, + "valid_targets_mean": 16773.5, + "valid_targets_min": 459 + }, + { + "epoch": 1.7026954897251134, + "grad_norm": 0.10243637132312938, + "learning_rate": 9.891446628912286e-06, + "loss": 0.6244, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6666500568389893, + "step": 6380, + "valid_targets_mean": 14801.5, + "valid_targets_min": 87 + }, + { + "epoch": 1.70402989057913, + "grad_norm": 0.10482966119554739, + "learning_rate": 9.804914242637541e-06, + "loss": 0.6195, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6140177249908447, + "step": 6385, + "valid_targets_mean": 16329.9, + "valid_targets_min": 496 + }, + { + "epoch": 1.7053642914331464, + "grad_norm": 0.09782409890646393, + "learning_rate": 9.718735543524103e-06, + "loss": 0.6184, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6123791933059692, + "step": 6390, + "valid_targets_mean": 16561.2, + "valid_targets_min": 21 + }, + { + "epoch": 1.706698692287163, + "grad_norm": 0.10668349901133359, + "learning_rate": 9.632910999096486e-06, + "loss": 0.6302, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6120879650115967, + "step": 6395, + "valid_targets_mean": 16596.8, + "valid_targets_min": 605 + }, + { + "epoch": 1.7080330931411796, + "grad_norm": 0.10309181428762786, + "learning_rate": 9.547441074957884e-06, + "loss": 0.6206, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6141809225082397, + "step": 6400, + "valid_targets_mean": 16667.8, + "valid_targets_min": 615 + }, + { + "epoch": 1.7093674939951962, + "grad_norm": 0.10161441538417851, + "learning_rate": 9.462326234787621e-06, + "loss": 0.6177, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6218645572662354, + "step": 6405, + "valid_targets_mean": 15889.5, + "valid_targets_min": 559 + }, + { + "epoch": 1.7107018948492128, + "grad_norm": 0.10421604528090228, + "learning_rate": 9.377566940338712e-06, + "loss": 0.6341, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6338856220245361, + "step": 6410, + "valid_targets_mean": 17526.1, + "valid_targets_min": 116 + }, + { + "epoch": 1.7120362957032293, + "grad_norm": 0.09632850265502085, + "learning_rate": 9.293163651435298e-06, + "loss": 0.6171, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6092801094055176, + "step": 6415, + "valid_targets_mean": 16826.8, + "valid_targets_min": 428 + }, + { + "epoch": 1.713370696557246, + "grad_norm": 0.14268700677759225, + "learning_rate": 9.20911682597015e-06, + "loss": 0.6092, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6385226249694824, + "step": 6420, + "valid_targets_mean": 15199.0, + "valid_targets_min": 600 + }, + { + "epoch": 1.7147050974112623, + "grad_norm": 0.1141300203133269, + "learning_rate": 9.125426919902231e-06, + "loss": 0.5973, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6092257499694824, + "step": 6425, + "valid_targets_mean": 16535.1, + "valid_targets_min": 706 + }, + { + "epoch": 1.716039498265279, + "grad_norm": 0.10828299644111676, + "learning_rate": 9.042094387254212e-06, + "loss": 0.622, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6178991794586182, + "step": 6430, + "valid_targets_mean": 14752.1, + "valid_targets_min": 120 + }, + { + "epoch": 1.7173738991192953, + "grad_norm": 0.11398118285533808, + "learning_rate": 8.959119680109918e-06, + "loss": 0.6139, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6384214162826538, + "step": 6435, + "valid_targets_mean": 15340.4, + "valid_targets_min": 510 + }, + { + "epoch": 1.7187082999733119, + "grad_norm": 0.10092605169272632, + "learning_rate": 8.876503248612036e-06, + "loss": 0.6222, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6220699548721313, + "step": 6440, + "valid_targets_mean": 15507.5, + "valid_targets_min": 455 + }, + { + "epoch": 1.7200427008273285, + "grad_norm": 0.11330458786874878, + "learning_rate": 8.794245540959546e-06, + "loss": 0.6221, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6084585785865784, + "step": 6445, + "valid_targets_mean": 17206.7, + "valid_targets_min": 822 + }, + { + "epoch": 1.721377101681345, + "grad_norm": 0.10025211270623526, + "learning_rate": 8.712347003405304e-06, + "loss": 0.6093, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6082017421722412, + "step": 6450, + "valid_targets_mean": 15802.1, + "valid_targets_min": 626 + }, + { + "epoch": 1.7227115025353616, + "grad_norm": 0.09997128198065185, + "learning_rate": 8.630808080253701e-06, + "loss": 0.6162, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6296147704124451, + "step": 6455, + "valid_targets_mean": 16807.6, + "valid_targets_min": 785 + }, + { + "epoch": 1.7240459033893782, + "grad_norm": 0.10414111634434077, + "learning_rate": 8.549629213858192e-06, + "loss": 0.6194, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.631471574306488, + "step": 6460, + "valid_targets_mean": 16801.4, + "valid_targets_min": 360 + }, + { + "epoch": 1.7253803042433948, + "grad_norm": 0.10504156485164873, + "learning_rate": 8.468810844618842e-06, + "loss": 0.629, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6191542148590088, + "step": 6465, + "valid_targets_mean": 15910.0, + "valid_targets_min": 562 + }, + { + "epoch": 1.7267147050974114, + "grad_norm": 0.11531327546603624, + "learning_rate": 8.388353410980075e-06, + "loss": 0.6222, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6417456865310669, + "step": 6470, + "valid_targets_mean": 16802.6, + "valid_targets_min": 444 + }, + { + "epoch": 1.7280491059514278, + "grad_norm": 0.10884658145661602, + "learning_rate": 8.308257349428154e-06, + "loss": 0.617, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6139084100723267, + "step": 6475, + "valid_targets_mean": 16511.0, + "valid_targets_min": 529 + }, + { + "epoch": 1.7293835068054444, + "grad_norm": 0.10834253980457187, + "learning_rate": 8.228523094488928e-06, + "loss": 0.6147, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.656073808670044, + "step": 6480, + "valid_targets_mean": 14856.8, + "valid_targets_min": 355 + }, + { + "epoch": 1.7307179076594608, + "grad_norm": 0.10406939979420007, + "learning_rate": 8.149151078725416e-06, + "loss": 0.6319, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6458457708358765, + "step": 6485, + "valid_targets_mean": 15603.7, + "valid_targets_min": 503 + }, + { + "epoch": 1.7320523085134774, + "grad_norm": 0.0983819920288647, + "learning_rate": 8.070141732735424e-06, + "loss": 0.6173, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6092060804367065, + "step": 6490, + "valid_targets_mean": 16581.9, + "valid_targets_min": 456 + }, + { + "epoch": 1.733386709367494, + "grad_norm": 0.10687437145067663, + "learning_rate": 7.991495485149294e-06, + "loss": 0.6272, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6291359663009644, + "step": 6495, + "valid_targets_mean": 15324.7, + "valid_targets_min": 861 + }, + { + "epoch": 1.7347211102215105, + "grad_norm": 0.09660211319603874, + "learning_rate": 7.913212762627539e-06, + "loss": 0.6255, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6016951203346252, + "step": 6500, + "valid_targets_mean": 16839.8, + "valid_targets_min": 476 + }, + { + "epoch": 1.7360555110755271, + "grad_norm": 0.09778142185019807, + "learning_rate": 7.835293989858527e-06, + "loss": 0.6234, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6057382225990295, + "step": 6505, + "valid_targets_mean": 16022.5, + "valid_targets_min": 631 + }, + { + "epoch": 1.7373899119295437, + "grad_norm": 0.10616126123251467, + "learning_rate": 7.75773958955614e-06, + "loss": 0.6115, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6232156753540039, + "step": 6510, + "valid_targets_mean": 15161.9, + "valid_targets_min": 603 + }, + { + "epoch": 1.7387243127835603, + "grad_norm": 0.1107579677431388, + "learning_rate": 7.680549982457553e-06, + "loss": 0.6259, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6101968288421631, + "step": 6515, + "valid_targets_mean": 15299.2, + "valid_targets_min": 459 + }, + { + "epoch": 1.7400587136375767, + "grad_norm": 0.10381732514792791, + "learning_rate": 7.6037255873209165e-06, + "loss": 0.6347, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6579749584197998, + "step": 6520, + "valid_targets_mean": 17051.9, + "valid_targets_min": 38 + }, + { + "epoch": 1.7413931144915933, + "grad_norm": 0.09614501769644973, + "learning_rate": 7.527266820923089e-06, + "loss": 0.6265, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6192217469215393, + "step": 6525, + "valid_targets_mean": 16462.7, + "valid_targets_min": 50 + }, + { + "epoch": 1.7427275153456097, + "grad_norm": 0.0990367797322132, + "learning_rate": 7.45117409805733e-06, + "loss": 0.6227, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6273068189620972, + "step": 6530, + "valid_targets_mean": 15751.7, + "valid_targets_min": 463 + }, + { + "epoch": 1.7440619161996262, + "grad_norm": 0.09931179454623716, + "learning_rate": 7.375447831531128e-06, + "loss": 0.6198, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5904843211174011, + "step": 6535, + "valid_targets_mean": 15938.6, + "valid_targets_min": 787 + }, + { + "epoch": 1.7453963170536428, + "grad_norm": 0.09179141156609635, + "learning_rate": 7.300088432163945e-06, + "loss": 0.6215, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6543793678283691, + "step": 6540, + "valid_targets_mean": 16912.6, + "valid_targets_min": 299 + }, + { + "epoch": 1.7467307179076594, + "grad_norm": 0.10288250755398817, + "learning_rate": 7.2250963087849e-06, + "loss": 0.602, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6032967567443848, + "step": 6545, + "valid_targets_mean": 14788.7, + "valid_targets_min": 579 + }, + { + "epoch": 1.748065118761676, + "grad_norm": 0.10263235031062287, + "learning_rate": 7.1504718682306754e-06, + "loss": 0.6276, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6326683163642883, + "step": 6550, + "valid_targets_mean": 14526.3, + "valid_targets_min": 444 + }, + { + "epoch": 1.7493995196156926, + "grad_norm": 0.0976976803425861, + "learning_rate": 7.076215515343256e-06, + "loss": 0.6152, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6148498058319092, + "step": 6555, + "valid_targets_mean": 15711.9, + "valid_targets_min": 251 + }, + { + "epoch": 1.7507339204697092, + "grad_norm": 0.1025678208255761, + "learning_rate": 7.0023276529676655e-06, + "loss": 0.6431, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6772218942642212, + "step": 6560, + "valid_targets_mean": 15850.6, + "valid_targets_min": 325 + }, + { + "epoch": 1.7520683213237258, + "grad_norm": 0.09645792081965308, + "learning_rate": 6.928808681949919e-06, + "loss": 0.6173, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6133409738540649, + "step": 6565, + "valid_targets_mean": 15282.2, + "valid_targets_min": 601 + }, + { + "epoch": 1.7534027221777422, + "grad_norm": 0.0914832409321191, + "learning_rate": 6.855659001134739e-06, + "loss": 0.6368, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.609194815158844, + "step": 6570, + "valid_targets_mean": 15832.7, + "valid_targets_min": 368 + }, + { + "epoch": 1.7547371230317588, + "grad_norm": 0.09547658611807025, + "learning_rate": 6.78287900736342e-06, + "loss": 0.618, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6080896854400635, + "step": 6575, + "valid_targets_mean": 16496.8, + "valid_targets_min": 563 + }, + { + "epoch": 1.7560715238857751, + "grad_norm": 0.09427204552893005, + "learning_rate": 6.710469095471701e-06, + "loss": 0.6122, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6215167045593262, + "step": 6580, + "valid_targets_mean": 17439.6, + "valid_targets_min": 262 + }, + { + "epoch": 1.7574059247397917, + "grad_norm": 0.09694008938352663, + "learning_rate": 6.638429658287603e-06, + "loss": 0.6204, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5812457799911499, + "step": 6585, + "valid_targets_mean": 15750.2, + "valid_targets_min": 625 + }, + { + "epoch": 1.7587403255938083, + "grad_norm": 0.10046226105291199, + "learning_rate": 6.566761086629285e-06, + "loss": 0.6166, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6253821849822998, + "step": 6590, + "valid_targets_mean": 17012.2, + "valid_targets_min": 762 + }, + { + "epoch": 1.760074726447825, + "grad_norm": 0.10557213616677373, + "learning_rate": 6.495463769302952e-06, + "loss": 0.6269, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6374891996383667, + "step": 6595, + "valid_targets_mean": 15844.3, + "valid_targets_min": 751 + }, + { + "epoch": 1.7614091273018415, + "grad_norm": 0.10711113282060361, + "learning_rate": 6.424538093100745e-06, + "loss": 0.6302, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6101715564727783, + "step": 6600, + "valid_targets_mean": 15971.3, + "valid_targets_min": 524 + }, + { + "epoch": 1.762743528155858, + "grad_norm": 0.08854100780900193, + "learning_rate": 6.353984442798582e-06, + "loss": 0.6273, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5808321237564087, + "step": 6605, + "valid_targets_mean": 17444.8, + "valid_targets_min": 582 + }, + { + "epoch": 1.7640779290098747, + "grad_norm": 0.10110922215288053, + "learning_rate": 6.283803201154173e-06, + "loss": 0.6126, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6101663708686829, + "step": 6610, + "valid_targets_mean": 17214.1, + "valid_targets_min": 414 + }, + { + "epoch": 1.765412329863891, + "grad_norm": 0.20493053145002474, + "learning_rate": 6.213994748904866e-06, + "loss": 0.6174, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6190000772476196, + "step": 6615, + "valid_targets_mean": 16494.0, + "valid_targets_min": 698 + }, + { + "epoch": 1.7667467307179077, + "grad_norm": 0.09578545081324519, + "learning_rate": 6.144559464765605e-06, + "loss": 0.6216, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.592930257320404, + "step": 6620, + "valid_targets_mean": 16264.1, + "valid_targets_min": 442 + }, + { + "epoch": 1.7680811315719243, + "grad_norm": 0.10950373475500869, + "learning_rate": 6.075497725426862e-06, + "loss": 0.6267, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6404623985290527, + "step": 6625, + "valid_targets_mean": 15382.0, + "valid_targets_min": 368 + }, + { + "epoch": 1.7694155324259406, + "grad_norm": 0.099924757154183, + "learning_rate": 6.0068099055526505e-06, + "loss": 0.6325, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6134600639343262, + "step": 6630, + "valid_targets_mean": 16468.3, + "valid_targets_min": 548 + }, + { + "epoch": 1.7707499332799572, + "grad_norm": 0.10276845222389408, + "learning_rate": 5.938496377778395e-06, + "loss": 0.6277, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6179153919219971, + "step": 6635, + "valid_targets_mean": 15734.6, + "valid_targets_min": 678 + }, + { + "epoch": 1.7720843341339738, + "grad_norm": 0.10264895930540381, + "learning_rate": 5.870557512709001e-06, + "loss": 0.6237, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.611757755279541, + "step": 6640, + "valid_targets_mean": 16182.3, + "valid_targets_min": 415 + }, + { + "epoch": 1.7734187349879904, + "grad_norm": 0.10089157369476227, + "learning_rate": 5.802993678916773e-06, + "loss": 0.6333, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6308541297912598, + "step": 6645, + "valid_targets_mean": 15795.2, + "valid_targets_min": 688 + }, + { + "epoch": 1.774753135842007, + "grad_norm": 0.09778285328051206, + "learning_rate": 5.7358052429394785e-06, + "loss": 0.6253, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.614090085029602, + "step": 6650, + "valid_targets_mean": 16161.4, + "valid_targets_min": 296 + }, + { + "epoch": 1.7760875366960236, + "grad_norm": 0.09629551427385658, + "learning_rate": 5.668992569278347e-06, + "loss": 0.6242, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6327216625213623, + "step": 6655, + "valid_targets_mean": 15158.7, + "valid_targets_min": 526 + }, + { + "epoch": 1.7774219375500402, + "grad_norm": 0.09088615364424045, + "learning_rate": 5.602556020396004e-06, + "loss": 0.604, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.596990704536438, + "step": 6660, + "valid_targets_mean": 16353.3, + "valid_targets_min": 144 + }, + { + "epoch": 1.7787563384040566, + "grad_norm": 0.09034274812917362, + "learning_rate": 5.5364959567146514e-06, + "loss": 0.624, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6033511161804199, + "step": 6665, + "valid_targets_mean": 16006.4, + "valid_targets_min": 654 + }, + { + "epoch": 1.7800907392580732, + "grad_norm": 0.10302388333968907, + "learning_rate": 5.470812736614014e-06, + "loss": 0.6278, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6411268711090088, + "step": 6670, + "valid_targets_mean": 14318.7, + "valid_targets_min": 633 + }, + { + "epoch": 1.7814251401120895, + "grad_norm": 0.09713243549010361, + "learning_rate": 5.405506716429378e-06, + "loss": 0.62, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6400075554847717, + "step": 6675, + "valid_targets_mean": 16221.4, + "valid_targets_min": 192 + }, + { + "epoch": 1.7827595409661061, + "grad_norm": 0.09115390102874049, + "learning_rate": 5.340578250449742e-06, + "loss": 0.6066, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5856536626815796, + "step": 6680, + "valid_targets_mean": 16640.9, + "valid_targets_min": 517 + }, + { + "epoch": 1.7840939418201227, + "grad_norm": 0.09460582406704682, + "learning_rate": 5.276027690915868e-06, + "loss": 0.6335, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6678420305252075, + "step": 6685, + "valid_targets_mean": 16394.7, + "valid_targets_min": 376 + }, + { + "epoch": 1.7854283426741393, + "grad_norm": 0.09718467678046305, + "learning_rate": 5.211855388018282e-06, + "loss": 0.6329, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6457293629646301, + "step": 6690, + "valid_targets_mean": 16005.6, + "valid_targets_min": 761 + }, + { + "epoch": 1.786762743528156, + "grad_norm": 0.09177107012065362, + "learning_rate": 5.148061689895519e-06, + "loss": 0.6356, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6243642568588257, + "step": 6695, + "valid_targets_mean": 15437.2, + "valid_targets_min": 695 + }, + { + "epoch": 1.7880971443821725, + "grad_norm": 0.10024429506027321, + "learning_rate": 5.084646942632123e-06, + "loss": 0.6149, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.591733455657959, + "step": 6700, + "valid_targets_mean": 16580.0, + "valid_targets_min": 616 + }, + { + "epoch": 1.789431545236189, + "grad_norm": 0.10069899627284365, + "learning_rate": 5.0216114902567995e-06, + "loss": 0.6165, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.649412989616394, + "step": 6705, + "valid_targets_mean": 14921.5, + "valid_targets_min": 501 + }, + { + "epoch": 1.7907659460902055, + "grad_norm": 0.09197071177860598, + "learning_rate": 4.9589556747406e-06, + "loss": 0.6132, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6070678234100342, + "step": 6710, + "valid_targets_mean": 16360.8, + "valid_targets_min": 311 + }, + { + "epoch": 1.792100346944222, + "grad_norm": 0.09280745282636378, + "learning_rate": 4.896679835994965e-06, + "loss": 0.6083, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5776534676551819, + "step": 6715, + "valid_targets_mean": 16509.3, + "valid_targets_min": 165 + }, + { + "epoch": 1.7934347477982386, + "grad_norm": 0.08650443355926254, + "learning_rate": 4.834784311869985e-06, + "loss": 0.606, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5921191573143005, + "step": 6720, + "valid_targets_mean": 16442.8, + "valid_targets_min": 342 + }, + { + "epoch": 1.794769148652255, + "grad_norm": 0.1016813277797864, + "learning_rate": 4.773269438152516e-06, + "loss": 0.6313, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.631247878074646, + "step": 6725, + "valid_targets_mean": 14925.6, + "valid_targets_min": 605 + }, + { + "epoch": 1.7961035495062716, + "grad_norm": 0.08980829163466826, + "learning_rate": 4.712135548564333e-06, + "loss": 0.6032, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.625686764717102, + "step": 6730, + "valid_targets_mean": 16406.4, + "valid_targets_min": 817 + }, + { + "epoch": 1.7974379503602882, + "grad_norm": 0.09012413974461835, + "learning_rate": 4.651382974760382e-06, + "loss": 0.6265, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6504734754562378, + "step": 6735, + "valid_targets_mean": 16003.1, + "valid_targets_min": 433 + }, + { + "epoch": 1.7987723512143048, + "grad_norm": 0.09455961172931404, + "learning_rate": 4.591012046326944e-06, + "loss": 0.6138, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6531174778938293, + "step": 6740, + "valid_targets_mean": 15780.7, + "valid_targets_min": 675 + }, + { + "epoch": 1.8001067520683214, + "grad_norm": 0.08931663578747313, + "learning_rate": 4.5310230907798285e-06, + "loss": 0.6212, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6175740957260132, + "step": 6745, + "valid_targets_mean": 15773.0, + "valid_targets_min": 257 + }, + { + "epoch": 1.801441152922338, + "grad_norm": 0.09386050236286557, + "learning_rate": 4.471416433562638e-06, + "loss": 0.6148, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6489225625991821, + "step": 6750, + "valid_targets_mean": 16038.3, + "valid_targets_min": 724 + }, + { + "epoch": 1.8027755537763546, + "grad_norm": 0.2394574484960667, + "learning_rate": 4.412192398044997e-06, + "loss": 0.611, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5736192464828491, + "step": 6755, + "valid_targets_mean": 16190.5, + "valid_targets_min": 18 + }, + { + "epoch": 1.804109954630371, + "grad_norm": 0.10661505123251912, + "learning_rate": 4.353351305520747e-06, + "loss": 0.6223, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6465322375297546, + "step": 6760, + "valid_targets_mean": 17468.6, + "valid_targets_min": 635 + }, + { + "epoch": 1.8054443554843875, + "grad_norm": 0.09541439718146676, + "learning_rate": 4.2948934752062655e-06, + "loss": 0.6358, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6139446496963501, + "step": 6765, + "valid_targets_mean": 17065.6, + "valid_targets_min": 512 + }, + { + "epoch": 1.806778756338404, + "grad_norm": 0.09386372933318869, + "learning_rate": 4.2368192242387355e-06, + "loss": 0.627, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6409814357757568, + "step": 6770, + "valid_targets_mean": 14635.9, + "valid_targets_min": 329 + }, + { + "epoch": 1.8081131571924205, + "grad_norm": 0.10396463801811591, + "learning_rate": 4.179128867674348e-06, + "loss": 0.6016, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6246637105941772, + "step": 6775, + "valid_targets_mean": 17589.5, + "valid_targets_min": 257 + }, + { + "epoch": 1.809447558046437, + "grad_norm": 0.10734828990482441, + "learning_rate": 4.121822718486664e-06, + "loss": 0.6237, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6268129944801331, + "step": 6780, + "valid_targets_mean": 15491.9, + "valid_targets_min": 480 + }, + { + "epoch": 1.8107819589004537, + "grad_norm": 0.1001303927768195, + "learning_rate": 4.064901087564918e-06, + "loss": 0.6359, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6495320200920105, + "step": 6785, + "valid_targets_mean": 14824.9, + "valid_targets_min": 744 + }, + { + "epoch": 1.8121163597544703, + "grad_norm": 0.09842864829102572, + "learning_rate": 4.008364283712298e-06, + "loss": 0.6049, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6317485570907593, + "step": 6790, + "valid_targets_mean": 15738.1, + "valid_targets_min": 790 + }, + { + "epoch": 1.8134507606084869, + "grad_norm": 0.10150505686914285, + "learning_rate": 3.9522126136442515e-06, + "loss": 0.613, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6200088858604431, + "step": 6795, + "valid_targets_mean": 17679.3, + "valid_targets_min": 696 + }, + { + "epoch": 1.8147851614625035, + "grad_norm": 0.10700599241927931, + "learning_rate": 3.896446381986901e-06, + "loss": 0.6174, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6170170307159424, + "step": 6800, + "valid_targets_mean": 15742.3, + "valid_targets_min": 20 + }, + { + "epoch": 1.8161195623165198, + "grad_norm": 0.09039156496096841, + "learning_rate": 3.841065891275328e-06, + "loss": 0.6106, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6032929420471191, + "step": 6805, + "valid_targets_mean": 16021.7, + "valid_targets_min": 308 + }, + { + "epoch": 1.8174539631705364, + "grad_norm": 0.08908389333812784, + "learning_rate": 3.786071441951918e-06, + "loss": 0.6003, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6013544201850891, + "step": 6810, + "valid_targets_mean": 14962.3, + "valid_targets_min": 470 + }, + { + "epoch": 1.818788364024553, + "grad_norm": 0.08782159043693183, + "learning_rate": 3.7314633323647952e-06, + "loss": 0.6287, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6162735819816589, + "step": 6815, + "valid_targets_mean": 15977.1, + "valid_targets_min": 420 + }, + { + "epoch": 1.8201227648785694, + "grad_norm": 0.09504087980101503, + "learning_rate": 3.6772418587661474e-06, + "loss": 0.6185, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6311695575714111, + "step": 6820, + "valid_targets_mean": 16229.0, + "valid_targets_min": 608 + }, + { + "epoch": 1.821457165732586, + "grad_norm": 0.09507045562862382, + "learning_rate": 3.623407315310667e-06, + "loss": 0.6392, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6561924815177917, + "step": 6825, + "valid_targets_mean": 15305.6, + "valid_targets_min": 506 + }, + { + "epoch": 1.8227915665866026, + "grad_norm": 0.09690981421722983, + "learning_rate": 3.5699599940538836e-06, + "loss": 0.622, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6211844086647034, + "step": 6830, + "valid_targets_mean": 15366.9, + "valid_targets_min": 640 + }, + { + "epoch": 1.8241259674406192, + "grad_norm": 0.09590079146274327, + "learning_rate": 3.5169001849506496e-06, + "loss": 0.6443, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6609474420547485, + "step": 6835, + "valid_targets_mean": 15275.2, + "valid_targets_min": 541 + }, + { + "epoch": 1.8254603682946358, + "grad_norm": 0.08760180167427375, + "learning_rate": 3.4642281758535645e-06, + "loss": 0.6246, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5892127752304077, + "step": 6840, + "valid_targets_mean": 16206.0, + "valid_targets_min": 701 + }, + { + "epoch": 1.8267947691486524, + "grad_norm": 0.09239379002212816, + "learning_rate": 3.4119442525113283e-06, + "loss": 0.6236, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5922919511795044, + "step": 6845, + "valid_targets_mean": 15991.8, + "valid_targets_min": 513 + }, + { + "epoch": 1.828129170002669, + "grad_norm": 0.0946090785298155, + "learning_rate": 3.3600486985673163e-06, + "loss": 0.6147, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6722390651702881, + "step": 6850, + "valid_targets_mean": 14939.3, + "valid_targets_min": 749 + }, + { + "epoch": 1.8294635708566853, + "grad_norm": 0.09402100238995499, + "learning_rate": 3.308541795557948e-06, + "loss": 0.6244, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6498205661773682, + "step": 6855, + "valid_targets_mean": 14678.4, + "valid_targets_min": 582 + }, + { + "epoch": 1.830797971710702, + "grad_norm": 0.09131839871535954, + "learning_rate": 3.2574238229111704e-06, + "loss": 0.6201, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5872923135757446, + "step": 6860, + "valid_targets_mean": 15649.0, + "valid_targets_min": 544 + }, + { + "epoch": 1.8321323725647183, + "grad_norm": 0.09225730410624328, + "learning_rate": 3.2066950579450024e-06, + "loss": 0.6118, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5875071287155151, + "step": 6865, + "valid_targets_mean": 16057.5, + "valid_targets_min": 57 + }, + { + "epoch": 1.8334667734187349, + "grad_norm": 0.09345988443966001, + "learning_rate": 3.156355775865968e-06, + "loss": 0.6076, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6212291717529297, + "step": 6870, + "valid_targets_mean": 15905.6, + "valid_targets_min": 274 + }, + { + "epoch": 1.8348011742727515, + "grad_norm": 0.09836957478446351, + "learning_rate": 3.106406249767607e-06, + "loss": 0.6107, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6226930618286133, + "step": 6875, + "valid_targets_mean": 15694.5, + "valid_targets_min": 584 + }, + { + "epoch": 1.836135575126768, + "grad_norm": 0.0935003323911921, + "learning_rate": 3.056846750629041e-06, + "loss": 0.6327, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6048910021781921, + "step": 6880, + "valid_targets_mean": 16648.4, + "valid_targets_min": 497 + }, + { + "epoch": 1.8374699759807847, + "grad_norm": 0.0996757747150725, + "learning_rate": 3.007677547313436e-06, + "loss": 0.6252, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6208453178405762, + "step": 6885, + "valid_targets_mean": 16256.8, + "valid_targets_min": 795 + }, + { + "epoch": 1.8388043768348012, + "grad_norm": 0.08849021655160869, + "learning_rate": 2.958898906566626e-06, + "loss": 0.6258, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6154869794845581, + "step": 6890, + "valid_targets_mean": 16353.3, + "valid_targets_min": 404 + }, + { + "epoch": 1.8401387776888178, + "grad_norm": 0.08928376035381869, + "learning_rate": 2.910511093015588e-06, + "loss": 0.6283, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6386107206344604, + "step": 6895, + "valid_targets_mean": 15752.9, + "valid_targets_min": 639 + }, + { + "epoch": 1.8414731785428344, + "grad_norm": 0.09861416715637732, + "learning_rate": 2.8625143691670404e-06, + "loss": 0.6164, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6506497859954834, + "step": 6900, + "valid_targets_mean": 14408.1, + "valid_targets_min": 427 + }, + { + "epoch": 1.8428075793968508, + "grad_norm": 0.09163939734191671, + "learning_rate": 2.8149089954060287e-06, + "loss": 0.6141, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.597012996673584, + "step": 6905, + "valid_targets_mean": 15989.0, + "valid_targets_min": 200 + }, + { + "epoch": 1.8441419802508674, + "grad_norm": 0.08995619879356641, + "learning_rate": 2.767695229994507e-06, + "loss": 0.6416, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6536890268325806, + "step": 6910, + "valid_targets_mean": 17191.4, + "valid_targets_min": 475 + }, + { + "epoch": 1.8454763811048838, + "grad_norm": 0.0839875319084046, + "learning_rate": 2.720873329069895e-06, + "loss": 0.6183, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5766624808311462, + "step": 6915, + "valid_targets_mean": 17233.1, + "valid_targets_min": 591 + }, + { + "epoch": 1.8468107819589004, + "grad_norm": 0.09083917258196791, + "learning_rate": 2.6744435466437535e-06, + "loss": 0.6195, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6382717490196228, + "step": 6920, + "valid_targets_mean": 14588.1, + "valid_targets_min": 100 + }, + { + "epoch": 1.848145182812917, + "grad_norm": 0.08650332344005253, + "learning_rate": 2.6284061346004055e-06, + "loss": 0.6177, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6030929684638977, + "step": 6925, + "valid_targets_mean": 16558.5, + "valid_targets_min": 384 + }, + { + "epoch": 1.8494795836669335, + "grad_norm": 0.09444305089496056, + "learning_rate": 2.5827613426954664e-06, + "loss": 0.6256, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6380075216293335, + "step": 6930, + "valid_targets_mean": 14690.7, + "valid_targets_min": 563 + }, + { + "epoch": 1.8508139845209501, + "grad_norm": 0.09483051297100908, + "learning_rate": 2.537509418554631e-06, + "loss": 0.6215, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6225526332855225, + "step": 6935, + "valid_targets_mean": 15293.6, + "valid_targets_min": 486 + }, + { + "epoch": 1.8521483853749667, + "grad_norm": 0.10046672290201178, + "learning_rate": 2.4926506076722417e-06, + "loss": 0.6288, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6159603595733643, + "step": 6940, + "valid_targets_mean": 15709.3, + "valid_targets_min": 642 + }, + { + "epoch": 1.8534827862289833, + "grad_norm": 0.08827032404875429, + "learning_rate": 2.4481851534099707e-06, + "loss": 0.6151, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5953460931777954, + "step": 6945, + "valid_targets_mean": 15381.7, + "valid_targets_min": 567 + }, + { + "epoch": 1.8548171870829997, + "grad_norm": 0.08758508845183906, + "learning_rate": 2.404113296995505e-06, + "loss": 0.6321, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6001626253128052, + "step": 6950, + "valid_targets_mean": 15501.0, + "valid_targets_min": 655 + }, + { + "epoch": 1.8561515879370163, + "grad_norm": 0.08709771266028127, + "learning_rate": 2.360435277521275e-06, + "loss": 0.6201, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6188645958900452, + "step": 6955, + "valid_targets_mean": 16469.7, + "valid_targets_min": 118 + }, + { + "epoch": 1.8574859887910327, + "grad_norm": 0.09427280621483805, + "learning_rate": 2.3171513319430596e-06, + "loss": 0.6346, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.649395227432251, + "step": 6960, + "valid_targets_mean": 14874.3, + "valid_targets_min": 455 + }, + { + "epoch": 1.8588203896450493, + "grad_norm": 0.0808931066414944, + "learning_rate": 2.274261695078841e-06, + "loss": 0.6268, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6024237871170044, + "step": 6965, + "valid_targets_mean": 17161.4, + "valid_targets_min": 712 + }, + { + "epoch": 1.8601547904990658, + "grad_norm": 0.08414593552341547, + "learning_rate": 2.231766599607371e-06, + "loss": 0.5995, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5632792711257935, + "step": 6970, + "valid_targets_mean": 15532.3, + "valid_targets_min": 686 + }, + { + "epoch": 1.8614891913530824, + "grad_norm": 0.09441058517305718, + "learning_rate": 2.1896662760670618e-06, + "loss": 0.621, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6468135714530945, + "step": 6975, + "valid_targets_mean": 16032.7, + "valid_targets_min": 290 + }, + { + "epoch": 1.862823592207099, + "grad_norm": 0.0851258200952786, + "learning_rate": 2.1479609528546328e-06, + "loss": 0.6248, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6156222820281982, + "step": 6980, + "valid_targets_mean": 16126.7, + "valid_targets_min": 747 + }, + { + "epoch": 1.8641579930611156, + "grad_norm": 0.08353380996015211, + "learning_rate": 2.106650856223899e-06, + "loss": 0.6274, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6163721084594727, + "step": 6985, + "valid_targets_mean": 16980.7, + "valid_targets_min": 872 + }, + { + "epoch": 1.8654923939151322, + "grad_norm": 0.0901724183069621, + "learning_rate": 2.0657362102845576e-06, + "loss": 0.6138, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6244465112686157, + "step": 6990, + "valid_targets_mean": 14835.6, + "valid_targets_min": 669 + }, + { + "epoch": 1.8668267947691488, + "grad_norm": 0.3287515102847484, + "learning_rate": 2.0252172370009646e-06, + "loss": 0.6018, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.603171169757843, + "step": 6995, + "valid_targets_mean": 16227.0, + "valid_targets_min": 585 + }, + { + "epoch": 1.8681611956231652, + "grad_norm": 0.08880212175295829, + "learning_rate": 1.985094156190925e-06, + "loss": 0.6345, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6128568649291992, + "step": 7000, + "valid_targets_mean": 16593.5, + "valid_targets_min": 351 + }, + { + "epoch": 1.8694955964771818, + "grad_norm": 0.09309393580041371, + "learning_rate": 1.9453671855244963e-06, + "loss": 0.6211, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6289182901382446, + "step": 7005, + "valid_targets_mean": 16403.7, + "valid_targets_min": 658 + }, + { + "epoch": 1.8708299973311981, + "grad_norm": 0.09480583622572787, + "learning_rate": 1.906036540522829e-06, + "loss": 0.6272, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6634846329689026, + "step": 7010, + "valid_targets_mean": 15357.0, + "valid_targets_min": 540 + }, + { + "epoch": 1.8721643981852147, + "grad_norm": 0.08715063530216999, + "learning_rate": 1.8671024345569773e-06, + "loss": 0.6295, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6392030119895935, + "step": 7015, + "valid_targets_mean": 16358.6, + "valid_targets_min": 695 + }, + { + "epoch": 1.8734987990392313, + "grad_norm": 0.08347898430310177, + "learning_rate": 1.8285650788467415e-06, + "loss": 0.6117, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5922134518623352, + "step": 7020, + "valid_targets_mean": 16060.0, + "valid_targets_min": 478 + }, + { + "epoch": 1.874833199893248, + "grad_norm": 0.08718723584074349, + "learning_rate": 1.7904246824595514e-06, + "loss": 0.621, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6190272569656372, + "step": 7025, + "valid_targets_mean": 16108.1, + "valid_targets_min": 774 + }, + { + "epoch": 1.8761676007472645, + "grad_norm": 0.08913725712331906, + "learning_rate": 1.7526814523092763e-06, + "loss": 0.634, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6637852787971497, + "step": 7030, + "valid_targets_mean": 14897.7, + "valid_targets_min": 638 + }, + { + "epoch": 1.8775020016012811, + "grad_norm": 0.09023604956675488, + "learning_rate": 1.7153355931551592e-06, + "loss": 0.6462, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6529320478439331, + "step": 7035, + "valid_targets_mean": 15052.8, + "valid_targets_min": 601 + }, + { + "epoch": 1.8788364024552977, + "grad_norm": 0.09370662512546263, + "learning_rate": 1.678387307600676e-06, + "loss": 0.6337, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6144789457321167, + "step": 7040, + "valid_targets_mean": 15715.4, + "valid_targets_min": 506 + }, + { + "epoch": 1.880170803309314, + "grad_norm": 0.08469020269460416, + "learning_rate": 1.6418367960924271e-06, + "loss": 0.6135, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6082459688186646, + "step": 7045, + "valid_targets_mean": 15793.0, + "valid_targets_min": 474 + }, + { + "epoch": 1.8815052041633307, + "grad_norm": 0.08138453596006119, + "learning_rate": 1.6056842569190987e-06, + "loss": 0.6217, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5803401470184326, + "step": 7050, + "valid_targets_mean": 16992.2, + "valid_targets_min": 668 + }, + { + "epoch": 1.8828396050173473, + "grad_norm": 0.08643291719031197, + "learning_rate": 1.5699298862103276e-06, + "loss": 0.6179, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6261525750160217, + "step": 7055, + "valid_targets_mean": 16001.4, + "valid_targets_min": 379 + }, + { + "epoch": 1.8841740058713636, + "grad_norm": 0.0938394622153444, + "learning_rate": 1.5345738779356714e-06, + "loss": 0.6301, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6548340320587158, + "step": 7060, + "valid_targets_mean": 15555.3, + "valid_targets_min": 710 + }, + { + "epoch": 1.8855084067253802, + "grad_norm": 0.09162369025565296, + "learning_rate": 1.4996164239035408e-06, + "loss": 0.6039, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.593757152557373, + "step": 7065, + "valid_targets_mean": 15477.0, + "valid_targets_min": 731 + }, + { + "epoch": 1.8868428075793968, + "grad_norm": 0.08752477920167435, + "learning_rate": 1.4650577137601843e-06, + "loss": 0.6246, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6162948608398438, + "step": 7070, + "valid_targets_mean": 15712.4, + "valid_targets_min": 846 + }, + { + "epoch": 1.8881772084334134, + "grad_norm": 0.08378801161427556, + "learning_rate": 1.4308979349886146e-06, + "loss": 0.6202, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6429492235183716, + "step": 7075, + "valid_targets_mean": 17087.5, + "valid_targets_min": 774 + }, + { + "epoch": 1.88951160928743, + "grad_norm": 0.08869747558124076, + "learning_rate": 1.3971372729076503e-06, + "loss": 0.6312, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6538381576538086, + "step": 7080, + "valid_targets_mean": 15415.0, + "valid_targets_min": 709 + }, + { + "epoch": 1.8908460101414466, + "grad_norm": 0.08483051600051576, + "learning_rate": 1.3637759106708501e-06, + "loss": 0.6266, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6220189332962036, + "step": 7085, + "valid_targets_mean": 16511.9, + "valid_targets_min": 549 + }, + { + "epoch": 1.8921804109954632, + "grad_norm": 0.08482293342113899, + "learning_rate": 1.3308140292655645e-06, + "loss": 0.608, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6194273233413696, + "step": 7090, + "valid_targets_mean": 16692.6, + "valid_targets_min": 340 + }, + { + "epoch": 1.8935148118494796, + "grad_norm": 0.08867654734388321, + "learning_rate": 1.2982518075119352e-06, + "loss": 0.6046, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6477352380752563, + "step": 7095, + "valid_targets_mean": 15490.1, + "valid_targets_min": 142 + }, + { + "epoch": 1.8948492127034962, + "grad_norm": 0.08680246823710645, + "learning_rate": 1.2660894220619139e-06, + "loss": 0.625, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6353548765182495, + "step": 7100, + "valid_targets_mean": 16462.5, + "valid_targets_min": 589 + }, + { + "epoch": 1.8961836135575125, + "grad_norm": 0.08252503818191527, + "learning_rate": 1.2343270473983286e-06, + "loss": 0.6265, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6071639060974121, + "step": 7105, + "valid_targets_mean": 16614.5, + "valid_targets_min": 533 + }, + { + "epoch": 1.8975180144115291, + "grad_norm": 0.08293124137152696, + "learning_rate": 1.202964855833935e-06, + "loss": 0.6133, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5994781255722046, + "step": 7110, + "valid_targets_mean": 15927.0, + "valid_targets_min": 566 + }, + { + "epoch": 1.8988524152655457, + "grad_norm": 0.0824839342237248, + "learning_rate": 1.1720030175104506e-06, + "loss": 0.6281, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6254457235336304, + "step": 7115, + "valid_targets_mean": 16195.4, + "valid_targets_min": 474 + }, + { + "epoch": 1.9001868161195623, + "grad_norm": 0.08473796491677214, + "learning_rate": 1.1414417003976634e-06, + "loss": 0.6074, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5947679281234741, + "step": 7120, + "valid_targets_mean": 16226.3, + "valid_targets_min": 697 + }, + { + "epoch": 1.901521216973579, + "grad_norm": 0.07863211744651008, + "learning_rate": 1.1112810702925163e-06, + "loss": 0.6139, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5904717445373535, + "step": 7125, + "valid_targets_mean": 17311.0, + "valid_targets_min": 540 + }, + { + "epoch": 1.9028556178275955, + "grad_norm": 0.08729504718220402, + "learning_rate": 1.0815212908181825e-06, + "loss": 0.6133, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6068782210350037, + "step": 7130, + "valid_targets_mean": 16227.7, + "valid_targets_min": 384 + }, + { + "epoch": 1.904190018681612, + "grad_norm": 0.08799751275061786, + "learning_rate": 1.0521625234232333e-06, + "loss": 0.624, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.639133870601654, + "step": 7135, + "valid_targets_mean": 15186.4, + "valid_targets_min": 299 + }, + { + "epoch": 1.9055244195356285, + "grad_norm": 0.08766233161698946, + "learning_rate": 1.023204927380672e-06, + "loss": 0.6309, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6215628385543823, + "step": 7140, + "valid_targets_mean": 16491.2, + "valid_targets_min": 489 + }, + { + "epoch": 1.906858820389645, + "grad_norm": 0.08136063705733775, + "learning_rate": 9.946486597871672e-07, + "loss": 0.6228, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.603968620300293, + "step": 7145, + "valid_targets_mean": 16284.1, + "valid_targets_min": 333 + }, + { + "epoch": 1.9081932212436616, + "grad_norm": 0.08427514491379798, + "learning_rate": 9.664938755621632e-07, + "loss": 0.6145, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6328669786453247, + "step": 7150, + "valid_targets_mean": 15816.9, + "valid_targets_min": 339 + }, + { + "epoch": 1.909527622097678, + "grad_norm": 0.08537633135837205, + "learning_rate": 9.387407274469793e-07, + "loss": 0.6189, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6234576106071472, + "step": 7155, + "valid_targets_mean": 16524.2, + "valid_targets_min": 177 + }, + { + "epoch": 1.9108620229516946, + "grad_norm": 0.08688371520142285, + "learning_rate": 9.113893660041033e-07, + "loss": 0.6156, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6136159300804138, + "step": 7160, + "valid_targets_mean": 15847.0, + "valid_targets_min": 526 + }, + { + "epoch": 1.9121964238057112, + "grad_norm": 0.08095805144808471, + "learning_rate": 8.844399396162577e-07, + "loss": 0.6096, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5837612152099609, + "step": 7165, + "valid_targets_mean": 16031.0, + "valid_targets_min": 572 + }, + { + "epoch": 1.9135308246597278, + "grad_norm": 0.08923077898805334, + "learning_rate": 8.578925944856596e-07, + "loss": 0.6296, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6362388134002686, + "step": 7170, + "valid_targets_mean": 16244.0, + "valid_targets_min": 879 + }, + { + "epoch": 1.9148652255137444, + "grad_norm": 0.08023949216756944, + "learning_rate": 8.317474746332126e-07, + "loss": 0.6045, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5978532433509827, + "step": 7175, + "valid_targets_mean": 16691.7, + "valid_targets_min": 460 + }, + { + "epoch": 1.916199626367761, + "grad_norm": 0.08614039079696198, + "learning_rate": 8.060047218977323e-07, + "loss": 0.6247, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6216354370117188, + "step": 7180, + "valid_targets_mean": 15503.6, + "valid_targets_min": 295 + }, + { + "epoch": 1.9175340272217776, + "grad_norm": 0.08513143725032378, + "learning_rate": 7.806644759351471e-07, + "loss": 0.6215, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.633056640625, + "step": 7185, + "valid_targets_mean": 16464.3, + "valid_targets_min": 604 + }, + { + "epoch": 1.918868428075794, + "grad_norm": 0.08707050074017611, + "learning_rate": 7.557268742177908e-07, + "loss": 0.6245, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6251076459884644, + "step": 7190, + "valid_targets_mean": 15298.0, + "valid_targets_min": 695 + }, + { + "epoch": 1.9202028289298105, + "grad_norm": 0.08298457877614573, + "learning_rate": 7.311920520336106e-07, + "loss": 0.6185, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.63387531042099, + "step": 7195, + "valid_targets_mean": 15801.4, + "valid_targets_min": 677 + }, + { + "epoch": 1.921537229783827, + "grad_norm": 0.07864046187495834, + "learning_rate": 7.070601424854522e-07, + "loss": 0.6197, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6031808257102966, + "step": 7200, + "valid_targets_mean": 17465.6, + "valid_targets_min": 651 + }, + { + "epoch": 1.9228716306378435, + "grad_norm": 0.08324704107943265, + "learning_rate": 6.833312764903343e-07, + "loss": 0.6259, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6396461725234985, + "step": 7205, + "valid_targets_mean": 16632.7, + "valid_targets_min": 519 + }, + { + "epoch": 1.92420603149186, + "grad_norm": 0.08765309774752181, + "learning_rate": 6.600055827787581e-07, + "loss": 0.6175, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6199076175689697, + "step": 7210, + "valid_targets_mean": 15613.3, + "valid_targets_min": 567 + }, + { + "epoch": 1.9255404323458767, + "grad_norm": 0.08291832400714277, + "learning_rate": 6.370831878939747e-07, + "loss": 0.643, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6336727142333984, + "step": 7215, + "valid_targets_mean": 16355.1, + "valid_targets_min": 540 + }, + { + "epoch": 1.9268748331998933, + "grad_norm": 0.08704375505728458, + "learning_rate": 6.1456421619131e-07, + "loss": 0.6088, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6210100650787354, + "step": 7220, + "valid_targets_mean": 14533.1, + "valid_targets_min": 528 + }, + { + "epoch": 1.9282092340539099, + "grad_norm": 0.08803696864770845, + "learning_rate": 5.924487898375158e-07, + "loss": 0.6182, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6384143829345703, + "step": 7225, + "valid_targets_mean": 15410.6, + "valid_targets_min": 467 + }, + { + "epoch": 1.9295436349079265, + "grad_norm": 0.0834751205891046, + "learning_rate": 5.707370288100782e-07, + "loss": 0.6333, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6324965357780457, + "step": 7230, + "valid_targets_mean": 16607.8, + "valid_targets_min": 425 + }, + { + "epoch": 1.9308780357619428, + "grad_norm": 0.08952295118745271, + "learning_rate": 5.494290508965605e-07, + "loss": 0.6345, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6554481387138367, + "step": 7235, + "valid_targets_mean": 14700.1, + "valid_targets_min": 450 + }, + { + "epoch": 1.9322124366159594, + "grad_norm": 0.07836025153728045, + "learning_rate": 5.285249716940026e-07, + "loss": 0.6132, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5875779986381531, + "step": 7240, + "valid_targets_mean": 17065.6, + "valid_targets_min": 512 + }, + { + "epoch": 1.933546837469976, + "grad_norm": 0.08531868760517099, + "learning_rate": 5.080249046082563e-07, + "loss": 0.6271, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6375229954719543, + "step": 7245, + "valid_targets_mean": 15968.9, + "valid_targets_min": 226 + }, + { + "epoch": 1.9348812383239924, + "grad_norm": 0.08139798817382352, + "learning_rate": 4.879289608533926e-07, + "loss": 0.6356, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6170284748077393, + "step": 7250, + "valid_targets_mean": 16205.3, + "valid_targets_min": 364 + }, + { + "epoch": 1.936215639178009, + "grad_norm": 0.08562110265994628, + "learning_rate": 4.6823724945107e-07, + "loss": 0.6165, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6298227906227112, + "step": 7255, + "valid_targets_mean": 15892.4, + "valid_targets_min": 543 + }, + { + "epoch": 1.9375500400320256, + "grad_norm": 0.08088218838388078, + "learning_rate": 4.489498772299843e-07, + "loss": 0.6257, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6066421866416931, + "step": 7260, + "valid_targets_mean": 16061.2, + "valid_targets_min": 409 + }, + { + "epoch": 1.9388844408860422, + "grad_norm": 0.08634923618970136, + "learning_rate": 4.3006694882526947e-07, + "loss": 0.6217, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6236517429351807, + "step": 7265, + "valid_targets_mean": 16005.8, + "valid_targets_min": 646 + }, + { + "epoch": 1.9402188417400588, + "grad_norm": 0.08670401203490817, + "learning_rate": 4.115885666779062e-07, + "loss": 0.622, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6537075638771057, + "step": 7270, + "valid_targets_mean": 15107.6, + "valid_targets_min": 671 + }, + { + "epoch": 1.9415532425940754, + "grad_norm": 0.07899525341897014, + "learning_rate": 3.9351483103420566e-07, + "loss": 0.6098, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.583057165145874, + "step": 7275, + "valid_targets_mean": 17427.4, + "valid_targets_min": 588 + }, + { + "epoch": 1.942887643448092, + "grad_norm": 0.07866070576361257, + "learning_rate": 3.758458399452519e-07, + "loss": 0.6148, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.587480366230011, + "step": 7280, + "valid_targets_mean": 16900.7, + "valid_targets_min": 189 + }, + { + "epoch": 1.9442220443021083, + "grad_norm": 0.07868622469701628, + "learning_rate": 3.585816892663351e-07, + "loss": 0.616, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5950984954833984, + "step": 7285, + "valid_targets_mean": 16367.6, + "valid_targets_min": 479 + }, + { + "epoch": 1.945556445156125, + "grad_norm": 0.08299176442121954, + "learning_rate": 3.4172247265650267e-07, + "loss": 0.6255, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6286250352859497, + "step": 7290, + "valid_targets_mean": 15500.8, + "valid_targets_min": 327 + }, + { + "epoch": 1.9468908460101413, + "grad_norm": 0.08515529041637454, + "learning_rate": 3.252682815779922e-07, + "loss": 0.6279, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6196545362472534, + "step": 7295, + "valid_targets_mean": 15439.1, + "valid_targets_min": 316 + }, + { + "epoch": 1.9482252468641579, + "grad_norm": 0.08309506619992096, + "learning_rate": 3.0921920529574096e-07, + "loss": 0.6279, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6408487558364868, + "step": 7300, + "valid_targets_mean": 16132.7, + "valid_targets_min": 408 + }, + { + "epoch": 1.9495596477181745, + "grad_norm": 0.08463021920591228, + "learning_rate": 2.9357533087694397e-07, + "loss": 0.6201, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6341683864593506, + "step": 7305, + "valid_targets_mean": 15742.3, + "valid_targets_min": 712 + }, + { + "epoch": 1.950894048572191, + "grad_norm": 0.07687671870926512, + "learning_rate": 2.7833674319052977e-07, + "loss": 0.6179, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6142845153808594, + "step": 7310, + "valid_targets_mean": 16706.5, + "valid_targets_min": 736 + }, + { + "epoch": 1.9522284494262077, + "grad_norm": 0.08331816457428305, + "learning_rate": 2.6350352490672746e-07, + "loss": 0.6222, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6477742791175842, + "step": 7315, + "valid_targets_mean": 15859.2, + "valid_targets_min": 438 + }, + { + "epoch": 1.9535628502802243, + "grad_norm": 0.08418031536600762, + "learning_rate": 2.49075756496625e-07, + "loss": 0.62, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6104916334152222, + "step": 7320, + "valid_targets_mean": 16536.3, + "valid_targets_min": 478 + }, + { + "epoch": 1.9548972511342408, + "grad_norm": 0.08018563522764396, + "learning_rate": 2.3505351623170353e-07, + "loss": 0.6365, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6002669334411621, + "step": 7325, + "valid_targets_mean": 15635.6, + "valid_targets_min": 549 + }, + { + "epoch": 1.9562316519882574, + "grad_norm": 0.08294347847486674, + "learning_rate": 2.2143688018343707e-07, + "loss": 0.6376, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6311354637145996, + "step": 7330, + "valid_targets_mean": 15950.8, + "valid_targets_min": 727 + }, + { + "epoch": 1.9575660528422738, + "grad_norm": 0.08169118747835444, + "learning_rate": 2.0822592222287659e-07, + "loss": 0.6263, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6531394720077515, + "step": 7335, + "valid_targets_mean": 16453.7, + "valid_targets_min": 630 + }, + { + "epoch": 1.9589004536962904, + "grad_norm": 0.08870720045507874, + "learning_rate": 1.9542071402024185e-07, + "loss": 0.608, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6536878347396851, + "step": 7340, + "valid_targets_mean": 14271.3, + "valid_targets_min": 564 + }, + { + "epoch": 1.9602348545503068, + "grad_norm": 0.08391865160704697, + "learning_rate": 1.830213250445467e-07, + "loss": 0.6066, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5975584387779236, + "step": 7345, + "valid_targets_mean": 15199.5, + "valid_targets_min": 524 + }, + { + "epoch": 1.9615692554043234, + "grad_norm": 0.08387455033289205, + "learning_rate": 1.7102782256319115e-07, + "loss": 0.637, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6481696963310242, + "step": 7350, + "valid_targets_mean": 15820.8, + "valid_targets_min": 539 + }, + { + "epoch": 1.96290365625834, + "grad_norm": 0.086376860258013, + "learning_rate": 1.5944027164163652e-07, + "loss": 0.6364, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6533975005149841, + "step": 7355, + "valid_targets_mean": 15217.0, + "valid_targets_min": 606 + }, + { + "epoch": 1.9642380571123566, + "grad_norm": 0.08124994645822725, + "learning_rate": 1.4825873514302257e-07, + "loss": 0.6258, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6236833333969116, + "step": 7360, + "valid_targets_mean": 15678.1, + "valid_targets_min": 608 + }, + { + "epoch": 1.9655724579663731, + "grad_norm": 0.08412854928063453, + "learning_rate": 1.3748327372784252e-07, + "loss": 0.6263, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.638558566570282, + "step": 7365, + "valid_targets_mean": 16400.4, + "valid_targets_min": 551 + }, + { + "epoch": 1.9669068588203897, + "grad_norm": 0.08204700545173244, + "learning_rate": 1.271139458536019e-07, + "loss": 0.6221, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.600684404373169, + "step": 7370, + "valid_targets_mean": 16416.3, + "valid_targets_min": 749 + }, + { + "epoch": 1.9682412596744063, + "grad_norm": 0.0791137749291822, + "learning_rate": 1.1715080777451868e-07, + "loss": 0.6198, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6197346448898315, + "step": 7375, + "valid_targets_mean": 16873.1, + "valid_targets_min": 761 + }, + { + "epoch": 1.9695756605284227, + "grad_norm": 0.0798165165215919, + "learning_rate": 1.0759391354119017e-07, + "loss": 0.6166, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6060048341751099, + "step": 7380, + "valid_targets_mean": 15929.8, + "valid_targets_min": 498 + }, + { + "epoch": 1.9709100613824393, + "grad_norm": 0.07952241282859478, + "learning_rate": 9.844331500034331e-08, + "loss": 0.6259, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6397472023963928, + "step": 7385, + "valid_targets_mean": 16361.3, + "valid_targets_min": 621 + }, + { + "epoch": 1.9722444622364559, + "grad_norm": 0.08577264214557807, + "learning_rate": 8.969906179449316e-08, + "loss": 0.639, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6487519145011902, + "step": 7390, + "valid_targets_mean": 15036.0, + "valid_targets_min": 580 + }, + { + "epoch": 1.9735788630904723, + "grad_norm": 0.08287326698149942, + "learning_rate": 8.136120136174318e-08, + "loss": 0.6347, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6241464018821716, + "step": 7395, + "valid_targets_mean": 16079.6, + "valid_targets_min": 457 + }, + { + "epoch": 1.9749132639444889, + "grad_norm": 0.08095087491935442, + "learning_rate": 7.342977893546875e-08, + "loss": 0.6383, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.635275661945343, + "step": 7400, + "valid_targets_mean": 16328.8, + "valid_targets_min": 845 + }, + { + "epoch": 1.9762476647985054, + "grad_norm": 0.07702461316924054, + "learning_rate": 6.590483754409237e-08, + "loss": 0.6017, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5917639136314392, + "step": 7405, + "valid_targets_mean": 16817.6, + "valid_targets_min": 205 + }, + { + "epoch": 1.977582065652522, + "grad_norm": 0.08353983089533804, + "learning_rate": 5.878641801087547e-08, + "loss": 0.6188, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6240130662918091, + "step": 7410, + "valid_targets_mean": 15362.0, + "valid_targets_min": 616 + }, + { + "epoch": 1.9789164665065386, + "grad_norm": 0.08288481791229246, + "learning_rate": 5.207455895365198e-08, + "loss": 0.6206, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.618938148021698, + "step": 7415, + "valid_targets_mean": 15739.4, + "valid_targets_min": 475 + }, + { + "epoch": 1.9802508673605552, + "grad_norm": 0.08294923182205442, + "learning_rate": 4.5769296784653463e-08, + "loss": 0.626, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6074753403663635, + "step": 7420, + "valid_targets_mean": 15770.5, + "valid_targets_min": 543 + }, + { + "epoch": 1.9815852682145718, + "grad_norm": 0.08301269507597478, + "learning_rate": 3.9870665710300954e-08, + "loss": 0.6286, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6352344751358032, + "step": 7425, + "valid_targets_mean": 15678.1, + "valid_targets_min": 334 + }, + { + "epoch": 1.9829196690685882, + "grad_norm": 0.0873006698492684, + "learning_rate": 3.437869773101343e-08, + "loss": 0.6227, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6336438059806824, + "step": 7430, + "valid_targets_mean": 14569.5, + "valid_targets_min": 360 + }, + { + "epoch": 1.9842540699226048, + "grad_norm": 0.08296937636453226, + "learning_rate": 2.929342264103296e-08, + "loss": 0.6079, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6380923986434937, + "step": 7435, + "valid_targets_mean": 17373.0, + "valid_targets_min": 195 + }, + { + "epoch": 1.9855884707766212, + "grad_norm": 0.08313305694130789, + "learning_rate": 2.4614868028274837e-08, + "loss": 0.6155, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5898568630218506, + "step": 7440, + "valid_targets_mean": 15781.7, + "valid_targets_min": 661 + }, + { + "epoch": 1.9869228716306377, + "grad_norm": 0.07841450895238265, + "learning_rate": 2.034305927416935e-08, + "loss": 0.6142, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.607092022895813, + "step": 7445, + "valid_targets_mean": 17081.3, + "valid_targets_min": 604 + }, + { + "epoch": 1.9882572724846543, + "grad_norm": 0.08059226081528832, + "learning_rate": 1.647801955354522e-08, + "loss": 0.6058, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.593668520450592, + "step": 7450, + "valid_targets_mean": 15864.9, + "valid_targets_min": 689 + }, + { + "epoch": 1.989591673338671, + "grad_norm": 0.07953280935790458, + "learning_rate": 1.301976983445474e-08, + "loss": 0.6146, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5993211269378662, + "step": 7455, + "valid_targets_mean": 16358.1, + "valid_targets_min": 449 + }, + { + "epoch": 1.9909260741926875, + "grad_norm": 0.08334060728670939, + "learning_rate": 9.968328878115495e-09, + "loss": 0.6428, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6364392042160034, + "step": 7460, + "valid_targets_mean": 15288.5, + "valid_targets_min": 239 + }, + { + "epoch": 1.9922604750467041, + "grad_norm": 0.08366994870475707, + "learning_rate": 7.3237132387604646e-09, + "loss": 0.6364, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.643349289894104, + "step": 7465, + "valid_targets_mean": 15160.0, + "valid_targets_min": 425 + }, + { + "epoch": 1.9935948759007207, + "grad_norm": 0.08287524752697885, + "learning_rate": 5.0859372635964065e-09, + "loss": 0.6105, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.612499475479126, + "step": 7470, + "valid_targets_mean": 15704.7, + "valid_targets_min": 330 + }, + { + "epoch": 1.994929276754737, + "grad_norm": 0.08134192923159073, + "learning_rate": 3.2550130926789487e-09, + "loss": 0.6222, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6421562433242798, + "step": 7475, + "valid_targets_mean": 16023.1, + "valid_targets_min": 287 + }, + { + "epoch": 1.9962636776087537, + "grad_norm": 0.08336881992144246, + "learning_rate": 1.8309506588959356e-09, + "loss": 0.6224, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.638372004032135, + "step": 7480, + "valid_targets_mean": 16144.6, + "valid_targets_min": 570 + }, + { + "epoch": 1.9975980784627703, + "grad_norm": 0.08151270047704698, + "learning_rate": 8.137576878508578e-10, + "loss": 0.6412, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6109259128570557, + "step": 7485, + "valid_targets_mean": 15843.8, + "valid_targets_min": 352 + }, + { + "epoch": 1.9989324793167866, + "grad_norm": 0.08234255749905797, + "learning_rate": 2.0343969787950387e-10, + "loss": 0.6171, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6063399314880371, + "step": 7490, + "valid_targets_mean": 16544.9, + "valid_targets_min": 819 + }, + { + "epoch": 2.0, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6287916302680969, + "step": 7494, + "total_flos": 2.788441056922829e+16, + "train_loss": 0.21610206831669151, + "train_runtime": 19384.2842, + "train_samples_per_second": 98.968, + "train_steps_per_second": 0.387, + "valid_targets_mean": 15631.9, + "valid_targets_min": 505 + } + ], + "logging_steps": 5, + "max_steps": 7494, + "num_input_tokens_seen": 0, + "num_train_epochs": 2, + "save_steps": 100, + "stateful_callbacks": { + "TrainerControl": { + "args": { + "should_epoch_stop": false, + "should_evaluate": false, + "should_log": false, + "should_save": true, + "should_training_stop": true + }, + "attributes": {} + } + }, + "total_flos": 2.788441056922829e+16, + "train_batch_size": 1, + "trial_name": null, + "trial_params": null +} diff --git a/training_args.bin b/training_args.bin new file mode 100644 index 0000000..a244707 --- /dev/null +++ b/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b2216a87350887705977d7daa8a0465f17ebfbebb7ec085430ffbe5411caade8 +size 8849 diff --git a/training_loss.png b/training_loss.png new file mode 100644 index 0000000000000000000000000000000000000000..d9f66266be65f7c737723fce54bf4b196c35c0e7 GIT binary patch literal 48904 zcmeFZbySsY+c$X8NQ;P@MpQsWVABnvq9OpbDHGj^t9@nj#&ED5_#&P`Wyn;0^o~5N?rNS_b_WZfimobc( zfMG-fl;rS=cuUU+{71&=jJDGiJ2NL&qdTUUx{;H;wVji-r7^dQ=^aN)J6lmfys)68 z0Jnvclf9#ikdV!P-XUmr$6QD)>(EvBls)$6Za88Xy%G9Dl&tvH62nTJ&YwPc)$Q3- zud7#N+cw2qQ)F+6>xBcR5j;uO4DZQqz5k?n@@nCbQjPZ+B8r*unJ=WVq3cCvMO!>8o^?|RXT@wxQ{{f=K(>_hS7%9IE1 zGki0p>?$U@&j9}zX@7}5M1Oe|^5Xyh%m3aWWF5t5sHv+?(aV2VQP0xz@Q{%TuX=hy zx2yOlN9>G3=}MpHbT3m%D3>DVa9xDm6UQ{2JSz6O7s<)V*S?yk1#)^&e*OBj;CC#x z_4VOb^Uc-yv5pJ_Pf5Rrbal3(geXBh;yMQ@?{z0n$(r<$krBhT_ty&T2bJNUg1wGS z^3fuus-BWbSKg77MY?Y*Xqt8VTVKA2LWuOTREE^KqL@E6~){wQ7^Djo_jW9}X?$ zRgb;ZHvi$n2e-AKQ4Sl^1ywaQWbAc6ey@*hW4AYtMAp+Rw{8t4?);pXcrZ3*;k7wm zrt$-`}5nL$Az-L#T9>=VemT;Ly-L0s-rB z?$BG^m@P~5v2Fh*pWr;%&LW?0`i0q^-F%^_E}Ww(^+wLX=qSazs}C|Wg*PV+c9hM` z-n5j4&E_N}9V&9346tl{GnkT5dQbU`;H5|6eqxw8?RH6!(rdzqL>W7KNQ?%F?Ur3fyYj3y zt@O0C%>3J$$#h0olK9V+xPwb56Z|CmBg7`pO~1)wCh($)ho^~i8C%xK6UES zl`AA!+SZF%ZEbDZB_85fE(;G-vYjov$PQ`GWdT?$co_G>!omR<1)0fSY6hZGbzv$C=pJ>s8ku9WT6e0zOi zaBQq|q?F71_uhD)b<5MIPY=9%8?UUSgr(~h2kdOk`gWFj%Pvp-@OyOVEGx&`;wCD8 z;vYYLbQZe`ar&$pS$Adv(!6z-v0`uYT=SPCxhvq_3 z^1$fV=T)+^AFFo0>Ri5lJ+OGDh`KI) z+-kL>fmtMmM%HDjoG-zPIQX>jTqi6S`WQ8{g$VwwjTe{SJ^bgNd+Ko#2jTv%XXyX* zwS$Gn*AOF0(bCf525WF|aPV$!t{A(57cNfHu6A>6G0u7zF2wKiXH^p&Jm!CTUz7%2K$qy>XB+_+fN(kmB|#$=OjNpI$QrRs?~P?~_i%^d+N@IV4T)mf z{rmT)78XY1YdbX*x2myB5(+wP?~i$kJHPr4iLuhM$vE*-!+QQOEu*-zDN0gay0h)+ z)7|g8(|GLoaoXkM$Br2*C@5HePrgLnt?NNglnFJFoRFql@O2<7qjdcNks;jnU;&4` z$KySu#1b$xyis3hmo+Y4H1qNC5#Z(~JbCQ8wuW(jX=<`taI3|6!j6j87BG8z@p<-b-&$Ops5xDnu+hE76)r4J+L3o3CFxX@ zfe+pd-7*bUJR0vAIurF_V;*X)C^iL?I9jkY-Ws?x-5qt5i7II;t%PrUd|WN5MYtB{ zc<0V-5l;LOLBVji)O?dVy2ywGX~zJY-l8^(VwEH#_@DLK!cXh=)Em~&y;L?ve*VOV z4|l@CR_C;9Tx7z^J!eY-VGmV)`9e)cM~9Ph6ZY9&Gfy&X`Hn09{{3o0ygXZce7wDr zQ}x_nRalV?9j6>+`0(6tgyPV2LBEQwUxNtJPm?mHT zck?NGM@PTnVp(Rvn-&r$Jhs-IdtCdy=jP|{!Ulw{7ku5oyX`VN4OZwj&%^04b`W;@ zoaOI8E+1S?O^wP1r<@zZsQ{Y0YP_dz-8!tWF(sbEBOB~>?H4b6BY3C?Dxt#uzVB}7P!!l4931ABmjmDm zDyypI=c?%AdRAbd&%!snx_mT%j^lx-`B$+?&heR=wv_95-)%4G35LJNS|ob+Z7svM z8g^zHN!=L<`Z4+eO7rjWRtgyCO$jSsW+z31nVA{5>8h7!LNxXCY;qIwrWKqgnBJ(x z5YyAsLl-wHClIX;_|Z4yb6|ou3o$M(E(AcXUAuRL{8NcjWrzAH~Ph!N*|b6KyGL2_@H3w1}{U zg@sJGYf=h|Q^%h0aC2j#W(`Un9z_*PLV88_Q&R=DT|J?17kaIU==-dhR##W!rj9dF z&Hpe@sOar|KKt1?w4%G4?Msx<=t`@Fn7ylOpeDbVn+9qT+>F7io_j2OIcG{%^xZr> zlzAhKK0Q3RTDG&H=r=i0v=z=F8}Rc>6uQET7cWMOTRlB_{q<=ce9X@naVuub=0JGf z)niXi%BKAs8X^YN6Bl6>iVt}3fJ(U5S|)s0YISYx-RIP^>Qd+lSd8-z9| z@tIjgMP&$9!WmmzL0CaKycyIO)M-Ud@86f6$v9JOEKlc5;Jl9>JxWPOr($7|++tE% zTB^>O(PA-ILBVARn+GRhje`rWUs3Q5r01%IQ4ghMlj!Wx$0(_&Dq-h_6`2&+bO%7+ z?Ed~bb@F`k4vX6P^A*i6PK9NM5S&*?o0p$zM^;FVLRUpS>Z!nud&RS*-6IOHx+}I; z`t5SJ;A75dXw>z5a71ksdO~ONafK5nXhZR#tm2=?+`@-bJ>rQmw049onz=vD*RpBn zn9%~_F>8wN9a)Xr-1G`%muB=_nW=&884fs;EiW%GTESb!WxC5WcgJ^ok!z|ej~Xo+ zefOXHpUJs@8;R_P%K=#Y+_i6y(#9__lUf=tKv-@AcPZxDb?p%5(k`@r(UNsQNdL5& z8qN0lq>zCAM;w>e9Ff`AXTkkG8)@}%S%6|*y?JBY^770sj)EK5gpCCN_(28RFtjMV z<+sC32M(AlO|-dYmJKw_RBnz$flw$EYSdGU`N|AF7e)jRY7>ytCd>HZVII0j29el1f-5Y)f_Wn^>lK6Q|$2Z~mqLDr(88 zsnvjc9QwUijJ`ZQp`ypvp6}UT>W!0i5lGiBdGI#Dhjp?&tqRIhICP`l-yx&}00p9j zjflx(eQ1)V^~Z z`LvgYRV=71>U#Rk3g`q5(_P{pHy6HW7ua$b#?7+|zY=(>JSj$bz(|Mq$n z?sX2XK*C+f*@Ug6q$IBA0A|}$NW{m-2Qaa`zn=@imWtV)G={x^I#)a;V(qB0xU_bOWad!jX zoh?_j1O<*9^QKzp6KQl8ucztw!`9dy?Rh*gar^M$!-fsfcuIPD$q!A>q#e1RsGis^ zm0X5h1tXXqHa=6Zef`WCvK==I3;yiv?70pD-y7cY-q2ajT)ap}PJ=`14IpjsPSR5O zT@sazl(yS)OW&`!{cbtiQs%p3rne9K)szqc8zXF|>g?;wgD~^Avpuz3=@%9k5eS!q zA~d(KPzjiF%^NWPqlXU-9X5@1TT2S$=gLVWxQcDMB~GiT7>_l-h?cNnW#{0ShZ4ay zl|;Sj3#gHo#3cu3l3G;M#eE`q@@WjfiHhasW=%h_G1xs-SmvR#;d9-9c5b-2Nl{Z% zo7~Qe1-NvVgaU`P!>;jrJVn9fRgPs|h!SMEISMsSY;0)bXOsaBTb?PNUFg1gY(JZ* zS?DF#F{nu~Kyki&`Xns%R`7|{`QeRnoCz#nd6IHEE`xVv(bn498l%a7%dTuIzd{-sPW5S?M-|He;s9O7*_93!0G9bRJKKcFfKObSUU{+0 zw8%uIg<40+@Xw#7%{KE;x<#-l*wVuVH#{Sp^f;l|i*|N&dA_`QEG8pEC?q^wVl`%M zbFqm9OA;IasFE}zWaY!`H0`xI7)ZN}8qMOuLiUH=V^1FV2L|TA0BPyy++HqP?_~j2 zXquj$K9ycPV+iuTZvoGHn?E?aH3+rUF`)Fi8ebSFS ztHO_Bu|IB-Sn$M&JP*o~!!I}h%r`VPHV)yTewkyPJ6rub_*&e?tnbd3`^pDXl9LTX z@ymmOT-k6564sr<%fQp%4Oddy8lcn4!)n-c2L$zLeP!0pK0+KYtn{73ArBr56^s{c z8Jn2U>gNDadb-D7Sqm6wRtZq02B3#yOOij~Q_WJe(u{$G81{QD(#AotCn<+XEai=` zNtM1-V1IopZRt?2QXc_SF#&ENnK1B&^R}5ew%#v!dD-dFUdi~3*O$T6Gmb}EZ{QwpVQbxY8ow1J(S zeKmawHc0H&!WSWx-qv4JJs%={cOu~O47`{2Z%m|QXkWd`6nXCO6u=^U=MHo>Gh18R z)Wk#r-pupB#~Gif$B%`BPgj<1E$i0eOp0A+&DiU*e*bogT=~+o1^wCByeVG1u=ap~ zR|SUNXj``B0=JZr1=~b>OSDDXv4~*a7+ZtkN({b#|DIV{sl1&szi}UkioU-7RNHlf zp9PHxiV3vrQq5zm)XV~gSae_@MI0=o2kampztqC_984rc;{(**0xDBJ#Qhn7KIU7cY+lojDe=WdDd zj?{7aimeJC=jYFyh-zgmI&glaw!o;0yf%87q_3jlE?i9iSTyJrnYurBb-e#Tv}F^t>n?g1clxKzrJ=%({&cAcl~44*Y(~`P4n}0T#}vo zmoHahne+;)>Z{ z8anl1G~NW}_ZI9tfIGsNHH>&DzV<;#2uq#ARHJ0Sn8%ir$+B(V$9kOAYO|f(jONP8 zAFCvn`Tx4a1J>-~u3qSx3ChIVCU%gJ84-+$meME!l7Q37%Q(tk+xmC}Y56EZt z53sN0>U|o*zzE~rf3c)AWoYt)NU_lgMXh~_qwg@SN4oZSfPe6atxK)fR~XSKtO^Zku-r{`%L;iSM=>0Sgo!;yRkR{}&TwW>kG4Ls{?WI{>oSVZEr`NwrJN}{pZGpCS$Mn`MZf@>! z3$=4i@$$5#8tUp~SjaHNW7Q+7s;V^kYpbhD{7f%jy&_Gyo>5D$xJkHokJ!)KNly(> zV)DCpCqZrv``YWKd-*aW&Lrr;1Cbw3Yen&XetuyyA7Gyg>VLFYUK<1HgC+DJBb7gp z*NQ@iVf!Ze6+?t(ceYmWKAUb0&!qP)jy45eJti&{D4r1^zH-iB*p|_1_PmM;Ifk3& zV-5ku#mK2=rnlGuIMhO~eEX)rSkCVrJw3fNTUS-p2W=f`X=ycjuD$-yV}?-?=)Trg z;^~@{5W*?%fi;IWF0QN;thr|4LCTDnZ=Ii;6LyZzL$}aaZ)lq{H7qftxGp<1Sg%1h)qq1dHOVf zg3}E{K<_M<_pRS<=g;qfN#7{}VvmZ|G8-UoRO~-)%oMv#Wz~gpx;i)zHP4A!UNkj5 zQkEg^G}{{%v6sqUtI=(yC5ZxckmR=8ARO;U+F_sfik`rYY*G;Eg2KYYH;RDy!zB29 zPw?+a)0GV6lxGEzaI|3DEK33KA9J_K^j5s0uL7sn+{s&JWzX4c0>4lXYF z?-Z=m)x%mw<7ebGR&=yr5z4K2!n*Vo@&W7=`nlY?w`f0H;X~Eeo9w}$q)W-j7(0v`a1u6MyYvY}lNvzJiCQUPp9S23!t*>*a)Nb$ptDI` zcnv6;NcIn^G4=v=U900u*3%D?0&gT;tYMQ;Qd6HwQ1I4S>XJb+DWH7YOrUDCpn?>F zz-|wX1Com5oBN+V>OSDUYP^X$fKapHxk&N_U)VDP>gweMXqJ*+!vuT!`Z$Px9Pl&Okh=; zOC1I{F$)H4dUiSaQW8xc&BpI>Kfrn1qN1(*1K(P>X#o z<%x)hynb+btG;Fgf+-1=D5%79C3fo&FX%b&Go-_BZ*SQ7gueTVI4lU;^Zi0M3!A4# zJ|GGPlHVrjVQ;V@0?!@JUOoFk`Gu0P@yknW0v|y3@!fvPK;=KyU#5t5;NC+j1IyiZ zb@?{k3~X#x%g!xNF3vA5ipnGa*#4TJNUyX}w*k6KIKUZhKEA;IxB2%(IzCL7cfDb?q z4U7S<{AVOBVL7iu-8!dsdAb{U7k)NHD}nkY9z@Nh`Rn_{LCat5cK{L1Pmut9YYrOq zi~RidTiJsEcZaQnBz^%q9&deXvi^GC?lSNj=dao$%9>4CKRAo zLO-*5xOW}EWvti2ix)4>si}!|`G7jP?Vvl|SJIvQFvC{K{MxlA6%;nZR+9?cPGxFu zXaN6Nym^w|eokVPc8h~6EnG?lk7ZMseVpl3?(t7zsFHTFj9+~@T~sDCpj>+m^fC1c=;|>~)*LVp!>y)&d8Tt249&;q z!SB@0G$dkVWJKz+G3)}fh^YEos{mB+MwO&$v0{4wnks{&vR2oTrfdH2L*7+$2Y4Hr z>^}EV4!;#?%>K@uN~ExqZLd?au(0s@X83H*pXFzwirY@yfb~sOKE=h?_<~x=S$wLY zL=f&KP+LF+3T=xt*mJ81RZ~;e7GkV`M`=LB5$%$clVb;;K@51C;nJ3iy?r@oHd)S- zT59ofKPG~&gx!!0DV>-9k#7@sQtSKG*?*2eZ8tNw)p#zme`l@97ci$^L8xKv4FQOjs+~m)`m5+_s-!7sr&3O140jwI_i}L9d{^0CbOhDD0eGchxrL4n zBG_WMrrPMW^W3`~2ejg>pdiY~NG0Sa`7MfbM!ZU~$^k9fZ_Bpk@I&aP;ArUN0Rn@O zv=y7NocR7uOP%;Uco@nr9`5pob=I%|uu|sxv835fOS37^Ny~RR9gajH#0HN=zOf4DD!HtwPcJ-feG{Mx{I==O?JqJl9a`@QK zJJKod-r+mnXr;tJjV%U|3()*?8E3F#fV1E`HQrs#1~4rG%286VDhL|8H?byKiy$`0 z8c<;*K!ftx0PpZd1gAU>^RfT%6}Ef~5YR96^>~l;^=GK1I@!-w(xOCfWt_A|RFa7pW8WbEPt|FZF zy{+vaKR>1K_8Q-}Z{I?f_401--`-r*0Ogzt#0`I)v|5<0P$=;%HxG%3Fe09TByji! zlV1%n_6`mwVV}Xc`2!2bnVyb?dbtM(lyz6`9zj7ts4B{8YN0>=AvN&b5?5Fo+1C&& zPW|Z7BP9BQLOuwqc<~?0{GLM>rVD<>18PFj@@hxfw*Q`eyoO(&Nuz2GUYF_b>s|5k zo}u67looxNb-vl&RU$xnVFHkF3ibx_^Z|9&r$%)xijvHNVy1 z3Odb$On|kuwP;yaLCnUi|9dlCmNp3PE{4#2aPl6x6{_5*M}2)R8|b^U(XZm1s}hQ< zxL#tAeQQsdH#n7>ngqN_Esj0MVORy>V1!@5Qv`xj5%o`@`y%i5+9+4t%vpfhz%Mj) zbRHbgcdJOY)&h$SeUvYl4t9Ps&45CUAXN}8X~$XQIvXAv%Ze@y#Yz4-a>2garr<_f zctM{BH6g!&HnEWxJXt1;Ci^{f)$-lp$UJrG6dugu-?RN(V8x@b2O@Z2o}mPaNKyL- z$I(nE*03x<_Jz;IN#A)@(RuL-YJqHQAwVJ%LD*%WBt_X4RMsI7FbFmJ*Gg}u5eb^; zP#m5ZsM4mmGc+~RJ7iRLc6L+U1@u5dRIIH9!a3z{3#Yg0AVnTnAx#n9xi*|51c~%u zoz;N?HrITLe!grN{QUrxqzagPH8TZRr{>_`oqBh5;rLy4Sr-~Gv8!Pn+{!IeeJ$cK z6E?fsYk}GfftFVbpMqH!yhX7SAnR_wV$5T`O0C*cPXZ9(Rf{e+Us2ecI|WAE5X2lL zvFVcM(vELhvWj#FZ#Z*m0YuPxI0>|raj}MxLkI56wcIDh8dj0*iY!5ph~KEk1)vPh z&pT87Wn4hf*$i}EA4UJ&iPwZUM92Z5g)%F^cB8X-M<8LaYso;dg%-#HTIAf^+`x5W zX%Gwh9iK!-`oX4AH9XtiCa1{n~4phn^*d@qCgUclZ@8hck=^yC#>h{L$JV1{D zK3rO+sJ4dX))!Thxc*Vo~6~0kmwjKA`pc zd8amFKp{#tLlcp_^TUr`;nPh$y%_K{Ji)*F0p?R!HcP1G+nT0W@esQ!z+b|)i^P7y z1#LQjl4uPn5&=HGx{-!D@SP;US>t_lP8$~L1`K9hyyuKGZ)APw*J99jB%lQS8X2hu z!$UhmzoZkmm65PjeHUC_*9~Rw_1}Y{;ZMy-6J%Y(8{;G+0APike|`Da&Eo24=dzF!^_a+;=g;NAI)__a?f96S93($qy$_8w#5IDEt`{AR^ShA?rX)Vr zG(7_ZMKF^bQ^8W){6M7rj6()`J$X5|mB->Qb#j9L{rk~!yho1spU}=EtZi(FW@$Iv zyLYb>c=`{R)rMIU8}jDMmQ0w+>=TQ}A1h+u=A7k)+u!OQ8z*al9(sX&x<64lJ`(z^{BX2-vXcD?m`Qq}jnQ>M$ny3?~Up`OayOrN(PgQBh$HplJ#km)K|0?mP6r+iT<9hW4~) z7%2Yw^{ckvCuG=+!8B%0C@zJ&%I@scMr-5d&6}M-a5^D$6DyZ~B!|$Ll}{523@J{^ z;pL^;S*SDSQ1(orc{G5Q3(6guyk(#wtXtM`Cga=P*^JlK)oHt-{;=VVNgbV?O?e&# z!RY3^yYe<0(EfbReSp7pSSBpjoY5|b2$JMJxpM5-u} zo=xA!AMaNf!trbu$_n;AQ6&Q(9TI2E5sKSxo|12GAQ$)e_4H0L-tgQ8pi&`AlO2a7 zB@516>z=-*t&Lk>nluO9#WOM?Ap)AyChS=)^XDi<06l>F@L^IYyW-M*5KcX}nD@~j z8R9XI2Ovi9GwM>dYgiODsBo1~_EO)QY3OLc=Yc}Jb&+M$nHl^Cx2>g)umBhBZ)Lu| zh-{pL_X5DCRaJ$ktEF^tJ?0_?M0Yc`5WxH@xC)3@Zg0Bhp8Kj+$J8qN zD9Z6le(dn>UyT3r7YiD0xCFrnJUL8Po=$I{`oT01F_jN9I*;Rh)OQ2G=c3+RJ@zOr zE(8RLWm_uCGti|dDJco3c`Rq&bRMC?;4YkQK*ib%=)oqqu4m7e41p|nccH_y~fW06KXd`0=`U7fKT_qf^oLg{ze(DC$VE+3R zjUP@8fG-X*hjb^Oc~zqMXJGDx;z58z*%t5<-%g}aCdwG4VPyjy+s42MtP}JL#Z;hVV@QDh~E=I0S*+UrD zpFuh3Iix+c^Q~FH3O^WGk20U&1CwJA&pm0+9*DvPfYbv($7o498&;%$?bv?E43h&I zbaQtfd>y4<3Hk=g;P@oe>Xkz=Ls}aO6M}i22<>qdG%VUKWb(a$odL-y$TX4adrpf3 zNX`2>%`Gv(Ks10P4zIO4D36K4htQ+<9ykyPpgD3Q1DIig_cDvZ`q&|)MIy|N2sNn7 zY*QTtb_OHAek~ZlN0;o^czZr7=ZgbR9H2Z8E~2?3Qit#!u*bFI`iM5h24efq@|4fx;2s*spDYJqdKkt}!z6&4Ku~TJb~}kONck4B)>qb#4Z32?=Jti_e7JLm}II zY<&!@oyUV0R8^G?4Y_%EcLf3MRo%d(ANr+CkbK933^!>;+E%QtOiLYBz7PL-&e+`Q?Ev12Sai2gkP+ zJpHhtP|zI3@p^i0A}0WeJ>b_s_S<;jBP467&YaTJx^$_9s;N0TD$=D_`NL(}*QzAJ zpJs-gpcF8jRwkNZW9+f*u(g4_SDMd7OeN=@bhw{N(sZqY!w@M_yU^zXAVk?Xgwdhr z=AG9)x9Ifw(-1&5C4hY%OA}n zp|^~+zKysxigJm-pA;QPF^JYcB{ILF%PQ-$DW!bs)I2m}W0(Q(f|MaU7V`DHPC_pQ z0VGSPqo10ZBs=3166{sg)@na?wegH@M zdQQ{Xt^l}bxOpgMDnJy<)SSI2;)f(zw=QJE#7n~<2ujRpck68tT5^FuN+tk5b@ z%YklYKhq-(BTv$-bt(aJDKM3ffRBLqF$5L6&|~Qs60L5dbPxDLn)>>E?<)*djrRAg zP9LM|<*%+vs+?aJoBXy0-Prnyu5JiKv+oB67VwXa3jjRuSeXd}Cy5?tm>J-vGXf>~ zHcM;0k2<#wGhoq>>jgV<9xx2@3P2Zuu+k`B02o26p|dIA>w#bPFgBJ7HY%!mr~-0r z5|sl_z}xl7K{O79C1K6f)<^QC(QSAALm1{xNm#vf>4Lu~bn@IVkg_)+z=4yrWd}7F zIR_BdHrn1?o9-3+Rx5KFqr_0qBi?J_d}IWNoLlq22IOr9K_y~tT7fN>tJSK*L7~LE zml!*CdlzYZlOQD~%D4V;4`hALQ2g)74*HFi*|Xr3bQfE`3UiLeGLP@IXTN1^gK6JL zxjovB&`K(b)SEFzrdQ4I-E}&{P9gQ3g7BS84MBi*6{19rA*neQrCs#F@U4p<%RNON zsdPJ;IvRfYU|I;VlI-Du!hrMKdCtuiQ>B;bVXrF7Fi>IB54Ukjwb+M$vIz(bS;{kE zT?fNk1u6Ja4H%-$hyijOd?kJfvj`+*r?{BGM59iM4oF=>A>(LiN3)a!R}jd^spS~D zHQ`N87wlV4qp##R^XJ$Pw04=*RbSiO_coVy^@Z;h(=Yq1+=& z1aJ=u+X1MD-Cg>{84jb&EiR%cGqUoNuO34N7fRs+)-GM2IPSNoSL6g*kJ>;}0i*)J zEuN3C5@SUHMM#wbm^cIS4rCP8>Z+=$h%i5LTEHkETz{-s>-U_MCnY5kHGf94TrQk~*N42s&d&lo^3`AwLz>o(DIb3E)g*kxDC;a9F+cNkU2c@KNDA5W% z0hzf2AebUa?c#G8e{dy-4R+QKAl`{m#DYrKjSj{EYJD+d`Y zWYIMKww#B?7Svpd@> zWouU8s?mT6Rs*gLO0CY#**{bC<%BY#GJXF1`Ma9Q>eeV^ij*oCl!q}f!C(MDap4gb zeyAu20Hi8_wh9iV2t!)^aa5EEgc>%7foGoa@{;@f`LkMIQf)>W*l3$G=aQ*A>E`vy zc_xT~e;8X2l;4d8nHPD0KXS}XAZEvZ;>1s`S(qj$Pz0#E@S`SQAttIp*bsnFv2sW} zp-8U6DhUCS*C(N`;PHFGOaOvZfeh6y{O#}j04~$&m!YCZ(Qjig(S)+)*B7E-hyYd7 z1H@l6KyHqzDph|e5*-}Farl?@lZ=b#^2R-|)ixyyX5oYPdl>1A52lyy?Xd00f2zq} z4RSy7mr*H1VTC#9)#z{zhQX<+OvO3}-U3Up*r$>`R8Q0Ou3aO0p&10^oRu^fgI45q zp{rv*Dj^n(Xy?Q6xzw2e8@oT5*Im)scgq=~fW{r^dW|yIp%7-l5jQ9R3e<2u15Zgx z{Cn!hK3G#grmA7f2;25ZZ5M)6ZUn#$E00*al48SlN*W|2U@=TgOekn-*8P^+*7;(* zoMo$X(7_4f{8L3ViMge8hEMK^pi0MzBIuyyRRDJlYiLk|{M$Y_gEt0}Mb1}OfR3ji zTo31IP*5L1)3@;+R1nwVh82Wi=H<){% z^}^w$f{8A9kKg5Br$s>W*AQq25~aZ~MM-0yhJMiH5%@sTB`mpBKv}eA-21xGconW& zmNULs{`u}wep9Fz)XC-gwzmDKaDeOH4D*THEQH@7w;boJ0Lso(Z}EX6M~)y2jt&W+ zEC+OQd|4BGOC}H>IY1Do&O%9?_uX0X4SMkH;$^1b)2pELqcaEx;rt!QlbP%5CoKBSu|F)^(ft zk!o5+gl~U!*ruwrbbPo1QF`ZM?s%>gw5wk^VpkqJS&LD3ihPEy(2G;b5+v!oDE z2g5gMbmLAY*pVd@Eai#VAJrf&5E|I46w(Yf5^Z%8M6nsZJ%A=>Qbfb8PKQ{cL^F2c<;fRbYI@XJ*O{u^Ax_M?mjWyz4bi@ztch! zP17hieFG?gY{C6piC(KNHx`+fZTR-$@t0EJe%ky5<<~D_%Hd1NAz2C`!%Lc)n368T z4avO`PHLg}tJkk5B_?8U1Vv?%dfy4?Y|qpLQt7dyB%nLkRDkG;t#UtfqJuYVT3rZ* zFMmrO=rLfea`cul(Pyh&*&%m-_%H(l16n?au(~>)JI)YN^LWjQn2g|}s;#)HQE-gX z6mI>M4R}RVtmmRmMk-CQm$9>l5g{Gp-0>G!^TqKu8Il4NXIT*Gzn@D7SMoUBWA6!y zv+&Pdobddc*k|lA$Df}wqo2R=`6-D<9}Ktm8Aj`h7kQ?S{J?}vEGhbshwUv!#O42+ zGJsdeSND|hr^0`_`u*H|y1ke!Y!al&gRSWRKoRVG2ISSI6lDm(WP*GNnVTUb6n@x2M-Y%@0tX+cfchb7i_jiy4Xb5oJ8?aX zzugqGJn{#5Fc#BePgIYf2oT^5pEx)a42%-ub4Cj|e`O*#N0`}IQ9%Se!Up|vSUR=# zIX#$sKu3BmTp08I{U_73s+yXb42z*kgYKoqxer7HB;Ua?0#JTX3KK% z*)LyK4x~)u%&?UIdJS>I|4RaPPpLWk?SG|NY2S@awr%M!ezclkKFn8$5(^3>VI@Ma zoi=}TbhN6!zkdV|$Lm%>V&IPY0=m&%NHKz%!vfw=qXHlHapCiEs70e?5Utl)oob-I zlR=MJBDsq}StsWI1!2h@dv^I96VzgI1DpCwJg=0ScL&D#<+3e7{Hc&ZH~>CG;{Ngo z?8D9QGa<}G*#Ar-0Osp^&7VnWvK0CkvZkFPCBTu4lOUMsLwkTz25@?pb$)(+^KdxS zYrlDKNRVr18Iu7b7zDa=^vWA_8pXf3xVUXJmx8^cnN02PHee3N_r~t4)`C_E{PUE% zyL+4y#g4~8Hus--+8cGwm{M2Q(E+LSwv1CSz)nYOw$^(0c5dOy(?f@)N~v+!?Mboe zPFA!VoR|T~O6zeb5pEM9DdCkfpx!zuj5yryaqXX1P^YVNs@l3`d=N`~`uA=7ci(1l zNGT?IxBct_Z5NDg=|7mA6&0$mVuIDgZkL2<35S~ZCS|pbf}nbg1YOy~r%6!b#zhFU zdgYJ*Z2B*kuuh_LlYDo-Hwz#jeLt5N_H?W*v+&=tI0;oDTwIO#g^2L(L?L{S_hAeQ zqB^+??Uyv+13vxxm3yJqgbrK$-6#t1QQE_T1Mt*`-EByPE-~+zP5Im89mOYi|CHTC z`21_%E$TL(Xmt=J?xOkK!Xt|XCzmpak^P|+WK5U~#`waPk+KoNALVnq7d|FJ$a9W$ zu|=P*EJH$t$zuOjBB<_D7;6#X-!&ReTu!HSv!5(g(=xF=)5Vr{_g7@#3Zrus=2}fL zA|3i&u5;onkRdka894gv8oAJ&%=YKiGw^DP0TqtDuHw>5J-Tqz4q*CTqg%S^P5KEp zaCkovHbV7BuzqEVUSHay^!U>g`}a-Q=iN$v{~1)-xp-i2YSqN-73QVt!m2f9?^X)O7H*d>!-V)9YORsI8W%> z{=Wqoy$A1yCotM@l;8e44ZE*Z;R(?DoQZZP(Nsna0~b^UT-1}ikq3Es$=_-u-`%Isz`R>zuhtRwn-<#)3lA7hc z;UZvA$_~d&z<{Sgf&j<~5Mik7=;*N60ZW?>6h#rlHqg;GN!y*zMp$F@Dm1kOHQyiYvHse^2U+f56br{oJCNd@dcQP z@&ll|o(0Q-J+bRlymIcm zp73@L7+vuE24JJ2oin4Ofly!L8vv8C0y*i9qZg<8O4vXE;Vo+dsE7Al zwx+=eW6(xX6cKm^N^Zr<&;D1%OFbdbhy^!&;f&RvHS&5&fn;oYnih~bh?{=X08Zyt zRwUgUtTIXhz`L6K)cX zqe_2!;t`hwqQ~bBqa)0aAzQV91_&A_4sU$F-UN=4h24{Tp~hF`231FIk{_+LlEL{_$LMd9tO|Rv!a)P0x++5Ak$JaWHb{4Y6W~@Bkh@f8- zu$pX|4JWMcosK?dvAQ62K6j7qzs2t)lsU(ztjo=^Z4o4?ZxCh$*n+f{n~xJjvFT95 zvkD~Vkn6;t92)@*=4}dDWBF<*cN)d6l=KwJ`PXqR5~I`?)cJ@DJ{62!MGqDe2S zPySg=WKhl=X<3xW`Hudd1>ItlwHA{|C0EY*1KSv(cuA)#kU?>U$}RBrZ*#z)$%GH@ z)C_3-pCscYmV-{pc_c5pl06hJ^)GG(P$Z0^n9;u`JCE5lh@E zjiI~v-;TnGUhb7rqBXI1eT-qB|JCstPZ1eXa3@D#ZLH)g>w*J}(tqz%4z<^!Z$hC& zeP1tQN|&Czl#e@&5Ca{Y9imf8>>!&u^=Hy`z!jx?0h_G6`;094!(H$2zSsdW0tdl| zyt(lt8}{@H3l1R(v3>9&RySUYi4?YFP}~G5vWa&uYMLZT@c4&jQ;db==B=(9<@?2* z4MX!xQvMyBPNK2TgJc(5LL-U))WNX>>L;y5XLZWOK3)HJ;FpEjtKelr;A`5;(T;@E?Y(&ey9m%kpUj^+l{*K-x_>f>)WVy{73+UuhLh7OdqCf*LnY<@6 zq=PmkAmRq}=9!d3

^v!quQMtr3L8#rJzIPgQ_^0Oz$ac;*K@bV+!%Xunj6Z^C(@ zGlV!M?4ho{+5i!o~AO#K4h@2M-<~8&|kC z@$$R5PLl|bw;HASFys_~mts38n*CgmBzbst0>k)|uO?nhyQ^)n;vk2L&(yiMq3r*C zqcaQny7BpVM&ieh&vu}{-G0ri`zCHHWqADXUF}bI@iq**Ys8qkxC!&{^gPAS#G|O# zZ|LdcqW~7BI_Dxd9D{JcwmK;SKr9kGM(#+X!~c*4%)2p4ioLr^_3mm{rTMMm2^FjD zJM06a$Eq5?v5q|H;QrJ*__QDxH3g0+u=I{F?jfh=4295#Pn=2;ihe?v7Lw5L?x+A}C4PG)G<0vYJ4jai1aQ|Erc}J@IV$@b}iee3u`r z&9dM&dv9Tck9YonLgP4K+F#)bH=tpmaL1#ls6dc)tLy3(Bc(({MQKHRK%l|u91vs5 z&dC`Z9`-{|hJws?{`#}!)7%3C6Wl}Bw+(41?K{W`(qj8|VY9?gbb66+){XyIH+0vp zcSw|IZT^%4WQ-At?WikP-il_e7o-%X_+k=$zPfSxad6+`YPLT|3rey#@PyMTzL{)0 zcC{GSf$3Y1m1B233kEjW-Y3VJew!N3Ik&hF9k}`z9(D#meL8)8HU?kbdWi<(e}6gO zBxH9t?uFmDYrhmy`Q+1+)#F(VnC5HElds!z&2x5tTmeMp(f15WSA`TBI*&Y}p}=-oAmh%Fh1NHk(Hva(5lIj}h}l7_-%XD|#7 zLwx_P+5TDUnb9Ui-8!CNDlWDM72kvHR;@GxV94J^_5s)+m7wS#6pWQaWn*AwZhsmz z!{`*L^w|<=v|z+FzhObDk8yR-Ui2I!$YFsoLxxGg6Q{uJ?|`>IE>t1_lE$sTeb=gfU$^jx>zQJ3f17G0MdT} zV6X0hYd7WP^&C^JU@y89#Nv0)*7;B8Cd#uU*W`JW2q&MgOy3=!9{17b7zU3{Q4l?+ z^F|}_I5u$E#T`_`-Fk5*&I|+DC=5J&6ZAL-?{zUaqe_Rk8TmawzwU)^dI1R`G?;x( zE_oKa})_KHUnx5@)n*&X% z%mWEpj7TX>YZwm6Re+s z{Gi=|xfDlE0Gkj!Ob7%hII*_Kj7QQ|IC(aL7u(E*f>Z@uZV<&7< zkx`}m#bE+gt=Jqq)CE0gW^jDG-VUBHP>GT>>@rTtCxm(}*QD5lR(P4I2CkLKZ{O)l zvt``9-DtSo*O!li`4*Oc{o1vYJow({=LPmfA6;Y|c=LSILGA;t?#hG27R~G6crYld z!PkJx^$xKgu;R#SaX1rnDvr~03J<1Q3Hqj(?Dm++X)i=YS ztTa!k-!%9>arM$tUEgu{bI1SjyIZ@-r(NJkp>-EAiZJ?ejtR;KZHAiA|WVeoFf}-YJ~3ep+=8)v+fS_UK_%v#^F^;O?dk zd6BEhH}s4D*N(T`>!2OiYiaN0W05$;AbW<$kdKFvQrOjk5=(rg^W$q8y5OLamw*RG&l}k zlK)AkE`vicfKS#kVAoZE$;gkvLjlM)-~@ipgSV~5#MI7Aem!|6q>IOH+g)=+gZk~R zQxK;4?&=Vjm~a~QX8}BLth%-q&K2y_dOnN*CxFsHpyrud0~LOAOG{@UT$Kg#HzXV4 zbkD8|+lkQ5{~h<8;5;7nWgapY1CP#f zS}w?d_6-jlQ@L{|yS@&}0Hj1|OQ+7Z~l@vj`_guf-`S0$`#*B`P1DAW> z_q@+}o?o3j=YJUM)C_nr$iF29m}scq2Jo7_z#v7HIs)}qLb^Z!JptVK-O_~r4@mhx=mK=9r?w_0)L@&91Vr7;o{xAw7D$!q13H8lpz8us+imEK0rFv% zjICh~4!3p#{l9*{`O}__p8Mvt8Jmy(`=-`^Bixraq^4@Lg)Knzya@<*Kz+CqVP3D5 z$vtkInYQNVeZ{}4!9Q6k$7S}3kAK!89wK0I*&EdR#^D1Av}y64SrVA?!XOSGgRObXI#mHmvyyDf;s9UrK4UIpbe(DTWBV%S8xqS zoQ`S$&cX)W+BSO-fqjgq(_)Nf>Jj34|Ic$?hdad*d7%) z`VALQqhtSJzPkWcV0d3nP6-($0qky`ao3#Q@2^hkD0t)^?;;Zk#} zzHepnHyD2BZiOC8i^qTH`R@n82>F5w{GgA1Aw3148g^=aBLw(qjoLr{M5xd~<}qk!j!%9z|SiSS9Qluyhl8M|LyrVy7u z`uP#rruE!~ATuL$F)gBhhqyb#^6KPXp%|a0s1`+6 z(Y${72l!6tySxnI4#>{(yBFY|Mg{H9%^#uI-fgbuK&V~b%?0j~M7GWgytloCqc#<)|2}ozNG?g>t@y1j&~qbMv4OeD`BuNC*!*v(r?B{tlM+wpvB_IHY90TzKbCM>8oOirjvW^}vQF>Qw^O%&&nY+b5{^%Y8u*oI-8l>JrT3}>@+K9X z6zeEdd9D3)Alk3FAZ`oWMbnuW)aEd&T^`v4eVu|Ut=@tnXF9No#0t1J8Y)CFrZTuf z|1Bo+7?>ki`irx74Jz=O>COAu7ppG>33s_=rvxTrHr%}x4M7d*YFI_N_o717rkhhL z}y1usC_h+&~cb@e3A8GJ(|d`kfEB&hUS{88NqW?k;o_T zuH)w=62)2t69RfC9Tl%zWHQ~_?0t+rH1OYP>QwcmpJSt;p9O~%1aC}aq_=?wZ&UC$ z;hTrFIOS*mJ~J~4YNF94_MP^;5IwWvwqz=pbQKvcm_UL#0PbRIQV9P zO7u#@>llbjSk#D*I#V2!fFDc-rmQsIIJ)>h7c+7I zyj&Ju!C6)zb@ah;Om}|Hi7PiNGS1fT;A4>imMArrxkXP(BAH}&>yvzv5U@jj9kE8c z{HCoF6iJNd{GE6Ji(HXiJjHT@HqI;R9BC%+SacJ~d@`WL-Q1emGK$`E^#T(Do?{YHf@4+Jo(`xx!7_GfV>2Ar zm8vD?%_+LW{u5pC2DF2xNhWB>XJVM5JKIxG=LB5|EcI)mV-jMMeI_V_sc#VW{r}zO za}Jz9b-qBn2qJSqH!Pu|GF|1#>|WsXA;syH&*p*A;~!WTn_Fknurx;wITEb!FUlhH zS2tU(#Z!&j%xC?1ZiH~LC6)`Mk1yJ1e~3uKFIQXPp%X&4nv7YXa)BnofCK=Lg-!?6 zAA$jk8fY)!;Rn*`Awaax07RWPHDLGxc%unW#ovnnB9tBK0fiEnAZj=;F%buf4(r;q z6iQo6gR7TXhpUSCjCxXk{>TN;K&)g05eW$fTEgtuI|rzexg)GWt;zu@%6fJOxCp$_ zL=AOZ`kFitAAeySc=@Cvuyn**zhdD0U-{BM`}@ey7&se{&;VR7Kj6d${wcWeSTu}4 zKm{SE5d_-2gPeS5@@GrPM5XWW+aCI>sR?Y9(IUv<2O%5TPEa&W4g$oW|EPI5Je~&I z-0(LgaE+L~Cr*tpMiX>gJEuT^KBD`SFaYd@g2~TGNJbn$jxx9r{lHpUDLe?G-aZ02 zrDs@L_b)BTr2#?;%X|pxzY232UJw-m#6t25seehT)|{jrLM;`fvPzYtaqg|DuA8w8vD;q$ct!Av zpK_55GRe?|*J(J)mBzdMllC>({E5HaHBzoJmcBKsLizKMKICxakw~@JJGFg51Ysz{ zioCU7-*_DEo`w17Sc+-zVn)RY)Ytsd8Kbv_n*YpBQVjD{+yQJCpudMws^ErbMUB_} zmv@59qj5i;QxRI3*}1>$lU0V7(NceWjo@U9>EJ0SEq6TPL>f%r8h7?Rle_{r$Li|y zv)!yiJ9&t|hGko=4_>Uw6ygovB&$P9T;n7dIDkJI#3D>{ik6G{I1g*z*td8HL|Ef)U_TdSph;G z=-dKafKh{wz%Bs@256)$T4PvP7*wUSnFT~Rf^G*%OD-}+D$M{^^KsL-Ei%eTyD}E5 z;-`p4M{^paDd>%9d~$1tESxbbmCO@9b1@`S>;-j9FkUNQntwc;NuBuUWoiuBu6^Ua z8|zf==yb%V46r(nl)?!Af9Ycz$5rTh1)^$@!R;uAH|PZQ%t5nvsX!zya8*FLWT-p< ze8+luiCNPvVhah|ojJN2&Qh}!g#~LSR)|Rp?23ZbA#BbVYyZ-yO7I6Es)~AI6RNP` z2iWVpKXP77=IAK=9Vwx&88=7GA&0Y2f`PhA9wA}!?}l*E-1l1-ep^|VPhiszOs$*U z{!%6JWaawVIOac}1sSpn)Y%{xu??jEg4|VTQ~^}WE=>xMGb~=6MSh_F1$ZMgx!US) z78IoZ?=%M(>!A4nKrIzNoM8x8Qy0Hi)o)|f(mdc4>6a~<5YMA?12?H~4JZ?KL4m7i<+4CW=?Rc5vLv36e~v7u#;hjjT7Z@6!W^Gf^E+c6 z-cx=Iwh^}mPlGwSkq?7$!aV8k-Q%?fek?uS>lp;qxPOAAc-;_Kv1wXan4~hwiPzM@ zN?qw3Tm=k^z0Y03+v8@*p1}kNZY~0XzXt2HrJ8dlJOp&V|AifZ zF^kZP0L?xzdT&T2cfo^=9BxK+X;p7W#f_3p!00FIEIBs&zb#8LPui}<%h1;DNHGks z;$$OfwKw{E*Bsd92<1-qi)u$piPd2CI2rl~Xh&c-K7O*gsqbta<*mjhZ_$ZSM zlX##lOb{8Tzp7CwRWi`Gh-a%%wQ+n^6G-7dLJP_VF4Mc>yI}UuTAXNevYHl&RdczDh6yNwJsqblnzhEJt-_qVW_2QQ|u< zeh^tPDn89G6pt>=-AvG+9sEU8CONo4F@x?4x2B|CA#N`1R=2EVQmo}>Go5?0qSoYY zL9MBi!wPW6!V6`H)aU^KI>`Ol@vpvA>q(ECS@iY*=EJoETFlH>%=oyioHs^^4tKXFkxN?^D zcG4ueV2)$QPzT!d3r}2<^GiD2@lxO-;1@mEC`zVfSjoYEIO@(9f>Asgos^o}l4C=-UTj0I%g$wqm6B&&9K--J61u zuYW>JBttFyRq9#1V---@K}?%yZ)_d7FFX^PR&EazNM;7K=L`SLZvT3u9x zzr@0^R`M$j^M6BdNs)TC{N8r0yASrLBMCJo^pq#ZZK>6yrE%OSM#c2lG11 z4*44vr83!~GdCcB%2QgZOjYyQSRzrFkB3B#Nv)XSRVgp}YZH>$^hU<^X5wA$?96oAib&xy*J%PFve;MbVjS za9U>uJd?`^Kz+@&eazS$y_e_S(x^t;*Jscn)m*JVqRGljA$5N4(!GC<4J7d64rk7v z@|s0luEpdSldSnj=|0n2h#c0{uYV~c`c^ViFHtpNmXxpg@D`u!VL1qZN0-?2R=j9| z=JTPTK{cTO@?U$Q0kl+$C=93FC$jDR040uh6%%}4nkdN0@nVfI5m||FtlT@-VX7rp zA}_4(>|P~*qlrKwtmAuI(=kNCS^3a_Aqi|TQOk+GL~%KL!J~kx{sq;zz{gZ zT0PJ*s**V%u|8DOhiUQk8qL}!52~ASK2%1CuSdmvhb;4B*_r9K;o0EZ8?kC7ssb(D z+7AGWg5KfJ1NV#V#~tH)$17x{h@;UMJpeHflnEA0G_bCXtBJyePnP$%dh~Fh1{>*? zin~x-c9Exv4{afRYf6J%lR*PId>qKO@Dl1GE+Pg45;za4Q6Xm9n(kiTOnx4@Ex{08 ztSRS9BX4Y6-Ryz;gTB9_Vj=F%@e1pNH9fdKo#6T`_jh4=0H}zIa&c^r>!Se{&e0Zx zA>zWnL{KW2kZ?PeQIuenr#at7hjH^{XwOlOgfP5>LGpCP`zG`FxIIZ9h^)(1jO^~+ zaAy@yz%>CQ42(oJ@kaLdzAchpsfl&`f|Zq3K{9rNvRVXB`xd*dO>~`~@xP5*oE5n} zHfKe_EubbC=*3iivL=;c<=o3)FRkqVcnHr}!&RwRYFb7DxN)i7w?tyjBSO+4@ev_u ztA@J7znpz*&0@=JwQ9rQ>{E1(Lz5zd_sBK_ZCa8c^*jk~BLn@Hmv5AlVLdQW0+qU; z(Akfag>A=APGTi$R<%@A$cpRhWE2!q2oN+Br@wS z&UzzNoI+(kt*hN(BdUKySNF+*Mz?czO;p<~yv)D)uEu&$ik$0oHQ>_FBh3paxPHtR zK;l=qJuWYLi!y%_&W^2Z`^9*3$;Z?sMpnuiWLA_2Gv+D@hNogq4J| z-b4lO;yVIhvb?E;KFF4hHiVPzH~e_d)>-EeY+H{V$@Eh_vRm^HGbf@mgo?!eq|Bxb z9jLR6THM;A!^&Uqmf&mTD~wIf$Y~@42IwIV`YwR3X?30Pgj<3hzh^}oR^#bU3a*4k zncWMGrpMDXMhY;w4zbmAYYtA!AA2*FVR>Ah3M^L}qeXm3hITDmBq^EzLeuV~&0*gw zFXdZH&NNUPd(t&x7UxN{wu#A@iRSW?GY&6-BemOWERm*!u6mH2V3G>Z!nhZA*D##y z5!;ks9tSnn0`~^AnZ=W8P}g&oCVuQJxUl4_5!IYHaW@cd&&^(v^@pqo%)%I=2sbeE)nNCA;gkCgDIs^9yv@@}NMZzwr<8lNKevFSEv^tG z-obbEN}J5J@X>1+Mg5*}#sBK`!hCK)xUDXZB4uL=4ic}a9Hri=-;HU(t<0?X`ExM_ zKrXHyOxXR80FYH$TJ@$u#jMtVYeR$tZr1-RYh3Cq7v6OS>ZlG4TcoNuEQdaUqYMw`uk`~#xh(ow{ zFoRnFouE(sJR`t5I%By4aPHcJr)tV}sn~61cy|5_m~35xpzDzj<_oCyM`{nvFH|q} zzVncz9c+9Y;QISB%Nd~Rj{F61gj&7iF2Xk^25*X^Z9+u7TR#YI=O=7kUscP3lhV9QZ~=Hc#8kue zy@zRz*vF3+?`MM>A>onz$)W%Qw~~Qs7-$8rFy`@f<~c(nGlZLk!ZTUVZP{e0Jj&Yk zla)zv+ z5mEu&`Jw58y7UITMTYUZ4?+za6J*4Je08_IHGb-`gM%J}N8R0Ns}r7$Cvg^ERKDAt`CL{wl}Gc0Nftsb87n4k#gS$Ju}b8@f=9N(N|*I zm+_;Dl&7wr2xEvUHOf!745jHOk~L`G*=1)Kez#vKL&H^Lj!)AB_|H0kbU9c<`fgb! z)Msa@IzLnOmQc_pYY03Gjfg=p%`~;qCemlIIh?)z*~Y)v!0Ysu(bA8y@M-xe+aM52 z@!fUH_YB{T`A^!P$DRqWBl!U|E%ocj^G){N->>X4+Z90PtOSt~ZkqxCvWFxxV2bRW zH-7c``NHZu@s)huC$q!aqkj_~2KV(~5HV#aIlS}J!Vf6j^Ek}hdn~)G!qfhsAFrvP#%-jdkQRc7FLB;t!8`2j)S;Ns+CqS~_}nIKX2UFyj- zm^borXt1LmnGC;df{s_YM=ofABu8VmL`=BN-XOO5uF>dPCt-N2Ybgt6w&u;E4j3XI zdf&*4%#Uoq$HgM=c4D4drtPF^x{G&cVS4x? zTO;u6fiU1B;PUhrw5ye9m^NI8$z^r^>VdZiBwW&|Jx-z8d4M!@j7Orxc5d>~D6No- z{)PxoWS1*YNkZM0{l)S<;V(4w?oVG5v^aZQYfCw%2WubRB}Um2pQUKf3Z(hKb{SpP zH#{l`uv4fOsF^O@*d7Vz+MTBz|D22)Bj(sjE!X@rxoq*?8r{mJ7xC;nI^3_$8Chku zqQ0NDGiI)~Eh1H}?~uN{1EWVPDezlF$pvc%)&JBWMig!8f#OW~2Oj~)#r{6oSjqQ` z6(szxO`7Y}$OfJ-oW4_02a9meAhO7~il>lt?Ul7iXvl{i33_oEbJ1t2YgQOq=rKZSDj;YobKEmhF5n?;cvUx+b+OvPanF~@9%t=nf!^arD-m?u;#`1 z1xxkzu6IpYWh1sYZfuqWM_bpTV`N!}EyLyQb4seh81U$|;>uP8cnV8nEi7QhVn2Td zYc#lYbZctM(+YMpecJoz`FUzEEwgmZ{cwk1AqkCE{!#I>wSC4D?P7_ic3LL%VR8zphqD-+bwwq#vGWLSdOLsVUmK z3k_oBbRD^68PXEA9TTet{Kr=FCRM;?Sds98U5Y8j!i)bg;KDhj2cQ;e?^oHZVjvzw ztsjJXl&Qr#DK&#Vbqva@t6a~VtuHfrZ*i;C(wb$Awbp^0C!Xp(L?!A6LYx3OTkX~p|CEvwt-9ffFJB30-+!g*d+d(ufY=Gr?G z3}&0dJYzIEXS2lD@&GfLu?i)6^)TEOy`+)1G@r)U)Q124HhnC`TIx?{MjUg9@j^qx zS`))eWP%FgyL+>dA|E+TE|cFUsw2FMm^7j$pt=M>VAFKkb$_Km7mLDzhxE5LpJX9a z(KdaN^NtbU8MKx)!>pg!#M`q@O!PP&y%%nW$uY30eqq{Z*_pn7|K_<}x>k6OAG;vf zWqw!W?$=npg0HTd!GE&=mzZ#w1c!0f}CQ-i> zrq6On<;&n`id;=jn%dkuf3muaD%}v|7v+ z8h`69m>{&5l|U2X@V~3P*p3Y~G(w?S4IqjRxQ>9y3K6g_y`mk~bId^ebpo=4IZ!QV z^~XT}KT3@I9=B~zZvW3l`2r3~vxa_2GuF3k*gAjgl@5N84z2IEAeOQrH?a1x& zl(o26aRF74lFH(2-D$5R{K#w^6Gf;u`M=xcfXk>45FpTy259J4Ue`IRWRXe)$oGW< z0if3)J0Ss_0t&KcXc&iT_kc0l7kGq6{6W6zxyDPf>5p0mDbvaLR&3%tQ-(>ob;G~y zn5G9?wAXe3>$+Mj+DpLM(w8kWc8!c9p)M2DRVtGYYl_C88s#KigT-Ttwp7G7#G$#l zfV#w3W0j`mELeu+&Hj_BXwrG>fF7=EAW@9?ceUEm_15~Hrww-i7+k(w$#mE)SW&GB zj)UG98q{$vndrQHf7^6!9gLM1}A}w(W`%{8F>aX=-CqDzm{@Y^o4*_8mPGtYO(%bT^Ar< z;VBFn@DC1b>H<126mVGNXs##)NBcQ;a8Ia{Cdhk$<^#&n_kzqO=n)AZU198pkn{qS zl>*WT%I7GKtVKu$3d_hCV5d$1V;`U~*Wy$W5%StvF?Q>|N2Aal;_ye(ino(ajm=D1 zeiMQnzo&)s{dmkRV)V6dMLQB)gm`t8n0(_L$E5K3UOLF=v~JJ%L?7`exW3UKcm=A< z$>6HI?_@!Udm$}>g-in5RWK}paB+3+d#;I{6Y=|FqSdljs5HE~kH??6ER>*W5tL*g zK_pf+y$6~fngXrZ(^tM*w0ut~o~On9BpNj z{Rch@2Gxd@3pjyn79qS7*H1>yosh(Z>VFIbHg^JK%{Lo;z$Hb4<#eMx0^tsTAOR(b zilIAjYBSQi^F)J$$3Ie95*TB0A5)MVUAk6y?zY5Cs4fjh20>Pv6I)H7VGjHBp!PS{oI2cxpj9+(wH@!< z6PP>^&2%KZ3;q3fpCUIY@xhFY8lsL8>}h#8tj?si=*10}PPa_S3J5EZBl$6u%l1Y3 zM=-0=uYB9l;}2XV11tUhR*}E>{Ony?lRLITk-=5FOw~szMllJy?BUH>Qb3UWIma%< z|4xO!gii^ENvck9@3C2NAs|R3dgdRq-?}85nMSvU`#`CnSuVx;18d7vP+Gcdni7`9#NW`Mx8YmQ4J3biBuAW@ z=qU!-f!ZFN%5XKHiqm?w^4OLUC*Wb&U;KtiP`5MmBxT3S=L8W#@bx?B-QMXWtlFNG zoOKqIEqZbi3CP-$q&0N2R13n)WpP#5@rMGlGsX%2|C|NWO#df~?ob^movN@~c=1Vmx)Cn`{G+|~Rf zfydZdSD=r=9=yDSA9Mn~wSdzA*LDXto@`x!T2jnLpPF{c0U&3y<%M^KuU_uAf@d7^ z2kUto6ORc#4^dPqTfu9B8kIFNCZ0l5pv zc9aBWDp4+49v&Rnc3x>IDI{>-P82x85+54m2~6`jez#W8V*u|(1RU0(o>C<}Jv8V! z*gz@(MCZYAar+Ir$W|P;6qn*K7MJo(shz0bZ4TmfN*^|VgKY^wPmgfJv$k&^CT2Jt zfYa!EW|ow31Xz3-_@oYznL&#`G6vrCzI+a3XkZ>fJGk0M^cP`Q;T%v>6P49{YKaLy zFE=F6_Qtt=)@pK9q*riQ%7@nSlkdbMnaB-!epyhCO!O^GuV}bjGA}imY#0&*W^UB5AfHQ1~I`^p~7_pVKaQQ`&ECPuJS0+ka@DE z4vdRYpBfA~;2_|YYc189UvpXM^6-_Y$mZ2Hq}3zKC*!xot3#D}(Z7MC?>8Xiqr=a+ zKV&^3`dAy|wSFKr7vv)jC4o=*HYqOzn6`S>3_mPAy`r~X372tkSc-@h+_LiUnoDMU zj##K$`?OmO!{?~Z{Q*WEXS=q4%jHcGo*I1ye)KTY{<7*kXE@f%+#3bN|IZ_5px5KQ zd8eXkon+lXEw(evU##_FRczN*5*akv_!a?~AQd=XO(}#D6EQO-g0^v=6Bx|(wR6QZ zhwzv^g=`KnFaLUk)I^~j$E=@Uh&onEV#6O;d-7FPgF455GG+X z9N7UWr_#4vG`BsX?JqGHK|c>;YTJ~~rHF>Rjr=i7+mmcOr>f3v7f#nP;T_;8%R>P~ zu^hQ>kkCuN89@42z&Z#@VQq7>dg`l0p@U>;RQ?$r)w!-fMG=p zsEUW36O~Xcv5^J`$YUQoDa~+1uB-fqokns@B^nE!r|6kfbJSH*j_P}9N9C#u*Co63 z6EKJoXX$2X0<48^Tpv7u6%~6L=51IriJgsg8Nbas@5M%sTl%+@jwSwvRUKVyRCxMt z)2n1-sZmn`ZekG7*K^U%;sC|mqdj-l1nUk%63~62!;0Cc&ChS?J>=bBKFRc)d0g_g zzH9x&mms3xn8f?gXj|U+nWrYe6=9p#dE8ns}P zqqb}#rSNY<|Dv575x6mLWd3NkB19Z(YdvaVGd5y1W=sI23h~N%F@RkzK>PZ5X2ndj z_({$q!NB<8>5c(W^%k*SMw{Fu{FsqSKh1BTplmc-jW!^+qJG$A`Rm`0?M?|1T-?){ zhWfOi8HkIC>I;0H52+7{xe&FLhaUlso<+AudR({V2fxlm&g$CA)^W@GT%BG=;i_jF zx#N8R?x)()5i$H#R3rx^G|-{8GTdrQm7SZ0Fi@s8`eToSpJ&29fT zQK7Wa36uFXa1bhR3UtrC4yHKFy-Gh<0YF5sY)p#RO06g|fJvZv2O*61Nqn-+1_8l` z@LEDun8Bo)xkRp^L4B9irm9y$o#G$wE0(L@JkUMp$Sn44PNX2bDE6!8ktu(E{2TZI zzSnlOtQQem@Ua;d7;gal)bmB=Q_!yK!$|0 zNf>ScU(Ds`U-3qYz_b~xCSnmhck zqAH(OszJS;dBK+t5Xf5uetkk;Jw*yXJS<;;3jh@KZTz>OrN0bdo4Rh6+S+IA1~C94 zb@bTINUkno#_D!;k<7Z_)J)K2{Sqzh5J`x&F!er(^Y;)g7+ z4fn!RDIgr;-TMMONrfVO5_uV8BcI>j!Hq>ab>-AqlAL3N1DGFCbR7^L^a7>8 zr&#X>d`u{xP~qz;f-WE;UEK8Je}z!HwVHAu!e4aiVvAw(SX*m`mRB^hHdM21*fda= zdN?~O2)FotM9Kvq)KUyPX89}MbpRy3oSgucq7KlbZpyf~47+({a<>>lxFaiWkg5Ls z>HMf!axSTy+>=Mhmp4Y3GROOjB`z8xtf>xnVq*!%jTk_dSRu(MQ1CK2bj#BDc^0ks zs*5h?aSI!v%~P|vt3ozFAROJWOkJ;v|9p^;pGl-*g=dn7pS=y^$AcUkx17GkHU)MN z68RsT4F^&?#ZQ-UPGo}v+JmZPbj|IWZ^ph=2;og~+NC<|h?+qAU%=1cGwAJG^vn{Q zPbQadw1NI%m9prsWD-GzIC7s6pK*_ zg6Xyg8Z61enz|{GfPF3r(g0x725OApL^Y%q@w=_cr`L-DwfoWUT@dp|`d~eUWbIHO z?b&qqm3;sx+ltw!`5Wg89;^2A)}qwdsJBwSzuS1M=oa0mNP@&yZ){W4Sc8vE7bet0 zU))(Q@K9{bAd(9D74KY=cK~M3qEQ}zfS(luDqb6XHin{wr-~XxU;^y%@6rUH6bwTm zsth=&Xqpw4uE$@k=|Il&!tH2uC>Mb9fgp<~vLXper*8U2tq~&%9@BvLAB{LW+Q|_1`z@!EHL@MEB6dE~A_D;ZeGFfMm=RW58xV@veba1>|p432|$_s7QRU!DDs!;b9!m*$X~B z{a*9-Q8jDjINA9A%IXunoy&eZyjMYzxNa$4pKL{lG0TwcPr+y!1M@~Sa;I~_J$Hwx zbmf;j(cb3Y$jID+{2IxpoSwP8#rg=#Owgj*l`<_ZyPv%NC$()ij<-U4SZ11qZTRfL z=k{juy_s3Nv{g>WpSzce5;%?c%WyJv3K5x!V^S1pF;3&S)mHmGHs53?Eliv3TH#%G z#2xEDBkSr57aqORj04{m*yybJ?U9DFz7KvutfXRLfWh&e_JyQYlj4ulShMT#9KZAP zmDLp1?05Qes}XQTK@Bwh;~tIWcor2p`AO0*=L?<%wD-G}TJ1}Exz=vReeUohVW0JW zge$ISqS&=w=IqDqn}EDX32%qDGx5N~oy#vMp_m)vqaKViSy~#2i`=7#O@ilUhdyO! zQ8Mg!xZ0PrGy{+*17w?887xLATGG$a#IHjS9It$$e6Q2om`5Y|#cEQv?oiRG0UkM3F1R*sjZ`%JNlhfcPrsu%XYV!Z0?yB47x-6scG za1Mju`enBewt0%#Ta?HTnnG+A!ifF>SCnPnCVpMq+UOj8JiKXj7lGLRIX=tqnOa{9 zQ;ai2fZQwnUSC*Qi8Hm)qr5MA$NriV+V*{MB#T z+hhg_cpIg`c_)Amd`{xO9+lH==S*u-V@bx_l1GKq<^$fCp=endYB+mwmdkJkkzcA6mvfpzU+JcKHXJjRfGpteJuO> ztD~d;w&7Kd$KkZ&50jug2tUNfZ=2g(5`jjF$wjE~xxc8e;F&N3`?Hx*okDb~7i(@G zG(Fd{7yTbm@M$x!iq$_)n7{EC4Vso^5m6M?VABsmX5!~hyEu%ZNf@5ddig3>ivh>* zf+H?fAOhb3;b>%WH>|eASrEgJ5RKpe6IoE;XW`jKcN&)Q@G|~!whPoo|tUx%(INd5Xpsqa4fw54Gq`SEU)p0xuqLy90b%QEG1vBOIt4$<*U z;>hw}?0Qyzx~rJ*-}ezuO|1cd0exyy&yGYvgMVjS`+3@NeH<&xe0V2r7Qw4dWtu_L z4-uYb@3=bmMMYSVFvsE$2c5#X%biLqVcH+~>s>FloK?XY0e9D3)s-D&{-VqVh9@Ca z7EZgBQlk-=uU#xSM1=LWG#noD9hPG`gs($1r3t zF3&~7#!YC!(PVT-@7-iCN`A}-d2#w81w ztk-kC&O07%S8*zIFhjo0{K#EG9Mi6HOR}?L|yjEFPLXqA6aNVmZ0Xh18A2{cHZ_b25(r=+tGn&j9HEa);TCl+L3HoT(S7VLL^?J(Xd@dcADJOhM{IpyNHFGJoMhX-%!7oC^*sOi;q8W$V|`@jBF8Q%@t$r7X)Uud8bejD^@ znZKhWpCKn@#Xi%%KiPfaZh7F1eI$Gf6aLhl4;$)wigka4>}9*fgs-2D;|5L>hPzCH zG_95}3wA$Wl_e;l-$uxr>W7Sit&^MmtO={@-FD($M27i1P*Ai3=novPrN&Z-jlsvJ zFZePZ%}LW7_fw_t{evZ)$s1m+c*~xV6@RQF)U^{kBH&+yBOUy(=C7eQ6PcKr5ua-v zqChv;lA&QMWDr4HL5?W1cBRMfakdnHFwc2YUYo_AcM*FOe)xZxk;#6nTPui@O7xflrGP;#=eXiQ@?v!=~DPJyn zL}W)`m#ZU*EC$Uv@2NSz{x&@ur@n+ot)ef=qd320BD7AO zZLe+#i-b5B^eR3^C7Q#I@4TKF;ye#nIVuRQYZ6M5rE9)w)q1=vs-sa>TSGxOu|xLA zs(L-1q?A=?- z(KD%;%5$?J#pC2)|1k!aq)J7p7)&{W2J4V2HhJy zODqgS%dSzzpb4TsIgj}lR(^IK$gOv_fF;^RO~*_=n|6@4BU$#o&HE(%Om=AZaG6ur z4);B)V(13kV>k$X41cGBEIHLP#9o-s4noaFDc_U_m1lHIRV`~C^0 zWJgduzPZ&pO2uJZwqn{s& zHrqSee+QOkG#4jA6RSy=K`ZSVQ@6RcB(6%&#olq9G1zbT2RH@TpM|}g71v83WAR#l zR)>LX?p-^c_9}pdvAnm5?n3JuCz1bkdH9CtbzGu)8VNyQ&qz?s)w+w@^|4R;-q#;% z+Ee!((iVs^HQ@-6vD`u?C@h)ET1(Ls7H>^%vIye_vukYLICP>*!}$lad2CX5HaTW2 z8ALyv|HOak+KU^v3+Y>VhA;~RNR?-U_U-ui0Kz$t?*P8du zue2X@C#<OuC@C+a!gckgiry=KnKp**yKg(OT>Zq}Lw!soLJ;&5{6w)SZ z4l)R^-P5=3=S#MqWgF3dzY_FqA>t`G68&Sh=6n4p4!8X#=;W7(cc9XTH;B{JL2KAA zFjDw7hx#R7HgFOVClE;v5I(jxCH={5e;lDW;Xp0EzK8qOS7bg^n0nnB3i=;fopS?< zH=!VxR(z;1*=Xu>Wye|-;i;$7IYT2t#j}smD#sscRFjkmEt?S>Vjse0XwC&)T0%HT z3gVZp`h6WO9S4S1WDM;ii6moSi!ORmH%WWyWjZp49D~FV6;pSs=r%oPDt=r$N#YW} z@N#tdv}E(ebb;;&DTw&2BxEZSd&BL)ugMib=5QIl&fSK9{#!DwPMURpQZ41%Fw49o z=>*Fu z&?g}yhr8XZqwOjiL`c$H!`TWh>8&mQ{lc-!-a*6GNRKt^MC3piHBTDk#3HpXyW55H zh^1^$K7#&rO#kt^-+wFZ%%h|3&LgM=)hLY6EcWG{P!NMuXd$yP*m zk$tV~W-JjBMr5rJLS$c_>r>C~oZs)C-}61^aX1FYd}i+Dy5HCRxv%$Ye=|ZN==&H9 zP4lk?GhS4|CeiSEnZ!sQ-k7W}_%nKEg~zS46N!tdRq$>FKZJ+qVcu(Va3v;NwS)>R z!+F%;{CL({?iXK=OOO_Q4_f*-N=PtS>_7;8L`?8>G4gqBgSlOLLtCqcc>H(m{Dc>j=Jc}vrfru)HuKE}%;)OSx6(J&k2QljTHT1zD_eYQvb6h(;R%BfL;fYQ?(aUw z56x_GjJktgu=X}9{3UHKXU>m5b5J(9F4`JAROgnfLcNa-aoA41Xw+n$(sQ(jNV5;$ zW4`lHF1+nr{oAyk!}P8>7ZdT@vVQo`6LpftvtM-aS=LS2idmJ_%d?goHggznt4jUL zhAdA>>}1eeYG;OAa;3H-`(K?1J)1CS%NlbhDdVDoCofHYn~0FpN}jaMlgX%I2q5gVt2ee>T1BO0u}X^x zJ8`3eDHqu|#nVL{9W&AdZT`;fo3WOy`yrzH(?y&cluOfTcRnFuWUwvt>N^;f3gBrb zvwvRk$u40G9pZ3lL)N2BoRd&&GN4TwC~uig@9ZWJz1St0;3bMela(n~U)k69m3jWf z?`sm@PG|V~8 zwLC_#3`|SaPUMzHgw6F9<(gtX`>O5iaU|93ZC|Ews&wL3k@yXNSv{_eI-b#n$QTeR z-HWpWLt`<)tiIN#PmS5rvHU@^9FC+pwDk3+S8|r``0(U~5R=DWhQ4)cEa`odU*WNu zZ_w>#okb3z7%~`jKktk|%EG-Pjyc8GE}D```SI&5(oCjEM%gLa8;$WjVVRc_K6sv+Ucdh(X3n<=e|6!4#Lw=LB-9+wtzflBScx_Q{MDSu#Kruu z8M(NZAFLPnM#b>%c_e;MNt6BA(%51OdG{DXkNhK6a&;kJI92pW>ZcG1b8@zYP zgb>L5Vi~R=sk^nlndcMHM-`Umkjy0ARiuu%%R5JX>U@5nN!7tiid5C0cjDP@nH$F| zNG8;u9^pul?KW{D=6ohTiv*){^`}0Fb3T^*z!T?YoW>yR>r~*ieYHBZTx~$!y(BC0 z&UGnotFGcs4v|VZi|l8!{d2$LTnCD_RhfQ0}$j{vFj;0lQS^18x=X`OOR-n01$D>aI+nf9J#qSlU z;uN~ue8lB&;iK9TOQ%rLC;tsu=!vABr;NXUe|J+TkY_29w?r{@0HrS>+ z(NB=88Kh$Sa?9h%jaUcerl|VfPeK}$ZHMbd{bMT!`Xhr&6U!1@ZZmpx7Gbsnlmb^4 z$6}djdRC%rG-W8}FYN2QImRTWR=Ri0_EQ}3U9Ov6UN?i#-94|hrBc3$(~?A?wFo7e zIh3Bpt&E{9uN5#0_Oq}SD;s#6wxNvx-A3O|(wa}QFfRB>h zMYShoV$IS&gI~rPq0$wm&rgf?Zsq8A5leW&0!2aFRwl?r3*B8v(~@%M6KB`!w*A|; z+RoP+Q=hi|Je47VmAhXjOb`*LA=48r_S>%>bgT_7%qQK}v&6X|>8k&xENg`SEh_>$ zvjUP~%dI)qpZc=N0`XUQTqNok8n)}qI$kg^MW*V`nwres>lxsPiwmg7p>=?u+KneseInP>_usjOoO6*1Mz(R(C3WD^2*Hg+ce>uPChS# z?B*&|AOpXx+roOKCtTryDukNxMEa=P3~N(A-|};WpQK=Z$LGnJNcJJsZyDoBzspVv zem_tF?emR!cRbBW*)!Z%V~fU?JkQ+u zBnC}>f?S(`nskl5S6}2yAusG1F{cR`$dP_`%aDC0XUlOdhI++mn#>X_o|OE~lZZxQ z+&?;!K$VRAndKs9 zB82+LQrq z@t!VM#5pvJPTj<8=Jw$--F)TKCXLFkhD*MtvArHa5_qm&wf{yt2Q+GEqL54NNvsCl z!*JIsB7hvUM_tZWwJX+@+$J0kCLDR$X(euTBKES34emt14!&4_dU%21VVIzDPJ4Jh zlYpyCT);b=AMe-IN^5`OPFnKEpmJi;?JwBgxF&V`YrH2XP|*pA+jTvH1&Ab@V>8q=lsB5!uTz)w45fPf9vO5ckeCMx_L%$ z^tF1{jX4kg!9-*EcJ2tOJN2g^1ejhs(NtO<>=8M;UF)$gEr$yvs$@7_QkDI>{)2Vw z?1TN$*T^PZ`O$-h5$gu`bOKMRGWD@b*wiR;dsO-sKh@TaEEP!y2k+88#^NL{g`SYC z=Z4%TKGUH;-94aOG;k(nazGLmYH?2Ky@D-XJDHZribxI5tr<=P3J) z+sUrls|S_0WZ`k_#4g$xB`&u8@NY6M?dd|OJ*TAFncYWW?qgdquwh--&#t6&x6&MYI^2t%E=x)G-ixv2kM$BG=Bk zx-Gt`ZFR!Tf}yk;*ewg2zb6ZB5uNdXP?Gup=W*Y&Dlesq?1bL#((@TdvX{qo{o?f5kKRaE>|Qqs;aQaU7xljo_=(=13vB)_mya@P`I+ow9+;Vv3ou_DIw z+>sOY;CrIc>Uzcz8eFIq|1rN2PaQbNH&vMb@~+%Npkq2XI5Y!6leB*P&`86~Y`oy( zW$-MbG%CYwH7Z*0ScknMO0yZd^_oBY+AmO`Sw$mZF#ac>MP85?RmzUNbwiE&o8A-C z&00f#I&Qz%F2_$I1X~*$Q-JgVOPpEP1PyNZ-Ud#xm)O=3f+5ge;HYsJ)~Y3vNn#b; zpt72p0^0v|0DtbtkN8_TN+%r4K3V(8l;3!38s7^c&N%k0x#pN`rBQY)GX2{_?xbiP*K^BLI z&_)iIm^b!IGX*3lpwQ$mdPyorBc&%F&;g?jJc0^}i`$_>BNCwBQQPlGca zbcKw=rYh`{%Jy^2Z*EKJ-EIZKD;hgLI!UEHPEWy-5eukQdhs2SAuCCbA zIK+ChF^XHa?KIp+O4TJP@b|>r5EnSMQ^+uX>8X2y<5KkGJMOA_75~rG$<7-$f7RknAw7{x=G3ExE_gu#p0)*HSt3EkZEQV8C%SKMPl4nrPp8x$D=UX}n3 zlq$Kqi#2Y~P`n2NF(?c86WfQ3Q_Y;QK`u8H*JQ=g-xp%DybH zud1}`ZLM)0+vbi2)VM|(voSz8t-)b>d#LnbC|E}!By{As>X&NA#}BljF>E+*pAvUa zE_o7j`|gPuyn}BKQC(6J1E7Ah>+4gKfdW*up+p6o#KT?3*oK98EuNJNb^5&wPUkr^dTt@Dp<0B!P*4ER5^ zQd)?)-?9``aw+BNaX_>MaPIT@tG{o9JA2*1<`~#Z69DlHs!3W7BE>H3Ema}|)Z~qt zxj8G?2lC0}!N`JO5NKZdxW%#=V2|N7HJBDLIBMH|LV6q+l%as=*ar?V+sdmaU>GY8 zPSAwu+N3at0oj{XP@v(aX=HTTu+%)NzhB3p+GKybLs3mjD{3kQ1{(sy1lE>aB@;q} z-re0L>HzjFI~NxrP|$#P+$Oj3USgt+?hkk-A|~4pIPhs{=m)^6-9I?QnA;;&NKi)& z#4_CE57$}$U-fe!ai;{pg}!NW5=VhbOibKfxEAmft_@b-Ks}#coo<8w-SiU>7XG*_ z|3iif0xii@#){ZlP~2r(xTfYSoid32W#GkE3B3Bb9!t@(=g*%%X_PFjarxT)^8OE| zO*nZgigJRf9kgcw)OrRqx(86!t-#-GL73MJY;1i1w%D;|5H{=lG&nd4E{u2p%HgYS z58~yw#=%8ye7r}Hfx;9>CIW(jHVA}Pzi4QwG~i%yh?!SJQ8B}Lye^KOfuRE68I^1Y z^Xh`UykS6#Tjl zI#f_lFj5|nzWZXiaQrZPpbWScY3Z^aVGX-Ki!{$ARydE<+#FgH$Kl}?C=Q7ohGu3x z;7y2cI$UfLuQ&S$Wcq`<@2OziSb>GN6Lf+T0L}N84>1!ElFL7TzHVq>fDM4)xwf@8 z=5vOb*%(NqruBDubI*DD;nxHf4F0NSd*8>n|J-(DA3-T z8LgLq=u3&(19ZfWH3IU(xuc7Ui)|vsHj|t7Lz$w~hQEI8WkWm*lb$`3{K)nDO-)S_ zfhEv`ZbgoE@Fjm3ojlx>K1>15vpC8LaDS0ve*J=R8pikTNd@!(&*0;Rue>78;%Ik7 zP)f>R)eJ&}Jy7Rn<#Ra1n4^{eJ+nEsR#Q_`0c@QbAaZ!kMoIrB$W)B>2E`;OFMo4G zAppGsfpc_!XI*}RjjXA5xcEj}o_2b-6Xu0QV@JE3$uYz#-PaA!>Hr8`tG&!k3*Qmk zIh~Jfwmy`P0;Z>>4x&|DdU|h+Bm6;>k+QS9dnTsq!-rs1&K7WdhoL5Dj0#n5VN3WY zr6e&J^W1@OM;8|oR7gk&3Kfl(4VsuRZ%Ii=NT8vk<6`tMF=2)w7@!HjArli5x804~ zhm3O`GSR8?8IKPSA0mFB%gf6E=3X0HD=}|i2H2t3JKg}66(|p-rlEPnub*d$eM%2V zR??}A*#lTiViOZX-~D<^0rMGJ6ldz%fSrV+bhYsIRww*crXP{A0>04rF)k-k6{pl!m|PbZ4lN1hldTD(5|;{^CQ?+Fom>4 zcnj5c=vnOI($uuZNl9Oy4$xU$779nT?x-6-pLY~du?3hKy$Q$ zthx}b0fL2)%E2gzL>Ne`1|{VzNJQU zc~Q;H)qP>T|BYsUmhGq+iev%Ij-7O=HW?Tk42F5vvQ}cfDaCrNWB$)B`Hqg^*;7c} z3Zilkjl@Qr2|nS?1|RMB9YK+3FxG0VXzi&OBP9qg zsJeYJ+0cZdW@U{AA_j%a)ytQslN%0pwuZ40r`Ld7H2dl?>x}Dq$5sm5cAw(T(m9LZ z>p@%nt{rv4AiQ%~Sy^P7(6OOA8b{1^)y5PSX{T>ZJkB|eQ3_`Z6Sbsv`}09v|*d4T}c4lw}_ zVxF9&OAl2J0l-H)hyp(tqj(q-c#(%|6n3JFL^q5QbU}N_c`Y#_UxdvFZ~|VMnAh6O zC0t5FT2PCnWyZr@emP*jm{!<4agYrKzuQVE6sZ6PXBZDRH(58oq?D9c1hy5StQ#5| zcOn;)WbO@lrjLwu3Mwi)Vq)T;isLLSEc;@R9*9Ofd2$P=&Q?Hgw}XZkgo0S+vQF8SuA=M z4?L3Z$+P#qrxEw097SzGjj<(MvbeZ7(jTalf+8X@zyd3WVcLXV0b)mrCa*QZt(Wuu zh4ur!eX3gat(Ar?)_};Sg9)o1^BbJ7NWQuGZg^QCz%S;B_bHUNa%to4IplSNe{OHO zTr!J{n`M?rS3ZEMBv39E$XvAUG1r@(JUW<6#ai9Ek{kd1#}A-gbGFEqnANv}qF~J% zx|3>NYL6s{j?T{XXpfn8atx5|U>&*v>8amBZgR;mHE}!ccp$QBE9O;JCLH`uZn9C! zj=L?%>;;`y@%r_-mixkHb7R=K*iwCM5 zQJ=e%{Ax3yAO@4ff9klMc&f3Bi!j^1*pC2cD`wR0m`}2Z#mCmRwp8U;mH^6j0>kH^ z=RTl_aEyEV>wTk;HKynl+Cbs(Qm^#nsqq!prdmd8Cx~K{fnzd^>wPexaAG)oh^G8s zJseA}^UlGVf71C4-`yaD7599C)n zx=#&85g9T-00QshJ~-YpZQ1 zv-9)qtw=ybx3RyNrvSf>H4r4Be!uETn~n}v+@bNas;lYYt+(|(+>`()OExSMXQW+- zkaZCtiyPLV^K^ z_cQ1Y0u;t&95yrpgMyBYdyP4xVBJRc8!l!KutVi{(@wAJ>bHbzGqp_zLfo__mXN`j zZ=88bJ+lQ;63iAN;MvCk8sr1JB>i~&{Mt4hpLS+W4$=8^Dw8)1@Ci)F`JX>qch={K z=Y||4_qSlOIygG2T)Kp}XXk`}XQj3n?5$taw7C95TrU57BQe-ijB*U0Y?eJTLGr>F~k!{7^Vi)*|3mq zY_D&^t_s3TgjiX2Z_%*Ww3Z60x5<`|xI#32B>_^s=I7hM>bLa^n{l|oS5;NTj=?Yl zztISLkAbX&(+F<>2AJme*1(}jD0D_W)Ov6AHsH&-PN=qAwa-~2=fanu6 zE<=6&`W3<5t&V&2X^mfmyM^I0IK~(A5ik}Vd%F__20nid5i+gO+{mR??kpQPPmD~o t|0}8Or~QlW`cG3j*oONL^XK&=f{s^723O;if1}{z@+EE65@pMv{{nFt_ay)T literal 0 HcmV?d00001 diff --git a/vocab.json b/vocab.json new file mode 100644 index 0000000..6c49fc6 --- /dev/null +++ b/vocab.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca10d7e9fb3ed18575dd1e277a2579c16d108e32f27439684afa0e10b1440910 +size 2776833