Files
a1-codeelo/trainer_state.json
ModelHub XC 44ea31a28b 初始化项目,由ModelHub XC社区提供模型
Model: DCAgent/a1-codeelo
Source: Original Platform
2026-05-03 22:43:55 +08:00

9255 lines
256 KiB
JSON

{
"best_global_step": null,
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 7.0,
"eval_steps": 500,
"global_step": 4186,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.012626262626262626,
"grad_norm": 8.8502213152326,
"learning_rate": 5.755395683453238e-07,
"loss": 0.9749,
"loss_nan_ranks": 0,
"loss_rank_avg": 1.0252163410186768,
"step": 5,
"valid_targets_mean": 3810.4,
"valid_targets_min": 1456
},
{
"epoch": 0.025252525252525252,
"grad_norm": 7.0326382192271595,
"learning_rate": 1.2949640287769785e-06,
"loss": 0.97,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.8746949434280396,
"step": 10,
"valid_targets_mean": 4736.2,
"valid_targets_min": 1766
},
{
"epoch": 0.03787878787878788,
"grad_norm": 6.6940046336920975,
"learning_rate": 2.0143884892086333e-06,
"loss": 0.9064,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.8456529378890991,
"step": 15,
"valid_targets_mean": 3504.3,
"valid_targets_min": 638
},
{
"epoch": 0.050505050505050504,
"grad_norm": 7.365976748970077,
"learning_rate": 2.733812949640288e-06,
"loss": 0.8841,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.9217684268951416,
"step": 20,
"valid_targets_mean": 2712.1,
"valid_targets_min": 1633
},
{
"epoch": 0.06313131313131314,
"grad_norm": 4.630647013342811,
"learning_rate": 3.453237410071943e-06,
"loss": 0.8408,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.7999893426895142,
"step": 25,
"valid_targets_mean": 2972.6,
"valid_targets_min": 1862
},
{
"epoch": 0.07575757575757576,
"grad_norm": 2.9138235176363723,
"learning_rate": 4.172661870503597e-06,
"loss": 0.7736,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.7608543634414673,
"step": 30,
"valid_targets_mean": 3347.9,
"valid_targets_min": 1252
},
{
"epoch": 0.08838383838383838,
"grad_norm": 1.7558069634979983,
"learning_rate": 4.892086330935253e-06,
"loss": 0.7821,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.826799750328064,
"step": 35,
"valid_targets_mean": 4368.2,
"valid_targets_min": 591
},
{
"epoch": 0.10101010101010101,
"grad_norm": 1.7134790575388017,
"learning_rate": 5.611510791366906e-06,
"loss": 0.7603,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.8243893384933472,
"step": 40,
"valid_targets_mean": 3075.2,
"valid_targets_min": 596
},
{
"epoch": 0.11363636363636363,
"grad_norm": 1.2388060565695977,
"learning_rate": 6.330935251798561e-06,
"loss": 0.6669,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6428935527801514,
"step": 45,
"valid_targets_mean": 3558.9,
"valid_targets_min": 1264
},
{
"epoch": 0.12626262626262627,
"grad_norm": 1.0686895415900157,
"learning_rate": 7.050359712230216e-06,
"loss": 0.6699,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6036921143531799,
"step": 50,
"valid_targets_mean": 2548.7,
"valid_targets_min": 1499
},
{
"epoch": 0.1388888888888889,
"grad_norm": 0.8408313638128855,
"learning_rate": 7.769784172661872e-06,
"loss": 0.6825,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6488921642303467,
"step": 55,
"valid_targets_mean": 3712.4,
"valid_targets_min": 741
},
{
"epoch": 0.15151515151515152,
"grad_norm": 0.8793404803472428,
"learning_rate": 8.489208633093526e-06,
"loss": 0.6406,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5900353193283081,
"step": 60,
"valid_targets_mean": 2931.1,
"valid_targets_min": 1889
},
{
"epoch": 0.16414141414141414,
"grad_norm": 0.9233082070664455,
"learning_rate": 9.20863309352518e-06,
"loss": 0.6118,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6843211650848389,
"step": 65,
"valid_targets_mean": 2688.2,
"valid_targets_min": 587
},
{
"epoch": 0.17676767676767677,
"grad_norm": 0.7695618266666612,
"learning_rate": 9.928057553956835e-06,
"loss": 0.5512,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5856298208236694,
"step": 70,
"valid_targets_mean": 2935.6,
"valid_targets_min": 750
},
{
"epoch": 0.1893939393939394,
"grad_norm": 0.7101539830507525,
"learning_rate": 1.0647482014388491e-05,
"loss": 0.5928,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.602681577205658,
"step": 75,
"valid_targets_mean": 3589.7,
"valid_targets_min": 741
},
{
"epoch": 0.20202020202020202,
"grad_norm": 0.6757736826618855,
"learning_rate": 1.1366906474820146e-05,
"loss": 0.5919,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5044267177581787,
"step": 80,
"valid_targets_mean": 3180.0,
"valid_targets_min": 1420
},
{
"epoch": 0.21464646464646464,
"grad_norm": 0.7052512337384288,
"learning_rate": 1.20863309352518e-05,
"loss": 0.5713,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.546467661857605,
"step": 85,
"valid_targets_mean": 2828.8,
"valid_targets_min": 1071
},
{
"epoch": 0.22727272727272727,
"grad_norm": 0.8245207595088883,
"learning_rate": 1.2805755395683454e-05,
"loss": 0.5641,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.605029284954071,
"step": 90,
"valid_targets_mean": 2803.2,
"valid_targets_min": 643
},
{
"epoch": 0.2398989898989899,
"grad_norm": 0.7141934894188182,
"learning_rate": 1.3525179856115109e-05,
"loss": 0.5706,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5871100425720215,
"step": 95,
"valid_targets_mean": 3075.2,
"valid_targets_min": 1141
},
{
"epoch": 0.25252525252525254,
"grad_norm": 0.7508217175713096,
"learning_rate": 1.4244604316546765e-05,
"loss": 0.5615,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5834653973579407,
"step": 100,
"valid_targets_mean": 3024.4,
"valid_targets_min": 1610
},
{
"epoch": 0.26515151515151514,
"grad_norm": 0.6869296589904229,
"learning_rate": 1.496402877697842e-05,
"loss": 0.5107,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5773706436157227,
"step": 105,
"valid_targets_mean": 3346.2,
"valid_targets_min": 465
},
{
"epoch": 0.2777777777777778,
"grad_norm": 0.6649670199118626,
"learning_rate": 1.5683453237410072e-05,
"loss": 0.6192,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5906274318695068,
"step": 110,
"valid_targets_mean": 4020.4,
"valid_targets_min": 1802
},
{
"epoch": 0.2904040404040404,
"grad_norm": 0.749817497328354,
"learning_rate": 1.640287769784173e-05,
"loss": 0.542,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6468950510025024,
"step": 115,
"valid_targets_mean": 3753.2,
"valid_targets_min": 550
},
{
"epoch": 0.30303030303030304,
"grad_norm": 0.6555186253660183,
"learning_rate": 1.7122302158273384e-05,
"loss": 0.5134,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5901004076004028,
"step": 120,
"valid_targets_mean": 4881.6,
"valid_targets_min": 1494
},
{
"epoch": 0.31565656565656564,
"grad_norm": 0.7273014966297405,
"learning_rate": 1.784172661870504e-05,
"loss": 0.5702,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5654794573783875,
"step": 125,
"valid_targets_mean": 3368.1,
"valid_targets_min": 1521
},
{
"epoch": 0.3282828282828283,
"grad_norm": 0.7586180547020986,
"learning_rate": 1.8561151079136693e-05,
"loss": 0.5293,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.41630545258522034,
"step": 130,
"valid_targets_mean": 3200.5,
"valid_targets_min": 1661
},
{
"epoch": 0.3409090909090909,
"grad_norm": 0.7688770234195088,
"learning_rate": 1.9280575539568347e-05,
"loss": 0.5299,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5642590522766113,
"step": 135,
"valid_targets_mean": 3158.9,
"valid_targets_min": 799
},
{
"epoch": 0.35353535353535354,
"grad_norm": 0.8258141160820167,
"learning_rate": 2e-05,
"loss": 0.4706,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.43767279386520386,
"step": 140,
"valid_targets_mean": 2534.0,
"valid_targets_min": 527
},
{
"epoch": 0.3661616161616162,
"grad_norm": 0.6638208230368448,
"learning_rate": 2.0719424460431656e-05,
"loss": 0.5226,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5216605067253113,
"step": 145,
"valid_targets_mean": 3478.1,
"valid_targets_min": 1455
},
{
"epoch": 0.3787878787878788,
"grad_norm": 0.6659508828600877,
"learning_rate": 2.143884892086331e-05,
"loss": 0.5054,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.46430742740631104,
"step": 150,
"valid_targets_mean": 3356.1,
"valid_targets_min": 1804
},
{
"epoch": 0.39141414141414144,
"grad_norm": 0.6857469917039041,
"learning_rate": 2.2158273381294965e-05,
"loss": 0.4803,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.46997326612472534,
"step": 155,
"valid_targets_mean": 3069.1,
"valid_targets_min": 712
},
{
"epoch": 0.40404040404040403,
"grad_norm": 0.7497478551719995,
"learning_rate": 2.287769784172662e-05,
"loss": 0.5096,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5357323884963989,
"step": 160,
"valid_targets_mean": 2978.5,
"valid_targets_min": 978
},
{
"epoch": 0.4166666666666667,
"grad_norm": 0.6266767386519286,
"learning_rate": 2.3597122302158274e-05,
"loss": 0.4854,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.49465256929397583,
"step": 165,
"valid_targets_mean": 4385.0,
"valid_targets_min": 1146
},
{
"epoch": 0.4292929292929293,
"grad_norm": 0.7198305240954321,
"learning_rate": 2.431654676258993e-05,
"loss": 0.5133,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4758256673812866,
"step": 170,
"valid_targets_mean": 3358.2,
"valid_targets_min": 1265
},
{
"epoch": 0.44191919191919193,
"grad_norm": 0.744564295446295,
"learning_rate": 2.5035971223021586e-05,
"loss": 0.4285,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4645718038082123,
"step": 175,
"valid_targets_mean": 3257.9,
"valid_targets_min": 713
},
{
"epoch": 0.45454545454545453,
"grad_norm": 0.741277701622229,
"learning_rate": 2.575539568345324e-05,
"loss": 0.4867,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5038046836853027,
"step": 180,
"valid_targets_mean": 3023.1,
"valid_targets_min": 696
},
{
"epoch": 0.4671717171717172,
"grad_norm": 0.7440421968116456,
"learning_rate": 2.6474820143884895e-05,
"loss": 0.5095,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.570155918598175,
"step": 185,
"valid_targets_mean": 3422.4,
"valid_targets_min": 949
},
{
"epoch": 0.4797979797979798,
"grad_norm": 0.8024642384967607,
"learning_rate": 2.719424460431655e-05,
"loss": 0.4493,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5823109149932861,
"step": 190,
"valid_targets_mean": 2894.9,
"valid_targets_min": 1061
},
{
"epoch": 0.49242424242424243,
"grad_norm": 0.7498359662712905,
"learning_rate": 2.7913669064748203e-05,
"loss": 0.5014,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5892109870910645,
"step": 195,
"valid_targets_mean": 3757.8,
"valid_targets_min": 1305
},
{
"epoch": 0.5050505050505051,
"grad_norm": 0.6969972771455335,
"learning_rate": 2.8633093525179858e-05,
"loss": 0.4966,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4585283696651459,
"step": 200,
"valid_targets_mean": 3301.2,
"valid_targets_min": 1200
},
{
"epoch": 0.5176767676767676,
"grad_norm": 0.7428922534210859,
"learning_rate": 2.9352517985611512e-05,
"loss": 0.4873,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35433435440063477,
"step": 205,
"valid_targets_mean": 2534.4,
"valid_targets_min": 1051
},
{
"epoch": 0.5303030303030303,
"grad_norm": 0.7952927627365796,
"learning_rate": 3.0071942446043167e-05,
"loss": 0.4483,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3344321846961975,
"step": 210,
"valid_targets_mean": 2273.5,
"valid_targets_min": 764
},
{
"epoch": 0.5429292929292929,
"grad_norm": 0.7452719253142043,
"learning_rate": 3.0791366906474824e-05,
"loss": 0.4887,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4398002624511719,
"step": 215,
"valid_targets_mean": 2894.6,
"valid_targets_min": 1774
},
{
"epoch": 0.5555555555555556,
"grad_norm": 0.793089120317565,
"learning_rate": 3.1510791366906475e-05,
"loss": 0.4446,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3552176058292389,
"step": 220,
"valid_targets_mean": 2370.2,
"valid_targets_min": 988
},
{
"epoch": 0.5681818181818182,
"grad_norm": 0.6957948039355799,
"learning_rate": 3.223021582733813e-05,
"loss": 0.4677,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4744777977466583,
"step": 225,
"valid_targets_mean": 3270.9,
"valid_targets_min": 908
},
{
"epoch": 0.5808080808080808,
"grad_norm": 0.9598066573051235,
"learning_rate": 3.2949640287769784e-05,
"loss": 0.4678,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.53702712059021,
"step": 230,
"valid_targets_mean": 3305.6,
"valid_targets_min": 1465
},
{
"epoch": 0.5934343434343434,
"grad_norm": 0.7385990473183633,
"learning_rate": 3.366906474820144e-05,
"loss": 0.4269,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4913618564605713,
"step": 235,
"valid_targets_mean": 3022.6,
"valid_targets_min": 1359
},
{
"epoch": 0.6060606060606061,
"grad_norm": 0.8954334270151011,
"learning_rate": 3.438848920863309e-05,
"loss": 0.4773,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4261593222618103,
"step": 240,
"valid_targets_mean": 3027.9,
"valid_targets_min": 780
},
{
"epoch": 0.6186868686868687,
"grad_norm": 0.7460534615902407,
"learning_rate": 3.510791366906475e-05,
"loss": 0.4695,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5014075040817261,
"step": 245,
"valid_targets_mean": 3182.8,
"valid_targets_min": 1704
},
{
"epoch": 0.6313131313131313,
"grad_norm": 0.7476045212031468,
"learning_rate": 3.582733812949641e-05,
"loss": 0.4897,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5569243431091309,
"step": 250,
"valid_targets_mean": 4160.6,
"valid_targets_min": 1184
},
{
"epoch": 0.6439393939393939,
"grad_norm": 0.7290825841839375,
"learning_rate": 3.654676258992806e-05,
"loss": 0.5141,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5026414394378662,
"step": 255,
"valid_targets_mean": 3161.4,
"valid_targets_min": 710
},
{
"epoch": 0.6565656565656566,
"grad_norm": 0.7490321855827192,
"learning_rate": 3.726618705035972e-05,
"loss": 0.5036,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.46991053223609924,
"step": 260,
"valid_targets_mean": 2653.6,
"valid_targets_min": 647
},
{
"epoch": 0.6691919191919192,
"grad_norm": 0.739603256968017,
"learning_rate": 3.798561151079137e-05,
"loss": 0.4898,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4988292157649994,
"step": 265,
"valid_targets_mean": 3293.9,
"valid_targets_min": 1137
},
{
"epoch": 0.6818181818181818,
"grad_norm": 0.8025519110811695,
"learning_rate": 3.8705035971223026e-05,
"loss": 0.5011,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5377944707870483,
"step": 270,
"valid_targets_mean": 3180.2,
"valid_targets_min": 1127
},
{
"epoch": 0.6944444444444444,
"grad_norm": 0.7900087471325877,
"learning_rate": 3.942446043165468e-05,
"loss": 0.4673,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5039912462234497,
"step": 275,
"valid_targets_mean": 2830.6,
"valid_targets_min": 1799
},
{
"epoch": 0.7070707070707071,
"grad_norm": 0.7659391333417415,
"learning_rate": 3.999998413256274e-05,
"loss": 0.5003,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4912080764770508,
"step": 280,
"valid_targets_mean": 3327.0,
"valid_targets_min": 790
},
{
"epoch": 0.7196969696969697,
"grad_norm": 0.694845702448467,
"learning_rate": 3.9999428774902425e-05,
"loss": 0.4588,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5030688643455505,
"step": 285,
"valid_targets_mean": 3079.2,
"valid_targets_min": 1122
},
{
"epoch": 0.7323232323232324,
"grad_norm": 0.7144245421458943,
"learning_rate": 3.999808007055667e-05,
"loss": 0.4796,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5815045237541199,
"step": 290,
"valid_targets_mean": 4749.9,
"valid_targets_min": 880
},
{
"epoch": 0.7449494949494949,
"grad_norm": 0.8137606805905706,
"learning_rate": 3.999593807302654e-05,
"loss": 0.4778,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3889826536178589,
"step": 295,
"valid_targets_mean": 2409.6,
"valid_targets_min": 1216
},
{
"epoch": 0.7575757575757576,
"grad_norm": 0.7671755034689156,
"learning_rate": 3.999300286728176e-05,
"loss": 0.4424,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.40401798486709595,
"step": 300,
"valid_targets_mean": 2374.2,
"valid_targets_min": 412
},
{
"epoch": 0.7702020202020202,
"grad_norm": 0.775435011663138,
"learning_rate": 3.9989274569757467e-05,
"loss": 0.4529,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5113080143928528,
"step": 305,
"valid_targets_mean": 3065.1,
"valid_targets_min": 872
},
{
"epoch": 0.7828282828282829,
"grad_norm": 0.7829159491303057,
"learning_rate": 3.99847533283495e-05,
"loss": 0.4483,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4134717285633087,
"step": 310,
"valid_targets_mean": 2551.4,
"valid_targets_min": 511
},
{
"epoch": 0.7954545454545454,
"grad_norm": 0.70594805762661,
"learning_rate": 3.9979439322408575e-05,
"loss": 0.4722,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5452604293823242,
"step": 315,
"valid_targets_mean": 4207.9,
"valid_targets_min": 782
},
{
"epoch": 0.8080808080808081,
"grad_norm": 0.741059134063674,
"learning_rate": 3.9973332762733165e-05,
"loss": 0.4703,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.523596465587616,
"step": 320,
"valid_targets_mean": 3050.4,
"valid_targets_min": 1682
},
{
"epoch": 0.8207070707070707,
"grad_norm": 0.646169301673137,
"learning_rate": 3.996643389156114e-05,
"loss": 0.4531,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4629998803138733,
"step": 325,
"valid_targets_mean": 3761.1,
"valid_targets_min": 1341
},
{
"epoch": 0.8333333333333334,
"grad_norm": 0.7311851901523451,
"learning_rate": 3.995874298256014e-05,
"loss": 0.4769,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.49332910776138306,
"step": 330,
"valid_targets_mean": 3003.4,
"valid_targets_min": 1840
},
{
"epoch": 0.8459595959595959,
"grad_norm": 0.684697792793549,
"learning_rate": 3.9950260340816723e-05,
"loss": 0.4772,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.476440966129303,
"step": 335,
"valid_targets_mean": 3521.4,
"valid_targets_min": 1763
},
{
"epoch": 0.8585858585858586,
"grad_norm": 0.7235672828868595,
"learning_rate": 3.9940986302824305e-05,
"loss": 0.4573,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4808931350708008,
"step": 340,
"valid_targets_mean": 3157.8,
"valid_targets_min": 1116
},
{
"epoch": 0.8712121212121212,
"grad_norm": 0.618583293178677,
"learning_rate": 3.993092123646975e-05,
"loss": 0.4419,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4222564101219177,
"step": 345,
"valid_targets_mean": 3462.4,
"valid_targets_min": 1697
},
{
"epoch": 0.8838383838383839,
"grad_norm": 0.9731914681849075,
"learning_rate": 3.992006554101881e-05,
"loss": 0.4431,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4798777997493744,
"step": 350,
"valid_targets_mean": 2746.6,
"valid_targets_min": 674
},
{
"epoch": 0.8964646464646465,
"grad_norm": 0.6711603679996875,
"learning_rate": 3.99084196471003e-05,
"loss": 0.4315,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39052852988243103,
"step": 355,
"valid_targets_mean": 2697.2,
"valid_targets_min": 467
},
{
"epoch": 0.9090909090909091,
"grad_norm": 0.6756824530106742,
"learning_rate": 3.9895984016688956e-05,
"loss": 0.4208,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4884558618068695,
"step": 360,
"valid_targets_mean": 3316.8,
"valid_targets_min": 1433
},
{
"epoch": 0.9217171717171717,
"grad_norm": 0.6730754745335135,
"learning_rate": 3.9882759143087194e-05,
"loss": 0.4558,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4529365003108978,
"step": 365,
"valid_targets_mean": 2792.6,
"valid_targets_min": 1934
},
{
"epoch": 0.9343434343434344,
"grad_norm": 0.7396239570533569,
"learning_rate": 3.9868745550905475e-05,
"loss": 0.4806,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.48611992597579956,
"step": 370,
"valid_targets_mean": 3224.1,
"valid_targets_min": 1756
},
{
"epoch": 0.946969696969697,
"grad_norm": 0.5859949295622379,
"learning_rate": 3.985394379604152e-05,
"loss": 0.4543,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4721411466598511,
"step": 375,
"valid_targets_mean": 4448.3,
"valid_targets_min": 1472
},
{
"epoch": 0.9595959595959596,
"grad_norm": 0.6661047355223618,
"learning_rate": 3.983835446565826e-05,
"loss": 0.4424,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.49498146772384644,
"step": 380,
"valid_targets_mean": 3239.3,
"valid_targets_min": 479
},
{
"epoch": 0.9722222222222222,
"grad_norm": 0.5805898239548394,
"learning_rate": 3.982197817816054e-05,
"loss": 0.4422,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38239431381225586,
"step": 385,
"valid_targets_mean": 3780.7,
"valid_targets_min": 779
},
{
"epoch": 0.9848484848484849,
"grad_norm": 0.7798921127063227,
"learning_rate": 3.980481558317057e-05,
"loss": 0.4662,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5424267053604126,
"step": 390,
"valid_targets_mean": 3867.1,
"valid_targets_min": 632
},
{
"epoch": 0.9974747474747475,
"grad_norm": 0.6339986265381534,
"learning_rate": 3.978686736150221e-05,
"loss": 0.4535,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.47920912504196167,
"step": 395,
"valid_targets_mean": 3606.8,
"valid_targets_min": 1028
},
{
"epoch": 1.0101010101010102,
"grad_norm": 0.6706130776528586,
"learning_rate": 3.976813422513388e-05,
"loss": 0.437,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4376629590988159,
"step": 400,
"valid_targets_mean": 3430.6,
"valid_targets_min": 1860
},
{
"epoch": 1.0227272727272727,
"grad_norm": 0.6708127261682855,
"learning_rate": 3.9748616917180406e-05,
"loss": 0.3809,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3455820381641388,
"step": 405,
"valid_targets_mean": 2637.0,
"valid_targets_min": 580
},
{
"epoch": 1.0353535353535352,
"grad_norm": 0.7742495725599213,
"learning_rate": 3.972831621186345e-05,
"loss": 0.417,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3599938154220581,
"step": 410,
"valid_targets_mean": 2649.8,
"valid_targets_min": 1327
},
{
"epoch": 1.047979797979798,
"grad_norm": 0.6102251044562367,
"learning_rate": 3.970723291448092e-05,
"loss": 0.4354,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.445651650428772,
"step": 415,
"valid_targets_mean": 4083.1,
"valid_targets_min": 1361
},
{
"epoch": 1.0606060606060606,
"grad_norm": 0.6976342123087943,
"learning_rate": 3.968536786137487e-05,
"loss": 0.4382,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.40597984194755554,
"step": 420,
"valid_targets_mean": 2881.2,
"valid_targets_min": 1527
},
{
"epoch": 1.0732323232323233,
"grad_norm": 0.8976764193372789,
"learning_rate": 3.966272191989847e-05,
"loss": 0.4593,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5112510323524475,
"step": 425,
"valid_targets_mean": 3042.1,
"valid_targets_min": 506
},
{
"epoch": 1.0858585858585859,
"grad_norm": 0.7365732301930217,
"learning_rate": 3.963929598838149e-05,
"loss": 0.4145,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.43491220474243164,
"step": 430,
"valid_targets_mean": 2794.9,
"valid_targets_min": 1679
},
{
"epoch": 1.0984848484848484,
"grad_norm": 0.6773959614029044,
"learning_rate": 3.9615090996094726e-05,
"loss": 0.4226,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5162553787231445,
"step": 435,
"valid_targets_mean": 4462.0,
"valid_targets_min": 509
},
{
"epoch": 1.1111111111111112,
"grad_norm": 0.5970043671496138,
"learning_rate": 3.959010790321313e-05,
"loss": 0.4334,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33793818950653076,
"step": 440,
"valid_targets_mean": 3196.2,
"valid_targets_min": 1361
},
{
"epoch": 1.1237373737373737,
"grad_norm": 0.7763112041835692,
"learning_rate": 3.9564347700777705e-05,
"loss": 0.4279,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4716646075248718,
"step": 445,
"valid_targets_mean": 2790.6,
"valid_targets_min": 596
},
{
"epoch": 1.1363636363636362,
"grad_norm": 0.7191861233677,
"learning_rate": 3.953781141065619e-05,
"loss": 0.4571,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4991220235824585,
"step": 450,
"valid_targets_mean": 2805.2,
"valid_targets_min": 1500
},
{
"epoch": 1.148989898989899,
"grad_norm": 0.6931761780564214,
"learning_rate": 3.9510500085502556e-05,
"loss": 0.403,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3412482738494873,
"step": 455,
"valid_targets_mean": 2871.2,
"valid_targets_min": 1064
},
{
"epoch": 1.1616161616161615,
"grad_norm": 0.5776459149074374,
"learning_rate": 3.9482414808715194e-05,
"loss": 0.4203,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4245602786540985,
"step": 460,
"valid_targets_mean": 4715.2,
"valid_targets_min": 808
},
{
"epoch": 1.1742424242424243,
"grad_norm": 0.6555627012964024,
"learning_rate": 3.945355669439399e-05,
"loss": 0.4475,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.44374722242355347,
"step": 465,
"valid_targets_mean": 3508.2,
"valid_targets_min": 882
},
{
"epoch": 1.1868686868686869,
"grad_norm": 1.2615252581904304,
"learning_rate": 3.9423926887296114e-05,
"loss": 0.4471,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4283289909362793,
"step": 470,
"valid_targets_mean": 3297.8,
"valid_targets_min": 1445
},
{
"epoch": 1.1994949494949494,
"grad_norm": 0.7227367427497255,
"learning_rate": 3.939352656279059e-05,
"loss": 0.4105,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4885120689868927,
"step": 475,
"valid_targets_mean": 3030.8,
"valid_targets_min": 1180
},
{
"epoch": 1.2121212121212122,
"grad_norm": 0.7171565868676774,
"learning_rate": 3.93623569268117e-05,
"loss": 0.4334,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37661659717559814,
"step": 480,
"valid_targets_mean": 2516.6,
"valid_targets_min": 935
},
{
"epoch": 1.2247474747474747,
"grad_norm": 0.6709298722578017,
"learning_rate": 3.933041921581113e-05,
"loss": 0.4524,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4951278269290924,
"step": 485,
"valid_targets_mean": 3910.1,
"valid_targets_min": 1281
},
{
"epoch": 1.2373737373737375,
"grad_norm": 0.6284344251816701,
"learning_rate": 3.929771469670892e-05,
"loss": 0.4364,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4901544451713562,
"step": 490,
"valid_targets_mean": 5372.7,
"valid_targets_min": 863
},
{
"epoch": 1.25,
"grad_norm": 0.695150714261409,
"learning_rate": 3.926424466684321e-05,
"loss": 0.4036,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3937031328678131,
"step": 495,
"valid_targets_mean": 2620.4,
"valid_targets_min": 1061
},
{
"epoch": 1.2626262626262625,
"grad_norm": 0.5659681496879514,
"learning_rate": 3.92300104539188e-05,
"loss": 0.4347,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.43232929706573486,
"step": 500,
"valid_targets_mean": 4517.9,
"valid_targets_min": 1356
},
{
"epoch": 1.2752525252525253,
"grad_norm": 0.6499437965902374,
"learning_rate": 3.919501341595442e-05,
"loss": 0.4463,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4581197500228882,
"step": 505,
"valid_targets_mean": 3634.6,
"valid_targets_min": 1176
},
{
"epoch": 1.2878787878787878,
"grad_norm": 0.5715005441806082,
"learning_rate": 3.9159254941228944e-05,
"loss": 0.4015,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3313661217689514,
"step": 510,
"valid_targets_mean": 3508.3,
"valid_targets_min": 1355
},
{
"epoch": 1.3005050505050506,
"grad_norm": 0.7308800974579575,
"learning_rate": 3.912273644822625e-05,
"loss": 0.4295,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4216563105583191,
"step": 515,
"valid_targets_mean": 2695.7,
"valid_targets_min": 1010
},
{
"epoch": 1.3131313131313131,
"grad_norm": 0.6837093491179472,
"learning_rate": 3.9085459385578984e-05,
"loss": 0.3947,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4423089027404785,
"step": 520,
"valid_targets_mean": 2883.6,
"valid_targets_min": 710
},
{
"epoch": 1.3257575757575757,
"grad_norm": 0.6554872754713126,
"learning_rate": 3.9047425232011076e-05,
"loss": 0.3826,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3657465875148773,
"step": 525,
"valid_targets_mean": 3170.8,
"valid_targets_min": 1136
},
{
"epoch": 1.3383838383838385,
"grad_norm": 0.6685453762625018,
"learning_rate": 3.900863549627911e-05,
"loss": 0.428,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4607548713684082,
"step": 530,
"valid_targets_mean": 3880.3,
"valid_targets_min": 1232
},
{
"epoch": 1.351010101010101,
"grad_norm": 0.6443269502166363,
"learning_rate": 3.896909171711245e-05,
"loss": 0.4348,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4501422941684723,
"step": 535,
"valid_targets_mean": 3417.6,
"valid_targets_min": 1573
},
{
"epoch": 1.3636363636363638,
"grad_norm": 0.6126406593256342,
"learning_rate": 3.8928795463152186e-05,
"loss": 0.3799,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3543352782726288,
"step": 540,
"valid_targets_mean": 3163.1,
"valid_targets_min": 1501
},
{
"epoch": 1.3762626262626263,
"grad_norm": 0.6881727131350188,
"learning_rate": 3.888774833288898e-05,
"loss": 0.4257,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4091816842556,
"step": 545,
"valid_targets_mean": 3140.7,
"valid_targets_min": 1252
},
{
"epoch": 1.3888888888888888,
"grad_norm": 0.6580723165353671,
"learning_rate": 3.8845951954599545e-05,
"loss": 0.3958,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3906816244125366,
"step": 550,
"valid_targets_mean": 2895.7,
"valid_targets_min": 1240
},
{
"epoch": 1.4015151515151514,
"grad_norm": 0.6770136577009271,
"learning_rate": 3.8803407986282156e-05,
"loss": 0.4221,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35806700587272644,
"step": 555,
"valid_targets_mean": 2287.6,
"valid_targets_min": 594
},
{
"epoch": 1.4141414141414141,
"grad_norm": 0.6405715120436977,
"learning_rate": 3.876011811559084e-05,
"loss": 0.4279,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4252093434333801,
"step": 560,
"valid_targets_mean": 3118.0,
"valid_targets_min": 707
},
{
"epoch": 1.4267676767676767,
"grad_norm": 0.6944966556141179,
"learning_rate": 3.871608405976838e-05,
"loss": 0.4115,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.42029836773872375,
"step": 565,
"valid_targets_mean": 2919.8,
"valid_targets_min": 1070
},
{
"epoch": 1.4393939393939394,
"grad_norm": 0.6466971885955511,
"learning_rate": 3.867130756557832e-05,
"loss": 0.4312,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3371127247810364,
"step": 570,
"valid_targets_mean": 2752.6,
"valid_targets_min": 750
},
{
"epoch": 1.452020202020202,
"grad_norm": 0.6100566892783015,
"learning_rate": 3.862579040923552e-05,
"loss": 0.3838,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3892483115196228,
"step": 575,
"valid_targets_mean": 3388.8,
"valid_targets_min": 968
},
{
"epoch": 1.4646464646464645,
"grad_norm": 0.6600534442172271,
"learning_rate": 3.8579534396335835e-05,
"loss": 0.412,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.46965640783309937,
"step": 580,
"valid_targets_mean": 3274.4,
"valid_targets_min": 685
},
{
"epoch": 1.4772727272727273,
"grad_norm": 0.6946470349793337,
"learning_rate": 3.853254136178437e-05,
"loss": 0.4195,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4128877818584442,
"step": 585,
"valid_targets_mean": 2874.7,
"valid_targets_min": 1690
},
{
"epoch": 1.4898989898989898,
"grad_norm": 0.658007836439284,
"learning_rate": 3.8484813169722794e-05,
"loss": 0.4202,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4265574812889099,
"step": 590,
"valid_targets_mean": 2866.8,
"valid_targets_min": 1791
},
{
"epoch": 1.5025252525252526,
"grad_norm": 0.7613954671864829,
"learning_rate": 3.843635171345532e-05,
"loss": 0.4369,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.44407981634140015,
"step": 595,
"valid_targets_mean": 3021.1,
"valid_targets_min": 638
},
{
"epoch": 1.5151515151515151,
"grad_norm": 0.7625903826308273,
"learning_rate": 3.838715891537365e-05,
"loss": 0.3805,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34579938650131226,
"step": 600,
"valid_targets_mean": 2343.3,
"valid_targets_min": 844
},
{
"epoch": 1.5277777777777777,
"grad_norm": 0.6482084611263487,
"learning_rate": 3.8337236726880674e-05,
"loss": 0.441,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.41672322154045105,
"step": 605,
"valid_targets_mean": 2920.0,
"valid_targets_min": 1776
},
{
"epoch": 1.5404040404040404,
"grad_norm": 0.6065329237085881,
"learning_rate": 3.828658712831311e-05,
"loss": 0.398,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3971773386001587,
"step": 610,
"valid_targets_mean": 3118.1,
"valid_targets_min": 1473
},
{
"epoch": 1.553030303030303,
"grad_norm": 0.6544115401255524,
"learning_rate": 3.823521212886287e-05,
"loss": 0.441,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.45314595103263855,
"step": 615,
"valid_targets_mean": 3466.2,
"valid_targets_min": 377
},
{
"epoch": 1.5656565656565657,
"grad_norm": 0.7218840612228915,
"learning_rate": 3.818311376649746e-05,
"loss": 0.3962,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.40665388107299805,
"step": 620,
"valid_targets_mean": 3132.6,
"valid_targets_min": 1208
},
{
"epoch": 1.5782828282828283,
"grad_norm": 0.6457705553977882,
"learning_rate": 3.813029410787906e-05,
"loss": 0.4014,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4007648229598999,
"step": 625,
"valid_targets_mean": 3385.1,
"valid_targets_min": 1276
},
{
"epoch": 1.5909090909090908,
"grad_norm": 0.6340707674027326,
"learning_rate": 3.807675524828255e-05,
"loss": 0.3921,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3663696050643921,
"step": 630,
"valid_targets_mean": 2994.5,
"valid_targets_min": 1839
},
{
"epoch": 1.6035353535353534,
"grad_norm": 0.6510799288150312,
"learning_rate": 3.802249931151245e-05,
"loss": 0.4083,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4528045356273651,
"step": 635,
"valid_targets_mean": 3057.3,
"valid_targets_min": 724
},
{
"epoch": 1.6161616161616161,
"grad_norm": 0.7096957049322412,
"learning_rate": 3.7967528449818604e-05,
"loss": 0.4129,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3862096667289734,
"step": 640,
"valid_targets_mean": 2390.7,
"valid_targets_min": 556
},
{
"epoch": 1.628787878787879,
"grad_norm": 0.7345826232266963,
"learning_rate": 3.791184484381083e-05,
"loss": 0.433,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3896709382534027,
"step": 645,
"valid_targets_mean": 2601.5,
"valid_targets_min": 782
},
{
"epoch": 1.6414141414141414,
"grad_norm": 0.6381339146897167,
"learning_rate": 3.7855450702372446e-05,
"loss": 0.3921,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.42096877098083496,
"step": 650,
"valid_targets_mean": 2983.1,
"valid_targets_min": 1513
},
{
"epoch": 1.654040404040404,
"grad_norm": 0.7088141347121194,
"learning_rate": 3.7798348262572595e-05,
"loss": 0.4184,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38489383459091187,
"step": 655,
"valid_targets_mean": 2589.2,
"valid_targets_min": 1265
},
{
"epoch": 1.6666666666666665,
"grad_norm": 0.6158104461556841,
"learning_rate": 3.774053978957754e-05,
"loss": 0.422,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33309605717658997,
"step": 660,
"valid_targets_mean": 2628.7,
"valid_targets_min": 858
},
{
"epoch": 1.6792929292929293,
"grad_norm": 0.6621621785950462,
"learning_rate": 3.76820275765608e-05,
"loss": 0.4482,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3812219202518463,
"step": 665,
"valid_targets_mean": 2696.2,
"valid_targets_min": 1315
},
{
"epoch": 1.691919191919192,
"grad_norm": 0.5915638746228544,
"learning_rate": 3.7622813944612184e-05,
"loss": 0.4268,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.45549070835113525,
"step": 670,
"valid_targets_mean": 4037.2,
"valid_targets_min": 1593
},
{
"epoch": 1.7045454545454546,
"grad_norm": 0.6214323792581383,
"learning_rate": 3.75629012426457e-05,
"loss": 0.4049,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30740225315093994,
"step": 675,
"valid_targets_mean": 2484.4,
"valid_targets_min": 991
},
{
"epoch": 1.7171717171717171,
"grad_norm": 0.6181383119204046,
"learning_rate": 3.750229184730643e-05,
"loss": 0.4034,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.41900163888931274,
"step": 680,
"valid_targets_mean": 3214.8,
"valid_targets_min": 1219
},
{
"epoch": 1.7297979797979797,
"grad_norm": 0.7022543694921178,
"learning_rate": 3.744098816287616e-05,
"loss": 0.3934,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3738209009170532,
"step": 685,
"valid_targets_mean": 2518.6,
"valid_targets_min": 1060
},
{
"epoch": 1.7424242424242424,
"grad_norm": 0.6444777112364757,
"learning_rate": 3.73789926211781e-05,
"loss": 0.4013,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.40667980909347534,
"step": 690,
"valid_targets_mean": 2943.8,
"valid_targets_min": 586
},
{
"epoch": 1.7550505050505052,
"grad_norm": 0.6456649483546918,
"learning_rate": 3.7316307681480364e-05,
"loss": 0.4464,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5095163583755493,
"step": 695,
"valid_targets_mean": 3686.2,
"valid_targets_min": 1323
},
{
"epoch": 1.7676767676767677,
"grad_norm": 0.6312723135470779,
"learning_rate": 3.725293583039843e-05,
"loss": 0.4029,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3778528869152069,
"step": 700,
"valid_targets_mean": 3107.6,
"valid_targets_min": 1432
},
{
"epoch": 1.7803030303030303,
"grad_norm": 0.6535661127784683,
"learning_rate": 3.71888795817965e-05,
"loss": 0.4127,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.47286659479141235,
"step": 705,
"valid_targets_mean": 4064.8,
"valid_targets_min": 1051
},
{
"epoch": 1.7929292929292928,
"grad_norm": 0.6896428501647339,
"learning_rate": 3.712414147668777e-05,
"loss": 0.4215,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4112127423286438,
"step": 710,
"valid_targets_mean": 2654.4,
"valid_targets_min": 1151
},
{
"epoch": 1.8055555555555556,
"grad_norm": 0.5820441201531631,
"learning_rate": 3.7058724083133645e-05,
"loss": 0.4077,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34681016206741333,
"step": 715,
"valid_targets_mean": 2884.4,
"valid_targets_min": 1351
},
{
"epoch": 1.8181818181818183,
"grad_norm": 0.6800591266970959,
"learning_rate": 3.6992629996141864e-05,
"loss": 0.4424,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4916991591453552,
"step": 720,
"valid_targets_mean": 3417.7,
"valid_targets_min": 1329
},
{
"epoch": 1.8308080808080809,
"grad_norm": 0.6563197557373552,
"learning_rate": 3.692586183756354e-05,
"loss": 0.3807,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3805094361305237,
"step": 725,
"valid_targets_mean": 2503.5,
"valid_targets_min": 1064
},
{
"epoch": 1.8434343434343434,
"grad_norm": 0.7047851378134344,
"learning_rate": 3.685842225598919e-05,
"loss": 0.4278,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4543723464012146,
"step": 730,
"valid_targets_mean": 2930.4,
"valid_targets_min": 1798
},
{
"epoch": 1.856060606060606,
"grad_norm": 0.6499844550915188,
"learning_rate": 3.6790313926643664e-05,
"loss": 0.4119,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3960087299346924,
"step": 735,
"valid_targets_mean": 2956.1,
"valid_targets_min": 1401
},
{
"epoch": 1.8686868686868687,
"grad_norm": 0.649385668021803,
"learning_rate": 3.6721539551279966e-05,
"loss": 0.4369,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4332810640335083,
"step": 740,
"valid_targets_mean": 3076.4,
"valid_targets_min": 998
},
{
"epoch": 1.8813131313131313,
"grad_norm": 0.7091254200389234,
"learning_rate": 3.665210185807217e-05,
"loss": 0.4388,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.44163447618484497,
"step": 745,
"valid_targets_mean": 3328.9,
"valid_targets_min": 1660
},
{
"epoch": 1.893939393939394,
"grad_norm": 0.5985641510783979,
"learning_rate": 3.658200360150713e-05,
"loss": 0.4091,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37661778926849365,
"step": 750,
"valid_targets_mean": 3146.1,
"valid_targets_min": 1067
},
{
"epoch": 1.9065656565656566,
"grad_norm": 0.6268419140387759,
"learning_rate": 3.651124756227525e-05,
"loss": 0.401,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4080426096916199,
"step": 755,
"valid_targets_mean": 3422.2,
"valid_targets_min": 1798
},
{
"epoch": 1.9191919191919191,
"grad_norm": 0.7426620476089505,
"learning_rate": 3.6439836547160144e-05,
"loss": 0.4044,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38891446590423584,
"step": 760,
"valid_targets_mean": 3295.2,
"valid_targets_min": 1546
},
{
"epoch": 1.9318181818181817,
"grad_norm": 0.6671491506286603,
"learning_rate": 3.636777338892732e-05,
"loss": 0.4466,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.44117462635040283,
"step": 765,
"valid_targets_mean": 2958.4,
"valid_targets_min": 1837
},
{
"epoch": 1.9444444444444444,
"grad_norm": 0.6342292838426378,
"learning_rate": 3.629506094621183e-05,
"loss": 0.3886,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3897709250450134,
"step": 770,
"valid_targets_mean": 2692.6,
"valid_targets_min": 1547
},
{
"epoch": 1.9570707070707072,
"grad_norm": 0.621675970891514,
"learning_rate": 3.622170210340482e-05,
"loss": 0.4183,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38866496086120605,
"step": 775,
"valid_targets_mean": 2999.8,
"valid_targets_min": 1116
},
{
"epoch": 1.9696969696969697,
"grad_norm": 0.5905010144602377,
"learning_rate": 3.614769977053914e-05,
"loss": 0.4291,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3574790060520172,
"step": 780,
"valid_targets_mean": 3125.0,
"valid_targets_min": 963
},
{
"epoch": 1.9823232323232323,
"grad_norm": 0.5836024549642513,
"learning_rate": 3.607305688317391e-05,
"loss": 0.4046,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4132801294326782,
"step": 785,
"valid_targets_mean": 3194.9,
"valid_targets_min": 1242
},
{
"epoch": 1.9949494949494948,
"grad_norm": 0.7228511270619273,
"learning_rate": 3.5997776402278055e-05,
"loss": 0.3925,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.42261964082717896,
"step": 790,
"valid_targets_mean": 3067.1,
"valid_targets_min": 1603
},
{
"epoch": 2.007575757575758,
"grad_norm": 0.6700499879024988,
"learning_rate": 3.592186131411288e-05,
"loss": 0.376,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3675363063812256,
"step": 795,
"valid_targets_mean": 2926.6,
"valid_targets_min": 1575
},
{
"epoch": 2.0202020202020203,
"grad_norm": 0.6733433964569425,
"learning_rate": 3.584531463011356e-05,
"loss": 0.3648,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3609054982662201,
"step": 800,
"valid_targets_mean": 3172.1,
"valid_targets_min": 599
},
{
"epoch": 2.032828282828283,
"grad_norm": 0.6042940030317498,
"learning_rate": 3.576813938676973e-05,
"loss": 0.3973,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3894050121307373,
"step": 805,
"valid_targets_mean": 3448.1,
"valid_targets_min": 923
},
{
"epoch": 2.0454545454545454,
"grad_norm": 0.6749197830689422,
"learning_rate": 3.569033864550501e-05,
"loss": 0.38,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3814485967159271,
"step": 810,
"valid_targets_mean": 2783.8,
"valid_targets_min": 880
},
{
"epoch": 2.058080808080808,
"grad_norm": 0.6483067354879916,
"learning_rate": 3.561191549255555e-05,
"loss": 0.3565,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3972342312335968,
"step": 815,
"valid_targets_mean": 3241.1,
"valid_targets_min": 1649
},
{
"epoch": 2.0707070707070705,
"grad_norm": 0.6353320580780115,
"learning_rate": 3.553287303884762e-05,
"loss": 0.3695,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3591780662536621,
"step": 820,
"valid_targets_mean": 2904.1,
"valid_targets_min": 1116
},
{
"epoch": 2.0833333333333335,
"grad_norm": 0.6551388984986852,
"learning_rate": 3.545321441987422e-05,
"loss": 0.3704,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29770687222480774,
"step": 825,
"valid_targets_mean": 2442.8,
"valid_targets_min": 568
},
{
"epoch": 2.095959595959596,
"grad_norm": 0.6968910493636307,
"learning_rate": 3.5372942795570644e-05,
"loss": 0.358,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3901800215244293,
"step": 830,
"valid_targets_mean": 2854.0,
"valid_targets_min": 682
},
{
"epoch": 2.1085858585858586,
"grad_norm": 0.568367502641086,
"learning_rate": 3.529206135018922e-05,
"loss": 0.3625,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4262069761753082,
"step": 835,
"valid_targets_mean": 4330.8,
"valid_targets_min": 2021
},
{
"epoch": 2.121212121212121,
"grad_norm": 0.6824608784442717,
"learning_rate": 3.521057329217289e-05,
"loss": 0.3845,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3504842519760132,
"step": 840,
"valid_targets_mean": 2486.9,
"valid_targets_min": 1574
},
{
"epoch": 2.1338383838383836,
"grad_norm": 0.6810643162239562,
"learning_rate": 3.512848185402804e-05,
"loss": 0.3885,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.42560821771621704,
"step": 845,
"valid_targets_mean": 3205.6,
"valid_targets_min": 1295
},
{
"epoch": 2.1464646464646466,
"grad_norm": 0.7051006217015395,
"learning_rate": 3.504579029219618e-05,
"loss": 0.385,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.47030025720596313,
"step": 850,
"valid_targets_mean": 4252.9,
"valid_targets_min": 620
},
{
"epoch": 2.159090909090909,
"grad_norm": 0.6158184161250323,
"learning_rate": 3.4962501886924817e-05,
"loss": 0.3643,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3438853621482849,
"step": 855,
"valid_targets_mean": 3000.1,
"valid_targets_min": 1183
},
{
"epoch": 2.1717171717171717,
"grad_norm": 0.9033510849058328,
"learning_rate": 3.4878619942137346e-05,
"loss": 0.3566,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36623990535736084,
"step": 860,
"valid_targets_mean": 3486.9,
"valid_targets_min": 1208
},
{
"epoch": 2.1843434343434343,
"grad_norm": 0.6336084994385605,
"learning_rate": 3.479414778530194e-05,
"loss": 0.3553,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3282182812690735,
"step": 865,
"valid_targets_mean": 2926.6,
"valid_targets_min": 527
},
{
"epoch": 2.196969696969697,
"grad_norm": 0.642030989385258,
"learning_rate": 3.470908876729958e-05,
"loss": 0.3757,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38485634326934814,
"step": 870,
"valid_targets_mean": 3797.9,
"valid_targets_min": 1802
},
{
"epoch": 2.20959595959596,
"grad_norm": 0.6859750653264282,
"learning_rate": 3.462344626229113e-05,
"loss": 0.3831,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4057656526565552,
"step": 875,
"valid_targets_mean": 3077.2,
"valid_targets_min": 1477
},
{
"epoch": 2.2222222222222223,
"grad_norm": 0.7051975354184825,
"learning_rate": 3.4537223667583517e-05,
"loss": 0.3941,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3670094311237335,
"step": 880,
"valid_targets_mean": 2480.9,
"valid_targets_min": 949
},
{
"epoch": 2.234848484848485,
"grad_norm": 0.6263495715036997,
"learning_rate": 3.44504244034949e-05,
"loss": 0.3744,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38415664434432983,
"step": 885,
"valid_targets_mean": 3738.8,
"valid_targets_min": 1905
},
{
"epoch": 2.2474747474747474,
"grad_norm": 0.6736583840874508,
"learning_rate": 3.4363051913219054e-05,
"loss": 0.3787,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32438012957572937,
"step": 890,
"valid_targets_mean": 2544.9,
"valid_targets_min": 1115
},
{
"epoch": 2.26010101010101,
"grad_norm": 0.6358475233857454,
"learning_rate": 3.427510966268874e-05,
"loss": 0.4206,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38413217663764954,
"step": 895,
"valid_targets_mean": 3256.4,
"valid_targets_min": 1028
},
{
"epoch": 2.2727272727272725,
"grad_norm": 0.5703544012357852,
"learning_rate": 3.418660114043824e-05,
"loss": 0.3628,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34161847829818726,
"step": 900,
"valid_targets_mean": 3436.0,
"valid_targets_min": 1334
},
{
"epoch": 2.2853535353535355,
"grad_norm": 0.6756271018463891,
"learning_rate": 3.409752985746498e-05,
"loss": 0.3907,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39379531145095825,
"step": 905,
"valid_targets_mean": 3228.2,
"valid_targets_min": 1693
},
{
"epoch": 2.297979797979798,
"grad_norm": 0.5750798297997253,
"learning_rate": 3.400789934709023e-05,
"loss": 0.4308,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4697551727294922,
"step": 910,
"valid_targets_mean": 4887.2,
"valid_targets_min": 1320
},
{
"epoch": 2.3106060606060606,
"grad_norm": 0.6035695330159876,
"learning_rate": 3.391771316481895e-05,
"loss": 0.386,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37602925300598145,
"step": 915,
"valid_targets_mean": 3335.6,
"valid_targets_min": 1865
},
{
"epoch": 2.323232323232323,
"grad_norm": 0.6231533529555526,
"learning_rate": 3.3826974888198764e-05,
"loss": 0.3847,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.46126362681388855,
"step": 920,
"valid_targets_mean": 4108.6,
"valid_targets_min": 1070
},
{
"epoch": 2.3358585858585856,
"grad_norm": 0.682022720271219,
"learning_rate": 3.373568811667802e-05,
"loss": 0.3822,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39595192670822144,
"step": 925,
"valid_targets_mean": 2894.8,
"valid_targets_min": 1426
},
{
"epoch": 2.3484848484848486,
"grad_norm": 0.6797289333546708,
"learning_rate": 3.3643856471463036e-05,
"loss": 0.3785,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38361161947250366,
"step": 930,
"valid_targets_mean": 3060.6,
"valid_targets_min": 1501
},
{
"epoch": 2.361111111111111,
"grad_norm": 0.6031465467740685,
"learning_rate": 3.355148359537441e-05,
"loss": 0.3961,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.44060710072517395,
"step": 935,
"valid_targets_mean": 4271.9,
"valid_targets_min": 1417
},
{
"epoch": 2.3737373737373737,
"grad_norm": 0.8364843828650894,
"learning_rate": 3.3458573152702556e-05,
"loss": 0.3854,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36398792266845703,
"step": 940,
"valid_targets_mean": 2913.2,
"valid_targets_min": 1188
},
{
"epoch": 2.3863636363636362,
"grad_norm": 0.5980417429474294,
"learning_rate": 3.336512882906234e-05,
"loss": 0.3636,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.307436466217041,
"step": 945,
"valid_targets_mean": 2891.1,
"valid_targets_min": 1219
},
{
"epoch": 2.398989898989899,
"grad_norm": 0.6020944292492557,
"learning_rate": 3.3271154331246825e-05,
"loss": 0.3548,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3505295515060425,
"step": 950,
"valid_targets_mean": 4080.4,
"valid_targets_min": 988
},
{
"epoch": 2.4116161616161618,
"grad_norm": 0.6948551306615971,
"learning_rate": 3.317665338708033e-05,
"loss": 0.3449,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38028645515441895,
"step": 955,
"valid_targets_mean": 3400.9,
"valid_targets_min": 452
},
{
"epoch": 2.4242424242424243,
"grad_norm": 0.7054147906410959,
"learning_rate": 3.308162974527045e-05,
"loss": 0.3478,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3440144658088684,
"step": 960,
"valid_targets_mean": 2568.9,
"valid_targets_min": 1248
},
{
"epoch": 2.436868686868687,
"grad_norm": 0.6502674537729093,
"learning_rate": 3.298608717525941e-05,
"loss": 0.3966,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4167352616786957,
"step": 965,
"valid_targets_mean": 3487.2,
"valid_targets_min": 729
},
{
"epoch": 2.4494949494949494,
"grad_norm": 0.6945755822435844,
"learning_rate": 3.289002946707452e-05,
"loss": 0.3618,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38510334491729736,
"step": 970,
"valid_targets_mean": 3070.3,
"valid_targets_min": 1615
},
{
"epoch": 2.462121212121212,
"grad_norm": 0.7008172093994913,
"learning_rate": 3.2793460431177827e-05,
"loss": 0.3892,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34910762310028076,
"step": 975,
"valid_targets_mean": 2654.6,
"valid_targets_min": 807
},
{
"epoch": 2.474747474747475,
"grad_norm": 0.6315928723707651,
"learning_rate": 3.269638389831498e-05,
"loss": 0.3683,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2948976755142212,
"step": 980,
"valid_targets_mean": 2513.4,
"valid_targets_min": 1048
},
{
"epoch": 2.4873737373737375,
"grad_norm": 0.659399817304144,
"learning_rate": 3.2598803719363234e-05,
"loss": 0.3995,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3890318274497986,
"step": 985,
"valid_targets_mean": 2942.6,
"valid_targets_min": 959
},
{
"epoch": 2.5,
"grad_norm": 0.6602751081844956,
"learning_rate": 3.250072376517873e-05,
"loss": 0.39,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31299781799316406,
"step": 990,
"valid_targets_mean": 2744.5,
"valid_targets_min": 1621
},
{
"epoch": 2.5126262626262625,
"grad_norm": 0.5849536829497557,
"learning_rate": 3.240214792644291e-05,
"loss": 0.3908,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4854844808578491,
"step": 995,
"valid_targets_mean": 4775.6,
"valid_targets_min": 1064
},
{
"epoch": 2.525252525252525,
"grad_norm": 0.5606732760702411,
"learning_rate": 3.2303080113508206e-05,
"loss": 0.3851,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3052321672439575,
"step": 1000,
"valid_targets_mean": 3365.4,
"valid_targets_min": 1298
},
{
"epoch": 2.537878787878788,
"grad_norm": 0.6875908835706088,
"learning_rate": 3.220352425624292e-05,
"loss": 0.382,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3734514117240906,
"step": 1005,
"valid_targets_mean": 2893.5,
"valid_targets_min": 1773
},
{
"epoch": 2.5505050505050506,
"grad_norm": 0.5931935199736621,
"learning_rate": 3.210348430387531e-05,
"loss": 0.404,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3862113058567047,
"step": 1010,
"valid_targets_mean": 3470.7,
"valid_targets_min": 2311
},
{
"epoch": 2.563131313131313,
"grad_norm": 0.5854966748703261,
"learning_rate": 3.200296422483694e-05,
"loss": 0.3898,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3955685496330261,
"step": 1015,
"valid_targets_mean": 3589.4,
"valid_targets_min": 1829
},
{
"epoch": 2.5757575757575757,
"grad_norm": 0.6466992426589206,
"learning_rate": 3.19019680066053e-05,
"loss": 0.3517,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3543087840080261,
"step": 1020,
"valid_targets_mean": 2809.2,
"valid_targets_min": 1982
},
{
"epoch": 2.5883838383838382,
"grad_norm": 0.6437875698154034,
"learning_rate": 3.180049965554554e-05,
"loss": 0.4091,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5216984748840332,
"step": 1025,
"valid_targets_mean": 4236.3,
"valid_targets_min": 971
},
{
"epoch": 2.601010101010101,
"grad_norm": 0.6686276392769377,
"learning_rate": 3.169856319675163e-05,
"loss": 0.3711,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4543102979660034,
"step": 1030,
"valid_targets_mean": 3561.1,
"valid_targets_min": 520
},
{
"epoch": 2.6136363636363638,
"grad_norm": 0.5951534964453324,
"learning_rate": 3.159616267388665e-05,
"loss": 0.3683,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3885546326637268,
"step": 1035,
"valid_targets_mean": 3710.8,
"valid_targets_min": 935
},
{
"epoch": 2.6262626262626263,
"grad_norm": 0.5998214906422664,
"learning_rate": 3.1493302149022394e-05,
"loss": 0.3643,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3495018482208252,
"step": 1040,
"valid_targets_mean": 3388.9,
"valid_targets_min": 1017
},
{
"epoch": 2.638888888888889,
"grad_norm": 0.679459404989866,
"learning_rate": 3.1389985702478204e-05,
"loss": 0.3733,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.40621423721313477,
"step": 1045,
"valid_targets_mean": 2743.4,
"valid_targets_min": 638
},
{
"epoch": 2.6515151515151514,
"grad_norm": 0.49821839728054024,
"learning_rate": 3.1286217432659176e-05,
"loss": 0.3848,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.42677822709083557,
"step": 1050,
"valid_targets_mean": 5945.1,
"valid_targets_min": 1605
},
{
"epoch": 2.6641414141414144,
"grad_norm": 0.6245151459734792,
"learning_rate": 3.118200145589351e-05,
"loss": 0.4174,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3920952081680298,
"step": 1055,
"valid_targets_mean": 3122.9,
"valid_targets_min": 1889
},
{
"epoch": 2.676767676767677,
"grad_norm": 0.6230627615382611,
"learning_rate": 3.1077341906269275e-05,
"loss": 0.3746,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4046259820461273,
"step": 1060,
"valid_targets_mean": 3375.1,
"valid_targets_min": 876
},
{
"epoch": 2.6893939393939394,
"grad_norm": 0.5984044868920384,
"learning_rate": 3.097224293547039e-05,
"loss": 0.3761,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37177756428718567,
"step": 1065,
"valid_targets_mean": 3157.3,
"valid_targets_min": 928
},
{
"epoch": 2.702020202020202,
"grad_norm": 0.6200698875715712,
"learning_rate": 3.086670871261193e-05,
"loss": 0.3824,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4072413146495819,
"step": 1070,
"valid_targets_mean": 3493.7,
"valid_targets_min": 1659
},
{
"epoch": 2.7146464646464645,
"grad_norm": 0.7099464467086446,
"learning_rate": 3.076074342407476e-05,
"loss": 0.3903,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3890324532985687,
"step": 1075,
"valid_targets_mean": 2398.0,
"valid_targets_min": 580
},
{
"epoch": 2.7272727272727275,
"grad_norm": 0.5964382108688258,
"learning_rate": 3.0654351273339465e-05,
"loss": 0.3576,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.41678887605667114,
"step": 1080,
"valid_targets_mean": 4061.4,
"valid_targets_min": 587
},
{
"epoch": 2.73989898989899,
"grad_norm": 0.6483267090943723,
"learning_rate": 3.0547536480819584e-05,
"loss": 0.4063,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38063323497772217,
"step": 1085,
"valid_targets_mean": 2821.2,
"valid_targets_min": 1120
},
{
"epoch": 2.7525252525252526,
"grad_norm": 0.6126539646079129,
"learning_rate": 3.044030328369422e-05,
"loss": 0.3809,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3242890238761902,
"step": 1090,
"valid_targets_mean": 2823.2,
"valid_targets_min": 674
},
{
"epoch": 2.765151515151515,
"grad_norm": 0.666211099047787,
"learning_rate": 3.033265593573994e-05,
"loss": 0.3988,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35766348242759705,
"step": 1095,
"valid_targets_mean": 2767.8,
"valid_targets_min": 1512
},
{
"epoch": 2.7777777777777777,
"grad_norm": 0.5893274171238146,
"learning_rate": 3.0224598707162037e-05,
"loss": 0.3812,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35240688920021057,
"step": 1100,
"valid_targets_mean": 3162.4,
"valid_targets_min": 855
},
{
"epoch": 2.7904040404040407,
"grad_norm": 0.6436336249871378,
"learning_rate": 3.0116135884425156e-05,
"loss": 0.377,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4571429193019867,
"step": 1105,
"valid_targets_mean": 3306.6,
"valid_targets_min": 999
},
{
"epoch": 2.8030303030303028,
"grad_norm": 0.6192587115834132,
"learning_rate": 3.0007271770083216e-05,
"loss": 0.3935,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2913767397403717,
"step": 1110,
"valid_targets_mean": 2528.9,
"valid_targets_min": 780
},
{
"epoch": 2.8156565656565657,
"grad_norm": 0.606484213579456,
"learning_rate": 2.989801068260878e-05,
"loss": 0.3754,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29592519998550415,
"step": 1115,
"valid_targets_mean": 2622.3,
"valid_targets_min": 1436
},
{
"epoch": 2.8282828282828283,
"grad_norm": 0.645202232373261,
"learning_rate": 2.9788356956221712e-05,
"loss": 0.3682,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3493780195713043,
"step": 1120,
"valid_targets_mean": 2796.6,
"valid_targets_min": 1281
},
{
"epoch": 2.840909090909091,
"grad_norm": 0.6382732894080507,
"learning_rate": 2.9678314940717276e-05,
"loss": 0.3192,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31767457723617554,
"step": 1125,
"valid_targets_mean": 2719.1,
"valid_targets_min": 1784
},
{
"epoch": 2.8535353535353534,
"grad_norm": 0.6864660560112232,
"learning_rate": 2.9567889001293553e-05,
"loss": 0.3885,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3313673436641693,
"step": 1130,
"valid_targets_mean": 2460.8,
"valid_targets_min": 588
},
{
"epoch": 2.866161616161616,
"grad_norm": 0.6023940706764531,
"learning_rate": 2.94570835183783e-05,
"loss": 0.3516,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34224456548690796,
"step": 1135,
"valid_targets_mean": 3116.4,
"valid_targets_min": 1116
},
{
"epoch": 2.878787878787879,
"grad_norm": 0.6067779962957488,
"learning_rate": 2.93459028874552e-05,
"loss": 0.3723,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3636412024497986,
"step": 1140,
"valid_targets_mean": 3337.4,
"valid_targets_min": 571
},
{
"epoch": 2.8914141414141414,
"grad_norm": 0.6092698495443272,
"learning_rate": 2.9234351518889465e-05,
"loss": 0.4067,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4876616597175598,
"step": 1145,
"valid_targets_mean": 4359.3,
"valid_targets_min": 1940
},
{
"epoch": 2.904040404040404,
"grad_norm": 0.6240475836405307,
"learning_rate": 2.9122433837752906e-05,
"loss": 0.3557,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31040680408477783,
"step": 1150,
"valid_targets_mean": 2761.3,
"valid_targets_min": 1568
},
{
"epoch": 2.9166666666666665,
"grad_norm": 0.5730069310790777,
"learning_rate": 2.9010154283648382e-05,
"loss": 0.403,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3821036219596863,
"step": 1155,
"valid_targets_mean": 3784.9,
"valid_targets_min": 1335
},
{
"epoch": 2.929292929292929,
"grad_norm": 0.6572646648160343,
"learning_rate": 2.8897517310533733e-05,
"loss": 0.3557,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3128521740436554,
"step": 1160,
"valid_targets_mean": 2357.7,
"valid_targets_min": 1131
},
{
"epoch": 2.941919191919192,
"grad_norm": 0.6115860029185797,
"learning_rate": 2.8784527386545006e-05,
"loss": 0.4476,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.49554532766342163,
"step": 1165,
"valid_targets_mean": 4678.3,
"valid_targets_min": 808
},
{
"epoch": 2.9545454545454546,
"grad_norm": 0.6535005566432543,
"learning_rate": 2.8671188993819327e-05,
"loss": 0.4041,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4300668239593506,
"step": 1170,
"valid_targets_mean": 3714.4,
"valid_targets_min": 2330
},
{
"epoch": 2.967171717171717,
"grad_norm": 0.6344464229430659,
"learning_rate": 2.8557506628317e-05,
"loss": 0.3867,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4097946882247925,
"step": 1175,
"valid_targets_mean": 3480.2,
"valid_targets_min": 1844
},
{
"epoch": 2.9797979797979797,
"grad_norm": 0.5549040647946087,
"learning_rate": 2.844348479964323e-05,
"loss": 0.3997,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36530980467796326,
"step": 1180,
"valid_targets_mean": 3680.7,
"valid_targets_min": 2068
},
{
"epoch": 2.992424242424242,
"grad_norm": 0.6350789264846295,
"learning_rate": 2.8329128030869183e-05,
"loss": 0.3765,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36941784620285034,
"step": 1185,
"valid_targets_mean": 2964.5,
"valid_targets_min": 598
},
{
"epoch": 3.005050505050505,
"grad_norm": 0.6101230464628173,
"learning_rate": 2.8214440858352602e-05,
"loss": 0.3585,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3312152624130249,
"step": 1190,
"valid_targets_mean": 3049.0,
"valid_targets_min": 1661
},
{
"epoch": 3.0176767676767677,
"grad_norm": 0.6717050734051245,
"learning_rate": 2.8099427831557836e-05,
"loss": 0.344,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3820994794368744,
"step": 1195,
"valid_targets_mean": 3147.5,
"valid_targets_min": 1505
},
{
"epoch": 3.0303030303030303,
"grad_norm": 0.6855402222878124,
"learning_rate": 2.798409351287537e-05,
"loss": 0.3489,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3795431852340698,
"step": 1200,
"valid_targets_mean": 3020.4,
"valid_targets_min": 1208
},
{
"epoch": 3.042929292929293,
"grad_norm": 0.6290362160754815,
"learning_rate": 2.7868442477440845e-05,
"loss": 0.3716,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3297278881072998,
"step": 1205,
"valid_targets_mean": 3352.2,
"valid_targets_min": 1870
},
{
"epoch": 3.0555555555555554,
"grad_norm": 0.6542985881986048,
"learning_rate": 2.7752479312953576e-05,
"loss": 0.3242,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37977492809295654,
"step": 1210,
"valid_targets_mean": 3504.4,
"valid_targets_min": 1174
},
{
"epoch": 3.0681818181818183,
"grad_norm": 0.6865766533109904,
"learning_rate": 2.763620861949456e-05,
"loss": 0.3148,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3136219382286072,
"step": 1215,
"valid_targets_mean": 2935.5,
"valid_targets_min": 671
},
{
"epoch": 3.080808080808081,
"grad_norm": 0.650463581157268,
"learning_rate": 2.7519635009343982e-05,
"loss": 0.3616,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3669140934944153,
"step": 1220,
"valid_targets_mean": 3443.1,
"valid_targets_min": 1433
},
{
"epoch": 3.0934343434343434,
"grad_norm": 0.6374974160183221,
"learning_rate": 2.7402763106798295e-05,
"loss": 0.385,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3267042636871338,
"step": 1225,
"valid_targets_mean": 3336.6,
"valid_targets_min": 1490
},
{
"epoch": 3.106060606060606,
"grad_norm": 0.7164459430574219,
"learning_rate": 2.7285597547986715e-05,
"loss": 0.3452,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3801751732826233,
"step": 1230,
"valid_targets_mean": 3270.2,
"valid_targets_min": 1810
},
{
"epoch": 3.1186868686868685,
"grad_norm": 0.6786289930271091,
"learning_rate": 2.7168142980687394e-05,
"loss": 0.3578,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.343783438205719,
"step": 1235,
"valid_targets_mean": 2905.7,
"valid_targets_min": 1686
},
{
"epoch": 3.1313131313131315,
"grad_norm": 0.8228076465104819,
"learning_rate": 2.7050404064142985e-05,
"loss": 0.3593,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3551754355430603,
"step": 1240,
"valid_targets_mean": 3203.6,
"valid_targets_min": 599
},
{
"epoch": 3.143939393939394,
"grad_norm": 0.7057452290840084,
"learning_rate": 2.693238546887583e-05,
"loss": 0.3613,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38851505517959595,
"step": 1245,
"valid_targets_mean": 2690.1,
"valid_targets_min": 738
},
{
"epoch": 3.1565656565656566,
"grad_norm": 0.6516753493509879,
"learning_rate": 2.6814091876502738e-05,
"loss": 0.3702,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30876827239990234,
"step": 1250,
"valid_targets_mean": 2591.5,
"valid_targets_min": 1481
},
{
"epoch": 3.169191919191919,
"grad_norm": 0.5373908122046772,
"learning_rate": 2.669552797954917e-05,
"loss": 0.3621,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4019007682800293,
"step": 1255,
"valid_targets_mean": 4778.8,
"valid_targets_min": 1761
},
{
"epoch": 3.1818181818181817,
"grad_norm": 0.656469897426696,
"learning_rate": 2.6576698481263216e-05,
"loss": 0.3694,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3878747522830963,
"step": 1260,
"valid_targets_mean": 3612.4,
"valid_targets_min": 1553
},
{
"epoch": 3.1944444444444446,
"grad_norm": 0.6890638135835326,
"learning_rate": 2.6457608095428925e-05,
"loss": 0.3607,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37581291794776917,
"step": 1265,
"valid_targets_mean": 3227.2,
"valid_targets_min": 876
},
{
"epoch": 3.207070707070707,
"grad_norm": 0.6686732667303787,
"learning_rate": 2.633826154617938e-05,
"loss": 0.3687,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32370471954345703,
"step": 1270,
"valid_targets_mean": 3021.6,
"valid_targets_min": 555
},
{
"epoch": 3.2196969696969697,
"grad_norm": 0.60906879769235,
"learning_rate": 2.621866356780924e-05,
"loss": 0.333,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2982814908027649,
"step": 1275,
"valid_targets_mean": 3329.8,
"valid_targets_min": 1659
},
{
"epoch": 3.2323232323232323,
"grad_norm": 0.6788697674939761,
"learning_rate": 2.6098818904587014e-05,
"loss": 0.362,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3478686213493347,
"step": 1280,
"valid_targets_mean": 3108.2,
"valid_targets_min": 1337
},
{
"epoch": 3.244949494949495,
"grad_norm": 0.7418192989966806,
"learning_rate": 2.597873231056679e-05,
"loss": 0.342,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3505740165710449,
"step": 1285,
"valid_targets_mean": 2378.4,
"valid_targets_min": 699
},
{
"epoch": 3.257575757575758,
"grad_norm": 0.6743259771608354,
"learning_rate": 2.585840854939969e-05,
"loss": 0.3385,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.337390661239624,
"step": 1290,
"valid_targets_mean": 2974.2,
"valid_targets_min": 869
},
{
"epoch": 3.2702020202020203,
"grad_norm": 0.6553868057444038,
"learning_rate": 2.5737852394144903e-05,
"loss": 0.3231,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3390675187110901,
"step": 1295,
"valid_targets_mean": 2955.1,
"valid_targets_min": 1599
},
{
"epoch": 3.282828282828283,
"grad_norm": 0.6403703744617418,
"learning_rate": 2.5617068627080305e-05,
"loss": 0.3688,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4630083739757538,
"step": 1300,
"valid_targets_mean": 4076.2,
"valid_targets_min": 689
},
{
"epoch": 3.2954545454545454,
"grad_norm": 0.6023984043375903,
"learning_rate": 2.5496062039512834e-05,
"loss": 0.348,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32059431076049805,
"step": 1305,
"valid_targets_mean": 3375.9,
"valid_targets_min": 1878
},
{
"epoch": 3.308080808080808,
"grad_norm": 0.6396425541446585,
"learning_rate": 2.5374837431588322e-05,
"loss": 0.3341,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3704610764980316,
"step": 1310,
"valid_targets_mean": 3331.3,
"valid_targets_min": 1406
},
{
"epoch": 3.320707070707071,
"grad_norm": 0.6776583962480702,
"learning_rate": 2.525339961210117e-05,
"loss": 0.356,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2946220636367798,
"step": 1315,
"valid_targets_mean": 2489.2,
"valid_targets_min": 587
},
{
"epoch": 3.3333333333333335,
"grad_norm": 0.7512035560086019,
"learning_rate": 2.5131753398303546e-05,
"loss": 0.3612,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3226706385612488,
"step": 1320,
"valid_targets_mean": 2257.8,
"valid_targets_min": 513
},
{
"epoch": 3.345959595959596,
"grad_norm": 0.6691736317428321,
"learning_rate": 2.5009903615714288e-05,
"loss": 0.3713,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38169464468955994,
"step": 1325,
"valid_targets_mean": 3674.4,
"valid_targets_min": 710
},
{
"epoch": 3.3585858585858586,
"grad_norm": 0.6529576389515854,
"learning_rate": 2.4887855097927515e-05,
"loss": 0.3191,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3396865725517273,
"step": 1330,
"valid_targets_mean": 3407.2,
"valid_targets_min": 755
},
{
"epoch": 3.371212121212121,
"grad_norm": 0.7154816898888791,
"learning_rate": 2.4765612686420855e-05,
"loss": 0.3367,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.343447744846344,
"step": 1335,
"valid_targets_mean": 2833.6,
"valid_targets_min": 506
},
{
"epoch": 3.3838383838383836,
"grad_norm": 0.6736312101027783,
"learning_rate": 2.46431812303634e-05,
"loss": 0.378,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32376375794410706,
"step": 1340,
"valid_targets_mean": 2666.4,
"valid_targets_min": 1333
},
{
"epoch": 3.3964646464646466,
"grad_norm": 0.6475094233289387,
"learning_rate": 2.4520565586423364e-05,
"loss": 0.3204,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29635465145111084,
"step": 1345,
"valid_targets_mean": 2748.7,
"valid_targets_min": 1392
},
{
"epoch": 3.409090909090909,
"grad_norm": 0.5843996644681299,
"learning_rate": 2.4397770618575402e-05,
"loss": 0.3462,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3405814468860626,
"step": 1350,
"valid_targets_mean": 3957.3,
"valid_targets_min": 1585
},
{
"epoch": 3.4217171717171717,
"grad_norm": 0.6569771648498826,
"learning_rate": 2.4274801197907665e-05,
"loss": 0.3674,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35267573595046997,
"step": 1355,
"valid_targets_mean": 3056.4,
"valid_targets_min": 1380
},
{
"epoch": 3.4343434343434343,
"grad_norm": 0.6278190545664051,
"learning_rate": 2.4151662202428613e-05,
"loss": 0.3628,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3695211410522461,
"step": 1360,
"valid_targets_mean": 3506.5,
"valid_targets_min": 1884
},
{
"epoch": 3.446969696969697,
"grad_norm": 0.634074126688538,
"learning_rate": 2.4028358516873427e-05,
"loss": 0.3216,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3146069645881653,
"step": 1365,
"valid_targets_mean": 3289.8,
"valid_targets_min": 1669
},
{
"epoch": 3.45959595959596,
"grad_norm": 0.6801530900407086,
"learning_rate": 2.390489503251034e-05,
"loss": 0.3597,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4268019199371338,
"step": 1370,
"valid_targets_mean": 3845.6,
"valid_targets_min": 1843
},
{
"epoch": 3.4722222222222223,
"grad_norm": 0.6302056512933344,
"learning_rate": 2.3781276646946526e-05,
"loss": 0.3483,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35302233695983887,
"step": 1375,
"valid_targets_mean": 3840.2,
"valid_targets_min": 1261
},
{
"epoch": 3.484848484848485,
"grad_norm": 0.6377742108475873,
"learning_rate": 2.3657508263933874e-05,
"loss": 0.3612,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33783674240112305,
"step": 1380,
"valid_targets_mean": 3263.4,
"valid_targets_min": 1149
},
{
"epoch": 3.4974747474747474,
"grad_norm": 0.7042898368764126,
"learning_rate": 2.3533594793174426e-05,
"loss": 0.3258,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3383498191833496,
"step": 1385,
"valid_targets_mean": 2682.6,
"valid_targets_min": 1382
},
{
"epoch": 3.51010101010101,
"grad_norm": 0.7030408364050017,
"learning_rate": 2.3409541150125645e-05,
"loss": 0.3557,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4075915217399597,
"step": 1390,
"valid_targets_mean": 3162.8,
"valid_targets_min": 1353
},
{
"epoch": 3.5227272727272725,
"grad_norm": 0.6274505021865276,
"learning_rate": 2.3285352255805398e-05,
"loss": 0.3496,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31670212745666504,
"step": 1395,
"valid_targets_mean": 3087.0,
"valid_targets_min": 392
},
{
"epoch": 3.5353535353535355,
"grad_norm": 1.2486599391824142,
"learning_rate": 2.316103303659678e-05,
"loss": 0.3296,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36197564005851746,
"step": 1400,
"valid_targets_mean": 3082.6,
"valid_targets_min": 527
},
{
"epoch": 3.547979797979798,
"grad_norm": 0.5371320718863393,
"learning_rate": 2.3036588424052672e-05,
"loss": 0.351,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3815935254096985,
"step": 1405,
"valid_targets_mean": 4752.9,
"valid_targets_min": 1819
},
{
"epoch": 3.5606060606060606,
"grad_norm": 0.705016854939806,
"learning_rate": 2.2912023354700105e-05,
"loss": 0.3665,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3603851795196533,
"step": 1410,
"valid_targets_mean": 2926.8,
"valid_targets_min": 1512
},
{
"epoch": 3.573232323232323,
"grad_norm": 0.5984653768510367,
"learning_rate": 2.2787342769844444e-05,
"loss": 0.3222,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3309054374694824,
"step": 1415,
"valid_targets_mean": 3481.1,
"valid_targets_min": 1110
},
{
"epoch": 3.5858585858585856,
"grad_norm": 0.8191525002477924,
"learning_rate": 2.2662551615373402e-05,
"loss": 0.3989,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.44843584299087524,
"step": 1420,
"valid_targets_mean": 2668.3,
"valid_targets_min": 648
},
{
"epoch": 3.5984848484848486,
"grad_norm": 0.6651567018600946,
"learning_rate": 2.25376548415608e-05,
"loss": 0.3694,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3173557221889496,
"step": 1425,
"valid_targets_mean": 2731.2,
"valid_targets_min": 1126
},
{
"epoch": 3.611111111111111,
"grad_norm": 0.6266431493382524,
"learning_rate": 2.241265740287021e-05,
"loss": 0.3443,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29255497455596924,
"step": 1430,
"valid_targets_mean": 2907.2,
"valid_targets_min": 1479
},
{
"epoch": 3.6237373737373737,
"grad_norm": 0.5693607197936612,
"learning_rate": 2.2287564257758446e-05,
"loss": 0.3977,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.41386911273002625,
"step": 1435,
"valid_targets_mean": 4703.8,
"valid_targets_min": 707
},
{
"epoch": 3.6363636363636362,
"grad_norm": 0.7080853718994018,
"learning_rate": 2.2162380368478836e-05,
"loss": 0.3847,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3499618172645569,
"step": 1440,
"valid_targets_mean": 2786.1,
"valid_targets_min": 596
},
{
"epoch": 3.648989898989899,
"grad_norm": 0.5548114926983784,
"learning_rate": 2.2037110700884395e-05,
"loss": 0.3565,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25791436433792114,
"step": 1445,
"valid_targets_mean": 3419.7,
"valid_targets_min": 1345
},
{
"epoch": 3.6616161616161618,
"grad_norm": 0.5977854910500919,
"learning_rate": 2.1911760224230824e-05,
"loss": 0.3493,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33634889125823975,
"step": 1450,
"valid_targets_mean": 3442.4,
"valid_targets_min": 1773
},
{
"epoch": 3.6742424242424243,
"grad_norm": 0.6796398481161333,
"learning_rate": 2.17863339109794e-05,
"loss": 0.3525,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36308521032333374,
"step": 1455,
"valid_targets_mean": 3190.7,
"valid_targets_min": 1471
},
{
"epoch": 3.686868686868687,
"grad_norm": 0.6479531096999324,
"learning_rate": 2.166083673659973e-05,
"loss": 0.336,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35041192173957825,
"step": 1460,
"valid_targets_mean": 3109.9,
"valid_targets_min": 880
},
{
"epoch": 3.6994949494949494,
"grad_norm": 0.6190656382920072,
"learning_rate": 2.153527367937236e-05,
"loss": 0.3489,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3769229054450989,
"step": 1465,
"valid_targets_mean": 3737.9,
"valid_targets_min": 1786
},
{
"epoch": 3.712121212121212,
"grad_norm": 0.6732653753234384,
"learning_rate": 2.140964972019132e-05,
"loss": 0.3496,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3730910122394562,
"step": 1470,
"valid_targets_mean": 3028.1,
"valid_targets_min": 786
},
{
"epoch": 3.724747474747475,
"grad_norm": 0.682620817181734,
"learning_rate": 2.128396984236651e-05,
"loss": 0.339,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37931591272354126,
"step": 1475,
"valid_targets_mean": 3248.3,
"valid_targets_min": 1448
},
{
"epoch": 3.7373737373737375,
"grad_norm": 1.5193685144502576,
"learning_rate": 2.115823903142606e-05,
"loss": 0.3605,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3566587567329407,
"step": 1480,
"valid_targets_mean": 3345.8,
"valid_targets_min": 603
},
{
"epoch": 3.75,
"grad_norm": 0.6092501389476551,
"learning_rate": 2.1032462274918517e-05,
"loss": 0.3393,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30876415967941284,
"step": 1485,
"valid_targets_mean": 3301.3,
"valid_targets_min": 952
},
{
"epoch": 3.7626262626262625,
"grad_norm": 0.7276893961486488,
"learning_rate": 2.0906644562215037e-05,
"loss": 0.3381,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3389100432395935,
"step": 1490,
"valid_targets_mean": 2715.4,
"valid_targets_min": 753
},
{
"epoch": 3.775252525252525,
"grad_norm": 0.5858712774395105,
"learning_rate": 2.078079088431143e-05,
"loss": 0.3767,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3030000925064087,
"step": 1495,
"valid_targets_mean": 3219.7,
"valid_targets_min": 2366
},
{
"epoch": 3.787878787878788,
"grad_norm": 0.6888688838778153,
"learning_rate": 2.0654906233630197e-05,
"loss": 0.3738,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.416027694940567,
"step": 1500,
"valid_targets_mean": 3128.2,
"valid_targets_min": 534
},
{
"epoch": 2.516722408026756,
"grad_norm": 0.662986162649258,
"learning_rate": 3.23558282621135e-05,
"loss": 0.3218,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29847097396850586,
"step": 1505,
"valid_targets_mean": 3091.0,
"valid_targets_min": 508
},
{
"epoch": 2.5250836120401337,
"grad_norm": 0.6783328257944375,
"learning_rate": 3.229014188825108e-05,
"loss": 0.3139,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3512507975101471,
"step": 1510,
"valid_targets_mean": 3352.5,
"valid_targets_min": 1133
},
{
"epoch": 2.5334448160535117,
"grad_norm": 0.6677148404277962,
"learning_rate": 3.2224241814261216e-05,
"loss": 0.3225,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26659291982650757,
"step": 1515,
"valid_targets_mean": 2794.4,
"valid_targets_min": 1460
},
{
"epoch": 2.5418060200668897,
"grad_norm": 0.7219771342415074,
"learning_rate": 3.215812918600978e-05,
"loss": 0.3324,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3495546579360962,
"step": 1520,
"valid_targets_mean": 2987.6,
"valid_targets_min": 632
},
{
"epoch": 2.5501672240802673,
"grad_norm": 0.6560298605364091,
"learning_rate": 3.209180515305855e-05,
"loss": 0.3119,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.331092894077301,
"step": 1525,
"valid_targets_mean": 3713.1,
"valid_targets_min": 534
},
{
"epoch": 2.5585284280936453,
"grad_norm": 0.6919955457501047,
"learning_rate": 3.2025270868645146e-05,
"loss": 0.3497,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3320353925228119,
"step": 1530,
"valid_targets_mean": 3199.7,
"valid_targets_min": 1028
},
{
"epoch": 2.5668896321070234,
"grad_norm": 0.708863656128023,
"learning_rate": 3.195852748966306e-05,
"loss": 0.3478,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36112624406814575,
"step": 1535,
"valid_targets_mean": 3085.5,
"valid_targets_min": 588
},
{
"epoch": 2.5752508361204014,
"grad_norm": 0.7471046326039033,
"learning_rate": 3.189157617664151e-05,
"loss": 0.3075,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28388604521751404,
"step": 1540,
"valid_targets_mean": 2699.7,
"valid_targets_min": 620
},
{
"epoch": 2.5836120401337794,
"grad_norm": 0.7471683542567666,
"learning_rate": 3.182441809372523e-05,
"loss": 0.317,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33689889311790466,
"step": 1545,
"valid_targets_mean": 2698.6,
"valid_targets_min": 1551
},
{
"epoch": 2.591973244147157,
"grad_norm": 0.6750267862750765,
"learning_rate": 3.1757054408654266e-05,
"loss": 0.3833,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2789178192615509,
"step": 1550,
"valid_targets_mean": 2798.8,
"valid_targets_min": 1573
},
{
"epoch": 2.600334448160535,
"grad_norm": 0.681930396951124,
"learning_rate": 3.168948629274367e-05,
"loss": 0.3283,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3054756820201874,
"step": 1555,
"valid_targets_mean": 2962.2,
"valid_targets_min": 1403
},
{
"epoch": 2.608695652173913,
"grad_norm": 0.6634403273333718,
"learning_rate": 3.1621714920863104e-05,
"loss": 0.3259,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4073365032672882,
"step": 1560,
"valid_targets_mean": 4461.2,
"valid_targets_min": 1433
},
{
"epoch": 2.617056856187291,
"grad_norm": 0.8238005424494197,
"learning_rate": 3.155374147141646e-05,
"loss": 0.3604,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38494405150413513,
"step": 1565,
"valid_targets_mean": 2640.8,
"valid_targets_min": 863
},
{
"epoch": 2.625418060200669,
"grad_norm": 0.7052867973145739,
"learning_rate": 3.1485567126321295e-05,
"loss": 0.3451,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3390483260154724,
"step": 1570,
"valid_targets_mean": 3285.6,
"valid_targets_min": 1434
},
{
"epoch": 2.6337792642140467,
"grad_norm": 0.6953845280826801,
"learning_rate": 3.1417193070988383e-05,
"loss": 0.3313,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3528243601322174,
"step": 1575,
"valid_targets_mean": 3543.2,
"valid_targets_min": 1601
},
{
"epoch": 2.6421404682274248,
"grad_norm": 0.7552847898076053,
"learning_rate": 3.134862049430099e-05,
"loss": 0.3392,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39836952090263367,
"step": 1580,
"valid_targets_mean": 3433.9,
"valid_targets_min": 1805
},
{
"epoch": 2.650501672240803,
"grad_norm": 1.4277354366593005,
"learning_rate": 3.12798505885943e-05,
"loss": 0.36,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3085378408432007,
"step": 1585,
"valid_targets_mean": 3400.1,
"valid_targets_min": 1201
},
{
"epoch": 2.6588628762541804,
"grad_norm": 0.7410833217029822,
"learning_rate": 3.1210884549634624e-05,
"loss": 0.3107,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28592583537101746,
"step": 1590,
"valid_targets_mean": 2576.4,
"valid_targets_min": 1460
},
{
"epoch": 2.6672240802675584,
"grad_norm": 0.8296406296042037,
"learning_rate": 3.114172357659861e-05,
"loss": 0.3542,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.370746374130249,
"step": 1595,
"valid_targets_mean": 2589.8,
"valid_targets_min": 587
},
{
"epoch": 2.6755852842809364,
"grad_norm": 0.5928853152526612,
"learning_rate": 3.107236887205242e-05,
"loss": 0.3683,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33890628814697266,
"step": 1600,
"valid_targets_mean": 4613.9,
"valid_targets_min": 1582
},
{
"epoch": 2.6839464882943145,
"grad_norm": 0.7237916757375374,
"learning_rate": 3.1002821641930815e-05,
"loss": 0.3467,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3008784055709839,
"step": 1605,
"valid_targets_mean": 2820.9,
"valid_targets_min": 1351
},
{
"epoch": 2.6923076923076925,
"grad_norm": 0.6958603576096208,
"learning_rate": 3.093308309551616e-05,
"loss": 0.3285,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26427051424980164,
"step": 1610,
"valid_targets_mean": 2401.6,
"valid_targets_min": 377
},
{
"epoch": 2.70066889632107,
"grad_norm": 0.7246194414411228,
"learning_rate": 3.0863154445417426e-05,
"loss": 0.3112,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31494617462158203,
"step": 1615,
"valid_targets_mean": 2992.2,
"valid_targets_min": 1254
},
{
"epoch": 2.709030100334448,
"grad_norm": 0.6683077048389021,
"learning_rate": 3.079303690754908e-05,
"loss": 0.3588,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.46505263447761536,
"step": 1620,
"valid_targets_mean": 4923.4,
"valid_targets_min": 1295
},
{
"epoch": 2.717391304347826,
"grad_norm": 0.6839193880655342,
"learning_rate": 3.072273170110998e-05,
"loss": 0.344,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3480769693851471,
"step": 1625,
"valid_targets_mean": 3295.5,
"valid_targets_min": 698
},
{
"epoch": 2.7257525083612038,
"grad_norm": 0.6148350220041032,
"learning_rate": 3.0652240048562134e-05,
"loss": 0.3337,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3841598629951477,
"step": 1630,
"valid_targets_mean": 4531.8,
"valid_targets_min": 2092
},
{
"epoch": 2.734113712374582,
"grad_norm": 0.7604959335941064,
"learning_rate": 3.058156317560945e-05,
"loss": 0.3097,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3188338279724121,
"step": 1635,
"valid_targets_mean": 2672.3,
"valid_targets_min": 971
},
{
"epoch": 2.74247491638796,
"grad_norm": 0.7495694482080785,
"learning_rate": 3.0510702311176477e-05,
"loss": 0.3385,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28397685289382935,
"step": 1640,
"valid_targets_mean": 2509.3,
"valid_targets_min": 1020
},
{
"epoch": 2.750836120401338,
"grad_norm": 0.5960363613154568,
"learning_rate": 3.043965868738695e-05,
"loss": 0.33,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26706498861312866,
"step": 1645,
"valid_targets_mean": 3699.4,
"valid_targets_min": 638
},
{
"epoch": 2.759197324414716,
"grad_norm": 0.6692357148144276,
"learning_rate": 3.0368433539542433e-05,
"loss": 0.3714,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2700284719467163,
"step": 1650,
"valid_targets_mean": 3072.4,
"valid_targets_min": 1064
},
{
"epoch": 2.7675585284280935,
"grad_norm": 0.7677279753834415,
"learning_rate": 3.029702810610082e-05,
"loss": 0.3281,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3318488895893097,
"step": 1655,
"valid_targets_mean": 2859.8,
"valid_targets_min": 714
},
{
"epoch": 2.7759197324414715,
"grad_norm": 0.7231622567261902,
"learning_rate": 3.0225443628654787e-05,
"loss": 0.3182,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3072254955768585,
"step": 1660,
"valid_targets_mean": 3285.6,
"valid_targets_min": 1067
},
{
"epoch": 2.7842809364548495,
"grad_norm": 0.7351401519067079,
"learning_rate": 3.0153681351910226e-05,
"loss": 0.3046,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3622933626174927,
"step": 1665,
"valid_targets_mean": 3139.9,
"valid_targets_min": 1919
},
{
"epoch": 2.7926421404682276,
"grad_norm": 0.7218998613996677,
"learning_rate": 3.0081742523664576e-05,
"loss": 0.305,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2836865782737732,
"step": 1670,
"valid_targets_mean": 2875.6,
"valid_targets_min": 908
},
{
"epoch": 2.8010033444816056,
"grad_norm": 0.7498483662923942,
"learning_rate": 3.0009628394785158e-05,
"loss": 0.3279,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2725030481815338,
"step": 1675,
"valid_targets_mean": 2490.9,
"valid_targets_min": 858
},
{
"epoch": 2.809364548494983,
"grad_norm": 0.7901928997172852,
"learning_rate": 2.9937340219187402e-05,
"loss": 0.3407,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3297320008277893,
"step": 1680,
"valid_targets_mean": 2595.1,
"valid_targets_min": 1608
},
{
"epoch": 2.817725752508361,
"grad_norm": 0.6829285663175374,
"learning_rate": 2.986487925381304e-05,
"loss": 0.3098,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28002995252609253,
"step": 1685,
"valid_targets_mean": 2900.0,
"valid_targets_min": 810
},
{
"epoch": 2.8260869565217392,
"grad_norm": 0.7868893655628152,
"learning_rate": 2.9792246758608283e-05,
"loss": 0.3628,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3678167164325714,
"step": 1690,
"valid_targets_mean": 3206.1,
"valid_targets_min": 1573
},
{
"epoch": 2.834448160535117,
"grad_norm": 0.6961974009885317,
"learning_rate": 2.9719443996501858e-05,
"loss": 0.3441,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3555162250995636,
"step": 1695,
"valid_targets_mean": 3276.0,
"valid_targets_min": 1491
},
{
"epoch": 2.842809364548495,
"grad_norm": 0.6616306549579406,
"learning_rate": 2.9646472233383118e-05,
"loss": 0.3263,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.307451993227005,
"step": 1700,
"valid_targets_mean": 3025.1,
"valid_targets_min": 508
},
{
"epoch": 2.851170568561873,
"grad_norm": 0.699054155600686,
"learning_rate": 2.9573332738079964e-05,
"loss": 0.3428,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.325960248708725,
"step": 1705,
"valid_targets_mean": 3397.9,
"valid_targets_min": 553
},
{
"epoch": 2.859531772575251,
"grad_norm": 0.5618995876602438,
"learning_rate": 2.9500026782336828e-05,
"loss": 0.3321,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3432704210281372,
"step": 1710,
"valid_targets_mean": 5129.1,
"valid_targets_min": 794
},
{
"epoch": 2.867892976588629,
"grad_norm": 0.7396609388739099,
"learning_rate": 2.942655564079254e-05,
"loss": 0.3364,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30100107192993164,
"step": 1715,
"valid_targets_mean": 2780.6,
"valid_targets_min": 741
},
{
"epoch": 2.8762541806020065,
"grad_norm": 0.6882252256679291,
"learning_rate": 2.9352920590958173e-05,
"loss": 0.3636,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3655456006526947,
"step": 1720,
"valid_targets_mean": 3660.6,
"valid_targets_min": 1486
},
{
"epoch": 2.8846153846153846,
"grad_norm": 0.6954294304011069,
"learning_rate": 2.927912291319482e-05,
"loss": 0.2649,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2898782789707184,
"step": 1725,
"valid_targets_mean": 2949.5,
"valid_targets_min": 1417
},
{
"epoch": 2.8929765886287626,
"grad_norm": 0.7685790812651909,
"learning_rate": 2.9205163890691338e-05,
"loss": 0.3633,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.351645827293396,
"step": 1730,
"valid_targets_mean": 3392.4,
"valid_targets_min": 1028
},
{
"epoch": 2.90133779264214,
"grad_norm": 0.6514952351452494,
"learning_rate": 2.9131044809442038e-05,
"loss": 0.3061,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27277517318725586,
"step": 1735,
"valid_targets_mean": 3230.4,
"valid_targets_min": 1120
},
{
"epoch": 2.9096989966555182,
"grad_norm": 0.6336596359886507,
"learning_rate": 2.9056766958224324e-05,
"loss": 0.3282,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31338661909103394,
"step": 1740,
"valid_targets_mean": 3871.8,
"valid_targets_min": 726
},
{
"epoch": 2.9180602006688963,
"grad_norm": 0.7074870527746576,
"learning_rate": 2.898233162857627e-05,
"loss": 0.3159,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31244152784347534,
"step": 1745,
"valid_targets_mean": 3252.4,
"valid_targets_min": 1672
},
{
"epoch": 2.9264214046822743,
"grad_norm": 0.7317476390005567,
"learning_rate": 2.8907740114774185e-05,
"loss": 0.3326,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3308480381965637,
"step": 1750,
"valid_targets_mean": 2940.5,
"valid_targets_min": 971
},
{
"epoch": 2.9347826086956523,
"grad_norm": 0.669207925359114,
"learning_rate": 2.8832993713810095e-05,
"loss": 0.3291,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34635135531425476,
"step": 1755,
"valid_targets_mean": 3485.1,
"valid_targets_min": 772
},
{
"epoch": 2.94314381270903,
"grad_norm": 0.7081348378617047,
"learning_rate": 2.8758093725369193e-05,
"loss": 0.3508,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.41460931301116943,
"step": 1760,
"valid_targets_mean": 3348.2,
"valid_targets_min": 580
},
{
"epoch": 2.951505016722408,
"grad_norm": 0.6563436808159772,
"learning_rate": 2.868304145180722e-05,
"loss": 0.363,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.43143677711486816,
"step": 1765,
"valid_targets_mean": 5450.4,
"valid_targets_min": 1058
},
{
"epoch": 2.959866220735786,
"grad_norm": 1.0813836021947982,
"learning_rate": 2.8607838198127886e-05,
"loss": 0.3024,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3358667194843292,
"step": 1770,
"valid_targets_mean": 2942.9,
"valid_targets_min": 556
},
{
"epoch": 2.968227424749164,
"grad_norm": 0.6535458920771104,
"learning_rate": 2.8532485271960088e-05,
"loss": 0.3272,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30923616886138916,
"step": 1775,
"valid_targets_mean": 3134.3,
"valid_targets_min": 1443
},
{
"epoch": 2.976588628762542,
"grad_norm": 0.7051449951363025,
"learning_rate": 2.8456983983535243e-05,
"loss": 0.3081,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3197246789932251,
"step": 1780,
"valid_targets_mean": 3088.7,
"valid_targets_min": 722
},
{
"epoch": 2.9849498327759196,
"grad_norm": 0.7514550832469282,
"learning_rate": 2.838133564566447e-05,
"loss": 0.3221,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33178478479385376,
"step": 1785,
"valid_targets_mean": 2903.9,
"valid_targets_min": 1051
},
{
"epoch": 2.9933110367892977,
"grad_norm": 0.7487764007212119,
"learning_rate": 2.8305541573715775e-05,
"loss": 0.355,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32397782802581787,
"step": 1790,
"valid_targets_mean": 2655.2,
"valid_targets_min": 364
},
{
"epoch": 3.0016722408026757,
"grad_norm": 0.697866012772672,
"learning_rate": 2.8229603085591178e-05,
"loss": 0.3045,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24206683039665222,
"step": 1795,
"valid_targets_mean": 2628.6,
"valid_targets_min": 1232
},
{
"epoch": 3.0100334448160537,
"grad_norm": 0.7292123243657525,
"learning_rate": 2.8153521501703803e-05,
"loss": 0.3032,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32684776186943054,
"step": 1800,
"valid_targets_mean": 3399.4,
"valid_targets_min": 1615
},
{
"epoch": 3.0183946488294313,
"grad_norm": 0.7473811261850504,
"learning_rate": 2.8077298144954904e-05,
"loss": 0.2602,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2628287672996521,
"step": 1805,
"valid_targets_mean": 2887.2,
"valid_targets_min": 807
},
{
"epoch": 3.0267558528428093,
"grad_norm": 0.7650083502129927,
"learning_rate": 2.8000934340710883e-05,
"loss": 0.316,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30963340401649475,
"step": 1810,
"valid_targets_mean": 3063.6,
"valid_targets_min": 1264
},
{
"epoch": 3.0351170568561874,
"grad_norm": 0.7397530221539242,
"learning_rate": 2.792443141678022e-05,
"loss": 0.304,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27429091930389404,
"step": 1815,
"valid_targets_mean": 2718.4,
"valid_targets_min": 757
},
{
"epoch": 3.0434782608695654,
"grad_norm": 0.889361629882369,
"learning_rate": 2.784779070339041e-05,
"loss": 0.316,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3256457448005676,
"step": 1820,
"valid_targets_mean": 2798.4,
"valid_targets_min": 470
},
{
"epoch": 3.051839464882943,
"grad_norm": 0.6809205141917194,
"learning_rate": 2.7771013533164805e-05,
"loss": 0.3188,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3276858329772949,
"step": 1825,
"valid_targets_mean": 3351.5,
"valid_targets_min": 399
},
{
"epoch": 3.060200668896321,
"grad_norm": 0.6744548172485136,
"learning_rate": 2.7694101241099484e-05,
"loss": 0.3659,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4031035006046295,
"step": 1830,
"valid_targets_mean": 4916.2,
"valid_targets_min": 772
},
{
"epoch": 3.068561872909699,
"grad_norm": 0.7582120508573842,
"learning_rate": 2.7617055164539993e-05,
"loss": 0.3349,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31827855110168457,
"step": 1835,
"valid_targets_mean": 2926.5,
"valid_targets_min": 2041
},
{
"epoch": 3.076923076923077,
"grad_norm": 0.8315396768017139,
"learning_rate": 2.753987664315813e-05,
"loss": 0.3021,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35661745071411133,
"step": 1840,
"valid_targets_mean": 2858.8,
"valid_targets_min": 726
},
{
"epoch": 3.0852842809364547,
"grad_norm": 0.7155190185107607,
"learning_rate": 2.746256701892861e-05,
"loss": 0.3741,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3801868259906769,
"step": 1845,
"valid_targets_mean": 4064.2,
"valid_targets_min": 1411
},
{
"epoch": 3.0936454849498327,
"grad_norm": 0.6741071495612008,
"learning_rate": 2.738512763610579e-05,
"loss": 0.308,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37737980484962463,
"step": 1850,
"valid_targets_mean": 4971.6,
"valid_targets_min": 1956
},
{
"epoch": 3.1020066889632107,
"grad_norm": 0.7590694014485702,
"learning_rate": 2.7307559841200238e-05,
"loss": 0.3291,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3324778079986572,
"step": 1855,
"valid_targets_mean": 2946.1,
"valid_targets_min": 1303
},
{
"epoch": 3.1103678929765888,
"grad_norm": 0.7215558419615479,
"learning_rate": 2.7229864982955328e-05,
"loss": 0.3186,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3469077944755554,
"step": 1860,
"valid_targets_mean": 3110.1,
"valid_targets_min": 1665
},
{
"epoch": 3.1187290969899664,
"grad_norm": 0.6897412184844943,
"learning_rate": 2.7152044412323842e-05,
"loss": 0.3075,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28832149505615234,
"step": 1865,
"valid_targets_mean": 3266.5,
"valid_targets_min": 1272
},
{
"epoch": 3.1270903010033444,
"grad_norm": 0.8950983106159963,
"learning_rate": 2.7074099482444406e-05,
"loss": 0.3128,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3346301317214966,
"step": 1870,
"valid_targets_mean": 2962.5,
"valid_targets_min": 794
},
{
"epoch": 3.1354515050167224,
"grad_norm": 0.6829362728624939,
"learning_rate": 2.699603154861801e-05,
"loss": 0.3217,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2530469298362732,
"step": 1875,
"valid_targets_mean": 3057.2,
"valid_targets_min": 1148
},
{
"epoch": 3.1438127090301005,
"grad_norm": 0.7233648289737619,
"learning_rate": 2.6917841968284433e-05,
"loss": 0.3161,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3072529733181,
"step": 1880,
"valid_targets_mean": 2967.2,
"valid_targets_min": 1431
},
{
"epoch": 3.1521739130434785,
"grad_norm": 0.7416457175298982,
"learning_rate": 2.6839532100998623e-05,
"loss": 0.3185,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3872751295566559,
"step": 1885,
"valid_targets_mean": 3862.7,
"valid_targets_min": 1334
},
{
"epoch": 3.160535117056856,
"grad_norm": 0.7812518570866998,
"learning_rate": 2.6761103308407076e-05,
"loss": 0.3277,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25746119022369385,
"step": 1890,
"valid_targets_mean": 2487.5,
"valid_targets_min": 844
},
{
"epoch": 3.168896321070234,
"grad_norm": 0.7436986096190392,
"learning_rate": 2.668255695422415e-05,
"loss": 0.3709,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37360888719558716,
"step": 1895,
"valid_targets_mean": 3813.4,
"valid_targets_min": 1554
},
{
"epoch": 3.177257525083612,
"grad_norm": 0.7142319442876787,
"learning_rate": 2.660389440420836e-05,
"loss": 0.3068,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.272394061088562,
"step": 1900,
"valid_targets_mean": 2995.9,
"valid_targets_min": 1008
},
{
"epoch": 3.1856187290969897,
"grad_norm": 0.7424793152458009,
"learning_rate": 2.6525117026138614e-05,
"loss": 0.3392,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34922927618026733,
"step": 1905,
"valid_targets_mean": 3819.7,
"valid_targets_min": 1601
},
{
"epoch": 3.1939799331103678,
"grad_norm": 0.7607562321366768,
"learning_rate": 2.644622618979047e-05,
"loss": 0.2896,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24981051683425903,
"step": 1910,
"valid_targets_mean": 2548.7,
"valid_targets_min": 923
},
{
"epoch": 3.202341137123746,
"grad_norm": 0.6904862318660174,
"learning_rate": 2.6367223266912252e-05,
"loss": 0.3317,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37764304876327515,
"step": 1915,
"valid_targets_mean": 3910.4,
"valid_targets_min": 1349
},
{
"epoch": 3.210702341137124,
"grad_norm": 0.8961099343679048,
"learning_rate": 2.6288109631201266e-05,
"loss": 0.3337,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3819909393787384,
"step": 1920,
"valid_targets_mean": 2620.2,
"valid_targets_min": 942
},
{
"epoch": 3.219063545150502,
"grad_norm": 0.7566386982431123,
"learning_rate": 2.6208886658279875e-05,
"loss": 0.3137,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3507644534111023,
"step": 1925,
"valid_targets_mean": 3339.7,
"valid_targets_min": 1683
},
{
"epoch": 3.2274247491638794,
"grad_norm": 0.8144566736238488,
"learning_rate": 2.6129555725671586e-05,
"loss": 0.3041,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3747752010822296,
"step": 1930,
"valid_targets_mean": 2877.8,
"valid_targets_min": 1324
},
{
"epoch": 3.2357859531772575,
"grad_norm": 0.8094873874087346,
"learning_rate": 2.605011821277712e-05,
"loss": 0.306,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3171420693397522,
"step": 1935,
"valid_targets_mean": 2959.7,
"valid_targets_min": 783
},
{
"epoch": 3.2441471571906355,
"grad_norm": 0.8547392925559153,
"learning_rate": 2.597057550085037e-05,
"loss": 0.3001,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27529996633529663,
"step": 1940,
"valid_targets_mean": 2264.8,
"valid_targets_min": 971
},
{
"epoch": 3.2525083612040135,
"grad_norm": 0.6817740682466431,
"learning_rate": 2.589092897297447e-05,
"loss": 0.3122,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33298245072364807,
"step": 1945,
"valid_targets_mean": 3641.5,
"valid_targets_min": 2028
},
{
"epoch": 3.260869565217391,
"grad_norm": 0.7178992056677376,
"learning_rate": 2.581118001403767e-05,
"loss": 0.3346,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.298176109790802,
"step": 1950,
"valid_targets_mean": 2812.1,
"valid_targets_min": 1666
},
{
"epoch": 3.269230769230769,
"grad_norm": 0.821395268384391,
"learning_rate": 2.573133001070928e-05,
"loss": 0.3032,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32294681668281555,
"step": 1955,
"valid_targets_mean": 2872.3,
"valid_targets_min": 1526
},
{
"epoch": 3.277591973244147,
"grad_norm": 0.7018121583116861,
"learning_rate": 2.565138035141558e-05,
"loss": 0.3199,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32964542508125305,
"step": 1960,
"valid_targets_mean": 3175.1,
"valid_targets_min": 1682
},
{
"epoch": 3.2859531772575252,
"grad_norm": 1.1803702361445025,
"learning_rate": 2.557133242631565e-05,
"loss": 0.3063,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3171846866607666,
"step": 1965,
"valid_targets_mean": 3355.6,
"valid_targets_min": 467
},
{
"epoch": 3.294314381270903,
"grad_norm": 0.6610850683002595,
"learning_rate": 2.549118762727721e-05,
"loss": 0.3053,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24194839596748352,
"step": 1970,
"valid_targets_mean": 3080.6,
"valid_targets_min": 1573
},
{
"epoch": 3.302675585284281,
"grad_norm": 0.7255555656749366,
"learning_rate": 2.5410947347852436e-05,
"loss": 0.3355,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4482927620410919,
"step": 1975,
"valid_targets_mean": 4331.0,
"valid_targets_min": 1168
},
{
"epoch": 3.311036789297659,
"grad_norm": 0.7459931964816805,
"learning_rate": 2.5330612983253667e-05,
"loss": 0.3369,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28639882802963257,
"step": 1980,
"valid_targets_mean": 3048.4,
"valid_targets_min": 1599
},
{
"epoch": 3.319397993311037,
"grad_norm": 0.7132568663511498,
"learning_rate": 2.5250185930329235e-05,
"loss": 0.3194,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3665810227394104,
"step": 1985,
"valid_targets_mean": 3538.0,
"valid_targets_min": 1274
},
{
"epoch": 3.327759197324415,
"grad_norm": 0.8008208379218488,
"learning_rate": 2.5169667587539105e-05,
"loss": 0.3226,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30878740549087524,
"step": 1990,
"valid_targets_mean": 2999.9,
"valid_targets_min": 553
},
{
"epoch": 3.3361204013377925,
"grad_norm": 0.7114926198475543,
"learning_rate": 2.5089059354930584e-05,
"loss": 0.3253,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3151680827140808,
"step": 1995,
"valid_targets_mean": 3198.5,
"valid_targets_min": 1876
},
{
"epoch": 3.3444816053511706,
"grad_norm": 0.6910899592340489,
"learning_rate": 2.5008362634113986e-05,
"loss": 0.3158,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27248960733413696,
"step": 2000,
"valid_targets_mean": 3219.5,
"valid_targets_min": 1548
},
{
"epoch": 3.3528428093645486,
"grad_norm": 0.9194983641690248,
"learning_rate": 2.4927578828238253e-05,
"loss": 0.2827,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30196303129196167,
"step": 2005,
"valid_targets_mean": 2675.1,
"valid_targets_min": 1560
},
{
"epoch": 3.361204013377926,
"grad_norm": 0.7413625053509546,
"learning_rate": 2.484670934196654e-05,
"loss": 0.3028,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2616788148880005,
"step": 2010,
"valid_targets_mean": 2792.3,
"valid_targets_min": 1188
},
{
"epoch": 3.369565217391304,
"grad_norm": 0.7183291854874223,
"learning_rate": 2.476575558145183e-05,
"loss": 0.3222,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3487267792224884,
"step": 2015,
"valid_targets_mean": 3637.6,
"valid_targets_min": 1018
},
{
"epoch": 3.3779264214046822,
"grad_norm": 0.7490283521521003,
"learning_rate": 2.468471895431243e-05,
"loss": 0.3021,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.325644314289093,
"step": 2020,
"valid_targets_mean": 3182.8,
"valid_targets_min": 1285
},
{
"epoch": 3.3862876254180603,
"grad_norm": 0.7101402332669482,
"learning_rate": 2.4603600869607564e-05,
"loss": 0.3267,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2660444378852844,
"step": 2025,
"valid_targets_mean": 2812.0,
"valid_targets_min": 1258
},
{
"epoch": 3.3946488294314383,
"grad_norm": 0.730576453198831,
"learning_rate": 2.452240273781281e-05,
"loss": 0.3016,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26417773962020874,
"step": 2030,
"valid_targets_mean": 3180.6,
"valid_targets_min": 729
},
{
"epoch": 3.403010033444816,
"grad_norm": 0.7181814679922088,
"learning_rate": 2.444112597079558e-05,
"loss": 0.3162,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2812889814376831,
"step": 2035,
"valid_targets_mean": 3133.4,
"valid_targets_min": 1126
},
{
"epoch": 3.411371237458194,
"grad_norm": 0.7924112516136512,
"learning_rate": 2.435977198179065e-05,
"loss": 0.3287,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27810171246528625,
"step": 2040,
"valid_targets_mean": 2717.6,
"valid_targets_min": 682
},
{
"epoch": 3.419732441471572,
"grad_norm": 0.707141761893294,
"learning_rate": 2.4278342185375467e-05,
"loss": 0.3362,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31040269136428833,
"step": 2045,
"valid_targets_mean": 3125.6,
"valid_targets_min": 1931
},
{
"epoch": 3.42809364548495,
"grad_norm": 0.7561619308472627,
"learning_rate": 2.4196837997445636e-05,
"loss": 0.3243,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3123628795146942,
"step": 2050,
"valid_targets_mean": 3224.0,
"valid_targets_min": 1631
},
{
"epoch": 3.4364548494983276,
"grad_norm": 0.7289170075667627,
"learning_rate": 2.4115260835190285e-05,
"loss": 0.2989,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2535760998725891,
"step": 2055,
"valid_targets_mean": 3353.6,
"valid_targets_min": 1805
},
{
"epoch": 3.4448160535117056,
"grad_norm": 0.945847336384475,
"learning_rate": 2.4033612117067396e-05,
"loss": 0.2888,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2784852981567383,
"step": 2060,
"valid_targets_mean": 3911.6,
"valid_targets_min": 1064
},
{
"epoch": 3.4531772575250836,
"grad_norm": 0.7817559218890252,
"learning_rate": 2.395189326277918e-05,
"loss": 0.2968,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3658587336540222,
"step": 2065,
"valid_targets_mean": 3038.2,
"valid_targets_min": 1011
},
{
"epoch": 3.4615384615384617,
"grad_norm": 0.7908249845730267,
"learning_rate": 2.3870105693247347e-05,
"loss": 0.3314,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.40112197399139404,
"step": 2070,
"valid_targets_mean": 3198.5,
"valid_targets_min": 707
},
{
"epoch": 3.4698996655518393,
"grad_norm": 0.7869243206602189,
"learning_rate": 2.3788250830588437e-05,
"loss": 0.3191,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2704690992832184,
"step": 2075,
"valid_targets_mean": 2424.8,
"valid_targets_min": 580
},
{
"epoch": 3.4782608695652173,
"grad_norm": 0.7080463514373667,
"learning_rate": 2.3706330098089077e-05,
"loss": 0.314,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3315350413322449,
"step": 2080,
"valid_targets_mean": 4324.7,
"valid_targets_min": 1855
},
{
"epoch": 3.4866220735785953,
"grad_norm": 0.8218808851621214,
"learning_rate": 2.3624344920181243e-05,
"loss": 0.2889,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3174235224723816,
"step": 2085,
"valid_targets_mean": 2845.2,
"valid_targets_min": 1569
},
{
"epoch": 3.4949832775919734,
"grad_norm": 0.7054886370767576,
"learning_rate": 2.3542296722417452e-05,
"loss": 0.3309,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3576347529888153,
"step": 2090,
"valid_targets_mean": 3957.9,
"valid_targets_min": 1892
},
{
"epoch": 3.5033444816053514,
"grad_norm": 0.7737550873720773,
"learning_rate": 2.346018693144605e-05,
"loss": 0.3147,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3562350869178772,
"step": 2095,
"valid_targets_mean": 3385.3,
"valid_targets_min": 1565
},
{
"epoch": 3.511705685618729,
"grad_norm": 0.793659888489234,
"learning_rate": 2.3378016974986326e-05,
"loss": 0.3287,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3222711384296417,
"step": 2100,
"valid_targets_mean": 2910.6,
"valid_targets_min": 1569
},
{
"epoch": 3.520066889632107,
"grad_norm": 0.8708230054218504,
"learning_rate": 2.3295788281803733e-05,
"loss": 0.3126,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33255574107170105,
"step": 2105,
"valid_targets_mean": 3600.3,
"valid_targets_min": 1512
},
{
"epoch": 3.528428093645485,
"grad_norm": 0.7022641595914034,
"learning_rate": 2.321350228168505e-05,
"loss": 0.2912,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3107645511627197,
"step": 2110,
"valid_targets_mean": 3758.8,
"valid_targets_min": 1562
},
{
"epoch": 3.5367892976588626,
"grad_norm": 0.8652735159983888,
"learning_rate": 2.3131160405413472e-05,
"loss": 0.2842,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26982659101486206,
"step": 2115,
"valid_targets_mean": 2795.1,
"valid_targets_min": 1208
},
{
"epoch": 3.5451505016722407,
"grad_norm": 0.656569555739008,
"learning_rate": 2.30487640847438e-05,
"loss": 0.3267,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3019533157348633,
"step": 2120,
"valid_targets_mean": 3843.1,
"valid_targets_min": 1730
},
{
"epoch": 3.5535117056856187,
"grad_norm": 0.721412813412654,
"learning_rate": 2.296631475237749e-05,
"loss": 0.3217,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.326846718788147,
"step": 2125,
"valid_targets_mean": 3144.4,
"valid_targets_min": 963
},
{
"epoch": 3.5618729096989967,
"grad_norm": 0.8698536209082071,
"learning_rate": 2.2883813841937754e-05,
"loss": 0.3396,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32312431931495667,
"step": 2130,
"valid_targets_mean": 2314.3,
"valid_targets_min": 467
},
{
"epoch": 3.5702341137123748,
"grad_norm": 0.8109874750171677,
"learning_rate": 2.2801262787944668e-05,
"loss": 0.3159,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.298412948846817,
"step": 2135,
"valid_targets_mean": 3258.5,
"valid_targets_min": 1480
},
{
"epoch": 3.5785953177257523,
"grad_norm": 0.8162989082018804,
"learning_rate": 2.2718663025790183e-05,
"loss": 0.3138,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2839236259460449,
"step": 2140,
"valid_targets_mean": 2840.1,
"valid_targets_min": 1006
},
{
"epoch": 3.5869565217391304,
"grad_norm": 0.8038116768717268,
"learning_rate": 2.2636015991713167e-05,
"loss": 0.3237,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3331753611564636,
"step": 2145,
"valid_targets_mean": 2935.8,
"valid_targets_min": 1186
},
{
"epoch": 3.5953177257525084,
"grad_norm": 0.7739334985662348,
"learning_rate": 2.2553323122774487e-05,
"loss": 0.2988,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3323972821235657,
"step": 2150,
"valid_targets_mean": 3164.0,
"valid_targets_min": 527
},
{
"epoch": 3.6036789297658864,
"grad_norm": 0.7740161292149046,
"learning_rate": 2.2470585856831953e-05,
"loss": 0.2824,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25347644090652466,
"step": 2155,
"valid_targets_mean": 2834.1,
"valid_targets_min": 1341
},
{
"epoch": 3.6120401337792645,
"grad_norm": 0.6771441745861378,
"learning_rate": 2.2387805632515365e-05,
"loss": 0.3432,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31761401891708374,
"step": 2160,
"valid_targets_mean": 4497.9,
"valid_targets_min": 699
},
{
"epoch": 3.620401337792642,
"grad_norm": 0.7521566633081039,
"learning_rate": 2.2304983889201467e-05,
"loss": 0.3186,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3334948420524597,
"step": 2165,
"valid_targets_mean": 3627.6,
"valid_targets_min": 1882
},
{
"epoch": 3.62876254180602,
"grad_norm": 0.7031338023674866,
"learning_rate": 2.222212206698894e-05,
"loss": 0.3302,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24446901679039001,
"step": 2170,
"valid_targets_mean": 2985.4,
"valid_targets_min": 620
},
{
"epoch": 3.637123745819398,
"grad_norm": 0.6866912372395072,
"learning_rate": 2.2139221606673353e-05,
"loss": 0.3618,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3053354024887085,
"step": 2175,
"valid_targets_mean": 3322.4,
"valid_targets_min": 1844
},
{
"epoch": 3.6454849498327757,
"grad_norm": 0.7043379955622305,
"learning_rate": 2.2056283949722114e-05,
"loss": 0.3045,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29806143045425415,
"step": 2180,
"valid_targets_mean": 3245.2,
"valid_targets_min": 1284
},
{
"epoch": 3.6538461538461537,
"grad_norm": 0.7223387295053122,
"learning_rate": 2.197331053824939e-05,
"loss": 0.2912,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2715410888195038,
"step": 2185,
"valid_targets_mean": 3403.3,
"valid_targets_min": 1091
},
{
"epoch": 3.6622073578595318,
"grad_norm": 0.7923524210124755,
"learning_rate": 2.1890302814991075e-05,
"loss": 0.293,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27055805921554565,
"step": 2190,
"valid_targets_mean": 2505.2,
"valid_targets_min": 808
},
{
"epoch": 3.67056856187291,
"grad_norm": 0.9333927510801652,
"learning_rate": 2.1807262223279633e-05,
"loss": 0.2979,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33472126722335815,
"step": 2195,
"valid_targets_mean": 2667.6,
"valid_targets_min": 1058
},
{
"epoch": 3.678929765886288,
"grad_norm": 0.7418078632890535,
"learning_rate": 2.172419020701907e-05,
"loss": 0.3113,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2958923280239105,
"step": 2200,
"valid_targets_mean": 3098.1,
"valid_targets_min": 663
},
{
"epoch": 3.6872909698996654,
"grad_norm": 0.8027987445224076,
"learning_rate": 2.1641088210659804e-05,
"loss": 0.3027,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.294519305229187,
"step": 2205,
"valid_targets_mean": 2970.6,
"valid_targets_min": 594
},
{
"epoch": 3.6956521739130435,
"grad_norm": 0.8206281052811005,
"learning_rate": 2.155795767917352e-05,
"loss": 0.2961,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31719639897346497,
"step": 2210,
"valid_targets_mean": 3145.6,
"valid_targets_min": 1123
},
{
"epoch": 3.7040133779264215,
"grad_norm": 0.7960144879970568,
"learning_rate": 2.14748000580281e-05,
"loss": 0.3162,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3015314042568207,
"step": 2215,
"valid_targets_mean": 2424.9,
"valid_targets_min": 1020
},
{
"epoch": 3.712374581939799,
"grad_norm": 0.7242043132987579,
"learning_rate": 2.1391616793162435e-05,
"loss": 0.319,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29711389541625977,
"step": 2220,
"valid_targets_mean": 3244.1,
"valid_targets_min": 599
},
{
"epoch": 3.720735785953177,
"grad_norm": 0.8514530826111597,
"learning_rate": 2.1308409330961308e-05,
"loss": 0.309,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3484026789665222,
"step": 2225,
"valid_targets_mean": 3235.6,
"valid_targets_min": 509
},
{
"epoch": 3.729096989966555,
"grad_norm": 0.7964054451384952,
"learning_rate": 2.122517911823027e-05,
"loss": 0.3255,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2610142230987549,
"step": 2230,
"valid_targets_mean": 2320.4,
"valid_targets_min": 779
},
{
"epoch": 3.737458193979933,
"grad_norm": 0.8055361034248192,
"learning_rate": 2.114192760217042e-05,
"loss": 0.2997,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3181573450565338,
"step": 2235,
"valid_targets_mean": 3128.3,
"valid_targets_min": 799
},
{
"epoch": 3.745819397993311,
"grad_norm": 0.7412318158314767,
"learning_rate": 2.10586562303533e-05,
"loss": 0.2753,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2673335671424866,
"step": 2240,
"valid_targets_mean": 2812.3,
"valid_targets_min": 511
},
{
"epoch": 3.754180602006689,
"grad_norm": 0.806735595661349,
"learning_rate": 2.0975366450695707e-05,
"loss": 0.2901,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34919291734695435,
"step": 2245,
"valid_targets_mean": 2936.5,
"valid_targets_min": 723
},
{
"epoch": 3.762541806020067,
"grad_norm": 0.7799986710841482,
"learning_rate": 2.0892059711434496e-05,
"loss": 0.3019,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30157431960105896,
"step": 2250,
"valid_targets_mean": 2891.5,
"valid_targets_min": 937
},
{
"epoch": 3.770903010033445,
"grad_norm": 0.6961704800642899,
"learning_rate": 2.0808737461101417e-05,
"loss": 0.2889,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2948909401893616,
"step": 2255,
"valid_targets_mean": 3901.8,
"valid_targets_min": 511
},
{
"epoch": 3.779264214046823,
"grad_norm": 0.6430882576013616,
"learning_rate": 2.0725401148497946e-05,
"loss": 0.3453,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36942294239997864,
"step": 2260,
"valid_targets_mean": 4432.6,
"valid_targets_min": 2022
},
{
"epoch": 3.787625418060201,
"grad_norm": 0.9476578148171562,
"learning_rate": 2.0642052222670043e-05,
"loss": 0.3016,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34764429926872253,
"step": 2265,
"valid_targets_mean": 2577.2,
"valid_targets_min": 586
},
{
"epoch": 3.7959866220735785,
"grad_norm": 0.8377190542394216,
"learning_rate": 2.0558692132883008e-05,
"loss": 0.31,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3148440420627594,
"step": 2270,
"valid_targets_mean": 2928.6,
"valid_targets_min": 1524
},
{
"epoch": 3.8043478260869565,
"grad_norm": 0.7674746381928171,
"learning_rate": 2.047532232859625e-05,
"loss": 0.3163,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2882377505302429,
"step": 2275,
"valid_targets_mean": 3211.1,
"valid_targets_min": 666
},
{
"epoch": 3.8127090301003346,
"grad_norm": 0.7603539777572138,
"learning_rate": 2.039194425943808e-05,
"loss": 0.3297,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28924140334129333,
"step": 2280,
"valid_targets_mean": 2899.9,
"valid_targets_min": 1333
},
{
"epoch": 3.821070234113712,
"grad_norm": 0.6686475071499299,
"learning_rate": 2.0308559375180557e-05,
"loss": 0.274,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22952501475811005,
"step": 2285,
"valid_targets_mean": 2880.6,
"valid_targets_min": 1364
},
{
"epoch": 3.82943143812709,
"grad_norm": 0.9368254198322394,
"learning_rate": 2.0225169125714193e-05,
"loss": 0.3089,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3129611909389496,
"step": 2290,
"valid_targets_mean": 3224.8,
"valid_targets_min": 1399
},
{
"epoch": 3.8377926421404682,
"grad_norm": 0.8093927362873512,
"learning_rate": 2.0141774961022826e-05,
"loss": 0.2892,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30943459272384644,
"step": 2295,
"valid_targets_mean": 2797.4,
"valid_targets_min": 1188
},
{
"epoch": 3.8461538461538463,
"grad_norm": 0.8283893332898696,
"learning_rate": 2.0058378331158357e-05,
"loss": 0.2882,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3456169366836548,
"step": 2300,
"valid_targets_mean": 3146.9,
"valid_targets_min": 983
},
{
"epoch": 3.8545150501672243,
"grad_norm": 0.8137074950993536,
"learning_rate": 1.9974980686215546e-05,
"loss": 0.2795,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24720898270606995,
"step": 2305,
"valid_targets_mean": 2561.4,
"valid_targets_min": 1072
},
{
"epoch": 3.862876254180602,
"grad_norm": 0.7732084599764113,
"learning_rate": 1.9891583476306814e-05,
"loss": 0.327,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31134891510009766,
"step": 2310,
"valid_targets_mean": 2994.1,
"valid_targets_min": 377
},
{
"epoch": 3.87123745819398,
"grad_norm": 0.7919123584972602,
"learning_rate": 1.9808188151537008e-05,
"loss": 0.2996,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25116395950317383,
"step": 2315,
"valid_targets_mean": 2886.5,
"valid_targets_min": 1120
},
{
"epoch": 3.879598662207358,
"grad_norm": 0.7406481098660109,
"learning_rate": 1.972479616197821e-05,
"loss": 0.3043,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27166545391082764,
"step": 2320,
"valid_targets_mean": 3462.1,
"valid_targets_min": 1420
},
{
"epoch": 3.8879598662207355,
"grad_norm": 0.8731416317069042,
"learning_rate": 1.96414089576445e-05,
"loss": 0.2973,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35053551197052,
"step": 2325,
"valid_targets_mean": 2947.4,
"valid_targets_min": 918
},
{
"epoch": 3.8963210702341136,
"grad_norm": 0.7355424472980551,
"learning_rate": 1.9558027988466743e-05,
"loss": 0.3077,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31646502017974854,
"step": 2330,
"valid_targets_mean": 3953.5,
"valid_targets_min": 1805
},
{
"epoch": 3.9046822742474916,
"grad_norm": 0.7933779157508104,
"learning_rate": 1.947465470426741e-05,
"loss": 0.3036,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2982478141784668,
"step": 2335,
"valid_targets_mean": 3171.0,
"valid_targets_min": 587
},
{
"epoch": 3.9130434782608696,
"grad_norm": 0.8102903523307262,
"learning_rate": 1.9391290554735326e-05,
"loss": 0.3092,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3341084122657776,
"step": 2340,
"valid_targets_mean": 2779.8,
"valid_targets_min": 919
},
{
"epoch": 3.9214046822742477,
"grad_norm": 0.7472511964464619,
"learning_rate": 1.93079369894005e-05,
"loss": 0.3187,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30373987555503845,
"step": 2345,
"valid_targets_mean": 3103.1,
"valid_targets_min": 1099
},
{
"epoch": 3.9297658862876252,
"grad_norm": 0.7947702151134352,
"learning_rate": 1.922459545760889e-05,
"loss": 0.3175,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.363625705242157,
"step": 2350,
"valid_targets_mean": 3638.0,
"valid_targets_min": 1698
},
{
"epoch": 3.9381270903010033,
"grad_norm": 0.8068716471695595,
"learning_rate": 1.914126740849723e-05,
"loss": 0.3014,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2704453766345978,
"step": 2355,
"valid_targets_mean": 2755.2,
"valid_targets_min": 1140
},
{
"epoch": 3.9464882943143813,
"grad_norm": 0.8320104780946185,
"learning_rate": 1.9057954290967795e-05,
"loss": 0.3297,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38438886404037476,
"step": 2360,
"valid_targets_mean": 4250.0,
"valid_targets_min": 1306
},
{
"epoch": 3.9548494983277593,
"grad_norm": 0.7539305683119704,
"learning_rate": 1.897465755366325e-05,
"loss": 0.3009,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3422359228134155,
"step": 2365,
"valid_targets_mean": 3382.0,
"valid_targets_min": 692
},
{
"epoch": 3.9632107023411374,
"grad_norm": 0.7840574192641151,
"learning_rate": 1.8891378644941437e-05,
"loss": 0.2832,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31690046191215515,
"step": 2370,
"valid_targets_mean": 3137.6,
"valid_targets_min": 978
},
{
"epoch": 3.971571906354515,
"grad_norm": 0.7175563191342146,
"learning_rate": 1.88081190128502e-05,
"loss": 0.2915,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30410125851631165,
"step": 2375,
"valid_targets_mean": 3167.8,
"valid_targets_min": 1180
},
{
"epoch": 3.979933110367893,
"grad_norm": 0.7773926485050648,
"learning_rate": 1.8724880105102196e-05,
"loss": 0.2751,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2675161361694336,
"step": 2380,
"valid_targets_mean": 3070.1,
"valid_targets_min": 1741
},
{
"epoch": 3.988294314381271,
"grad_norm": 0.7560734554908822,
"learning_rate": 1.8641663369049724e-05,
"loss": 0.287,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2527911365032196,
"step": 2385,
"valid_targets_mean": 2798.2,
"valid_targets_min": 660
},
{
"epoch": 3.9966555183946486,
"grad_norm": 0.9060459955316458,
"learning_rate": 1.8558470251659574e-05,
"loss": 0.2824,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27911093831062317,
"step": 2390,
"valid_targets_mean": 2562.9,
"valid_targets_min": 633
},
{
"epoch": 4.005016722408027,
"grad_norm": 0.8594449711299057,
"learning_rate": 1.8475302199487848e-05,
"loss": 0.309,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2793564200401306,
"step": 2395,
"valid_targets_mean": 3010.3,
"valid_targets_min": 1511
},
{
"epoch": 4.013377926421405,
"grad_norm": 0.8838950374531943,
"learning_rate": 1.8392160658654826e-05,
"loss": 0.2648,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3361824154853821,
"step": 2400,
"valid_targets_mean": 3615.7,
"valid_targets_min": 1133
},
{
"epoch": 4.021739130434782,
"grad_norm": 0.7437793364772181,
"learning_rate": 1.8309047074819805e-05,
"loss": 0.3187,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2967781126499176,
"step": 2405,
"valid_targets_mean": 3316.2,
"valid_targets_min": 508
},
{
"epoch": 4.030100334448161,
"grad_norm": 0.8335679273374376,
"learning_rate": 1.822596289315596e-05,
"loss": 0.281,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29241418838500977,
"step": 2410,
"valid_targets_mean": 3000.0,
"valid_targets_min": 729
},
{
"epoch": 4.038461538461538,
"grad_norm": 0.9450863777551641,
"learning_rate": 1.814290955832523e-05,
"loss": 0.2639,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27432459592819214,
"step": 2415,
"valid_targets_mean": 2766.5,
"valid_targets_min": 701
},
{
"epoch": 4.046822742474917,
"grad_norm": 0.6892365494886082,
"learning_rate": 1.8059888514453196e-05,
"loss": 0.2743,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35358893871307373,
"step": 2420,
"valid_targets_mean": 4687.2,
"valid_targets_min": 707
},
{
"epoch": 4.055183946488294,
"grad_norm": 0.8546396818192133,
"learning_rate": 1.7976901205103953e-05,
"loss": 0.2409,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2732149660587311,
"step": 2425,
"valid_targets_mean": 2872.1,
"valid_targets_min": 1565
},
{
"epoch": 4.063545150501672,
"grad_norm": 0.9074538701365267,
"learning_rate": 1.789394907325504e-05,
"loss": 0.2829,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27739718556404114,
"step": 2430,
"valid_targets_mean": 2549.9,
"valid_targets_min": 412
},
{
"epoch": 4.0719063545150505,
"grad_norm": 0.7010499122198948,
"learning_rate": 1.7811033561272328e-05,
"loss": 0.2805,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28559303283691406,
"step": 2435,
"valid_targets_mean": 4280.4,
"valid_targets_min": 1688
},
{
"epoch": 4.080267558528428,
"grad_norm": 0.7783072544646484,
"learning_rate": 1.7728156110884924e-05,
"loss": 0.2541,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27712807059288025,
"step": 2440,
"valid_targets_mean": 3133.4,
"valid_targets_min": 474
},
{
"epoch": 4.088628762541806,
"grad_norm": 0.8270554308257784,
"learning_rate": 1.7645318163160146e-05,
"loss": 0.3121,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2960726022720337,
"step": 2445,
"valid_targets_mean": 3287.0,
"valid_targets_min": 1298
},
{
"epoch": 4.096989966555184,
"grad_norm": 0.8001563378250733,
"learning_rate": 1.7562521158478432e-05,
"loss": 0.279,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23369301855564117,
"step": 2450,
"valid_targets_mean": 3446.6,
"valid_targets_min": 924
},
{
"epoch": 4.105351170568562,
"grad_norm": 0.8436159622655983,
"learning_rate": 1.7479766536508313e-05,
"loss": 0.292,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28451332449913025,
"step": 2455,
"valid_targets_mean": 3320.6,
"valid_targets_min": 1505
},
{
"epoch": 4.11371237458194,
"grad_norm": 0.8511630672848115,
"learning_rate": 1.7397055736181366e-05,
"loss": 0.2975,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2644152343273163,
"step": 2460,
"valid_targets_mean": 2837.6,
"valid_targets_min": 1265
},
{
"epoch": 4.122073578595318,
"grad_norm": 0.8329359927809505,
"learning_rate": 1.7314390195667193e-05,
"loss": 0.2839,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27568697929382324,
"step": 2465,
"valid_targets_mean": 3675.1,
"valid_targets_min": 1439
},
{
"epoch": 4.130434782608695,
"grad_norm": 0.8456711766375431,
"learning_rate": 1.723177135234844e-05,
"loss": 0.2939,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2696060538291931,
"step": 2470,
"valid_targets_mean": 3198.6,
"valid_targets_min": 550
},
{
"epoch": 4.138795986622074,
"grad_norm": 0.8660274510460868,
"learning_rate": 1.7149200642795765e-05,
"loss": 0.2902,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39124855399131775,
"step": 2475,
"valid_targets_mean": 3618.2,
"valid_targets_min": 1647
},
{
"epoch": 4.147157190635451,
"grad_norm": 0.8805366064387657,
"learning_rate": 1.70666795027429e-05,
"loss": 0.2943,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3205997943878174,
"step": 2480,
"valid_targets_mean": 3357.6,
"valid_targets_min": 1361
},
{
"epoch": 4.15551839464883,
"grad_norm": 0.8831645923939866,
"learning_rate": 1.6984209367061657e-05,
"loss": 0.2741,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3723400831222534,
"step": 2485,
"valid_targets_mean": 4439.7,
"valid_targets_min": 872
},
{
"epoch": 4.1638795986622075,
"grad_norm": 0.8033626392233867,
"learning_rate": 1.6901791669736974e-05,
"loss": 0.2835,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23729437589645386,
"step": 2490,
"valid_targets_mean": 3279.5,
"valid_targets_min": 1317
},
{
"epoch": 4.172240802675585,
"grad_norm": 0.8529045414447846,
"learning_rate": 1.6819427843842016e-05,
"loss": 0.2724,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24402417242527008,
"step": 2495,
"valid_targets_mean": 2829.3,
"valid_targets_min": 971
},
{
"epoch": 4.1806020066889635,
"grad_norm": 0.7772728028989128,
"learning_rate": 1.6737119321513224e-05,
"loss": 0.3132,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3176288604736328,
"step": 2500,
"valid_targets_mean": 3672.4,
"valid_targets_min": 965
},
{
"epoch": 4.188963210702341,
"grad_norm": 0.8338000934996834,
"learning_rate": 1.6654867533925418e-05,
"loss": 0.2758,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2721063494682312,
"step": 2505,
"valid_targets_mean": 3436.9,
"valid_targets_min": 1539
},
{
"epoch": 4.197324414715719,
"grad_norm": 0.8267713909712678,
"learning_rate": 1.6572673911266943e-05,
"loss": 0.2976,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28024280071258545,
"step": 2510,
"valid_targets_mean": 3187.4,
"valid_targets_min": 1120
},
{
"epoch": 4.205685618729097,
"grad_norm": 0.9157546033073007,
"learning_rate": 1.6490539882714756e-05,
"loss": 0.2999,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2485034167766571,
"step": 2515,
"valid_targets_mean": 2835.7,
"valid_targets_min": 1525
},
{
"epoch": 4.214046822742475,
"grad_norm": 0.9249610301165988,
"learning_rate": 1.6408466876409596e-05,
"loss": 0.2725,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23990267515182495,
"step": 2520,
"valid_targets_mean": 2692.9,
"valid_targets_min": 490
},
{
"epoch": 4.222408026755853,
"grad_norm": 0.8518340628069135,
"learning_rate": 1.6326456319431154e-05,
"loss": 0.2999,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31082072854042053,
"step": 2525,
"valid_targets_mean": 3444.6,
"valid_targets_min": 1569
},
{
"epoch": 4.230769230769231,
"grad_norm": 0.9837882931443535,
"learning_rate": 1.6244509637773256e-05,
"loss": 0.2714,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29353979229927063,
"step": 2530,
"valid_targets_mean": 3000.7,
"valid_targets_min": 1243
},
{
"epoch": 4.239130434782608,
"grad_norm": 0.8579109041612042,
"learning_rate": 1.6162628256319078e-05,
"loss": 0.2849,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2931848168373108,
"step": 2535,
"valid_targets_mean": 2974.6,
"valid_targets_min": 1303
},
{
"epoch": 4.247491638795987,
"grad_norm": 0.7372703580470882,
"learning_rate": 1.6080813598816355e-05,
"loss": 0.3212,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35204175114631653,
"step": 2540,
"valid_targets_mean": 4623.1,
"valid_targets_min": 1208
},
{
"epoch": 4.2558528428093645,
"grad_norm": 0.9167357129141266,
"learning_rate": 1.599906708785262e-05,
"loss": 0.2447,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23422318696975708,
"step": 2545,
"valid_targets_mean": 2499.6,
"valid_targets_min": 1144
},
{
"epoch": 4.264214046822742,
"grad_norm": 0.8898102183876689,
"learning_rate": 1.5917390144830488e-05,
"loss": 0.2956,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.295245885848999,
"step": 2550,
"valid_targets_mean": 3242.8,
"valid_targets_min": 1323
},
{
"epoch": 4.2725752508361206,
"grad_norm": 0.9416423066048137,
"learning_rate": 1.583578418994294e-05,
"loss": 0.2993,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23591409623622894,
"step": 2555,
"valid_targets_mean": 2772.4,
"valid_targets_min": 1460
},
{
"epoch": 4.280936454849498,
"grad_norm": 0.8396792312207702,
"learning_rate": 1.5754250642148592e-05,
"loss": 0.2838,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2691681385040283,
"step": 2560,
"valid_targets_mean": 3140.4,
"valid_targets_min": 1822
},
{
"epoch": 4.289297658862877,
"grad_norm": 0.7552376746174522,
"learning_rate": 1.5672790919147096e-05,
"loss": 0.2648,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30901944637298584,
"step": 2565,
"valid_targets_mean": 3934.4,
"valid_targets_min": 1525
},
{
"epoch": 4.297658862876254,
"grad_norm": 0.9282959640580136,
"learning_rate": 1.5591406437354394e-05,
"loss": 0.2932,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2631564736366272,
"step": 2570,
"valid_targets_mean": 3684.6,
"valid_targets_min": 603
},
{
"epoch": 4.306020066889632,
"grad_norm": 0.8408763401027246,
"learning_rate": 1.5510098611878177e-05,
"loss": 0.2522,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1855039745569229,
"step": 2575,
"valid_targets_mean": 2278.2,
"valid_targets_min": 685
},
{
"epoch": 4.31438127090301,
"grad_norm": 0.9661559358244203,
"learning_rate": 1.542886885649322e-05,
"loss": 0.2875,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20213311910629272,
"step": 2580,
"valid_targets_mean": 2565.0,
"valid_targets_min": 1622
},
{
"epoch": 4.322742474916388,
"grad_norm": 0.8691049252102782,
"learning_rate": 1.534771858361683e-05,
"loss": 0.2705,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2871206998825073,
"step": 2585,
"valid_targets_mean": 3261.2,
"valid_targets_min": 757
},
{
"epoch": 4.331103678929766,
"grad_norm": 0.8392260775398249,
"learning_rate": 1.5266649204284273e-05,
"loss": 0.2793,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2738720774650574,
"step": 2590,
"valid_targets_mean": 3433.5,
"valid_targets_min": 1852
},
{
"epoch": 4.339464882943144,
"grad_norm": 0.8840473177758481,
"learning_rate": 1.5185662128124254e-05,
"loss": 0.2594,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2708375155925751,
"step": 2595,
"valid_targets_mean": 3278.4,
"valid_targets_min": 399
},
{
"epoch": 4.3478260869565215,
"grad_norm": 0.8804892196325519,
"learning_rate": 1.510475876333438e-05,
"loss": 0.2994,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23639748990535736,
"step": 2600,
"valid_targets_mean": 2654.6,
"valid_targets_min": 528
},
{
"epoch": 4.3561872909699,
"grad_norm": 0.8094688600381953,
"learning_rate": 1.5023940516656697e-05,
"loss": 0.2935,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2887652516365051,
"step": 2605,
"valid_targets_mean": 3643.9,
"valid_targets_min": 2109
},
{
"epoch": 4.364548494983278,
"grad_norm": 0.9244051200125512,
"learning_rate": 1.4943208793353235e-05,
"loss": 0.2653,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2914060056209564,
"step": 2610,
"valid_targets_mean": 3336.8,
"valid_targets_min": 550
},
{
"epoch": 4.372909698996655,
"grad_norm": 0.7461063611424056,
"learning_rate": 1.4862564997181528e-05,
"loss": 0.2765,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36067837476730347,
"step": 2615,
"valid_targets_mean": 5280.1,
"valid_targets_min": 1147
},
{
"epoch": 4.381270903010034,
"grad_norm": 0.9652367742763335,
"learning_rate": 1.4782010530370294e-05,
"loss": 0.2636,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25113189220428467,
"step": 2620,
"valid_targets_mean": 2949.8,
"valid_targets_min": 1399
},
{
"epoch": 4.389632107023411,
"grad_norm": 0.8992134459024913,
"learning_rate": 1.470154679359495e-05,
"loss": 0.2412,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24360308051109314,
"step": 2625,
"valid_targets_mean": 2608.5,
"valid_targets_min": 935
},
{
"epoch": 4.39799331103679,
"grad_norm": 0.8220794903907007,
"learning_rate": 1.4621175185953322e-05,
"loss": 0.277,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3220457136631012,
"step": 2630,
"valid_targets_mean": 4098.1,
"valid_targets_min": 403
},
{
"epoch": 4.406354515050167,
"grad_norm": 0.8521683178016516,
"learning_rate": 1.4540897104941307e-05,
"loss": 0.2753,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3359491527080536,
"step": 2635,
"valid_targets_mean": 3451.1,
"valid_targets_min": 794
},
{
"epoch": 4.414715719063545,
"grad_norm": 0.8796923872304094,
"learning_rate": 1.4460713946428553e-05,
"loss": 0.2772,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24371229112148285,
"step": 2640,
"valid_targets_mean": 2400.8,
"valid_targets_min": 1000
},
{
"epoch": 4.423076923076923,
"grad_norm": 1.0131860235742853,
"learning_rate": 1.4380627104634224e-05,
"loss": 0.2554,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3007010817527771,
"step": 2645,
"valid_targets_mean": 2731.2,
"valid_targets_min": 1006
},
{
"epoch": 4.431438127090301,
"grad_norm": 0.7392458747612428,
"learning_rate": 1.4300637972102721e-05,
"loss": 0.2702,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3089587688446045,
"step": 2650,
"valid_targets_mean": 4641.4,
"valid_targets_min": 1954
},
{
"epoch": 4.4397993311036785,
"grad_norm": 0.8818880175089461,
"learning_rate": 1.4220747939679478e-05,
"loss": 0.2579,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2619357407093048,
"step": 2655,
"valid_targets_mean": 3080.8,
"valid_targets_min": 971
},
{
"epoch": 4.448160535117057,
"grad_norm": 0.9056508130411561,
"learning_rate": 1.414095839648679e-05,
"loss": 0.2827,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25068965554237366,
"step": 2660,
"valid_targets_mean": 2617.4,
"valid_targets_min": 1481
},
{
"epoch": 4.456521739130435,
"grad_norm": 0.8935220051791342,
"learning_rate": 1.4061270729899663e-05,
"loss": 0.2726,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26286935806274414,
"step": 2665,
"valid_targets_mean": 2883.9,
"valid_targets_min": 928
},
{
"epoch": 4.464882943143813,
"grad_norm": 0.8961547416267401,
"learning_rate": 1.3981686325521647e-05,
"loss": 0.2768,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29072946310043335,
"step": 2670,
"valid_targets_mean": 2993.4,
"valid_targets_min": 1894
},
{
"epoch": 4.473244147157191,
"grad_norm": 0.9599671002081342,
"learning_rate": 1.3902206567160827e-05,
"loss": 0.2455,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28398674726486206,
"step": 2675,
"valid_targets_mean": 2923.8,
"valid_targets_min": 534
},
{
"epoch": 4.481605351170568,
"grad_norm": 0.8341406674593823,
"learning_rate": 1.3822832836805667e-05,
"loss": 0.3141,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3429492115974426,
"step": 2680,
"valid_targets_mean": 3562.8,
"valid_targets_min": 949
},
{
"epoch": 4.489966555183947,
"grad_norm": 0.8660387274121687,
"learning_rate": 1.3743566514601037e-05,
"loss": 0.2615,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28438010811805725,
"step": 2685,
"valid_targets_mean": 3383.6,
"valid_targets_min": 1276
},
{
"epoch": 4.498327759197324,
"grad_norm": 0.8240982742485928,
"learning_rate": 1.3664408978824209e-05,
"loss": 0.2648,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2728864550590515,
"step": 2690,
"valid_targets_mean": 3949.8,
"valid_targets_min": 1505
},
{
"epoch": 4.506688963210703,
"grad_norm": 0.9047049810271199,
"learning_rate": 1.3585361605860863e-05,
"loss": 0.2831,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2605753540992737,
"step": 2695,
"valid_targets_mean": 2817.6,
"valid_targets_min": 952
},
{
"epoch": 4.51505016722408,
"grad_norm": 0.8397078739499565,
"learning_rate": 1.3506425770181211e-05,
"loss": 0.2871,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24365462362766266,
"step": 2700,
"valid_targets_mean": 2901.8,
"valid_targets_min": 2041
},
{
"epoch": 4.523411371237458,
"grad_norm": 0.8582678085193816,
"learning_rate": 1.342760284431603e-05,
"loss": 0.3192,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2986323833465576,
"step": 2705,
"valid_targets_mean": 3100.2,
"valid_targets_min": 1217
},
{
"epoch": 4.531772575250836,
"grad_norm": 0.7889072695692275,
"learning_rate": 1.3348894198832845e-05,
"loss": 0.2708,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26328298449516296,
"step": 2710,
"valid_targets_mean": 3108.0,
"valid_targets_min": 967
},
{
"epoch": 4.540133779264214,
"grad_norm": 0.742736182328933,
"learning_rate": 1.3270301202312075e-05,
"loss": 0.2846,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37916791439056396,
"step": 2715,
"valid_targets_mean": 5153.8,
"valid_targets_min": 1141
},
{
"epoch": 4.548494983277592,
"grad_norm": 0.9919759799813364,
"learning_rate": 1.3191825221323246e-05,
"loss": 0.2655,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30372777581214905,
"step": 2720,
"valid_targets_mean": 2784.2,
"valid_targets_min": 1361
},
{
"epoch": 4.55685618729097,
"grad_norm": 0.794724468575154,
"learning_rate": 1.311346762040123e-05,
"loss": 0.276,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2651178538799286,
"step": 2725,
"valid_targets_mean": 3715.1,
"valid_targets_min": 983
},
{
"epoch": 4.565217391304348,
"grad_norm": 0.9806561211664588,
"learning_rate": 1.3035229762022513e-05,
"loss": 0.2577,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2600407600402832,
"step": 2730,
"valid_targets_mean": 2778.1,
"valid_targets_min": 520
},
{
"epoch": 4.573578595317725,
"grad_norm": 0.8400790069869569,
"learning_rate": 1.2957113006581494e-05,
"loss": 0.2809,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30648618936538696,
"step": 2735,
"valid_targets_mean": 3071.6,
"valid_targets_min": 1115
},
{
"epoch": 4.581939799331104,
"grad_norm": 0.912124026132302,
"learning_rate": 1.2879118712366858e-05,
"loss": 0.2922,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3389705717563629,
"step": 2740,
"valid_targets_mean": 3479.6,
"valid_targets_min": 1737
},
{
"epoch": 4.590301003344481,
"grad_norm": 0.7136031625832305,
"learning_rate": 1.280124823553794e-05,
"loss": 0.2648,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26324355602264404,
"step": 2745,
"valid_targets_mean": 4402.9,
"valid_targets_min": 1958
},
{
"epoch": 4.59866220735786,
"grad_norm": 0.8876231778745343,
"learning_rate": 1.2723502930101126e-05,
"loss": 0.3051,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3144656717777252,
"step": 2750,
"valid_targets_mean": 4292.6,
"valid_targets_min": 568
},
{
"epoch": 4.607023411371237,
"grad_norm": 0.9123329157042492,
"learning_rate": 1.2645884147886376e-05,
"loss": 0.2452,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22034093737602234,
"step": 2755,
"valid_targets_mean": 3341.9,
"valid_targets_min": 998
},
{
"epoch": 4.615384615384615,
"grad_norm": 0.8627497975800223,
"learning_rate": 1.2568393238523627e-05,
"loss": 0.2905,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28283166885375977,
"step": 2760,
"valid_targets_mean": 3059.2,
"valid_targets_min": 1435
},
{
"epoch": 4.6237458193979935,
"grad_norm": 0.8879285250035446,
"learning_rate": 1.2491031549419396e-05,
"loss": 0.2594,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28905028104782104,
"step": 2765,
"valid_targets_mean": 3173.9,
"valid_targets_min": 1069
},
{
"epoch": 4.632107023411371,
"grad_norm": 0.7869539440700758,
"learning_rate": 1.2413800425733324e-05,
"loss": 0.2637,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23459485173225403,
"step": 2770,
"valid_targets_mean": 3455.7,
"valid_targets_min": 1705
},
{
"epoch": 4.6404682274247495,
"grad_norm": 0.874081153668911,
"learning_rate": 1.2336701210354774e-05,
"loss": 0.2598,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26058483123779297,
"step": 2775,
"valid_targets_mean": 3799.4,
"valid_targets_min": 2140
},
{
"epoch": 4.648829431438127,
"grad_norm": 0.8505418138060274,
"learning_rate": 1.2259735243879533e-05,
"loss": 0.271,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2382025420665741,
"step": 2780,
"valid_targets_mean": 2949.2,
"valid_targets_min": 1662
},
{
"epoch": 4.657190635451505,
"grad_norm": 0.8408719538127842,
"learning_rate": 1.2182903864586424e-05,
"loss": 0.311,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3271663188934326,
"step": 2785,
"valid_targets_mean": 3384.8,
"valid_targets_min": 1772
},
{
"epoch": 4.665551839464883,
"grad_norm": 0.7906487246754133,
"learning_rate": 1.2106208408414101e-05,
"loss": 0.261,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23760370910167694,
"step": 2790,
"valid_targets_mean": 3003.1,
"valid_targets_min": 638
},
{
"epoch": 4.673913043478261,
"grad_norm": 0.7560469434433705,
"learning_rate": 1.202965020893779e-05,
"loss": 0.2795,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3065562844276428,
"step": 2795,
"valid_targets_mean": 4305.3,
"valid_targets_min": 1436
},
{
"epoch": 4.682274247491639,
"grad_norm": 0.931404543547185,
"learning_rate": 1.1953230597346116e-05,
"loss": 0.2814,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30321380496025085,
"step": 2800,
"valid_targets_mean": 3184.8,
"valid_targets_min": 1215
},
{
"epoch": 4.690635451505017,
"grad_norm": 0.8785086713293649,
"learning_rate": 1.1876950902417921e-05,
"loss": 0.311,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2660791277885437,
"step": 2805,
"valid_targets_mean": 2884.8,
"valid_targets_min": 991
},
{
"epoch": 4.698996655518394,
"grad_norm": 0.8658447278693211,
"learning_rate": 1.1800812450499227e-05,
"loss": 0.2447,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24090614914894104,
"step": 2810,
"valid_targets_mean": 2715.7,
"valid_targets_min": 764
},
{
"epoch": 4.707357859531773,
"grad_norm": 1.0374938153628415,
"learning_rate": 1.1724816565480092e-05,
"loss": 0.2597,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20534390211105347,
"step": 2815,
"valid_targets_mean": 2147.6,
"valid_targets_min": 401
},
{
"epoch": 4.7157190635451505,
"grad_norm": 0.7920774633218928,
"learning_rate": 1.1648964568771661e-05,
"loss": 0.2632,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18782053887844086,
"step": 2820,
"valid_targets_mean": 3404.8,
"valid_targets_min": 2009
},
{
"epoch": 4.724080267558528,
"grad_norm": 0.8633417845835815,
"learning_rate": 1.157325777928314e-05,
"loss": 0.2725,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30495747923851013,
"step": 2825,
"valid_targets_mean": 3513.8,
"valid_targets_min": 1059
},
{
"epoch": 4.7324414715719065,
"grad_norm": 0.9344722457587161,
"learning_rate": 1.149769751339889e-05,
"loss": 0.2654,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2682046592235565,
"step": 2830,
"valid_targets_mean": 3535.4,
"valid_targets_min": 1574
},
{
"epoch": 4.740802675585284,
"grad_norm": 0.9085942238263078,
"learning_rate": 1.142228508495553e-05,
"loss": 0.2743,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27757948637008667,
"step": 2835,
"valid_targets_mean": 2801.4,
"valid_targets_min": 1637
},
{
"epoch": 4.749163879598662,
"grad_norm": 0.9016528116196614,
"learning_rate": 1.1347021805219092e-05,
"loss": 0.281,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24009665846824646,
"step": 2840,
"valid_targets_mean": 2991.9,
"valid_targets_min": 962
},
{
"epoch": 4.75752508361204,
"grad_norm": 0.8216538528179507,
"learning_rate": 1.1271908982862214e-05,
"loss": 0.2614,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2618323862552643,
"step": 2845,
"valid_targets_mean": 4103.2,
"valid_targets_min": 1949
},
{
"epoch": 4.765886287625418,
"grad_norm": 1.0231544478271972,
"learning_rate": 1.11969479239414e-05,
"loss": 0.2577,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30647069215774536,
"step": 2850,
"valid_targets_mean": 2558.7,
"valid_targets_min": 364
},
{
"epoch": 4.774247491638796,
"grad_norm": 2.596885204828478,
"learning_rate": 1.1122139931874303e-05,
"loss": 0.3129,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3939549922943115,
"step": 2855,
"valid_targets_mean": 4341.0,
"valid_targets_min": 821
},
{
"epoch": 4.782608695652174,
"grad_norm": 0.9290067746793299,
"learning_rate": 1.104748630741705e-05,
"loss": 0.3034,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30313026905059814,
"step": 2860,
"valid_targets_mean": 2781.0,
"valid_targets_min": 392
},
{
"epoch": 4.790969899665551,
"grad_norm": 1.7683165858974776,
"learning_rate": 1.0972988348641643e-05,
"loss": 0.2548,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22824634611606598,
"step": 2865,
"valid_targets_mean": 2794.6,
"valid_targets_min": 721
},
{
"epoch": 4.79933110367893,
"grad_norm": 0.8612735757395678,
"learning_rate": 1.0898647350913376e-05,
"loss": 0.2637,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24694600701332092,
"step": 2870,
"valid_targets_mean": 3144.4,
"valid_targets_min": 1359
},
{
"epoch": 4.8076923076923075,
"grad_norm": 0.883437344029108,
"learning_rate": 1.0824464606868323e-05,
"loss": 0.2571,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24586498737335205,
"step": 2875,
"valid_targets_mean": 3431.4,
"valid_targets_min": 1257
},
{
"epoch": 4.816053511705686,
"grad_norm": 1.0330995770490803,
"learning_rate": 1.0750441406390841e-05,
"loss": 0.2459,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2311995029449463,
"step": 2880,
"valid_targets_mean": 2488.1,
"valid_targets_min": 1242
},
{
"epoch": 4.8244147157190636,
"grad_norm": 0.958681058026221,
"learning_rate": 1.0676579036591167e-05,
"loss": 0.2742,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2965131998062134,
"step": 2885,
"valid_targets_mean": 3851.2,
"valid_targets_min": 1182
},
{
"epoch": 4.832775919732441,
"grad_norm": 0.788119350116846,
"learning_rate": 1.0602878781783019e-05,
"loss": 0.2932,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.328529953956604,
"step": 2890,
"valid_targets_mean": 3779.6,
"valid_targets_min": 1456
},
{
"epoch": 4.84113712374582,
"grad_norm": 0.8696431488480126,
"learning_rate": 1.0529341923461272e-05,
"loss": 0.2744,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26618334650993347,
"step": 2895,
"valid_targets_mean": 3219.2,
"valid_targets_min": 1480
},
{
"epoch": 4.849498327759197,
"grad_norm": 0.9950302873697183,
"learning_rate": 1.0455969740279675e-05,
"loss": 0.271,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28443658351898193,
"step": 2900,
"valid_targets_mean": 2625.2,
"valid_targets_min": 999
},
{
"epoch": 4.857859531772576,
"grad_norm": 0.9363541770349809,
"learning_rate": 1.0382763508028615e-05,
"loss": 0.256,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23824138939380646,
"step": 2905,
"valid_targets_mean": 2914.6,
"valid_targets_min": 580
},
{
"epoch": 4.866220735785953,
"grad_norm": 0.9212980221737899,
"learning_rate": 1.0309724499612939e-05,
"loss": 0.2566,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30664288997650146,
"step": 2910,
"valid_targets_mean": 3167.0,
"valid_targets_min": 1422
},
{
"epoch": 4.874581939799331,
"grad_norm": 0.9658354985211547,
"learning_rate": 1.0236853985029815e-05,
"loss": 0.2841,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2978072762489319,
"step": 2915,
"valid_targets_mean": 4677.4,
"valid_targets_min": 1257
},
{
"epoch": 4.882943143812709,
"grad_norm": 0.8858319243242195,
"learning_rate": 1.0164153231346656e-05,
"loss": 0.2423,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24526861310005188,
"step": 2920,
"valid_targets_mean": 3126.1,
"valid_targets_min": 880
},
{
"epoch": 4.891304347826087,
"grad_norm": 1.0526204864364126,
"learning_rate": 1.0091623502679075e-05,
"loss": 0.3037,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3539399802684784,
"step": 2925,
"valid_targets_mean": 3289.9,
"valid_targets_min": 1212
},
{
"epoch": 4.8996655518394645,
"grad_norm": 0.885379966379974,
"learning_rate": 1.0019266060168929e-05,
"loss": 0.2934,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30143141746520996,
"step": 2930,
"valid_targets_mean": 3651.1,
"valid_targets_min": 1477
},
{
"epoch": 4.908026755852843,
"grad_norm": 1.1625828671998966,
"learning_rate": 9.947082161962363e-06,
"loss": 0.248,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24516814947128296,
"step": 2935,
"valid_targets_mean": 2769.2,
"valid_targets_min": 569
},
{
"epoch": 4.916387959866221,
"grad_norm": 0.8652972290357003,
"learning_rate": 9.875073063187947e-06,
"loss": 0.2476,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26153671741485596,
"step": 2940,
"valid_targets_mean": 3214.2,
"valid_targets_min": 1062
},
{
"epoch": 4.924749163879599,
"grad_norm": 0.9078402224774373,
"learning_rate": 9.803240015934859e-06,
"loss": 0.3063,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2811887264251709,
"step": 2945,
"valid_targets_mean": 3040.2,
"valid_targets_min": 918
},
{
"epoch": 4.933110367892977,
"grad_norm": 0.855619293705552,
"learning_rate": 9.731584269231094e-06,
"loss": 0.2411,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24628743529319763,
"step": 2950,
"valid_targets_mean": 3259.8,
"valid_targets_min": 1456
},
{
"epoch": 4.941471571906354,
"grad_norm": 0.9213152242653578,
"learning_rate": 9.660107069021767e-06,
"loss": 0.2783,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33864572644233704,
"step": 2955,
"valid_targets_mean": 3462.7,
"valid_targets_min": 527
},
{
"epoch": 4.949832775919733,
"grad_norm": 0.8302602925046146,
"learning_rate": 9.588809658147433e-06,
"loss": 0.2748,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28112542629241943,
"step": 2960,
"valid_targets_mean": 3587.3,
"valid_targets_min": 1509
},
{
"epoch": 4.95819397993311,
"grad_norm": 0.9191160601073972,
"learning_rate": 9.517693276322488e-06,
"loss": 0.2888,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26543906331062317,
"step": 2965,
"valid_targets_mean": 2759.7,
"valid_targets_min": 520
},
{
"epoch": 4.966555183946488,
"grad_norm": 0.9353550508600107,
"learning_rate": 9.446759160113602e-06,
"loss": 0.2826,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2775583863258362,
"step": 2970,
"valid_targets_mean": 2901.1,
"valid_targets_min": 1694
},
{
"epoch": 4.974916387959866,
"grad_norm": 0.9139877304453574,
"learning_rate": 9.376008542918227e-06,
"loss": 0.2281,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19975979626178741,
"step": 2975,
"valid_targets_mean": 2663.2,
"valid_targets_min": 1166
},
{
"epoch": 4.983277591973244,
"grad_norm": 0.922883713258425,
"learning_rate": 9.305442654943145e-06,
"loss": 0.2498,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2600483000278473,
"step": 2980,
"valid_targets_mean": 2795.2,
"valid_targets_min": 1070
},
{
"epoch": 4.991638795986622,
"grad_norm": 0.9322875420888264,
"learning_rate": 9.235062723183076e-06,
"loss": 0.2583,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2565094232559204,
"step": 2985,
"valid_targets_mean": 2820.6,
"valid_targets_min": 1321
},
{
"epoch": 5.0,
"grad_norm": 0.7643560224911901,
"learning_rate": 9.164869971399359e-06,
"loss": 0.2743,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3641391396522522,
"step": 2990,
"valid_targets_mean": 4868.6,
"valid_targets_min": 1329
},
{
"epoch": 5.008361204013378,
"grad_norm": 0.8481755315514735,
"learning_rate": 9.094865620098646e-06,
"loss": 0.2614,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22899624705314636,
"step": 2995,
"valid_targets_mean": 3174.0,
"valid_targets_min": 1965
},
{
"epoch": 5.016722408026756,
"grad_norm": 0.8188076252143365,
"learning_rate": 9.025050886511702e-06,
"loss": 0.2747,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3067629039287567,
"step": 3000,
"valid_targets_mean": 4291.9,
"valid_targets_min": 1704
},
{
"epoch": 5.025083612040134,
"grad_norm": 0.8029644241788463,
"learning_rate": 8.955426984572228e-06,
"loss": 0.2581,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3037480115890503,
"step": 3005,
"valid_targets_mean": 4106.2,
"valid_targets_min": 973
},
{
"epoch": 5.033444816053512,
"grad_norm": 0.8661738149420555,
"learning_rate": 8.885995124895768e-06,
"loss": 0.2402,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2674838900566101,
"step": 3010,
"valid_targets_mean": 3359.9,
"valid_targets_min": 1500
},
{
"epoch": 5.04180602006689,
"grad_norm": 0.9620964614380081,
"learning_rate": 8.816756514758634e-06,
"loss": 0.2832,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2533591389656067,
"step": 3015,
"valid_targets_mean": 3118.5,
"valid_targets_min": 1356
},
{
"epoch": 5.050167224080267,
"grad_norm": 0.7541256752914219,
"learning_rate": 8.747712358076936e-06,
"loss": 0.2311,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24237793684005737,
"step": 3020,
"valid_targets_mean": 4191.6,
"valid_targets_min": 1668
},
{
"epoch": 5.058528428093646,
"grad_norm": 0.9025605491692672,
"learning_rate": 8.678863855385646e-06,
"loss": 0.2646,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33202728629112244,
"step": 3025,
"valid_targets_mean": 4466.5,
"valid_targets_min": 693
},
{
"epoch": 5.066889632107023,
"grad_norm": 0.8425388830294137,
"learning_rate": 8.61021220381771e-06,
"loss": 0.242,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3084254860877991,
"step": 3030,
"valid_targets_mean": 4306.9,
"valid_targets_min": 968
},
{
"epoch": 5.075250836120401,
"grad_norm": 0.8389860612401873,
"learning_rate": 8.54175859708324e-06,
"loss": 0.2322,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22211232781410217,
"step": 3035,
"valid_targets_mean": 3588.2,
"valid_targets_min": 880
},
{
"epoch": 5.083612040133779,
"grad_norm": 0.9514036120737082,
"learning_rate": 8.473504225448765e-06,
"loss": 0.257,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2409243881702423,
"step": 3040,
"valid_targets_mean": 2856.7,
"valid_targets_min": 967
},
{
"epoch": 5.091973244147157,
"grad_norm": 0.9560659512366602,
"learning_rate": 8.405450275716525e-06,
"loss": 0.2544,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2601991891860962,
"step": 3045,
"valid_targets_mean": 3723.9,
"valid_targets_min": 1569
},
{
"epoch": 5.1003344481605355,
"grad_norm": 0.9864743563923629,
"learning_rate": 8.337597931203836e-06,
"loss": 0.239,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3188202381134033,
"step": 3050,
"valid_targets_mean": 3242.7,
"valid_targets_min": 1154
},
{
"epoch": 5.108695652173913,
"grad_norm": 1.1490912764067835,
"learning_rate": 8.269948371722518e-06,
"loss": 0.2602,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21089932322502136,
"step": 3055,
"valid_targets_mean": 2516.8,
"valid_targets_min": 988
},
{
"epoch": 5.117056856187291,
"grad_norm": 0.8194749944721579,
"learning_rate": 8.20250277355838e-06,
"loss": 0.2787,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3658130168914795,
"step": 3060,
"valid_targets_mean": 4739.9,
"valid_targets_min": 1512
},
{
"epoch": 5.125418060200669,
"grad_norm": 0.9728259830553914,
"learning_rate": 8.135262309450764e-06,
"loss": 0.2707,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27498018741607666,
"step": 3065,
"valid_targets_mean": 3150.4,
"valid_targets_min": 594
},
{
"epoch": 5.133779264214047,
"grad_norm": 1.0179078265962471,
"learning_rate": 8.068228148572157e-06,
"loss": 0.2445,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19528654217720032,
"step": 3070,
"valid_targets_mean": 2590.3,
"valid_targets_min": 513
},
{
"epoch": 5.142140468227424,
"grad_norm": 1.0414753424178975,
"learning_rate": 8.001401456507858e-06,
"loss": 0.2298,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24913433194160461,
"step": 3075,
"valid_targets_mean": 2828.6,
"valid_targets_min": 1509
},
{
"epoch": 5.150501672240803,
"grad_norm": 0.9673371238498945,
"learning_rate": 7.934783395235716e-06,
"loss": 0.253,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2619754672050476,
"step": 3080,
"valid_targets_mean": 3273.0,
"valid_targets_min": 1547
},
{
"epoch": 5.15886287625418,
"grad_norm": 1.0777145808692163,
"learning_rate": 7.868375123105921e-06,
"loss": 0.29,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.241988867521286,
"step": 3085,
"valid_targets_mean": 2760.0,
"valid_targets_min": 1115
},
{
"epoch": 5.167224080267559,
"grad_norm": 0.9357681236144693,
"learning_rate": 7.802177794820857e-06,
"loss": 0.2851,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4071310758590698,
"step": 3090,
"valid_targets_mean": 3665.1,
"valid_targets_min": 638
},
{
"epoch": 5.1755852842809364,
"grad_norm": 0.8810724848053256,
"learning_rate": 7.736192561415045e-06,
"loss": 0.2883,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3404349386692047,
"step": 3095,
"valid_targets_mean": 3941.1,
"valid_targets_min": 799
},
{
"epoch": 5.183946488294314,
"grad_norm": 0.9345756552103464,
"learning_rate": 7.670420570235113e-06,
"loss": 0.2718,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20666499435901642,
"step": 3100,
"valid_targets_mean": 2741.7,
"valid_targets_min": 660
},
{
"epoch": 5.1923076923076925,
"grad_norm": 0.89831218286986,
"learning_rate": 7.604862964919819e-06,
"loss": 0.2531,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26516643166542053,
"step": 3105,
"valid_targets_mean": 3194.3,
"valid_targets_min": 1893
},
{
"epoch": 5.20066889632107,
"grad_norm": 1.0235151109065963,
"learning_rate": 7.539520885380242e-06,
"loss": 0.2647,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23447315394878387,
"step": 3110,
"valid_targets_mean": 2732.0,
"valid_targets_min": 1261
},
{
"epoch": 5.209030100334449,
"grad_norm": 1.0527575176171846,
"learning_rate": 7.474395467779885e-06,
"loss": 0.2386,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24746760725975037,
"step": 3115,
"valid_targets_mean": 3079.3,
"valid_targets_min": 1647
},
{
"epoch": 5.217391304347826,
"grad_norm": 0.8412479852328654,
"learning_rate": 7.409487844514946e-06,
"loss": 0.2765,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2139432430267334,
"step": 3120,
"valid_targets_mean": 3529.4,
"valid_targets_min": 2262
},
{
"epoch": 5.225752508361204,
"grad_norm": 0.8859243166629239,
"learning_rate": 7.344799144194647e-06,
"loss": 0.2646,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30506086349487305,
"step": 3125,
"valid_targets_mean": 4511.6,
"valid_targets_min": 1709
},
{
"epoch": 5.234113712374582,
"grad_norm": 0.928318267325103,
"learning_rate": 7.280330491621579e-06,
"loss": 0.265,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25192520022392273,
"step": 3130,
"valid_targets_mean": 3102.3,
"valid_targets_min": 1604
},
{
"epoch": 5.24247491638796,
"grad_norm": 0.8514180338596942,
"learning_rate": 7.2160830077721655e-06,
"loss": 0.2806,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.42115187644958496,
"step": 3135,
"valid_targets_mean": 4393.4,
"valid_targets_min": 2044
},
{
"epoch": 5.250836120401337,
"grad_norm": 0.8701754054847802,
"learning_rate": 7.15205780977716e-06,
"loss": 0.2483,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23187309503555298,
"step": 3140,
"valid_targets_mean": 3508.4,
"valid_targets_min": 1806
},
{
"epoch": 5.259197324414716,
"grad_norm": 1.0414461577784981,
"learning_rate": 7.0882560109022255e-06,
"loss": 0.2487,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2434636354446411,
"step": 3145,
"valid_targets_mean": 2689.4,
"valid_targets_min": 860
},
{
"epoch": 5.2675585284280935,
"grad_norm": 0.9992819578511724,
"learning_rate": 7.02467872052858e-06,
"loss": 0.2108,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20966418087482452,
"step": 3150,
"valid_targets_mean": 3109.2,
"valid_targets_min": 1471
},
{
"epoch": 5.275919732441472,
"grad_norm": 0.9478720751528437,
"learning_rate": 6.9613270441337075e-06,
"loss": 0.2412,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22975382208824158,
"step": 3155,
"valid_targets_mean": 3196.7,
"valid_targets_min": 1774
},
{
"epoch": 5.2842809364548495,
"grad_norm": 0.8672829908504149,
"learning_rate": 6.8982020832721054e-06,
"loss": 0.2426,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22695282101631165,
"step": 3160,
"valid_targets_mean": 3513.6,
"valid_targets_min": 723
},
{
"epoch": 5.292642140468227,
"grad_norm": 1.022405240131088,
"learning_rate": 6.835304935556198e-06,
"loss": 0.2525,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2423592507839203,
"step": 3165,
"valid_targets_mean": 3192.9,
"valid_targets_min": 1355
},
{
"epoch": 5.301003344481606,
"grad_norm": 1.081711172053293,
"learning_rate": 6.772636694637183e-06,
"loss": 0.2441,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25607234239578247,
"step": 3170,
"valid_targets_mean": 2742.1,
"valid_targets_min": 1670
},
{
"epoch": 5.309364548494983,
"grad_norm": 0.959669265454484,
"learning_rate": 6.710198450186047e-06,
"loss": 0.2657,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2445649951696396,
"step": 3175,
"valid_targets_mean": 2531.1,
"valid_targets_min": 741
},
{
"epoch": 5.317725752508361,
"grad_norm": 1.0556452222632704,
"learning_rate": 6.6479912878746225e-06,
"loss": 0.2698,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32292306423187256,
"step": 3180,
"valid_targets_mean": 3753.7,
"valid_targets_min": 1316
},
{
"epoch": 5.326086956521739,
"grad_norm": 1.110335544316918,
"learning_rate": 6.586016289356692e-06,
"loss": 0.2582,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20516835153102875,
"step": 3185,
"valid_targets_mean": 2823.1,
"valid_targets_min": 965
},
{
"epoch": 5.334448160535117,
"grad_norm": 0.9443496373098136,
"learning_rate": 6.524274532249195e-06,
"loss": 0.2247,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2695116698741913,
"step": 3190,
"valid_targets_mean": 2830.7,
"valid_targets_min": 595
},
{
"epoch": 5.342809364548495,
"grad_norm": 1.2883459095067469,
"learning_rate": 6.462767090113486e-06,
"loss": 0.2514,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21128371357917786,
"step": 3195,
"valid_targets_mean": 2801.6,
"valid_targets_min": 1972
},
{
"epoch": 5.351170568561873,
"grad_norm": 0.7305670443838644,
"learning_rate": 6.401495032436667e-06,
"loss": 0.2613,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34377604722976685,
"step": 3200,
"valid_targets_mean": 5868.9,
"valid_targets_min": 1873
},
{
"epoch": 5.3595317725752505,
"grad_norm": 0.9618080510519665,
"learning_rate": 6.34045942461299e-06,
"loss": 0.2266,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20367145538330078,
"step": 3205,
"valid_targets_mean": 2934.6,
"valid_targets_min": 1274
},
{
"epoch": 5.367892976588629,
"grad_norm": 0.9183980494977025,
"learning_rate": 6.279661327925333e-06,
"loss": 0.2591,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24812433123588562,
"step": 3210,
"valid_targets_mean": 3023.1,
"valid_targets_min": 1477
},
{
"epoch": 5.3762541806020065,
"grad_norm": 0.9596558209841023,
"learning_rate": 6.219101799526753e-06,
"loss": 0.2541,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33065247535705566,
"step": 3215,
"valid_targets_mean": 4098.1,
"valid_targets_min": 1177
},
{
"epoch": 5.384615384615385,
"grad_norm": 1.065383634447373,
"learning_rate": 6.158781892422085e-06,
"loss": 0.2614,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2475639134645462,
"step": 3220,
"valid_targets_mean": 2772.1,
"valid_targets_min": 1252
},
{
"epoch": 5.392976588628763,
"grad_norm": 1.044424208460433,
"learning_rate": 6.098702655449664e-06,
"loss": 0.2439,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2278965413570404,
"step": 3225,
"valid_targets_mean": 2502.4,
"valid_targets_min": 721
},
{
"epoch": 5.40133779264214,
"grad_norm": 0.9665704851257386,
"learning_rate": 6.038865133263054e-06,
"loss": 0.2448,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31926289200782776,
"step": 3230,
"valid_targets_mean": 3628.5,
"valid_targets_min": 1750
},
{
"epoch": 5.409698996655519,
"grad_norm": 0.964435362243508,
"learning_rate": 5.9792703663129125e-06,
"loss": 0.2289,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21948401629924774,
"step": 3235,
"valid_targets_mean": 2733.2,
"valid_targets_min": 484
},
{
"epoch": 5.418060200668896,
"grad_norm": 0.9794403625903487,
"learning_rate": 5.919919390828859e-06,
"loss": 0.2556,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22015729546546936,
"step": 3240,
"valid_targets_mean": 2922.4,
"valid_targets_min": 1575
},
{
"epoch": 5.426421404682274,
"grad_norm": 0.9982047586124657,
"learning_rate": 5.860813238801523e-06,
"loss": 0.2553,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21148087084293365,
"step": 3245,
"valid_targets_mean": 3052.9,
"valid_targets_min": 1548
},
{
"epoch": 5.434782608695652,
"grad_norm": 0.8716785695051501,
"learning_rate": 5.801952937964537e-06,
"loss": 0.2537,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23328334093093872,
"step": 3250,
"valid_targets_mean": 3625.8,
"valid_targets_min": 648
},
{
"epoch": 5.44314381270903,
"grad_norm": 1.0317002727776252,
"learning_rate": 5.743339511776693e-06,
"loss": 0.2525,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26123955845832825,
"step": 3255,
"valid_targets_mean": 3316.4,
"valid_targets_min": 553
},
{
"epoch": 5.451505016722408,
"grad_norm": 0.8933485431020612,
"learning_rate": 5.684973979404144e-06,
"loss": 0.2154,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23536235094070435,
"step": 3260,
"valid_targets_mean": 3289.2,
"valid_targets_min": 1411
},
{
"epoch": 5.459866220735786,
"grad_norm": 0.9330309774110559,
"learning_rate": 5.6268573557026865e-06,
"loss": 0.274,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25734925270080566,
"step": 3265,
"valid_targets_mean": 3473.9,
"valid_targets_min": 1469
},
{
"epoch": 5.468227424749164,
"grad_norm": 1.0119464981075554,
"learning_rate": 5.568990651200108e-06,
"loss": 0.2646,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2644900977611542,
"step": 3270,
"valid_targets_mean": 3406.8,
"valid_targets_min": 569
},
{
"epoch": 5.476588628762542,
"grad_norm": 1.0468454697016878,
"learning_rate": 5.511374872078616e-06,
"loss": 0.2538,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29436013102531433,
"step": 3275,
"valid_targets_mean": 3085.1,
"valid_targets_min": 1665
},
{
"epoch": 5.48494983277592,
"grad_norm": 0.9588401461605252,
"learning_rate": 5.454011020157348e-06,
"loss": 0.2243,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21803942322731018,
"step": 3280,
"valid_targets_mean": 3367.6,
"valid_targets_min": 1776
},
{
"epoch": 5.493311036789297,
"grad_norm": 0.8920342971378608,
"learning_rate": 5.396900092874953e-06,
"loss": 0.2525,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20749205350875854,
"step": 3285,
"valid_targets_mean": 3192.9,
"valid_targets_min": 1668
},
{
"epoch": 5.501672240802676,
"grad_norm": 0.8025673440389024,
"learning_rate": 5.340043083272239e-06,
"loss": 0.2647,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25130224227905273,
"step": 3290,
"valid_targets_mean": 3616.1,
"valid_targets_min": 1456
},
{
"epoch": 5.510033444816053,
"grad_norm": 1.0290460488107447,
"learning_rate": 5.283440979974901e-06,
"loss": 0.2353,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.255595326423645,
"step": 3295,
"valid_targets_mean": 3070.9,
"valid_targets_min": 858
},
{
"epoch": 5.518394648829432,
"grad_norm": 0.9036243917362351,
"learning_rate": 5.227094767176364e-06,
"loss": 0.2535,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2398861050605774,
"step": 3300,
"valid_targets_mean": 3360.8,
"valid_targets_min": 1448
},
{
"epoch": 5.526755852842809,
"grad_norm": 0.9707296599929639,
"learning_rate": 5.17100542462063e-06,
"loss": 0.2485,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24867475032806396,
"step": 3305,
"valid_targets_mean": 3409.8,
"valid_targets_min": 1500
},
{
"epoch": 5.535117056856187,
"grad_norm": 1.0059190414101475,
"learning_rate": 5.115173927585264e-06,
"loss": 0.2462,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20245328545570374,
"step": 3310,
"valid_targets_mean": 2579.6,
"valid_targets_min": 965
},
{
"epoch": 5.543478260869565,
"grad_norm": 1.150440106449695,
"learning_rate": 5.059601246864438e-06,
"loss": 0.2338,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2849067747592926,
"step": 3315,
"valid_targets_mean": 3054.2,
"valid_targets_min": 1511
},
{
"epoch": 5.551839464882943,
"grad_norm": 1.082246481751666,
"learning_rate": 5.004288348752018e-06,
"loss": 0.2211,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24570798873901367,
"step": 3320,
"valid_targets_mean": 3292.1,
"valid_targets_min": 1374
},
{
"epoch": 5.5602006688963215,
"grad_norm": 0.9677466519631982,
"learning_rate": 4.949236195024825e-06,
"loss": 0.2483,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21175232529640198,
"step": 3325,
"valid_targets_mean": 2859.6,
"valid_targets_min": 452
},
{
"epoch": 5.568561872909699,
"grad_norm": 0.9670337251548189,
"learning_rate": 4.894445742925853e-06,
"loss": 0.2623,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23612819612026215,
"step": 3330,
"valid_targets_mean": 2778.9,
"valid_targets_min": 479
},
{
"epoch": 5.576923076923077,
"grad_norm": 0.9399114769292228,
"learning_rate": 4.839917945147647e-06,
"loss": 0.2502,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24552688002586365,
"step": 3335,
"valid_targets_mean": 2997.2,
"valid_targets_min": 1116
},
{
"epoch": 5.585284280936455,
"grad_norm": 0.8414887814395099,
"learning_rate": 4.785653749815744e-06,
"loss": 0.2561,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29480239748954773,
"step": 3340,
"valid_targets_mean": 4310.2,
"valid_targets_min": 1636
},
{
"epoch": 5.593645484949833,
"grad_norm": 0.7931418317297482,
"learning_rate": 4.731654100472178e-06,
"loss": 0.2583,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3128657341003418,
"step": 3345,
"valid_targets_mean": 4607.0,
"valid_targets_min": 1093
},
{
"epoch": 5.602006688963211,
"grad_norm": 0.8840163267997618,
"learning_rate": 4.677919936059064e-06,
"loss": 0.2558,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24446120858192444,
"step": 3350,
"valid_targets_mean": 3667.1,
"valid_targets_min": 1631
},
{
"epoch": 5.610367892976589,
"grad_norm": 0.9191791952149919,
"learning_rate": 4.624452190902304e-06,
"loss": 0.2307,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2651020884513855,
"step": 3355,
"valid_targets_mean": 3420.4,
"valid_targets_min": 1745
},
{
"epoch": 5.618729096989966,
"grad_norm": 0.9355892323378777,
"learning_rate": 4.571251794695308e-06,
"loss": 0.2397,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29256555438041687,
"step": 3360,
"valid_targets_mean": 4212.4,
"valid_targets_min": 1120
},
{
"epoch": 5.627090301003345,
"grad_norm": 1.0090759936821445,
"learning_rate": 4.518319672482845e-06,
"loss": 0.2427,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2667285203933716,
"step": 3365,
"valid_targets_mean": 2737.7,
"valid_targets_min": 729
},
{
"epoch": 5.635451505016722,
"grad_norm": 1.0171835292538327,
"learning_rate": 4.465656744644957e-06,
"loss": 0.2726,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30735355615615845,
"step": 3370,
"valid_targets_mean": 3446.8,
"valid_targets_min": 1726
},
{
"epoch": 5.6438127090301,
"grad_norm": 0.9819290282194414,
"learning_rate": 4.413263926880935e-06,
"loss": 0.2608,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20418116450309753,
"step": 3375,
"valid_targets_mean": 3223.5,
"valid_targets_min": 726
},
{
"epoch": 5.6521739130434785,
"grad_norm": 0.9512457595996446,
"learning_rate": 4.3611421301934435e-06,
"loss": 0.2741,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2649402320384979,
"step": 3380,
"valid_targets_mean": 2930.5,
"valid_targets_min": 1139
},
{
"epoch": 5.660535117056856,
"grad_norm": 0.9658417094141116,
"learning_rate": 4.309292260872633e-06,
"loss": 0.2548,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21503464877605438,
"step": 3385,
"valid_targets_mean": 2954.3,
"valid_targets_min": 1684
},
{
"epoch": 5.668896321070234,
"grad_norm": 1.0062110489738594,
"learning_rate": 4.257715220480405e-06,
"loss": 0.2721,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2543056011199951,
"step": 3390,
"valid_targets_mean": 3383.0,
"valid_targets_min": 1705
},
{
"epoch": 5.677257525083612,
"grad_norm": 1.0054767456103721,
"learning_rate": 4.206411905834733e-06,
"loss": 0.2492,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3248503506183624,
"step": 3395,
"valid_targets_mean": 3018.8,
"valid_targets_min": 399
},
{
"epoch": 5.68561872909699,
"grad_norm": 1.085787300697935,
"learning_rate": 4.155383208994055e-06,
"loss": 0.2578,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24291780591011047,
"step": 3400,
"valid_targets_mean": 3004.7,
"valid_targets_min": 1883
},
{
"epoch": 5.693979933110368,
"grad_norm": 1.0345601696467057,
"learning_rate": 4.10463001724178e-06,
"loss": 0.2416,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24932274222373962,
"step": 3405,
"valid_targets_mean": 2949.5,
"valid_targets_min": 1622
},
{
"epoch": 5.702341137123746,
"grad_norm": 0.9908894862017844,
"learning_rate": 4.054153213070868e-06,
"loss": 0.2495,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2516738772392273,
"step": 3410,
"valid_targets_mean": 3543.2,
"valid_targets_min": 1348
},
{
"epoch": 5.710702341137123,
"grad_norm": 1.0855149671023934,
"learning_rate": 4.003953674168455e-06,
"loss": 0.242,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2057594358921051,
"step": 3415,
"valid_targets_mean": 3033.4,
"valid_targets_min": 1026
},
{
"epoch": 5.719063545150502,
"grad_norm": 0.9852747879835021,
"learning_rate": 3.954032273400608e-06,
"loss": 0.2406,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.266365110874176,
"step": 3420,
"valid_targets_mean": 3131.4,
"valid_targets_min": 1591
},
{
"epoch": 5.7274247491638794,
"grad_norm": 0.8893474256351308,
"learning_rate": 3.904389878797159e-06,
"loss": 0.2598,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2710364758968353,
"step": 3425,
"valid_targets_mean": 3534.0,
"valid_targets_min": 1096
},
{
"epoch": 5.735785953177258,
"grad_norm": 0.8715257939471994,
"learning_rate": 3.85502735353658e-06,
"loss": 0.2492,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2547582983970642,
"step": 3430,
"valid_targets_mean": 3161.2,
"valid_targets_min": 1420
},
{
"epoch": 5.7441471571906355,
"grad_norm": 0.9676813409941313,
"learning_rate": 3.8059455559310167e-06,
"loss": 0.2423,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2646714746952057,
"step": 3435,
"valid_targets_mean": 3319.5,
"valid_targets_min": 1710
},
{
"epoch": 5.752508361204013,
"grad_norm": 0.8470578522309716,
"learning_rate": 3.757145339411332e-06,
"loss": 0.229,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22734609246253967,
"step": 3440,
"valid_targets_mean": 4302.4,
"valid_targets_min": 667
},
{
"epoch": 5.760869565217392,
"grad_norm": 0.853636864130374,
"learning_rate": 3.708627552512276e-06,
"loss": 0.2301,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20801186561584473,
"step": 3445,
"valid_targets_mean": 3614.8,
"valid_targets_min": 1135
},
{
"epoch": 5.769230769230769,
"grad_norm": 0.8787913423829194,
"learning_rate": 3.660393038857739e-06,
"loss": 0.2541,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22825166583061218,
"step": 3450,
"valid_targets_mean": 3887.0,
"valid_targets_min": 1180
},
{
"epoch": 5.777591973244148,
"grad_norm": 1.1205253969747466,
"learning_rate": 3.6124426371460542e-06,
"loss": 0.2611,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.272126704454422,
"step": 3455,
"valid_targets_mean": 2778.0,
"valid_targets_min": 600
},
{
"epoch": 5.785953177257525,
"grad_norm": 1.0498337049709496,
"learning_rate": 3.564777181135466e-06,
"loss": 0.2762,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2422400861978531,
"step": 3460,
"valid_targets_mean": 2545.4,
"valid_targets_min": 640
},
{
"epoch": 5.794314381270903,
"grad_norm": 1.1993568136310828,
"learning_rate": 3.517397499629589e-06,
"loss": 0.2378,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2053757905960083,
"step": 3465,
"valid_targets_mean": 3302.1,
"valid_targets_min": 1127
},
{
"epoch": 5.802675585284281,
"grad_norm": 0.843797327600791,
"learning_rate": 3.4703044164630064e-06,
"loss": 0.1986,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2291642725467682,
"step": 3470,
"valid_targets_mean": 4161.9,
"valid_targets_min": 1041
},
{
"epoch": 5.811036789297659,
"grad_norm": 0.8755458954346165,
"learning_rate": 3.4234987504869553e-06,
"loss": 0.2483,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3180461823940277,
"step": 3475,
"valid_targets_mean": 4406.1,
"valid_targets_min": 2243
},
{
"epoch": 5.8193979933110365,
"grad_norm": 1.0301442813101,
"learning_rate": 3.376981315555086e-06,
"loss": 0.2767,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27760040760040283,
"step": 3480,
"valid_targets_mean": 2683.6,
"valid_targets_min": 591
},
{
"epoch": 5.827759197324415,
"grad_norm": 0.9573217341539905,
"learning_rate": 3.3307529205092903e-06,
"loss": 0.273,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.368574321269989,
"step": 3485,
"valid_targets_mean": 4355.6,
"valid_targets_min": 520
},
{
"epoch": 5.8361204013377925,
"grad_norm": 1.029121606843474,
"learning_rate": 3.2848143691656807e-06,
"loss": 0.2549,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23345233500003815,
"step": 3490,
"valid_targets_mean": 2955.6,
"valid_targets_min": 1126
},
{
"epoch": 5.84448160535117,
"grad_norm": 1.0526837100245612,
"learning_rate": 3.239166460300571e-06,
"loss": 0.2456,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23312462866306305,
"step": 3495,
"valid_targets_mean": 2799.9,
"valid_targets_min": 1173
},
{
"epoch": 5.852842809364549,
"grad_norm": 0.9555127758551365,
"learning_rate": 3.1938099876366047e-06,
"loss": 0.2627,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2574623227119446,
"step": 3500,
"valid_targets_mean": 2801.6,
"valid_targets_min": 1072
},
{
"epoch": 5.861204013377926,
"grad_norm": 1.0434914071493264,
"learning_rate": 3.1487457398289645e-06,
"loss": 0.2476,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2559327781200409,
"step": 3505,
"valid_targets_mean": 3459.7,
"valid_targets_min": 788
},
{
"epoch": 5.869565217391305,
"grad_norm": 1.012926148789505,
"learning_rate": 3.1039745004516207e-06,
"loss": 0.2417,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2865094840526581,
"step": 3510,
"valid_targets_mean": 3056.8,
"valid_targets_min": 696
},
{
"epoch": 5.877926421404682,
"grad_norm": 0.9712574615035141,
"learning_rate": 3.0594970479837683e-06,
"loss": 0.2177,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21085739135742188,
"step": 3515,
"valid_targets_mean": 2824.9,
"valid_targets_min": 599
},
{
"epoch": 5.88628762541806,
"grad_norm": 1.0473259954733953,
"learning_rate": 3.015314155796234e-06,
"loss": 0.2031,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2044457346200943,
"step": 3520,
"valid_targets_mean": 2760.9,
"valid_targets_min": 715
},
{
"epoch": 5.894648829431438,
"grad_norm": 0.9843115195011657,
"learning_rate": 2.9714265921380557e-06,
"loss": 0.2371,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20010721683502197,
"step": 3525,
"valid_targets_mean": 2771.8,
"valid_targets_min": 963
},
{
"epoch": 5.903010033444816,
"grad_norm": 0.8585558006225893,
"learning_rate": 2.927835120123128e-06,
"loss": 0.2512,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3017348051071167,
"step": 3530,
"valid_targets_mean": 3708.9,
"valid_targets_min": 1217
},
{
"epoch": 5.911371237458194,
"grad_norm": 1.0365669573233212,
"learning_rate": 2.8845404977169057e-06,
"loss": 0.2316,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24910643696784973,
"step": 3535,
"valid_targets_mean": 3256.1,
"valid_targets_min": 1093
},
{
"epoch": 5.919732441471572,
"grad_norm": 1.1977783758414982,
"learning_rate": 2.841543477723254e-06,
"loss": 0.3115,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3304036557674408,
"step": 3540,
"valid_targets_mean": 4009.1,
"valid_targets_min": 1801
},
{
"epoch": 5.9280936454849495,
"grad_norm": 1.0475636986470853,
"learning_rate": 2.7988448077713592e-06,
"loss": 0.2254,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23120662569999695,
"step": 3545,
"valid_targets_mean": 2633.4,
"valid_targets_min": 1628
},
{
"epoch": 5.936454849498328,
"grad_norm": 0.8986613684835274,
"learning_rate": 2.7564452303027024e-06,
"loss": 0.24,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25718823075294495,
"step": 3550,
"valid_targets_mean": 3136.1,
"valid_targets_min": 1648
},
{
"epoch": 5.944816053511706,
"grad_norm": 0.8828527508561764,
"learning_rate": 2.7143454825581714e-06,
"loss": 0.2043,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.189050555229187,
"step": 3555,
"valid_targets_mean": 3121.1,
"valid_targets_min": 1683
},
{
"epoch": 5.953177257525084,
"grad_norm": 1.117960588110681,
"learning_rate": 2.672546296565237e-06,
"loss": 0.2232,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24358290433883667,
"step": 3560,
"valid_targets_mean": 3175.4,
"valid_targets_min": 1662
},
{
"epoch": 5.961538461538462,
"grad_norm": 1.0074867797130804,
"learning_rate": 2.6310483991252133e-06,
"loss": 0.2442,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2374524474143982,
"step": 3565,
"valid_targets_mean": 2834.6,
"valid_targets_min": 1201
},
{
"epoch": 5.969899665551839,
"grad_norm": 1.0690795488474825,
"learning_rate": 2.589852511800646e-06,
"loss": 0.2652,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17189118266105652,
"step": 3570,
"valid_targets_mean": 2602.5,
"valid_targets_min": 1331
},
{
"epoch": 5.978260869565218,
"grad_norm": 0.9971267052649938,
"learning_rate": 2.54895935090274e-06,
"loss": 0.2497,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21394936740398407,
"step": 3575,
"valid_targets_mean": 2751.8,
"valid_targets_min": 750
},
{
"epoch": 5.986622073578595,
"grad_norm": 0.9537557291572413,
"learning_rate": 2.508369627478917e-06,
"loss": 0.2331,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22841092944145203,
"step": 3580,
"valid_targets_mean": 3169.6,
"valid_targets_min": 799
},
{
"epoch": 5.994983277591973,
"grad_norm": 0.9343814378914798,
"learning_rate": 2.468084047300452e-06,
"loss": 0.2185,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2370833456516266,
"step": 3585,
"valid_targets_mean": 3215.1,
"valid_targets_min": 998
},
{
"epoch": 6.003344481605351,
"grad_norm": 0.8238052983578956,
"learning_rate": 2.4281033108501873e-06,
"loss": 0.2314,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2642517685890198,
"step": 3590,
"valid_targets_mean": 4032.8,
"valid_targets_min": 1390
},
{
"epoch": 6.011705685618729,
"grad_norm": 0.8851781452831197,
"learning_rate": 2.3884281133103725e-06,
"loss": 0.2232,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2074108123779297,
"step": 3595,
"valid_targets_mean": 3117.4,
"valid_targets_min": 685
},
{
"epoch": 6.0200668896321075,
"grad_norm": 1.0191065552656804,
"learning_rate": 2.3490591445505715e-06,
"loss": 0.2346,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20292872190475464,
"step": 3600,
"valid_targets_mean": 2607.1,
"valid_targets_min": 1071
},
{
"epoch": 6.028428093645485,
"grad_norm": 0.8274990269440808,
"learning_rate": 2.309997089115659e-06,
"loss": 0.2578,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27467474341392517,
"step": 3605,
"valid_targets_mean": 4511.8,
"valid_targets_min": 1261
},
{
"epoch": 6.036789297658863,
"grad_norm": 0.9829693732867127,
"learning_rate": 2.271242626213925e-06,
"loss": 0.2406,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2838166654109955,
"step": 3610,
"valid_targets_mean": 3051.6,
"valid_targets_min": 848
},
{
"epoch": 6.045150501672241,
"grad_norm": 0.9430424383463232,
"learning_rate": 2.232796429705253e-06,
"loss": 0.2751,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2801671028137207,
"step": 3615,
"valid_targets_mean": 3661.6,
"valid_targets_min": 783
},
{
"epoch": 6.053511705685619,
"grad_norm": 0.9799256756829944,
"learning_rate": 2.1946591680894145e-06,
"loss": 0.2252,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21253493428230286,
"step": 3620,
"valid_targets_mean": 3080.5,
"valid_targets_min": 1116
},
{
"epoch": 6.061872909698996,
"grad_norm": 0.890449059990666,
"learning_rate": 2.1568315044944586e-06,
"loss": 0.2279,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23232722282409668,
"step": 3625,
"valid_targets_mean": 3467.1,
"valid_targets_min": 689
},
{
"epoch": 6.070234113712375,
"grad_norm": 1.553508951062491,
"learning_rate": 2.1193140966651484e-06,
"loss": 0.2247,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2310488224029541,
"step": 3630,
"valid_targets_mean": 3239.2,
"valid_targets_min": 1426
},
{
"epoch": 6.078595317725752,
"grad_norm": 1.0015740592300846,
"learning_rate": 2.082107596951548e-06,
"loss": 0.2417,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2560243308544159,
"step": 3635,
"valid_targets_mean": 3611.4,
"valid_targets_min": 1662
},
{
"epoch": 6.086956521739131,
"grad_norm": 0.9610763495680839,
"learning_rate": 2.0452126522976746e-06,
"loss": 0.2572,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23907433450222015,
"step": 3640,
"valid_targets_mean": 3443.9,
"valid_targets_min": 971
},
{
"epoch": 6.095317725752508,
"grad_norm": 1.0195087469479902,
"learning_rate": 2.008629904230237e-06,
"loss": 0.2266,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21630674600601196,
"step": 3645,
"valid_targets_mean": 3096.0,
"valid_targets_min": 1263
},
{
"epoch": 6.103678929765886,
"grad_norm": 1.1781421008430892,
"learning_rate": 1.972359988847499e-06,
"loss": 0.2767,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22949744760990143,
"step": 3650,
"valid_targets_mean": 2490.5,
"valid_targets_min": 1214
},
{
"epoch": 6.1120401337792645,
"grad_norm": 1.0009259653669014,
"learning_rate": 1.9364035368082222e-06,
"loss": 0.2501,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17091065645217896,
"step": 3655,
"valid_targets_mean": 2323.1,
"valid_targets_min": 1277
},
{
"epoch": 6.120401337792642,
"grad_norm": 0.9973471406872797,
"learning_rate": 1.9007611733206733e-06,
"loss": 0.2399,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29807907342910767,
"step": 3660,
"valid_targets_mean": 3280.1,
"valid_targets_min": 919
},
{
"epoch": 6.12876254180602,
"grad_norm": 0.9458454127635654,
"learning_rate": 1.8654335181317784e-06,
"loss": 0.2427,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26122528314590454,
"step": 3665,
"valid_targets_mean": 3286.4,
"valid_targets_min": 1471
},
{
"epoch": 6.137123745819398,
"grad_norm": 0.9302638864213695,
"learning_rate": 1.8304211855163311e-06,
"loss": 0.2551,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30081790685653687,
"step": 3670,
"valid_targets_mean": 3793.2,
"valid_targets_min": 392
},
{
"epoch": 6.145484949832776,
"grad_norm": 0.9293216572645322,
"learning_rate": 1.7957247842663194e-06,
"loss": 0.2067,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2717227041721344,
"step": 3675,
"valid_targets_mean": 3530.5,
"valid_targets_min": 1072
},
{
"epoch": 6.153846153846154,
"grad_norm": 1.0642259780797343,
"learning_rate": 1.7613449176803476e-06,
"loss": 0.191,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18526840209960938,
"step": 3680,
"valid_targets_mean": 3227.3,
"valid_targets_min": 1819
},
{
"epoch": 6.162207357859532,
"grad_norm": 1.0950639668119169,
"learning_rate": 1.7272821835531295e-06,
"loss": 0.2536,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23934021592140198,
"step": 3685,
"valid_targets_mean": 2936.0,
"valid_targets_min": 1404
},
{
"epoch": 6.170568561872909,
"grad_norm": 0.8320781108074271,
"learning_rate": 1.693537174165103e-06,
"loss": 0.2569,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2670717239379883,
"step": 3690,
"valid_targets_mean": 4768.5,
"valid_targets_min": 754
},
{
"epoch": 6.178929765886288,
"grad_norm": 1.0190310935542606,
"learning_rate": 1.660110476272132e-06,
"loss": 0.2267,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1878700852394104,
"step": 3695,
"valid_targets_mean": 2822.3,
"valid_targets_min": 1513
},
{
"epoch": 6.187290969899665,
"grad_norm": 0.946671940766795,
"learning_rate": 1.6270026710952924e-06,
"loss": 0.2299,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18372738361358643,
"step": 3700,
"valid_targets_mean": 3202.5,
"valid_targets_min": 1844
},
{
"epoch": 6.195652173913044,
"grad_norm": 1.0311761236131074,
"learning_rate": 1.5942143343107953e-06,
"loss": 0.2366,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1737433671951294,
"step": 3705,
"valid_targets_mean": 2330.4,
"valid_targets_min": 983
},
{
"epoch": 6.2040133779264215,
"grad_norm": 1.7693463573078112,
"learning_rate": 1.5617460360399439e-06,
"loss": 0.2312,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24771828949451447,
"step": 3710,
"valid_targets_mean": 2783.2,
"valid_targets_min": 674
},
{
"epoch": 6.212374581939799,
"grad_norm": 1.1913402227691237,
"learning_rate": 1.529598340839238e-06,
"loss": 0.2247,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20294560492038727,
"step": 3715,
"valid_targets_mean": 3321.5,
"valid_targets_min": 1623
},
{
"epoch": 6.2207357859531776,
"grad_norm": 1.1205061236211051,
"learning_rate": 1.4977718076905533e-06,
"loss": 0.245,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20099762082099915,
"step": 3720,
"valid_targets_mean": 2455.0,
"valid_targets_min": 682
},
{
"epoch": 6.229096989966555,
"grad_norm": 0.872701348205632,
"learning_rate": 1.4662669899914161e-06,
"loss": 0.2251,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.240260511636734,
"step": 3725,
"valid_targets_mean": 4170.6,
"valid_targets_min": 587
},
{
"epoch": 6.237458193979933,
"grad_norm": 1.149500218715332,
"learning_rate": 1.4350844355453952e-06,
"loss": 0.2167,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24577274918556213,
"step": 3730,
"valid_targets_mean": 2776.9,
"valid_targets_min": 1146
},
{
"epoch": 6.245819397993311,
"grad_norm": 0.9744589071128174,
"learning_rate": 1.404224686552571e-06,
"loss": 0.2699,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2977054715156555,
"step": 3735,
"valid_targets_mean": 3161.8,
"valid_targets_min": 1420
},
{
"epoch": 6.254180602006689,
"grad_norm": 1.0622602777455052,
"learning_rate": 1.3736882796000983e-06,
"loss": 0.2217,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2422657608985901,
"step": 3740,
"valid_targets_mean": 3276.9,
"valid_targets_min": 2083
},
{
"epoch": 6.262541806020067,
"grad_norm": 0.9192780596090956,
"learning_rate": 1.3434757456528868e-06,
"loss": 0.2165,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23593655228614807,
"step": 3745,
"valid_targets_mean": 3154.8,
"valid_targets_min": 1058
},
{
"epoch": 6.270903010033445,
"grad_norm": 1.0794767225936577,
"learning_rate": 1.3135876100443557e-06,
"loss": 0.2451,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19183969497680664,
"step": 3750,
"valid_targets_mean": 2641.8,
"valid_targets_min": 1122
},
{
"epoch": 6.2792642140468224,
"grad_norm": 1.1069267787089752,
"learning_rate": 1.2840243924673202e-06,
"loss": 0.2327,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19526013731956482,
"step": 3755,
"valid_targets_mean": 2651.9,
"valid_targets_min": 1307
},
{
"epoch": 6.287625418060201,
"grad_norm": 0.9530346118359216,
"learning_rate": 1.2547866069649418e-06,
"loss": 0.2508,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2443237155675888,
"step": 3760,
"valid_targets_mean": 2864.8,
"valid_targets_min": 1587
},
{
"epoch": 6.2959866220735785,
"grad_norm": 0.9997194895255284,
"learning_rate": 1.225874761921788e-06,
"loss": 0.2238,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22411714494228363,
"step": 3765,
"valid_targets_mean": 2974.7,
"valid_targets_min": 1770
},
{
"epoch": 6.304347826086957,
"grad_norm": 0.9257546461579786,
"learning_rate": 1.1972893600550007e-06,
"loss": 0.271,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20396903157234192,
"step": 3770,
"valid_targets_mean": 3238.4,
"valid_targets_min": 696
},
{
"epoch": 6.312709030100335,
"grad_norm": 0.9526741297223604,
"learning_rate": 1.1690308984055454e-06,
"loss": 0.2326,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31394025683403015,
"step": 3775,
"valid_targets_mean": 3941.2,
"valid_targets_min": 1904
},
{
"epoch": 6.321070234113712,
"grad_norm": 1.0127893431246604,
"learning_rate": 1.141099868329576e-06,
"loss": 0.2697,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2128710150718689,
"step": 3780,
"valid_targets_mean": 3173.2,
"valid_targets_min": 2167
},
{
"epoch": 6.329431438127091,
"grad_norm": 0.8562910539058333,
"learning_rate": 1.1134967554898868e-06,
"loss": 0.2487,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3077230155467987,
"step": 3785,
"valid_targets_mean": 3871.0,
"valid_targets_min": 1399
},
{
"epoch": 6.337792642140468,
"grad_norm": 1.0570481175477418,
"learning_rate": 1.0862220398474798e-06,
"loss": 0.202,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24611452221870422,
"step": 3790,
"valid_targets_mean": 2720.8,
"valid_targets_min": 1018
},
{
"epoch": 6.346153846153846,
"grad_norm": 0.9974643589859099,
"learning_rate": 1.0592761956531983e-06,
"loss": 0.26,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15949031710624695,
"step": 3795,
"valid_targets_mean": 2890.8,
"valid_targets_min": 693
},
{
"epoch": 6.354515050167224,
"grad_norm": 1.0285315175075678,
"learning_rate": 1.0326596914395015e-06,
"loss": 0.2196,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.218702495098114,
"step": 3800,
"valid_targets_mean": 2983.0,
"valid_targets_min": 1307
},
{
"epoch": 6.362876254180602,
"grad_norm": 1.0391314709729795,
"learning_rate": 1.0063729900122943e-06,
"loss": 0.2349,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22132647037506104,
"step": 3805,
"valid_targets_mean": 3014.7,
"valid_targets_min": 1600
},
{
"epoch": 6.3712374581939795,
"grad_norm": 1.0732291866174521,
"learning_rate": 9.80416548442904e-07,
"loss": 0.2359,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16350066661834717,
"step": 3810,
"valid_targets_mean": 2471.2,
"valid_targets_min": 1252
},
{
"epoch": 6.379598662207358,
"grad_norm": 0.9478207894233418,
"learning_rate": 9.547908180601274e-07,
"loss": 0.218,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2005515992641449,
"step": 3815,
"valid_targets_mean": 3266.4,
"valid_targets_min": 1219
},
{
"epoch": 6.3879598662207355,
"grad_norm": 0.9884148175012485,
"learning_rate": 9.294962444423672e-07,
"loss": 0.2352,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18229839205741882,
"step": 3820,
"valid_targets_mean": 2692.9,
"valid_targets_min": 1731
},
{
"epoch": 6.396321070234114,
"grad_norm": 1.0689420786608823,
"learning_rate": 9.045332674099039e-07,
"loss": 0.2429,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2374996840953827,
"step": 3825,
"valid_targets_mean": 3234.9,
"valid_targets_min": 978
},
{
"epoch": 6.404682274247492,
"grad_norm": 0.9999053556423455,
"learning_rate": 8.799023210172319e-07,
"loss": 0.2183,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2577441334724426,
"step": 3830,
"valid_targets_mean": 3541.5,
"valid_targets_min": 860
},
{
"epoch": 6.413043478260869,
"grad_norm": 1.0162923003110396,
"learning_rate": 8.556038335455241e-07,
"loss": 0.2354,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17862260341644287,
"step": 3835,
"valid_targets_mean": 3000.1,
"valid_targets_min": 1116
},
{
"epoch": 6.421404682274248,
"grad_norm": 0.9436887696227507,
"learning_rate": 8.316382274951773e-07,
"loss": 0.2596,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3100453317165375,
"step": 3840,
"valid_targets_mean": 4021.4,
"valid_targets_min": 556
},
{
"epoch": 6.429765886287625,
"grad_norm": 0.9165404614671304,
"learning_rate": 8.080059195784829e-07,
"loss": 0.2715,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29584699869155884,
"step": 3845,
"valid_targets_mean": 3990.2,
"valid_targets_min": 1509
},
{
"epoch": 6.438127090301004,
"grad_norm": 1.1633047424989935,
"learning_rate": 7.847073207123523e-07,
"loss": 0.2805,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2624181807041168,
"step": 3850,
"valid_targets_mean": 2811.7,
"valid_targets_min": 1472
},
{
"epoch": 6.446488294314381,
"grad_norm": 0.9983233707225826,
"learning_rate": 7.617428360111945e-07,
"loss": 0.2271,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.281194269657135,
"step": 3855,
"valid_targets_mean": 3405.9,
"valid_targets_min": 738
},
{
"epoch": 6.454849498327759,
"grad_norm": 1.1246524097930575,
"learning_rate": 7.391128647798607e-07,
"loss": 0.2389,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22077451646327972,
"step": 3860,
"valid_targets_mean": 2505.6,
"valid_targets_min": 1234
},
{
"epoch": 6.463210702341137,
"grad_norm": 0.886456015080147,
"learning_rate": 7.168178005067062e-07,
"loss": 0.2656,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29799652099609375,
"step": 3865,
"valid_targets_mean": 3983.9,
"valid_targets_min": 1248
},
{
"epoch": 6.471571906354515,
"grad_norm": 1.103332362483573,
"learning_rate": 6.948580308567532e-07,
"loss": 0.2222,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2571655511856079,
"step": 3870,
"valid_targets_mean": 2698.6,
"valid_targets_min": 710
},
{
"epoch": 6.479933110367893,
"grad_norm": 1.0813420856710951,
"learning_rate": 6.732339376649388e-07,
"loss": 0.2307,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22849063575267792,
"step": 3875,
"valid_targets_mean": 2950.5,
"valid_targets_min": 1156
},
{
"epoch": 6.488294314381271,
"grad_norm": 1.0707482467762934,
"learning_rate": 6.519458969294845e-07,
"loss": 0.2237,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18700650334358215,
"step": 3880,
"valid_targets_mean": 2505.4,
"valid_targets_min": 1004
},
{
"epoch": 6.496655518394649,
"grad_norm": 0.9136997187616676,
"learning_rate": 6.309942788053502e-07,
"loss": 0.2166,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18983229994773865,
"step": 3885,
"valid_targets_mean": 2847.4,
"valid_targets_min": 1011
},
{
"epoch": 6.505016722408027,
"grad_norm": 0.9836787164297042,
"learning_rate": 6.103794475978086e-07,
"loss": 0.2476,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27802348136901855,
"step": 3890,
"valid_targets_mean": 3571.6,
"valid_targets_min": 1766
},
{
"epoch": 6.513377926421405,
"grad_norm": 1.0040587188078438,
"learning_rate": 5.901017617560989e-07,
"loss": 0.2256,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2178075611591339,
"step": 3895,
"valid_targets_mean": 3485.3,
"valid_targets_min": 1748
},
{
"epoch": 6.521739130434782,
"grad_norm": 0.9972334739609068,
"learning_rate": 5.701615738672073e-07,
"loss": 0.2391,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2519034743309021,
"step": 3900,
"valid_targets_mean": 3683.1,
"valid_targets_min": 1279
},
{
"epoch": 6.530100334448161,
"grad_norm": 1.0048200677550907,
"learning_rate": 5.505592306497298e-07,
"loss": 0.2199,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2037794291973114,
"step": 3905,
"valid_targets_mean": 2815.6,
"valid_targets_min": 1187
},
{
"epoch": 6.538461538461538,
"grad_norm": 0.9738058489579007,
"learning_rate": 5.312950729478327e-07,
"loss": 0.2571,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1917770355939865,
"step": 3910,
"valid_targets_mean": 2968.3,
"valid_targets_min": 1757
},
{
"epoch": 6.546822742474916,
"grad_norm": 0.9699331976466884,
"learning_rate": 5.123694357253439e-07,
"loss": 0.2332,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19296962022781372,
"step": 3915,
"valid_targets_mean": 3587.3,
"valid_targets_min": 1059
},
{
"epoch": 6.555183946488294,
"grad_norm": 0.9210291981550992,
"learning_rate": 4.937826480599195e-07,
"loss": 0.239,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25981834530830383,
"step": 3920,
"valid_targets_mean": 3616.3,
"valid_targets_min": 772
},
{
"epoch": 6.563545150501672,
"grad_norm": 0.9639041354225487,
"learning_rate": 4.755350331373243e-07,
"loss": 0.2665,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22324317693710327,
"step": 3925,
"valid_targets_mean": 3426.1,
"valid_targets_min": 1477
},
{
"epoch": 6.5719063545150505,
"grad_norm": 1.0060449285500996,
"learning_rate": 4.576269082458118e-07,
"loss": 0.2155,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18587031960487366,
"step": 3930,
"valid_targets_mean": 2988.8,
"valid_targets_min": 1536
},
{
"epoch": 6.580267558528428,
"grad_norm": 1.125813362538308,
"learning_rate": 4.4005858477060404e-07,
"loss": 0.2445,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21866926550865173,
"step": 3935,
"valid_targets_mean": 3366.3,
"valid_targets_min": 1060
},
{
"epoch": 6.588628762541806,
"grad_norm": 1.0628904813820763,
"learning_rate": 4.228303681884782e-07,
"loss": 0.2324,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25543057918548584,
"step": 3940,
"valid_targets_mean": 3191.6,
"valid_targets_min": 1800
},
{
"epoch": 6.596989966555184,
"grad_norm": 0.9915725733061522,
"learning_rate": 4.059425580624576e-07,
"loss": 0.2374,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28621232509613037,
"step": 3945,
"valid_targets_mean": 3603.1,
"valid_targets_min": 1548
},
{
"epoch": 6.605351170568562,
"grad_norm": 0.9949146897868569,
"learning_rate": 3.893954480366091e-07,
"loss": 0.227,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1640351116657257,
"step": 3950,
"valid_targets_mean": 2460.5,
"valid_targets_min": 880
},
{
"epoch": 6.61371237458194,
"grad_norm": 1.111214711835855,
"learning_rate": 3.731893258309227e-07,
"loss": 0.2271,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22030051052570343,
"step": 3955,
"valid_targets_mean": 2509.4,
"valid_targets_min": 553
},
{
"epoch": 6.622073578595318,
"grad_norm": 1.1676078726615438,
"learning_rate": 3.573244732363179e-07,
"loss": 0.2437,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.243607297539711,
"step": 3960,
"valid_targets_mean": 3134.6,
"valid_targets_min": 689
},
{
"epoch": 6.630434782608695,
"grad_norm": 0.9596071900127525,
"learning_rate": 3.4180116610973645e-07,
"loss": 0.2194,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.280606210231781,
"step": 3965,
"valid_targets_mean": 3487.9,
"valid_targets_min": 1539
},
{
"epoch": 6.638795986622074,
"grad_norm": 1.0307311782355484,
"learning_rate": 3.2661967436936394e-07,
"loss": 0.2347,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2129300832748413,
"step": 3970,
"valid_targets_mean": 3150.9,
"valid_targets_min": 364
},
{
"epoch": 6.647157190635451,
"grad_norm": 0.9029900853777432,
"learning_rate": 3.117802619899113e-07,
"loss": 0.2266,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2022523730993271,
"step": 3975,
"valid_targets_mean": 3131.2,
"valid_targets_min": 1462
},
{
"epoch": 6.65551839464883,
"grad_norm": 0.9353250337198755,
"learning_rate": 2.9728318699804525e-07,
"loss": 0.2183,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26376834511756897,
"step": 3980,
"valid_targets_mean": 3456.8,
"valid_targets_min": 1636
},
{
"epoch": 6.6638795986622075,
"grad_norm": 1.1365720683226703,
"learning_rate": 2.831287014678941e-07,
"loss": 0.2141,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19698631763458252,
"step": 3985,
"valid_targets_mean": 2634.6,
"valid_targets_min": 569
},
{
"epoch": 6.672240802675585,
"grad_norm": 0.9037444665225245,
"learning_rate": 2.693170515166599e-07,
"loss": 0.2162,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17331139743328094,
"step": 3990,
"valid_targets_mean": 3423.4,
"valid_targets_min": 2070
},
{
"epoch": 6.6806020066889635,
"grad_norm": 1.012894148288379,
"learning_rate": 2.558484773003445e-07,
"loss": 0.2485,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2655693292617798,
"step": 3995,
"valid_targets_mean": 3323.4,
"valid_targets_min": 1844
},
{
"epoch": 6.688963210702341,
"grad_norm": 0.9548388318374232,
"learning_rate": 2.427232130095747e-07,
"loss": 0.2373,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21322210133075714,
"step": 4000,
"valid_targets_mean": 2801.6,
"valid_targets_min": 1264
},
{
"epoch": 6.697324414715719,
"grad_norm": 1.0832658905494663,
"learning_rate": 2.299414868655281e-07,
"loss": 0.2434,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2207055389881134,
"step": 4005,
"valid_targets_mean": 2772.9,
"valid_targets_min": 1399
},
{
"epoch": 6.705685618729097,
"grad_norm": 0.9005094142183284,
"learning_rate": 2.1750352111596707e-07,
"loss": 0.24,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24203582108020782,
"step": 4010,
"valid_targets_mean": 3876.8,
"valid_targets_min": 2273
},
{
"epoch": 6.714046822742475,
"grad_norm": 0.9978940251893587,
"learning_rate": 2.0540953203137093e-07,
"loss": 0.225,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1879318505525589,
"step": 4015,
"valid_targets_mean": 3497.7,
"valid_targets_min": 1234
},
{
"epoch": 6.722408026755852,
"grad_norm": 0.9909059278250834,
"learning_rate": 1.9365972990117e-07,
"loss": 0.2323,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1991642862558365,
"step": 4020,
"valid_targets_mean": 2930.1,
"valid_targets_min": 1353
},
{
"epoch": 6.730769230769231,
"grad_norm": 0.9925673396527694,
"learning_rate": 1.8225431903010403e-07,
"loss": 0.2172,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23669245839118958,
"step": 4025,
"valid_targets_mean": 2976.0,
"valid_targets_min": 978
},
{
"epoch": 6.739130434782608,
"grad_norm": 0.97958659307702,
"learning_rate": 1.7119349773466076e-07,
"loss": 0.2493,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18920472264289856,
"step": 4030,
"valid_targets_mean": 2922.8,
"valid_targets_min": 799
},
{
"epoch": 6.747491638795987,
"grad_norm": 0.9895938981944002,
"learning_rate": 1.6047745833962735e-07,
"loss": 0.2638,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4012299180030823,
"step": 4035,
"valid_targets_mean": 4044.7,
"valid_targets_min": 750
},
{
"epoch": 6.7558528428093645,
"grad_norm": 1.005865202853038,
"learning_rate": 1.5010638717474878e-07,
"loss": 0.2231,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2346489280462265,
"step": 4040,
"valid_targets_mean": 3234.9,
"valid_targets_min": 1001
},
{
"epoch": 6.764214046822742,
"grad_norm": 0.9665878862524135,
"learning_rate": 1.400804645714815e-07,
"loss": 0.235,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20860449969768524,
"step": 4045,
"valid_targets_mean": 2963.2,
"valid_targets_min": 1512
},
{
"epoch": 6.7725752508361206,
"grad_norm": 0.9073442199596257,
"learning_rate": 1.30399864859867e-07,
"loss": 0.2187,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21425005793571472,
"step": 4050,
"valid_targets_mean": 4054.4,
"valid_targets_min": 970
},
{
"epoch": 6.780936454849498,
"grad_norm": 1.1395884258364646,
"learning_rate": 1.2106475636549654e-07,
"loss": 0.2503,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2343166172504425,
"step": 4055,
"valid_targets_mean": 2424.9,
"valid_targets_min": 511
},
{
"epoch": 6.789297658862877,
"grad_norm": 1.2355832602043204,
"learning_rate": 1.1207530140658452e-07,
"loss": 0.247,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1832336038351059,
"step": 4060,
"valid_targets_mean": 2785.1,
"valid_targets_min": 1439
},
{
"epoch": 6.797658862876254,
"grad_norm": 1.0756162811102452,
"learning_rate": 1.0343165629114416e-07,
"loss": 0.2292,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2562386989593506,
"step": 4065,
"valid_targets_mean": 2926.1,
"valid_targets_min": 1110
},
{
"epoch": 6.806020066889632,
"grad_norm": 1.12479348737203,
"learning_rate": 9.513397131427404e-08,
"loss": 0.2543,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19680562615394592,
"step": 4070,
"valid_targets_mean": 3050.8,
"valid_targets_min": 1505
},
{
"epoch": 6.81438127090301,
"grad_norm": 1.3027817427113138,
"learning_rate": 8.71823907555358e-08,
"loss": 0.2794,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2448652684688568,
"step": 4075,
"valid_targets_mean": 3234.3,
"valid_targets_min": 965
},
{
"epoch": 6.822742474916388,
"grad_norm": 1.0120756120555998,
"learning_rate": 7.957705287645834e-08,
"loss": 0.2318,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.236515074968338,
"step": 4080,
"valid_targets_mean": 3107.5,
"valid_targets_min": 1469
},
{
"epoch": 6.831103678929766,
"grad_norm": 1.1643671752495577,
"learning_rate": 7.231808991812639e-08,
"loss": 0.227,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24128901958465576,
"step": 4085,
"valid_targets_mean": 2651.4,
"valid_targets_min": 513
},
{
"epoch": 6.839464882943144,
"grad_norm": 1.0224383394242054,
"learning_rate": 6.540562809887574e-08,
"loss": 0.2128,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2086195945739746,
"step": 4090,
"valid_targets_mean": 2881.9,
"valid_targets_min": 594
},
{
"epoch": 6.8478260869565215,
"grad_norm": 0.8984874112503329,
"learning_rate": 5.8839787612114955e-08,
"loss": 0.2302,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19981077313423157,
"step": 4095,
"valid_targets_mean": 3368.8,
"valid_targets_min": 1532
},
{
"epoch": 6.8561872909699,
"grad_norm": 1.1889036672332234,
"learning_rate": 5.2620682624213714e-08,
"loss": 0.2788,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3057703673839569,
"step": 4100,
"valid_targets_mean": 2838.0,
"valid_targets_min": 520
},
{
"epoch": 6.864548494983278,
"grad_norm": 0.9722791686736607,
"learning_rate": 4.6748421272537756e-08,
"loss": 0.2356,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3012353777885437,
"step": 4105,
"valid_targets_mean": 3410.2,
"valid_targets_min": 401
},
{
"epoch": 6.872909698996655,
"grad_norm": 0.8439698339063494,
"learning_rate": 4.1223105663554806e-08,
"loss": 0.2274,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22458210587501526,
"step": 4110,
"valid_targets_mean": 4013.0,
"valid_targets_min": 967
},
{
"epoch": 6.881270903010034,
"grad_norm": 0.9937076155434867,
"learning_rate": 3.604483187106711e-08,
"loss": 0.2557,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21647757291793823,
"step": 4115,
"valid_targets_mean": 2891.7,
"valid_targets_min": 1398
},
{
"epoch": 6.889632107023411,
"grad_norm": 0.9554683145250049,
"learning_rate": 3.1213689934537215e-08,
"loss": 0.2428,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.227905735373497,
"step": 4120,
"valid_targets_mean": 3056.9,
"valid_targets_min": 1091
},
{
"epoch": 6.897993311036789,
"grad_norm": 0.9851841831055532,
"learning_rate": 2.6729763857522573e-08,
"loss": 0.2184,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20012471079826355,
"step": 4125,
"valid_targets_mean": 2812.2,
"valid_targets_min": 959
},
{
"epoch": 6.906354515050167,
"grad_norm": 0.9102139042294596,
"learning_rate": 2.2593131606216677e-08,
"loss": 0.2404,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22855457663536072,
"step": 4130,
"valid_targets_mean": 3411.4,
"valid_targets_min": 780
},
{
"epoch": 6.914715719063545,
"grad_norm": 0.9968709409763933,
"learning_rate": 1.880386510809018e-08,
"loss": 0.2175,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24055655300617218,
"step": 4135,
"valid_targets_mean": 2944.4,
"valid_targets_min": 1447
},
{
"epoch": 6.923076923076923,
"grad_norm": 1.0089101681026145,
"learning_rate": 1.536203025064742e-08,
"loss": 0.2634,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23049476742744446,
"step": 4140,
"valid_targets_mean": 3192.5,
"valid_targets_min": 1745
},
{
"epoch": 6.931438127090301,
"grad_norm": 1.0054169631158152,
"learning_rate": 1.226768688026736e-08,
"loss": 0.2575,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21784156560897827,
"step": 4145,
"valid_targets_mean": 2982.2,
"valid_targets_min": 663
},
{
"epoch": 6.9397993311036785,
"grad_norm": 1.0500654956007207,
"learning_rate": 9.520888801182182e-09,
"loss": 0.2275,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21303492784500122,
"step": 4150,
"valid_targets_mean": 2794.8,
"valid_targets_min": 1323
},
{
"epoch": 6.948160535117057,
"grad_norm": 1.054419064540089,
"learning_rate": 7.121683774518051e-09,
"loss": 0.2378,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17308101058006287,
"step": 4155,
"valid_targets_mean": 2646.4,
"valid_targets_min": 1295
},
{
"epoch": 6.956521739130435,
"grad_norm": 1.00371154489669,
"learning_rate": 5.0701135174890944e-09,
"loss": 0.2474,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29931163787841797,
"step": 4160,
"valid_targets_mean": 3849.4,
"valid_targets_min": 403
},
{
"epoch": 6.964882943143813,
"grad_norm": 0.930732845194307,
"learning_rate": 3.3662137026535537e-09,
"loss": 0.2348,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22841259837150574,
"step": 4165,
"valid_targets_mean": 3192.3,
"valid_targets_min": 1398
},
{
"epoch": 6.973244147157191,
"grad_norm": 0.9699847666900223,
"learning_rate": 2.0100139573031584e-09,
"loss": 0.2398,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2246263176202774,
"step": 4170,
"valid_targets_mean": 2845.4,
"valid_targets_min": 1337
},
{
"epoch": 6.981605351170568,
"grad_norm": 0.9378995458223955,
"learning_rate": 1.0015378629413265e-09,
"loss": 0.2268,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21635910868644714,
"step": 4175,
"valid_targets_mean": 2931.9,
"valid_targets_min": 780
},
{
"epoch": 6.989966555183947,
"grad_norm": 1.0220155583231438,
"learning_rate": 3.4080295488347903e-10,
"loss": 0.2187,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2119850516319275,
"step": 4180,
"valid_targets_mean": 2728.2,
"valid_targets_min": 1313
},
{
"epoch": 6.998327759197324,
"grad_norm": 0.9751477515928492,
"learning_rate": 2.7820721939519902e-11,
"loss": 0.231,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21303658187389374,
"step": 4185,
"valid_targets_mean": 3151.9,
"valid_targets_min": 1522
},
{
"epoch": 7.0,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22936706244945526,
"step": 4186,
"total_flos": 791537577689088.0,
"train_loss": 0.17696809689205084,
"train_runtime": 13311.7439,
"train_samples_per_second": 5.027,
"train_steps_per_second": 0.314,
"valid_targets_mean": 3387.6,
"valid_targets_min": 1204
}
],
"logging_steps": 5,
"max_steps": 4186,
"num_input_tokens_seen": 0,
"num_train_epochs": 7,
"save_steps": 1500,
"stateful_callbacks": {
"TrainerControl": {
"args": {
"should_epoch_stop": false,
"should_evaluate": false,
"should_log": false,
"should_save": true,
"should_training_stop": true
},
"attributes": {}
}
},
"total_flos": 791537577689088.0,
"train_batch_size": 1,
"trial_name": null,
"trial_params": null
}