{ "best_global_step": null, "best_metric": null, "best_model_checkpoint": null, "epoch": 7.0, "eval_steps": 500, "global_step": 4368, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.00801924619085806, "grad_norm": 8.313740982008923, "learning_rate": 3.661327231121282e-07, "loss": 0.869, "loss_nan_ranks": 0, "loss_rank_avg": 0.48422402143478394, "step": 5, "valid_targets_mean": 3345.4, "valid_targets_min": 1130 }, { "epoch": 0.01603849238171612, "grad_norm": 8.69878286285814, "learning_rate": 8.237986270022884e-07, "loss": 0.8969, "loss_nan_ranks": 0, "loss_rank_avg": 0.5387725234031677, "step": 10, "valid_targets_mean": 3215.9, "valid_targets_min": 1626 }, { "epoch": 0.024057738572574178, "grad_norm": 7.088732892506888, "learning_rate": 1.2814645308924487e-06, "loss": 0.8442, "loss_nan_ranks": 0, "loss_rank_avg": 0.3239784836769104, "step": 15, "valid_targets_mean": 4054.0, "valid_targets_min": 1373 }, { "epoch": 0.03207698476343224, "grad_norm": 5.514543935307852, "learning_rate": 1.7391304347826088e-06, "loss": 0.8457, "loss_nan_ranks": 0, "loss_rank_avg": 0.30969667434692383, "step": 20, "valid_targets_mean": 3318.2, "valid_targets_min": 1351 }, { "epoch": 0.040096230954290296, "grad_norm": 4.91461430890284, "learning_rate": 2.196796338672769e-06, "loss": 0.8157, "loss_nan_ranks": 0, "loss_rank_avg": 0.30109691619873047, "step": 25, "valid_targets_mean": 4198.5, "valid_targets_min": 1501 }, { "epoch": 0.048115477145148355, "grad_norm": 4.047882001978824, "learning_rate": 2.654462242562929e-06, "loss": 0.7751, "loss_nan_ranks": 0, "loss_rank_avg": 0.5099153518676758, "step": 30, "valid_targets_mean": 4115.9, "valid_targets_min": 1498 }, { "epoch": 0.056134723336006415, "grad_norm": 3.0199670668025567, "learning_rate": 3.1121281464530894e-06, "loss": 0.7276, "loss_nan_ranks": 0, "loss_rank_avg": 0.37805676460266113, "step": 35, "valid_targets_mean": 3285.9, "valid_targets_min": 1410 }, { "epoch": 0.06415396952686447, "grad_norm": 1.9962784811319771, "learning_rate": 3.56979405034325e-06, "loss": 0.7159, "loss_nan_ranks": 0, "loss_rank_avg": 0.36083686351776123, "step": 40, "valid_targets_mean": 4623.9, "valid_targets_min": 1285 }, { "epoch": 0.07217321571772253, "grad_norm": 1.3260517674540337, "learning_rate": 4.0274599542334094e-06, "loss": 0.6569, "loss_nan_ranks": 0, "loss_rank_avg": 0.4008219540119171, "step": 45, "valid_targets_mean": 4624.8, "valid_targets_min": 1879 }, { "epoch": 0.08019246190858059, "grad_norm": 1.243564937333077, "learning_rate": 4.48512585812357e-06, "loss": 0.6293, "loss_nan_ranks": 0, "loss_rank_avg": 0.26258644461631775, "step": 50, "valid_targets_mean": 2541.2, "valid_targets_min": 692 }, { "epoch": 0.08821170809943865, "grad_norm": 1.0342084536151661, "learning_rate": 4.94279176201373e-06, "loss": 0.6711, "loss_nan_ranks": 0, "loss_rank_avg": 0.3230687975883484, "step": 55, "valid_targets_mean": 3970.5, "valid_targets_min": 938 }, { "epoch": 0.09623095429029671, "grad_norm": 1.000715187181818, "learning_rate": 5.400457665903891e-06, "loss": 0.6423, "loss_nan_ranks": 0, "loss_rank_avg": 0.4008551836013794, "step": 60, "valid_targets_mean": 6482.1, "valid_targets_min": 2441 }, { "epoch": 0.10425020048115477, "grad_norm": 0.9742888960296938, "learning_rate": 5.858123569794051e-06, "loss": 0.6364, "loss_nan_ranks": 0, "loss_rank_avg": 0.3344465494155884, "step": 65, "valid_targets_mean": 3673.5, "valid_targets_min": 1071 }, { "epoch": 0.11226944667201283, "grad_norm": 0.8790762890640784, "learning_rate": 6.31578947368421e-06, "loss": 0.6252, "loss_nan_ranks": 0, "loss_rank_avg": 0.3023986220359802, "step": 70, "valid_targets_mean": 3469.6, "valid_targets_min": 1955 }, { "epoch": 0.12028869286287089, "grad_norm": 0.8929131904667906, "learning_rate": 6.773455377574372e-06, "loss": 0.606, "loss_nan_ranks": 0, "loss_rank_avg": 0.21897467970848083, "step": 75, "valid_targets_mean": 2452.0, "valid_targets_min": 1645 }, { "epoch": 0.12830793905372895, "grad_norm": 0.7663072367257558, "learning_rate": 7.231121281464531e-06, "loss": 0.5629, "loss_nan_ranks": 0, "loss_rank_avg": 0.241590678691864, "step": 80, "valid_targets_mean": 4069.1, "valid_targets_min": 1336 }, { "epoch": 0.136327185244587, "grad_norm": 0.7343387826633802, "learning_rate": 7.688787185354691e-06, "loss": 0.6027, "loss_nan_ranks": 0, "loss_rank_avg": 0.21094068884849548, "step": 85, "valid_targets_mean": 3845.5, "valid_targets_min": 1581 }, { "epoch": 0.14434643143544507, "grad_norm": 0.8153893864380317, "learning_rate": 8.146453089244852e-06, "loss": 0.5877, "loss_nan_ranks": 0, "loss_rank_avg": 0.3595584034919739, "step": 90, "valid_targets_mean": 4052.0, "valid_targets_min": 1634 }, { "epoch": 0.15236567762630313, "grad_norm": 0.6932668353955103, "learning_rate": 8.604118993135013e-06, "loss": 0.5497, "loss_nan_ranks": 0, "loss_rank_avg": 0.33834296464920044, "step": 95, "valid_targets_mean": 5480.1, "valid_targets_min": 1283 }, { "epoch": 0.16038492381716118, "grad_norm": 0.7777890816483226, "learning_rate": 9.061784897025172e-06, "loss": 0.5655, "loss_nan_ranks": 0, "loss_rank_avg": 0.33180496096611023, "step": 100, "valid_targets_mean": 3460.2, "valid_targets_min": 1868 }, { "epoch": 0.16840417000801924, "grad_norm": 0.5283169926803735, "learning_rate": 9.519450800915333e-06, "loss": 0.5399, "loss_nan_ranks": 0, "loss_rank_avg": 0.2036198526620865, "step": 105, "valid_targets_mean": 5922.9, "valid_targets_min": 2107 }, { "epoch": 0.1764234161988773, "grad_norm": 0.697221665984805, "learning_rate": 9.977116704805492e-06, "loss": 0.5073, "loss_nan_ranks": 0, "loss_rank_avg": 0.2451438009738922, "step": 110, "valid_targets_mean": 3265.9, "valid_targets_min": 2124 }, { "epoch": 0.18444266238973536, "grad_norm": 0.7008730936667373, "learning_rate": 1.0434782608695653e-05, "loss": 0.5299, "loss_nan_ranks": 0, "loss_rank_avg": 0.3022688925266266, "step": 115, "valid_targets_mean": 4371.0, "valid_targets_min": 1146 }, { "epoch": 0.19246190858059342, "grad_norm": 0.6439155109775441, "learning_rate": 1.0892448512585814e-05, "loss": 0.4918, "loss_nan_ranks": 0, "loss_rank_avg": 0.25761961936950684, "step": 120, "valid_targets_mean": 4046.0, "valid_targets_min": 1546 }, { "epoch": 0.20048115477145148, "grad_norm": 0.5833963512550437, "learning_rate": 1.1350114416475973e-05, "loss": 0.5327, "loss_nan_ranks": 0, "loss_rank_avg": 0.21748362481594086, "step": 125, "valid_targets_mean": 4139.4, "valid_targets_min": 1287 }, { "epoch": 0.20850040096230954, "grad_norm": 0.7103416991437168, "learning_rate": 1.1807780320366134e-05, "loss": 0.5084, "loss_nan_ranks": 0, "loss_rank_avg": 0.2946273684501648, "step": 130, "valid_targets_mean": 4061.2, "valid_targets_min": 1811 }, { "epoch": 0.2165196471531676, "grad_norm": 0.6807314277664426, "learning_rate": 1.2265446224256295e-05, "loss": 0.5241, "loss_nan_ranks": 0, "loss_rank_avg": 0.2987809181213379, "step": 135, "valid_targets_mean": 4009.8, "valid_targets_min": 1916 }, { "epoch": 0.22453889334402566, "grad_norm": 0.7480876393642586, "learning_rate": 1.2723112128146454e-05, "loss": 0.5581, "loss_nan_ranks": 0, "loss_rank_avg": 0.30567678809165955, "step": 140, "valid_targets_mean": 3422.6, "valid_targets_min": 1463 }, { "epoch": 0.23255813953488372, "grad_norm": 0.6184882136658373, "learning_rate": 1.3180778032036615e-05, "loss": 0.5081, "loss_nan_ranks": 0, "loss_rank_avg": 0.2955462336540222, "step": 145, "valid_targets_mean": 5266.5, "valid_targets_min": 1721 }, { "epoch": 0.24057738572574178, "grad_norm": 0.629492550820491, "learning_rate": 1.3638443935926776e-05, "loss": 0.5211, "loss_nan_ranks": 0, "loss_rank_avg": 0.20750996470451355, "step": 150, "valid_targets_mean": 3665.2, "valid_targets_min": 1339 }, { "epoch": 0.24859663191659984, "grad_norm": 0.7885648489531245, "learning_rate": 1.4096109839816933e-05, "loss": 0.4779, "loss_nan_ranks": 0, "loss_rank_avg": 0.34341418743133545, "step": 155, "valid_targets_mean": 4196.0, "valid_targets_min": 1501 }, { "epoch": 0.2566158781074579, "grad_norm": 0.6300044643868511, "learning_rate": 1.4553775743707096e-05, "loss": 0.4933, "loss_nan_ranks": 0, "loss_rank_avg": 0.2758129835128784, "step": 160, "valid_targets_mean": 5468.2, "valid_targets_min": 1288 }, { "epoch": 0.264635124298316, "grad_norm": 0.6391644825807138, "learning_rate": 1.5011441647597256e-05, "loss": 0.4866, "loss_nan_ranks": 0, "loss_rank_avg": 0.3081105649471283, "step": 165, "valid_targets_mean": 5716.5, "valid_targets_min": 2127 }, { "epoch": 0.272654370489174, "grad_norm": 0.7935923586616551, "learning_rate": 1.5469107551487414e-05, "loss": 0.5083, "loss_nan_ranks": 0, "loss_rank_avg": 0.2117885947227478, "step": 170, "valid_targets_mean": 2941.4, "valid_targets_min": 810 }, { "epoch": 0.2806736166800321, "grad_norm": 0.6530606093704732, "learning_rate": 1.5926773455377575e-05, "loss": 0.4928, "loss_nan_ranks": 0, "loss_rank_avg": 0.195469468832016, "step": 175, "valid_targets_mean": 3944.8, "valid_targets_min": 1484 }, { "epoch": 0.28869286287089013, "grad_norm": 0.6446059581638844, "learning_rate": 1.6384439359267736e-05, "loss": 0.4739, "loss_nan_ranks": 0, "loss_rank_avg": 0.29873958230018616, "step": 180, "valid_targets_mean": 5453.0, "valid_targets_min": 1483 }, { "epoch": 0.2967121090617482, "grad_norm": 0.6138929387268349, "learning_rate": 1.6842105263157896e-05, "loss": 0.4805, "loss_nan_ranks": 0, "loss_rank_avg": 0.15602803230285645, "step": 185, "valid_targets_mean": 3395.1, "valid_targets_min": 1011 }, { "epoch": 0.30473135525260625, "grad_norm": 0.7895610581771481, "learning_rate": 1.7299771167048057e-05, "loss": 0.4829, "loss_nan_ranks": 0, "loss_rank_avg": 0.2401597499847412, "step": 190, "valid_targets_mean": 2895.6, "valid_targets_min": 1599 }, { "epoch": 0.31275060144346434, "grad_norm": 0.729603285280062, "learning_rate": 1.7757437070938218e-05, "loss": 0.527, "loss_nan_ranks": 0, "loss_rank_avg": 0.2671535015106201, "step": 195, "valid_targets_mean": 3562.6, "valid_targets_min": 1527 }, { "epoch": 0.32076984763432237, "grad_norm": 0.5253955703069345, "learning_rate": 1.8215102974828376e-05, "loss": 0.5199, "loss_nan_ranks": 0, "loss_rank_avg": 0.2831480801105499, "step": 200, "valid_targets_mean": 7620.6, "valid_targets_min": 1700 }, { "epoch": 0.32878909382518046, "grad_norm": 0.6865277172463633, "learning_rate": 1.8672768878718537e-05, "loss": 0.4971, "loss_nan_ranks": 0, "loss_rank_avg": 0.16837254166603088, "step": 205, "valid_targets_mean": 3245.9, "valid_targets_min": 1096 }, { "epoch": 0.3368083400160385, "grad_norm": 0.6470638235142138, "learning_rate": 1.9130434782608697e-05, "loss": 0.4501, "loss_nan_ranks": 0, "loss_rank_avg": 0.1938144564628601, "step": 210, "valid_targets_mean": 4453.6, "valid_targets_min": 1014 }, { "epoch": 0.3448275862068966, "grad_norm": 0.702129479232604, "learning_rate": 1.9588100686498858e-05, "loss": 0.4925, "loss_nan_ranks": 0, "loss_rank_avg": 0.21430332958698273, "step": 215, "valid_targets_mean": 3609.4, "valid_targets_min": 1152 }, { "epoch": 0.3528468323977546, "grad_norm": 0.6475901989881273, "learning_rate": 2.004576659038902e-05, "loss": 0.4987, "loss_nan_ranks": 0, "loss_rank_avg": 0.2964100241661072, "step": 220, "valid_targets_mean": 5638.2, "valid_targets_min": 1248 }, { "epoch": 0.3608660785886127, "grad_norm": 0.6638281189029952, "learning_rate": 2.050343249427918e-05, "loss": 0.4839, "loss_nan_ranks": 0, "loss_rank_avg": 0.20554473996162415, "step": 225, "valid_targets_mean": 3964.6, "valid_targets_min": 1751 }, { "epoch": 0.3688853247794707, "grad_norm": 0.6011178975893025, "learning_rate": 2.0961098398169337e-05, "loss": 0.4699, "loss_nan_ranks": 0, "loss_rank_avg": 0.21771050989627838, "step": 230, "valid_targets_mean": 5652.9, "valid_targets_min": 1419 }, { "epoch": 0.3769045709703288, "grad_norm": 0.6918051581990787, "learning_rate": 2.14187643020595e-05, "loss": 0.4965, "loss_nan_ranks": 0, "loss_rank_avg": 0.23044303059577942, "step": 235, "valid_targets_mean": 4066.4, "valid_targets_min": 989 }, { "epoch": 0.38492381716118684, "grad_norm": 0.6397795878243587, "learning_rate": 2.187643020594966e-05, "loss": 0.4772, "loss_nan_ranks": 0, "loss_rank_avg": 0.2183871567249298, "step": 240, "valid_targets_mean": 4418.2, "valid_targets_min": 1634 }, { "epoch": 0.39294306335204493, "grad_norm": 0.6314059989661045, "learning_rate": 2.2334096109839817e-05, "loss": 0.4586, "loss_nan_ranks": 0, "loss_rank_avg": 0.23583510518074036, "step": 245, "valid_targets_mean": 3972.2, "valid_targets_min": 1116 }, { "epoch": 0.40096230954290296, "grad_norm": 0.7521340694225619, "learning_rate": 2.279176201372998e-05, "loss": 0.4214, "loss_nan_ranks": 0, "loss_rank_avg": 0.18104761838912964, "step": 250, "valid_targets_mean": 2805.6, "valid_targets_min": 1609 }, { "epoch": 0.40898155573376105, "grad_norm": 0.6589043727793573, "learning_rate": 2.3249427917620138e-05, "loss": 0.4829, "loss_nan_ranks": 0, "loss_rank_avg": 0.1823362410068512, "step": 255, "valid_targets_mean": 2975.9, "valid_targets_min": 964 }, { "epoch": 0.4170008019246191, "grad_norm": 0.6273900082236032, "learning_rate": 2.37070938215103e-05, "loss": 0.4885, "loss_nan_ranks": 0, "loss_rank_avg": 0.22542431950569153, "step": 260, "valid_targets_mean": 3486.6, "valid_targets_min": 881 }, { "epoch": 0.42502004811547717, "grad_norm": 0.6081957372926003, "learning_rate": 2.4164759725400463e-05, "loss": 0.4647, "loss_nan_ranks": 0, "loss_rank_avg": 0.24096626043319702, "step": 265, "valid_targets_mean": 5235.9, "valid_targets_min": 1595 }, { "epoch": 0.4330392943063352, "grad_norm": 0.7845378461800494, "learning_rate": 2.462242562929062e-05, "loss": 0.5028, "loss_nan_ranks": 0, "loss_rank_avg": 0.23097199201583862, "step": 270, "valid_targets_mean": 3027.6, "valid_targets_min": 1364 }, { "epoch": 0.4410585404971933, "grad_norm": 0.7755771169814443, "learning_rate": 2.508009153318078e-05, "loss": 0.4452, "loss_nan_ranks": 0, "loss_rank_avg": 0.2752797305583954, "step": 275, "valid_targets_mean": 3456.0, "valid_targets_min": 1642 }, { "epoch": 0.4490777866880513, "grad_norm": 0.6442704506397136, "learning_rate": 2.5537757437070943e-05, "loss": 0.4668, "loss_nan_ranks": 0, "loss_rank_avg": 0.29733771085739136, "step": 280, "valid_targets_mean": 7013.9, "valid_targets_min": 1802 }, { "epoch": 0.4570970328789094, "grad_norm": 0.7352489212493196, "learning_rate": 2.59954233409611e-05, "loss": 0.4845, "loss_nan_ranks": 0, "loss_rank_avg": 0.28917449712753296, "step": 285, "valid_targets_mean": 4661.9, "valid_targets_min": 3003 }, { "epoch": 0.46511627906976744, "grad_norm": 0.7720755855494124, "learning_rate": 2.645308924485126e-05, "loss": 0.5035, "loss_nan_ranks": 0, "loss_rank_avg": 0.2599334716796875, "step": 290, "valid_targets_mean": 2824.4, "valid_targets_min": 1320 }, { "epoch": 0.4731355252606255, "grad_norm": 0.7363743109818579, "learning_rate": 2.6910755148741422e-05, "loss": 0.479, "loss_nan_ranks": 0, "loss_rank_avg": 0.31573259830474854, "step": 295, "valid_targets_mean": 4273.9, "valid_targets_min": 1738 }, { "epoch": 0.48115477145148355, "grad_norm": 0.744633521519781, "learning_rate": 2.7368421052631583e-05, "loss": 0.4797, "loss_nan_ranks": 0, "loss_rank_avg": 0.3156285881996155, "step": 300, "valid_targets_mean": 5315.2, "valid_targets_min": 360 }, { "epoch": 0.48917401764234164, "grad_norm": 0.7129949807940422, "learning_rate": 2.782608695652174e-05, "loss": 0.4419, "loss_nan_ranks": 0, "loss_rank_avg": 0.27106714248657227, "step": 305, "valid_targets_mean": 3763.2, "valid_targets_min": 1351 }, { "epoch": 0.4971932638331997, "grad_norm": 0.6175971826717892, "learning_rate": 2.8283752860411904e-05, "loss": 0.4453, "loss_nan_ranks": 0, "loss_rank_avg": 0.16650423407554626, "step": 310, "valid_targets_mean": 5072.0, "valid_targets_min": 1509 }, { "epoch": 0.5052125100240578, "grad_norm": 0.7040236348581613, "learning_rate": 2.8741418764302062e-05, "loss": 0.4844, "loss_nan_ranks": 0, "loss_rank_avg": 0.3040885329246521, "step": 315, "valid_targets_mean": 4063.0, "valid_targets_min": 1296 }, { "epoch": 0.5132317562149158, "grad_norm": 0.8830857148509627, "learning_rate": 2.9199084668192223e-05, "loss": 0.4629, "loss_nan_ranks": 0, "loss_rank_avg": 0.24983727931976318, "step": 320, "valid_targets_mean": 3427.4, "valid_targets_min": 1365 }, { "epoch": 0.5212510024057738, "grad_norm": 0.7984683477663427, "learning_rate": 2.9656750572082384e-05, "loss": 0.458, "loss_nan_ranks": 0, "loss_rank_avg": 0.2035318911075592, "step": 325, "valid_targets_mean": 2357.1, "valid_targets_min": 1003 }, { "epoch": 0.529270248596632, "grad_norm": 0.7839299118682744, "learning_rate": 3.0114416475972544e-05, "loss": 0.4703, "loss_nan_ranks": 0, "loss_rank_avg": 0.2685667872428894, "step": 330, "valid_targets_mean": 4827.5, "valid_targets_min": 1605 }, { "epoch": 0.53728949478749, "grad_norm": 0.6794195326992597, "learning_rate": 3.05720823798627e-05, "loss": 0.4873, "loss_nan_ranks": 0, "loss_rank_avg": 0.19377443194389343, "step": 335, "valid_targets_mean": 3683.9, "valid_targets_min": 1199 }, { "epoch": 0.545308740978348, "grad_norm": 0.5213966576318203, "learning_rate": 3.102974828375286e-05, "loss": 0.4295, "loss_nan_ranks": 0, "loss_rank_avg": 0.12621726095676422, "step": 340, "valid_targets_mean": 4432.0, "valid_targets_min": 1576 }, { "epoch": 0.5533279871692061, "grad_norm": 0.706356642791585, "learning_rate": 3.1487414187643024e-05, "loss": 0.4458, "loss_nan_ranks": 0, "loss_rank_avg": 0.21022140979766846, "step": 345, "valid_targets_mean": 5536.6, "valid_targets_min": 1518 }, { "epoch": 0.5613472333600642, "grad_norm": 0.6835233787156912, "learning_rate": 3.1945080091533184e-05, "loss": 0.4444, "loss_nan_ranks": 0, "loss_rank_avg": 0.2203514128923416, "step": 350, "valid_targets_mean": 4027.5, "valid_targets_min": 1358 }, { "epoch": 0.5693664795509222, "grad_norm": 0.6619068795239736, "learning_rate": 3.240274599542334e-05, "loss": 0.4171, "loss_nan_ranks": 0, "loss_rank_avg": 0.19794681668281555, "step": 355, "valid_targets_mean": 4365.2, "valid_targets_min": 2057 }, { "epoch": 0.5773857257417803, "grad_norm": 0.7758989332936811, "learning_rate": 3.2860411899313506e-05, "loss": 0.4951, "loss_nan_ranks": 0, "loss_rank_avg": 0.3366064429283142, "step": 360, "valid_targets_mean": 3579.4, "valid_targets_min": 1889 }, { "epoch": 0.5854049719326383, "grad_norm": 0.572316916164085, "learning_rate": 3.331807780320366e-05, "loss": 0.4308, "loss_nan_ranks": 0, "loss_rank_avg": 0.2127903699874878, "step": 365, "valid_targets_mean": 4391.5, "valid_targets_min": 1306 }, { "epoch": 0.5934242181234964, "grad_norm": 0.8060101627155969, "learning_rate": 3.377574370709382e-05, "loss": 0.4272, "loss_nan_ranks": 0, "loss_rank_avg": 0.2559089660644531, "step": 370, "valid_targets_mean": 4548.6, "valid_targets_min": 1743 }, { "epoch": 0.6014434643143545, "grad_norm": 0.7342884918292761, "learning_rate": 3.423340961098399e-05, "loss": 0.4531, "loss_nan_ranks": 0, "loss_rank_avg": 0.2449020892381668, "step": 375, "valid_targets_mean": 4173.0, "valid_targets_min": 851 }, { "epoch": 0.6094627105052125, "grad_norm": 0.6932121954679972, "learning_rate": 3.469107551487414e-05, "loss": 0.4438, "loss_nan_ranks": 0, "loss_rank_avg": 0.2163270115852356, "step": 380, "valid_targets_mean": 3886.9, "valid_targets_min": 1276 }, { "epoch": 0.6174819566960705, "grad_norm": 0.7715154208797361, "learning_rate": 3.5148741418764304e-05, "loss": 0.4325, "loss_nan_ranks": 0, "loss_rank_avg": 0.2262679934501648, "step": 385, "valid_targets_mean": 4779.1, "valid_targets_min": 2040 }, { "epoch": 0.6255012028869287, "grad_norm": 0.6983503647349161, "learning_rate": 3.5606407322654464e-05, "loss": 0.4289, "loss_nan_ranks": 0, "loss_rank_avg": 0.25364089012145996, "step": 390, "valid_targets_mean": 4373.1, "valid_targets_min": 1653 }, { "epoch": 0.6335204490777867, "grad_norm": 0.650166494248333, "learning_rate": 3.6064073226544625e-05, "loss": 0.4424, "loss_nan_ranks": 0, "loss_rank_avg": 0.1815357506275177, "step": 395, "valid_targets_mean": 3892.1, "valid_targets_min": 1493 }, { "epoch": 0.6415396952686447, "grad_norm": 0.6281878304316749, "learning_rate": 3.6521739130434786e-05, "loss": 0.4248, "loss_nan_ranks": 0, "loss_rank_avg": 0.2615407705307007, "step": 400, "valid_targets_mean": 5092.6, "valid_targets_min": 2034 }, { "epoch": 0.6495589414595028, "grad_norm": 0.6316023344367048, "learning_rate": 3.697940503432495e-05, "loss": 0.4216, "loss_nan_ranks": 0, "loss_rank_avg": 0.2884695529937744, "step": 405, "valid_targets_mean": 5941.5, "valid_targets_min": 1671 }, { "epoch": 0.6575781876503609, "grad_norm": 0.6656637581337326, "learning_rate": 3.743707093821511e-05, "loss": 0.4533, "loss_nan_ranks": 0, "loss_rank_avg": 0.2328605353832245, "step": 410, "valid_targets_mean": 4097.0, "valid_targets_min": 1930 }, { "epoch": 0.6655974338412189, "grad_norm": 0.6571360392327468, "learning_rate": 3.789473684210526e-05, "loss": 0.4429, "loss_nan_ranks": 0, "loss_rank_avg": 0.1997435986995697, "step": 415, "valid_targets_mean": 5019.8, "valid_targets_min": 1927 }, { "epoch": 0.673616680032077, "grad_norm": 0.6170027112876605, "learning_rate": 3.835240274599543e-05, "loss": 0.4043, "loss_nan_ranks": 0, "loss_rank_avg": 0.237014502286911, "step": 420, "valid_targets_mean": 5630.4, "valid_targets_min": 1932 }, { "epoch": 0.681635926222935, "grad_norm": 0.6551577656712124, "learning_rate": 3.8810068649885584e-05, "loss": 0.4169, "loss_nan_ranks": 0, "loss_rank_avg": 0.19945791363716125, "step": 425, "valid_targets_mean": 5277.8, "valid_targets_min": 1138 }, { "epoch": 0.6896551724137931, "grad_norm": 0.5852441140362239, "learning_rate": 3.9267734553775745e-05, "loss": 0.4136, "loss_nan_ranks": 0, "loss_rank_avg": 0.13955387473106384, "step": 430, "valid_targets_mean": 3020.5, "valid_targets_min": 2087 }, { "epoch": 0.6976744186046512, "grad_norm": 0.6021829173481317, "learning_rate": 3.9725400457665905e-05, "loss": 0.4141, "loss_nan_ranks": 0, "loss_rank_avg": 0.1376398205757141, "step": 435, "valid_targets_mean": 4271.9, "valid_targets_min": 1333 }, { "epoch": 0.7056936647955092, "grad_norm": 0.6479698160689082, "learning_rate": 3.999997445219712e-05, "loss": 0.4438, "loss_nan_ranks": 0, "loss_rank_avg": 0.22524264454841614, "step": 440, "valid_targets_mean": 5391.4, "valid_targets_min": 1757 }, { "epoch": 0.7137129109863672, "grad_norm": 0.7208389560786789, "learning_rate": 3.999968704016428e-05, "loss": 0.429, "loss_nan_ranks": 0, "loss_rank_avg": 0.15243616700172424, "step": 445, "valid_targets_mean": 2479.2, "valid_targets_min": 970 }, { "epoch": 0.7217321571772254, "grad_norm": 0.7748329379807736, "learning_rate": 3.9999080285949514e-05, "loss": 0.4357, "loss_nan_ranks": 0, "loss_rank_avg": 0.25249481201171875, "step": 450, "valid_targets_mean": 5528.8, "valid_targets_min": 1407 }, { "epoch": 0.7297514033680834, "grad_norm": 0.5195534551910792, "learning_rate": 3.999815419924108e-05, "loss": 0.4554, "loss_nan_ranks": 0, "loss_rank_avg": 0.26327452063560486, "step": 455, "valid_targets_mean": 6266.9, "valid_targets_min": 1342 }, { "epoch": 0.7377706495589414, "grad_norm": 0.5635412505100377, "learning_rate": 3.999690879482614e-05, "loss": 0.4385, "loss_nan_ranks": 0, "loss_rank_avg": 0.18464183807373047, "step": 460, "valid_targets_mean": 5252.4, "valid_targets_min": 1665 }, { "epoch": 0.7457898957497995, "grad_norm": 0.9951524748597607, "learning_rate": 3.9995344092590506e-05, "loss": 0.4318, "loss_nan_ranks": 0, "loss_rank_avg": 0.21847239136695862, "step": 465, "valid_targets_mean": 2516.6, "valid_targets_min": 1035 }, { "epoch": 0.7538091419406576, "grad_norm": 1.1079483899236926, "learning_rate": 3.999346011751835e-05, "loss": 0.4161, "loss_nan_ranks": 0, "loss_rank_avg": 0.2754901945590973, "step": 470, "valid_targets_mean": 4657.5, "valid_targets_min": 917 }, { "epoch": 0.7618283881315157, "grad_norm": 0.6457266593716856, "learning_rate": 3.999125689969176e-05, "loss": 0.4559, "loss_nan_ranks": 0, "loss_rank_avg": 0.15281400084495544, "step": 475, "valid_targets_mean": 2690.4, "valid_targets_min": 1158 }, { "epoch": 0.7698476343223737, "grad_norm": 0.7161175072619643, "learning_rate": 3.9988734474290324e-05, "loss": 0.4136, "loss_nan_ranks": 0, "loss_rank_avg": 0.16189947724342346, "step": 480, "valid_targets_mean": 3288.2, "valid_targets_min": 1547 }, { "epoch": 0.7778668805132317, "grad_norm": 0.8425818311311937, "learning_rate": 3.9985892881590513e-05, "loss": 0.4483, "loss_nan_ranks": 0, "loss_rank_avg": 0.25789886713027954, "step": 485, "valid_targets_mean": 5527.6, "valid_targets_min": 2131 }, { "epoch": 0.7858861267040899, "grad_norm": 0.6816766014086393, "learning_rate": 3.9982732166965054e-05, "loss": 0.4129, "loss_nan_ranks": 0, "loss_rank_avg": 0.2202441394329071, "step": 490, "valid_targets_mean": 4515.8, "valid_targets_min": 1461 }, { "epoch": 0.7939053728949479, "grad_norm": 0.6711499035511631, "learning_rate": 3.997925238088221e-05, "loss": 0.4046, "loss_nan_ranks": 0, "loss_rank_avg": 0.2616243362426758, "step": 495, "valid_targets_mean": 4674.5, "valid_targets_min": 1175 }, { "epoch": 0.8019246190858059, "grad_norm": 0.5792692946536627, "learning_rate": 3.9975453578904975e-05, "loss": 0.4182, "loss_nan_ranks": 0, "loss_rank_avg": 0.17172032594680786, "step": 500, "valid_targets_mean": 3829.4, "valid_targets_min": 1661 }, { "epoch": 0.809943865276664, "grad_norm": 0.6479080676210576, "learning_rate": 3.997133582169018e-05, "loss": 0.4088, "loss_nan_ranks": 0, "loss_rank_avg": 0.2771586775779724, "step": 505, "valid_targets_mean": 4916.1, "valid_targets_min": 2111 }, { "epoch": 0.8179631114675221, "grad_norm": 0.7284911471862828, "learning_rate": 3.996689917498754e-05, "loss": 0.423, "loss_nan_ranks": 0, "loss_rank_avg": 0.22784632444381714, "step": 510, "valid_targets_mean": 3270.2, "valid_targets_min": 1364 }, { "epoch": 0.8259823576583801, "grad_norm": 0.7537417338532415, "learning_rate": 3.9962143709638585e-05, "loss": 0.4254, "loss_nan_ranks": 0, "loss_rank_avg": 0.20665107667446136, "step": 515, "valid_targets_mean": 2749.4, "valid_targets_min": 1224 }, { "epoch": 0.8340016038492382, "grad_norm": 0.5735317711929651, "learning_rate": 3.995706950157554e-05, "loss": 0.4128, "loss_nan_ranks": 0, "loss_rank_avg": 0.2083359658718109, "step": 520, "valid_targets_mean": 4386.8, "valid_targets_min": 1563 }, { "epoch": 0.8420208500400962, "grad_norm": 0.5775968083813575, "learning_rate": 3.995167663182008e-05, "loss": 0.4133, "loss_nan_ranks": 0, "loss_rank_avg": 0.3303985595703125, "step": 525, "valid_targets_mean": 4967.6, "valid_targets_min": 1500 }, { "epoch": 0.8500400962309543, "grad_norm": 0.6953060852286664, "learning_rate": 3.994596518648214e-05, "loss": 0.4705, "loss_nan_ranks": 0, "loss_rank_avg": 0.2025911808013916, "step": 530, "valid_targets_mean": 4558.0, "valid_targets_min": 1886 }, { "epoch": 0.8580593424218124, "grad_norm": 0.6934565862515342, "learning_rate": 3.993993525675838e-05, "loss": 0.4309, "loss_nan_ranks": 0, "loss_rank_avg": 0.3160518705844879, "step": 535, "valid_targets_mean": 5058.6, "valid_targets_min": 1445 }, { "epoch": 0.8660785886126704, "grad_norm": 0.6799717965973326, "learning_rate": 3.993358693893086e-05, "loss": 0.4284, "loss_nan_ranks": 0, "loss_rank_avg": 0.24555282294750214, "step": 540, "valid_targets_mean": 4132.4, "valid_targets_min": 1349 }, { "epoch": 0.8740978348035284, "grad_norm": 0.6091069047749981, "learning_rate": 3.9926920334365457e-05, "loss": 0.4297, "loss_nan_ranks": 0, "loss_rank_avg": 0.09333278238773346, "step": 545, "valid_targets_mean": 2423.5, "valid_targets_min": 833 }, { "epoch": 0.8821170809943866, "grad_norm": 0.9935398003007877, "learning_rate": 3.991993554951023e-05, "loss": 0.4177, "loss_nan_ranks": 0, "loss_rank_avg": 0.20457065105438232, "step": 550, "valid_targets_mean": 2924.2, "valid_targets_min": 1456 }, { "epoch": 0.8901363271852446, "grad_norm": 0.6506939503312682, "learning_rate": 3.991263269589376e-05, "loss": 0.4013, "loss_nan_ranks": 0, "loss_rank_avg": 0.24844929575920105, "step": 555, "valid_targets_mean": 4460.2, "valid_targets_min": 1352 }, { "epoch": 0.8981555733761026, "grad_norm": 0.7904296869066102, "learning_rate": 3.990501189012332e-05, "loss": 0.409, "loss_nan_ranks": 0, "loss_rank_avg": 0.25031614303588867, "step": 560, "valid_targets_mean": 3274.9, "valid_targets_min": 1033 }, { "epoch": 0.9061748195669607, "grad_norm": 0.6243782360832607, "learning_rate": 3.989707325388305e-05, "loss": 0.4202, "loss_nan_ranks": 0, "loss_rank_avg": 0.20207425951957703, "step": 565, "valid_targets_mean": 4446.5, "valid_targets_min": 1798 }, { "epoch": 0.9141940657578188, "grad_norm": 0.6243052859782692, "learning_rate": 3.9888816913932016e-05, "loss": 0.4132, "loss_nan_ranks": 0, "loss_rank_avg": 0.20946535468101501, "step": 570, "valid_targets_mean": 4064.6, "valid_targets_min": 1004 }, { "epoch": 0.9222133119486768, "grad_norm": 0.8133657221603788, "learning_rate": 3.988024300210215e-05, "loss": 0.4147, "loss_nan_ranks": 0, "loss_rank_avg": 0.17629793286323547, "step": 575, "valid_targets_mean": 2829.0, "valid_targets_min": 1334 }, { "epoch": 0.9302325581395349, "grad_norm": 0.5933036701633775, "learning_rate": 3.987135165529618e-05, "loss": 0.3945, "loss_nan_ranks": 0, "loss_rank_avg": 0.14002780616283417, "step": 580, "valid_targets_mean": 3140.2, "valid_targets_min": 1598 }, { "epoch": 0.9382518043303929, "grad_norm": 0.6572313159662928, "learning_rate": 3.9862143015485446e-05, "loss": 0.41, "loss_nan_ranks": 0, "loss_rank_avg": 0.19144278764724731, "step": 585, "valid_targets_mean": 4209.8, "valid_targets_min": 951 }, { "epoch": 0.946271050521251, "grad_norm": 0.7182512157499061, "learning_rate": 3.985261722970759e-05, "loss": 0.4354, "loss_nan_ranks": 0, "loss_rank_avg": 0.2679348587989807, "step": 590, "valid_targets_mean": 3733.0, "valid_targets_min": 1711 }, { "epoch": 0.9542902967121091, "grad_norm": 0.6599170152735541, "learning_rate": 3.984277445006426e-05, "loss": 0.4245, "loss_nan_ranks": 0, "loss_rank_avg": 0.21976399421691895, "step": 595, "valid_targets_mean": 3530.1, "valid_targets_min": 1079 }, { "epoch": 0.9623095429029671, "grad_norm": 0.5769175180828044, "learning_rate": 3.9832614833718654e-05, "loss": 0.4254, "loss_nan_ranks": 0, "loss_rank_avg": 0.2880416512489319, "step": 600, "valid_targets_mean": 6344.4, "valid_targets_min": 937 }, { "epoch": 0.9703287890938251, "grad_norm": 0.6263189640875445, "learning_rate": 3.9822138542893005e-05, "loss": 0.4096, "loss_nan_ranks": 0, "loss_rank_avg": 0.1385025531053543, "step": 605, "valid_targets_mean": 3284.1, "valid_targets_min": 1832 }, { "epoch": 0.9783480352846833, "grad_norm": 0.7609485085875123, "learning_rate": 3.9811345744866014e-05, "loss": 0.4249, "loss_nan_ranks": 0, "loss_rank_avg": 0.180627703666687, "step": 610, "valid_targets_mean": 1876.9, "valid_targets_min": 855 }, { "epoch": 0.9863672814755413, "grad_norm": 0.6052202116295862, "learning_rate": 3.980023661197016e-05, "loss": 0.431, "loss_nan_ranks": 0, "loss_rank_avg": 0.28665053844451904, "step": 615, "valid_targets_mean": 5199.5, "valid_targets_min": 1140 }, { "epoch": 0.9943865276663993, "grad_norm": 0.7582336087430221, "learning_rate": 3.978881132158896e-05, "loss": 0.4093, "loss_nan_ranks": 0, "loss_rank_avg": 0.23537395894527435, "step": 620, "valid_targets_mean": 3701.1, "valid_targets_min": 1152 }, { "epoch": 1.0016038492381716, "grad_norm": 0.695598402136173, "learning_rate": 3.9777070056154124e-05, "loss": 0.3859, "loss_nan_ranks": 0, "loss_rank_avg": 0.17286968231201172, "step": 625, "valid_targets_mean": 2414.4, "valid_targets_min": 1434 }, { "epoch": 1.0096230954290297, "grad_norm": 0.615630823687904, "learning_rate": 3.976501300314264e-05, "loss": 0.3889, "loss_nan_ranks": 0, "loss_rank_avg": 0.1431884765625, "step": 630, "valid_targets_mean": 3064.6, "valid_targets_min": 1214 }, { "epoch": 1.0176423416198876, "grad_norm": 0.6850838344428346, "learning_rate": 3.9752640355073825e-05, "loss": 0.4045, "loss_nan_ranks": 0, "loss_rank_avg": 0.16621248424053192, "step": 635, "valid_targets_mean": 3180.9, "valid_targets_min": 1285 }, { "epoch": 1.0256615878107458, "grad_norm": 0.5619195455110378, "learning_rate": 3.9739952309506175e-05, "loss": 0.3786, "loss_nan_ranks": 0, "loss_rank_avg": 0.15314628183841705, "step": 640, "valid_targets_mean": 4104.9, "valid_targets_min": 1536 }, { "epoch": 1.033680834001604, "grad_norm": 0.6675969722042899, "learning_rate": 3.972694906903427e-05, "loss": 0.3833, "loss_nan_ranks": 0, "loss_rank_avg": 0.21451722085475922, "step": 645, "valid_targets_mean": 3510.8, "valid_targets_min": 945 }, { "epoch": 1.0417000801924619, "grad_norm": 0.6796820596998153, "learning_rate": 3.971363084128552e-05, "loss": 0.372, "loss_nan_ranks": 0, "loss_rank_avg": 0.1613035798072815, "step": 650, "valid_targets_mean": 2254.0, "valid_targets_min": 883 }, { "epoch": 1.04971932638332, "grad_norm": 0.5138699133063548, "learning_rate": 3.969999783891685e-05, "loss": 0.3736, "loss_nan_ranks": 0, "loss_rank_avg": 0.14441242814064026, "step": 655, "valid_targets_mean": 5016.5, "valid_targets_min": 1355 }, { "epoch": 1.057738572574178, "grad_norm": 0.549376268830875, "learning_rate": 3.96860502796113e-05, "loss": 0.4123, "loss_nan_ranks": 0, "loss_rank_avg": 0.2061927616596222, "step": 660, "valid_targets_mean": 6110.9, "valid_targets_min": 2075 }, { "epoch": 1.065757818765036, "grad_norm": 0.7311459967280249, "learning_rate": 3.967178838607456e-05, "loss": 0.3839, "loss_nan_ranks": 0, "loss_rank_avg": 0.2232741117477417, "step": 665, "valid_targets_mean": 3224.8, "valid_targets_min": 1420 }, { "epoch": 1.0737770649558942, "grad_norm": 0.5499017486701547, "learning_rate": 3.965721238603139e-05, "loss": 0.3894, "loss_nan_ranks": 0, "loss_rank_avg": 0.16423560678958893, "step": 670, "valid_targets_mean": 4179.4, "valid_targets_min": 1366 }, { "epoch": 1.0817963111467521, "grad_norm": 0.6875258421977899, "learning_rate": 3.964232251222203e-05, "loss": 0.4207, "loss_nan_ranks": 0, "loss_rank_avg": 0.15144357085227966, "step": 675, "valid_targets_mean": 2502.8, "valid_targets_min": 1463 }, { "epoch": 1.0898155573376103, "grad_norm": 0.6340623830629193, "learning_rate": 3.962711900239844e-05, "loss": 0.3697, "loss_nan_ranks": 0, "loss_rank_avg": 0.16017653048038483, "step": 680, "valid_targets_mean": 2854.1, "valid_targets_min": 1136 }, { "epoch": 1.0978348035284684, "grad_norm": 0.6347481474391807, "learning_rate": 3.961160209932051e-05, "loss": 0.3914, "loss_nan_ranks": 0, "loss_rank_avg": 0.21811774373054504, "step": 685, "valid_targets_mean": 4877.0, "valid_targets_min": 1327 }, { "epoch": 1.1058540497193263, "grad_norm": 0.7578764836248371, "learning_rate": 3.95957720507522e-05, "loss": 0.3648, "loss_nan_ranks": 0, "loss_rank_avg": 0.19442862272262573, "step": 690, "valid_targets_mean": 4939.2, "valid_targets_min": 1418 }, { "epoch": 1.1138732959101845, "grad_norm": 0.7135318700261571, "learning_rate": 3.957962910945759e-05, "loss": 0.3791, "loss_nan_ranks": 0, "loss_rank_avg": 0.14678996801376343, "step": 695, "valid_targets_mean": 3328.9, "valid_targets_min": 1303 }, { "epoch": 1.1218925421010426, "grad_norm": 0.7595496965888743, "learning_rate": 3.9563173533196805e-05, "loss": 0.4045, "loss_nan_ranks": 0, "loss_rank_avg": 0.17554423213005066, "step": 700, "valid_targets_mean": 2093.6, "valid_targets_min": 1237 }, { "epoch": 1.1299117882919005, "grad_norm": 0.6255982334737784, "learning_rate": 3.954640558472195e-05, "loss": 0.3806, "loss_nan_ranks": 0, "loss_rank_avg": 0.230742409825325, "step": 705, "valid_targets_mean": 5426.8, "valid_targets_min": 1559 }, { "epoch": 1.1379310344827587, "grad_norm": 0.7293239045809642, "learning_rate": 3.952932553177287e-05, "loss": 0.3585, "loss_nan_ranks": 0, "loss_rank_avg": 0.20457494258880615, "step": 710, "valid_targets_mean": 4382.8, "valid_targets_min": 1631 }, { "epoch": 1.1459502806736166, "grad_norm": 0.6938425440543589, "learning_rate": 3.95119336470729e-05, "loss": 0.3949, "loss_nan_ranks": 0, "loss_rank_avg": 0.23677586019039154, "step": 715, "valid_targets_mean": 5619.5, "valid_targets_min": 2168 }, { "epoch": 1.1539695268644747, "grad_norm": 0.6576001630605337, "learning_rate": 3.949423020832451e-05, "loss": 0.3806, "loss_nan_ranks": 0, "loss_rank_avg": 0.24037396907806396, "step": 720, "valid_targets_mean": 4540.8, "valid_targets_min": 851 }, { "epoch": 1.1619887730553329, "grad_norm": 0.4483035830808508, "learning_rate": 3.947621549820485e-05, "loss": 0.3639, "loss_nan_ranks": 0, "loss_rank_avg": 0.12731903791427612, "step": 725, "valid_targets_mean": 4211.2, "valid_targets_min": 1614 }, { "epoch": 1.1700080192461908, "grad_norm": 0.804348533347129, "learning_rate": 3.945788980436129e-05, "loss": 0.3855, "loss_nan_ranks": 0, "loss_rank_avg": 0.18650484085083008, "step": 730, "valid_targets_mean": 2705.8, "valid_targets_min": 1271 }, { "epoch": 1.178027265437049, "grad_norm": 0.6041634251187872, "learning_rate": 3.943925341940673e-05, "loss": 0.4054, "loss_nan_ranks": 0, "loss_rank_avg": 0.19750933349132538, "step": 735, "valid_targets_mean": 3846.0, "valid_targets_min": 1926 }, { "epoch": 1.1860465116279069, "grad_norm": 0.58747886152978, "learning_rate": 3.942030664091503e-05, "loss": 0.3805, "loss_nan_ranks": 0, "loss_rank_avg": 0.17710307240486145, "step": 740, "valid_targets_mean": 2780.9, "valid_targets_min": 1708 }, { "epoch": 1.194065757818765, "grad_norm": 0.6404869784227899, "learning_rate": 3.9401049771416214e-05, "loss": 0.3925, "loss_nan_ranks": 0, "loss_rank_avg": 0.16430872678756714, "step": 745, "valid_targets_mean": 2718.2, "valid_targets_min": 1046 }, { "epoch": 1.2020850040096231, "grad_norm": 0.5710025270152095, "learning_rate": 3.938148311839162e-05, "loss": 0.4026, "loss_nan_ranks": 0, "loss_rank_avg": 0.18448391556739807, "step": 750, "valid_targets_mean": 5132.5, "valid_targets_min": 2265 }, { "epoch": 1.210104250200481, "grad_norm": 0.6497135461400895, "learning_rate": 3.9361606994269014e-05, "loss": 0.3676, "loss_nan_ranks": 0, "loss_rank_avg": 0.26077187061309814, "step": 755, "valid_targets_mean": 4660.1, "valid_targets_min": 1580 }, { "epoch": 1.2181234963913392, "grad_norm": 0.607110503560847, "learning_rate": 3.934142171641763e-05, "loss": 0.3793, "loss_nan_ranks": 0, "loss_rank_avg": 0.15704308450222015, "step": 760, "valid_targets_mean": 4377.2, "valid_targets_min": 1097 }, { "epoch": 1.2261427425821974, "grad_norm": 0.6094554796598396, "learning_rate": 3.9320927607143003e-05, "loss": 0.4103, "loss_nan_ranks": 0, "loss_rank_avg": 0.12785972654819489, "step": 765, "valid_targets_mean": 2213.1, "valid_targets_min": 1267 }, { "epoch": 1.2341619887730553, "grad_norm": 0.6363340342249799, "learning_rate": 3.9300124993681976e-05, "loss": 0.3598, "loss_nan_ranks": 0, "loss_rank_avg": 0.1621864140033722, "step": 770, "valid_targets_mean": 3536.1, "valid_targets_min": 1263 }, { "epoch": 1.2421812349639134, "grad_norm": 0.6622582879084168, "learning_rate": 3.9279014208197317e-05, "loss": 0.3757, "loss_nan_ranks": 0, "loss_rank_avg": 0.1941109001636505, "step": 775, "valid_targets_mean": 3288.6, "valid_targets_min": 1263 }, { "epoch": 1.2502004811547716, "grad_norm": 0.638376853403367, "learning_rate": 3.925759558777252e-05, "loss": 0.3892, "loss_nan_ranks": 0, "loss_rank_avg": 0.23520147800445557, "step": 780, "valid_targets_mean": 4333.1, "valid_targets_min": 1946 }, { "epoch": 1.2582197273456295, "grad_norm": 0.7287126082613413, "learning_rate": 3.923586947440639e-05, "loss": 0.3976, "loss_nan_ranks": 0, "loss_rank_avg": 0.1913953721523285, "step": 785, "valid_targets_mean": 2964.0, "valid_targets_min": 1587 }, { "epoch": 1.2662389735364876, "grad_norm": 0.5821074784665079, "learning_rate": 3.921383621500758e-05, "loss": 0.3936, "loss_nan_ranks": 0, "loss_rank_avg": 0.2320612668991089, "step": 790, "valid_targets_mean": 5262.9, "valid_targets_min": 2208 }, { "epoch": 1.2742582197273458, "grad_norm": 0.5959266410039498, "learning_rate": 3.919149616138906e-05, "loss": 0.4131, "loss_nan_ranks": 0, "loss_rank_avg": 0.18204858899116516, "step": 795, "valid_targets_mean": 4003.8, "valid_targets_min": 1494 }, { "epoch": 1.2822774659182037, "grad_norm": 0.538833079574803, "learning_rate": 3.916884967026246e-05, "loss": 0.3819, "loss_nan_ranks": 0, "loss_rank_avg": 0.15234261751174927, "step": 800, "valid_targets_mean": 3804.1, "valid_targets_min": 1563 }, { "epoch": 1.2902967121090618, "grad_norm": 0.8247769067262545, "learning_rate": 3.914589710323245e-05, "loss": 0.3624, "loss_nan_ranks": 0, "loss_rank_avg": 0.13381686806678772, "step": 805, "valid_targets_mean": 3968.5, "valid_targets_min": 1180 }, { "epoch": 1.2983159582999197, "grad_norm": 0.773159132160585, "learning_rate": 3.912263882679091e-05, "loss": 0.3884, "loss_nan_ranks": 0, "loss_rank_avg": 0.16676564514636993, "step": 810, "valid_targets_mean": 2239.8, "valid_targets_min": 1398 }, { "epoch": 1.306335204490778, "grad_norm": 0.6435973604228074, "learning_rate": 3.9099075212311076e-05, "loss": 0.4118, "loss_nan_ranks": 0, "loss_rank_avg": 0.22716866433620453, "step": 815, "valid_targets_mean": 3918.2, "valid_targets_min": 1291 }, { "epoch": 1.3143544506816358, "grad_norm": 0.5259675841357822, "learning_rate": 3.9075206636041646e-05, "loss": 0.3927, "loss_nan_ranks": 0, "loss_rank_avg": 0.24232850968837738, "step": 820, "valid_targets_mean": 7605.0, "valid_targets_min": 1967 }, { "epoch": 1.322373696872494, "grad_norm": 0.7325220804411511, "learning_rate": 3.905103347910075e-05, "loss": 0.396, "loss_nan_ranks": 0, "loss_rank_avg": 0.22928906977176666, "step": 825, "valid_targets_mean": 2980.9, "valid_targets_min": 1683 }, { "epoch": 1.330392943063352, "grad_norm": 0.5647785923965424, "learning_rate": 3.902655612746985e-05, "loss": 0.3951, "loss_nan_ranks": 0, "loss_rank_avg": 0.14142805337905884, "step": 830, "valid_targets_mean": 4535.4, "valid_targets_min": 1344 }, { "epoch": 1.33841218925421, "grad_norm": 0.6198274246253738, "learning_rate": 3.900177497198761e-05, "loss": 0.4102, "loss_nan_ranks": 0, "loss_rank_avg": 0.15712687373161316, "step": 835, "valid_targets_mean": 3244.4, "valid_targets_min": 1910 }, { "epoch": 1.3464314354450682, "grad_norm": 0.7479328322426334, "learning_rate": 3.8976690408343635e-05, "loss": 0.378, "loss_nan_ranks": 0, "loss_rank_avg": 0.1526011973619461, "step": 840, "valid_targets_mean": 1959.6, "valid_targets_min": 1236 }, { "epoch": 1.3544506816359263, "grad_norm": 0.5705913022888958, "learning_rate": 3.8951302837072165e-05, "loss": 0.3819, "loss_nan_ranks": 0, "loss_rank_avg": 0.21281887590885162, "step": 845, "valid_targets_mean": 5731.0, "valid_targets_min": 1996 }, { "epoch": 1.3624699278267842, "grad_norm": 0.6305200044274495, "learning_rate": 3.892561266354566e-05, "loss": 0.3924, "loss_nan_ranks": 0, "loss_rank_avg": 0.1274857521057129, "step": 850, "valid_targets_mean": 2638.5, "valid_targets_min": 1475 }, { "epoch": 1.3704891740176424, "grad_norm": 0.6540817528238299, "learning_rate": 3.889962029796833e-05, "loss": 0.3994, "loss_nan_ranks": 0, "loss_rank_avg": 0.22636473178863525, "step": 855, "valid_targets_mean": 4248.0, "valid_targets_min": 1631 }, { "epoch": 1.3785084202085005, "grad_norm": 0.6384044783744945, "learning_rate": 3.887332615536962e-05, "loss": 0.3577, "loss_nan_ranks": 0, "loss_rank_avg": 0.19277402758598328, "step": 860, "valid_targets_mean": 3839.9, "valid_targets_min": 1393 }, { "epoch": 1.3865276663993584, "grad_norm": 0.5403507036239689, "learning_rate": 3.8846730655597535e-05, "loss": 0.3861, "loss_nan_ranks": 0, "loss_rank_avg": 0.2178334891796112, "step": 865, "valid_targets_mean": 6470.2, "valid_targets_min": 1213 }, { "epoch": 1.3945469125902166, "grad_norm": 0.5879412330667896, "learning_rate": 3.881983422331198e-05, "loss": 0.3655, "loss_nan_ranks": 0, "loss_rank_avg": 0.1219518780708313, "step": 870, "valid_targets_mean": 2703.0, "valid_targets_min": 1619 }, { "epoch": 1.4025661587810747, "grad_norm": 0.5119560422076794, "learning_rate": 3.879263728797792e-05, "loss": 0.4172, "loss_nan_ranks": 0, "loss_rank_avg": 0.2390919178724289, "step": 875, "valid_targets_mean": 7733.4, "valid_targets_min": 1100 }, { "epoch": 1.4105854049719326, "grad_norm": 0.5841873090375073, "learning_rate": 3.876514028385861e-05, "loss": 0.3823, "loss_nan_ranks": 0, "loss_rank_avg": 0.25305986404418945, "step": 880, "valid_targets_mean": 6032.5, "valid_targets_min": 1255 }, { "epoch": 1.4186046511627908, "grad_norm": 0.6537532789732419, "learning_rate": 3.873734365000857e-05, "loss": 0.3585, "loss_nan_ranks": 0, "loss_rank_avg": 0.17425492405891418, "step": 885, "valid_targets_mean": 3659.5, "valid_targets_min": 814 }, { "epoch": 1.4266238973536487, "grad_norm": 0.6485041173010123, "learning_rate": 3.870924783026663e-05, "loss": 0.3935, "loss_nan_ranks": 0, "loss_rank_avg": 0.2005024552345276, "step": 890, "valid_targets_mean": 3811.0, "valid_targets_min": 951 }, { "epoch": 1.4346431435445068, "grad_norm": 0.7275313045075661, "learning_rate": 3.8680853273248826e-05, "loss": 0.3998, "loss_nan_ranks": 0, "loss_rank_avg": 0.19834119081497192, "step": 895, "valid_targets_mean": 2894.2, "valid_targets_min": 1179 }, { "epoch": 1.4426623897353648, "grad_norm": 0.6458382459028278, "learning_rate": 3.865216043234126e-05, "loss": 0.3622, "loss_nan_ranks": 0, "loss_rank_avg": 0.23739655315876007, "step": 900, "valid_targets_mean": 3600.1, "valid_targets_min": 1565 }, { "epoch": 1.450681635926223, "grad_norm": 0.667902826457069, "learning_rate": 3.862316976569281e-05, "loss": 0.3911, "loss_nan_ranks": 0, "loss_rank_avg": 0.18984192609786987, "step": 905, "valid_targets_mean": 3311.0, "valid_targets_min": 1529 }, { "epoch": 1.458700882117081, "grad_norm": 0.5301348528975791, "learning_rate": 3.859388173620785e-05, "loss": 0.3768, "loss_nan_ranks": 0, "loss_rank_avg": 0.20433899760246277, "step": 910, "valid_targets_mean": 5428.2, "valid_targets_min": 1908 }, { "epoch": 1.466720128307939, "grad_norm": 0.5548703258066876, "learning_rate": 3.8564296811538874e-05, "loss": 0.418, "loss_nan_ranks": 0, "loss_rank_avg": 0.21961280703544617, "step": 915, "valid_targets_mean": 5185.6, "valid_targets_min": 1395 }, { "epoch": 1.474739374498797, "grad_norm": 0.597151997949445, "learning_rate": 3.853441546407898e-05, "loss": 0.3939, "loss_nan_ranks": 0, "loss_rank_avg": 0.22741135954856873, "step": 920, "valid_targets_mean": 4965.1, "valid_targets_min": 1490 }, { "epoch": 1.4827586206896552, "grad_norm": 0.5010688320540237, "learning_rate": 3.850423817095438e-05, "loss": 0.3276, "loss_nan_ranks": 0, "loss_rank_avg": 0.13275910913944244, "step": 925, "valid_targets_mean": 4258.0, "valid_targets_min": 1493 }, { "epoch": 1.4907778668805132, "grad_norm": 0.8174306620777976, "learning_rate": 3.847376541401674e-05, "loss": 0.3943, "loss_nan_ranks": 0, "loss_rank_avg": 0.20243340730667114, "step": 930, "valid_targets_mean": 3649.5, "valid_targets_min": 1774 }, { "epoch": 1.4987971130713713, "grad_norm": 0.7021462499744725, "learning_rate": 3.844299767983551e-05, "loss": 0.3937, "loss_nan_ranks": 0, "loss_rank_avg": 0.1653379201889038, "step": 935, "valid_targets_mean": 3139.4, "valid_targets_min": 1300 }, { "epoch": 1.5068163592622295, "grad_norm": 0.551702554538306, "learning_rate": 3.841193545969015e-05, "loss": 0.36, "loss_nan_ranks": 0, "loss_rank_avg": 0.16654658317565918, "step": 940, "valid_targets_mean": 4287.2, "valid_targets_min": 1712 }, { "epoch": 1.5148356054530874, "grad_norm": 0.6123396594792097, "learning_rate": 3.8380579249562265e-05, "loss": 0.3755, "loss_nan_ranks": 0, "loss_rank_avg": 0.11518816649913788, "step": 945, "valid_targets_mean": 2894.8, "valid_targets_min": 1059 }, { "epoch": 1.5228548516439455, "grad_norm": 0.6187761971179958, "learning_rate": 3.8348929550127734e-05, "loss": 0.3799, "loss_nan_ranks": 0, "loss_rank_avg": 0.15089167654514313, "step": 950, "valid_targets_mean": 3219.1, "valid_targets_min": 1324 }, { "epoch": 1.5308740978348037, "grad_norm": 0.6758921374968958, "learning_rate": 3.831698686674866e-05, "loss": 0.366, "loss_nan_ranks": 0, "loss_rank_avg": 0.19325017929077148, "step": 955, "valid_targets_mean": 3923.2, "valid_targets_min": 1380 }, { "epoch": 1.5388933440256616, "grad_norm": 0.553373368309608, "learning_rate": 3.828475170946534e-05, "loss": 0.3656, "loss_nan_ranks": 0, "loss_rank_avg": 0.17428003251552582, "step": 960, "valid_targets_mean": 4634.9, "valid_targets_min": 1615 }, { "epoch": 1.5469125902165195, "grad_norm": 0.6395790172827835, "learning_rate": 3.8252224592988087e-05, "loss": 0.3894, "loss_nan_ranks": 0, "loss_rank_avg": 0.18858684599399567, "step": 965, "valid_targets_mean": 4211.4, "valid_targets_min": 2032 }, { "epoch": 1.5549318364073779, "grad_norm": 0.6854114367908858, "learning_rate": 3.821940603668906e-05, "loss": 0.3721, "loss_nan_ranks": 0, "loss_rank_avg": 0.15687119960784912, "step": 970, "valid_targets_mean": 3116.8, "valid_targets_min": 1047 }, { "epoch": 1.5629510825982358, "grad_norm": 0.7202300491845391, "learning_rate": 3.8186296564593924e-05, "loss": 0.3819, "loss_nan_ranks": 0, "loss_rank_avg": 0.20200546085834503, "step": 975, "valid_targets_mean": 3873.4, "valid_targets_min": 1518 }, { "epoch": 1.5709703287890937, "grad_norm": 0.6492604424261679, "learning_rate": 3.815289670537351e-05, "loss": 0.3986, "loss_nan_ranks": 0, "loss_rank_avg": 0.09067234396934509, "step": 980, "valid_targets_mean": 2164.9, "valid_targets_min": 1549 }, { "epoch": 1.5789895749799518, "grad_norm": 0.5755956725155771, "learning_rate": 3.811920699233535e-05, "loss": 0.3782, "loss_nan_ranks": 0, "loss_rank_avg": 0.24794843792915344, "step": 985, "valid_targets_mean": 5809.8, "valid_targets_min": 1139 }, { "epoch": 1.58700882117081, "grad_norm": 0.6035656260523917, "learning_rate": 3.8085227963415186e-05, "loss": 0.3526, "loss_nan_ranks": 0, "loss_rank_avg": 0.23764899373054504, "step": 990, "valid_targets_mean": 4744.6, "valid_targets_min": 1419 }, { "epoch": 1.595028067361668, "grad_norm": 0.6279806954292144, "learning_rate": 3.805096016116838e-05, "loss": 0.4146, "loss_nan_ranks": 0, "loss_rank_avg": 0.1629919707775116, "step": 995, "valid_targets_mean": 2693.1, "valid_targets_min": 1798 }, { "epoch": 1.603047313552526, "grad_norm": 0.7382597775124584, "learning_rate": 3.801640413276121e-05, "loss": 0.4079, "loss_nan_ranks": 0, "loss_rank_avg": 0.2260105013847351, "step": 1000, "valid_targets_mean": 2633.6, "valid_targets_min": 1706 }, { "epoch": 1.6110665597433842, "grad_norm": 0.573979477466008, "learning_rate": 3.7981560429962204e-05, "loss": 0.3784, "loss_nan_ranks": 0, "loss_rank_avg": 0.18031983077526093, "step": 1005, "valid_targets_mean": 4727.4, "valid_targets_min": 1945 }, { "epoch": 1.6190858059342421, "grad_norm": 0.5255671835014767, "learning_rate": 3.7946429609133274e-05, "loss": 0.3751, "loss_nan_ranks": 0, "loss_rank_avg": 0.1784265786409378, "step": 1010, "valid_targets_mean": 4758.0, "valid_targets_min": 1600 }, { "epoch": 1.6271050521251003, "grad_norm": 0.6913493291750783, "learning_rate": 3.791101223122084e-05, "loss": 0.3687, "loss_nan_ranks": 0, "loss_rank_avg": 0.18905776739120483, "step": 1015, "valid_targets_mean": 3459.2, "valid_targets_min": 1501 }, { "epoch": 1.6351242983159584, "grad_norm": 0.5676146782725685, "learning_rate": 3.787530886174688e-05, "loss": 0.3933, "loss_nan_ranks": 0, "loss_rank_avg": 0.14749515056610107, "step": 1020, "valid_targets_mean": 3031.5, "valid_targets_min": 1067 }, { "epoch": 1.6431435445068163, "grad_norm": 0.5975286122354355, "learning_rate": 3.783932007079992e-05, "loss": 0.3832, "loss_nan_ranks": 0, "loss_rank_avg": 0.1427052915096283, "step": 1025, "valid_targets_mean": 2939.0, "valid_targets_min": 1255 }, { "epoch": 1.6511627906976745, "grad_norm": 0.6486448049857164, "learning_rate": 3.7803046433025905e-05, "loss": 0.3681, "loss_nan_ranks": 0, "loss_rank_avg": 0.1567174643278122, "step": 1030, "valid_targets_mean": 2957.6, "valid_targets_min": 1203 }, { "epoch": 1.6591820368885326, "grad_norm": 0.649120297289315, "learning_rate": 3.7766488527619024e-05, "loss": 0.384, "loss_nan_ranks": 0, "loss_rank_avg": 0.19277894496917725, "step": 1035, "valid_targets_mean": 4205.9, "valid_targets_min": 1722 }, { "epoch": 1.6672012830793905, "grad_norm": 0.504041788849741, "learning_rate": 3.772964693831247e-05, "loss": 0.392, "loss_nan_ranks": 0, "loss_rank_avg": 0.20917224884033203, "step": 1040, "valid_targets_mean": 6204.8, "valid_targets_min": 925 }, { "epoch": 1.6752205292702484, "grad_norm": 0.5006556041596575, "learning_rate": 3.7692522253369136e-05, "loss": 0.4094, "loss_nan_ranks": 0, "loss_rank_avg": 0.1799381971359253, "step": 1045, "valid_targets_mean": 5656.5, "valid_targets_min": 1801 }, { "epoch": 1.6832397754611068, "grad_norm": 0.5355916567478674, "learning_rate": 3.7655115065572194e-05, "loss": 0.3731, "loss_nan_ranks": 0, "loss_rank_avg": 0.1617688238620758, "step": 1050, "valid_targets_mean": 5315.2, "valid_targets_min": 1195 }, { "epoch": 1.6912590216519647, "grad_norm": 0.6605006405457838, "learning_rate": 3.7617425972215626e-05, "loss": 0.3847, "loss_nan_ranks": 0, "loss_rank_avg": 0.15565674006938934, "step": 1055, "valid_targets_mean": 3047.6, "valid_targets_min": 991 }, { "epoch": 1.6992782678428227, "grad_norm": 0.5867059394810048, "learning_rate": 3.757945557509472e-05, "loss": 0.3661, "loss_nan_ranks": 0, "loss_rank_avg": 0.2331041693687439, "step": 1060, "valid_targets_mean": 5444.6, "valid_targets_min": 1102 }, { "epoch": 1.7072975140336808, "grad_norm": 0.5720752116389921, "learning_rate": 3.7541204480496444e-05, "loss": 0.3727, "loss_nan_ranks": 0, "loss_rank_avg": 0.1441497951745987, "step": 1065, "valid_targets_mean": 3124.1, "valid_targets_min": 501 }, { "epoch": 1.715316760224539, "grad_norm": 0.7595156059225239, "learning_rate": 3.7502673299189745e-05, "loss": 0.3827, "loss_nan_ranks": 0, "loss_rank_avg": 0.16775290668010712, "step": 1070, "valid_targets_mean": 2317.6, "valid_targets_min": 1106 }, { "epoch": 1.7233360064153969, "grad_norm": 0.5755424388708024, "learning_rate": 3.746386264641583e-05, "loss": 0.3813, "loss_nan_ranks": 0, "loss_rank_avg": 0.16708099842071533, "step": 1075, "valid_targets_mean": 3082.5, "valid_targets_min": 1554 }, { "epoch": 1.731355252606255, "grad_norm": 0.631158884641858, "learning_rate": 3.7424773141878324e-05, "loss": 0.3713, "loss_nan_ranks": 0, "loss_rank_avg": 0.15561020374298096, "step": 1080, "valid_targets_mean": 3028.0, "valid_targets_min": 1479 }, { "epoch": 1.7393744987971131, "grad_norm": 0.5965028551998798, "learning_rate": 3.738540540973338e-05, "loss": 0.3703, "loss_nan_ranks": 0, "loss_rank_avg": 0.25275903940200806, "step": 1085, "valid_targets_mean": 5063.2, "valid_targets_min": 1365 }, { "epoch": 1.747393744987971, "grad_norm": 0.5659192371242109, "learning_rate": 3.7345760078579695e-05, "loss": 0.3647, "loss_nan_ranks": 0, "loss_rank_avg": 0.16954252123832703, "step": 1090, "valid_targets_mean": 3610.2, "valid_targets_min": 1634 }, { "epoch": 1.7554129911788292, "grad_norm": 0.5069380849543149, "learning_rate": 3.730583778144852e-05, "loss": 0.3525, "loss_nan_ranks": 0, "loss_rank_avg": 0.1400984525680542, "step": 1095, "valid_targets_mean": 3182.9, "valid_targets_min": 1170 }, { "epoch": 1.7634322373696873, "grad_norm": 0.605006474711256, "learning_rate": 3.7265639155793494e-05, "loss": 0.4027, "loss_nan_ranks": 0, "loss_rank_avg": 0.18291226029396057, "step": 1100, "valid_targets_mean": 3794.0, "valid_targets_min": 1094 }, { "epoch": 1.7714514835605453, "grad_norm": 0.574090621545591, "learning_rate": 3.7225164843480503e-05, "loss": 0.3613, "loss_nan_ranks": 0, "loss_rank_avg": 0.15381957590579987, "step": 1105, "valid_targets_mean": 3089.6, "valid_targets_min": 907 }, { "epoch": 1.7794707297514034, "grad_norm": 0.6430771990270066, "learning_rate": 3.7184415490777426e-05, "loss": 0.387, "loss_nan_ranks": 0, "loss_rank_avg": 0.21809989213943481, "step": 1110, "valid_targets_mean": 4406.8, "valid_targets_min": 1385 }, { "epoch": 1.7874899759422616, "grad_norm": 0.6411894477736148, "learning_rate": 3.714339174834379e-05, "loss": 0.3764, "loss_nan_ranks": 0, "loss_rank_avg": 0.19796337187290192, "step": 1115, "valid_targets_mean": 4073.0, "valid_targets_min": 1535 }, { "epoch": 1.7955092221331195, "grad_norm": 0.6562575782675708, "learning_rate": 3.710209427122044e-05, "loss": 0.3726, "loss_nan_ranks": 0, "loss_rank_avg": 0.16205215454101562, "step": 1120, "valid_targets_mean": 2719.2, "valid_targets_min": 1448 }, { "epoch": 1.8035284683239774, "grad_norm": 0.6609794155101337, "learning_rate": 3.7060523718819e-05, "loss": 0.3969, "loss_nan_ranks": 0, "loss_rank_avg": 0.31307533383369446, "step": 1125, "valid_targets_mean": 5189.6, "valid_targets_min": 1513 }, { "epoch": 1.8115477145148358, "grad_norm": 0.8729671860828194, "learning_rate": 3.701868075491139e-05, "loss": 0.3853, "loss_nan_ranks": 0, "loss_rank_avg": 0.20690149068832397, "step": 1130, "valid_targets_mean": 3036.1, "valid_targets_min": 1501 }, { "epoch": 1.8195669607056937, "grad_norm": 0.5347078058683018, "learning_rate": 3.697656604761926e-05, "loss": 0.3565, "loss_nan_ranks": 0, "loss_rank_avg": 0.12335579097270966, "step": 1135, "valid_targets_mean": 2996.4, "valid_targets_min": 977 }, { "epoch": 1.8275862068965516, "grad_norm": 2.15564282147594, "learning_rate": 3.693418026940325e-05, "loss": 0.377, "loss_nan_ranks": 0, "loss_rank_avg": 0.19620174169540405, "step": 1140, "valid_targets_mean": 3806.0, "valid_targets_min": 915 }, { "epoch": 1.8356054530874097, "grad_norm": 0.8361541825039279, "learning_rate": 3.689152409705229e-05, "loss": 0.3795, "loss_nan_ranks": 0, "loss_rank_avg": 0.20147132873535156, "step": 1145, "valid_targets_mean": 2509.1, "valid_targets_min": 1137 }, { "epoch": 1.8436246992782679, "grad_norm": 0.5485386517037776, "learning_rate": 3.6848598211672794e-05, "loss": 0.3381, "loss_nan_ranks": 0, "loss_rank_avg": 0.14361560344696045, "step": 1150, "valid_targets_mean": 3387.9, "valid_targets_min": 1678 }, { "epoch": 1.8516439454691258, "grad_norm": 0.523212489254307, "learning_rate": 3.6805403298677797e-05, "loss": 0.3892, "loss_nan_ranks": 0, "loss_rank_avg": 0.1377015858888626, "step": 1155, "valid_targets_mean": 4157.6, "valid_targets_min": 1320 }, { "epoch": 1.859663191659984, "grad_norm": 0.5805720706667392, "learning_rate": 3.6761940047775966e-05, "loss": 0.3698, "loss_nan_ranks": 0, "loss_rank_avg": 0.18016770482063293, "step": 1160, "valid_targets_mean": 5156.2, "valid_targets_min": 1920 }, { "epoch": 1.867682437850842, "grad_norm": 0.7073699077015825, "learning_rate": 3.671820915296063e-05, "loss": 0.3782, "loss_nan_ranks": 0, "loss_rank_avg": 0.12544605135917664, "step": 1165, "valid_targets_mean": 2071.5, "valid_targets_min": 1669 }, { "epoch": 1.8757016840417, "grad_norm": 0.5785725133606808, "learning_rate": 3.667421131249869e-05, "loss": 0.3971, "loss_nan_ranks": 0, "loss_rank_avg": 0.143942728638649, "step": 1170, "valid_targets_mean": 4040.6, "valid_targets_min": 1152 }, { "epoch": 1.8837209302325582, "grad_norm": 0.7097749219675242, "learning_rate": 3.662994722891946e-05, "loss": 0.384, "loss_nan_ranks": 0, "loss_rank_avg": 0.1935431808233261, "step": 1175, "valid_targets_mean": 2891.0, "valid_targets_min": 1207 }, { "epoch": 1.8917401764234163, "grad_norm": 0.5737892028472221, "learning_rate": 3.658541760900344e-05, "loss": 0.3467, "loss_nan_ranks": 0, "loss_rank_avg": 0.16055023670196533, "step": 1180, "valid_targets_mean": 3619.0, "valid_targets_min": 1179 }, { "epoch": 1.8997594226142742, "grad_norm": 0.7232340601273627, "learning_rate": 3.654062316377106e-05, "loss": 0.4098, "loss_nan_ranks": 0, "loss_rank_avg": 0.10650050640106201, "step": 1185, "valid_targets_mean": 1760.5, "valid_targets_min": 1013 }, { "epoch": 1.9077786688051324, "grad_norm": 0.6443220988369217, "learning_rate": 3.649556460847131e-05, "loss": 0.3532, "loss_nan_ranks": 0, "loss_rank_avg": 0.14743563532829285, "step": 1190, "valid_targets_mean": 3203.2, "valid_targets_min": 1358 }, { "epoch": 1.9157979149959905, "grad_norm": 0.5582690367284744, "learning_rate": 3.6450242662570314e-05, "loss": 0.3863, "loss_nan_ranks": 0, "loss_rank_avg": 0.19748684763908386, "step": 1195, "valid_targets_mean": 4101.1, "valid_targets_min": 924 }, { "epoch": 1.9238171611868484, "grad_norm": 0.6001754112517981, "learning_rate": 3.6404658049739854e-05, "loss": 0.3866, "loss_nan_ranks": 0, "loss_rank_avg": 0.13483411073684692, "step": 1200, "valid_targets_mean": 3079.5, "valid_targets_min": 2280 }, { "epoch": 1.9318364073777063, "grad_norm": 0.5966029488469835, "learning_rate": 3.63588114978458e-05, "loss": 0.3956, "loss_nan_ranks": 0, "loss_rank_avg": 0.1857229471206665, "step": 1205, "valid_targets_mean": 3873.2, "valid_targets_min": 1460 }, { "epoch": 1.9398556535685647, "grad_norm": 0.6168496251026493, "learning_rate": 3.6312703738936504e-05, "loss": 0.356, "loss_nan_ranks": 0, "loss_rank_avg": 0.13357146084308624, "step": 1210, "valid_targets_mean": 2732.0, "valid_targets_min": 1303 }, { "epoch": 1.9478748997594226, "grad_norm": 0.6311909475544676, "learning_rate": 3.626633550923111e-05, "loss": 0.3864, "loss_nan_ranks": 0, "loss_rank_avg": 0.22280068695545197, "step": 1215, "valid_targets_mean": 4697.6, "valid_targets_min": 1197 }, { "epoch": 1.9558941459502805, "grad_norm": 0.6330802569242555, "learning_rate": 3.621970754910778e-05, "loss": 0.3879, "loss_nan_ranks": 0, "loss_rank_avg": 0.17384251952171326, "step": 1220, "valid_targets_mean": 3419.2, "valid_targets_min": 1113 }, { "epoch": 1.9639133921411387, "grad_norm": 0.6832101537550106, "learning_rate": 3.6172820603091885e-05, "loss": 0.3898, "loss_nan_ranks": 0, "loss_rank_avg": 0.23188313841819763, "step": 1225, "valid_targets_mean": 5003.0, "valid_targets_min": 1552 }, { "epoch": 1.9719326383319968, "grad_norm": 0.5453371948123984, "learning_rate": 3.612567541984413e-05, "loss": 0.3592, "loss_nan_ranks": 0, "loss_rank_avg": 0.1720346063375473, "step": 1230, "valid_targets_mean": 4566.8, "valid_targets_min": 1636 }, { "epoch": 1.9799518845228548, "grad_norm": 0.6263399586173676, "learning_rate": 3.6078272752148574e-05, "loss": 0.3594, "loss_nan_ranks": 0, "loss_rank_avg": 0.18737949430942535, "step": 1235, "valid_targets_mean": 4321.5, "valid_targets_min": 1472 }, { "epoch": 1.987971130713713, "grad_norm": 0.627134594554725, "learning_rate": 3.6030613356900635e-05, "loss": 0.3852, "loss_nan_ranks": 0, "loss_rank_avg": 0.22431224584579468, "step": 1240, "valid_targets_mean": 4424.0, "valid_targets_min": 1391 }, { "epoch": 1.995990376904571, "grad_norm": 0.5993458413134857, "learning_rate": 3.598269799509498e-05, "loss": 0.3682, "loss_nan_ranks": 0, "loss_rank_avg": 0.20022183656692505, "step": 1245, "valid_targets_mean": 4605.9, "valid_targets_min": 1823 }, { "epoch": 2.003207698476343, "grad_norm": 0.5663208864221956, "learning_rate": 3.5934527431813385e-05, "loss": 0.3698, "loss_nan_ranks": 0, "loss_rank_avg": 0.12005630880594254, "step": 1250, "valid_targets_mean": 2945.0, "valid_targets_min": 1420 }, { "epoch": 2.011226944667201, "grad_norm": 0.8872549889160983, "learning_rate": 3.5886102436212536e-05, "loss": 0.3523, "loss_nan_ranks": 0, "loss_rank_avg": 0.22787944972515106, "step": 1255, "valid_targets_mean": 2892.1, "valid_targets_min": 1151 }, { "epoch": 2.0192461908580595, "grad_norm": 0.70325046246873, "learning_rate": 3.583742378151171e-05, "loss": 0.3569, "loss_nan_ranks": 0, "loss_rank_avg": 0.09715551137924194, "step": 1260, "valid_targets_mean": 1930.8, "valid_targets_min": 1236 }, { "epoch": 2.0272654370489174, "grad_norm": 0.45173903036506174, "learning_rate": 3.5788492244980464e-05, "loss": 0.3134, "loss_nan_ranks": 0, "loss_rank_avg": 0.15271684527397156, "step": 1265, "valid_targets_mean": 5269.2, "valid_targets_min": 1086 }, { "epoch": 2.0352846832397753, "grad_norm": 0.6267349391058774, "learning_rate": 3.573930860792621e-05, "loss": 0.3587, "loss_nan_ranks": 0, "loss_rank_avg": 0.12874770164489746, "step": 1270, "valid_targets_mean": 3163.2, "valid_targets_min": 1708 }, { "epoch": 2.0433039294306337, "grad_norm": 0.6511298081327664, "learning_rate": 3.568987365568173e-05, "loss": 0.3162, "loss_nan_ranks": 0, "loss_rank_avg": 0.15595881640911102, "step": 1275, "valid_targets_mean": 4213.8, "valid_targets_min": 2064 }, { "epoch": 2.0513231756214916, "grad_norm": 0.6887412815570042, "learning_rate": 3.564018817759266e-05, "loss": 0.3608, "loss_nan_ranks": 0, "loss_rank_avg": 0.19574494659900665, "step": 1280, "valid_targets_mean": 3699.8, "valid_targets_min": 1734 }, { "epoch": 2.0593424218123495, "grad_norm": 0.5876985128109127, "learning_rate": 3.559025296700484e-05, "loss": 0.3442, "loss_nan_ranks": 0, "loss_rank_avg": 0.2059636414051056, "step": 1285, "valid_targets_mean": 5620.4, "valid_targets_min": 1040 }, { "epoch": 2.067361668003208, "grad_norm": 0.6489766733954635, "learning_rate": 3.554006882125173e-05, "loss": 0.3468, "loss_nan_ranks": 0, "loss_rank_avg": 0.14607182145118713, "step": 1290, "valid_targets_mean": 3392.2, "valid_targets_min": 1345 }, { "epoch": 2.075380914194066, "grad_norm": 0.6998589814788587, "learning_rate": 3.5489636541641586e-05, "loss": 0.3531, "loss_nan_ranks": 0, "loss_rank_avg": 0.25323814153671265, "step": 1295, "valid_targets_mean": 4242.2, "valid_targets_min": 1980 }, { "epoch": 2.0834001603849237, "grad_norm": 0.6809616848578639, "learning_rate": 3.543895693344472e-05, "loss": 0.3421, "loss_nan_ranks": 0, "loss_rank_avg": 0.26932215690612793, "step": 1300, "valid_targets_mean": 6057.2, "valid_targets_min": 1100 }, { "epoch": 2.091419406575782, "grad_norm": 0.7197676582601361, "learning_rate": 3.538803080588063e-05, "loss": 0.3771, "loss_nan_ranks": 0, "loss_rank_avg": 0.13603916764259338, "step": 1305, "valid_targets_mean": 2857.4, "valid_targets_min": 1126 }, { "epoch": 2.09943865276664, "grad_norm": 0.5586827477126696, "learning_rate": 3.5336858972105076e-05, "loss": 0.3465, "loss_nan_ranks": 0, "loss_rank_avg": 0.16107013821601868, "step": 1310, "valid_targets_mean": 5763.4, "valid_targets_min": 912 }, { "epoch": 2.107457898957498, "grad_norm": 0.6466104512256226, "learning_rate": 3.528544224919708e-05, "loss": 0.3284, "loss_nan_ranks": 0, "loss_rank_avg": 0.1799907684326172, "step": 1315, "valid_targets_mean": 4982.8, "valid_targets_min": 1556 }, { "epoch": 2.115477145148356, "grad_norm": 0.7350409668585496, "learning_rate": 3.5233781458145934e-05, "loss": 0.368, "loss_nan_ranks": 0, "loss_rank_avg": 0.22638684511184692, "step": 1320, "valid_targets_mean": 4702.5, "valid_targets_min": 1729 }, { "epoch": 2.123496391339214, "grad_norm": 0.7064124825894162, "learning_rate": 3.5181877423838034e-05, "loss": 0.3549, "loss_nan_ranks": 0, "loss_rank_avg": 0.14431232213974, "step": 1325, "valid_targets_mean": 2504.0, "valid_targets_min": 1463 }, { "epoch": 2.131515637530072, "grad_norm": 0.6170135621678351, "learning_rate": 3.512973097504371e-05, "loss": 0.3395, "loss_nan_ranks": 0, "loss_rank_avg": 0.1600828617811203, "step": 1330, "valid_targets_mean": 4526.1, "valid_targets_min": 1870 }, { "epoch": 2.13953488372093, "grad_norm": 0.6334913259623194, "learning_rate": 3.507734294440403e-05, "loss": 0.3453, "loss_nan_ranks": 0, "loss_rank_avg": 0.22223691642284393, "step": 1335, "valid_targets_mean": 3722.9, "valid_targets_min": 1819 }, { "epoch": 2.1475541299117884, "grad_norm": 0.5896282676984603, "learning_rate": 3.50247141684175e-05, "loss": 0.3314, "loss_nan_ranks": 0, "loss_rank_avg": 0.1323956400156021, "step": 1340, "valid_targets_mean": 3185.5, "valid_targets_min": 1339 }, { "epoch": 2.1555733761026463, "grad_norm": 0.7760657508108424, "learning_rate": 3.497184548742667e-05, "loss": 0.3643, "loss_nan_ranks": 0, "loss_rank_avg": 0.19285187125205994, "step": 1345, "valid_targets_mean": 2632.2, "valid_targets_min": 1300 }, { "epoch": 2.1635926222935042, "grad_norm": 0.6467658716847074, "learning_rate": 3.491873774560473e-05, "loss": 0.3383, "loss_nan_ranks": 0, "loss_rank_avg": 0.1351018100976944, "step": 1350, "valid_targets_mean": 3104.2, "valid_targets_min": 1488 }, { "epoch": 2.1716118684843626, "grad_norm": 0.6572971280106079, "learning_rate": 3.486539179094208e-05, "loss": 0.3467, "loss_nan_ranks": 0, "loss_rank_avg": 0.19534534215927124, "step": 1355, "valid_targets_mean": 4289.0, "valid_targets_min": 954 }, { "epoch": 2.1796311146752205, "grad_norm": 0.576102818448099, "learning_rate": 3.481180847523272e-05, "loss": 0.3471, "loss_nan_ranks": 0, "loss_rank_avg": 0.10375870019197464, "step": 1360, "valid_targets_mean": 3130.5, "valid_targets_min": 2285 }, { "epoch": 2.1876503608660784, "grad_norm": 0.5976408294352582, "learning_rate": 3.4757988654060684e-05, "loss": 0.3322, "loss_nan_ranks": 0, "loss_rank_avg": 0.22457639873027802, "step": 1365, "valid_targets_mean": 4272.2, "valid_targets_min": 1063 }, { "epoch": 2.195669607056937, "grad_norm": 0.6876863275492887, "learning_rate": 3.470393318678637e-05, "loss": 0.3545, "loss_nan_ranks": 0, "loss_rank_avg": 0.13346576690673828, "step": 1370, "valid_targets_mean": 3217.4, "valid_targets_min": 1409 }, { "epoch": 2.2036888532477947, "grad_norm": 0.5667005128855648, "learning_rate": 3.4649642936532836e-05, "loss": 0.3661, "loss_nan_ranks": 0, "loss_rank_avg": 0.1915643811225891, "step": 1375, "valid_targets_mean": 4325.4, "valid_targets_min": 1274 }, { "epoch": 2.2117080994386527, "grad_norm": 0.6805553682250962, "learning_rate": 3.4595118770171984e-05, "loss": 0.3608, "loss_nan_ranks": 0, "loss_rank_avg": 0.16712094843387604, "step": 1380, "valid_targets_mean": 3757.0, "valid_targets_min": 1767 }, { "epoch": 2.219727345629511, "grad_norm": 0.5851592379232585, "learning_rate": 3.454036155831077e-05, "loss": 0.3684, "loss_nan_ranks": 0, "loss_rank_avg": 0.18492160737514496, "step": 1385, "valid_targets_mean": 4730.1, "valid_targets_min": 1819 }, { "epoch": 2.227746591820369, "grad_norm": 0.5941379064666082, "learning_rate": 3.4485372175277236e-05, "loss": 0.3378, "loss_nan_ranks": 0, "loss_rank_avg": 0.17360571026802063, "step": 1390, "valid_targets_mean": 4303.4, "valid_targets_min": 1718 }, { "epoch": 2.235765838011227, "grad_norm": 0.7120870875424696, "learning_rate": 3.44301514991066e-05, "loss": 0.3575, "loss_nan_ranks": 0, "loss_rank_avg": 0.1876790076494217, "step": 1395, "valid_targets_mean": 3447.5, "valid_targets_min": 1887 }, { "epoch": 2.2437850842020852, "grad_norm": 0.8987849319173, "learning_rate": 3.4374700411527225e-05, "loss": 0.3516, "loss_nan_ranks": 0, "loss_rank_avg": 0.1342727690935135, "step": 1400, "valid_targets_mean": 2107.1, "valid_targets_min": 1157 }, { "epoch": 2.251804330392943, "grad_norm": 0.7207343049659005, "learning_rate": 3.431901979794653e-05, "loss": 0.3784, "loss_nan_ranks": 0, "loss_rank_avg": 0.14748650789260864, "step": 1405, "valid_targets_mean": 4076.9, "valid_targets_min": 2404 }, { "epoch": 2.259823576583801, "grad_norm": 0.646268203387511, "learning_rate": 3.426311054743685e-05, "loss": 0.3207, "loss_nan_ranks": 0, "loss_rank_avg": 0.17233049869537354, "step": 1410, "valid_targets_mean": 3841.1, "valid_targets_min": 1958 }, { "epoch": 2.267842822774659, "grad_norm": 0.6555687819002504, "learning_rate": 3.420697355272127e-05, "loss": 0.3485, "loss_nan_ranks": 0, "loss_rank_avg": 0.21643511950969696, "step": 1415, "valid_targets_mean": 4472.8, "valid_targets_min": 988 }, { "epoch": 2.2758620689655173, "grad_norm": 0.6365450212470497, "learning_rate": 3.415060971015933e-05, "loss": 0.3425, "loss_nan_ranks": 0, "loss_rank_avg": 0.15613329410552979, "step": 1420, "valid_targets_mean": 3359.0, "valid_targets_min": 1872 }, { "epoch": 2.2838813151563753, "grad_norm": 0.5472941463259734, "learning_rate": 3.4094019919732736e-05, "loss": 0.3582, "loss_nan_ranks": 0, "loss_rank_avg": 0.18104006350040436, "step": 1425, "valid_targets_mean": 3852.8, "valid_targets_min": 1580 }, { "epoch": 2.291900561347233, "grad_norm": 0.6778575739718365, "learning_rate": 3.403720508503098e-05, "loss": 0.3188, "loss_nan_ranks": 0, "loss_rank_avg": 0.11832959949970245, "step": 1430, "valid_targets_mean": 2429.9, "valid_targets_min": 1140 }, { "epoch": 2.2999198075380916, "grad_norm": 0.7046598918064869, "learning_rate": 3.398016611323693e-05, "loss": 0.3428, "loss_nan_ranks": 0, "loss_rank_avg": 0.1872364580631256, "step": 1435, "valid_targets_mean": 2780.0, "valid_targets_min": 989 }, { "epoch": 2.3079390537289495, "grad_norm": 0.5903200079092314, "learning_rate": 3.392290391511232e-05, "loss": 0.3376, "loss_nan_ranks": 0, "loss_rank_avg": 0.24641390144824982, "step": 1440, "valid_targets_mean": 5554.1, "valid_targets_min": 1395 }, { "epoch": 2.3159582999198074, "grad_norm": 0.5877596462721397, "learning_rate": 3.386541940498322e-05, "loss": 0.3471, "loss_nan_ranks": 0, "loss_rank_avg": 0.20738443732261658, "step": 1445, "valid_targets_mean": 5463.1, "valid_targets_min": 1245 }, { "epoch": 2.3239775461106658, "grad_norm": 0.518772079301355, "learning_rate": 3.380771350072543e-05, "loss": 0.3246, "loss_nan_ranks": 0, "loss_rank_avg": 0.14182378351688385, "step": 1450, "valid_targets_mean": 4598.1, "valid_targets_min": 1677 }, { "epoch": 2.3319967923015237, "grad_norm": 0.6214771748168114, "learning_rate": 3.374978712374986e-05, "loss": 0.3465, "loss_nan_ranks": 0, "loss_rank_avg": 0.1580396294593811, "step": 1455, "valid_targets_mean": 3403.0, "valid_targets_min": 804 }, { "epoch": 2.3400160384923816, "grad_norm": 0.6601543484544395, "learning_rate": 3.369164119898774e-05, "loss": 0.3465, "loss_nan_ranks": 0, "loss_rank_avg": 0.1316310465335846, "step": 1460, "valid_targets_mean": 2555.2, "valid_targets_min": 708 }, { "epoch": 2.34803528468324, "grad_norm": 0.5865229505252662, "learning_rate": 3.363327665487593e-05, "loss": 0.3555, "loss_nan_ranks": 0, "loss_rank_avg": 0.1241571456193924, "step": 1465, "valid_targets_mean": 2880.8, "valid_targets_min": 1233 }, { "epoch": 2.356054530874098, "grad_norm": 0.5980685298620095, "learning_rate": 3.357469442334206e-05, "loss": 0.3669, "loss_nan_ranks": 0, "loss_rank_avg": 0.2264668047428131, "step": 1470, "valid_targets_mean": 6163.9, "valid_targets_min": 1401 }, { "epoch": 2.364073777064956, "grad_norm": 0.6627796109058691, "learning_rate": 3.351589543978965e-05, "loss": 0.3481, "loss_nan_ranks": 0, "loss_rank_avg": 0.2296164184808731, "step": 1475, "valid_targets_mean": 3652.5, "valid_targets_min": 1154 }, { "epoch": 2.3720930232558137, "grad_norm": 0.5294058440362729, "learning_rate": 3.345688064308317e-05, "loss": 0.3283, "loss_nan_ranks": 0, "loss_rank_avg": 0.09211620688438416, "step": 1480, "valid_targets_mean": 1971.9, "valid_targets_min": 1273 }, { "epoch": 2.380112269446672, "grad_norm": 0.5811757127018823, "learning_rate": 3.339765097553307e-05, "loss": 0.3275, "loss_nan_ranks": 0, "loss_rank_avg": 0.1387772560119629, "step": 1485, "valid_targets_mean": 4018.6, "valid_targets_min": 1418 }, { "epoch": 2.38813151563753, "grad_norm": 0.6531008698660362, "learning_rate": 3.33382073828807e-05, "loss": 0.3569, "loss_nan_ranks": 0, "loss_rank_avg": 0.2030208259820938, "step": 1490, "valid_targets_mean": 3304.8, "valid_targets_min": 345 }, { "epoch": 2.3961507618283884, "grad_norm": 0.5940837552451501, "learning_rate": 3.327855081428326e-05, "loss": 0.3315, "loss_nan_ranks": 0, "loss_rank_avg": 0.11011539399623871, "step": 1495, "valid_targets_mean": 2390.4, "valid_targets_min": 1365 }, { "epoch": 2.4041700080192463, "grad_norm": 0.6349081771533944, "learning_rate": 3.3218682222298584e-05, "loss": 0.3297, "loss_nan_ranks": 0, "loss_rank_avg": 0.17606303095817566, "step": 1500, "valid_targets_mean": 4131.0, "valid_targets_min": 1191 }, { "epoch": 2.412189254210104, "grad_norm": 0.6551570262937156, "learning_rate": 3.315860256286996e-05, "loss": 0.3444, "loss_nan_ranks": 0, "loss_rank_avg": 0.1725284457206726, "step": 1505, "valid_targets_mean": 3694.4, "valid_targets_min": 1828 }, { "epoch": 2.420208500400962, "grad_norm": 0.576066249468684, "learning_rate": 3.3098312795310894e-05, "loss": 0.3592, "loss_nan_ranks": 0, "loss_rank_avg": 0.11704175174236298, "step": 1510, "valid_targets_mean": 3280.1, "valid_targets_min": 2248 }, { "epoch": 2.4282277465918205, "grad_norm": 0.5960437561557996, "learning_rate": 3.303781388228974e-05, "loss": 0.3464, "loss_nan_ranks": 0, "loss_rank_avg": 0.1958293616771698, "step": 1515, "valid_targets_mean": 4049.8, "valid_targets_min": 1618 }, { "epoch": 2.4362469927826784, "grad_norm": 0.8307745047978246, "learning_rate": 3.297710678981435e-05, "loss": 0.3123, "loss_nan_ranks": 0, "loss_rank_avg": 0.1351197361946106, "step": 1520, "valid_targets_mean": 2351.6, "valid_targets_min": 1405 }, { "epoch": 2.4442662389735363, "grad_norm": 0.6476048564369427, "learning_rate": 3.291619248721667e-05, "loss": 0.3319, "loss_nan_ranks": 0, "loss_rank_avg": 0.21313653886318207, "step": 1525, "valid_targets_mean": 3757.8, "valid_targets_min": 1368 }, { "epoch": 2.4522854851643947, "grad_norm": 0.6101060365763258, "learning_rate": 3.285507194713724e-05, "loss": 0.3467, "loss_nan_ranks": 0, "loss_rank_avg": 0.19842976331710815, "step": 1530, "valid_targets_mean": 4398.0, "valid_targets_min": 1107 }, { "epoch": 2.4603047313552526, "grad_norm": 0.5916014914557419, "learning_rate": 3.279374614550966e-05, "loss": 0.3277, "loss_nan_ranks": 0, "loss_rank_avg": 0.13822132349014282, "step": 1535, "valid_targets_mean": 3856.4, "valid_targets_min": 1457 }, { "epoch": 2.4683239775461105, "grad_norm": 0.6072793114889506, "learning_rate": 3.2732216061545e-05, "loss": 0.3367, "loss_nan_ranks": 0, "loss_rank_avg": 0.20727184414863586, "step": 1540, "valid_targets_mean": 4482.2, "valid_targets_min": 1559 }, { "epoch": 2.476343223736969, "grad_norm": 0.5182531096963034, "learning_rate": 3.2670482677716214e-05, "loss": 0.3488, "loss_nan_ranks": 0, "loss_rank_avg": 0.1823084056377411, "step": 1545, "valid_targets_mean": 6600.6, "valid_targets_min": 1566 }, { "epoch": 2.484362469927827, "grad_norm": 0.6588849437987316, "learning_rate": 3.2608546979742394e-05, "loss": 0.3583, "loss_nan_ranks": 0, "loss_rank_avg": 0.2547794282436371, "step": 1550, "valid_targets_mean": 4279.4, "valid_targets_min": 1003 }, { "epoch": 2.4923817161186848, "grad_norm": 0.5210067181618686, "learning_rate": 3.254640995657307e-05, "loss": 0.3334, "loss_nan_ranks": 0, "loss_rank_avg": 0.12388885021209717, "step": 1555, "valid_targets_mean": 3967.8, "valid_targets_min": 1582 }, { "epoch": 2.500400962309543, "grad_norm": 0.6675420827290998, "learning_rate": 3.248407260037239e-05, "loss": 0.3419, "loss_nan_ranks": 0, "loss_rank_avg": 0.17942309379577637, "step": 1560, "valid_targets_mean": 4615.5, "valid_targets_min": 1587 }, { "epoch": 2.508420208500401, "grad_norm": 0.7303300679097665, "learning_rate": 3.24215359065033e-05, "loss": 0.3565, "loss_nan_ranks": 0, "loss_rank_avg": 0.2134750932455063, "step": 1565, "valid_targets_mean": 3633.2, "valid_targets_min": 1707 }, { "epoch": 2.516439454691259, "grad_norm": 0.6444335496667586, "learning_rate": 3.235880087351164e-05, "loss": 0.3555, "loss_nan_ranks": 0, "loss_rank_avg": 0.23998838663101196, "step": 1570, "valid_targets_mean": 5089.2, "valid_targets_min": 1714 }, { "epoch": 2.524458700882117, "grad_norm": 0.5748610625680467, "learning_rate": 3.2295868503110184e-05, "loss": 0.34, "loss_nan_ranks": 0, "loss_rank_avg": 0.2552739977836609, "step": 1575, "valid_targets_mean": 6235.0, "valid_targets_min": 1689 }, { "epoch": 2.5324779470729752, "grad_norm": 0.6462216645868455, "learning_rate": 3.22327398001627e-05, "loss": 0.3605, "loss_nan_ranks": 0, "loss_rank_avg": 0.16141477227210999, "step": 1580, "valid_targets_mean": 2878.8, "valid_targets_min": 1170 }, { "epoch": 2.540497193263833, "grad_norm": 0.5609462119008043, "learning_rate": 3.216941577266783e-05, "loss": 0.3695, "loss_nan_ranks": 0, "loss_rank_avg": 0.2184831202030182, "step": 1585, "valid_targets_mean": 6295.1, "valid_targets_min": 1501 }, { "epoch": 2.5485164394546915, "grad_norm": 0.4957075570354505, "learning_rate": 3.210589743174308e-05, "loss": 0.327, "loss_nan_ranks": 0, "loss_rank_avg": 0.2078409641981125, "step": 1590, "valid_targets_mean": 7591.4, "valid_targets_min": 1955 }, { "epoch": 2.5565356856455494, "grad_norm": 0.6463964641560773, "learning_rate": 3.204218579160857e-05, "loss": 0.3293, "loss_nan_ranks": 0, "loss_rank_avg": 0.24058961868286133, "step": 1595, "valid_targets_mean": 5036.2, "valid_targets_min": 1200 }, { "epoch": 2.5645549318364074, "grad_norm": 0.5516304479142902, "learning_rate": 3.197828186957094e-05, "loss": 0.3367, "loss_nan_ranks": 0, "loss_rank_avg": 0.1926528811454773, "step": 1600, "valid_targets_mean": 5438.1, "valid_targets_min": 1771 }, { "epoch": 2.5725741780272653, "grad_norm": 0.5248474906462943, "learning_rate": 3.191418668600705e-05, "loss": 0.3413, "loss_nan_ranks": 0, "loss_rank_avg": 0.15956036746501923, "step": 1605, "valid_targets_mean": 5140.5, "valid_targets_min": 1973 }, { "epoch": 2.5805934242181237, "grad_norm": 0.6278892330122797, "learning_rate": 3.184990126434771e-05, "loss": 0.3503, "loss_nan_ranks": 0, "loss_rank_avg": 0.21146860718727112, "step": 1610, "valid_targets_mean": 3795.6, "valid_targets_min": 1006 }, { "epoch": 2.5886126704089816, "grad_norm": 0.6365412145603873, "learning_rate": 3.178542663106131e-05, "loss": 0.3514, "loss_nan_ranks": 0, "loss_rank_avg": 0.165127694606781, "step": 1615, "valid_targets_mean": 3648.6, "valid_targets_min": 1373 }, { "epoch": 2.5966319165998395, "grad_norm": 0.6105168700748761, "learning_rate": 3.172076381563748e-05, "loss": 0.3697, "loss_nan_ranks": 0, "loss_rank_avg": 0.2247442901134491, "step": 1620, "valid_targets_mean": 4797.0, "valid_targets_min": 1482 }, { "epoch": 2.604651162790698, "grad_norm": 0.5552391542865701, "learning_rate": 3.165591385057058e-05, "loss": 0.366, "loss_nan_ranks": 0, "loss_rank_avg": 0.16839686036109924, "step": 1625, "valid_targets_mean": 4180.8, "valid_targets_min": 2486 }, { "epoch": 2.612670408981556, "grad_norm": 0.6258173020249116, "learning_rate": 3.1590877771343316e-05, "loss": 0.3276, "loss_nan_ranks": 0, "loss_rank_avg": 0.20165500044822693, "step": 1630, "valid_targets_mean": 4232.8, "valid_targets_min": 954 }, { "epoch": 2.6206896551724137, "grad_norm": 0.6291679923624242, "learning_rate": 3.152565661641008e-05, "loss": 0.3309, "loss_nan_ranks": 0, "loss_rank_avg": 0.2278696447610855, "step": 1635, "valid_targets_mean": 5187.6, "valid_targets_min": 1647 }, { "epoch": 2.6287089013632716, "grad_norm": 0.629899100817526, "learning_rate": 3.1460251427180474e-05, "loss": 0.3488, "loss_nan_ranks": 0, "loss_rank_avg": 0.13377898931503296, "step": 1640, "valid_targets_mean": 2682.0, "valid_targets_min": 1718 }, { "epoch": 2.63672814755413, "grad_norm": 0.6868725842453621, "learning_rate": 3.139466324800263e-05, "loss": 0.3232, "loss_nan_ranks": 0, "loss_rank_avg": 0.12783987820148468, "step": 1645, "valid_targets_mean": 3092.1, "valid_targets_min": 1504 }, { "epoch": 2.644747393744988, "grad_norm": 0.655325240952164, "learning_rate": 3.132889312614655e-05, "loss": 0.3143, "loss_nan_ranks": 0, "loss_rank_avg": 0.1781664788722992, "step": 1650, "valid_targets_mean": 3401.0, "valid_targets_min": 1985 }, { "epoch": 2.6527666399358463, "grad_norm": 0.6228530990624284, "learning_rate": 3.126294211178737e-05, "loss": 0.3413, "loss_nan_ranks": 0, "loss_rank_avg": 0.17397254705429077, "step": 1655, "valid_targets_mean": 3983.8, "valid_targets_min": 1548 }, { "epoch": 2.660785886126704, "grad_norm": 0.5714671399749158, "learning_rate": 3.1196811257988634e-05, "loss": 0.3569, "loss_nan_ranks": 0, "loss_rank_avg": 0.16387617588043213, "step": 1660, "valid_targets_mean": 4429.9, "valid_targets_min": 1463 }, { "epoch": 2.668805132317562, "grad_norm": 0.7483517252874993, "learning_rate": 3.1130501620685394e-05, "loss": 0.3671, "loss_nan_ranks": 0, "loss_rank_avg": 0.23365803062915802, "step": 1665, "valid_targets_mean": 2976.1, "valid_targets_min": 1136 }, { "epoch": 2.67682437850842, "grad_norm": 0.6639005033164377, "learning_rate": 3.106401425866745e-05, "loss": 0.341, "loss_nan_ranks": 0, "loss_rank_avg": 0.19206903874874115, "step": 1670, "valid_targets_mean": 3576.8, "valid_targets_min": 1679 }, { "epoch": 2.6848436246992784, "grad_norm": 0.5766789644867589, "learning_rate": 3.099735023356236e-05, "loss": 0.3651, "loss_nan_ranks": 0, "loss_rank_avg": 0.21450704336166382, "step": 1675, "valid_targets_mean": 5612.0, "valid_targets_min": 849 }, { "epoch": 2.6928628708901363, "grad_norm": 0.5871168709870269, "learning_rate": 3.0930510609818564e-05, "loss": 0.3311, "loss_nan_ranks": 0, "loss_rank_avg": 0.17829036712646484, "step": 1680, "valid_targets_mean": 4906.4, "valid_targets_min": 1779 }, { "epoch": 2.7008821170809942, "grad_norm": 0.5872313358818464, "learning_rate": 3.086349645468831e-05, "loss": 0.3371, "loss_nan_ranks": 0, "loss_rank_avg": 0.11560177803039551, "step": 1685, "valid_targets_mean": 4144.8, "valid_targets_min": 1313 }, { "epoch": 2.7089013632718526, "grad_norm": 0.5826035312015911, "learning_rate": 3.079630883821067e-05, "loss": 0.3512, "loss_nan_ranks": 0, "loss_rank_avg": 0.21896260976791382, "step": 1690, "valid_targets_mean": 4781.9, "valid_targets_min": 2115 }, { "epoch": 2.7169206094627105, "grad_norm": 0.6011395273868881, "learning_rate": 3.0728948833194436e-05, "loss": 0.3343, "loss_nan_ranks": 0, "loss_rank_avg": 0.21181732416152954, "step": 1695, "valid_targets_mean": 5069.0, "valid_targets_min": 1363 }, { "epoch": 2.7249398556535684, "grad_norm": 0.6651359418444572, "learning_rate": 3.066141751520099e-05, "loss": 0.3442, "loss_nan_ranks": 0, "loss_rank_avg": 0.1747858226299286, "step": 1700, "valid_targets_mean": 3284.0, "valid_targets_min": 1926 }, { "epoch": 2.7329591018444264, "grad_norm": 0.6115176677200098, "learning_rate": 3.059371596252712e-05, "loss": 0.3269, "loss_nan_ranks": 0, "loss_rank_avg": 0.162808358669281, "step": 1705, "valid_targets_mean": 3847.5, "valid_targets_min": 1296 }, { "epoch": 2.7409783480352847, "grad_norm": 0.6656515539528712, "learning_rate": 3.0525845256187834e-05, "loss": 0.3136, "loss_nan_ranks": 0, "loss_rank_avg": 0.14415833353996277, "step": 1710, "valid_targets_mean": 3631.0, "valid_targets_min": 2313 }, { "epoch": 2.7489975942261426, "grad_norm": 0.6083830291868935, "learning_rate": 3.0457806479899044e-05, "loss": 0.3757, "loss_nan_ranks": 0, "loss_rank_avg": 0.18218392133712769, "step": 1715, "valid_targets_mean": 4358.8, "valid_targets_min": 1822 }, { "epoch": 2.757016840417001, "grad_norm": 0.6011013868022232, "learning_rate": 3.0389600720060318e-05, "loss": 0.366, "loss_nan_ranks": 0, "loss_rank_avg": 0.2295471429824829, "step": 1720, "valid_targets_mean": 4038.2, "valid_targets_min": 1807 }, { "epoch": 2.765036086607859, "grad_norm": 0.6611587519621636, "learning_rate": 3.0321229065737522e-05, "loss": 0.3441, "loss_nan_ranks": 0, "loss_rank_avg": 0.16769525408744812, "step": 1725, "valid_targets_mean": 2427.5, "valid_targets_min": 1552 }, { "epoch": 2.773055332798717, "grad_norm": 0.8131060808181708, "learning_rate": 3.0252692608645384e-05, "loss": 0.3584, "loss_nan_ranks": 0, "loss_rank_avg": 0.18336832523345947, "step": 1730, "valid_targets_mean": 3267.2, "valid_targets_min": 894 }, { "epoch": 2.7810745789895748, "grad_norm": 0.5610531465944066, "learning_rate": 3.0183992443130127e-05, "loss": 0.3633, "loss_nan_ranks": 0, "loss_rank_avg": 0.16682939231395721, "step": 1735, "valid_targets_mean": 4752.2, "valid_targets_min": 2202 }, { "epoch": 2.789093825180433, "grad_norm": 0.5997382925590476, "learning_rate": 3.011512966615195e-05, "loss": 0.3449, "loss_nan_ranks": 0, "loss_rank_avg": 0.12142496556043625, "step": 1740, "valid_targets_mean": 2443.5, "valid_targets_min": 1471 }, { "epoch": 2.797113071371291, "grad_norm": 0.5762907495346832, "learning_rate": 3.0046105377267523e-05, "loss": 0.3301, "loss_nan_ranks": 0, "loss_rank_avg": 0.17085179686546326, "step": 1745, "valid_targets_mean": 4630.1, "valid_targets_min": 1542 }, { "epoch": 2.8051323175621494, "grad_norm": 0.5829196843633385, "learning_rate": 2.9976920678612456e-05, "loss": 0.3471, "loss_nan_ranks": 0, "loss_rank_avg": 0.24269111454486847, "step": 1750, "valid_targets_mean": 5201.4, "valid_targets_min": 1951 }, { "epoch": 2.8131515637530073, "grad_norm": 0.6277816875568113, "learning_rate": 2.9907576674883664e-05, "loss": 0.3371, "loss_nan_ranks": 0, "loss_rank_avg": 0.2342943698167801, "step": 1755, "valid_targets_mean": 5771.5, "valid_targets_min": 2030 }, { "epoch": 2.8211708099438653, "grad_norm": 0.5566183050309045, "learning_rate": 2.983807447332174e-05, "loss": 0.3455, "loss_nan_ranks": 0, "loss_rank_avg": 0.12989120185375214, "step": 1760, "valid_targets_mean": 3220.8, "valid_targets_min": 1346 }, { "epoch": 2.829190056134723, "grad_norm": 0.5843107774579075, "learning_rate": 2.9768415183693293e-05, "loss": 0.3412, "loss_nan_ranks": 0, "loss_rank_avg": 0.15450912714004517, "step": 1765, "valid_targets_mean": 3541.1, "valid_targets_min": 1458 }, { "epoch": 2.8372093023255816, "grad_norm": 0.6007068163414647, "learning_rate": 2.9698599918273197e-05, "loss": 0.3282, "loss_nan_ranks": 0, "loss_rank_avg": 0.17683474719524384, "step": 1770, "valid_targets_mean": 4956.5, "valid_targets_min": 881 }, { "epoch": 2.8452285485164395, "grad_norm": 0.6439652957844222, "learning_rate": 2.962862979182686e-05, "loss": 0.3612, "loss_nan_ranks": 0, "loss_rank_avg": 0.13516972959041595, "step": 1775, "valid_targets_mean": 2771.8, "valid_targets_min": 1059 }, { "epoch": 2.8532477947072974, "grad_norm": 0.5806838903580533, "learning_rate": 2.95585059215924e-05, "loss": 0.3445, "loss_nan_ranks": 0, "loss_rank_avg": 0.14902666211128235, "step": 1780, "valid_targets_mean": 3495.1, "valid_targets_min": 1494 }, { "epoch": 2.8612670408981558, "grad_norm": 0.8405453402220504, "learning_rate": 2.948822942726284e-05, "loss": 0.3465, "loss_nan_ranks": 0, "loss_rank_avg": 0.19173868000507355, "step": 1785, "valid_targets_mean": 2640.8, "valid_targets_min": 1046 }, { "epoch": 2.8692862870890137, "grad_norm": 0.5958007208888075, "learning_rate": 2.941780143096817e-05, "loss": 0.3465, "loss_nan_ranks": 0, "loss_rank_avg": 0.19616219401359558, "step": 1790, "valid_targets_mean": 4756.8, "valid_targets_min": 1433 }, { "epoch": 2.8773055332798716, "grad_norm": 0.5542905432219679, "learning_rate": 2.9347223057257505e-05, "loss": 0.3407, "loss_nan_ranks": 0, "loss_rank_avg": 0.1591700315475464, "step": 1795, "valid_targets_mean": 5558.9, "valid_targets_min": 1023 }, { "epoch": 2.8853247794707295, "grad_norm": 0.4833364708765064, "learning_rate": 2.927649543308106e-05, "loss": 0.3459, "loss_nan_ranks": 0, "loss_rank_avg": 0.18111169338226318, "step": 1800, "valid_targets_mean": 6311.6, "valid_targets_min": 1023 }, { "epoch": 2.893344025661588, "grad_norm": 0.5957529324717237, "learning_rate": 2.9205619687772212e-05, "loss": 0.3347, "loss_nan_ranks": 0, "loss_rank_avg": 0.18495184183120728, "step": 1805, "valid_targets_mean": 4080.9, "valid_targets_min": 1787 }, { "epoch": 2.901363271852446, "grad_norm": 0.6158328047841045, "learning_rate": 2.9134596953029413e-05, "loss": 0.3501, "loss_nan_ranks": 0, "loss_rank_avg": 0.17425167560577393, "step": 1810, "valid_targets_mean": 4262.2, "valid_targets_min": 1576 }, { "epoch": 2.909382518043304, "grad_norm": 0.4842742755340218, "learning_rate": 2.9063428362898168e-05, "loss": 0.3273, "loss_nan_ranks": 0, "loss_rank_avg": 0.13343685865402222, "step": 1815, "valid_targets_mean": 5032.9, "valid_targets_min": 1627 }, { "epoch": 2.917401764234162, "grad_norm": 0.5503873137781846, "learning_rate": 2.8992115053752905e-05, "loss": 0.3271, "loss_nan_ranks": 0, "loss_rank_avg": 0.1701168566942215, "step": 1820, "valid_targets_mean": 4278.1, "valid_targets_min": 1496 }, { "epoch": 2.92542101042502, "grad_norm": 0.5745206673048178, "learning_rate": 2.8920658164278816e-05, "loss": 0.3479, "loss_nan_ranks": 0, "loss_rank_avg": 0.14051708579063416, "step": 1825, "valid_targets_mean": 3690.9, "valid_targets_min": 1271 }, { "epoch": 2.933440256615878, "grad_norm": 0.6857547647409145, "learning_rate": 2.884905883545373e-05, "loss": 0.344, "loss_nan_ranks": 0, "loss_rank_avg": 0.15106357634067535, "step": 1830, "valid_targets_mean": 3079.5, "valid_targets_min": 1457 }, { "epoch": 2.9414595028067363, "grad_norm": 0.5480224874709139, "learning_rate": 2.877731821052981e-05, "loss": 0.3521, "loss_nan_ranks": 0, "loss_rank_avg": 0.23945242166519165, "step": 1835, "valid_targets_mean": 5315.8, "valid_targets_min": 1619 }, { "epoch": 2.949478748997594, "grad_norm": 0.5679922622553645, "learning_rate": 2.8705437435015375e-05, "loss": 0.3322, "loss_nan_ranks": 0, "loss_rank_avg": 0.21760649979114532, "step": 1840, "valid_targets_mean": 5026.5, "valid_targets_min": 1646 }, { "epoch": 2.957497995188452, "grad_norm": 0.5313840600274049, "learning_rate": 2.8633417656656566e-05, "loss": 0.3371, "loss_nan_ranks": 0, "loss_rank_avg": 0.11117774248123169, "step": 1845, "valid_targets_mean": 3457.6, "valid_targets_min": 1578 }, { "epoch": 2.9655172413793105, "grad_norm": 0.6297881056735455, "learning_rate": 2.8561260025419036e-05, "loss": 0.3242, "loss_nan_ranks": 0, "loss_rank_avg": 0.2085118293762207, "step": 1850, "valid_targets_mean": 4719.8, "valid_targets_min": 1504 }, { "epoch": 2.9735364875701684, "grad_norm": 0.8963545587577034, "learning_rate": 2.8488965693469583e-05, "loss": 0.3367, "loss_nan_ranks": 0, "loss_rank_avg": 0.17817959189414978, "step": 1855, "valid_targets_mean": 3197.5, "valid_targets_min": 1654 }, { "epoch": 2.9815557337610263, "grad_norm": 0.5354808191697631, "learning_rate": 2.8416535815157763e-05, "loss": 0.329, "loss_nan_ranks": 0, "loss_rank_avg": 0.1702459305524826, "step": 1860, "valid_targets_mean": 4165.6, "valid_targets_min": 1186 }, { "epoch": 2.9895749799518843, "grad_norm": 0.6498642625370372, "learning_rate": 2.8343971546997434e-05, "loss": 0.3243, "loss_nan_ranks": 0, "loss_rank_avg": 0.157914936542511, "step": 1865, "valid_targets_mean": 2609.2, "valid_targets_min": 1441 }, { "epoch": 2.9975942261427426, "grad_norm": 0.6297407453522518, "learning_rate": 2.827127404764831e-05, "loss": 0.3259, "loss_nan_ranks": 0, "loss_rank_avg": 0.11299164593219757, "step": 1870, "valid_targets_mean": 2654.1, "valid_targets_min": 1182 }, { "epoch": 3.0048115477145148, "grad_norm": 0.7032762627174555, "learning_rate": 2.8198444477897467e-05, "loss": 0.3048, "loss_nan_ranks": 0, "loss_rank_avg": 0.15206965804100037, "step": 1875, "valid_targets_mean": 2631.5, "valid_targets_min": 1636 }, { "epoch": 3.0128307939053727, "grad_norm": 0.7155942882812133, "learning_rate": 2.8125484000640787e-05, "loss": 0.3047, "loss_nan_ranks": 0, "loss_rank_avg": 0.10091409832239151, "step": 1880, "valid_targets_mean": 2218.4, "valid_targets_min": 808 }, { "epoch": 3.020850040096231, "grad_norm": 0.4981371502776664, "learning_rate": 2.8052393780864394e-05, "loss": 0.3012, "loss_nan_ranks": 0, "loss_rank_avg": 0.1289309561252594, "step": 1885, "valid_targets_mean": 4298.6, "valid_targets_min": 1512 }, { "epoch": 3.028869286287089, "grad_norm": 0.575400474472258, "learning_rate": 2.797917498562607e-05, "loss": 0.3181, "loss_nan_ranks": 0, "loss_rank_avg": 0.1485946774482727, "step": 1890, "valid_targets_mean": 4350.4, "valid_targets_min": 1291 }, { "epoch": 3.036888532477947, "grad_norm": 0.5120704781400871, "learning_rate": 2.7905828784036596e-05, "loss": 0.3114, "loss_nan_ranks": 0, "loss_rank_avg": 0.21469643712043762, "step": 1895, "valid_targets_mean": 7091.8, "valid_targets_min": 1765 }, { "epoch": 3.0449077786688052, "grad_norm": 0.5767259511228147, "learning_rate": 2.78323563472411e-05, "loss": 0.3333, "loss_nan_ranks": 0, "loss_rank_avg": 0.18228240311145782, "step": 1900, "valid_targets_mean": 5326.8, "valid_targets_min": 1610 }, { "epoch": 3.052927024859663, "grad_norm": 0.5491197579142447, "learning_rate": 2.7758758848400354e-05, "loss": 0.3296, "loss_nan_ranks": 0, "loss_rank_avg": 0.1779412031173706, "step": 1905, "valid_targets_mean": 5061.5, "valid_targets_min": 1582 }, { "epoch": 3.060946271050521, "grad_norm": 0.6842155517498201, "learning_rate": 2.7685037462672043e-05, "loss": 0.3075, "loss_nan_ranks": 0, "loss_rank_avg": 0.19132070243358612, "step": 1910, "valid_targets_mean": 3660.1, "valid_targets_min": 1162 }, { "epoch": 3.0689655172413794, "grad_norm": 0.6760878064304382, "learning_rate": 2.7611193367191993e-05, "loss": 0.3065, "loss_nan_ranks": 0, "loss_rank_avg": 0.22465574741363525, "step": 1915, "valid_targets_mean": 4018.1, "valid_targets_min": 2057 }, { "epoch": 3.0769847634322374, "grad_norm": 0.6414087031460661, "learning_rate": 2.7537227741055378e-05, "loss": 0.3305, "loss_nan_ranks": 0, "loss_rank_avg": 0.10675209015607834, "step": 1920, "valid_targets_mean": 2162.2, "valid_targets_min": 1006 }, { "epoch": 3.0850040096230953, "grad_norm": 0.6858636117457415, "learning_rate": 2.746314176529791e-05, "loss": 0.3172, "loss_nan_ranks": 0, "loss_rank_avg": 0.16336016356945038, "step": 1925, "valid_targets_mean": 3358.5, "valid_targets_min": 1381 }, { "epoch": 3.0930232558139537, "grad_norm": 0.4896718696555601, "learning_rate": 2.7388936622876957e-05, "loss": 0.3474, "loss_nan_ranks": 0, "loss_rank_avg": 0.17518985271453857, "step": 1930, "valid_targets_mean": 7132.2, "valid_targets_min": 1765 }, { "epoch": 3.1010425020048116, "grad_norm": 0.5104354367503314, "learning_rate": 2.7314613498652663e-05, "loss": 0.3179, "loss_nan_ranks": 0, "loss_rank_avg": 0.17402449250221252, "step": 1935, "valid_targets_mean": 5995.6, "valid_targets_min": 1169 }, { "epoch": 3.1090617481956695, "grad_norm": 0.6254156399773187, "learning_rate": 2.7240173579369025e-05, "loss": 0.3159, "loss_nan_ranks": 0, "loss_rank_avg": 0.12640006840229034, "step": 1940, "valid_targets_mean": 3783.9, "valid_targets_min": 1231 }, { "epoch": 3.117080994386528, "grad_norm": 0.5304276087744046, "learning_rate": 2.7165618053634962e-05, "loss": 0.3402, "loss_nan_ranks": 0, "loss_rank_avg": 0.13664016127586365, "step": 1945, "valid_targets_mean": 6537.9, "valid_targets_min": 2060 }, { "epoch": 3.125100240577386, "grad_norm": 0.6393804177692343, "learning_rate": 2.7090948111905304e-05, "loss": 0.3177, "loss_nan_ranks": 0, "loss_rank_avg": 0.15379135310649872, "step": 1950, "valid_targets_mean": 3703.0, "valid_targets_min": 1171 }, { "epoch": 3.1331194867682437, "grad_norm": 0.7483845792341272, "learning_rate": 2.701616494646183e-05, "loss": 0.3417, "loss_nan_ranks": 0, "loss_rank_avg": 0.16798612475395203, "step": 1955, "valid_targets_mean": 2964.4, "valid_targets_min": 2087 }, { "epoch": 3.141138732959102, "grad_norm": 0.6571338517574732, "learning_rate": 2.6941269751394174e-05, "loss": 0.3165, "loss_nan_ranks": 0, "loss_rank_avg": 0.19471541047096252, "step": 1960, "valid_targets_mean": 4089.4, "valid_targets_min": 1584 }, { "epoch": 3.14915797914996, "grad_norm": 0.7937141144340575, "learning_rate": 2.686626372258081e-05, "loss": 0.3353, "loss_nan_ranks": 0, "loss_rank_avg": 0.2159966677427292, "step": 1965, "valid_targets_mean": 3406.1, "valid_targets_min": 1393 }, { "epoch": 3.157177225340818, "grad_norm": 0.6798355217613847, "learning_rate": 2.6791148057669913e-05, "loss": 0.3036, "loss_nan_ranks": 0, "loss_rank_avg": 0.19850729405879974, "step": 1970, "valid_targets_mean": 4502.8, "valid_targets_min": 1625 }, { "epoch": 3.165196471531676, "grad_norm": 0.5314856867903979, "learning_rate": 2.671592395606027e-05, "loss": 0.3177, "loss_nan_ranks": 0, "loss_rank_avg": 0.0934186726808548, "step": 1975, "valid_targets_mean": 3235.5, "valid_targets_min": 1488 }, { "epoch": 3.173215717722534, "grad_norm": 0.7120381313874422, "learning_rate": 2.6640592618882114e-05, "loss": 0.3152, "loss_nan_ranks": 0, "loss_rank_avg": 0.19404734671115875, "step": 1980, "valid_targets_mean": 3064.2, "valid_targets_min": 1401 }, { "epoch": 3.181234963913392, "grad_norm": 0.4626762807628728, "learning_rate": 2.656515524897795e-05, "loss": 0.3084, "loss_nan_ranks": 0, "loss_rank_avg": 0.19291116297245026, "step": 1985, "valid_targets_mean": 7916.4, "valid_targets_min": 1706 }, { "epoch": 3.18925421010425, "grad_norm": 0.5223576381813416, "learning_rate": 2.6489613050883343e-05, "loss": 0.3548, "loss_nan_ranks": 0, "loss_rank_avg": 0.132581427693367, "step": 1990, "valid_targets_mean": 5168.0, "valid_targets_min": 1191 }, { "epoch": 3.1972734562951084, "grad_norm": 0.5813867725843586, "learning_rate": 2.6413967230807677e-05, "loss": 0.2938, "loss_nan_ranks": 0, "loss_rank_avg": 0.17431476712226868, "step": 1995, "valid_targets_mean": 4458.4, "valid_targets_min": 1123 }, { "epoch": 3.2052927024859663, "grad_norm": 0.6202033622798051, "learning_rate": 2.6338218996614924e-05, "loss": 0.3066, "loss_nan_ranks": 0, "loss_rank_avg": 0.1445320099592209, "step": 2000, "valid_targets_mean": 3833.1, "valid_targets_min": 1692 }, { "epoch": 3.2133119486768242, "grad_norm": 0.6448556178568718, "learning_rate": 2.6262369557804325e-05, "loss": 0.3133, "loss_nan_ranks": 0, "loss_rank_avg": 0.1171756237745285, "step": 2005, "valid_targets_mean": 2876.5, "valid_targets_min": 1136 }, { "epoch": 3.2213311948676826, "grad_norm": 0.6092126401517288, "learning_rate": 2.6186420125491094e-05, "loss": 0.302, "loss_nan_ranks": 0, "loss_rank_avg": 0.14689497649669647, "step": 2010, "valid_targets_mean": 3826.5, "valid_targets_min": 2248 }, { "epoch": 3.2293504410585405, "grad_norm": 0.6043324360660347, "learning_rate": 2.6110371912387083e-05, "loss": 0.3023, "loss_nan_ranks": 0, "loss_rank_avg": 0.1918356716632843, "step": 2015, "valid_targets_mean": 5438.6, "valid_targets_min": 1884 }, { "epoch": 3.2373696872493984, "grad_norm": 0.47063226408624154, "learning_rate": 2.6034226132781407e-05, "loss": 0.315, "loss_nan_ranks": 0, "loss_rank_avg": 0.22369518876075745, "step": 2020, "valid_targets_mean": 8461.0, "valid_targets_min": 1896 }, { "epoch": 3.245388933440257, "grad_norm": 0.9275068584587873, "learning_rate": 2.5957984002521066e-05, "loss": 0.2872, "loss_nan_ranks": 0, "loss_rank_avg": 0.197782963514328, "step": 2025, "valid_targets_mean": 3524.5, "valid_targets_min": 1703 }, { "epoch": 3.2534081796311147, "grad_norm": 0.5533054991481485, "learning_rate": 2.588164673899151e-05, "loss": 0.3244, "loss_nan_ranks": 0, "loss_rank_avg": 0.13876253366470337, "step": 2030, "valid_targets_mean": 4418.5, "valid_targets_min": 1813 }, { "epoch": 3.2614274258219726, "grad_norm": 0.7212838634122106, "learning_rate": 2.580521556109724e-05, "loss": 0.3402, "loss_nan_ranks": 0, "loss_rank_avg": 0.20015841722488403, "step": 2035, "valid_targets_mean": 3805.8, "valid_targets_min": 1421 }, { "epoch": 3.2694466720128306, "grad_norm": 0.7597766574519237, "learning_rate": 2.57286916892423e-05, "loss": 0.3079, "loss_nan_ranks": 0, "loss_rank_avg": 0.15914931893348694, "step": 2040, "valid_targets_mean": 2774.2, "valid_targets_min": 1255 }, { "epoch": 3.277465918203689, "grad_norm": 0.5821850834880777, "learning_rate": 2.5652076345310822e-05, "loss": 0.3252, "loss_nan_ranks": 0, "loss_rank_avg": 0.1513526290655136, "step": 2045, "valid_targets_mean": 5144.5, "valid_targets_min": 1597 }, { "epoch": 3.285485164394547, "grad_norm": 0.6255573781506097, "learning_rate": 2.5575370752647507e-05, "loss": 0.3036, "loss_nan_ranks": 0, "loss_rank_avg": 0.2162339985370636, "step": 2050, "valid_targets_mean": 5110.9, "valid_targets_min": 1532 }, { "epoch": 3.293504410585405, "grad_norm": 0.696164430308172, "learning_rate": 2.5498576136038077e-05, "loss": 0.3169, "loss_nan_ranks": 0, "loss_rank_avg": 0.1917979121208191, "step": 2055, "valid_targets_mean": 3515.4, "valid_targets_min": 1727 }, { "epoch": 3.301523656776263, "grad_norm": 0.6295572557942658, "learning_rate": 2.542169372168976e-05, "loss": 0.3361, "loss_nan_ranks": 0, "loss_rank_avg": 0.12846094369888306, "step": 2060, "valid_targets_mean": 3133.1, "valid_targets_min": 1526 }, { "epoch": 3.309542902967121, "grad_norm": 0.7413126077265113, "learning_rate": 2.5344724737211646e-05, "loss": 0.3347, "loss_nan_ranks": 0, "loss_rank_avg": 0.11233331263065338, "step": 2065, "valid_targets_mean": 2601.6, "valid_targets_min": 1160 }, { "epoch": 3.317562149157979, "grad_norm": 0.7018220334438993, "learning_rate": 2.5267670411595152e-05, "loss": 0.3327, "loss_nan_ranks": 0, "loss_rank_avg": 0.18812254071235657, "step": 2070, "valid_targets_mean": 4047.4, "valid_targets_min": 1636 }, { "epoch": 3.3255813953488373, "grad_norm": 0.7023439898521772, "learning_rate": 2.5190531975194345e-05, "loss": 0.3201, "loss_nan_ranks": 0, "loss_rank_avg": 0.12871921062469482, "step": 2075, "valid_targets_mean": 3000.5, "valid_targets_min": 1178 }, { "epoch": 3.3336006415396953, "grad_norm": 0.6859887980576995, "learning_rate": 2.5113310659706322e-05, "loss": 0.3037, "loss_nan_ranks": 0, "loss_rank_avg": 0.14714935421943665, "step": 2080, "valid_targets_mean": 3496.4, "valid_targets_min": 1499 }, { "epoch": 3.341619887730553, "grad_norm": 0.6210652673938497, "learning_rate": 2.5036007698151553e-05, "loss": 0.3521, "loss_nan_ranks": 0, "loss_rank_avg": 0.11785542219877243, "step": 2085, "valid_targets_mean": 3337.6, "valid_targets_min": 1170 }, { "epoch": 3.3496391339214115, "grad_norm": 0.723666478833868, "learning_rate": 2.4958624324854185e-05, "loss": 0.3195, "loss_nan_ranks": 0, "loss_rank_avg": 0.2654890716075897, "step": 2090, "valid_targets_mean": 4701.8, "valid_targets_min": 1820 }, { "epoch": 3.3576583801122695, "grad_norm": 0.6623344321527482, "learning_rate": 2.4881161775422303e-05, "loss": 0.2965, "loss_nan_ranks": 0, "loss_rank_avg": 0.14719511568546295, "step": 2095, "valid_targets_mean": 3824.8, "valid_targets_min": 1739 }, { "epoch": 3.3656776263031274, "grad_norm": 1.4563673300691875, "learning_rate": 2.480362128672824e-05, "loss": 0.3193, "loss_nan_ranks": 0, "loss_rank_avg": 0.1964644342660904, "step": 2100, "valid_targets_mean": 3709.1, "valid_targets_min": 1576 }, { "epoch": 3.3736968724939858, "grad_norm": 0.6842287679822243, "learning_rate": 2.4726004096888817e-05, "loss": 0.3166, "loss_nan_ranks": 0, "loss_rank_avg": 0.10231268405914307, "step": 2105, "valid_targets_mean": 2384.8, "valid_targets_min": 948 }, { "epoch": 3.3817161186848437, "grad_norm": 0.6061497280938558, "learning_rate": 2.4648311445245558e-05, "loss": 0.3181, "loss_nan_ranks": 0, "loss_rank_avg": 0.11788766831159592, "step": 2110, "valid_targets_mean": 3423.9, "valid_targets_min": 1617 }, { "epoch": 3.3897353648757016, "grad_norm": 0.6208122569688548, "learning_rate": 2.457054457234493e-05, "loss": 0.3171, "loss_nan_ranks": 0, "loss_rank_avg": 0.18449848890304565, "step": 2115, "valid_targets_mean": 5041.8, "valid_targets_min": 1682 }, { "epoch": 3.39775461106656, "grad_norm": 0.6169483248382215, "learning_rate": 2.4492704719918497e-05, "loss": 0.3237, "loss_nan_ranks": 0, "loss_rank_avg": 0.1982535421848297, "step": 2120, "valid_targets_mean": 4748.6, "valid_targets_min": 1276 }, { "epoch": 3.405773857257418, "grad_norm": 0.6248745182773543, "learning_rate": 2.4414793130863134e-05, "loss": 0.3302, "loss_nan_ranks": 0, "loss_rank_avg": 0.20577558875083923, "step": 2125, "valid_targets_mean": 5071.9, "valid_targets_min": 1111 }, { "epoch": 3.413793103448276, "grad_norm": 0.6631257350229737, "learning_rate": 2.433681104922114e-05, "loss": 0.2932, "loss_nan_ranks": 0, "loss_rank_avg": 0.1303030252456665, "step": 2130, "valid_targets_mean": 3573.0, "valid_targets_min": 1133 }, { "epoch": 3.4218123496391337, "grad_norm": 0.5854169688561389, "learning_rate": 2.4258759720160412e-05, "loss": 0.3236, "loss_nan_ranks": 0, "loss_rank_avg": 0.09749852865934372, "step": 2135, "valid_targets_mean": 2798.1, "valid_targets_min": 1635 }, { "epoch": 3.429831595829992, "grad_norm": 0.7655917364113674, "learning_rate": 2.4180640389954534e-05, "loss": 0.3512, "loss_nan_ranks": 0, "loss_rank_avg": 0.15098845958709717, "step": 2140, "valid_targets_mean": 2984.9, "valid_targets_min": 1296 }, { "epoch": 3.43785084202085, "grad_norm": 0.7793522714461361, "learning_rate": 2.4102454305962892e-05, "loss": 0.321, "loss_nan_ranks": 0, "loss_rank_avg": 0.1879688799381256, "step": 2145, "valid_targets_mean": 2992.2, "valid_targets_min": 1347 }, { "epoch": 3.445870088211708, "grad_norm": 0.5389302191512596, "learning_rate": 2.402420271661076e-05, "loss": 0.3298, "loss_nan_ranks": 0, "loss_rank_avg": 0.2137525975704193, "step": 2150, "valid_targets_mean": 5566.5, "valid_targets_min": 1084 }, { "epoch": 3.4538893344025663, "grad_norm": 0.5578382143957197, "learning_rate": 2.3945886871369338e-05, "loss": 0.3198, "loss_nan_ranks": 0, "loss_rank_avg": 0.20459142327308655, "step": 2155, "valid_targets_mean": 5751.5, "valid_targets_min": 855 }, { "epoch": 3.461908580593424, "grad_norm": 0.6820518141435146, "learning_rate": 2.3867508020735865e-05, "loss": 0.3094, "loss_nan_ranks": 0, "loss_rank_avg": 0.15902569890022278, "step": 2160, "valid_targets_mean": 3122.2, "valid_targets_min": 1646 }, { "epoch": 3.469927826784282, "grad_norm": 0.7101366612068016, "learning_rate": 2.3789067416213568e-05, "loss": 0.3133, "loss_nan_ranks": 0, "loss_rank_avg": 0.23392510414123535, "step": 2165, "valid_targets_mean": 3977.8, "valid_targets_min": 1901 }, { "epoch": 3.4779470729751405, "grad_norm": 0.5959411507559745, "learning_rate": 2.3710566310291733e-05, "loss": 0.3233, "loss_nan_ranks": 0, "loss_rank_avg": 0.12113741040229797, "step": 2170, "valid_targets_mean": 3409.2, "valid_targets_min": 1170 }, { "epoch": 3.4859663191659984, "grad_norm": 0.825513561005537, "learning_rate": 2.36320059564257e-05, "loss": 0.3127, "loss_nan_ranks": 0, "loss_rank_avg": 0.18326623737812042, "step": 2175, "valid_targets_mean": 2507.5, "valid_targets_min": 1314 }, { "epoch": 3.4939855653568563, "grad_norm": 0.5881807614207331, "learning_rate": 2.3553387609016833e-05, "loss": 0.3159, "loss_nan_ranks": 0, "loss_rank_avg": 0.17981299757957458, "step": 2180, "valid_targets_mean": 4888.0, "valid_targets_min": 1192 }, { "epoch": 3.5020048115477147, "grad_norm": 0.6376036084209341, "learning_rate": 2.347471252339252e-05, "loss": 0.3294, "loss_nan_ranks": 0, "loss_rank_avg": 0.13395290076732635, "step": 2185, "valid_targets_mean": 4075.9, "valid_targets_min": 1563 }, { "epoch": 3.5100240577385726, "grad_norm": 0.7048620960136164, "learning_rate": 2.339598195578608e-05, "loss": 0.3039, "loss_nan_ranks": 0, "loss_rank_avg": 0.15857946872711182, "step": 2190, "valid_targets_mean": 3868.2, "valid_targets_min": 1272 }, { "epoch": 3.5180433039294305, "grad_norm": 0.6021136042957389, "learning_rate": 2.3317197163316757e-05, "loss": 0.3069, "loss_nan_ranks": 0, "loss_rank_avg": 0.15142685174942017, "step": 2195, "valid_targets_mean": 4533.5, "valid_targets_min": 1038 }, { "epoch": 3.5260625501202885, "grad_norm": 0.6263357498807368, "learning_rate": 2.3238359403969608e-05, "loss": 0.3077, "loss_nan_ranks": 0, "loss_rank_avg": 0.1935206949710846, "step": 2200, "valid_targets_mean": 4888.2, "valid_targets_min": 1624 }, { "epoch": 3.534081796311147, "grad_norm": 0.5754085355874449, "learning_rate": 2.315946993657543e-05, "loss": 0.3172, "loss_nan_ranks": 0, "loss_rank_avg": 0.1102745458483696, "step": 2205, "valid_targets_mean": 3415.2, "valid_targets_min": 1243 }, { "epoch": 3.5421010425020047, "grad_norm": 0.6423875097563647, "learning_rate": 2.3080530020790673e-05, "loss": 0.3184, "loss_nan_ranks": 0, "loss_rank_avg": 0.14007174968719482, "step": 2210, "valid_targets_mean": 3485.9, "valid_targets_min": 1035 }, { "epoch": 3.550120288692863, "grad_norm": 0.6750320761835421, "learning_rate": 2.300154091707731e-05, "loss": 0.3318, "loss_nan_ranks": 0, "loss_rank_avg": 0.117277592420578, "step": 2215, "valid_targets_mean": 2678.0, "valid_targets_min": 1380 }, { "epoch": 3.558139534883721, "grad_norm": 0.6925001340893145, "learning_rate": 2.2922503886682706e-05, "loss": 0.3194, "loss_nan_ranks": 0, "loss_rank_avg": 0.12452782690525055, "step": 2220, "valid_targets_mean": 2616.5, "valid_targets_min": 1483 }, { "epoch": 3.566158781074579, "grad_norm": 0.6234691562412563, "learning_rate": 2.28434201916195e-05, "loss": 0.292, "loss_nan_ranks": 0, "loss_rank_avg": 0.13704489171504974, "step": 2225, "valid_targets_mean": 3737.6, "valid_targets_min": 1066 }, { "epoch": 3.574178027265437, "grad_norm": 0.5773390397694997, "learning_rate": 2.2764291094645446e-05, "loss": 0.3299, "loss_nan_ranks": 0, "loss_rank_avg": 0.163415789604187, "step": 2230, "valid_targets_mean": 4716.2, "valid_targets_min": 945 }, { "epoch": 3.5821972734562952, "grad_norm": 0.4634986618987104, "learning_rate": 2.2685117859243223e-05, "loss": 0.3095, "loss_nan_ranks": 0, "loss_rank_avg": 0.0939498022198677, "step": 2235, "valid_targets_mean": 4529.6, "valid_targets_min": 1421 }, { "epoch": 3.590216519647153, "grad_norm": 0.5818654879010436, "learning_rate": 2.2605901749600312e-05, "loss": 0.3071, "loss_nan_ranks": 0, "loss_rank_avg": 0.17287366092205048, "step": 2240, "valid_targets_mean": 4227.2, "valid_targets_min": 1826 }, { "epoch": 3.598235765838011, "grad_norm": 0.7271214583355132, "learning_rate": 2.2526644030588764e-05, "loss": 0.3165, "loss_nan_ranks": 0, "loss_rank_avg": 0.159470796585083, "step": 2245, "valid_targets_mean": 3116.0, "valid_targets_min": 1306 }, { "epoch": 3.6062550120288694, "grad_norm": 0.6303736540938414, "learning_rate": 2.2447345967745036e-05, "loss": 0.311, "loss_nan_ranks": 0, "loss_rank_avg": 0.2228410840034485, "step": 2250, "valid_targets_mean": 4970.2, "valid_targets_min": 1644 }, { "epoch": 3.6142742582197274, "grad_norm": 0.6640983802312498, "learning_rate": 2.2368008827249756e-05, "loss": 0.337, "loss_nan_ranks": 0, "loss_rank_avg": 0.14799731969833374, "step": 2255, "valid_targets_mean": 3004.9, "valid_targets_min": 1629 }, { "epoch": 3.6222935044105853, "grad_norm": 0.6702618106749398, "learning_rate": 2.228863387590752e-05, "loss": 0.3103, "loss_nan_ranks": 0, "loss_rank_avg": 0.17356805503368378, "step": 2260, "valid_targets_mean": 3511.9, "valid_targets_min": 1761 }, { "epoch": 3.630312750601443, "grad_norm": 0.6574381856226909, "learning_rate": 2.2209222381126687e-05, "loss": 0.3232, "loss_nan_ranks": 0, "loss_rank_avg": 0.13788670301437378, "step": 2265, "valid_targets_mean": 3237.2, "valid_targets_min": 1420 }, { "epoch": 3.6383319967923016, "grad_norm": 0.6413893082198431, "learning_rate": 2.212977561089908e-05, "loss": 0.3023, "loss_nan_ranks": 0, "loss_rank_avg": 0.12281788140535355, "step": 2270, "valid_targets_mean": 3069.0, "valid_targets_min": 1542 }, { "epoch": 3.6463512429831595, "grad_norm": 0.5679373919087424, "learning_rate": 2.20502948337798e-05, "loss": 0.3242, "loss_nan_ranks": 0, "loss_rank_avg": 0.14298275113105774, "step": 2275, "valid_targets_mean": 4023.9, "valid_targets_min": 852 }, { "epoch": 3.654370489174018, "grad_norm": 0.6109697268123285, "learning_rate": 2.1970781318866953e-05, "loss": 0.3366, "loss_nan_ranks": 0, "loss_rank_avg": 0.20169465243816376, "step": 2280, "valid_targets_mean": 4718.6, "valid_targets_min": 1267 }, { "epoch": 3.6623897353648758, "grad_norm": 0.6979138557796742, "learning_rate": 2.1891236335781363e-05, "loss": 0.3158, "loss_nan_ranks": 0, "loss_rank_avg": 0.215728297829628, "step": 2285, "valid_targets_mean": 4399.8, "valid_targets_min": 1068 }, { "epoch": 3.6704089815557337, "grad_norm": 0.5586803216815522, "learning_rate": 2.1811661154646332e-05, "loss": 0.3079, "loss_nan_ranks": 0, "loss_rank_avg": 0.15370899438858032, "step": 2290, "valid_targets_mean": 4967.1, "valid_targets_min": 1803 }, { "epoch": 3.6784282277465916, "grad_norm": 0.6642607846469272, "learning_rate": 2.173205704606735e-05, "loss": 0.3151, "loss_nan_ranks": 0, "loss_rank_avg": 0.1577022671699524, "step": 2295, "valid_targets_mean": 3313.6, "valid_targets_min": 1050 }, { "epoch": 3.68644747393745, "grad_norm": 0.47285164686405123, "learning_rate": 2.1652425281111785e-05, "loss": 0.3044, "loss_nan_ranks": 0, "loss_rank_avg": 0.12954489886760712, "step": 2300, "valid_targets_mean": 5698.8, "valid_targets_min": 1217 }, { "epoch": 3.694466720128308, "grad_norm": 0.616931928903888, "learning_rate": 2.1572767131288607e-05, "loss": 0.3319, "loss_nan_ranks": 0, "loss_rank_avg": 0.20086967945098877, "step": 2305, "valid_targets_mean": 4502.0, "valid_targets_min": 1995 }, { "epoch": 3.7024859663191663, "grad_norm": 0.6776466099415515, "learning_rate": 2.1493083868528095e-05, "loss": 0.3189, "loss_nan_ranks": 0, "loss_rank_avg": 0.14949862658977509, "step": 2310, "valid_targets_mean": 2669.6, "valid_targets_min": 1321 }, { "epoch": 3.710505212510024, "grad_norm": 0.5879844987206615, "learning_rate": 2.141337676516151e-05, "loss": 0.3009, "loss_nan_ranks": 0, "loss_rank_avg": 0.14676722884178162, "step": 2315, "valid_targets_mean": 4159.5, "valid_targets_min": 1297 }, { "epoch": 3.718524458700882, "grad_norm": 0.5316094998452582, "learning_rate": 2.1333647093900772e-05, "loss": 0.3084, "loss_nan_ranks": 0, "loss_rank_avg": 0.13722524046897888, "step": 2320, "valid_targets_mean": 4758.6, "valid_targets_min": 1388 }, { "epoch": 3.72654370489174, "grad_norm": 0.5384516550528783, "learning_rate": 2.1253896127818175e-05, "loss": 0.3268, "loss_nan_ranks": 0, "loss_rank_avg": 0.12726837396621704, "step": 2325, "valid_targets_mean": 3886.1, "valid_targets_min": 954 }, { "epoch": 3.7345629510825984, "grad_norm": 0.5685626865932278, "learning_rate": 2.1174125140326013e-05, "loss": 0.3221, "loss_nan_ranks": 0, "loss_rank_avg": 0.14816422760486603, "step": 2330, "valid_targets_mean": 5391.9, "valid_targets_min": 1217 }, { "epoch": 3.7425821972734563, "grad_norm": 0.6959300369817977, "learning_rate": 2.1094335405156277e-05, "loss": 0.3279, "loss_nan_ranks": 0, "loss_rank_avg": 0.1291712373495102, "step": 2335, "valid_targets_mean": 2644.0, "valid_targets_min": 1115 }, { "epoch": 3.7506014434643142, "grad_norm": 0.5721691342290822, "learning_rate": 2.1014528196340316e-05, "loss": 0.3253, "loss_nan_ranks": 0, "loss_rank_avg": 0.13201016187667847, "step": 2340, "valid_targets_mean": 4654.4, "valid_targets_min": 1343 }, { "epoch": 3.7586206896551726, "grad_norm": 0.5308921374713382, "learning_rate": 2.093470478818847e-05, "loss": 0.3066, "loss_nan_ranks": 0, "loss_rank_avg": 0.13984020054340363, "step": 2345, "valid_targets_mean": 4449.5, "valid_targets_min": 1874 }, { "epoch": 3.7666399358460305, "grad_norm": 0.5537790122050558, "learning_rate": 2.0854866455269756e-05, "loss": 0.3035, "loss_nan_ranks": 0, "loss_rank_avg": 0.1428103893995285, "step": 2350, "valid_targets_mean": 4530.8, "valid_targets_min": 1901 }, { "epoch": 3.7746591820368884, "grad_norm": 0.6191705377884588, "learning_rate": 2.0775014472391496e-05, "loss": 0.291, "loss_nan_ranks": 0, "loss_rank_avg": 0.12096063047647476, "step": 2355, "valid_targets_mean": 2235.4, "valid_targets_min": 894 }, { "epoch": 3.7826784282277464, "grad_norm": 0.7862911510988639, "learning_rate": 2.0695150114578958e-05, "loss": 0.3217, "loss_nan_ranks": 0, "loss_rank_avg": 0.2139546275138855, "step": 2360, "valid_targets_mean": 4749.4, "valid_targets_min": 1306 }, { "epoch": 3.7906976744186047, "grad_norm": 0.5933421737639701, "learning_rate": 2.061527465705502e-05, "loss": 0.3094, "loss_nan_ranks": 0, "loss_rank_avg": 0.19528578221797943, "step": 2365, "valid_targets_mean": 5284.5, "valid_targets_min": 781 }, { "epoch": 3.7987169206094626, "grad_norm": 0.7884471934753257, "learning_rate": 2.0535389375219773e-05, "loss": 0.3388, "loss_nan_ranks": 0, "loss_rank_avg": 0.15380559861660004, "step": 2370, "valid_targets_mean": 2415.1, "valid_targets_min": 769 }, { "epoch": 3.806736166800321, "grad_norm": 0.5628187445041986, "learning_rate": 2.045549554463019e-05, "loss": 0.2957, "loss_nan_ranks": 0, "loss_rank_avg": 0.16172266006469727, "step": 2375, "valid_targets_mean": 5658.4, "valid_targets_min": 1996 }, { "epoch": 3.814755412991179, "grad_norm": 0.7023321168544707, "learning_rate": 2.0375594440979744e-05, "loss": 0.3238, "loss_nan_ranks": 0, "loss_rank_avg": 0.1851782500743866, "step": 2380, "valid_targets_mean": 3709.6, "valid_targets_min": 940 }, { "epoch": 3.822774659182037, "grad_norm": 0.49816800365299313, "learning_rate": 2.0295687340078037e-05, "loss": 0.3232, "loss_nan_ranks": 0, "loss_rank_avg": 0.13774600625038147, "step": 2385, "valid_targets_mean": 5824.8, "valid_targets_min": 1088 }, { "epoch": 3.8307939053728948, "grad_norm": 0.5434759259403616, "learning_rate": 2.0215775517830437e-05, "loss": 0.3095, "loss_nan_ranks": 0, "loss_rank_avg": 0.10222262889146805, "step": 2390, "valid_targets_mean": 2964.1, "valid_targets_min": 1235 }, { "epoch": 3.838813151563753, "grad_norm": 0.5582954462858974, "learning_rate": 2.013586025021769e-05, "loss": 0.3078, "loss_nan_ranks": 0, "loss_rank_avg": 0.1320442408323288, "step": 2395, "valid_targets_mean": 4672.4, "valid_targets_min": 1916 }, { "epoch": 3.846832397754611, "grad_norm": 0.6219244880549153, "learning_rate": 2.0055942813275564e-05, "loss": 0.3158, "loss_nan_ranks": 0, "loss_rank_avg": 0.1533651351928711, "step": 2400, "valid_targets_mean": 3792.5, "valid_targets_min": 1635 }, { "epoch": 3.854851643945469, "grad_norm": 0.583133909428859, "learning_rate": 1.9976024483074456e-05, "loss": 0.3029, "loss_nan_ranks": 0, "loss_rank_avg": 0.13537335395812988, "step": 2405, "valid_targets_mean": 3669.5, "valid_targets_min": 777 }, { "epoch": 3.8628708901363273, "grad_norm": 0.5710475515218163, "learning_rate": 1.9896106535699025e-05, "loss": 0.3186, "loss_nan_ranks": 0, "loss_rank_avg": 0.17371848225593567, "step": 2410, "valid_targets_mean": 4763.5, "valid_targets_min": 1886 }, { "epoch": 3.8708901363271853, "grad_norm": 0.7422087750459289, "learning_rate": 1.9816190247227834e-05, "loss": 0.3175, "loss_nan_ranks": 0, "loss_rank_avg": 0.20205745100975037, "step": 2415, "valid_targets_mean": 3689.9, "valid_targets_min": 910 }, { "epoch": 3.878909382518043, "grad_norm": 0.5735536579762645, "learning_rate": 1.9736276893712954e-05, "loss": 0.2792, "loss_nan_ranks": 0, "loss_rank_avg": 0.10921778529882431, "step": 2420, "valid_targets_mean": 2331.6, "valid_targets_min": 1712 }, { "epoch": 3.886928628708901, "grad_norm": 0.8290520620887073, "learning_rate": 1.9656367751159565e-05, "loss": 0.3029, "loss_nan_ranks": 0, "loss_rank_avg": 0.16875413060188293, "step": 2425, "valid_targets_mean": 5420.2, "valid_targets_min": 942 }, { "epoch": 3.8949478748997595, "grad_norm": 0.6634118467936565, "learning_rate": 1.957646409550565e-05, "loss": 0.3406, "loss_nan_ranks": 0, "loss_rank_avg": 0.162868469953537, "step": 2430, "valid_targets_mean": 3375.5, "valid_targets_min": 1776 }, { "epoch": 3.9029671210906174, "grad_norm": 0.5514424320141615, "learning_rate": 1.9496567202601545e-05, "loss": 0.3416, "loss_nan_ranks": 0, "loss_rank_avg": 0.11645983159542084, "step": 2435, "valid_targets_mean": 4063.9, "valid_targets_min": 1093 }, { "epoch": 3.9109863672814758, "grad_norm": 0.7559637270619394, "learning_rate": 1.9416678348189627e-05, "loss": 0.3209, "loss_nan_ranks": 0, "loss_rank_avg": 0.13118937611579895, "step": 2440, "valid_targets_mean": 2165.9, "valid_targets_min": 1256 }, { "epoch": 3.9190056134723337, "grad_norm": 0.5721686798208526, "learning_rate": 1.9336798807883907e-05, "loss": 0.3319, "loss_nan_ranks": 0, "loss_rank_avg": 0.15008927881717682, "step": 2445, "valid_targets_mean": 4456.1, "valid_targets_min": 1478 }, { "epoch": 3.9270248596631916, "grad_norm": 0.6746770874611306, "learning_rate": 1.9256929857149686e-05, "loss": 0.3254, "loss_nan_ranks": 0, "loss_rank_avg": 0.1619241088628769, "step": 2450, "valid_targets_mean": 4323.2, "valid_targets_min": 360 }, { "epoch": 3.9350441058540495, "grad_norm": 0.4588461813998274, "learning_rate": 1.9177072771283167e-05, "loss": 0.3064, "loss_nan_ranks": 0, "loss_rank_avg": 0.12452046573162079, "step": 2455, "valid_targets_mean": 6464.2, "valid_targets_min": 1916 }, { "epoch": 3.943063352044908, "grad_norm": 0.7611903980866798, "learning_rate": 1.9097228825391087e-05, "loss": 0.3234, "loss_nan_ranks": 0, "loss_rank_avg": 0.12964674830436707, "step": 2460, "valid_targets_mean": 2518.0, "valid_targets_min": 1172 }, { "epoch": 3.951082598235766, "grad_norm": 0.5770073146825253, "learning_rate": 1.9017399294370413e-05, "loss": 0.3004, "loss_nan_ranks": 0, "loss_rank_avg": 0.18876230716705322, "step": 2465, "valid_targets_mean": 5568.9, "valid_targets_min": 1405 }, { "epoch": 3.959101844426624, "grad_norm": 0.5817238464553584, "learning_rate": 1.893758545288791e-05, "loss": 0.2867, "loss_nan_ranks": 0, "loss_rank_avg": 0.1423710584640503, "step": 2470, "valid_targets_mean": 4295.6, "valid_targets_min": 1645 }, { "epoch": 3.967121090617482, "grad_norm": 0.6317461077406834, "learning_rate": 1.8857788575359847e-05, "loss": 0.3128, "loss_nan_ranks": 0, "loss_rank_avg": 0.16364887356758118, "step": 2475, "valid_targets_mean": 3607.5, "valid_targets_min": 1407 }, { "epoch": 3.97514033680834, "grad_norm": 0.8827850222282876, "learning_rate": 1.87780099359316e-05, "loss": 0.2975, "loss_nan_ranks": 0, "loss_rank_avg": 0.185146763920784, "step": 2480, "valid_targets_mean": 2134.6, "valid_targets_min": 1129 }, { "epoch": 3.983159582999198, "grad_norm": 0.6645940380342159, "learning_rate": 1.869825080845734e-05, "loss": 0.306, "loss_nan_ranks": 0, "loss_rank_avg": 0.10959568619728088, "step": 2485, "valid_targets_mean": 3266.5, "valid_targets_min": 932 }, { "epoch": 3.9911788291900563, "grad_norm": 0.6186510386974092, "learning_rate": 1.8618512466479686e-05, "loss": 0.3092, "loss_nan_ranks": 0, "loss_rank_avg": 0.15738460421562195, "step": 2490, "valid_targets_mean": 3458.0, "valid_targets_min": 1685 }, { "epoch": 3.999198075380914, "grad_norm": 0.6807919040257233, "learning_rate": 1.8538796183209373e-05, "loss": 0.2979, "loss_nan_ranks": 0, "loss_rank_avg": 0.1197328045964241, "step": 2495, "valid_targets_mean": 2409.2, "valid_targets_min": 725 }, { "epoch": 4.006415396952686, "grad_norm": 0.7664612910352315, "learning_rate": 1.845910323150491e-05, "loss": 0.2998, "loss_nan_ranks": 0, "loss_rank_avg": 0.12675949931144714, "step": 2500, "valid_targets_mean": 2815.8, "valid_targets_min": 1370 }, { "epoch": 4.014434643143544, "grad_norm": 0.6249341429920836, "learning_rate": 1.8379434883852255e-05, "loss": 0.3047, "loss_nan_ranks": 0, "loss_rank_avg": 0.1351551115512848, "step": 2505, "valid_targets_mean": 3788.1, "valid_targets_min": 1445 }, { "epoch": 4.022453889334402, "grad_norm": 0.6169426406721958, "learning_rate": 1.8299792412344524e-05, "loss": 0.2996, "loss_nan_ranks": 0, "loss_rank_avg": 0.19960349798202515, "step": 2510, "valid_targets_mean": 5476.1, "valid_targets_min": 1675 }, { "epoch": 4.030473135525261, "grad_norm": 0.6980740210909196, "learning_rate": 1.8220177088661635e-05, "loss": 0.292, "loss_nan_ranks": 0, "loss_rank_avg": 0.1375872790813446, "step": 2515, "valid_targets_mean": 3389.1, "valid_targets_min": 1106 }, { "epoch": 4.038492381716119, "grad_norm": 0.6326648876922993, "learning_rate": 1.814059018405004e-05, "loss": 0.2739, "loss_nan_ranks": 0, "loss_rank_avg": 0.2054217904806137, "step": 2520, "valid_targets_mean": 4802.5, "valid_targets_min": 1526 }, { "epoch": 4.046511627906977, "grad_norm": 0.5533039222556833, "learning_rate": 1.806103296930243e-05, "loss": 0.2847, "loss_nan_ranks": 0, "loss_rank_avg": 0.12456436455249786, "step": 2525, "valid_targets_mean": 4612.8, "valid_targets_min": 917 }, { "epoch": 4.054530874097835, "grad_norm": 0.7546658667065802, "learning_rate": 1.7981506714737392e-05, "loss": 0.297, "loss_nan_ranks": 0, "loss_rank_avg": 0.1207520067691803, "step": 2530, "valid_targets_mean": 2114.4, "valid_targets_min": 1501 }, { "epoch": 4.062550120288693, "grad_norm": 0.7903494861888394, "learning_rate": 1.7902012690179188e-05, "loss": 0.2944, "loss_nan_ranks": 0, "loss_rank_avg": 0.17907792329788208, "step": 2535, "valid_targets_mean": 2663.4, "valid_targets_min": 1352 }, { "epoch": 4.070569366479551, "grad_norm": 0.5392010413967019, "learning_rate": 1.7822552164937437e-05, "loss": 0.2722, "loss_nan_ranks": 0, "loss_rank_avg": 0.1764984130859375, "step": 2540, "valid_targets_mean": 6216.5, "valid_targets_min": 1486 }, { "epoch": 4.078588612670409, "grad_norm": 0.6218958225310146, "learning_rate": 1.7743126407786873e-05, "loss": 0.2998, "loss_nan_ranks": 0, "loss_rank_avg": 0.12865877151489258, "step": 2545, "valid_targets_mean": 3260.6, "valid_targets_min": 1072 }, { "epoch": 4.086607858861267, "grad_norm": 0.6988079855685614, "learning_rate": 1.766373668694707e-05, "loss": 0.2939, "loss_nan_ranks": 0, "loss_rank_avg": 0.18029667437076569, "step": 2550, "valid_targets_mean": 4027.5, "valid_targets_min": 1291 }, { "epoch": 4.094627105052125, "grad_norm": 0.6850210709213693, "learning_rate": 1.7584384270062195e-05, "loss": 0.2788, "loss_nan_ranks": 0, "loss_rank_avg": 0.1642959713935852, "step": 2555, "valid_targets_mean": 3666.5, "valid_targets_min": 1856 }, { "epoch": 4.102646351242983, "grad_norm": 0.7292850754819737, "learning_rate": 1.7505070424180772e-05, "loss": 0.2918, "loss_nan_ranks": 0, "loss_rank_avg": 0.1267768293619156, "step": 2560, "valid_targets_mean": 3086.2, "valid_targets_min": 2045 }, { "epoch": 4.110665597433841, "grad_norm": 0.5967251682445334, "learning_rate": 1.7425796415735454e-05, "loss": 0.2875, "loss_nan_ranks": 0, "loss_rank_avg": 0.1499030888080597, "step": 2565, "valid_targets_mean": 5102.1, "valid_targets_min": 1401 }, { "epoch": 4.118684843624699, "grad_norm": 0.6571378352373214, "learning_rate": 1.7346563510522783e-05, "loss": 0.2942, "loss_nan_ranks": 0, "loss_rank_avg": 0.16292981803417206, "step": 2570, "valid_targets_mean": 4743.0, "valid_targets_min": 1578 }, { "epoch": 4.126704089815557, "grad_norm": 0.675497128387472, "learning_rate": 1.7267372973682998e-05, "loss": 0.2799, "loss_nan_ranks": 0, "loss_rank_avg": 0.1479819118976593, "step": 2575, "valid_targets_mean": 3963.6, "valid_targets_min": 1729 }, { "epoch": 4.134723336006416, "grad_norm": 0.7326592923300912, "learning_rate": 1.7188226069679834e-05, "loss": 0.3031, "loss_nan_ranks": 0, "loss_rank_avg": 0.19977575540542603, "step": 2580, "valid_targets_mean": 3865.2, "valid_targets_min": 1590 }, { "epoch": 4.142742582197274, "grad_norm": 0.6873671648413628, "learning_rate": 1.7109124062280307e-05, "loss": 0.3447, "loss_nan_ranks": 0, "loss_rank_avg": 0.14063113927841187, "step": 2585, "valid_targets_mean": 4487.2, "valid_targets_min": 692 }, { "epoch": 4.150761828388132, "grad_norm": 0.6095576855334193, "learning_rate": 1.7030068214534567e-05, "loss": 0.3086, "loss_nan_ranks": 0, "loss_rank_avg": 0.23792943358421326, "step": 2590, "valid_targets_mean": 5420.4, "valid_targets_min": 1196 }, { "epoch": 4.1587810745789895, "grad_norm": 0.5830732903880987, "learning_rate": 1.695105978875572e-05, "loss": 0.3001, "loss_nan_ranks": 0, "loss_rank_avg": 0.23750761151313782, "step": 2595, "valid_targets_mean": 6366.0, "valid_targets_min": 1360 }, { "epoch": 4.166800320769847, "grad_norm": 1.3716635476926997, "learning_rate": 1.687210004649965e-05, "loss": 0.2893, "loss_nan_ranks": 0, "loss_rank_avg": 0.16633760929107666, "step": 2600, "valid_targets_mean": 3487.9, "valid_targets_min": 1588 }, { "epoch": 4.174819566960705, "grad_norm": 0.5938899390350082, "learning_rate": 1.679319024854491e-05, "loss": 0.2881, "loss_nan_ranks": 0, "loss_rank_avg": 0.11015024781227112, "step": 2605, "valid_targets_mean": 3193.2, "valid_targets_min": 2061 }, { "epoch": 4.182838813151564, "grad_norm": 0.6326797027989053, "learning_rate": 1.6714331654872564e-05, "loss": 0.2857, "loss_nan_ranks": 0, "loss_rank_avg": 0.11679890751838684, "step": 2610, "valid_targets_mean": 3417.5, "valid_targets_min": 1365 }, { "epoch": 4.190858059342422, "grad_norm": 0.7312342864342426, "learning_rate": 1.663552552464609e-05, "loss": 0.2986, "loss_nan_ranks": 0, "loss_rank_avg": 0.18835344910621643, "step": 2615, "valid_targets_mean": 4148.8, "valid_targets_min": 1673 }, { "epoch": 4.19887730553328, "grad_norm": 0.7173472704001893, "learning_rate": 1.6556773116191257e-05, "loss": 0.2852, "loss_nan_ranks": 0, "loss_rank_avg": 0.20450419187545776, "step": 2620, "valid_targets_mean": 3396.1, "valid_targets_min": 1668 }, { "epoch": 4.206896551724138, "grad_norm": 0.77329570396891, "learning_rate": 1.647807568697603e-05, "loss": 0.2996, "loss_nan_ranks": 0, "loss_rank_avg": 0.11599031090736389, "step": 2625, "valid_targets_mean": 2351.6, "valid_targets_min": 1421 }, { "epoch": 4.214915797914996, "grad_norm": 0.5845000243505154, "learning_rate": 1.6399434493590524e-05, "loss": 0.2922, "loss_nan_ranks": 0, "loss_rank_avg": 0.09674696624279022, "step": 2630, "valid_targets_mean": 4645.5, "valid_targets_min": 989 }, { "epoch": 4.222935044105854, "grad_norm": 0.6011721501271884, "learning_rate": 1.6320850791726884e-05, "loss": 0.3061, "loss_nan_ranks": 0, "loss_rank_avg": 0.12517546117305756, "step": 2635, "valid_targets_mean": 4551.5, "valid_targets_min": 1533 }, { "epoch": 4.230954290296712, "grad_norm": 0.6399303295964973, "learning_rate": 1.6242325836159304e-05, "loss": 0.2878, "loss_nan_ranks": 0, "loss_rank_avg": 0.08618373423814774, "step": 2640, "valid_targets_mean": 3065.9, "valid_targets_min": 1593 }, { "epoch": 4.2389735364875705, "grad_norm": 0.6249080756872688, "learning_rate": 1.6163860880723923e-05, "loss": 0.2857, "loss_nan_ranks": 0, "loss_rank_avg": 0.1666812002658844, "step": 2645, "valid_targets_mean": 5007.8, "valid_targets_min": 1590 }, { "epoch": 4.246992782678428, "grad_norm": 0.7629237085664993, "learning_rate": 1.6085457178298866e-05, "loss": 0.2786, "loss_nan_ranks": 0, "loss_rank_avg": 0.20086871087551117, "step": 2650, "valid_targets_mean": 3285.4, "valid_targets_min": 1072 }, { "epoch": 4.255012028869286, "grad_norm": 0.6291560094829501, "learning_rate": 1.6007115980784182e-05, "loss": 0.2894, "loss_nan_ranks": 0, "loss_rank_avg": 0.14886760711669922, "step": 2655, "valid_targets_mean": 3889.0, "valid_targets_min": 984 }, { "epoch": 4.263031275060144, "grad_norm": 0.592396380167956, "learning_rate": 1.592883853908188e-05, "loss": 0.2856, "loss_nan_ranks": 0, "loss_rank_avg": 0.16692480444908142, "step": 2660, "valid_targets_mean": 5258.0, "valid_targets_min": 1757 }, { "epoch": 4.271050521251002, "grad_norm": 0.614901407527612, "learning_rate": 1.585062610307599e-05, "loss": 0.2745, "loss_nan_ranks": 0, "loss_rank_avg": 0.12212534993886948, "step": 2665, "valid_targets_mean": 3828.4, "valid_targets_min": 1512 }, { "epoch": 4.27906976744186, "grad_norm": 0.539175507420039, "learning_rate": 1.5772479921612543e-05, "loss": 0.2961, "loss_nan_ranks": 0, "loss_rank_avg": 0.1522282361984253, "step": 2670, "valid_targets_mean": 5116.0, "valid_targets_min": 2192 }, { "epoch": 4.287089013632719, "grad_norm": 0.7880906493055246, "learning_rate": 1.5694401242479677e-05, "loss": 0.2858, "loss_nan_ranks": 0, "loss_rank_avg": 0.14232610166072845, "step": 2675, "valid_targets_mean": 2413.8, "valid_targets_min": 947 }, { "epoch": 4.295108259823577, "grad_norm": 0.7072732280589041, "learning_rate": 1.5616391312387683e-05, "loss": 0.2819, "loss_nan_ranks": 0, "loss_rank_avg": 0.12438453733921051, "step": 2680, "valid_targets_mean": 2989.5, "valid_targets_min": 1407 }, { "epoch": 4.303127506014435, "grad_norm": 0.6071341451929586, "learning_rate": 1.5538451376949106e-05, "loss": 0.2809, "loss_nan_ranks": 0, "loss_rank_avg": 0.16311699151992798, "step": 2685, "valid_targets_mean": 3806.5, "valid_targets_min": 2208 }, { "epoch": 4.311146752205293, "grad_norm": 0.6800851010260914, "learning_rate": 1.5460582680658888e-05, "loss": 0.2735, "loss_nan_ranks": 0, "loss_rank_avg": 0.16989164054393768, "step": 2690, "valid_targets_mean": 3681.4, "valid_targets_min": 1333 }, { "epoch": 4.319165998396151, "grad_norm": 0.48556758234567987, "learning_rate": 1.5382786466874446e-05, "loss": 0.3001, "loss_nan_ranks": 0, "loss_rank_avg": 0.14437130093574524, "step": 2695, "valid_targets_mean": 4970.8, "valid_targets_min": 1122 }, { "epoch": 4.3271852445870085, "grad_norm": 0.6577443016532359, "learning_rate": 1.5305063977795856e-05, "loss": 0.3022, "loss_nan_ranks": 0, "loss_rank_avg": 0.11139737069606781, "step": 2700, "valid_targets_mean": 2757.2, "valid_targets_min": 1281 }, { "epoch": 4.335204490777867, "grad_norm": 0.6182840648525525, "learning_rate": 1.5227416454445995e-05, "loss": 0.2799, "loss_nan_ranks": 0, "loss_rank_avg": 0.12627378106117249, "step": 2705, "valid_targets_mean": 3772.1, "valid_targets_min": 1144 }, { "epoch": 4.343223736968725, "grad_norm": 0.6243168028194502, "learning_rate": 1.5149845136650748e-05, "loss": 0.2998, "loss_nan_ranks": 0, "loss_rank_avg": 0.12724119424819946, "step": 2710, "valid_targets_mean": 3995.0, "valid_targets_min": 1201 }, { "epoch": 4.351242983159583, "grad_norm": 0.6417026983652291, "learning_rate": 1.5072351263019177e-05, "loss": 0.2763, "loss_nan_ranks": 0, "loss_rank_avg": 0.1036786288022995, "step": 2715, "valid_targets_mean": 3606.6, "valid_targets_min": 1458 }, { "epoch": 4.359262229350441, "grad_norm": 0.844392440282072, "learning_rate": 1.4994936070923784e-05, "loss": 0.3144, "loss_nan_ranks": 0, "loss_rank_avg": 0.32359081506729126, "step": 2720, "valid_targets_mean": 4454.1, "valid_targets_min": 1068 }, { "epoch": 4.367281475541299, "grad_norm": 0.7084510197391164, "learning_rate": 1.4917600796480745e-05, "loss": 0.2827, "loss_nan_ranks": 0, "loss_rank_avg": 0.1323051005601883, "step": 2725, "valid_targets_mean": 2887.8, "valid_targets_min": 1694 }, { "epoch": 4.375300721732157, "grad_norm": 0.6594726779847885, "learning_rate": 1.4840346674530122e-05, "loss": 0.3044, "loss_nan_ranks": 0, "loss_rank_avg": 0.1922025829553604, "step": 2730, "valid_targets_mean": 4383.1, "valid_targets_min": 1635 }, { "epoch": 4.383319967923015, "grad_norm": 0.6820193540630956, "learning_rate": 1.4763174938616232e-05, "loss": 0.2756, "loss_nan_ranks": 0, "loss_rank_avg": 0.14726585149765015, "step": 2735, "valid_targets_mean": 3319.2, "valid_targets_min": 1885 }, { "epoch": 4.391339214113874, "grad_norm": 0.6015328925160687, "learning_rate": 1.4686086820967865e-05, "loss": 0.3106, "loss_nan_ranks": 0, "loss_rank_avg": 0.162798672914505, "step": 2740, "valid_targets_mean": 4476.4, "valid_targets_min": 1696 }, { "epoch": 4.3993584603047315, "grad_norm": 0.8278448591901193, "learning_rate": 1.460908355247868e-05, "loss": 0.3411, "loss_nan_ranks": 0, "loss_rank_avg": 0.14701534807682037, "step": 2745, "valid_targets_mean": 2546.6, "valid_targets_min": 1403 }, { "epoch": 4.4073777064955895, "grad_norm": 0.7021457185806277, "learning_rate": 1.4532166362687507e-05, "loss": 0.2801, "loss_nan_ranks": 0, "loss_rank_avg": 0.25253719091415405, "step": 2750, "valid_targets_mean": 4316.8, "valid_targets_min": 2207 }, { "epoch": 4.415396952686447, "grad_norm": 0.7067776926843179, "learning_rate": 1.445533647975871e-05, "loss": 0.2978, "loss_nan_ranks": 0, "loss_rank_avg": 0.16636572778224945, "step": 2755, "valid_targets_mean": 3728.9, "valid_targets_min": 1401 }, { "epoch": 4.423416198877305, "grad_norm": 0.553065216859592, "learning_rate": 1.437859513046263e-05, "loss": 0.2908, "loss_nan_ranks": 0, "loss_rank_avg": 0.22052179276943207, "step": 2760, "valid_targets_mean": 7221.8, "valid_targets_min": 2063 }, { "epoch": 4.431435445068163, "grad_norm": 0.7333787563498618, "learning_rate": 1.4301943540155914e-05, "loss": 0.3001, "loss_nan_ranks": 0, "loss_rank_avg": 0.14278584718704224, "step": 2765, "valid_targets_mean": 3379.8, "valid_targets_min": 1436 }, { "epoch": 4.439454691259022, "grad_norm": 0.7014878612639377, "learning_rate": 1.4225382932762033e-05, "loss": 0.2778, "loss_nan_ranks": 0, "loss_rank_avg": 0.12255248427391052, "step": 2770, "valid_targets_mean": 2985.6, "valid_targets_min": 1121 }, { "epoch": 4.44747393744988, "grad_norm": 0.5983108500408503, "learning_rate": 1.4148914530751681e-05, "loss": 0.2955, "loss_nan_ranks": 0, "loss_rank_avg": 0.15522173047065735, "step": 2775, "valid_targets_mean": 4806.6, "valid_targets_min": 1304 }, { "epoch": 4.455493183640738, "grad_norm": 0.6016213588313895, "learning_rate": 1.4072539555123292e-05, "loss": 0.2839, "loss_nan_ranks": 0, "loss_rank_avg": 0.11137634515762329, "step": 2780, "valid_targets_mean": 3612.9, "valid_targets_min": 1023 }, { "epoch": 4.463512429831596, "grad_norm": 0.708603157173453, "learning_rate": 1.3996259225383514e-05, "loss": 0.3017, "loss_nan_ranks": 0, "loss_rank_avg": 0.19193142652511597, "step": 2785, "valid_targets_mean": 3475.4, "valid_targets_min": 1384 }, { "epoch": 4.471531676022454, "grad_norm": 0.6595079377732089, "learning_rate": 1.3920074759527737e-05, "loss": 0.2925, "loss_nan_ranks": 0, "loss_rank_avg": 0.14381149411201477, "step": 2790, "valid_targets_mean": 4244.5, "valid_targets_min": 1644 }, { "epoch": 4.479550922213312, "grad_norm": 0.682347199348743, "learning_rate": 1.3843987374020689e-05, "loss": 0.3107, "loss_nan_ranks": 0, "loss_rank_avg": 0.11310821771621704, "step": 2795, "valid_targets_mean": 2818.0, "valid_targets_min": 1144 }, { "epoch": 4.4875701684041704, "grad_norm": 0.673708092784138, "learning_rate": 1.376799828377696e-05, "loss": 0.2811, "loss_nan_ranks": 0, "loss_rank_avg": 0.1609186977148056, "step": 2800, "valid_targets_mean": 4392.5, "valid_targets_min": 1682 }, { "epoch": 4.495589414595028, "grad_norm": 0.7701654224555916, "learning_rate": 1.3692108702141642e-05, "loss": 0.2948, "loss_nan_ranks": 0, "loss_rank_avg": 0.16439709067344666, "step": 2805, "valid_targets_mean": 3979.4, "valid_targets_min": 1068 }, { "epoch": 4.503608660785886, "grad_norm": 0.747752295214148, "learning_rate": 1.361631984087091e-05, "loss": 0.2924, "loss_nan_ranks": 0, "loss_rank_avg": 0.19700704514980316, "step": 2810, "valid_targets_mean": 4090.0, "valid_targets_min": 1721 }, { "epoch": 4.511627906976744, "grad_norm": 0.6477208313095743, "learning_rate": 1.354063291011273e-05, "loss": 0.3032, "loss_nan_ranks": 0, "loss_rank_avg": 0.16184011101722717, "step": 2815, "valid_targets_mean": 4613.4, "valid_targets_min": 1128 }, { "epoch": 4.519647153167602, "grad_norm": 0.6733680816426071, "learning_rate": 1.3465049118387486e-05, "loss": 0.2851, "loss_nan_ranks": 0, "loss_rank_avg": 0.10472169518470764, "step": 2820, "valid_targets_mean": 2796.8, "valid_targets_min": 851 }, { "epoch": 4.52766639935846, "grad_norm": 0.6424194689152843, "learning_rate": 1.3389569672568707e-05, "loss": 0.2667, "loss_nan_ranks": 0, "loss_rank_avg": 0.13144317269325256, "step": 2825, "valid_targets_mean": 3813.0, "valid_targets_min": 1258 }, { "epoch": 4.535685645549318, "grad_norm": 0.711628727877956, "learning_rate": 1.331419577786381e-05, "loss": 0.3032, "loss_nan_ranks": 0, "loss_rank_avg": 0.1445176601409912, "step": 2830, "valid_targets_mean": 3091.0, "valid_targets_min": 1269 }, { "epoch": 4.543704891740177, "grad_norm": 0.5858426317676418, "learning_rate": 1.3238928637794816e-05, "loss": 0.3152, "loss_nan_ranks": 0, "loss_rank_avg": 0.1151544451713562, "step": 2835, "valid_targets_mean": 3128.2, "valid_targets_min": 1702 }, { "epoch": 4.551724137931035, "grad_norm": 0.5285642967965074, "learning_rate": 1.3163769454179183e-05, "loss": 0.3059, "loss_nan_ranks": 0, "loss_rank_avg": 0.11126041412353516, "step": 2840, "valid_targets_mean": 4345.5, "valid_targets_min": 1215 }, { "epoch": 4.559743384121893, "grad_norm": 0.6880573162367785, "learning_rate": 1.3088719427110552e-05, "loss": 0.2954, "loss_nan_ranks": 0, "loss_rank_avg": 0.17842459678649902, "step": 2845, "valid_targets_mean": 3686.1, "valid_targets_min": 1141 }, { "epoch": 4.5677626303127505, "grad_norm": 0.5738068890763433, "learning_rate": 1.3013779754939666e-05, "loss": 0.2609, "loss_nan_ranks": 0, "loss_rank_avg": 0.08108074963092804, "step": 2850, "valid_targets_mean": 3041.1, "valid_targets_min": 1131 }, { "epoch": 4.5757818765036085, "grad_norm": 0.6727608318013361, "learning_rate": 1.2938951634255164e-05, "loss": 0.3086, "loss_nan_ranks": 0, "loss_rank_avg": 0.14837145805358887, "step": 2855, "valid_targets_mean": 3484.1, "valid_targets_min": 781 }, { "epoch": 4.583801122694466, "grad_norm": 0.7491945483704048, "learning_rate": 1.2864236259864495e-05, "loss": 0.2927, "loss_nan_ranks": 0, "loss_rank_avg": 0.17192235589027405, "step": 2860, "valid_targets_mean": 3492.8, "valid_targets_min": 1388 }, { "epoch": 4.591820368885324, "grad_norm": 0.7333536011748594, "learning_rate": 1.2789634824774887e-05, "loss": 0.2812, "loss_nan_ranks": 0, "loss_rank_avg": 0.12326601147651672, "step": 2865, "valid_targets_mean": 2463.1, "valid_targets_min": 849 }, { "epoch": 4.599839615076183, "grad_norm": 0.6618282090733283, "learning_rate": 1.2715148520174206e-05, "loss": 0.3116, "loss_nan_ranks": 0, "loss_rank_avg": 0.13372093439102173, "step": 2870, "valid_targets_mean": 3236.8, "valid_targets_min": 1867 }, { "epoch": 4.607858861267041, "grad_norm": 0.5773713859304231, "learning_rate": 1.2640778535412036e-05, "loss": 0.2774, "loss_nan_ranks": 0, "loss_rank_avg": 0.1293078362941742, "step": 2875, "valid_targets_mean": 4062.0, "valid_targets_min": 1491 }, { "epoch": 4.615878107457899, "grad_norm": 0.5752357451602147, "learning_rate": 1.2566526057980608e-05, "loss": 0.2874, "loss_nan_ranks": 0, "loss_rank_avg": 0.14979536831378937, "step": 2880, "valid_targets_mean": 6125.9, "valid_targets_min": 1865 }, { "epoch": 4.623897353648757, "grad_norm": 0.718233009091973, "learning_rate": 1.2492392273495879e-05, "loss": 0.2886, "loss_nan_ranks": 0, "loss_rank_avg": 0.15855081379413605, "step": 2885, "valid_targets_mean": 3574.5, "valid_targets_min": 1157 }, { "epoch": 4.631916599839615, "grad_norm": 0.6385022169911636, "learning_rate": 1.2418378365678612e-05, "loss": 0.3064, "loss_nan_ranks": 0, "loss_rank_avg": 0.11923573911190033, "step": 2890, "valid_targets_mean": 3496.6, "valid_targets_min": 1233 }, { "epoch": 4.639935846030474, "grad_norm": 0.6741105564550025, "learning_rate": 1.234448551633542e-05, "loss": 0.2998, "loss_nan_ranks": 0, "loss_rank_avg": 0.13079974055290222, "step": 2895, "valid_targets_mean": 3383.1, "valid_targets_min": 1756 }, { "epoch": 4.6479550922213315, "grad_norm": 0.6731032246078844, "learning_rate": 1.2270714905339969e-05, "loss": 0.2882, "loss_nan_ranks": 0, "loss_rank_avg": 0.13784664869308472, "step": 2900, "valid_targets_mean": 3501.4, "valid_targets_min": 1172 }, { "epoch": 4.655974338412189, "grad_norm": 0.5459817806212016, "learning_rate": 1.2197067710614075e-05, "loss": 0.2899, "loss_nan_ranks": 0, "loss_rank_avg": 0.1550457924604416, "step": 2905, "valid_targets_mean": 6346.2, "valid_targets_min": 1452 }, { "epoch": 4.663993584603047, "grad_norm": 0.6580847788724664, "learning_rate": 1.2123545108108943e-05, "loss": 0.2926, "loss_nan_ranks": 0, "loss_rank_avg": 0.14394521713256836, "step": 2910, "valid_targets_mean": 3643.9, "valid_targets_min": 1347 }, { "epoch": 4.672012830793905, "grad_norm": 0.5599219227017097, "learning_rate": 1.2050148271786348e-05, "loss": 0.2973, "loss_nan_ranks": 0, "loss_rank_avg": 0.20623619854450226, "step": 2915, "valid_targets_mean": 5556.8, "valid_targets_min": 2400 }, { "epoch": 4.680032076984763, "grad_norm": 0.664894094376875, "learning_rate": 1.1976878373599928e-05, "loss": 0.278, "loss_nan_ranks": 0, "loss_rank_avg": 0.09952618926763535, "step": 2920, "valid_targets_mean": 2577.0, "valid_targets_min": 1282 }, { "epoch": 4.688051323175621, "grad_norm": 0.7111094446633587, "learning_rate": 1.1903736583476441e-05, "loss": 0.299, "loss_nan_ranks": 0, "loss_rank_avg": 0.12671411037445068, "step": 2925, "valid_targets_mean": 3261.9, "valid_targets_min": 1935 }, { "epoch": 4.69607056936648, "grad_norm": 0.5847651766990055, "learning_rate": 1.1830724069297106e-05, "loss": 0.3046, "loss_nan_ranks": 0, "loss_rank_avg": 0.1780378818511963, "step": 2930, "valid_targets_mean": 5556.0, "valid_targets_min": 1506 }, { "epoch": 4.704089815557338, "grad_norm": 0.5177468999912241, "learning_rate": 1.1757841996878957e-05, "loss": 0.2913, "loss_nan_ranks": 0, "loss_rank_avg": 0.16140317916870117, "step": 2935, "valid_targets_mean": 7164.5, "valid_targets_min": 1599 }, { "epoch": 4.712109061748196, "grad_norm": 0.6591016413495835, "learning_rate": 1.1685091529956187e-05, "loss": 0.3122, "loss_nan_ranks": 0, "loss_rank_avg": 0.17742176353931427, "step": 2940, "valid_targets_mean": 4117.8, "valid_targets_min": 1422 }, { "epoch": 4.720128307939054, "grad_norm": 0.5580423423386793, "learning_rate": 1.161247383016163e-05, "loss": 0.2927, "loss_nan_ranks": 0, "loss_rank_avg": 0.1325514018535614, "step": 2945, "valid_targets_mean": 4791.0, "valid_targets_min": 1252 }, { "epoch": 4.728147554129912, "grad_norm": 0.698865733709361, "learning_rate": 1.1539990057008166e-05, "loss": 0.2906, "loss_nan_ranks": 0, "loss_rank_avg": 0.18542318046092987, "step": 2950, "valid_targets_mean": 4443.1, "valid_targets_min": 1629 }, { "epoch": 4.7361668003207695, "grad_norm": 0.7173027421251956, "learning_rate": 1.1467641367870198e-05, "loss": 0.296, "loss_nan_ranks": 0, "loss_rank_avg": 0.12904459238052368, "step": 2955, "valid_targets_mean": 2821.5, "valid_targets_min": 1393 }, { "epoch": 4.7441860465116275, "grad_norm": 0.6104913487741482, "learning_rate": 1.1395428917965239e-05, "loss": 0.3091, "loss_nan_ranks": 0, "loss_rank_avg": 0.12366154789924622, "step": 2960, "valid_targets_mean": 3687.4, "valid_targets_min": 2668 }, { "epoch": 4.752205292702486, "grad_norm": 0.6573756048140178, "learning_rate": 1.1323353860335385e-05, "loss": 0.2908, "loss_nan_ranks": 0, "loss_rank_avg": 0.14900854229927063, "step": 2965, "valid_targets_mean": 3873.4, "valid_targets_min": 1095 }, { "epoch": 4.760224538893344, "grad_norm": 0.5454178642416636, "learning_rate": 1.1251417345828962e-05, "loss": 0.2931, "loss_nan_ranks": 0, "loss_rank_avg": 0.1441696435213089, "step": 2970, "valid_targets_mean": 4109.6, "valid_targets_min": 1283 }, { "epoch": 4.768243785084202, "grad_norm": 1.1921633161653373, "learning_rate": 1.1179620523082107e-05, "loss": 0.289, "loss_nan_ranks": 0, "loss_rank_avg": 0.18217259645462036, "step": 2975, "valid_targets_mean": 5515.0, "valid_targets_min": 1708 }, { "epoch": 4.77626303127506, "grad_norm": 0.7839193007975936, "learning_rate": 1.110796453850047e-05, "loss": 0.2827, "loss_nan_ranks": 0, "loss_rank_avg": 0.15419209003448486, "step": 2980, "valid_targets_mean": 3332.9, "valid_targets_min": 897 }, { "epoch": 4.784282277465918, "grad_norm": 0.5924502741680564, "learning_rate": 1.1036450536240877e-05, "loss": 0.299, "loss_nan_ranks": 0, "loss_rank_avg": 0.17344138026237488, "step": 2985, "valid_targets_mean": 4609.0, "valid_targets_min": 1500 }, { "epoch": 4.792301523656777, "grad_norm": 0.6375960120782795, "learning_rate": 1.0965079658193068e-05, "loss": 0.307, "loss_nan_ranks": 0, "loss_rank_avg": 0.20021280646324158, "step": 2990, "valid_targets_mean": 5160.4, "valid_targets_min": 2007 }, { "epoch": 4.800320769847635, "grad_norm": 0.7333265185533147, "learning_rate": 1.0893853043961475e-05, "loss": 0.2999, "loss_nan_ranks": 0, "loss_rank_avg": 0.13082224130630493, "step": 2995, "valid_targets_mean": 2873.8, "valid_targets_min": 961 }, { "epoch": 4.808340016038493, "grad_norm": 0.8117410325104224, "learning_rate": 1.0822771830847011e-05, "loss": 0.2915, "loss_nan_ranks": 0, "loss_rank_avg": 0.11903451383113861, "step": 3000, "valid_targets_mean": 2380.4, "valid_targets_min": 1009 }, { "epoch": 4.8163592622293505, "grad_norm": 0.6321140084556661, "learning_rate": 1.0751837153828926e-05, "loss": 0.3312, "loss_nan_ranks": 0, "loss_rank_avg": 0.13263818621635437, "step": 3005, "valid_targets_mean": 3883.4, "valid_targets_min": 1728 }, { "epoch": 4.824378508420208, "grad_norm": 0.5936225667367856, "learning_rate": 1.0681050145546666e-05, "loss": 0.2935, "loss_nan_ranks": 0, "loss_rank_avg": 0.10457971692085266, "step": 3010, "valid_targets_mean": 2851.5, "valid_targets_min": 1276 }, { "epoch": 4.832397754611066, "grad_norm": 0.747286134721582, "learning_rate": 1.0610411936281801e-05, "loss": 0.2976, "loss_nan_ranks": 0, "loss_rank_avg": 0.15670940279960632, "step": 3015, "valid_targets_mean": 2873.4, "valid_targets_min": 1605 }, { "epoch": 4.840417000801924, "grad_norm": 0.5763464609476979, "learning_rate": 1.0539923653939978e-05, "loss": 0.2869, "loss_nan_ranks": 0, "loss_rank_avg": 0.13804122805595398, "step": 3020, "valid_targets_mean": 4552.0, "valid_targets_min": 1908 }, { "epoch": 4.848436246992783, "grad_norm": 0.6601870709466612, "learning_rate": 1.0469586424032903e-05, "loss": 0.2967, "loss_nan_ranks": 0, "loss_rank_avg": 0.13651859760284424, "step": 3025, "valid_targets_mean": 3073.1, "valid_targets_min": 1515 }, { "epoch": 4.856455493183641, "grad_norm": 0.6137610848624081, "learning_rate": 1.0399401369660369e-05, "loss": 0.2923, "loss_nan_ranks": 0, "loss_rank_avg": 0.1242741197347641, "step": 3030, "valid_targets_mean": 3265.4, "valid_targets_min": 1837 }, { "epoch": 4.864474739374499, "grad_norm": 0.5798299445809169, "learning_rate": 1.0329369611492334e-05, "loss": 0.2971, "loss_nan_ranks": 0, "loss_rank_avg": 0.1235361248254776, "step": 3035, "valid_targets_mean": 4151.0, "valid_targets_min": 1387 }, { "epoch": 4.872493985565357, "grad_norm": 0.7065656337789246, "learning_rate": 1.0259492267751022e-05, "loss": 0.3057, "loss_nan_ranks": 0, "loss_rank_avg": 0.14881673455238342, "step": 3040, "valid_targets_mean": 3253.1, "valid_targets_min": 1251 }, { "epoch": 4.880513231756215, "grad_norm": 0.7084555430039885, "learning_rate": 1.0189770454193052e-05, "loss": 0.3146, "loss_nan_ranks": 0, "loss_rank_avg": 0.13089048862457275, "step": 3045, "valid_targets_mean": 3153.9, "valid_targets_min": 1193 }, { "epoch": 4.888532477947073, "grad_norm": 0.6319452934618477, "learning_rate": 1.0120205284091673e-05, "loss": 0.3106, "loss_nan_ranks": 0, "loss_rank_avg": 0.2694340944290161, "step": 3050, "valid_targets_mean": 5772.9, "valid_targets_min": 1506 }, { "epoch": 4.896551724137931, "grad_norm": 0.7347361203826404, "learning_rate": 1.0050797868218907e-05, "loss": 0.297, "loss_nan_ranks": 0, "loss_rank_avg": 0.13853907585144043, "step": 3055, "valid_targets_mean": 2785.8, "valid_targets_min": 1055 }, { "epoch": 4.904570970328789, "grad_norm": 0.6858744703319833, "learning_rate": 9.981549314827876e-06, "loss": 0.288, "loss_nan_ranks": 0, "loss_rank_avg": 0.10932730883359909, "step": 3060, "valid_targets_mean": 3593.2, "valid_targets_min": 1509 }, { "epoch": 4.912590216519647, "grad_norm": 0.7463965117098917, "learning_rate": 9.912460729635097e-06, "loss": 0.3002, "loss_nan_ranks": 0, "loss_rank_avg": 0.12026022374629974, "step": 3065, "valid_targets_mean": 2690.9, "valid_targets_min": 1464 }, { "epoch": 4.920609462710505, "grad_norm": 0.6255584551399795, "learning_rate": 9.843533215802796e-06, "loss": 0.3031, "loss_nan_ranks": 0, "loss_rank_avg": 0.12835003435611725, "step": 3070, "valid_targets_mean": 4192.9, "valid_targets_min": 1599 }, { "epoch": 4.928628708901363, "grad_norm": 0.6195598668042773, "learning_rate": 9.774767873921357e-06, "loss": 0.2901, "loss_nan_ranks": 0, "loss_rank_avg": 0.15083155035972595, "step": 3075, "valid_targets_mean": 4717.8, "valid_targets_min": 1495 }, { "epoch": 4.936647955092221, "grad_norm": 0.6716462013810224, "learning_rate": 9.706165801991651e-06, "loss": 0.3178, "loss_nan_ranks": 0, "loss_rank_avg": 0.14034923911094666, "step": 3080, "valid_targets_mean": 3910.9, "valid_targets_min": 1345 }, { "epoch": 4.944667201283079, "grad_norm": 0.6569835195641757, "learning_rate": 9.637728095407593e-06, "loss": 0.3004, "loss_nan_ranks": 0, "loss_rank_avg": 0.12612038850784302, "step": 3085, "valid_targets_mean": 3746.1, "valid_targets_min": 1577 }, { "epoch": 4.952686447473938, "grad_norm": 0.63238747810288, "learning_rate": 9.56945584693861e-06, "loss": 0.3078, "loss_nan_ranks": 0, "loss_rank_avg": 0.1501215100288391, "step": 3090, "valid_targets_mean": 4018.1, "valid_targets_min": 1625 }, { "epoch": 4.960705693664796, "grad_norm": 0.7230137708810255, "learning_rate": 9.501350146712193e-06, "loss": 0.2841, "loss_nan_ranks": 0, "loss_rank_avg": 0.24168968200683594, "step": 3095, "valid_targets_mean": 4028.8, "valid_targets_min": 1868 }, { "epoch": 4.968724939855654, "grad_norm": 0.6319990610308012, "learning_rate": 9.433412082196527e-06, "loss": 0.3048, "loss_nan_ranks": 0, "loss_rank_avg": 0.12605804204940796, "step": 3100, "valid_targets_mean": 3486.5, "valid_targets_min": 2160 }, { "epoch": 4.976744186046512, "grad_norm": 0.5708536969900101, "learning_rate": 9.365642738183044e-06, "loss": 0.31, "loss_nan_ranks": 0, "loss_rank_avg": 0.15920937061309814, "step": 3105, "valid_targets_mean": 4990.1, "valid_targets_min": 1545 }, { "epoch": 4.9847634322373695, "grad_norm": 0.5821919214576043, "learning_rate": 9.298043196769217e-06, "loss": 0.3137, "loss_nan_ranks": 0, "loss_rank_avg": 0.15933553874492645, "step": 3110, "valid_targets_mean": 3565.8, "valid_targets_min": 1102 }, { "epoch": 4.992782678428227, "grad_norm": 0.6786847357729681, "learning_rate": 9.230614537341167e-06, "loss": 0.2848, "loss_nan_ranks": 0, "loss_rank_avg": 0.11117031425237656, "step": 3115, "valid_targets_mean": 2432.1, "valid_targets_min": 1158 }, { "epoch": 5.0, "grad_norm": 1.193829679462879, "learning_rate": 9.163357836556498e-06, "loss": 0.2992, "loss_nan_ranks": 0, "loss_rank_avg": 0.2876368761062622, "step": 3120, "valid_targets_mean": 2031.5, "valid_targets_min": 1107 }, { "epoch": 5.008019246190858, "grad_norm": 0.6109747091355935, "learning_rate": 9.096274168327122e-06, "loss": 0.2839, "loss_nan_ranks": 0, "loss_rank_avg": 0.12701627612113953, "step": 3125, "valid_targets_mean": 4074.0, "valid_targets_min": 1501 }, { "epoch": 5.016038492381716, "grad_norm": 0.6942276035599934, "learning_rate": 9.029364603802017e-06, "loss": 0.2734, "loss_nan_ranks": 0, "loss_rank_avg": 0.15716278553009033, "step": 3130, "valid_targets_mean": 4931.4, "valid_targets_min": 1926 }, { "epoch": 5.024057738572574, "grad_norm": 0.759887487112266, "learning_rate": 8.962630211350248e-06, "loss": 0.283, "loss_nan_ranks": 0, "loss_rank_avg": 0.14439627528190613, "step": 3135, "valid_targets_mean": 2814.2, "valid_targets_min": 1342 }, { "epoch": 5.032076984763433, "grad_norm": 0.599795720615974, "learning_rate": 8.89607205654378e-06, "loss": 0.272, "loss_nan_ranks": 0, "loss_rank_avg": 0.09469808638095856, "step": 3140, "valid_targets_mean": 3236.1, "valid_targets_min": 1353 }, { "epoch": 5.0400962309542905, "grad_norm": 0.6440035501543131, "learning_rate": 8.829691202140591e-06, "loss": 0.282, "loss_nan_ranks": 0, "loss_rank_avg": 0.12207989394664764, "step": 3145, "valid_targets_mean": 3591.8, "valid_targets_min": 1063 }, { "epoch": 5.048115477145148, "grad_norm": 0.5238916332457338, "learning_rate": 8.763488708067604e-06, "loss": 0.2804, "loss_nan_ranks": 0, "loss_rank_avg": 0.19291779398918152, "step": 3150, "valid_targets_mean": 6842.5, "valid_targets_min": 1696 }, { "epoch": 5.056134723336006, "grad_norm": 0.627305644963957, "learning_rate": 8.69746563140379e-06, "loss": 0.2764, "loss_nan_ranks": 0, "loss_rank_avg": 0.15898439288139343, "step": 3155, "valid_targets_mean": 5154.2, "valid_targets_min": 1161 }, { "epoch": 5.064153969526864, "grad_norm": 0.6325013348334049, "learning_rate": 8.631623026363331e-06, "loss": 0.2772, "loss_nan_ranks": 0, "loss_rank_avg": 0.17437998950481415, "step": 3160, "valid_targets_mean": 4743.2, "valid_targets_min": 1142 }, { "epoch": 5.072173215717722, "grad_norm": 0.5083461337913077, "learning_rate": 8.56596194427873e-06, "loss": 0.2767, "loss_nan_ranks": 0, "loss_rank_avg": 0.10465358197689056, "step": 3165, "valid_targets_mean": 4556.4, "valid_targets_min": 1869 }, { "epoch": 5.080192461908581, "grad_norm": 0.6420578870001568, "learning_rate": 8.500483433584054e-06, "loss": 0.321, "loss_nan_ranks": 0, "loss_rank_avg": 0.14743009209632874, "step": 3170, "valid_targets_mean": 4409.9, "valid_targets_min": 2802 }, { "epoch": 5.088211708099439, "grad_norm": 0.5800945332781065, "learning_rate": 8.435188539798187e-06, "loss": 0.288, "loss_nan_ranks": 0, "loss_rank_avg": 0.1412481814622879, "step": 3175, "valid_targets_mean": 5302.6, "valid_targets_min": 1094 }, { "epoch": 5.096230954290297, "grad_norm": 0.5487995493169565, "learning_rate": 8.370078305508136e-06, "loss": 0.259, "loss_nan_ranks": 0, "loss_rank_avg": 0.12816378474235535, "step": 3180, "valid_targets_mean": 3939.6, "valid_targets_min": 2281 }, { "epoch": 5.104250200481155, "grad_norm": 0.7209217869168146, "learning_rate": 8.305153770352384e-06, "loss": 0.2944, "loss_nan_ranks": 0, "loss_rank_avg": 0.19583243131637573, "step": 3185, "valid_targets_mean": 4046.2, "valid_targets_min": 1050 }, { "epoch": 5.112269446672013, "grad_norm": 0.9153844934361973, "learning_rate": 8.240415971004285e-06, "loss": 0.3015, "loss_nan_ranks": 0, "loss_rank_avg": 0.16246981918811798, "step": 3190, "valid_targets_mean": 3443.2, "valid_targets_min": 1358 }, { "epoch": 5.120288692862871, "grad_norm": 0.7035173116926543, "learning_rate": 8.175865941155525e-06, "loss": 0.2898, "loss_nan_ranks": 0, "loss_rank_avg": 0.16265368461608887, "step": 3195, "valid_targets_mean": 3864.9, "valid_targets_min": 1076 }, { "epoch": 5.1283079390537285, "grad_norm": 0.5779187110976927, "learning_rate": 8.111504711499598e-06, "loss": 0.2671, "loss_nan_ranks": 0, "loss_rank_avg": 0.18262943625450134, "step": 3200, "valid_targets_mean": 6109.2, "valid_targets_min": 1422 }, { "epoch": 5.136327185244587, "grad_norm": 0.7399562834821453, "learning_rate": 8.04733330971536e-06, "loss": 0.2837, "loss_nan_ranks": 0, "loss_rank_avg": 0.16191628575325012, "step": 3205, "valid_targets_mean": 3651.8, "valid_targets_min": 1524 }, { "epoch": 5.144346431435445, "grad_norm": 0.5525253134787564, "learning_rate": 7.983352760450618e-06, "loss": 0.2571, "loss_nan_ranks": 0, "loss_rank_avg": 0.0911126509308815, "step": 3210, "valid_targets_mean": 3176.1, "valid_targets_min": 1182 }, { "epoch": 5.152365677626303, "grad_norm": 0.5882943311329101, "learning_rate": 7.919564085305768e-06, "loss": 0.2739, "loss_nan_ranks": 0, "loss_rank_avg": 0.1868501901626587, "step": 3215, "valid_targets_mean": 6299.4, "valid_targets_min": 1645 }, { "epoch": 5.160384923817161, "grad_norm": 0.6106884984641533, "learning_rate": 7.855968302817487e-06, "loss": 0.2791, "loss_nan_ranks": 0, "loss_rank_avg": 0.12039339542388916, "step": 3220, "valid_targets_mean": 3778.2, "valid_targets_min": 2175 }, { "epoch": 5.168404170008019, "grad_norm": 0.7089376796426653, "learning_rate": 7.792566428442456e-06, "loss": 0.2862, "loss_nan_ranks": 0, "loss_rank_avg": 0.11271081864833832, "step": 3225, "valid_targets_mean": 2812.2, "valid_targets_min": 1319 }, { "epoch": 5.176423416198877, "grad_norm": 0.5888497319322781, "learning_rate": 7.729359474541168e-06, "loss": 0.2535, "loss_nan_ranks": 0, "loss_rank_avg": 0.09802419692277908, "step": 3230, "valid_targets_mean": 3390.8, "valid_targets_min": 1416 }, { "epoch": 5.184442662389736, "grad_norm": 0.5942736764463901, "learning_rate": 7.666348450361737e-06, "loss": 0.2816, "loss_nan_ranks": 0, "loss_rank_avg": 0.09806996583938599, "step": 3235, "valid_targets_mean": 4160.8, "valid_targets_min": 1040 }, { "epoch": 5.192461908580594, "grad_norm": 0.6959182547618397, "learning_rate": 7.60353436202381e-06, "loss": 0.2768, "loss_nan_ranks": 0, "loss_rank_avg": 0.13760900497436523, "step": 3240, "valid_targets_mean": 3679.8, "valid_targets_min": 925 }, { "epoch": 5.200481154771452, "grad_norm": 0.7867712939025543, "learning_rate": 7.540918212502479e-06, "loss": 0.2641, "loss_nan_ranks": 0, "loss_rank_avg": 0.1103554517030716, "step": 3245, "valid_targets_mean": 2345.2, "valid_targets_min": 1059 }, { "epoch": 5.2085004009623095, "grad_norm": 0.6692820136265186, "learning_rate": 7.478501001612281e-06, "loss": 0.2815, "loss_nan_ranks": 0, "loss_rank_avg": 0.14655274152755737, "step": 3250, "valid_targets_mean": 4338.4, "valid_targets_min": 2237 }, { "epoch": 5.216519647153167, "grad_norm": 0.7032072972079363, "learning_rate": 7.416283725991229e-06, "loss": 0.2711, "loss_nan_ranks": 0, "loss_rank_avg": 0.12942096590995789, "step": 3255, "valid_targets_mean": 3271.1, "valid_targets_min": 1351 }, { "epoch": 5.224538893344025, "grad_norm": 0.7202212720662927, "learning_rate": 7.354267379084896e-06, "loss": 0.2906, "loss_nan_ranks": 0, "loss_rank_avg": 0.10814294219017029, "step": 3260, "valid_targets_mean": 2909.4, "valid_targets_min": 1419 }, { "epoch": 5.232558139534884, "grad_norm": 0.6622834667881968, "learning_rate": 7.292452951130548e-06, "loss": 0.2597, "loss_nan_ranks": 0, "loss_rank_avg": 0.12850156426429749, "step": 3265, "valid_targets_mean": 3660.1, "valid_targets_min": 1224 }, { "epoch": 5.240577385725742, "grad_norm": 0.6598360930022297, "learning_rate": 7.230841429141347e-06, "loss": 0.3022, "loss_nan_ranks": 0, "loss_rank_avg": 0.15915730595588684, "step": 3270, "valid_targets_mean": 4591.1, "valid_targets_min": 1677 }, { "epoch": 5.2485966319166, "grad_norm": 0.5650035570886325, "learning_rate": 7.169433796890595e-06, "loss": 0.302, "loss_nan_ranks": 0, "loss_rank_avg": 0.1909146010875702, "step": 3275, "valid_targets_mean": 5763.5, "valid_targets_min": 1282 }, { "epoch": 5.256615878107458, "grad_norm": 0.7786393273005862, "learning_rate": 7.108231034895976e-06, "loss": 0.2708, "loss_nan_ranks": 0, "loss_rank_avg": 0.12871766090393066, "step": 3280, "valid_targets_mean": 3066.1, "valid_targets_min": 1747 }, { "epoch": 5.264635124298316, "grad_norm": 0.5847129918611397, "learning_rate": 7.047234120403972e-06, "loss": 0.2785, "loss_nan_ranks": 0, "loss_rank_avg": 0.15970800817012787, "step": 3285, "valid_targets_mean": 4016.0, "valid_targets_min": 1848 }, { "epoch": 5.272654370489174, "grad_norm": 0.7449037107821327, "learning_rate": 6.986444027374211e-06, "loss": 0.2552, "loss_nan_ranks": 0, "loss_rank_avg": 0.12065094709396362, "step": 3290, "valid_targets_mean": 2694.6, "valid_targets_min": 825 }, { "epoch": 5.280673616680032, "grad_norm": 0.7299928241856165, "learning_rate": 6.925861726463919e-06, "loss": 0.2983, "loss_nan_ranks": 0, "loss_rank_avg": 0.10395687818527222, "step": 3295, "valid_targets_mean": 2786.4, "valid_targets_min": 1582 }, { "epoch": 5.2886928628708905, "grad_norm": 0.5820419035629211, "learning_rate": 6.865488185012464e-06, "loss": 0.2807, "loss_nan_ranks": 0, "loss_rank_avg": 0.16662782430648804, "step": 3300, "valid_targets_mean": 5864.4, "valid_targets_min": 1432 }, { "epoch": 5.296712109061748, "grad_norm": 0.5820333959976953, "learning_rate": 6.805324367025825e-06, "loss": 0.269, "loss_nan_ranks": 0, "loss_rank_avg": 0.09692417085170746, "step": 3305, "valid_targets_mean": 4125.8, "valid_targets_min": 1384 }, { "epoch": 5.304731355252606, "grad_norm": 0.5958545841346957, "learning_rate": 6.745371233161309e-06, "loss": 0.2913, "loss_nan_ranks": 0, "loss_rank_avg": 0.19019240140914917, "step": 3310, "valid_targets_mean": 6345.2, "valid_targets_min": 1722 }, { "epoch": 5.312750601443464, "grad_norm": 0.7556127215227147, "learning_rate": 6.685629740712103e-06, "loss": 0.2856, "loss_nan_ranks": 0, "loss_rank_avg": 0.09946641325950623, "step": 3315, "valid_targets_mean": 2636.1, "valid_targets_min": 1172 }, { "epoch": 5.320769847634322, "grad_norm": 0.5877343531269578, "learning_rate": 6.6261008435920605e-06, "loss": 0.2684, "loss_nan_ranks": 0, "loss_rank_avg": 0.19391608238220215, "step": 3320, "valid_targets_mean": 6642.2, "valid_targets_min": 3260 }, { "epoch": 5.32878909382518, "grad_norm": 0.8406015809943042, "learning_rate": 6.566785492320471e-06, "loss": 0.3239, "loss_nan_ranks": 0, "loss_rank_avg": 0.1828058362007141, "step": 3325, "valid_targets_mean": 3091.1, "valid_targets_min": 932 }, { "epoch": 5.336808340016039, "grad_norm": 0.6630809875941652, "learning_rate": 6.507684634006815e-06, "loss": 0.2717, "loss_nan_ranks": 0, "loss_rank_avg": 0.11142952740192413, "step": 3330, "valid_targets_mean": 3407.4, "valid_targets_min": 1374 }, { "epoch": 5.344827586206897, "grad_norm": 0.6972165813383657, "learning_rate": 6.448799212335734e-06, "loss": 0.272, "loss_nan_ranks": 0, "loss_rank_avg": 0.1595240831375122, "step": 3335, "valid_targets_mean": 4169.5, "valid_targets_min": 1688 }, { "epoch": 5.352846832397755, "grad_norm": 0.6323461664571374, "learning_rate": 6.390130167551869e-06, "loss": 0.285, "loss_nan_ranks": 0, "loss_rank_avg": 0.10348061472177505, "step": 3340, "valid_targets_mean": 3504.0, "valid_targets_min": 1129 }, { "epoch": 5.360866078588613, "grad_norm": 0.5607270131280743, "learning_rate": 6.331678436444939e-06, "loss": 0.2737, "loss_nan_ranks": 0, "loss_rank_avg": 0.1412566602230072, "step": 3345, "valid_targets_mean": 5841.9, "valid_targets_min": 1321 }, { "epoch": 5.368885324779471, "grad_norm": 0.8274449782443676, "learning_rate": 6.273444952334713e-06, "loss": 0.2701, "loss_nan_ranks": 0, "loss_rank_avg": 0.1447286307811737, "step": 3350, "valid_targets_mean": 4034.0, "valid_targets_min": 1182 }, { "epoch": 5.3769045709703285, "grad_norm": 0.6736548127167691, "learning_rate": 6.2154306450561175e-06, "loss": 0.2897, "loss_nan_ranks": 0, "loss_rank_avg": 0.24714772403240204, "step": 3355, "valid_targets_mean": 6792.6, "valid_targets_min": 1244 }, { "epoch": 5.384923817161187, "grad_norm": 0.76791519754358, "learning_rate": 6.157636440944445e-06, "loss": 0.284, "loss_nan_ranks": 0, "loss_rank_avg": 0.18893024325370789, "step": 3360, "valid_targets_mean": 3262.1, "valid_targets_min": 1045 }, { "epoch": 5.392943063352045, "grad_norm": 0.6506598342927086, "learning_rate": 6.100063262820474e-06, "loss": 0.2707, "loss_nan_ranks": 0, "loss_rank_avg": 0.17875610291957855, "step": 3365, "valid_targets_mean": 5643.9, "valid_targets_min": 1452 }, { "epoch": 5.400962309542903, "grad_norm": 0.535214932942372, "learning_rate": 6.0427120299758236e-06, "loss": 0.2759, "loss_nan_ranks": 0, "loss_rank_avg": 0.12076449394226074, "step": 3370, "valid_targets_mean": 6959.5, "valid_targets_min": 1356 }, { "epoch": 5.408981555733761, "grad_norm": 0.6584811079234478, "learning_rate": 5.985583658158212e-06, "loss": 0.2862, "loss_nan_ranks": 0, "loss_rank_avg": 0.12384140491485596, "step": 3375, "valid_targets_mean": 3983.8, "valid_targets_min": 2305 }, { "epoch": 5.417000801924619, "grad_norm": 0.677555957298812, "learning_rate": 5.928679059556852e-06, "loss": 0.28, "loss_nan_ranks": 0, "loss_rank_avg": 0.12068624049425125, "step": 3380, "valid_targets_mean": 3473.6, "valid_targets_min": 1195 }, { "epoch": 5.425020048115477, "grad_norm": 1.0135790155597735, "learning_rate": 5.871999142787908e-06, "loss": 0.2806, "loss_nan_ranks": 0, "loss_rank_avg": 0.13749045133590698, "step": 3385, "valid_targets_mean": 2260.4, "valid_targets_min": 937 }, { "epoch": 5.433039294306335, "grad_norm": 0.8039034351308703, "learning_rate": 5.815544812879936e-06, "loss": 0.2596, "loss_nan_ranks": 0, "loss_rank_avg": 0.13829991221427917, "step": 3390, "valid_targets_mean": 2838.2, "valid_targets_min": 1416 }, { "epoch": 5.441058540497194, "grad_norm": 0.641324943268092, "learning_rate": 5.759316971259503e-06, "loss": 0.2592, "loss_nan_ranks": 0, "loss_rank_avg": 0.09990415722131729, "step": 3395, "valid_targets_mean": 3651.2, "valid_targets_min": 1471 }, { "epoch": 5.4490777866880515, "grad_norm": 0.7607138645745484, "learning_rate": 5.703316515736734e-06, "loss": 0.2783, "loss_nan_ranks": 0, "loss_rank_avg": 0.13912031054496765, "step": 3400, "valid_targets_mean": 2623.8, "valid_targets_min": 1205 }, { "epoch": 5.4570970328789095, "grad_norm": 0.6774223564603659, "learning_rate": 5.647544340491007e-06, "loss": 0.2943, "loss_nan_ranks": 0, "loss_rank_avg": 0.12906160950660706, "step": 3405, "valid_targets_mean": 3493.5, "valid_targets_min": 1513 }, { "epoch": 5.465116279069767, "grad_norm": 3.1286340870646976, "learning_rate": 5.592001336056659e-06, "loss": 0.2898, "loss_nan_ranks": 0, "loss_rank_avg": 0.11892290413379669, "step": 3410, "valid_targets_mean": 2599.0, "valid_targets_min": 1301 }, { "epoch": 5.473135525260625, "grad_norm": 0.8035364009185652, "learning_rate": 5.536688389308782e-06, "loss": 0.2939, "loss_nan_ranks": 0, "loss_rank_avg": 0.1144896149635315, "step": 3415, "valid_targets_mean": 2427.1, "valid_targets_min": 1085 }, { "epoch": 5.481154771451483, "grad_norm": 0.7442012893993346, "learning_rate": 5.4816063834490496e-06, "loss": 0.2773, "loss_nan_ranks": 0, "loss_rank_avg": 0.12948277592658997, "step": 3420, "valid_targets_mean": 2744.4, "valid_targets_min": 1542 }, { "epoch": 5.489174017642342, "grad_norm": 0.7023135477533802, "learning_rate": 5.426756197991625e-06, "loss": 0.2792, "loss_nan_ranks": 0, "loss_rank_avg": 0.145607128739357, "step": 3425, "valid_targets_mean": 4299.5, "valid_targets_min": 1776 }, { "epoch": 5.4971932638332, "grad_norm": 0.6787099010377489, "learning_rate": 5.372138708749104e-06, "loss": 0.284, "loss_nan_ranks": 0, "loss_rank_avg": 0.14306356012821198, "step": 3430, "valid_targets_mean": 4279.4, "valid_targets_min": 1414 }, { "epoch": 5.505212510024058, "grad_norm": 0.7198686312973578, "learning_rate": 5.3177547878185436e-06, "loss": 0.2766, "loss_nan_ranks": 0, "loss_rank_avg": 0.11792582273483276, "step": 3435, "valid_targets_mean": 2626.5, "valid_targets_min": 1683 }, { "epoch": 5.513231756214916, "grad_norm": 0.6788117637567427, "learning_rate": 5.263605303567532e-06, "loss": 0.285, "loss_nan_ranks": 0, "loss_rank_avg": 0.11016759276390076, "step": 3440, "valid_targets_mean": 3527.2, "valid_targets_min": 1300 }, { "epoch": 5.521251002405774, "grad_norm": 0.5905284944796608, "learning_rate": 5.20969112062032e-06, "loss": 0.268, "loss_nan_ranks": 0, "loss_rank_avg": 0.11519446969032288, "step": 3445, "valid_targets_mean": 4631.0, "valid_targets_min": 1645 }, { "epoch": 5.529270248596632, "grad_norm": 0.6080932302389219, "learning_rate": 5.156013099844017e-06, "loss": 0.2588, "loss_nan_ranks": 0, "loss_rank_avg": 0.11113663017749786, "step": 3450, "valid_targets_mean": 3602.1, "valid_targets_min": 772 }, { "epoch": 5.53728949478749, "grad_norm": 0.7288808414312432, "learning_rate": 5.1025720983348544e-06, "loss": 0.2797, "loss_nan_ranks": 0, "loss_rank_avg": 0.15324431657791138, "step": 3455, "valid_targets_mean": 3440.1, "valid_targets_min": 1892 }, { "epoch": 5.545308740978348, "grad_norm": 0.7316756200535461, "learning_rate": 5.049368969404484e-06, "loss": 0.2984, "loss_nan_ranks": 0, "loss_rank_avg": 0.18235455453395844, "step": 3460, "valid_targets_mean": 3642.9, "valid_targets_min": 1808 }, { "epoch": 5.553327987169206, "grad_norm": 0.6966803567024507, "learning_rate": 4.99640456256636e-06, "loss": 0.2759, "loss_nan_ranks": 0, "loss_rank_avg": 0.08969349414110184, "step": 3465, "valid_targets_mean": 3088.2, "valid_targets_min": 1576 }, { "epoch": 5.561347233360064, "grad_norm": 0.7596935347056445, "learning_rate": 4.9436797235221814e-06, "loss": 0.2901, "loss_nan_ranks": 0, "loss_rank_avg": 0.15548765659332275, "step": 3470, "valid_targets_mean": 4137.1, "valid_targets_min": 1414 }, { "epoch": 5.569366479550922, "grad_norm": 0.6598274436780546, "learning_rate": 4.891195294148376e-06, "loss": 0.2923, "loss_nan_ranks": 0, "loss_rank_avg": 0.1944895088672638, "step": 3475, "valid_targets_mean": 4596.1, "valid_targets_min": 1689 }, { "epoch": 5.57738572574178, "grad_norm": 0.7378986972846266, "learning_rate": 4.838952112482671e-06, "loss": 0.2852, "loss_nan_ranks": 0, "loss_rank_avg": 0.16218118369579315, "step": 3480, "valid_targets_mean": 3069.6, "valid_targets_min": 1139 }, { "epoch": 5.585404971932638, "grad_norm": 0.5945094620185116, "learning_rate": 4.786951012710699e-06, "loss": 0.2915, "loss_nan_ranks": 0, "loss_rank_avg": 0.11682992428541183, "step": 3485, "valid_targets_mean": 4199.4, "valid_targets_min": 1645 }, { "epoch": 5.593424218123497, "grad_norm": 0.6940384063458671, "learning_rate": 4.735192825152686e-06, "loss": 0.2734, "loss_nan_ranks": 0, "loss_rank_avg": 0.15601713955402374, "step": 3490, "valid_targets_mean": 3884.2, "valid_targets_min": 1300 }, { "epoch": 5.601443464314355, "grad_norm": 0.6599876260544516, "learning_rate": 4.683678376250189e-06, "loss": 0.3067, "loss_nan_ranks": 0, "loss_rank_avg": 0.18536148965358734, "step": 3495, "valid_targets_mean": 4424.0, "valid_targets_min": 1243 }, { "epoch": 5.609462710505213, "grad_norm": 0.7201106735919834, "learning_rate": 4.6324084885529086e-06, "loss": 0.281, "loss_nan_ranks": 0, "loss_rank_avg": 0.21292556822299957, "step": 3500, "valid_targets_mean": 4139.2, "valid_targets_min": 1123 }, { "epoch": 5.6174819566960705, "grad_norm": 0.5875396290488495, "learning_rate": 4.581383980705538e-06, "loss": 0.277, "loss_nan_ranks": 0, "loss_rank_avg": 0.15536782145500183, "step": 3505, "valid_targets_mean": 6571.2, "valid_targets_min": 2178 }, { "epoch": 5.6255012028869285, "grad_norm": 0.6143731813541532, "learning_rate": 4.530605667434727e-06, "loss": 0.2652, "loss_nan_ranks": 0, "loss_rank_avg": 0.11163066327571869, "step": 3510, "valid_targets_mean": 3917.9, "valid_targets_min": 1530 }, { "epoch": 5.633520449077786, "grad_norm": 0.9096910759644121, "learning_rate": 4.480074359536013e-06, "loss": 0.2939, "loss_nan_ranks": 0, "loss_rank_avg": 0.14102259278297424, "step": 3515, "valid_targets_mean": 2312.6, "valid_targets_min": 1279 }, { "epoch": 5.641539695268644, "grad_norm": 0.7248396656648093, "learning_rate": 4.429790863860934e-06, "loss": 0.2612, "loss_nan_ranks": 0, "loss_rank_avg": 0.17408156394958496, "step": 3520, "valid_targets_mean": 3632.6, "valid_targets_min": 1274 }, { "epoch": 5.649558941459503, "grad_norm": 0.7149084191703611, "learning_rate": 4.3797559833041146e-06, "loss": 0.2883, "loss_nan_ranks": 0, "loss_rank_avg": 0.14481118321418762, "step": 3525, "valid_targets_mean": 4124.4, "valid_targets_min": 1556 }, { "epoch": 5.657578187650361, "grad_norm": 0.6821009433950561, "learning_rate": 4.329970516790447e-06, "loss": 0.2565, "loss_nan_ranks": 0, "loss_rank_avg": 0.12271390855312347, "step": 3530, "valid_targets_mean": 3484.8, "valid_targets_min": 1535 }, { "epoch": 5.665597433841219, "grad_norm": 0.8982050367879706, "learning_rate": 4.280435259262363e-06, "loss": 0.2733, "loss_nan_ranks": 0, "loss_rank_avg": 0.10625463724136353, "step": 3535, "valid_targets_mean": 1793.9, "valid_targets_min": 942 }, { "epoch": 5.673616680032077, "grad_norm": 0.8223177683921912, "learning_rate": 4.231151001667077e-06, "loss": 0.2665, "loss_nan_ranks": 0, "loss_rank_avg": 0.15554620325565338, "step": 3540, "valid_targets_mean": 6827.8, "valid_targets_min": 2382 }, { "epoch": 5.681635926222935, "grad_norm": 0.643420527087105, "learning_rate": 4.182118530944044e-06, "loss": 0.2641, "loss_nan_ranks": 0, "loss_rank_avg": 0.14312048256397247, "step": 3545, "valid_targets_mean": 4710.2, "valid_targets_min": 1910 }, { "epoch": 5.689655172413794, "grad_norm": 0.6471702234310968, "learning_rate": 4.133338630012307e-06, "loss": 0.2783, "loss_nan_ranks": 0, "loss_rank_avg": 0.15536224842071533, "step": 3550, "valid_targets_mean": 5084.6, "valid_targets_min": 1081 }, { "epoch": 5.6976744186046515, "grad_norm": 0.5528436647261742, "learning_rate": 4.0848120777580554e-06, "loss": 0.2578, "loss_nan_ranks": 0, "loss_rank_avg": 0.12030863016843796, "step": 3555, "valid_targets_mean": 5179.9, "valid_targets_min": 1397 }, { "epoch": 5.705693664795509, "grad_norm": 0.5396611921495026, "learning_rate": 4.036539649022182e-06, "loss": 0.295, "loss_nan_ranks": 0, "loss_rank_avg": 0.2417977899312973, "step": 3560, "valid_targets_mean": 7620.6, "valid_targets_min": 1939 }, { "epoch": 5.713712910986367, "grad_norm": 0.650216464185914, "learning_rate": 3.988522114587865e-06, "loss": 0.2947, "loss_nan_ranks": 0, "loss_rank_avg": 0.09948883205652237, "step": 3565, "valid_targets_mean": 3263.5, "valid_targets_min": 961 }, { "epoch": 5.721732157177225, "grad_norm": 0.5381622998244979, "learning_rate": 3.940760241168331e-06, "loss": 0.2838, "loss_nan_ranks": 0, "loss_rank_avg": 0.20080620050430298, "step": 3570, "valid_targets_mean": 8185.6, "valid_targets_min": 1067 }, { "epoch": 5.729751403368083, "grad_norm": 0.7212188608624658, "learning_rate": 3.893254791394541e-06, "loss": 0.2944, "loss_nan_ranks": 0, "loss_rank_avg": 0.20672596991062164, "step": 3575, "valid_targets_mean": 4884.8, "valid_targets_min": 1743 }, { "epoch": 5.737770649558941, "grad_norm": 0.669092022617526, "learning_rate": 3.846006523803074e-06, "loss": 0.2756, "loss_nan_ranks": 0, "loss_rank_avg": 0.1462830901145935, "step": 3580, "valid_targets_mean": 3797.6, "valid_targets_min": 1137 }, { "epoch": 5.7457898957498, "grad_norm": 0.8029880791009278, "learning_rate": 3.799016192823981e-06, "loss": 0.3068, "loss_nan_ranks": 0, "loss_rank_avg": 0.1821311116218567, "step": 3585, "valid_targets_mean": 4097.9, "valid_targets_min": 1582 }, { "epoch": 5.753809141940658, "grad_norm": 0.5732364301633718, "learning_rate": 3.7522845487687276e-06, "loss": 0.2737, "loss_nan_ranks": 0, "loss_rank_avg": 0.13184769451618195, "step": 3590, "valid_targets_mean": 5341.0, "valid_targets_min": 1348 }, { "epoch": 5.761828388131516, "grad_norm": 0.7644038643363767, "learning_rate": 3.7058123378182664e-06, "loss": 0.2866, "loss_nan_ranks": 0, "loss_rank_avg": 0.17732053995132446, "step": 3595, "valid_targets_mean": 3186.9, "valid_targets_min": 1418 }, { "epoch": 5.769847634322374, "grad_norm": 0.5889080563512636, "learning_rate": 3.6596003020110636e-06, "loss": 0.2986, "loss_nan_ranks": 0, "loss_rank_avg": 0.1895439326763153, "step": 3600, "valid_targets_mean": 4825.1, "valid_targets_min": 1217 }, { "epoch": 5.777866880513232, "grad_norm": 0.7001673848354629, "learning_rate": 3.613649179231287e-06, "loss": 0.288, "loss_nan_ranks": 0, "loss_rank_avg": 0.10094672441482544, "step": 3605, "valid_targets_mean": 2560.6, "valid_targets_min": 1881 }, { "epoch": 5.7858861267040895, "grad_norm": 0.7113191211178155, "learning_rate": 3.5679597031970017e-06, "loss": 0.2918, "loss_nan_ranks": 0, "loss_rank_avg": 0.1153012216091156, "step": 3610, "valid_targets_mean": 3266.9, "valid_targets_min": 1394 }, { "epoch": 5.7939053728949474, "grad_norm": 0.6038915015284441, "learning_rate": 3.5225326034484764e-06, "loss": 0.2823, "loss_nan_ranks": 0, "loss_rank_avg": 0.20703008770942688, "step": 3615, "valid_targets_mean": 5885.2, "valid_targets_min": 1229 }, { "epoch": 5.801924619085806, "grad_norm": 0.7051731320703262, "learning_rate": 3.4773686053365197e-06, "loss": 0.2768, "loss_nan_ranks": 0, "loss_rank_avg": 0.10645755380392075, "step": 3620, "valid_targets_mean": 3316.8, "valid_targets_min": 1509 }, { "epoch": 5.809943865276664, "grad_norm": 0.5541262922082779, "learning_rate": 3.4324684300109003e-06, "loss": 0.2967, "loss_nan_ranks": 0, "loss_rank_avg": 0.1505921185016632, "step": 3625, "valid_targets_mean": 5566.5, "valid_targets_min": 1045 }, { "epoch": 5.817963111467522, "grad_norm": 0.6614777960578949, "learning_rate": 3.387832794408832e-06, "loss": 0.2696, "loss_nan_ranks": 0, "loss_rank_avg": 0.10717364400625229, "step": 3630, "valid_targets_mean": 2447.9, "valid_targets_min": 910 }, { "epoch": 5.82598235765838, "grad_norm": 0.6530849619363815, "learning_rate": 3.3434624112435342e-06, "loss": 0.2841, "loss_nan_ranks": 0, "loss_rank_avg": 0.11250616610050201, "step": 3635, "valid_targets_mean": 3679.1, "valid_targets_min": 1252 }, { "epoch": 5.834001603849238, "grad_norm": 0.8457840930871934, "learning_rate": 3.2993579889928397e-06, "loss": 0.2911, "loss_nan_ranks": 0, "loss_rank_avg": 0.12079623341560364, "step": 3640, "valid_targets_mean": 2276.9, "valid_targets_min": 781 }, { "epoch": 5.842020850040096, "grad_norm": 0.5424570068999839, "learning_rate": 3.25552023188789e-06, "loss": 0.2633, "loss_nan_ranks": 0, "loss_rank_avg": 0.11634393036365509, "step": 3645, "valid_targets_mean": 5780.5, "valid_targets_min": 1631 }, { "epoch": 5.850040096230955, "grad_norm": 0.6609099224803072, "learning_rate": 3.211949839901889e-06, "loss": 0.2602, "loss_nan_ranks": 0, "loss_rank_avg": 0.07904715836048126, "step": 3650, "valid_targets_mean": 1853.6, "valid_targets_min": 583 }, { "epoch": 5.858059342421813, "grad_norm": 0.7054665857775407, "learning_rate": 3.168647508738927e-06, "loss": 0.2619, "loss_nan_ranks": 0, "loss_rank_avg": 0.11137621849775314, "step": 3655, "valid_targets_mean": 3421.8, "valid_targets_min": 1086 }, { "epoch": 5.8660785886126705, "grad_norm": 0.5673837151999918, "learning_rate": 3.125613929822866e-06, "loss": 0.2826, "loss_nan_ranks": 0, "loss_rank_avg": 0.16755767166614532, "step": 3660, "valid_targets_mean": 4874.6, "valid_targets_min": 1170 }, { "epoch": 5.874097834803528, "grad_norm": 0.6430654552670423, "learning_rate": 3.0828497902863106e-06, "loss": 0.2624, "loss_nan_ranks": 0, "loss_rank_avg": 0.14625166356563568, "step": 3665, "valid_targets_mean": 4878.0, "valid_targets_min": 1679 }, { "epoch": 5.882117080994386, "grad_norm": 0.7773523165873664, "learning_rate": 3.0403557729596267e-06, "loss": 0.2778, "loss_nan_ranks": 0, "loss_rank_avg": 0.15384423732757568, "step": 3670, "valid_targets_mean": 3396.4, "valid_targets_min": 1055 }, { "epoch": 5.890136327185244, "grad_norm": 0.5560053959749172, "learning_rate": 2.998132556360038e-06, "loss": 0.2882, "loss_nan_ranks": 0, "loss_rank_avg": 0.09452245384454727, "step": 3675, "valid_targets_mean": 3702.9, "valid_targets_min": 2185 }, { "epoch": 5.898155573376103, "grad_norm": 0.7832758816536532, "learning_rate": 2.9561808146808068e-06, "loss": 0.2863, "loss_nan_ranks": 0, "loss_rank_avg": 0.15402548015117645, "step": 3680, "valid_targets_mean": 3342.1, "valid_targets_min": 1422 }, { "epoch": 5.906174819566961, "grad_norm": 0.5874927264256125, "learning_rate": 2.9145012177804476e-06, "loss": 0.271, "loss_nan_ranks": 0, "loss_rank_avg": 0.1170136108994484, "step": 3685, "valid_targets_mean": 4333.6, "valid_targets_min": 1515 }, { "epoch": 5.914194065757819, "grad_norm": 0.7250685172338484, "learning_rate": 2.8730944311720454e-06, "loss": 0.2903, "loss_nan_ranks": 0, "loss_rank_avg": 0.16327306628227234, "step": 3690, "valid_targets_mean": 4079.8, "valid_targets_min": 1035 }, { "epoch": 5.922213311948677, "grad_norm": 0.6049201069316128, "learning_rate": 2.8319611160126226e-06, "loss": 0.2953, "loss_nan_ranks": 0, "loss_rank_avg": 0.10896667838096619, "step": 3695, "valid_targets_mean": 4256.0, "valid_targets_min": 1479 }, { "epoch": 5.930232558139535, "grad_norm": 0.8074696599106505, "learning_rate": 2.791101929092592e-06, "loss": 0.2734, "loss_nan_ranks": 0, "loss_rank_avg": 0.18283414840698242, "step": 3700, "valid_targets_mean": 3042.2, "valid_targets_min": 1025 }, { "epoch": 5.938251804330393, "grad_norm": 0.6418415192706601, "learning_rate": 2.750517522825251e-06, "loss": 0.2893, "loss_nan_ranks": 0, "loss_rank_avg": 0.14782294631004333, "step": 3705, "valid_targets_mean": 4387.5, "valid_targets_min": 2406 }, { "epoch": 5.946271050521251, "grad_norm": 0.7128403749449099, "learning_rate": 2.710208545236397e-06, "loss": 0.3046, "loss_nan_ranks": 0, "loss_rank_avg": 0.13058456778526306, "step": 3710, "valid_targets_mean": 3053.6, "valid_targets_min": 1380 }, { "epoch": 5.954290296712109, "grad_norm": 0.5020374709645875, "learning_rate": 2.670175639953929e-06, "loss": 0.277, "loss_nan_ranks": 0, "loss_rank_avg": 0.09986815601587296, "step": 3715, "valid_targets_mean": 3981.4, "valid_targets_min": 981 }, { "epoch": 5.962309542902967, "grad_norm": 0.7439070604641389, "learning_rate": 2.6304194461976207e-06, "loss": 0.2869, "loss_nan_ranks": 0, "loss_rank_avg": 0.13553877174854279, "step": 3720, "valid_targets_mean": 2815.2, "valid_targets_min": 1368 }, { "epoch": 5.970328789093825, "grad_norm": 0.8061327031659907, "learning_rate": 2.5909405987688896e-06, "loss": 0.2692, "loss_nan_ranks": 0, "loss_rank_avg": 0.16787466406822205, "step": 3725, "valid_targets_mean": 2979.1, "valid_targets_min": 1029 }, { "epoch": 5.978348035284683, "grad_norm": 0.7233469829920061, "learning_rate": 2.5517397280406565e-06, "loss": 0.2793, "loss_nan_ranks": 0, "loss_rank_avg": 0.1734805703163147, "step": 3730, "valid_targets_mean": 4583.1, "valid_targets_min": 1858 }, { "epoch": 5.986367281475541, "grad_norm": 0.7616891829738133, "learning_rate": 2.512817459947312e-06, "loss": 0.2949, "loss_nan_ranks": 0, "loss_rank_avg": 0.11115828156471252, "step": 3735, "valid_targets_mean": 2511.5, "valid_targets_min": 1029 }, { "epoch": 5.994386527666399, "grad_norm": 0.6285399195870048, "learning_rate": 2.4741744159746618e-06, "loss": 0.2728, "loss_nan_ranks": 0, "loss_rank_avg": 0.12156839668750763, "step": 3740, "valid_targets_mean": 3640.2, "valid_targets_min": 2044 }, { "epoch": 6.001603849238172, "grad_norm": 0.5991692363576295, "learning_rate": 2.435811213150079e-06, "loss": 0.295, "loss_nan_ranks": 0, "loss_rank_avg": 0.12158750742673874, "step": 3745, "valid_targets_mean": 4298.0, "valid_targets_min": 1453 }, { "epoch": 6.0096230954290295, "grad_norm": 0.5838065514388638, "learning_rate": 2.3977284640325805e-06, "loss": 0.2704, "loss_nan_ranks": 0, "loss_rank_avg": 0.1734558641910553, "step": 3750, "valid_targets_mean": 5849.6, "valid_targets_min": 1131 }, { "epoch": 6.017642341619887, "grad_norm": 0.7515761152464798, "learning_rate": 2.359926776703092e-06, "loss": 0.2838, "loss_nan_ranks": 0, "loss_rank_avg": 0.1791701316833496, "step": 3755, "valid_targets_mean": 4131.6, "valid_targets_min": 1807 }, { "epoch": 6.025661587810745, "grad_norm": 0.5615783508002681, "learning_rate": 2.3224067547547357e-06, "loss": 0.2749, "loss_nan_ranks": 0, "loss_rank_avg": 0.16611458361148834, "step": 3760, "valid_targets_mean": 5644.5, "valid_targets_min": 1826 }, { "epoch": 6.033680834001604, "grad_norm": 0.6349112012821538, "learning_rate": 2.2851689972831536e-06, "loss": 0.292, "loss_nan_ranks": 0, "loss_rank_avg": 0.09982097148895264, "step": 3765, "valid_targets_mean": 3284.1, "valid_targets_min": 1652 }, { "epoch": 6.041700080192462, "grad_norm": 0.4936466599303436, "learning_rate": 2.248214098877002e-06, "loss": 0.2743, "loss_nan_ranks": 0, "loss_rank_avg": 0.16967222094535828, "step": 3770, "valid_targets_mean": 7187.9, "valid_targets_min": 1142 }, { "epoch": 6.04971932638332, "grad_norm": 0.6975506989696647, "learning_rate": 2.2115426496083958e-06, "loss": 0.2859, "loss_nan_ranks": 0, "loss_rank_avg": 0.15700647234916687, "step": 3775, "valid_targets_mean": 3620.6, "valid_targets_min": 1094 }, { "epoch": 6.057738572574178, "grad_norm": 0.5213863781241199, "learning_rate": 2.175155235023536e-06, "loss": 0.2528, "loss_nan_ranks": 0, "loss_rank_avg": 0.13770925998687744, "step": 3780, "valid_targets_mean": 6736.9, "valid_targets_min": 2195 }, { "epoch": 6.065757818765036, "grad_norm": 0.7034256718400578, "learning_rate": 2.1390524361333355e-06, "loss": 0.2495, "loss_nan_ranks": 0, "loss_rank_avg": 0.13219033181667328, "step": 3785, "valid_targets_mean": 3660.4, "valid_targets_min": 1566 }, { "epoch": 6.073777064955894, "grad_norm": 0.6915785323589456, "learning_rate": 2.1032348294041305e-06, "loss": 0.2865, "loss_nan_ranks": 0, "loss_rank_avg": 0.1072409376502037, "step": 3790, "valid_targets_mean": 2984.6, "valid_targets_min": 1478 }, { "epoch": 6.081796311146753, "grad_norm": 0.6525266844739303, "learning_rate": 2.067702986748521e-06, "loss": 0.2807, "loss_nan_ranks": 0, "loss_rank_avg": 0.1530601680278778, "step": 3795, "valid_targets_mean": 4701.8, "valid_targets_min": 1128 }, { "epoch": 6.0898155573376105, "grad_norm": 0.6239357292972502, "learning_rate": 2.0324574755161764e-06, "loss": 0.2616, "loss_nan_ranks": 0, "loss_rank_avg": 0.11305804550647736, "step": 3800, "valid_targets_mean": 3578.0, "valid_targets_min": 1575 }, { "epoch": 6.097834803528468, "grad_norm": 0.6645665897198888, "learning_rate": 1.9974988584848385e-06, "loss": 0.2994, "loss_nan_ranks": 0, "loss_rank_avg": 0.14500468969345093, "step": 3805, "valid_targets_mean": 4432.5, "valid_targets_min": 1748 }, { "epoch": 6.105854049719326, "grad_norm": 0.8009084871999578, "learning_rate": 1.96282769385129e-06, "loss": 0.2909, "loss_nan_ranks": 0, "loss_rank_avg": 0.16477596759796143, "step": 3810, "valid_targets_mean": 5450.1, "valid_targets_min": 2265 }, { "epoch": 6.113873295910184, "grad_norm": 0.6177586996719383, "learning_rate": 1.9284445352224625e-06, "loss": 0.2799, "loss_nan_ranks": 0, "loss_rank_avg": 0.14988410472869873, "step": 3815, "valid_targets_mean": 3910.0, "valid_targets_min": 1244 }, { "epoch": 6.121892542101042, "grad_norm": 0.893366067941702, "learning_rate": 1.894349931606596e-06, "loss": 0.277, "loss_nan_ranks": 0, "loss_rank_avg": 0.17635749280452728, "step": 3820, "valid_targets_mean": 2809.9, "valid_targets_min": 999 }, { "epoch": 6.129911788291901, "grad_norm": 0.7176410005122456, "learning_rate": 1.8605444274044493e-06, "loss": 0.2808, "loss_nan_ranks": 0, "loss_rank_avg": 0.12091509997844696, "step": 3825, "valid_targets_mean": 3264.6, "valid_targets_min": 1410 }, { "epoch": 6.137931034482759, "grad_norm": 0.6593417551637085, "learning_rate": 1.827028562400659e-06, "loss": 0.2695, "loss_nan_ranks": 0, "loss_rank_avg": 0.11562930047512054, "step": 3830, "valid_targets_mean": 2925.2, "valid_targets_min": 1676 }, { "epoch": 6.145950280673617, "grad_norm": 0.7489493000181351, "learning_rate": 1.793802871755066e-06, "loss": 0.264, "loss_nan_ranks": 0, "loss_rank_avg": 0.12282755225896835, "step": 3835, "valid_targets_mean": 4057.5, "valid_targets_min": 1500 }, { "epoch": 6.153969526864475, "grad_norm": 0.6571208032513868, "learning_rate": 1.760867885994202e-06, "loss": 0.2474, "loss_nan_ranks": 0, "loss_rank_avg": 0.11998392641544342, "step": 3840, "valid_targets_mean": 4374.6, "valid_targets_min": 1591 }, { "epoch": 6.161988773055333, "grad_norm": 0.8039505872062598, "learning_rate": 1.7282241310028047e-06, "loss": 0.2725, "loss_nan_ranks": 0, "loss_rank_avg": 0.17138797044754028, "step": 3845, "valid_targets_mean": 3309.2, "valid_targets_min": 1124 }, { "epoch": 6.170008019246191, "grad_norm": 0.5963452400390175, "learning_rate": 1.6958721280154232e-06, "loss": 0.2776, "loss_nan_ranks": 0, "loss_rank_avg": 0.1287102848291397, "step": 3850, "valid_targets_mean": 4082.4, "valid_targets_min": 1429 }, { "epoch": 6.1780272654370485, "grad_norm": 0.5536501052142992, "learning_rate": 1.6638123936081085e-06, "loss": 0.2596, "loss_nan_ranks": 0, "loss_rank_avg": 0.11305131018161774, "step": 3855, "valid_targets_mean": 5233.0, "valid_targets_min": 1520 }, { "epoch": 6.186046511627907, "grad_norm": 1.1404604574734827, "learning_rate": 1.6320454396901463e-06, "loss": 0.2559, "loss_nan_ranks": 0, "loss_rank_avg": 0.1419065296649933, "step": 3860, "valid_targets_mean": 4052.0, "valid_targets_min": 1598 }, { "epoch": 6.194065757818765, "grad_norm": 0.7161367900264296, "learning_rate": 1.6005717734958914e-06, "loss": 0.2759, "loss_nan_ranks": 0, "loss_rank_avg": 0.1022464781999588, "step": 3865, "valid_targets_mean": 3001.2, "valid_targets_min": 1102 }, { "epoch": 6.202085004009623, "grad_norm": 0.7281191839480282, "learning_rate": 1.569391897576671e-06, "loss": 0.2612, "loss_nan_ranks": 0, "loss_rank_avg": 0.11236599832773209, "step": 3870, "valid_targets_mean": 2805.0, "valid_targets_min": 1458 }, { "epoch": 6.210104250200481, "grad_norm": 0.6886143528876548, "learning_rate": 1.5385063097927533e-06, "loss": 0.2709, "loss_nan_ranks": 0, "loss_rank_avg": 0.09367795288562775, "step": 3875, "valid_targets_mean": 2750.8, "valid_targets_min": 1252 }, { "epoch": 6.218123496391339, "grad_norm": 0.7374096316470432, "learning_rate": 1.5079155033054104e-06, "loss": 0.2743, "loss_nan_ranks": 0, "loss_rank_avg": 0.1338837891817093, "step": 3880, "valid_targets_mean": 3094.1, "valid_targets_min": 1037 }, { "epoch": 6.226142742582197, "grad_norm": 0.6462423085656397, "learning_rate": 1.4776199665690239e-06, "loss": 0.2816, "loss_nan_ranks": 0, "loss_rank_avg": 0.09631840884685516, "step": 3885, "valid_targets_mean": 3532.2, "valid_targets_min": 1504 }, { "epoch": 6.234161988773056, "grad_norm": 0.6543467487593563, "learning_rate": 1.4476201833233084e-06, "loss": 0.2833, "loss_nan_ranks": 0, "loss_rank_avg": 0.19178268313407898, "step": 3890, "valid_targets_mean": 5289.2, "valid_targets_min": 1841 }, { "epoch": 6.242181234963914, "grad_norm": 0.5293959822986096, "learning_rate": 1.4179166325855676e-06, "loss": 0.2614, "loss_nan_ranks": 0, "loss_rank_avg": 0.12478166818618774, "step": 3895, "valid_targets_mean": 5240.5, "valid_targets_min": 2239 }, { "epoch": 6.250200481154772, "grad_norm": 0.5543609876923493, "learning_rate": 1.3885097886430599e-06, "loss": 0.2689, "loss_nan_ranks": 0, "loss_rank_avg": 0.10484036803245544, "step": 3900, "valid_targets_mean": 5359.6, "valid_targets_min": 2709 }, { "epoch": 6.2582197273456295, "grad_norm": 0.7216036614629309, "learning_rate": 1.35940012104542e-06, "loss": 0.2723, "loss_nan_ranks": 0, "loss_rank_avg": 0.10729452222585678, "step": 3905, "valid_targets_mean": 3561.8, "valid_targets_min": 1506 }, { "epoch": 6.266238973536487, "grad_norm": 0.7478663074770113, "learning_rate": 1.3305880945971583e-06, "loss": 0.2624, "loss_nan_ranks": 0, "loss_rank_avg": 0.14511063694953918, "step": 3910, "valid_targets_mean": 2780.2, "valid_targets_min": 1023 }, { "epoch": 6.274258219727345, "grad_norm": 0.550060865375561, "learning_rate": 1.3020741693502403e-06, "loss": 0.2862, "loss_nan_ranks": 0, "loss_rank_avg": 0.15165145695209503, "step": 3915, "valid_targets_mean": 6547.9, "valid_targets_min": 2000 }, { "epoch": 6.282277465918204, "grad_norm": 0.6615177499929813, "learning_rate": 1.27385880059675e-06, "loss": 0.2845, "loss_nan_ranks": 0, "loss_rank_avg": 0.10962480306625366, "step": 3920, "valid_targets_mean": 4424.0, "valid_targets_min": 1093 }, { "epoch": 6.290296712109062, "grad_norm": 0.694246980988033, "learning_rate": 1.245942438861607e-06, "loss": 0.2753, "loss_nan_ranks": 0, "loss_rank_avg": 0.10474206507205963, "step": 3925, "valid_targets_mean": 3367.9, "valid_targets_min": 1102 }, { "epoch": 6.29831595829992, "grad_norm": 0.7157635807579565, "learning_rate": 1.2183255298953788e-06, "loss": 0.2778, "loss_nan_ranks": 0, "loss_rank_avg": 0.1532362550497055, "step": 3930, "valid_targets_mean": 4046.2, "valid_targets_min": 2199 }, { "epoch": 6.306335204490778, "grad_norm": 0.69158602977965, "learning_rate": 1.1910085146671645e-06, "loss": 0.2764, "loss_nan_ranks": 0, "loss_rank_avg": 0.11300238966941833, "step": 3935, "valid_targets_mean": 3600.0, "valid_targets_min": 1316 }, { "epoch": 6.314354450681636, "grad_norm": 0.827641902397557, "learning_rate": 1.1639918293575492e-06, "loss": 0.2611, "loss_nan_ranks": 0, "loss_rank_avg": 0.1277027130126953, "step": 3940, "valid_targets_mean": 2965.0, "valid_targets_min": 1300 }, { "epoch": 6.322373696872494, "grad_norm": 0.6439877820560833, "learning_rate": 1.1372759053516536e-06, "loss": 0.2735, "loss_nan_ranks": 0, "loss_rank_avg": 0.14757797122001648, "step": 3945, "valid_targets_mean": 5060.8, "valid_targets_min": 1476 }, { "epoch": 6.330392943063352, "grad_norm": 0.8237834476733428, "learning_rate": 1.1108611692322157e-06, "loss": 0.2751, "loss_nan_ranks": 0, "loss_rank_avg": 0.14925746619701385, "step": 3950, "valid_targets_mean": 3301.4, "valid_targets_min": 1894 }, { "epoch": 6.3384121892542105, "grad_norm": 0.6933010368323701, "learning_rate": 1.0847480427728142e-06, "loss": 0.2549, "loss_nan_ranks": 0, "loss_rank_avg": 0.18430668115615845, "step": 3955, "valid_targets_mean": 4292.0, "valid_targets_min": 1172 }, { "epoch": 6.346431435445068, "grad_norm": 0.6863177670467828, "learning_rate": 1.0589369429311125e-06, "loss": 0.2851, "loss_nan_ranks": 0, "loss_rank_avg": 0.13784122467041016, "step": 3960, "valid_targets_mean": 4396.8, "valid_targets_min": 1687 }, { "epoch": 6.354450681635926, "grad_norm": 0.6371680102976265, "learning_rate": 1.0334282818422037e-06, "loss": 0.2538, "loss_nan_ranks": 0, "loss_rank_avg": 0.15805824100971222, "step": 3965, "valid_targets_mean": 5949.5, "valid_targets_min": 1945 }, { "epoch": 6.362469927826784, "grad_norm": 0.6568792404928988, "learning_rate": 1.008222466812041e-06, "loss": 0.2778, "loss_nan_ranks": 0, "loss_rank_avg": 0.1167311817407608, "step": 3970, "valid_targets_mean": 3345.5, "valid_targets_min": 1287 }, { "epoch": 6.370489174017642, "grad_norm": 0.6559067333173757, "learning_rate": 9.83319900310915e-07, "loss": 0.2614, "loss_nan_ranks": 0, "loss_rank_avg": 0.10906291007995605, "step": 3975, "valid_targets_mean": 3599.5, "valid_targets_min": 1912 }, { "epoch": 6.3785084202085, "grad_norm": 0.7723309861979427, "learning_rate": 9.587209799670495e-07, "loss": 0.2729, "loss_nan_ranks": 0, "loss_rank_avg": 0.1628764122724533, "step": 3980, "valid_targets_mean": 3042.9, "valid_targets_min": 1527 }, { "epoch": 6.386527666399359, "grad_norm": 0.734200484710398, "learning_rate": 9.344260985602327e-07, "loss": 0.2839, "loss_nan_ranks": 0, "loss_rank_avg": 0.12474434822797775, "step": 3985, "valid_targets_mean": 3176.6, "valid_targets_min": 1617 }, { "epoch": 6.394546912590217, "grad_norm": 0.5800212945862554, "learning_rate": 9.104356440155526e-07, "loss": 0.2895, "loss_nan_ranks": 0, "loss_rank_avg": 0.1241566613316536, "step": 3990, "valid_targets_mean": 5577.8, "valid_targets_min": 1150 }, { "epoch": 6.402566158781075, "grad_norm": 0.5664850555279295, "learning_rate": 8.867499993972162e-07, "loss": 0.2822, "loss_nan_ranks": 0, "loss_rank_avg": 0.19933608174324036, "step": 3995, "valid_targets_mean": 8049.4, "valid_targets_min": 2446 }, { "epoch": 6.410585404971933, "grad_norm": 0.7356802978325007, "learning_rate": 8.633695429024058e-07, "loss": 0.2707, "loss_nan_ranks": 0, "loss_rank_avg": 0.18359798192977905, "step": 4000, "valid_targets_mean": 4368.5, "valid_targets_min": 1938 }, { "epoch": 6.4186046511627906, "grad_norm": 0.7546287387709505, "learning_rate": 8.402946478552732e-07, "loss": 0.2708, "loss_nan_ranks": 0, "loss_rank_avg": 0.17862293124198914, "step": 4005, "valid_targets_mean": 3321.8, "valid_targets_min": 736 }, { "epoch": 6.4266238973536485, "grad_norm": 0.7309273625638524, "learning_rate": 8.175256827009392e-07, "loss": 0.2664, "loss_nan_ranks": 0, "loss_rank_avg": 0.12505288422107697, "step": 4010, "valid_targets_mean": 4053.5, "valid_targets_min": 1398 }, { "epoch": 6.434643143544507, "grad_norm": 0.6264446725047349, "learning_rate": 7.95063010999646e-07, "loss": 0.2724, "loss_nan_ranks": 0, "loss_rank_avg": 0.1693299412727356, "step": 4015, "valid_targets_mean": 4615.9, "valid_targets_min": 1216 }, { "epoch": 6.442662389735365, "grad_norm": 0.7464025775211349, "learning_rate": 7.729069914209409e-07, "loss": 0.2605, "loss_nan_ranks": 0, "loss_rank_avg": 0.13851439952850342, "step": 4020, "valid_targets_mean": 3684.0, "valid_targets_min": 1045 }, { "epoch": 6.450681635926223, "grad_norm": 0.5524150098685408, "learning_rate": 7.510579777379345e-07, "loss": 0.2641, "loss_nan_ranks": 0, "loss_rank_avg": 0.21182794868946075, "step": 4025, "valid_targets_mean": 6848.2, "valid_targets_min": 1806 }, { "epoch": 6.458700882117081, "grad_norm": 0.6643165903460105, "learning_rate": 7.295163188216792e-07, "loss": 0.2793, "loss_nan_ranks": 0, "loss_rank_avg": 0.10513627529144287, "step": 4030, "valid_targets_mean": 3270.2, "valid_targets_min": 894 }, { "epoch": 6.466720128307939, "grad_norm": 0.7738257068533779, "learning_rate": 7.08282358635568e-07, "loss": 0.2721, "loss_nan_ranks": 0, "loss_rank_avg": 0.13248899579048157, "step": 4035, "valid_targets_mean": 2989.2, "valid_targets_min": 1229 }, { "epoch": 6.474739374498797, "grad_norm": 0.663638489935353, "learning_rate": 6.87356436229869e-07, "loss": 0.2816, "loss_nan_ranks": 0, "loss_rank_avg": 0.08959473669528961, "step": 4040, "valid_targets_mean": 3430.5, "valid_targets_min": 1771 }, { "epoch": 6.482758620689655, "grad_norm": 0.8146828017163209, "learning_rate": 6.667388857362977e-07, "loss": 0.2567, "loss_nan_ranks": 0, "loss_rank_avg": 0.14155611395835876, "step": 4045, "valid_targets_mean": 3218.6, "valid_targets_min": 1283 }, { "epoch": 6.490777866880514, "grad_norm": 0.6793827790016271, "learning_rate": 6.464300363626797e-07, "loss": 0.2813, "loss_nan_ranks": 0, "loss_rank_avg": 0.09733996540307999, "step": 4050, "valid_targets_mean": 2679.1, "valid_targets_min": 1106 }, { "epoch": 6.4987971130713715, "grad_norm": 0.6285180608759408, "learning_rate": 6.264302123877053e-07, "loss": 0.2731, "loss_nan_ranks": 0, "loss_rank_avg": 0.13995882868766785, "step": 4055, "valid_targets_mean": 5047.8, "valid_targets_min": 1303 }, { "epoch": 6.5068163592622295, "grad_norm": 0.6873892553192886, "learning_rate": 6.067397331557412e-07, "loss": 0.2712, "loss_nan_ranks": 0, "loss_rank_avg": 0.11077672243118286, "step": 4060, "valid_targets_mean": 3205.5, "valid_targets_min": 1584 }, { "epoch": 6.514835605453087, "grad_norm": 0.5517625384903336, "learning_rate": 5.873589130717405e-07, "loss": 0.2676, "loss_nan_ranks": 0, "loss_rank_avg": 0.08499126881361008, "step": 4065, "valid_targets_mean": 3437.4, "valid_targets_min": 1191 }, { "epoch": 6.522854851643945, "grad_norm": 0.6755583113168804, "learning_rate": 5.682880615962116e-07, "loss": 0.2672, "loss_nan_ranks": 0, "loss_rank_avg": 0.14547117054462433, "step": 4070, "valid_targets_mean": 4614.2, "valid_targets_min": 1265 }, { "epoch": 6.530874097834803, "grad_norm": 0.6395651118677016, "learning_rate": 5.495274832402841e-07, "loss": 0.2754, "loss_nan_ranks": 0, "loss_rank_avg": 0.12784671783447266, "step": 4075, "valid_targets_mean": 3884.9, "valid_targets_min": 1306 }, { "epoch": 6.538893344025661, "grad_norm": 0.5770813261830327, "learning_rate": 5.310774775608529e-07, "loss": 0.2569, "loss_nan_ranks": 0, "loss_rank_avg": 0.12950290739536285, "step": 4080, "valid_targets_mean": 4559.6, "valid_targets_min": 1370 }, { "epoch": 6.54691259021652, "grad_norm": 0.6331014040707633, "learning_rate": 5.129383391557751e-07, "loss": 0.2924, "loss_nan_ranks": 0, "loss_rank_avg": 0.165439635515213, "step": 4085, "valid_targets_mean": 4090.6, "valid_targets_min": 1282 }, { "epoch": 6.554931836407378, "grad_norm": 0.6511365230785408, "learning_rate": 4.951103576591876e-07, "loss": 0.2589, "loss_nan_ranks": 0, "loss_rank_avg": 0.13743093609809875, "step": 4090, "valid_targets_mean": 4554.4, "valid_targets_min": 1653 }, { "epoch": 6.562951082598236, "grad_norm": 0.7987173023729609, "learning_rate": 4.7759381773687e-07, "loss": 0.2784, "loss_nan_ranks": 0, "loss_rank_avg": 0.13793396949768066, "step": 4095, "valid_targets_mean": 2783.2, "valid_targets_min": 1066 }, { "epoch": 6.570970328789094, "grad_norm": 0.7544997486665157, "learning_rate": 4.6038899908170234e-07, "loss": 0.2565, "loss_nan_ranks": 0, "loss_rank_avg": 0.12955988943576813, "step": 4100, "valid_targets_mean": 3326.0, "valid_targets_min": 2170 }, { "epoch": 6.578989574979952, "grad_norm": 0.5854788552810375, "learning_rate": 4.4349617640920164e-07, "loss": 0.2609, "loss_nan_ranks": 0, "loss_rank_avg": 0.09501869231462479, "step": 4105, "valid_targets_mean": 2814.2, "valid_targets_min": 1177 }, { "epoch": 6.58700882117081, "grad_norm": 0.7772905310391393, "learning_rate": 4.2691561945312764e-07, "loss": 0.2844, "loss_nan_ranks": 0, "loss_rank_avg": 0.1361604928970337, "step": 4110, "valid_targets_mean": 3158.1, "valid_targets_min": 1647 }, { "epoch": 6.595028067361668, "grad_norm": 0.6055157996600555, "learning_rate": 4.106475929611886e-07, "loss": 0.2787, "loss_nan_ranks": 0, "loss_rank_avg": 0.10309708118438721, "step": 4115, "valid_targets_mean": 3729.2, "valid_targets_min": 1610 }, { "epoch": 6.603047313552526, "grad_norm": 0.7008833517826353, "learning_rate": 3.9469235669080007e-07, "loss": 0.2764, "loss_nan_ranks": 0, "loss_rank_avg": 0.12836217880249023, "step": 4120, "valid_targets_mean": 3563.2, "valid_targets_min": 1348 }, { "epoch": 6.611066559743384, "grad_norm": 0.5659713506979073, "learning_rate": 3.7905016540495053e-07, "loss": 0.2728, "loss_nan_ranks": 0, "loss_rank_avg": 0.10678073763847351, "step": 4125, "valid_targets_mean": 5325.9, "valid_targets_min": 1283 }, { "epoch": 6.619085805934242, "grad_norm": 0.8252214089753425, "learning_rate": 3.63721268868118e-07, "loss": 0.2834, "loss_nan_ranks": 0, "loss_rank_avg": 0.13685831427574158, "step": 4130, "valid_targets_mean": 2919.6, "valid_targets_min": 1197 }, { "epoch": 6.6271050521251, "grad_norm": 0.7225618863258757, "learning_rate": 3.487059118422997e-07, "loss": 0.264, "loss_nan_ranks": 0, "loss_rank_avg": 0.12511911988258362, "step": 4135, "valid_targets_mean": 3616.0, "valid_targets_min": 1859 }, { "epoch": 6.635124298315958, "grad_norm": 0.7213244827448435, "learning_rate": 3.3400433408308895e-07, "loss": 0.274, "loss_nan_ranks": 0, "loss_rank_avg": 0.11407344788312912, "step": 4140, "valid_targets_mean": 3371.5, "valid_targets_min": 1165 }, { "epoch": 6.643143544506817, "grad_norm": 0.5863803353807132, "learning_rate": 3.196167703358577e-07, "loss": 0.2979, "loss_nan_ranks": 0, "loss_rank_avg": 0.2087329626083374, "step": 4145, "valid_targets_mean": 6667.9, "valid_targets_min": 2033 }, { "epoch": 6.651162790697675, "grad_norm": 0.7306156531205246, "learning_rate": 3.0554345033199985e-07, "loss": 0.2733, "loss_nan_ranks": 0, "loss_rank_avg": 0.10838615149259567, "step": 4150, "valid_targets_mean": 2848.4, "valid_targets_min": 1241 }, { "epoch": 6.659182036888533, "grad_norm": 0.5978142445674056, "learning_rate": 2.917845987852652e-07, "loss": 0.2693, "loss_nan_ranks": 0, "loss_rank_avg": 0.12275230884552002, "step": 4155, "valid_targets_mean": 5131.2, "valid_targets_min": 1631 }, { "epoch": 6.6672012830793905, "grad_norm": 0.6989850067101168, "learning_rate": 2.783404353881758e-07, "loss": 0.2791, "loss_nan_ranks": 0, "loss_rank_avg": 0.12991738319396973, "step": 4160, "valid_targets_mean": 5254.8, "valid_targets_min": 1794 }, { "epoch": 6.6752205292702484, "grad_norm": 0.6831761000655288, "learning_rate": 2.652111748085151e-07, "loss": 0.2649, "loss_nan_ranks": 0, "loss_rank_avg": 0.12421713769435883, "step": 4165, "valid_targets_mean": 3544.2, "valid_targets_min": 1009 }, { "epoch": 6.683239775461106, "grad_norm": 0.6637736639097456, "learning_rate": 2.523970266859044e-07, "loss": 0.2801, "loss_nan_ranks": 0, "loss_rank_avg": 0.11612105369567871, "step": 4170, "valid_targets_mean": 4202.0, "valid_targets_min": 1397 }, { "epoch": 6.691259021651964, "grad_norm": 0.8052071141988904, "learning_rate": 2.398981956284363e-07, "loss": 0.2914, "loss_nan_ranks": 0, "loss_rank_avg": 0.1752295047044754, "step": 4175, "valid_targets_mean": 3697.4, "valid_targets_min": 1804 }, { "epoch": 6.699278267842823, "grad_norm": 0.771846614986006, "learning_rate": 2.2771488120944207e-07, "loss": 0.2862, "loss_nan_ranks": 0, "loss_rank_avg": 0.18034441769123077, "step": 4180, "valid_targets_mean": 3251.6, "valid_targets_min": 1364 }, { "epoch": 6.707297514033681, "grad_norm": 0.7689430459462362, "learning_rate": 2.1584727796427174e-07, "loss": 0.2655, "loss_nan_ranks": 0, "loss_rank_avg": 0.18182602524757385, "step": 4185, "valid_targets_mean": 3384.4, "valid_targets_min": 1269 }, { "epoch": 6.715316760224539, "grad_norm": 0.6345934861559102, "learning_rate": 2.0429557538720556e-07, "loss": 0.2651, "loss_nan_ranks": 0, "loss_rank_avg": 0.0992988795042038, "step": 4190, "valid_targets_mean": 3541.0, "valid_targets_min": 1862 }, { "epoch": 6.723336006415397, "grad_norm": 0.7310071527515055, "learning_rate": 1.930599579284298e-07, "loss": 0.2799, "loss_nan_ranks": 0, "loss_rank_avg": 0.11810122430324554, "step": 4195, "valid_targets_mean": 3602.1, "valid_targets_min": 1845 }, { "epoch": 6.731355252606255, "grad_norm": 0.5664508946270108, "learning_rate": 1.8214060499107679e-07, "loss": 0.2624, "loss_nan_ranks": 0, "loss_rank_avg": 0.1088356077671051, "step": 4200, "valid_targets_mean": 4533.4, "valid_targets_min": 1299 }, { "epoch": 6.739374498797113, "grad_norm": 0.6657206647984147, "learning_rate": 1.7153769092837614e-07, "loss": 0.2601, "loss_nan_ranks": 0, "loss_rank_avg": 0.10410232841968536, "step": 4205, "valid_targets_mean": 3370.6, "valid_targets_min": 1057 }, { "epoch": 6.7473937449879715, "grad_norm": 0.7416720662788616, "learning_rate": 1.6125138504086146e-07, "loss": 0.2859, "loss_nan_ranks": 0, "loss_rank_avg": 0.10707104951143265, "step": 4210, "valid_targets_mean": 2630.2, "valid_targets_min": 855 }, { "epoch": 6.755412991178829, "grad_norm": 0.5671208154371713, "learning_rate": 1.5128185157367247e-07, "loss": 0.278, "loss_nan_ranks": 0, "loss_rank_avg": 0.13333214819431305, "step": 4215, "valid_targets_mean": 4998.6, "valid_targets_min": 1238 }, { "epoch": 6.763432237369687, "grad_norm": 0.7000691617144927, "learning_rate": 1.4162924971393044e-07, "loss": 0.2858, "loss_nan_ranks": 0, "loss_rank_avg": 0.16572439670562744, "step": 4220, "valid_targets_mean": 4097.9, "valid_targets_min": 1808 }, { "epoch": 6.771451483560545, "grad_norm": 1.0427903862301446, "learning_rate": 1.322937335881891e-07, "loss": 0.2674, "loss_nan_ranks": 0, "loss_rank_avg": 0.14080201089382172, "step": 4225, "valid_targets_mean": 4474.2, "valid_targets_min": 1133 }, { "epoch": 6.779470729751403, "grad_norm": 0.604225087803022, "learning_rate": 1.2327545225999215e-07, "loss": 0.2545, "loss_nan_ranks": 0, "loss_rank_avg": 0.16035734117031097, "step": 4230, "valid_targets_mean": 5771.0, "valid_targets_min": 1022 }, { "epoch": 6.787489975942261, "grad_norm": 0.7120534688025915, "learning_rate": 1.145745497274664e-07, "loss": 0.2602, "loss_nan_ranks": 0, "loss_rank_avg": 0.16921287775039673, "step": 4235, "valid_targets_mean": 4174.0, "valid_targets_min": 1988 }, { "epoch": 6.79550922213312, "grad_norm": 0.7648717180045367, "learning_rate": 1.061911649210523e-07, "loss": 0.2829, "loss_nan_ranks": 0, "loss_rank_avg": 0.1884380578994751, "step": 4240, "valid_targets_mean": 5023.6, "valid_targets_min": 1372 }, { "epoch": 6.803528468323978, "grad_norm": 0.6388536724286882, "learning_rate": 9.812543170126365e-08, "loss": 0.2469, "loss_nan_ranks": 0, "loss_rank_avg": 0.11434964835643768, "step": 4245, "valid_targets_mean": 4338.6, "valid_targets_min": 2334 }, { "epoch": 6.811547714514836, "grad_norm": 0.7270357721190687, "learning_rate": 9.03774788565559e-08, "loss": 0.2846, "loss_nan_ranks": 0, "loss_rank_avg": 0.24188214540481567, "step": 4250, "valid_targets_mean": 5134.2, "valid_targets_min": 1123 }, { "epoch": 6.819566960705694, "grad_norm": 0.8119218603253432, "learning_rate": 8.294743010127448e-08, "loss": 0.2646, "loss_nan_ranks": 0, "loss_rank_avg": 0.15277987718582153, "step": 4255, "valid_targets_mean": 2758.6, "valid_targets_min": 858 }, { "epoch": 6.827586206896552, "grad_norm": 0.7089787347354933, "learning_rate": 7.583540407367418e-08, "loss": 0.2769, "loss_nan_ranks": 0, "loss_rank_avg": 0.17936328053474426, "step": 4260, "valid_targets_mean": 3873.8, "valid_targets_min": 1148 }, { "epoch": 6.8356054530874095, "grad_norm": 0.733927681130997, "learning_rate": 6.904151433402728e-08, "loss": 0.2729, "loss_nan_ranks": 0, "loss_rank_avg": 0.18088877201080322, "step": 4265, "valid_targets_mean": 5007.8, "valid_targets_min": 1377 }, { "epoch": 6.843624699278267, "grad_norm": 0.7031485625421123, "learning_rate": 6.256586936281172e-08, "loss": 0.2865, "loss_nan_ranks": 0, "loss_rank_avg": 0.10452007502317429, "step": 4270, "valid_targets_mean": 2666.0, "valid_targets_min": 1150 }, { "epoch": 6.851643945469126, "grad_norm": 0.6652572684887978, "learning_rate": 5.6408572558972475e-08, "loss": 0.2957, "loss_nan_ranks": 0, "loss_rank_avg": 0.13122780621051788, "step": 4275, "valid_targets_mean": 3638.0, "valid_targets_min": 1016 }, { "epoch": 6.859663191659984, "grad_norm": 0.6857482931865787, "learning_rate": 5.0569722238280605e-08, "loss": 0.273, "loss_nan_ranks": 0, "loss_rank_avg": 0.16107389330863953, "step": 4280, "valid_targets_mean": 4468.1, "valid_targets_min": 803 }, { "epoch": 6.867682437850842, "grad_norm": 0.72913675672226, "learning_rate": 4.504941163175236e-08, "loss": 0.273, "loss_nan_ranks": 0, "loss_rank_avg": 0.14377540349960327, "step": 4285, "valid_targets_mean": 3290.5, "valid_targets_min": 1286 }, { "epoch": 6.8757016840417, "grad_norm": 0.6468123069769464, "learning_rate": 3.984772888417032e-08, "loss": 0.2614, "loss_nan_ranks": 0, "loss_rank_avg": 0.16589681804180145, "step": 4290, "valid_targets_mean": 6056.2, "valid_targets_min": 1364 }, { "epoch": 6.883720930232558, "grad_norm": 0.6669737110792908, "learning_rate": 3.4964757052671216e-08, "loss": 0.2664, "loss_nan_ranks": 0, "loss_rank_avg": 0.14455217123031616, "step": 4295, "valid_targets_mean": 4423.9, "valid_targets_min": 2216 }, { "epoch": 6.891740176423416, "grad_norm": 0.6447822559671433, "learning_rate": 3.0400574105415856e-08, "loss": 0.2685, "loss_nan_ranks": 0, "loss_rank_avg": 0.10480152070522308, "step": 4300, "valid_targets_mean": 3992.2, "valid_targets_min": 1304 }, { "epoch": 6.899759422614274, "grad_norm": 0.6269333630594336, "learning_rate": 2.615525292035459e-08, "loss": 0.2787, "loss_nan_ranks": 0, "loss_rank_avg": 0.20834621787071228, "step": 4305, "valid_targets_mean": 6044.5, "valid_targets_min": 1353 }, { "epoch": 6.907778668805133, "grad_norm": 0.6801689751096721, "learning_rate": 2.222886128405266e-08, "loss": 0.2638, "loss_nan_ranks": 0, "loss_rank_avg": 0.10578888654708862, "step": 4310, "valid_targets_mean": 2282.5, "valid_targets_min": 1331 }, { "epoch": 6.9157979149959905, "grad_norm": 0.616271937547341, "learning_rate": 1.8621461890617752e-08, "loss": 0.2574, "loss_nan_ranks": 0, "loss_rank_avg": 0.0919659286737442, "step": 4315, "valid_targets_mean": 2920.1, "valid_targets_min": 1139 }, { "epoch": 6.923817161186848, "grad_norm": 0.6251342212375184, "learning_rate": 1.5333112340687463e-08, "loss": 0.2624, "loss_nan_ranks": 0, "loss_rank_avg": 0.1263146996498108, "step": 4320, "valid_targets_mean": 4399.0, "valid_targets_min": 1203 }, { "epoch": 6.931836407377706, "grad_norm": 0.8172684670405291, "learning_rate": 1.2363865140518905e-08, "loss": 0.2673, "loss_nan_ranks": 0, "loss_rank_avg": 0.1875896155834198, "step": 4325, "valid_targets_mean": 3179.0, "valid_targets_min": 1288 }, { "epoch": 6.939855653568564, "grad_norm": 0.6804193695635374, "learning_rate": 9.713767701151621e-09, "loss": 0.276, "loss_nan_ranks": 0, "loss_rank_avg": 0.14937788248062134, "step": 4330, "valid_targets_mean": 5056.6, "valid_targets_min": 1414 }, { "epoch": 6.947874899759423, "grad_norm": 0.7198516572202387, "learning_rate": 7.382862337641516e-09, "loss": 0.2747, "loss_nan_ranks": 0, "loss_rank_avg": 0.14979767799377441, "step": 4335, "valid_targets_mean": 3678.6, "valid_targets_min": 1477 }, { "epoch": 6.955894145950281, "grad_norm": 0.8585805179317972, "learning_rate": 5.371186268390283e-09, "loss": 0.268, "loss_nan_ranks": 0, "loss_rank_avg": 0.1378738284111023, "step": 4340, "valid_targets_mean": 2880.1, "valid_targets_min": 1239 }, { "epoch": 6.963913392141139, "grad_norm": 0.7632442302373305, "learning_rate": 3.678771614550325e-09, "loss": 0.2667, "loss_nan_ranks": 0, "loss_rank_avg": 0.21591196954250336, "step": 4345, "valid_targets_mean": 4265.0, "valid_targets_min": 2028 }, { "epoch": 6.971932638331997, "grad_norm": 0.6597310967858202, "learning_rate": 2.3056453995162763e-09, "loss": 0.301, "loss_nan_ranks": 0, "loss_rank_avg": 0.1997801512479782, "step": 4350, "valid_targets_mean": 5230.1, "valid_targets_min": 2152 }, { "epoch": 6.979951884522855, "grad_norm": 0.6935715453803216, "learning_rate": 1.2518295484875708e-09, "loss": 0.292, "loss_nan_ranks": 0, "loss_rank_avg": 0.13192936778068542, "step": 4355, "valid_targets_mean": 3180.9, "valid_targets_min": 1182 }, { "epoch": 6.987971130713713, "grad_norm": 0.6257334178571583, "learning_rate": 5.173408881198328e-10, "loss": 0.2476, "loss_nan_ranks": 0, "loss_rank_avg": 0.1475430130958557, "step": 4360, "valid_targets_mean": 5180.1, "valid_targets_min": 2119 }, { "epoch": 6.995990376904571, "grad_norm": 0.6404645600840769, "learning_rate": 1.0219114625398263e-10, "loss": 0.2712, "loss_nan_ranks": 0, "loss_rank_avg": 0.07926057279109955, "step": 4365, "valid_targets_mean": 2509.1, "valid_targets_min": 915 }, { "epoch": 7.0, "loss_nan_ranks": 0, "loss_rank_avg": 0.3030981719493866, "step": 4368, "total_flos": 1.299011914721919e+18, "train_loss": 0.3405153105383391, "train_runtime": 50827.1401, "train_samples_per_second": 1.373, "train_steps_per_second": 0.086, "valid_targets_mean": 4862.5, "valid_targets_min": 1479 } ], "logging_steps": 5, "max_steps": 4368, "num_input_tokens_seen": 0, "num_train_epochs": 7, "save_steps": 1500, "stateful_callbacks": { "TrainerControl": { "args": { "should_epoch_stop": false, "should_evaluate": false, "should_log": false, "should_save": true, "should_training_stop": true }, "attributes": {} } }, "total_flos": 1.299011914721919e+18, "train_batch_size": 1, "trial_name": null, "trial_params": null }