{ "best_global_step": null, "best_metric": null, "best_model_checkpoint": null, "epoch": 5.0, "eval_steps": 500, "global_step": 8475, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.0029498525073746312, "grad_norm": 8.773958827225787, "learning_rate": 1.886792452830189e-07, "loss": 0.9616, "loss_nan_ranks": 0, "loss_rank_avg": 0.2874046862125397, "step": 5, "valid_targets_mean": 9206.2, "valid_targets_min": 1498 }, { "epoch": 0.0058997050147492625, "grad_norm": 8.43130406707678, "learning_rate": 4.2452830188679244e-07, "loss": 0.9704, "loss_nan_ranks": 0, "loss_rank_avg": 0.2660023272037506, "step": 10, "valid_targets_mean": 8719.1, "valid_targets_min": 1566 }, { "epoch": 0.008849557522123894, "grad_norm": 7.980973049789234, "learning_rate": 6.603773584905661e-07, "loss": 0.9721, "loss_nan_ranks": 0, "loss_rank_avg": 0.31450343132019043, "step": 15, "valid_targets_mean": 10767.6, "valid_targets_min": 1915 }, { "epoch": 0.011799410029498525, "grad_norm": 6.592074179405163, "learning_rate": 8.962264150943397e-07, "loss": 0.939, "loss_nan_ranks": 0, "loss_rank_avg": 0.2821187973022461, "step": 20, "valid_targets_mean": 9179.4, "valid_targets_min": 2072 }, { "epoch": 0.014749262536873156, "grad_norm": 5.341472842760085, "learning_rate": 1.1320754716981133e-06, "loss": 0.9091, "loss_nan_ranks": 0, "loss_rank_avg": 0.2598068118095398, "step": 25, "valid_targets_mean": 7131.3, "valid_targets_min": 1543 }, { "epoch": 0.017699115044247787, "grad_norm": 3.625836875106732, "learning_rate": 1.3679245283018869e-06, "loss": 0.8698, "loss_nan_ranks": 0, "loss_rank_avg": 0.28657275438308716, "step": 30, "valid_targets_mean": 10059.4, "valid_targets_min": 1912 }, { "epoch": 0.02064896755162242, "grad_norm": 2.4455995461055537, "learning_rate": 1.6037735849056604e-06, "loss": 0.8339, "loss_nan_ranks": 0, "loss_rank_avg": 0.25056618452072144, "step": 35, "valid_targets_mean": 8692.7, "valid_targets_min": 2885 }, { "epoch": 0.02359882005899705, "grad_norm": 1.671129853566953, "learning_rate": 1.839622641509434e-06, "loss": 0.8019, "loss_nan_ranks": 0, "loss_rank_avg": 0.2268742173910141, "step": 40, "valid_targets_mean": 9311.7, "valid_targets_min": 1693 }, { "epoch": 0.02654867256637168, "grad_norm": 1.4983532466868172, "learning_rate": 2.075471698113208e-06, "loss": 0.7848, "loss_nan_ranks": 0, "loss_rank_avg": 0.24425435066223145, "step": 45, "valid_targets_mean": 10148.1, "valid_targets_min": 2792 }, { "epoch": 0.029498525073746312, "grad_norm": 1.1050377261180897, "learning_rate": 2.3113207547169815e-06, "loss": 0.7493, "loss_nan_ranks": 0, "loss_rank_avg": 0.2659146189689636, "step": 50, "valid_targets_mean": 10758.8, "valid_targets_min": 2016 }, { "epoch": 0.032448377581120944, "grad_norm": 0.84276225776089, "learning_rate": 2.547169811320755e-06, "loss": 0.7382, "loss_nan_ranks": 0, "loss_rank_avg": 0.2542104721069336, "step": 55, "valid_targets_mean": 9880.1, "valid_targets_min": 1422 }, { "epoch": 0.035398230088495575, "grad_norm": 0.7161442776999163, "learning_rate": 2.7830188679245286e-06, "loss": 0.7227, "loss_nan_ranks": 0, "loss_rank_avg": 0.2537986636161804, "step": 60, "valid_targets_mean": 10118.1, "valid_targets_min": 1520 }, { "epoch": 0.038348082595870206, "grad_norm": 0.5278769329869252, "learning_rate": 3.018867924528302e-06, "loss": 0.698, "loss_nan_ranks": 0, "loss_rank_avg": 0.22161734104156494, "step": 65, "valid_targets_mean": 10715.5, "valid_targets_min": 1277 }, { "epoch": 0.04129793510324484, "grad_norm": 0.48264794318692644, "learning_rate": 3.2547169811320758e-06, "loss": 0.6842, "loss_nan_ranks": 0, "loss_rank_avg": 0.23746953904628754, "step": 70, "valid_targets_mean": 10908.8, "valid_targets_min": 689 }, { "epoch": 0.04424778761061947, "grad_norm": 0.3981010617617588, "learning_rate": 3.4905660377358493e-06, "loss": 0.6673, "loss_nan_ranks": 0, "loss_rank_avg": 0.26581302285194397, "step": 75, "valid_targets_mean": 11115.4, "valid_targets_min": 2402 }, { "epoch": 0.0471976401179941, "grad_norm": 0.39704919780613845, "learning_rate": 3.726415094339623e-06, "loss": 0.6438, "loss_nan_ranks": 0, "loss_rank_avg": 0.24585619568824768, "step": 80, "valid_targets_mean": 11587.3, "valid_targets_min": 3348 }, { "epoch": 0.05014749262536873, "grad_norm": 0.3005424445383612, "learning_rate": 3.962264150943396e-06, "loss": 0.629, "loss_nan_ranks": 0, "loss_rank_avg": 0.2160702645778656, "step": 85, "valid_targets_mean": 10653.8, "valid_targets_min": 2047 }, { "epoch": 0.05309734513274336, "grad_norm": 0.2623859001613278, "learning_rate": 4.19811320754717e-06, "loss": 0.6211, "loss_nan_ranks": 0, "loss_rank_avg": 0.22089292109012604, "step": 90, "valid_targets_mean": 11910.6, "valid_targets_min": 2312 }, { "epoch": 0.05604719764011799, "grad_norm": 0.27019333924019306, "learning_rate": 4.4339622641509435e-06, "loss": 0.6044, "loss_nan_ranks": 0, "loss_rank_avg": 0.1921449899673462, "step": 95, "valid_targets_mean": 9248.5, "valid_targets_min": 1411 }, { "epoch": 0.058997050147492625, "grad_norm": 0.24358668760990093, "learning_rate": 4.6698113207547175e-06, "loss": 0.5878, "loss_nan_ranks": 0, "loss_rank_avg": 0.19868874549865723, "step": 100, "valid_targets_mean": 8963.3, "valid_targets_min": 1519 }, { "epoch": 0.061946902654867256, "grad_norm": 0.2317817621237028, "learning_rate": 4.905660377358491e-06, "loss": 0.5809, "loss_nan_ranks": 0, "loss_rank_avg": 0.15674249827861786, "step": 105, "valid_targets_mean": 9282.0, "valid_targets_min": 1902 }, { "epoch": 0.06489675516224189, "grad_norm": 0.21518580064198847, "learning_rate": 5.1415094339622655e-06, "loss": 0.5668, "loss_nan_ranks": 0, "loss_rank_avg": 0.15662211179733276, "step": 110, "valid_targets_mean": 8392.4, "valid_targets_min": 2588 }, { "epoch": 0.06784660766961652, "grad_norm": 0.22321760855402145, "learning_rate": 5.377358490566038e-06, "loss": 0.5676, "loss_nan_ranks": 0, "loss_rank_avg": 0.20928239822387695, "step": 115, "valid_targets_mean": 11378.3, "valid_targets_min": 2407 }, { "epoch": 0.07079646017699115, "grad_norm": 0.2365011327381435, "learning_rate": 5.613207547169813e-06, "loss": 0.5627, "loss_nan_ranks": 0, "loss_rank_avg": 0.18675848841667175, "step": 120, "valid_targets_mean": 9986.8, "valid_targets_min": 2330 }, { "epoch": 0.07374631268436578, "grad_norm": 0.21095555367092353, "learning_rate": 5.849056603773585e-06, "loss": 0.5494, "loss_nan_ranks": 0, "loss_rank_avg": 0.20561310648918152, "step": 125, "valid_targets_mean": 13140.6, "valid_targets_min": 2373 }, { "epoch": 0.07669616519174041, "grad_norm": 0.2254076492475572, "learning_rate": 6.08490566037736e-06, "loss": 0.5456, "loss_nan_ranks": 0, "loss_rank_avg": 0.16216091811656952, "step": 130, "valid_targets_mean": 9226.3, "valid_targets_min": 1613 }, { "epoch": 0.07964601769911504, "grad_norm": 0.22864199872760177, "learning_rate": 6.320754716981132e-06, "loss": 0.5343, "loss_nan_ranks": 0, "loss_rank_avg": 0.15893808007240295, "step": 135, "valid_targets_mean": 8972.0, "valid_targets_min": 2220 }, { "epoch": 0.08259587020648967, "grad_norm": 0.22340821685443538, "learning_rate": 6.556603773584907e-06, "loss": 0.5382, "loss_nan_ranks": 0, "loss_rank_avg": 0.15970075130462646, "step": 140, "valid_targets_mean": 9749.8, "valid_targets_min": 1853 }, { "epoch": 0.0855457227138643, "grad_norm": 0.2105247063608589, "learning_rate": 6.792452830188679e-06, "loss": 0.5374, "loss_nan_ranks": 0, "loss_rank_avg": 0.2028973549604416, "step": 145, "valid_targets_mean": 12082.2, "valid_targets_min": 1279 }, { "epoch": 0.08849557522123894, "grad_norm": 0.22580596780293535, "learning_rate": 7.028301886792454e-06, "loss": 0.5317, "loss_nan_ranks": 0, "loss_rank_avg": 0.16002820432186127, "step": 150, "valid_targets_mean": 10171.3, "valid_targets_min": 2108 }, { "epoch": 0.09144542772861357, "grad_norm": 0.2797740687314117, "learning_rate": 7.264150943396226e-06, "loss": 0.5311, "loss_nan_ranks": 0, "loss_rank_avg": 0.16304832696914673, "step": 155, "valid_targets_mean": 8414.3, "valid_targets_min": 2331 }, { "epoch": 0.0943952802359882, "grad_norm": 0.24060452477660244, "learning_rate": 7.500000000000001e-06, "loss": 0.525, "loss_nan_ranks": 0, "loss_rank_avg": 0.168437197804451, "step": 160, "valid_targets_mean": 9946.0, "valid_targets_min": 2071 }, { "epoch": 0.09734513274336283, "grad_norm": 0.26990784653362826, "learning_rate": 7.735849056603775e-06, "loss": 0.5303, "loss_nan_ranks": 0, "loss_rank_avg": 0.23207911849021912, "step": 165, "valid_targets_mean": 11584.8, "valid_targets_min": 2526 }, { "epoch": 0.10029498525073746, "grad_norm": 0.21813379853235298, "learning_rate": 7.971698113207547e-06, "loss": 0.5219, "loss_nan_ranks": 0, "loss_rank_avg": 0.17449553310871124, "step": 170, "valid_targets_mean": 11271.9, "valid_targets_min": 2150 }, { "epoch": 0.10324483775811209, "grad_norm": 0.2177784266608873, "learning_rate": 8.207547169811321e-06, "loss": 0.5211, "loss_nan_ranks": 0, "loss_rank_avg": 0.1942562758922577, "step": 175, "valid_targets_mean": 11034.4, "valid_targets_min": 1379 }, { "epoch": 0.10619469026548672, "grad_norm": 0.2365221311955703, "learning_rate": 8.443396226415095e-06, "loss": 0.5156, "loss_nan_ranks": 0, "loss_rank_avg": 0.173548623919487, "step": 180, "valid_targets_mean": 11233.3, "valid_targets_min": 1872 }, { "epoch": 0.10914454277286136, "grad_norm": 0.22263607666515303, "learning_rate": 8.67924528301887e-06, "loss": 0.5137, "loss_nan_ranks": 0, "loss_rank_avg": 0.176674023270607, "step": 185, "valid_targets_mean": 10453.3, "valid_targets_min": 1094 }, { "epoch": 0.11209439528023599, "grad_norm": 0.22259600474883798, "learning_rate": 8.915094339622642e-06, "loss": 0.5103, "loss_nan_ranks": 0, "loss_rank_avg": 0.21244749426841736, "step": 190, "valid_targets_mean": 13592.8, "valid_targets_min": 2893 }, { "epoch": 0.11504424778761062, "grad_norm": 0.23853918792073867, "learning_rate": 9.150943396226416e-06, "loss": 0.5119, "loss_nan_ranks": 0, "loss_rank_avg": 0.15338359773159027, "step": 195, "valid_targets_mean": 9848.4, "valid_targets_min": 2305 }, { "epoch": 0.11799410029498525, "grad_norm": 0.24544705784022192, "learning_rate": 9.38679245283019e-06, "loss": 0.5113, "loss_nan_ranks": 0, "loss_rank_avg": 0.15049920976161957, "step": 200, "valid_targets_mean": 8824.9, "valid_targets_min": 1762 }, { "epoch": 0.12094395280235988, "grad_norm": 0.23996923684824645, "learning_rate": 9.622641509433963e-06, "loss": 0.5036, "loss_nan_ranks": 0, "loss_rank_avg": 0.17622515559196472, "step": 205, "valid_targets_mean": 10279.9, "valid_targets_min": 993 }, { "epoch": 0.12389380530973451, "grad_norm": 0.2356178723103165, "learning_rate": 9.858490566037736e-06, "loss": 0.5047, "loss_nan_ranks": 0, "loss_rank_avg": 0.16885659098625183, "step": 210, "valid_targets_mean": 9878.6, "valid_targets_min": 1434 }, { "epoch": 0.12684365781710916, "grad_norm": 0.2593343578467735, "learning_rate": 1.0094339622641511e-05, "loss": 0.5052, "loss_nan_ranks": 0, "loss_rank_avg": 0.15777814388275146, "step": 215, "valid_targets_mean": 9382.0, "valid_targets_min": 1289 }, { "epoch": 0.12979351032448377, "grad_norm": 0.23853635794945394, "learning_rate": 1.0330188679245284e-05, "loss": 0.5059, "loss_nan_ranks": 0, "loss_rank_avg": 0.1759573519229889, "step": 220, "valid_targets_mean": 9724.2, "valid_targets_min": 2358 }, { "epoch": 0.13274336283185842, "grad_norm": 0.25629620309918427, "learning_rate": 1.0566037735849058e-05, "loss": 0.5033, "loss_nan_ranks": 0, "loss_rank_avg": 0.17160122096538544, "step": 225, "valid_targets_mean": 11027.6, "valid_targets_min": 1069 }, { "epoch": 0.13569321533923304, "grad_norm": 0.28852388125039813, "learning_rate": 1.0801886792452832e-05, "loss": 0.499, "loss_nan_ranks": 0, "loss_rank_avg": 0.1474302113056183, "step": 230, "valid_targets_mean": 9196.5, "valid_targets_min": 536 }, { "epoch": 0.13864306784660768, "grad_norm": 0.24690849305589715, "learning_rate": 1.1037735849056606e-05, "loss": 0.5006, "loss_nan_ranks": 0, "loss_rank_avg": 0.15746231377124786, "step": 235, "valid_targets_mean": 9754.9, "valid_targets_min": 1806 }, { "epoch": 0.1415929203539823, "grad_norm": 0.28233830897850076, "learning_rate": 1.1273584905660378e-05, "loss": 0.5022, "loss_nan_ranks": 0, "loss_rank_avg": 0.1537265032529831, "step": 240, "valid_targets_mean": 9171.2, "valid_targets_min": 1140 }, { "epoch": 0.14454277286135694, "grad_norm": 0.25448817250054345, "learning_rate": 1.1509433962264152e-05, "loss": 0.4989, "loss_nan_ranks": 0, "loss_rank_avg": 0.16555047035217285, "step": 245, "valid_targets_mean": 9798.3, "valid_targets_min": 1344 }, { "epoch": 0.14749262536873156, "grad_norm": 0.27603293860374156, "learning_rate": 1.1745283018867926e-05, "loss": 0.5022, "loss_nan_ranks": 0, "loss_rank_avg": 0.15127146244049072, "step": 250, "valid_targets_mean": 8997.8, "valid_targets_min": 2398 }, { "epoch": 0.1504424778761062, "grad_norm": 0.28094160412298935, "learning_rate": 1.19811320754717e-05, "loss": 0.5008, "loss_nan_ranks": 0, "loss_rank_avg": 0.18154668807983398, "step": 255, "valid_targets_mean": 10034.7, "valid_targets_min": 1739 }, { "epoch": 0.15339233038348082, "grad_norm": 0.272720858377614, "learning_rate": 1.2216981132075472e-05, "loss": 0.4942, "loss_nan_ranks": 0, "loss_rank_avg": 0.14723987877368927, "step": 260, "valid_targets_mean": 9813.8, "valid_targets_min": 1050 }, { "epoch": 0.15634218289085547, "grad_norm": 0.24896110011232206, "learning_rate": 1.2452830188679246e-05, "loss": 0.4967, "loss_nan_ranks": 0, "loss_rank_avg": 0.15721940994262695, "step": 265, "valid_targets_mean": 10142.0, "valid_targets_min": 2362 }, { "epoch": 0.1592920353982301, "grad_norm": 0.2384263642596385, "learning_rate": 1.268867924528302e-05, "loss": 0.4927, "loss_nan_ranks": 0, "loss_rank_avg": 0.16213515400886536, "step": 270, "valid_targets_mean": 10334.2, "valid_targets_min": 1215 }, { "epoch": 0.16224188790560473, "grad_norm": 0.26632949187377725, "learning_rate": 1.2924528301886794e-05, "loss": 0.4914, "loss_nan_ranks": 0, "loss_rank_avg": 0.13655009865760803, "step": 275, "valid_targets_mean": 7946.3, "valid_targets_min": 1646 }, { "epoch": 0.16519174041297935, "grad_norm": 0.2848379528640083, "learning_rate": 1.3160377358490568e-05, "loss": 0.4907, "loss_nan_ranks": 0, "loss_rank_avg": 0.16915015876293182, "step": 280, "valid_targets_mean": 10197.9, "valid_targets_min": 2517 }, { "epoch": 0.168141592920354, "grad_norm": 0.2503018600734144, "learning_rate": 1.339622641509434e-05, "loss": 0.5004, "loss_nan_ranks": 0, "loss_rank_avg": 0.1548536717891693, "step": 285, "valid_targets_mean": 9506.9, "valid_targets_min": 2134 }, { "epoch": 0.1710914454277286, "grad_norm": 0.24628942797179826, "learning_rate": 1.3632075471698114e-05, "loss": 0.4874, "loss_nan_ranks": 0, "loss_rank_avg": 0.15937039256095886, "step": 290, "valid_targets_mean": 10417.7, "valid_targets_min": 1786 }, { "epoch": 0.17404129793510326, "grad_norm": 0.27090595503730375, "learning_rate": 1.3867924528301888e-05, "loss": 0.4737, "loss_nan_ranks": 0, "loss_rank_avg": 0.16793963313102722, "step": 295, "valid_targets_mean": 10820.2, "valid_targets_min": 2213 }, { "epoch": 0.17699115044247787, "grad_norm": 0.26417038077590604, "learning_rate": 1.4103773584905662e-05, "loss": 0.4866, "loss_nan_ranks": 0, "loss_rank_avg": 0.18323713541030884, "step": 300, "valid_targets_mean": 12955.4, "valid_targets_min": 1467 }, { "epoch": 0.17994100294985252, "grad_norm": 0.23601605137120854, "learning_rate": 1.4339622641509435e-05, "loss": 0.4893, "loss_nan_ranks": 0, "loss_rank_avg": 0.1528908610343933, "step": 305, "valid_targets_mean": 10078.7, "valid_targets_min": 1501 }, { "epoch": 0.18289085545722714, "grad_norm": 0.2531068673705301, "learning_rate": 1.4575471698113209e-05, "loss": 0.4851, "loss_nan_ranks": 0, "loss_rank_avg": 0.13879773020744324, "step": 310, "valid_targets_mean": 8772.9, "valid_targets_min": 1174 }, { "epoch": 0.18584070796460178, "grad_norm": 0.27397534098938575, "learning_rate": 1.4811320754716983e-05, "loss": 0.4808, "loss_nan_ranks": 0, "loss_rank_avg": 0.16207556426525116, "step": 315, "valid_targets_mean": 10604.9, "valid_targets_min": 1801 }, { "epoch": 0.1887905604719764, "grad_norm": 0.2267842788550988, "learning_rate": 1.5047169811320757e-05, "loss": 0.4775, "loss_nan_ranks": 0, "loss_rank_avg": 0.14752934873104095, "step": 320, "valid_targets_mean": 8825.4, "valid_targets_min": 2007 }, { "epoch": 0.19174041297935104, "grad_norm": 0.2499831182134859, "learning_rate": 1.5283018867924532e-05, "loss": 0.476, "loss_nan_ranks": 0, "loss_rank_avg": 0.15672816336154938, "step": 325, "valid_targets_mean": 10086.0, "valid_targets_min": 2308 }, { "epoch": 0.19469026548672566, "grad_norm": 0.2631441971415124, "learning_rate": 1.55188679245283e-05, "loss": 0.479, "loss_nan_ranks": 0, "loss_rank_avg": 0.14103585481643677, "step": 330, "valid_targets_mean": 9196.3, "valid_targets_min": 2358 }, { "epoch": 0.1976401179941003, "grad_norm": 0.2918399531224374, "learning_rate": 1.5754716981132077e-05, "loss": 0.4852, "loss_nan_ranks": 0, "loss_rank_avg": 0.13344430923461914, "step": 335, "valid_targets_mean": 8499.4, "valid_targets_min": 1309 }, { "epoch": 0.20058997050147492, "grad_norm": 0.2984964884465926, "learning_rate": 1.599056603773585e-05, "loss": 0.4832, "loss_nan_ranks": 0, "loss_rank_avg": 0.16676054894924164, "step": 340, "valid_targets_mean": 9956.7, "valid_targets_min": 1540 }, { "epoch": 0.20353982300884957, "grad_norm": 0.27016950611621293, "learning_rate": 1.6226415094339625e-05, "loss": 0.4772, "loss_nan_ranks": 0, "loss_rank_avg": 0.1715359091758728, "step": 345, "valid_targets_mean": 10383.4, "valid_targets_min": 2501 }, { "epoch": 0.20648967551622419, "grad_norm": 0.246612135038914, "learning_rate": 1.6462264150943397e-05, "loss": 0.4828, "loss_nan_ranks": 0, "loss_rank_avg": 0.1632922887802124, "step": 350, "valid_targets_mean": 9967.4, "valid_targets_min": 1821 }, { "epoch": 0.20943952802359883, "grad_norm": 0.26017611465367824, "learning_rate": 1.669811320754717e-05, "loss": 0.4765, "loss_nan_ranks": 0, "loss_rank_avg": 0.15242213010787964, "step": 355, "valid_targets_mean": 9924.0, "valid_targets_min": 1816 }, { "epoch": 0.21238938053097345, "grad_norm": 0.251691625498555, "learning_rate": 1.6933962264150945e-05, "loss": 0.471, "loss_nan_ranks": 0, "loss_rank_avg": 0.16618210077285767, "step": 360, "valid_targets_mean": 10049.2, "valid_targets_min": 1217 }, { "epoch": 0.2153392330383481, "grad_norm": 0.2608799009369842, "learning_rate": 1.716981132075472e-05, "loss": 0.4829, "loss_nan_ranks": 0, "loss_rank_avg": 0.1781197488307953, "step": 365, "valid_targets_mean": 12419.6, "valid_targets_min": 2271 }, { "epoch": 0.2182890855457227, "grad_norm": 0.2709855931241016, "learning_rate": 1.740566037735849e-05, "loss": 0.4677, "loss_nan_ranks": 0, "loss_rank_avg": 0.18040911853313446, "step": 370, "valid_targets_mean": 10423.2, "valid_targets_min": 1900 }, { "epoch": 0.22123893805309736, "grad_norm": 0.2922486386967908, "learning_rate": 1.7641509433962265e-05, "loss": 0.4685, "loss_nan_ranks": 0, "loss_rank_avg": 0.1437935084104538, "step": 375, "valid_targets_mean": 8453.0, "valid_targets_min": 1408 }, { "epoch": 0.22418879056047197, "grad_norm": 0.2509932527846505, "learning_rate": 1.7877358490566038e-05, "loss": 0.4788, "loss_nan_ranks": 0, "loss_rank_avg": 0.15098921954631805, "step": 380, "valid_targets_mean": 9931.7, "valid_targets_min": 2305 }, { "epoch": 0.22713864306784662, "grad_norm": 0.27496741475909753, "learning_rate": 1.8113207547169813e-05, "loss": 0.469, "loss_nan_ranks": 0, "loss_rank_avg": 0.17977483570575714, "step": 385, "valid_targets_mean": 10178.9, "valid_targets_min": 1039 }, { "epoch": 0.23008849557522124, "grad_norm": 0.33037536151215885, "learning_rate": 1.834905660377359e-05, "loss": 0.4732, "loss_nan_ranks": 0, "loss_rank_avg": 0.17215262353420258, "step": 390, "valid_targets_mean": 10581.9, "valid_targets_min": 1697 }, { "epoch": 0.23303834808259588, "grad_norm": 0.2590333044167339, "learning_rate": 1.8584905660377358e-05, "loss": 0.4833, "loss_nan_ranks": 0, "loss_rank_avg": 0.1654370129108429, "step": 395, "valid_targets_mean": 10485.4, "valid_targets_min": 2081 }, { "epoch": 0.2359882005899705, "grad_norm": 0.25165290674930346, "learning_rate": 1.8820754716981133e-05, "loss": 0.4738, "loss_nan_ranks": 0, "loss_rank_avg": 0.16054049134254456, "step": 400, "valid_targets_mean": 10634.4, "valid_targets_min": 1494 }, { "epoch": 0.23893805309734514, "grad_norm": 0.2558867155213945, "learning_rate": 1.905660377358491e-05, "loss": 0.4624, "loss_nan_ranks": 0, "loss_rank_avg": 0.14743725955486298, "step": 405, "valid_targets_mean": 9134.9, "valid_targets_min": 1983 }, { "epoch": 0.24188790560471976, "grad_norm": 0.320593320482016, "learning_rate": 1.929245283018868e-05, "loss": 0.4771, "loss_nan_ranks": 0, "loss_rank_avg": 0.13047058880329132, "step": 410, "valid_targets_mean": 7631.4, "valid_targets_min": 1308 }, { "epoch": 0.2448377581120944, "grad_norm": 0.249814248566448, "learning_rate": 1.9528301886792454e-05, "loss": 0.4706, "loss_nan_ranks": 0, "loss_rank_avg": 0.15469786524772644, "step": 415, "valid_targets_mean": 11488.8, "valid_targets_min": 3111 }, { "epoch": 0.24778761061946902, "grad_norm": 0.2657696546498897, "learning_rate": 1.9764150943396226e-05, "loss": 0.4683, "loss_nan_ranks": 0, "loss_rank_avg": 0.13970687985420227, "step": 420, "valid_targets_mean": 9848.1, "valid_targets_min": 1539 }, { "epoch": 0.25073746312684364, "grad_norm": 0.26882223733506905, "learning_rate": 2e-05, "loss": 0.4648, "loss_nan_ranks": 0, "loss_rank_avg": 0.17859773337841034, "step": 425, "valid_targets_mean": 12024.1, "valid_targets_min": 2727 }, { "epoch": 0.2536873156342183, "grad_norm": 0.246210269985762, "learning_rate": 2.0235849056603777e-05, "loss": 0.4701, "loss_nan_ranks": 0, "loss_rank_avg": 0.15420570969581604, "step": 430, "valid_targets_mean": 9545.0, "valid_targets_min": 1882 }, { "epoch": 0.25663716814159293, "grad_norm": 0.29785060543263786, "learning_rate": 2.047169811320755e-05, "loss": 0.4718, "loss_nan_ranks": 0, "loss_rank_avg": 0.1376991719007492, "step": 435, "valid_targets_mean": 8259.6, "valid_targets_min": 1045 }, { "epoch": 0.25958702064896755, "grad_norm": 0.28985379658927735, "learning_rate": 2.0707547169811325e-05, "loss": 0.4684, "loss_nan_ranks": 0, "loss_rank_avg": 0.1606501042842865, "step": 440, "valid_targets_mean": 10127.1, "valid_targets_min": 1797 }, { "epoch": 0.26253687315634217, "grad_norm": 0.2814165129117154, "learning_rate": 2.0943396226415098e-05, "loss": 0.4692, "loss_nan_ranks": 0, "loss_rank_avg": 0.14782124757766724, "step": 445, "valid_targets_mean": 8850.4, "valid_targets_min": 1524 }, { "epoch": 0.26548672566371684, "grad_norm": 0.2797668741402931, "learning_rate": 2.1179245283018866e-05, "loss": 0.4714, "loss_nan_ranks": 0, "loss_rank_avg": 0.12928162515163422, "step": 450, "valid_targets_mean": 8547.2, "valid_targets_min": 1657 }, { "epoch": 0.26843657817109146, "grad_norm": 0.2528656289681847, "learning_rate": 2.1415094339622642e-05, "loss": 0.4636, "loss_nan_ranks": 0, "loss_rank_avg": 0.13063043355941772, "step": 455, "valid_targets_mean": 7498.9, "valid_targets_min": 2006 }, { "epoch": 0.2713864306784661, "grad_norm": 0.2581926598105123, "learning_rate": 2.1650943396226414e-05, "loss": 0.4667, "loss_nan_ranks": 0, "loss_rank_avg": 0.16427075862884521, "step": 460, "valid_targets_mean": 10987.5, "valid_targets_min": 2508 }, { "epoch": 0.2743362831858407, "grad_norm": 0.2823206577169872, "learning_rate": 2.188679245283019e-05, "loss": 0.473, "loss_nan_ranks": 0, "loss_rank_avg": 0.14611220359802246, "step": 465, "valid_targets_mean": 10292.0, "valid_targets_min": 2280 }, { "epoch": 0.27728613569321536, "grad_norm": 0.26695133201537186, "learning_rate": 2.2122641509433966e-05, "loss": 0.468, "loss_nan_ranks": 0, "loss_rank_avg": 0.15307700634002686, "step": 470, "valid_targets_mean": 10601.8, "valid_targets_min": 1396 }, { "epoch": 0.28023598820059, "grad_norm": 0.28255841738322507, "learning_rate": 2.2358490566037738e-05, "loss": 0.4624, "loss_nan_ranks": 0, "loss_rank_avg": 0.1726362109184265, "step": 475, "valid_targets_mean": 9942.6, "valid_targets_min": 2133 }, { "epoch": 0.2831858407079646, "grad_norm": 0.2694490289689112, "learning_rate": 2.2594339622641514e-05, "loss": 0.4713, "loss_nan_ranks": 0, "loss_rank_avg": 0.1771799623966217, "step": 480, "valid_targets_mean": 9759.4, "valid_targets_min": 1581 }, { "epoch": 0.2861356932153392, "grad_norm": 0.26320630311881227, "learning_rate": 2.2830188679245286e-05, "loss": 0.4658, "loss_nan_ranks": 0, "loss_rank_avg": 0.18050238490104675, "step": 485, "valid_targets_mean": 10620.5, "valid_targets_min": 1461 }, { "epoch": 0.2890855457227139, "grad_norm": 0.2821384330941035, "learning_rate": 2.306603773584906e-05, "loss": 0.4715, "loss_nan_ranks": 0, "loss_rank_avg": 0.13854411244392395, "step": 490, "valid_targets_mean": 8787.5, "valid_targets_min": 2197 }, { "epoch": 0.2920353982300885, "grad_norm": 0.2589089232000087, "learning_rate": 2.330188679245283e-05, "loss": 0.4677, "loss_nan_ranks": 0, "loss_rank_avg": 0.13725772500038147, "step": 495, "valid_targets_mean": 9077.8, "valid_targets_min": 2800 }, { "epoch": 0.2949852507374631, "grad_norm": 0.27484048405379097, "learning_rate": 2.3537735849056603e-05, "loss": 0.4649, "loss_nan_ranks": 0, "loss_rank_avg": 0.16023467481136322, "step": 500, "valid_targets_mean": 9941.8, "valid_targets_min": 2260 }, { "epoch": 0.29793510324483774, "grad_norm": 0.27097915398189687, "learning_rate": 2.377358490566038e-05, "loss": 0.4688, "loss_nan_ranks": 0, "loss_rank_avg": 0.15327778458595276, "step": 505, "valid_targets_mean": 10138.6, "valid_targets_min": 1655 }, { "epoch": 0.3008849557522124, "grad_norm": 0.3090554478712165, "learning_rate": 2.4009433962264154e-05, "loss": 0.4575, "loss_nan_ranks": 0, "loss_rank_avg": 0.1643308848142624, "step": 510, "valid_targets_mean": 9809.2, "valid_targets_min": 1817 }, { "epoch": 0.30383480825958703, "grad_norm": 0.26976590724785876, "learning_rate": 2.4245283018867926e-05, "loss": 0.4662, "loss_nan_ranks": 0, "loss_rank_avg": 0.18249952793121338, "step": 515, "valid_targets_mean": 11053.2, "valid_targets_min": 1891 }, { "epoch": 0.30678466076696165, "grad_norm": 0.30412168245675625, "learning_rate": 2.4481132075471702e-05, "loss": 0.4558, "loss_nan_ranks": 0, "loss_rank_avg": 0.17874681949615479, "step": 520, "valid_targets_mean": 10950.2, "valid_targets_min": 2265 }, { "epoch": 0.30973451327433627, "grad_norm": 0.2436153196597148, "learning_rate": 2.4716981132075474e-05, "loss": 0.4625, "loss_nan_ranks": 0, "loss_rank_avg": 0.1472557932138443, "step": 525, "valid_targets_mean": 9727.5, "valid_targets_min": 1294 }, { "epoch": 0.31268436578171094, "grad_norm": 0.25885412101342653, "learning_rate": 2.495283018867925e-05, "loss": 0.468, "loss_nan_ranks": 0, "loss_rank_avg": 0.16035309433937073, "step": 530, "valid_targets_mean": 10823.4, "valid_targets_min": 2542 }, { "epoch": 0.31563421828908556, "grad_norm": 0.30705913319043077, "learning_rate": 2.5188679245283022e-05, "loss": 0.4593, "loss_nan_ranks": 0, "loss_rank_avg": 0.15604931116104126, "step": 535, "valid_targets_mean": 10381.6, "valid_targets_min": 1504 }, { "epoch": 0.3185840707964602, "grad_norm": 0.28099029262967157, "learning_rate": 2.542452830188679e-05, "loss": 0.4574, "loss_nan_ranks": 0, "loss_rank_avg": 0.17848971486091614, "step": 540, "valid_targets_mean": 10812.6, "valid_targets_min": 1055 }, { "epoch": 0.3215339233038348, "grad_norm": 0.28014050592117723, "learning_rate": 2.5660377358490567e-05, "loss": 0.4637, "loss_nan_ranks": 0, "loss_rank_avg": 0.14001238346099854, "step": 545, "valid_targets_mean": 9040.8, "valid_targets_min": 1130 }, { "epoch": 0.32448377581120946, "grad_norm": 0.3027064554505464, "learning_rate": 2.5896226415094343e-05, "loss": 0.4597, "loss_nan_ranks": 0, "loss_rank_avg": 0.1356821060180664, "step": 550, "valid_targets_mean": 9655.9, "valid_targets_min": 1410 }, { "epoch": 0.3274336283185841, "grad_norm": 0.24986437223369426, "learning_rate": 2.6132075471698115e-05, "loss": 0.4604, "loss_nan_ranks": 0, "loss_rank_avg": 0.13323450088500977, "step": 555, "valid_targets_mean": 8905.6, "valid_targets_min": 1830 }, { "epoch": 0.3303834808259587, "grad_norm": 0.27829745186311433, "learning_rate": 2.636792452830189e-05, "loss": 0.4599, "loss_nan_ranks": 0, "loss_rank_avg": 0.13928677141666412, "step": 560, "valid_targets_mean": 9882.5, "valid_targets_min": 2408 }, { "epoch": 0.3333333333333333, "grad_norm": 0.2716435864042277, "learning_rate": 2.6603773584905663e-05, "loss": 0.4602, "loss_nan_ranks": 0, "loss_rank_avg": 0.14196351170539856, "step": 565, "valid_targets_mean": 9463.4, "valid_targets_min": 1659 }, { "epoch": 0.336283185840708, "grad_norm": 0.3535835553630807, "learning_rate": 2.683962264150944e-05, "loss": 0.4614, "loss_nan_ranks": 0, "loss_rank_avg": 0.14128056168556213, "step": 570, "valid_targets_mean": 11038.2, "valid_targets_min": 1531 }, { "epoch": 0.3392330383480826, "grad_norm": 0.33471177982730127, "learning_rate": 2.707547169811321e-05, "loss": 0.4572, "loss_nan_ranks": 0, "loss_rank_avg": 0.1605977863073349, "step": 575, "valid_targets_mean": 10074.7, "valid_targets_min": 2085 }, { "epoch": 0.3421828908554572, "grad_norm": 0.27189834395930973, "learning_rate": 2.731132075471698e-05, "loss": 0.4621, "loss_nan_ranks": 0, "loss_rank_avg": 0.13230662047863007, "step": 580, "valid_targets_mean": 10108.6, "valid_targets_min": 1642 }, { "epoch": 0.34513274336283184, "grad_norm": 0.32866294091387294, "learning_rate": 2.7547169811320755e-05, "loss": 0.4626, "loss_nan_ranks": 0, "loss_rank_avg": 0.1503252238035202, "step": 585, "valid_targets_mean": 9673.6, "valid_targets_min": 997 }, { "epoch": 0.3480825958702065, "grad_norm": 0.2960662895794109, "learning_rate": 2.7783018867924528e-05, "loss": 0.456, "loss_nan_ranks": 0, "loss_rank_avg": 0.13039669394493103, "step": 590, "valid_targets_mean": 8708.4, "valid_targets_min": 1573 }, { "epoch": 0.35103244837758113, "grad_norm": 0.26573228974936325, "learning_rate": 2.8018867924528303e-05, "loss": 0.4605, "loss_nan_ranks": 0, "loss_rank_avg": 0.17490148544311523, "step": 595, "valid_targets_mean": 12304.2, "valid_targets_min": 1814 }, { "epoch": 0.35398230088495575, "grad_norm": 0.26907409187290865, "learning_rate": 2.825471698113208e-05, "loss": 0.4649, "loss_nan_ranks": 0, "loss_rank_avg": 0.15238738059997559, "step": 600, "valid_targets_mean": 11132.8, "valid_targets_min": 1200 }, { "epoch": 0.35693215339233036, "grad_norm": 0.2774500653590238, "learning_rate": 2.849056603773585e-05, "loss": 0.468, "loss_nan_ranks": 0, "loss_rank_avg": 0.16456542909145355, "step": 605, "valid_targets_mean": 10237.6, "valid_targets_min": 950 }, { "epoch": 0.35988200589970504, "grad_norm": 0.25930731596289175, "learning_rate": 2.8726415094339627e-05, "loss": 0.46, "loss_nan_ranks": 0, "loss_rank_avg": 0.13452622294425964, "step": 610, "valid_targets_mean": 10417.7, "valid_targets_min": 2034 }, { "epoch": 0.36283185840707965, "grad_norm": 0.24490820051848358, "learning_rate": 2.89622641509434e-05, "loss": 0.4486, "loss_nan_ranks": 0, "loss_rank_avg": 0.15420666337013245, "step": 615, "valid_targets_mean": 11726.6, "valid_targets_min": 1312 }, { "epoch": 0.36578171091445427, "grad_norm": 0.2982872806748629, "learning_rate": 2.9198113207547175e-05, "loss": 0.4552, "loss_nan_ranks": 0, "loss_rank_avg": 0.1296735554933548, "step": 620, "valid_targets_mean": 8954.2, "valid_targets_min": 1876 }, { "epoch": 0.3687315634218289, "grad_norm": 0.3250742977113956, "learning_rate": 2.9433962264150944e-05, "loss": 0.4613, "loss_nan_ranks": 0, "loss_rank_avg": 0.17718186974525452, "step": 625, "valid_targets_mean": 10257.4, "valid_targets_min": 2939 }, { "epoch": 0.37168141592920356, "grad_norm": 0.26652767339475386, "learning_rate": 2.9669811320754716e-05, "loss": 0.4555, "loss_nan_ranks": 0, "loss_rank_avg": 0.14411255717277527, "step": 630, "valid_targets_mean": 9281.1, "valid_targets_min": 2123 }, { "epoch": 0.3746312684365782, "grad_norm": 0.26668461534256777, "learning_rate": 2.9905660377358492e-05, "loss": 0.4559, "loss_nan_ranks": 0, "loss_rank_avg": 0.16539090871810913, "step": 635, "valid_targets_mean": 9339.8, "valid_targets_min": 2558 }, { "epoch": 0.3775811209439528, "grad_norm": 0.29462928332592325, "learning_rate": 3.0141509433962268e-05, "loss": 0.4579, "loss_nan_ranks": 0, "loss_rank_avg": 0.15282703936100006, "step": 640, "valid_targets_mean": 9360.2, "valid_targets_min": 2415 }, { "epoch": 0.3805309734513274, "grad_norm": 0.2516067578464611, "learning_rate": 3.037735849056604e-05, "loss": 0.4552, "loss_nan_ranks": 0, "loss_rank_avg": 0.1402677595615387, "step": 645, "valid_targets_mean": 8395.6, "valid_targets_min": 1630 }, { "epoch": 0.3834808259587021, "grad_norm": 0.2498210260731851, "learning_rate": 3.061320754716981e-05, "loss": 0.4488, "loss_nan_ranks": 0, "loss_rank_avg": 0.17535334825515747, "step": 650, "valid_targets_mean": 12708.2, "valid_targets_min": 3373 }, { "epoch": 0.3864306784660767, "grad_norm": 0.21973934537102108, "learning_rate": 3.084905660377359e-05, "loss": 0.4468, "loss_nan_ranks": 0, "loss_rank_avg": 0.14050549268722534, "step": 655, "valid_targets_mean": 11102.9, "valid_targets_min": 2383 }, { "epoch": 0.3893805309734513, "grad_norm": 0.270755988116607, "learning_rate": 3.1084905660377363e-05, "loss": 0.4565, "loss_nan_ranks": 0, "loss_rank_avg": 0.1484229564666748, "step": 660, "valid_targets_mean": 9429.2, "valid_targets_min": 1243 }, { "epoch": 0.39233038348082594, "grad_norm": 0.29290363039429895, "learning_rate": 3.1320754716981136e-05, "loss": 0.4508, "loss_nan_ranks": 0, "loss_rank_avg": 0.17251214385032654, "step": 665, "valid_targets_mean": 12589.8, "valid_targets_min": 1293 }, { "epoch": 0.3952802359882006, "grad_norm": 0.2937360725551836, "learning_rate": 3.155660377358491e-05, "loss": 0.4512, "loss_nan_ranks": 0, "loss_rank_avg": 0.14358994364738464, "step": 670, "valid_targets_mean": 9731.8, "valid_targets_min": 1129 }, { "epoch": 0.39823008849557523, "grad_norm": 0.3156882903522341, "learning_rate": 3.179245283018868e-05, "loss": 0.4506, "loss_nan_ranks": 0, "loss_rank_avg": 0.11705832928419113, "step": 675, "valid_targets_mean": 8218.8, "valid_targets_min": 595 }, { "epoch": 0.40117994100294985, "grad_norm": 0.2562761263862917, "learning_rate": 3.202830188679245e-05, "loss": 0.4566, "loss_nan_ranks": 0, "loss_rank_avg": 0.14067499339580536, "step": 680, "valid_targets_mean": 9081.4, "valid_targets_min": 888 }, { "epoch": 0.40412979351032446, "grad_norm": 0.27166104573986943, "learning_rate": 3.226415094339623e-05, "loss": 0.4478, "loss_nan_ranks": 0, "loss_rank_avg": 0.15120014548301697, "step": 685, "valid_targets_mean": 10127.8, "valid_targets_min": 1547 }, { "epoch": 0.40707964601769914, "grad_norm": 0.25598816634560684, "learning_rate": 3.2500000000000004e-05, "loss": 0.4501, "loss_nan_ranks": 0, "loss_rank_avg": 0.14215946197509766, "step": 690, "valid_targets_mean": 9777.3, "valid_targets_min": 1666 }, { "epoch": 0.41002949852507375, "grad_norm": 0.25719286137409414, "learning_rate": 3.2735849056603776e-05, "loss": 0.4504, "loss_nan_ranks": 0, "loss_rank_avg": 0.13619284331798553, "step": 695, "valid_targets_mean": 8813.1, "valid_targets_min": 2184 }, { "epoch": 0.41297935103244837, "grad_norm": 0.2896922208973931, "learning_rate": 3.297169811320755e-05, "loss": 0.4582, "loss_nan_ranks": 0, "loss_rank_avg": 0.1457536220550537, "step": 700, "valid_targets_mean": 9679.6, "valid_targets_min": 2445 }, { "epoch": 0.415929203539823, "grad_norm": 0.23727416292578302, "learning_rate": 3.320754716981133e-05, "loss": 0.4565, "loss_nan_ranks": 0, "loss_rank_avg": 0.14196723699569702, "step": 705, "valid_targets_mean": 10510.3, "valid_targets_min": 1998 }, { "epoch": 0.41887905604719766, "grad_norm": 0.30186788865389924, "learning_rate": 3.34433962264151e-05, "loss": 0.454, "loss_nan_ranks": 0, "loss_rank_avg": 0.2078678011894226, "step": 710, "valid_targets_mean": 12465.5, "valid_targets_min": 1710 }, { "epoch": 0.4218289085545723, "grad_norm": 0.2708370944564039, "learning_rate": 3.367924528301887e-05, "loss": 0.4493, "loss_nan_ranks": 0, "loss_rank_avg": 0.17721615731716156, "step": 715, "valid_targets_mean": 10231.8, "valid_targets_min": 2259 }, { "epoch": 0.4247787610619469, "grad_norm": 0.2350755624225508, "learning_rate": 3.3915094339622644e-05, "loss": 0.4535, "loss_nan_ranks": 0, "loss_rank_avg": 0.1684504598379135, "step": 720, "valid_targets_mean": 13320.7, "valid_targets_min": 1376 }, { "epoch": 0.4277286135693215, "grad_norm": 0.2522551418925396, "learning_rate": 3.415094339622642e-05, "loss": 0.4443, "loss_nan_ranks": 0, "loss_rank_avg": 0.1219257265329361, "step": 725, "valid_targets_mean": 8426.0, "valid_targets_min": 1654 }, { "epoch": 0.4306784660766962, "grad_norm": 0.2388555987026393, "learning_rate": 3.438679245283019e-05, "loss": 0.4497, "loss_nan_ranks": 0, "loss_rank_avg": 0.13714396953582764, "step": 730, "valid_targets_mean": 8610.3, "valid_targets_min": 2335 }, { "epoch": 0.4336283185840708, "grad_norm": 0.2582456062781972, "learning_rate": 3.462264150943397e-05, "loss": 0.449, "loss_nan_ranks": 0, "loss_rank_avg": 0.14914974570274353, "step": 735, "valid_targets_mean": 9733.9, "valid_targets_min": 2604 }, { "epoch": 0.4365781710914454, "grad_norm": 0.2700913343244362, "learning_rate": 3.485849056603774e-05, "loss": 0.4458, "loss_nan_ranks": 0, "loss_rank_avg": 0.12170357257127762, "step": 740, "valid_targets_mean": 7887.3, "valid_targets_min": 961 }, { "epoch": 0.43952802359882004, "grad_norm": 0.222415816081342, "learning_rate": 3.509433962264151e-05, "loss": 0.4508, "loss_nan_ranks": 0, "loss_rank_avg": 0.17051385343074799, "step": 745, "valid_targets_mean": 12008.4, "valid_targets_min": 3631 }, { "epoch": 0.4424778761061947, "grad_norm": 0.25946960551263726, "learning_rate": 3.5330188679245285e-05, "loss": 0.4559, "loss_nan_ranks": 0, "loss_rank_avg": 0.1592746078968048, "step": 750, "valid_targets_mean": 11155.2, "valid_targets_min": 2731 }, { "epoch": 0.44542772861356933, "grad_norm": 0.25561757233854515, "learning_rate": 3.5566037735849064e-05, "loss": 0.4428, "loss_nan_ranks": 0, "loss_rank_avg": 0.1529407799243927, "step": 755, "valid_targets_mean": 10674.4, "valid_targets_min": 1317 }, { "epoch": 0.44837758112094395, "grad_norm": 0.24513783517340867, "learning_rate": 3.580188679245283e-05, "loss": 0.4481, "loss_nan_ranks": 0, "loss_rank_avg": 0.17502880096435547, "step": 760, "valid_targets_mean": 11136.4, "valid_targets_min": 1890 }, { "epoch": 0.45132743362831856, "grad_norm": 0.28955720780331523, "learning_rate": 3.603773584905661e-05, "loss": 0.4513, "loss_nan_ranks": 0, "loss_rank_avg": 0.18724988400936127, "step": 765, "valid_targets_mean": 12538.8, "valid_targets_min": 1856 }, { "epoch": 0.45427728613569324, "grad_norm": 0.27683507884518554, "learning_rate": 3.627358490566038e-05, "loss": 0.4577, "loss_nan_ranks": 0, "loss_rank_avg": 0.17236828804016113, "step": 770, "valid_targets_mean": 11351.3, "valid_targets_min": 1738 }, { "epoch": 0.45722713864306785, "grad_norm": 0.26370920620085647, "learning_rate": 3.650943396226415e-05, "loss": 0.4472, "loss_nan_ranks": 0, "loss_rank_avg": 0.12365929037332535, "step": 775, "valid_targets_mean": 9638.6, "valid_targets_min": 2769 }, { "epoch": 0.46017699115044247, "grad_norm": 0.2492816067379124, "learning_rate": 3.6745283018867925e-05, "loss": 0.4494, "loss_nan_ranks": 0, "loss_rank_avg": 0.15394821763038635, "step": 780, "valid_targets_mean": 10217.3, "valid_targets_min": 1867 }, { "epoch": 0.4631268436578171, "grad_norm": 0.2662678776277218, "learning_rate": 3.6981132075471704e-05, "loss": 0.4454, "loss_nan_ranks": 0, "loss_rank_avg": 0.1481439769268036, "step": 785, "valid_targets_mean": 10830.1, "valid_targets_min": 2056 }, { "epoch": 0.46607669616519176, "grad_norm": 0.27166721966840673, "learning_rate": 3.721698113207548e-05, "loss": 0.4433, "loss_nan_ranks": 0, "loss_rank_avg": 0.11750192940235138, "step": 790, "valid_targets_mean": 8065.7, "valid_targets_min": 2250 }, { "epoch": 0.4690265486725664, "grad_norm": 0.2802680400873714, "learning_rate": 3.745283018867925e-05, "loss": 0.4492, "loss_nan_ranks": 0, "loss_rank_avg": 0.14400440454483032, "step": 795, "valid_targets_mean": 10655.2, "valid_targets_min": 2555 }, { "epoch": 0.471976401179941, "grad_norm": 0.25574385214080575, "learning_rate": 3.768867924528302e-05, "loss": 0.4452, "loss_nan_ranks": 0, "loss_rank_avg": 0.1591102033853531, "step": 800, "valid_targets_mean": 11071.5, "valid_targets_min": 860 }, { "epoch": 0.4749262536873156, "grad_norm": 0.2337795901319177, "learning_rate": 3.7924528301886794e-05, "loss": 0.4413, "loss_nan_ranks": 0, "loss_rank_avg": 0.1704762876033783, "step": 805, "valid_targets_mean": 11408.9, "valid_targets_min": 2015 }, { "epoch": 0.4778761061946903, "grad_norm": 0.21354425291394666, "learning_rate": 3.8160377358490566e-05, "loss": 0.4471, "loss_nan_ranks": 0, "loss_rank_avg": 0.12261828780174255, "step": 810, "valid_targets_mean": 9568.1, "valid_targets_min": 1913 }, { "epoch": 0.4808259587020649, "grad_norm": 0.27920147232288245, "learning_rate": 3.8396226415094345e-05, "loss": 0.4514, "loss_nan_ranks": 0, "loss_rank_avg": 0.1378454566001892, "step": 815, "valid_targets_mean": 9056.0, "valid_targets_min": 1585 }, { "epoch": 0.4837758112094395, "grad_norm": 0.23954199670564313, "learning_rate": 3.863207547169812e-05, "loss": 0.4453, "loss_nan_ranks": 0, "loss_rank_avg": 0.1725279539823532, "step": 820, "valid_targets_mean": 13044.3, "valid_targets_min": 2160 }, { "epoch": 0.48672566371681414, "grad_norm": 0.27199528594568334, "learning_rate": 3.886792452830189e-05, "loss": 0.449, "loss_nan_ranks": 0, "loss_rank_avg": 0.12170670181512833, "step": 825, "valid_targets_mean": 9486.9, "valid_targets_min": 1543 }, { "epoch": 0.4896755162241888, "grad_norm": 0.24402116494508275, "learning_rate": 3.910377358490566e-05, "loss": 0.4475, "loss_nan_ranks": 0, "loss_rank_avg": 0.12425626814365387, "step": 830, "valid_targets_mean": 9637.9, "valid_targets_min": 1453 }, { "epoch": 0.49262536873156343, "grad_norm": 0.2601853493885366, "learning_rate": 3.933962264150944e-05, "loss": 0.4498, "loss_nan_ranks": 0, "loss_rank_avg": 0.1890874207019806, "step": 835, "valid_targets_mean": 11221.1, "valid_targets_min": 1861 }, { "epoch": 0.49557522123893805, "grad_norm": 0.26759359151306256, "learning_rate": 3.957547169811321e-05, "loss": 0.4493, "loss_nan_ranks": 0, "loss_rank_avg": 0.12343671172857285, "step": 840, "valid_targets_mean": 7896.7, "valid_targets_min": 1601 }, { "epoch": 0.49852507374631266, "grad_norm": 0.27994930659509876, "learning_rate": 3.9811320754716985e-05, "loss": 0.4498, "loss_nan_ranks": 0, "loss_rank_avg": 0.1634995937347412, "step": 845, "valid_targets_mean": 11206.3, "valid_targets_min": 2567 }, { "epoch": 0.5014749262536873, "grad_norm": 0.31281920185152984, "learning_rate": 3.999999830335006e-05, "loss": 0.4382, "loss_nan_ranks": 0, "loss_rank_avg": 0.15493710339069366, "step": 850, "valid_targets_mean": 9940.7, "valid_targets_min": 1487 }, { "epoch": 0.504424778761062, "grad_norm": 0.27455549055935935, "learning_rate": 3.999993892063233e-05, "loss": 0.4466, "loss_nan_ranks": 0, "loss_rank_avg": 0.14785268902778625, "step": 855, "valid_targets_mean": 9426.9, "valid_targets_min": 1920 }, { "epoch": 0.5073746312684366, "grad_norm": 0.2514821993311233, "learning_rate": 3.999979470570539e-05, "loss": 0.4487, "loss_nan_ranks": 0, "loss_rank_avg": 0.12655514478683472, "step": 860, "valid_targets_mean": 7889.9, "valid_targets_min": 1997 }, { "epoch": 0.5103244837758112, "grad_norm": 0.2315638399925816, "learning_rate": 3.999956565918094e-05, "loss": 0.4399, "loss_nan_ranks": 0, "loss_rank_avg": 0.12273876368999481, "step": 865, "valid_targets_mean": 8702.3, "valid_targets_min": 2150 }, { "epoch": 0.5132743362831859, "grad_norm": 0.27177307915070725, "learning_rate": 3.9999251782030515e-05, "loss": 0.4354, "loss_nan_ranks": 0, "loss_rank_avg": 0.17223188281059265, "step": 870, "valid_targets_mean": 11533.9, "valid_targets_min": 1871 }, { "epoch": 0.5162241887905604, "grad_norm": 0.2530159978008084, "learning_rate": 3.999885307558546e-05, "loss": 0.4309, "loss_nan_ranks": 0, "loss_rank_avg": 0.14095968008041382, "step": 875, "valid_targets_mean": 10099.0, "valid_targets_min": 2449 }, { "epoch": 0.5191740412979351, "grad_norm": 0.23419659787170694, "learning_rate": 3.999836954153693e-05, "loss": 0.4375, "loss_nan_ranks": 0, "loss_rank_avg": 0.1631159782409668, "step": 880, "valid_targets_mean": 10613.0, "valid_targets_min": 1767 }, { "epoch": 0.5221238938053098, "grad_norm": 0.2635996187407809, "learning_rate": 3.999780118193591e-05, "loss": 0.4491, "loss_nan_ranks": 0, "loss_rank_avg": 0.14979779720306396, "step": 885, "valid_targets_mean": 9735.8, "valid_targets_min": 1444 }, { "epoch": 0.5250737463126843, "grad_norm": 0.23138056829140724, "learning_rate": 3.999714799919315e-05, "loss": 0.4543, "loss_nan_ranks": 0, "loss_rank_avg": 0.16043859720230103, "step": 890, "valid_targets_mean": 12089.4, "valid_targets_min": 1483 }, { "epoch": 0.528023598820059, "grad_norm": 0.2552416570547656, "learning_rate": 3.9996409996079216e-05, "loss": 0.4479, "loss_nan_ranks": 0, "loss_rank_avg": 0.1546708643436432, "step": 895, "valid_targets_mean": 9522.6, "valid_targets_min": 747 }, { "epoch": 0.5309734513274337, "grad_norm": 0.27707949183780095, "learning_rate": 3.999558717572444e-05, "loss": 0.4341, "loss_nan_ranks": 0, "loss_rank_avg": 0.10108429193496704, "step": 900, "valid_targets_mean": 6589.8, "valid_targets_min": 1001 }, { "epoch": 0.5339233038348082, "grad_norm": 0.30013490391556236, "learning_rate": 3.9994679541618915e-05, "loss": 0.4496, "loss_nan_ranks": 0, "loss_rank_avg": 0.141307532787323, "step": 905, "valid_targets_mean": 8307.7, "valid_targets_min": 1442 }, { "epoch": 0.5368731563421829, "grad_norm": 0.2380696069906505, "learning_rate": 3.999368709761248e-05, "loss": 0.4392, "loss_nan_ranks": 0, "loss_rank_avg": 0.13957419991493225, "step": 910, "valid_targets_mean": 9174.5, "valid_targets_min": 2099 }, { "epoch": 0.5398230088495575, "grad_norm": 0.243047986423948, "learning_rate": 3.999260984791471e-05, "loss": 0.442, "loss_nan_ranks": 0, "loss_rank_avg": 0.15068325400352478, "step": 915, "valid_targets_mean": 9977.2, "valid_targets_min": 1385 }, { "epoch": 0.5427728613569321, "grad_norm": 0.282398462410271, "learning_rate": 3.9991447797094886e-05, "loss": 0.4448, "loss_nan_ranks": 0, "loss_rank_avg": 0.12257401645183563, "step": 920, "valid_targets_mean": 8322.1, "valid_targets_min": 2131 }, { "epoch": 0.5457227138643068, "grad_norm": 0.2803063967663372, "learning_rate": 3.999020095008201e-05, "loss": 0.4486, "loss_nan_ranks": 0, "loss_rank_avg": 0.15170587599277496, "step": 925, "valid_targets_mean": 10406.2, "valid_targets_min": 1407 }, { "epoch": 0.5486725663716814, "grad_norm": 0.21878506602558695, "learning_rate": 3.998886931216471e-05, "loss": 0.4366, "loss_nan_ranks": 0, "loss_rank_avg": 0.167210191488266, "step": 930, "valid_targets_mean": 12493.9, "valid_targets_min": 2457 }, { "epoch": 0.551622418879056, "grad_norm": 0.28765408994466546, "learning_rate": 3.998745288899132e-05, "loss": 0.4335, "loss_nan_ranks": 0, "loss_rank_avg": 0.1283373236656189, "step": 935, "valid_targets_mean": 9960.1, "valid_targets_min": 2052 }, { "epoch": 0.5545722713864307, "grad_norm": 0.2843227805103614, "learning_rate": 3.998595168656975e-05, "loss": 0.4495, "loss_nan_ranks": 0, "loss_rank_avg": 0.12957099080085754, "step": 940, "valid_targets_mean": 8378.8, "valid_targets_min": 1560 }, { "epoch": 0.5575221238938053, "grad_norm": 0.25406467688649903, "learning_rate": 3.998436571126755e-05, "loss": 0.4391, "loss_nan_ranks": 0, "loss_rank_avg": 0.1349082589149475, "step": 945, "valid_targets_mean": 9472.5, "valid_targets_min": 2484 }, { "epoch": 0.56047197640118, "grad_norm": 0.25433445706846386, "learning_rate": 3.9982694969811826e-05, "loss": 0.444, "loss_nan_ranks": 0, "loss_rank_avg": 0.1430283486843109, "step": 950, "valid_targets_mean": 10299.2, "valid_targets_min": 878 }, { "epoch": 0.5634218289085545, "grad_norm": 0.23787392787588774, "learning_rate": 3.9980939469289235e-05, "loss": 0.4427, "loss_nan_ranks": 0, "loss_rank_avg": 0.1557752639055252, "step": 955, "valid_targets_mean": 10887.9, "valid_targets_min": 2125 }, { "epoch": 0.5663716814159292, "grad_norm": 0.2308555142208238, "learning_rate": 3.9979099217145944e-05, "loss": 0.4394, "loss_nan_ranks": 0, "loss_rank_avg": 0.18596434593200684, "step": 960, "valid_targets_mean": 12573.0, "valid_targets_min": 2048 }, { "epoch": 0.5693215339233039, "grad_norm": 0.2658698303261006, "learning_rate": 3.997717422118762e-05, "loss": 0.445, "loss_nan_ranks": 0, "loss_rank_avg": 0.13433973491191864, "step": 965, "valid_targets_mean": 9179.3, "valid_targets_min": 1147 }, { "epoch": 0.5722713864306784, "grad_norm": 0.23518502065874103, "learning_rate": 3.997516448957936e-05, "loss": 0.4322, "loss_nan_ranks": 0, "loss_rank_avg": 0.15136614441871643, "step": 970, "valid_targets_mean": 10706.8, "valid_targets_min": 1593 }, { "epoch": 0.5752212389380531, "grad_norm": 0.26959385406200537, "learning_rate": 3.99730700308457e-05, "loss": 0.4388, "loss_nan_ranks": 0, "loss_rank_avg": 0.14212557673454285, "step": 975, "valid_targets_mean": 9218.1, "valid_targets_min": 2137 }, { "epoch": 0.5781710914454278, "grad_norm": 0.29520369839795346, "learning_rate": 3.997089085387053e-05, "loss": 0.4406, "loss_nan_ranks": 0, "loss_rank_avg": 0.1661655157804489, "step": 980, "valid_targets_mean": 11224.7, "valid_targets_min": 1822 }, { "epoch": 0.5811209439528023, "grad_norm": 0.24272878958124294, "learning_rate": 3.996862696789711e-05, "loss": 0.4386, "loss_nan_ranks": 0, "loss_rank_avg": 0.15572072565555573, "step": 985, "valid_targets_mean": 11156.6, "valid_targets_min": 1606 }, { "epoch": 0.584070796460177, "grad_norm": 0.22014999106432825, "learning_rate": 3.9966278382527984e-05, "loss": 0.4371, "loss_nan_ranks": 0, "loss_rank_avg": 0.16465000808238983, "step": 990, "valid_targets_mean": 10960.1, "valid_targets_min": 1556 }, { "epoch": 0.5870206489675516, "grad_norm": 0.22932156241002566, "learning_rate": 3.9963845107724974e-05, "loss": 0.4417, "loss_nan_ranks": 0, "loss_rank_avg": 0.1330799162387848, "step": 995, "valid_targets_mean": 9461.7, "valid_targets_min": 1929 }, { "epoch": 0.5899705014749262, "grad_norm": 0.25358406476549183, "learning_rate": 3.9961327153809115e-05, "loss": 0.4457, "loss_nan_ranks": 0, "loss_rank_avg": 0.153403177857399, "step": 1000, "valid_targets_mean": 9745.5, "valid_targets_min": 1581 }, { "epoch": 0.5929203539823009, "grad_norm": 0.23111027669299938, "learning_rate": 3.995872453146061e-05, "loss": 0.4334, "loss_nan_ranks": 0, "loss_rank_avg": 0.1502678245306015, "step": 1005, "valid_targets_mean": 10080.6, "valid_targets_min": 2923 }, { "epoch": 0.5958702064896755, "grad_norm": 0.24859400144388313, "learning_rate": 3.9956037251718815e-05, "loss": 0.4316, "loss_nan_ranks": 0, "loss_rank_avg": 0.14000633358955383, "step": 1010, "valid_targets_mean": 8127.2, "valid_targets_min": 1571 }, { "epoch": 0.5988200589970502, "grad_norm": 0.22734263938219632, "learning_rate": 3.9953265325982154e-05, "loss": 0.4433, "loss_nan_ranks": 0, "loss_rank_avg": 0.14217329025268555, "step": 1015, "valid_targets_mean": 10449.8, "valid_targets_min": 1912 }, { "epoch": 0.6017699115044248, "grad_norm": 0.2617934457733421, "learning_rate": 3.9950408766008084e-05, "loss": 0.4408, "loss_nan_ranks": 0, "loss_rank_avg": 0.1299726665019989, "step": 1020, "valid_targets_mean": 8532.2, "valid_targets_min": 1791 }, { "epoch": 0.6047197640117994, "grad_norm": 0.25200466318788883, "learning_rate": 3.994746758391308e-05, "loss": 0.4415, "loss_nan_ranks": 0, "loss_rank_avg": 0.15745247900485992, "step": 1025, "valid_targets_mean": 11387.8, "valid_targets_min": 2003 }, { "epoch": 0.6076696165191741, "grad_norm": 0.2522310486948059, "learning_rate": 3.9944441792172496e-05, "loss": 0.4409, "loss_nan_ranks": 0, "loss_rank_avg": 0.1417302042245865, "step": 1030, "valid_targets_mean": 9229.9, "valid_targets_min": 2522 }, { "epoch": 0.6106194690265486, "grad_norm": 0.24087788923556788, "learning_rate": 3.9941331403620627e-05, "loss": 0.4382, "loss_nan_ranks": 0, "loss_rank_avg": 0.16813431680202484, "step": 1035, "valid_targets_mean": 12198.8, "valid_targets_min": 1675 }, { "epoch": 0.6135693215339233, "grad_norm": 0.26238210737003126, "learning_rate": 3.993813643145055e-05, "loss": 0.4408, "loss_nan_ranks": 0, "loss_rank_avg": 0.14091551303863525, "step": 1040, "valid_targets_mean": 10017.0, "valid_targets_min": 1776 }, { "epoch": 0.616519174041298, "grad_norm": 0.2317100253921235, "learning_rate": 3.9934856889214154e-05, "loss": 0.4373, "loss_nan_ranks": 0, "loss_rank_avg": 0.13581900298595428, "step": 1045, "valid_targets_mean": 10342.0, "valid_targets_min": 1961 }, { "epoch": 0.6194690265486725, "grad_norm": 0.21932495712560107, "learning_rate": 3.993149279082201e-05, "loss": 0.4399, "loss_nan_ranks": 0, "loss_rank_avg": 0.14504750072956085, "step": 1050, "valid_targets_mean": 9962.6, "valid_targets_min": 2405 }, { "epoch": 0.6224188790560472, "grad_norm": 0.23356570302226454, "learning_rate": 3.9928044150543364e-05, "loss": 0.4387, "loss_nan_ranks": 0, "loss_rank_avg": 0.12058188766241074, "step": 1055, "valid_targets_mean": 8304.7, "valid_targets_min": 1978 }, { "epoch": 0.6253687315634219, "grad_norm": 0.24065917712232185, "learning_rate": 3.992451098300604e-05, "loss": 0.436, "loss_nan_ranks": 0, "loss_rank_avg": 0.15964940190315247, "step": 1060, "valid_targets_mean": 12342.4, "valid_targets_min": 2187 }, { "epoch": 0.6283185840707964, "grad_norm": 0.21529728843415769, "learning_rate": 3.9920893303196406e-05, "loss": 0.4381, "loss_nan_ranks": 0, "loss_rank_avg": 0.1437956839799881, "step": 1065, "valid_targets_mean": 9165.0, "valid_targets_min": 832 }, { "epoch": 0.6312684365781711, "grad_norm": 0.22294702084259344, "learning_rate": 3.99171911264593e-05, "loss": 0.4389, "loss_nan_ranks": 0, "loss_rank_avg": 0.1432226449251175, "step": 1070, "valid_targets_mean": 10573.9, "valid_targets_min": 2386 }, { "epoch": 0.6342182890855457, "grad_norm": 0.2488004867962405, "learning_rate": 3.991340446849797e-05, "loss": 0.4451, "loss_nan_ranks": 0, "loss_rank_avg": 0.11577347666025162, "step": 1075, "valid_targets_mean": 8261.4, "valid_targets_min": 1439 }, { "epoch": 0.6371681415929203, "grad_norm": 0.31671954979395994, "learning_rate": 3.990953334537398e-05, "loss": 0.448, "loss_nan_ranks": 0, "loss_rank_avg": 0.15443119406700134, "step": 1080, "valid_targets_mean": 9847.7, "valid_targets_min": 1767 }, { "epoch": 0.640117994100295, "grad_norm": 0.25680278491945663, "learning_rate": 3.9905577773507184e-05, "loss": 0.4368, "loss_nan_ranks": 0, "loss_rank_avg": 0.16935217380523682, "step": 1085, "valid_targets_mean": 13030.2, "valid_targets_min": 2483 }, { "epoch": 0.6430678466076696, "grad_norm": 0.239359194829167, "learning_rate": 3.990153776967562e-05, "loss": 0.4355, "loss_nan_ranks": 0, "loss_rank_avg": 0.13085396587848663, "step": 1090, "valid_targets_mean": 9731.1, "valid_targets_min": 1703 }, { "epoch": 0.6460176991150443, "grad_norm": 0.22373425243288575, "learning_rate": 3.989741335101547e-05, "loss": 0.4346, "loss_nan_ranks": 0, "loss_rank_avg": 0.14850249886512756, "step": 1095, "valid_targets_mean": 10780.1, "valid_targets_min": 1649 }, { "epoch": 0.6489675516224189, "grad_norm": 0.2433722186409111, "learning_rate": 3.989320453502096e-05, "loss": 0.4436, "loss_nan_ranks": 0, "loss_rank_avg": 0.15189602971076965, "step": 1100, "valid_targets_mean": 10743.4, "valid_targets_min": 1801 }, { "epoch": 0.6519174041297935, "grad_norm": 0.3323864666353114, "learning_rate": 3.988891133954431e-05, "loss": 0.4436, "loss_nan_ranks": 0, "loss_rank_avg": 0.11629551649093628, "step": 1105, "valid_targets_mean": 9102.6, "valid_targets_min": 1830 }, { "epoch": 0.6548672566371682, "grad_norm": 0.22889042461049347, "learning_rate": 3.988453378279563e-05, "loss": 0.4333, "loss_nan_ranks": 0, "loss_rank_avg": 0.12611937522888184, "step": 1110, "valid_targets_mean": 9400.9, "valid_targets_min": 1853 }, { "epoch": 0.6578171091445427, "grad_norm": 0.2543271499306638, "learning_rate": 3.9880071883342877e-05, "loss": 0.4267, "loss_nan_ranks": 0, "loss_rank_avg": 0.1420837789773941, "step": 1115, "valid_targets_mean": 10114.0, "valid_targets_min": 2144 }, { "epoch": 0.6607669616519174, "grad_norm": 0.22975752551359416, "learning_rate": 3.9875525660111746e-05, "loss": 0.425, "loss_nan_ranks": 0, "loss_rank_avg": 0.14416566491127014, "step": 1120, "valid_targets_mean": 9553.2, "valid_targets_min": 2181 }, { "epoch": 0.6637168141592921, "grad_norm": 0.25343521443481465, "learning_rate": 3.987089513238559e-05, "loss": 0.4391, "loss_nan_ranks": 0, "loss_rank_avg": 0.15074048936367035, "step": 1125, "valid_targets_mean": 9748.7, "valid_targets_min": 856 }, { "epoch": 0.6666666666666666, "grad_norm": 0.22582108402324896, "learning_rate": 3.986618031980537e-05, "loss": 0.4384, "loss_nan_ranks": 0, "loss_rank_avg": 0.1590452492237091, "step": 1130, "valid_targets_mean": 12207.3, "valid_targets_min": 2941 }, { "epoch": 0.6696165191740413, "grad_norm": 0.25138835363280104, "learning_rate": 3.9861381242369566e-05, "loss": 0.4352, "loss_nan_ranks": 0, "loss_rank_avg": 0.1295248568058014, "step": 1135, "valid_targets_mean": 9607.7, "valid_targets_min": 1480 }, { "epoch": 0.672566371681416, "grad_norm": 0.21744109580566193, "learning_rate": 3.985649792043403e-05, "loss": 0.4445, "loss_nan_ranks": 0, "loss_rank_avg": 0.13683268427848816, "step": 1140, "valid_targets_mean": 10516.6, "valid_targets_min": 1750 }, { "epoch": 0.6755162241887905, "grad_norm": 0.24750482724598766, "learning_rate": 3.9851530374711985e-05, "loss": 0.4365, "loss_nan_ranks": 0, "loss_rank_avg": 0.12796282768249512, "step": 1145, "valid_targets_mean": 9166.2, "valid_targets_min": 2342 }, { "epoch": 0.6784660766961652, "grad_norm": 0.27006974732922817, "learning_rate": 3.984647862627389e-05, "loss": 0.4368, "loss_nan_ranks": 0, "loss_rank_avg": 0.16928240656852722, "step": 1150, "valid_targets_mean": 10198.2, "valid_targets_min": 1888 }, { "epoch": 0.6814159292035398, "grad_norm": 0.22988670089720328, "learning_rate": 3.984134269654736e-05, "loss": 0.4373, "loss_nan_ranks": 0, "loss_rank_avg": 0.14798274636268616, "step": 1155, "valid_targets_mean": 9976.0, "valid_targets_min": 1591 }, { "epoch": 0.6843657817109144, "grad_norm": 0.23566250791004936, "learning_rate": 3.9836122607317083e-05, "loss": 0.4349, "loss_nan_ranks": 0, "loss_rank_avg": 0.13107168674468994, "step": 1160, "valid_targets_mean": 8667.3, "valid_targets_min": 1636 }, { "epoch": 0.6873156342182891, "grad_norm": 0.22239697943516684, "learning_rate": 3.983081838072469e-05, "loss": 0.4378, "loss_nan_ranks": 0, "loss_rank_avg": 0.1745031625032425, "step": 1165, "valid_targets_mean": 11671.9, "valid_targets_min": 1372 }, { "epoch": 0.6902654867256637, "grad_norm": 0.22586990007122548, "learning_rate": 3.9825430039268734e-05, "loss": 0.4379, "loss_nan_ranks": 0, "loss_rank_avg": 0.12756019830703735, "step": 1170, "valid_targets_mean": 8705.5, "valid_targets_min": 788 }, { "epoch": 0.6932153392330384, "grad_norm": 0.22261089505162365, "learning_rate": 3.9819957605804514e-05, "loss": 0.4395, "loss_nan_ranks": 0, "loss_rank_avg": 0.14750631153583527, "step": 1175, "valid_targets_mean": 10789.9, "valid_targets_min": 1629 }, { "epoch": 0.696165191740413, "grad_norm": 0.22306615194696608, "learning_rate": 3.9814401103544044e-05, "loss": 0.4432, "loss_nan_ranks": 0, "loss_rank_avg": 0.13897669315338135, "step": 1180, "valid_targets_mean": 9820.9, "valid_targets_min": 2079 }, { "epoch": 0.6991150442477876, "grad_norm": 0.22317738628263822, "learning_rate": 3.980876055605591e-05, "loss": 0.4338, "loss_nan_ranks": 0, "loss_rank_avg": 0.1291494220495224, "step": 1185, "valid_targets_mean": 9519.0, "valid_targets_min": 1443 }, { "epoch": 0.7020648967551623, "grad_norm": 0.2256263144128267, "learning_rate": 3.980303598726519e-05, "loss": 0.4334, "loss_nan_ranks": 0, "loss_rank_avg": 0.14101535081863403, "step": 1190, "valid_targets_mean": 11148.6, "valid_targets_min": 2844 }, { "epoch": 0.7050147492625368, "grad_norm": 0.21397313621788763, "learning_rate": 3.9797227421453345e-05, "loss": 0.4385, "loss_nan_ranks": 0, "loss_rank_avg": 0.17973126471042633, "step": 1195, "valid_targets_mean": 11772.3, "valid_targets_min": 2041 }, { "epoch": 0.7079646017699115, "grad_norm": 0.19691259367572003, "learning_rate": 3.9791334883258133e-05, "loss": 0.4338, "loss_nan_ranks": 0, "loss_rank_avg": 0.13496637344360352, "step": 1200, "valid_targets_mean": 9464.2, "valid_targets_min": 2006 }, { "epoch": 0.7109144542772862, "grad_norm": 0.21329831639659594, "learning_rate": 3.978535839767346e-05, "loss": 0.4389, "loss_nan_ranks": 0, "loss_rank_avg": 0.12946803867816925, "step": 1205, "valid_targets_mean": 10115.8, "valid_targets_min": 2033 }, { "epoch": 0.7138643067846607, "grad_norm": 0.2154057849716186, "learning_rate": 3.977929799004937e-05, "loss": 0.4281, "loss_nan_ranks": 0, "loss_rank_avg": 0.11410190910100937, "step": 1210, "valid_targets_mean": 8914.2, "valid_targets_min": 1829 }, { "epoch": 0.7168141592920354, "grad_norm": 0.2271674738481832, "learning_rate": 3.977315368609179e-05, "loss": 0.4307, "loss_nan_ranks": 0, "loss_rank_avg": 0.16380158066749573, "step": 1215, "valid_targets_mean": 11594.1, "valid_targets_min": 1466 }, { "epoch": 0.7197640117994101, "grad_norm": 0.2386454065940037, "learning_rate": 3.9766925511862554e-05, "loss": 0.4295, "loss_nan_ranks": 0, "loss_rank_avg": 0.14458134770393372, "step": 1220, "valid_targets_mean": 10735.3, "valid_targets_min": 1786 }, { "epoch": 0.7227138643067846, "grad_norm": 0.2255030881058441, "learning_rate": 3.976061349377924e-05, "loss": 0.4309, "loss_nan_ranks": 0, "loss_rank_avg": 0.14954999089241028, "step": 1225, "valid_targets_mean": 11454.9, "valid_targets_min": 2305 }, { "epoch": 0.7256637168141593, "grad_norm": 0.2481445013421651, "learning_rate": 3.975421765861505e-05, "loss": 0.4384, "loss_nan_ranks": 0, "loss_rank_avg": 0.12814843654632568, "step": 1230, "valid_targets_mean": 9119.2, "valid_targets_min": 933 }, { "epoch": 0.7286135693215339, "grad_norm": 0.21781116099994088, "learning_rate": 3.974773803349869e-05, "loss": 0.4383, "loss_nan_ranks": 0, "loss_rank_avg": 0.1225578561425209, "step": 1235, "valid_targets_mean": 9410.8, "valid_targets_min": 1837 }, { "epoch": 0.7315634218289085, "grad_norm": 0.21342911241238924, "learning_rate": 3.974117464591432e-05, "loss": 0.4315, "loss_nan_ranks": 0, "loss_rank_avg": 0.12645339965820312, "step": 1240, "valid_targets_mean": 9461.3, "valid_targets_min": 1841 }, { "epoch": 0.7345132743362832, "grad_norm": 0.20513947169642738, "learning_rate": 3.973452752370134e-05, "loss": 0.4364, "loss_nan_ranks": 0, "loss_rank_avg": 0.1715991497039795, "step": 1245, "valid_targets_mean": 12400.2, "valid_targets_min": 2042 }, { "epoch": 0.7374631268436578, "grad_norm": 0.21563879416279083, "learning_rate": 3.972779669505434e-05, "loss": 0.4352, "loss_nan_ranks": 0, "loss_rank_avg": 0.1682026982307434, "step": 1250, "valid_targets_mean": 12530.3, "valid_targets_min": 2926 }, { "epoch": 0.7404129793510325, "grad_norm": 0.23091666313240913, "learning_rate": 3.972098218852296e-05, "loss": 0.4352, "loss_nan_ranks": 0, "loss_rank_avg": 0.1543908715248108, "step": 1255, "valid_targets_mean": 10509.6, "valid_targets_min": 649 }, { "epoch": 0.7433628318584071, "grad_norm": 0.22856855769072065, "learning_rate": 3.971408403301178e-05, "loss": 0.4309, "loss_nan_ranks": 0, "loss_rank_avg": 0.14025411009788513, "step": 1260, "valid_targets_mean": 9454.0, "valid_targets_min": 2003 }, { "epoch": 0.7463126843657817, "grad_norm": 0.2335912261958896, "learning_rate": 3.970710225778016e-05, "loss": 0.4349, "loss_nan_ranks": 0, "loss_rank_avg": 0.1344713419675827, "step": 1265, "valid_targets_mean": 9103.6, "valid_targets_min": 1608 }, { "epoch": 0.7492625368731564, "grad_norm": 0.22079369010684347, "learning_rate": 3.9700036892442175e-05, "loss": 0.4317, "loss_nan_ranks": 0, "loss_rank_avg": 0.13677185773849487, "step": 1270, "valid_targets_mean": 9436.6, "valid_targets_min": 2137 }, { "epoch": 0.7522123893805309, "grad_norm": 0.1971068177734515, "learning_rate": 3.969288796696645e-05, "loss": 0.4289, "loss_nan_ranks": 0, "loss_rank_avg": 0.13685756921768188, "step": 1275, "valid_targets_mean": 9747.0, "valid_targets_min": 1135 }, { "epoch": 0.7551622418879056, "grad_norm": 0.2347117554337764, "learning_rate": 3.968565551167602e-05, "loss": 0.4354, "loss_nan_ranks": 0, "loss_rank_avg": 0.15099859237670898, "step": 1280, "valid_targets_mean": 10079.6, "valid_targets_min": 2286 }, { "epoch": 0.7581120943952803, "grad_norm": 0.2272814602284412, "learning_rate": 3.967833955724824e-05, "loss": 0.4424, "loss_nan_ranks": 0, "loss_rank_avg": 0.15157118439674377, "step": 1285, "valid_targets_mean": 10582.6, "valid_targets_min": 1657 }, { "epoch": 0.7610619469026548, "grad_norm": 0.24637729164796876, "learning_rate": 3.967094013471464e-05, "loss": 0.4391, "loss_nan_ranks": 0, "loss_rank_avg": 0.1336841583251953, "step": 1290, "valid_targets_mean": 8869.7, "valid_targets_min": 1883 }, { "epoch": 0.7640117994100295, "grad_norm": 0.22473990553847215, "learning_rate": 3.966345727546078e-05, "loss": 0.4251, "loss_nan_ranks": 0, "loss_rank_avg": 0.1474177986383438, "step": 1295, "valid_targets_mean": 10999.8, "valid_targets_min": 1608 }, { "epoch": 0.7669616519174042, "grad_norm": 0.2266397688976117, "learning_rate": 3.965589101122613e-05, "loss": 0.4335, "loss_nan_ranks": 0, "loss_rank_avg": 0.14274467527866364, "step": 1300, "valid_targets_mean": 10845.2, "valid_targets_min": 1769 }, { "epoch": 0.7699115044247787, "grad_norm": 0.23903918230849802, "learning_rate": 3.9648241374103936e-05, "loss": 0.4318, "loss_nan_ranks": 0, "loss_rank_avg": 0.15274375677108765, "step": 1305, "valid_targets_mean": 11583.4, "valid_targets_min": 2726 }, { "epoch": 0.7728613569321534, "grad_norm": 0.22667591691034675, "learning_rate": 3.964050839654107e-05, "loss": 0.4276, "loss_nan_ranks": 0, "loss_rank_avg": 0.12878428399562836, "step": 1310, "valid_targets_mean": 9023.2, "valid_targets_min": 1719 }, { "epoch": 0.775811209439528, "grad_norm": 0.20118498187763423, "learning_rate": 3.963269211133792e-05, "loss": 0.4314, "loss_nan_ranks": 0, "loss_rank_avg": 0.16713985800743103, "step": 1315, "valid_targets_mean": 11621.1, "valid_targets_min": 1627 }, { "epoch": 0.7787610619469026, "grad_norm": 0.23317769615200384, "learning_rate": 3.962479255164823e-05, "loss": 0.4285, "loss_nan_ranks": 0, "loss_rank_avg": 0.17432451248168945, "step": 1320, "valid_targets_mean": 10227.8, "valid_targets_min": 2542 }, { "epoch": 0.7817109144542773, "grad_norm": 0.20839049675195365, "learning_rate": 3.961680975097894e-05, "loss": 0.424, "loss_nan_ranks": 0, "loss_rank_avg": 0.13311053812503815, "step": 1325, "valid_targets_mean": 8847.1, "valid_targets_min": 2962 }, { "epoch": 0.7846607669616519, "grad_norm": 0.22533441508609903, "learning_rate": 3.960874374319009e-05, "loss": 0.4339, "loss_nan_ranks": 0, "loss_rank_avg": 0.1515326201915741, "step": 1330, "valid_targets_mean": 11824.5, "valid_targets_min": 2336 }, { "epoch": 0.7876106194690266, "grad_norm": 0.21681982017955925, "learning_rate": 3.960059456249466e-05, "loss": 0.4365, "loss_nan_ranks": 0, "loss_rank_avg": 0.17768153548240662, "step": 1335, "valid_targets_mean": 13422.8, "valid_targets_min": 2469 }, { "epoch": 0.7905604719764012, "grad_norm": 0.21506616827856356, "learning_rate": 3.95923622434584e-05, "loss": 0.4332, "loss_nan_ranks": 0, "loss_rank_avg": 0.1056060940027237, "step": 1340, "valid_targets_mean": 8039.5, "valid_targets_min": 1011 }, { "epoch": 0.7935103244837758, "grad_norm": 0.2092664738221549, "learning_rate": 3.958404682099969e-05, "loss": 0.431, "loss_nan_ranks": 0, "loss_rank_avg": 0.11958029121160507, "step": 1345, "valid_targets_mean": 8162.9, "valid_targets_min": 1768 }, { "epoch": 0.7964601769911505, "grad_norm": 0.21447497725002448, "learning_rate": 3.957564833038944e-05, "loss": 0.431, "loss_nan_ranks": 0, "loss_rank_avg": 0.15218974649906158, "step": 1350, "valid_targets_mean": 9680.6, "valid_targets_min": 1517 }, { "epoch": 0.799410029498525, "grad_norm": 0.22430754653919985, "learning_rate": 3.9567166807250876e-05, "loss": 0.4311, "loss_nan_ranks": 0, "loss_rank_avg": 0.14632052183151245, "step": 1355, "valid_targets_mean": 10204.0, "valid_targets_min": 1856 }, { "epoch": 0.8023598820058997, "grad_norm": 0.20821866979698975, "learning_rate": 3.9558602287559435e-05, "loss": 0.4291, "loss_nan_ranks": 0, "loss_rank_avg": 0.16714532673358917, "step": 1360, "valid_targets_mean": 11088.9, "valid_targets_min": 3033 }, { "epoch": 0.8053097345132744, "grad_norm": 0.21842361789585152, "learning_rate": 3.954995480764257e-05, "loss": 0.4364, "loss_nan_ranks": 0, "loss_rank_avg": 0.12598569691181183, "step": 1365, "valid_targets_mean": 8808.9, "valid_targets_min": 1628 }, { "epoch": 0.8082595870206489, "grad_norm": 0.2452191859994776, "learning_rate": 3.9541224404179646e-05, "loss": 0.4296, "loss_nan_ranks": 0, "loss_rank_avg": 0.15447130799293518, "step": 1370, "valid_targets_mean": 10004.9, "valid_targets_min": 2090 }, { "epoch": 0.8112094395280236, "grad_norm": 0.21351961088739702, "learning_rate": 3.953241111420174e-05, "loss": 0.4325, "loss_nan_ranks": 0, "loss_rank_avg": 0.15034262835979462, "step": 1375, "valid_targets_mean": 11585.9, "valid_targets_min": 1578 }, { "epoch": 0.8141592920353983, "grad_norm": 0.2438372245243314, "learning_rate": 3.952351497509151e-05, "loss": 0.4281, "loss_nan_ranks": 0, "loss_rank_avg": 0.1585340052843094, "step": 1380, "valid_targets_mean": 10658.7, "valid_targets_min": 1712 }, { "epoch": 0.8171091445427728, "grad_norm": 0.2286487537231045, "learning_rate": 3.9514536024583025e-05, "loss": 0.4286, "loss_nan_ranks": 0, "loss_rank_avg": 0.16236230731010437, "step": 1385, "valid_targets_mean": 11714.4, "valid_targets_min": 2874 }, { "epoch": 0.8200589970501475, "grad_norm": 0.22767053921731062, "learning_rate": 3.950547430076162e-05, "loss": 0.4258, "loss_nan_ranks": 0, "loss_rank_avg": 0.12050891667604446, "step": 1390, "valid_targets_mean": 9205.3, "valid_targets_min": 2733 }, { "epoch": 0.8230088495575221, "grad_norm": 0.21243248388698746, "learning_rate": 3.949632984206371e-05, "loss": 0.4213, "loss_nan_ranks": 0, "loss_rank_avg": 0.11950334906578064, "step": 1395, "valid_targets_mean": 8837.8, "valid_targets_min": 2032 }, { "epoch": 0.8259587020648967, "grad_norm": 0.19404822707082142, "learning_rate": 3.948710268727665e-05, "loss": 0.4254, "loss_nan_ranks": 0, "loss_rank_avg": 0.13935215771198273, "step": 1400, "valid_targets_mean": 10313.7, "valid_targets_min": 2037 }, { "epoch": 0.8289085545722714, "grad_norm": 0.20795543066174288, "learning_rate": 3.947779287553855e-05, "loss": 0.4326, "loss_nan_ranks": 0, "loss_rank_avg": 0.11591978371143341, "step": 1405, "valid_targets_mean": 8079.2, "valid_targets_min": 1799 }, { "epoch": 0.831858407079646, "grad_norm": 0.22220292602112293, "learning_rate": 3.946840044633812e-05, "loss": 0.422, "loss_nan_ranks": 0, "loss_rank_avg": 0.17623038589954376, "step": 1410, "valid_targets_mean": 11687.4, "valid_targets_min": 1660 }, { "epoch": 0.8348082595870207, "grad_norm": 0.22466394230939674, "learning_rate": 3.945892543951452e-05, "loss": 0.4348, "loss_nan_ranks": 0, "loss_rank_avg": 0.13592171669006348, "step": 1415, "valid_targets_mean": 9689.1, "valid_targets_min": 1213 }, { "epoch": 0.8377581120943953, "grad_norm": 0.2254962724331218, "learning_rate": 3.9449367895257154e-05, "loss": 0.4298, "loss_nan_ranks": 0, "loss_rank_avg": 0.1883118897676468, "step": 1420, "valid_targets_mean": 13727.9, "valid_targets_min": 2019 }, { "epoch": 0.8407079646017699, "grad_norm": 0.21194725404217385, "learning_rate": 3.9439727854105525e-05, "loss": 0.4296, "loss_nan_ranks": 0, "loss_rank_avg": 0.12037979066371918, "step": 1425, "valid_targets_mean": 8408.8, "valid_targets_min": 1770 }, { "epoch": 0.8436578171091446, "grad_norm": 0.2340701396614431, "learning_rate": 3.943000535694906e-05, "loss": 0.434, "loss_nan_ranks": 0, "loss_rank_avg": 0.15494517982006073, "step": 1430, "valid_targets_mean": 10496.0, "valid_targets_min": 1924 }, { "epoch": 0.8466076696165191, "grad_norm": 0.19806546741399747, "learning_rate": 3.9420200445026935e-05, "loss": 0.4274, "loss_nan_ranks": 0, "loss_rank_avg": 0.13141945004463196, "step": 1435, "valid_targets_mean": 9131.2, "valid_targets_min": 2712 }, { "epoch": 0.8495575221238938, "grad_norm": 0.21286070590728243, "learning_rate": 3.9410313159927884e-05, "loss": 0.4291, "loss_nan_ranks": 0, "loss_rank_avg": 0.14135153591632843, "step": 1440, "valid_targets_mean": 8391.5, "valid_targets_min": 1896 }, { "epoch": 0.8525073746312685, "grad_norm": 0.21373668014960542, "learning_rate": 3.9400343543590055e-05, "loss": 0.4216, "loss_nan_ranks": 0, "loss_rank_avg": 0.1340659260749817, "step": 1445, "valid_targets_mean": 9973.9, "valid_targets_min": 1874 }, { "epoch": 0.855457227138643, "grad_norm": 0.19867038831411135, "learning_rate": 3.9390291638300803e-05, "loss": 0.4268, "loss_nan_ranks": 0, "loss_rank_avg": 0.15295977890491486, "step": 1450, "valid_targets_mean": 11387.2, "valid_targets_min": 2079 }, { "epoch": 0.8584070796460177, "grad_norm": 0.2071025265272414, "learning_rate": 3.938015748669652e-05, "loss": 0.4267, "loss_nan_ranks": 0, "loss_rank_avg": 0.1454063355922699, "step": 1455, "valid_targets_mean": 9381.8, "valid_targets_min": 1708 }, { "epoch": 0.8613569321533924, "grad_norm": 0.21597614110893262, "learning_rate": 3.936994113176247e-05, "loss": 0.4331, "loss_nan_ranks": 0, "loss_rank_avg": 0.13651731610298157, "step": 1460, "valid_targets_mean": 8509.3, "valid_targets_min": 1118 }, { "epoch": 0.8643067846607669, "grad_norm": 0.2168658534884769, "learning_rate": 3.935964261683258e-05, "loss": 0.4328, "loss_nan_ranks": 0, "loss_rank_avg": 0.14359349012374878, "step": 1465, "valid_targets_mean": 10374.7, "valid_targets_min": 2011 }, { "epoch": 0.8672566371681416, "grad_norm": 0.20858730892961191, "learning_rate": 3.934926198558926e-05, "loss": 0.4302, "loss_nan_ranks": 0, "loss_rank_avg": 0.17608967423439026, "step": 1470, "valid_targets_mean": 12519.0, "valid_targets_min": 1887 }, { "epoch": 0.8702064896755162, "grad_norm": 0.2006306585200802, "learning_rate": 3.933879928206325e-05, "loss": 0.4244, "loss_nan_ranks": 0, "loss_rank_avg": 0.1375437080860138, "step": 1475, "valid_targets_mean": 9916.1, "valid_targets_min": 1793 }, { "epoch": 0.8731563421828908, "grad_norm": 0.2205586415746746, "learning_rate": 3.9328254550633413e-05, "loss": 0.4354, "loss_nan_ranks": 0, "loss_rank_avg": 0.15739303827285767, "step": 1480, "valid_targets_mean": 10340.9, "valid_targets_min": 1125 }, { "epoch": 0.8761061946902655, "grad_norm": 0.19812340046811802, "learning_rate": 3.9317627836026505e-05, "loss": 0.427, "loss_nan_ranks": 0, "loss_rank_avg": 0.1516011655330658, "step": 1485, "valid_targets_mean": 9584.5, "valid_targets_min": 2028 }, { "epoch": 0.8790560471976401, "grad_norm": 0.21139493708043888, "learning_rate": 3.930691918331706e-05, "loss": 0.4345, "loss_nan_ranks": 0, "loss_rank_avg": 0.16548380255699158, "step": 1490, "valid_targets_mean": 11590.9, "valid_targets_min": 2261 }, { "epoch": 0.8820058997050148, "grad_norm": 0.21329975804889742, "learning_rate": 3.929612863792713e-05, "loss": 0.4285, "loss_nan_ranks": 0, "loss_rank_avg": 0.15393435955047607, "step": 1495, "valid_targets_mean": 11354.4, "valid_targets_min": 1773 }, { "epoch": 0.8849557522123894, "grad_norm": 0.2541979721275341, "learning_rate": 3.928525624562617e-05, "loss": 0.4301, "loss_nan_ranks": 0, "loss_rank_avg": 0.13612164556980133, "step": 1500, "valid_targets_mean": 9635.8, "valid_targets_min": 2187 }, { "epoch": 0.887905604719764, "grad_norm": 0.22539564954558305, "learning_rate": 3.927430205253077e-05, "loss": 0.4229, "loss_nan_ranks": 0, "loss_rank_avg": 0.14678379893302917, "step": 1505, "valid_targets_mean": 10532.5, "valid_targets_min": 1940 }, { "epoch": 0.8908554572271387, "grad_norm": 0.20356625113991283, "learning_rate": 3.9263266105104484e-05, "loss": 0.4278, "loss_nan_ranks": 0, "loss_rank_avg": 0.15266424417495728, "step": 1510, "valid_targets_mean": 11384.6, "valid_targets_min": 2096 }, { "epoch": 0.8938053097345132, "grad_norm": 0.21042754257939417, "learning_rate": 3.9252148450157646e-05, "loss": 0.4244, "loss_nan_ranks": 0, "loss_rank_avg": 0.14113900065422058, "step": 1515, "valid_targets_mean": 10272.5, "valid_targets_min": 2815 }, { "epoch": 0.8967551622418879, "grad_norm": 0.19598960033237253, "learning_rate": 3.9240949134847164e-05, "loss": 0.4312, "loss_nan_ranks": 0, "loss_rank_avg": 0.16119873523712158, "step": 1520, "valid_targets_mean": 11145.4, "valid_targets_min": 818 }, { "epoch": 0.8997050147492626, "grad_norm": 0.19245802334587098, "learning_rate": 3.922966820667632e-05, "loss": 0.4242, "loss_nan_ranks": 0, "loss_rank_avg": 0.1274881511926651, "step": 1525, "valid_targets_mean": 9275.6, "valid_targets_min": 1757 }, { "epoch": 0.9026548672566371, "grad_norm": 0.20722152151745302, "learning_rate": 3.921830571349455e-05, "loss": 0.4275, "loss_nan_ranks": 0, "loss_rank_avg": 0.15170887112617493, "step": 1530, "valid_targets_mean": 10562.0, "valid_targets_min": 1778 }, { "epoch": 0.9056047197640118, "grad_norm": 0.2211212721089106, "learning_rate": 3.920686170349728e-05, "loss": 0.425, "loss_nan_ranks": 0, "loss_rank_avg": 0.14120131731033325, "step": 1535, "valid_targets_mean": 9969.5, "valid_targets_min": 1957 }, { "epoch": 0.9085545722713865, "grad_norm": 0.22615337216600126, "learning_rate": 3.9195336225225694e-05, "loss": 0.427, "loss_nan_ranks": 0, "loss_rank_avg": 0.15712234377861023, "step": 1540, "valid_targets_mean": 10153.2, "valid_targets_min": 2191 }, { "epoch": 0.911504424778761, "grad_norm": 0.20841743928677547, "learning_rate": 3.918372932756652e-05, "loss": 0.4335, "loss_nan_ranks": 0, "loss_rank_avg": 0.11234050989151001, "step": 1545, "valid_targets_mean": 8849.2, "valid_targets_min": 324 }, { "epoch": 0.9144542772861357, "grad_norm": 0.24202127593053716, "learning_rate": 3.917204105975186e-05, "loss": 0.4258, "loss_nan_ranks": 0, "loss_rank_avg": 0.15047121047973633, "step": 1550, "valid_targets_mean": 10924.6, "valid_targets_min": 2710 }, { "epoch": 0.9174041297935103, "grad_norm": 0.19857249098394833, "learning_rate": 3.916027147135894e-05, "loss": 0.4289, "loss_nan_ranks": 0, "loss_rank_avg": 0.15521690249443054, "step": 1555, "valid_targets_mean": 11752.3, "valid_targets_min": 1969 }, { "epoch": 0.9203539823008849, "grad_norm": 0.21436174937187652, "learning_rate": 3.9148420612309907e-05, "loss": 0.429, "loss_nan_ranks": 0, "loss_rank_avg": 0.16796237230300903, "step": 1560, "valid_targets_mean": 12698.6, "valid_targets_min": 2768 }, { "epoch": 0.9233038348082596, "grad_norm": 0.21760621553388323, "learning_rate": 3.913648853287167e-05, "loss": 0.4293, "loss_nan_ranks": 0, "loss_rank_avg": 0.13657817244529724, "step": 1565, "valid_targets_mean": 10104.6, "valid_targets_min": 1652 }, { "epoch": 0.9262536873156342, "grad_norm": 0.19337765257103107, "learning_rate": 3.912447528365559e-05, "loss": 0.431, "loss_nan_ranks": 0, "loss_rank_avg": 0.14748969674110413, "step": 1570, "valid_targets_mean": 11014.7, "valid_targets_min": 1872 }, { "epoch": 0.9292035398230089, "grad_norm": 0.22146689942592468, "learning_rate": 3.911238091561736e-05, "loss": 0.4246, "loss_nan_ranks": 0, "loss_rank_avg": 0.1421777307987213, "step": 1575, "valid_targets_mean": 10039.7, "valid_targets_min": 2777 }, { "epoch": 0.9321533923303835, "grad_norm": 0.20189886878274899, "learning_rate": 3.910020548005673e-05, "loss": 0.4319, "loss_nan_ranks": 0, "loss_rank_avg": 0.1599784791469574, "step": 1580, "valid_targets_mean": 11453.5, "valid_targets_min": 1275 }, { "epoch": 0.9351032448377581, "grad_norm": 0.2045400723388353, "learning_rate": 3.908794902861733e-05, "loss": 0.4336, "loss_nan_ranks": 0, "loss_rank_avg": 0.12890928983688354, "step": 1585, "valid_targets_mean": 8932.7, "valid_targets_min": 1791 }, { "epoch": 0.9380530973451328, "grad_norm": 0.1989335490497034, "learning_rate": 3.9075611613286385e-05, "loss": 0.4193, "loss_nan_ranks": 0, "loss_rank_avg": 0.14698082208633423, "step": 1590, "valid_targets_mean": 11101.6, "valid_targets_min": 2707 }, { "epoch": 0.9410029498525073, "grad_norm": 0.22960216786420032, "learning_rate": 3.906319328639457e-05, "loss": 0.4275, "loss_nan_ranks": 0, "loss_rank_avg": 0.17267057299613953, "step": 1595, "valid_targets_mean": 10862.0, "valid_targets_min": 1591 }, { "epoch": 0.943952802359882, "grad_norm": 0.22563473609963453, "learning_rate": 3.905069410061576e-05, "loss": 0.4264, "loss_nan_ranks": 0, "loss_rank_avg": 0.15903520584106445, "step": 1600, "valid_targets_mean": 10801.4, "valid_targets_min": 1421 }, { "epoch": 0.9469026548672567, "grad_norm": 0.21538014638851252, "learning_rate": 3.90381141089668e-05, "loss": 0.4277, "loss_nan_ranks": 0, "loss_rank_avg": 0.1417563259601593, "step": 1605, "valid_targets_mean": 8929.9, "valid_targets_min": 1203 }, { "epoch": 0.9498525073746312, "grad_norm": 0.20130244582393142, "learning_rate": 3.902545336480726e-05, "loss": 0.4329, "loss_nan_ranks": 0, "loss_rank_avg": 0.1481684297323227, "step": 1610, "valid_targets_mean": 10474.6, "valid_targets_min": 1041 }, { "epoch": 0.9528023598820059, "grad_norm": 0.2296462679204711, "learning_rate": 3.9012711921839255e-05, "loss": 0.4289, "loss_nan_ranks": 0, "loss_rank_avg": 0.12770214676856995, "step": 1615, "valid_targets_mean": 8967.3, "valid_targets_min": 2401 }, { "epoch": 0.9557522123893806, "grad_norm": 0.21190599582292202, "learning_rate": 3.899988983410719e-05, "loss": 0.4245, "loss_nan_ranks": 0, "loss_rank_avg": 0.15029430389404297, "step": 1620, "valid_targets_mean": 10507.0, "valid_targets_min": 1811 }, { "epoch": 0.9587020648967551, "grad_norm": 0.2076012555064984, "learning_rate": 3.898698715599754e-05, "loss": 0.4287, "loss_nan_ranks": 0, "loss_rank_avg": 0.12323871999979019, "step": 1625, "valid_targets_mean": 9101.4, "valid_targets_min": 1896 }, { "epoch": 0.9616519174041298, "grad_norm": 0.23218538306869804, "learning_rate": 3.8974003942238595e-05, "loss": 0.4243, "loss_nan_ranks": 0, "loss_rank_avg": 0.1530805230140686, "step": 1630, "valid_targets_mean": 11740.2, "valid_targets_min": 1329 }, { "epoch": 0.9646017699115044, "grad_norm": 0.24503360985761793, "learning_rate": 3.896094024790026e-05, "loss": 0.4252, "loss_nan_ranks": 0, "loss_rank_avg": 0.1282130479812622, "step": 1635, "valid_targets_mean": 8273.8, "valid_targets_min": 1581 }, { "epoch": 0.967551622418879, "grad_norm": 0.2539213856936481, "learning_rate": 3.894779612839381e-05, "loss": 0.427, "loss_nan_ranks": 0, "loss_rank_avg": 0.1584298014640808, "step": 1640, "valid_targets_mean": 10531.7, "valid_targets_min": 2030 }, { "epoch": 0.9705014749262537, "grad_norm": 0.21788762425717897, "learning_rate": 3.893457163947165e-05, "loss": 0.4203, "loss_nan_ranks": 0, "loss_rank_avg": 0.12848243117332458, "step": 1645, "valid_targets_mean": 8572.2, "valid_targets_min": 1302 }, { "epoch": 0.9734513274336283, "grad_norm": 0.2259553001628983, "learning_rate": 3.892126683722709e-05, "loss": 0.4304, "loss_nan_ranks": 0, "loss_rank_avg": 0.15158626437187195, "step": 1650, "valid_targets_mean": 10365.0, "valid_targets_min": 1880 }, { "epoch": 0.976401179941003, "grad_norm": 0.19968783409752863, "learning_rate": 3.890788177809407e-05, "loss": 0.4333, "loss_nan_ranks": 0, "loss_rank_avg": 0.16649773716926575, "step": 1655, "valid_targets_mean": 11930.6, "valid_targets_min": 1431 }, { "epoch": 0.9793510324483776, "grad_norm": 0.19109065781129364, "learning_rate": 3.8894416518846984e-05, "loss": 0.4244, "loss_nan_ranks": 0, "loss_rank_avg": 0.14009195566177368, "step": 1660, "valid_targets_mean": 10015.8, "valid_targets_min": 1439 }, { "epoch": 0.9823008849557522, "grad_norm": 0.20147950450173913, "learning_rate": 3.88808711166004e-05, "loss": 0.4264, "loss_nan_ranks": 0, "loss_rank_avg": 0.15372982621192932, "step": 1665, "valid_targets_mean": 10110.8, "valid_targets_min": 2130 }, { "epoch": 0.9852507374631269, "grad_norm": 0.20274757156010115, "learning_rate": 3.886724562880878e-05, "loss": 0.4287, "loss_nan_ranks": 0, "loss_rank_avg": 0.1347220540046692, "step": 1670, "valid_targets_mean": 9938.6, "valid_targets_min": 1395 }, { "epoch": 0.9882005899705014, "grad_norm": 0.20933626991726081, "learning_rate": 3.8853540113266356e-05, "loss": 0.434, "loss_nan_ranks": 0, "loss_rank_avg": 0.170450359582901, "step": 1675, "valid_targets_mean": 11508.6, "valid_targets_min": 1832 }, { "epoch": 0.9911504424778761, "grad_norm": 0.1998299607341395, "learning_rate": 3.883975462810673e-05, "loss": 0.4221, "loss_nan_ranks": 0, "loss_rank_avg": 0.12960436940193176, "step": 1680, "valid_targets_mean": 9993.5, "valid_targets_min": 2294 }, { "epoch": 0.9941002949852508, "grad_norm": 0.2747789084378386, "learning_rate": 3.882588923180276e-05, "loss": 0.427, "loss_nan_ranks": 0, "loss_rank_avg": 0.16216714680194855, "step": 1685, "valid_targets_mean": 11300.2, "valid_targets_min": 1578 }, { "epoch": 0.9970501474926253, "grad_norm": 0.2060289370907001, "learning_rate": 3.881194398316622e-05, "loss": 0.4189, "loss_nan_ranks": 0, "loss_rank_avg": 0.13950684666633606, "step": 1690, "valid_targets_mean": 10239.3, "valid_targets_min": 1636 }, { "epoch": 1.0, "grad_norm": 0.2060665846116573, "learning_rate": 3.8797918941347605e-05, "loss": 0.424, "loss_nan_ranks": 0, "loss_rank_avg": 0.1244438886642456, "step": 1695, "valid_targets_mean": 9906.2, "valid_targets_min": 1715 }, { "epoch": 1.0029498525073746, "grad_norm": 0.2214317321286988, "learning_rate": 3.878381416583587e-05, "loss": 0.4111, "loss_nan_ranks": 0, "loss_rank_avg": 0.12244114279747009, "step": 1700, "valid_targets_mean": 8369.7, "valid_targets_min": 1768 }, { "epoch": 1.0058997050147493, "grad_norm": 0.2436305117216246, "learning_rate": 3.876962971645816e-05, "loss": 0.4145, "loss_nan_ranks": 0, "loss_rank_avg": 0.12919296324253082, "step": 1705, "valid_targets_mean": 8753.0, "valid_targets_min": 2256 }, { "epoch": 1.008849557522124, "grad_norm": 0.2541456145942789, "learning_rate": 3.8755365653379554e-05, "loss": 0.4147, "loss_nan_ranks": 0, "loss_rank_avg": 0.15090519189834595, "step": 1710, "valid_targets_mean": 10982.1, "valid_targets_min": 1108 }, { "epoch": 1.0117994100294985, "grad_norm": 0.23014848454095105, "learning_rate": 3.874102203710285e-05, "loss": 0.4178, "loss_nan_ranks": 0, "loss_rank_avg": 0.13246405124664307, "step": 1715, "valid_targets_mean": 11002.4, "valid_targets_min": 2056 }, { "epoch": 1.0147492625368733, "grad_norm": 0.22453946076727968, "learning_rate": 3.8726598928468264e-05, "loss": 0.4152, "loss_nan_ranks": 0, "loss_rank_avg": 0.1798960417509079, "step": 1720, "valid_targets_mean": 12538.0, "valid_targets_min": 3339 }, { "epoch": 1.0176991150442478, "grad_norm": 0.2135015538264713, "learning_rate": 3.871209638865319e-05, "loss": 0.4176, "loss_nan_ranks": 0, "loss_rank_avg": 0.15504910051822662, "step": 1725, "valid_targets_mean": 11040.2, "valid_targets_min": 993 }, { "epoch": 1.0206489675516224, "grad_norm": 0.2035972797318352, "learning_rate": 3.8697514479171944e-05, "loss": 0.4069, "loss_nan_ranks": 0, "loss_rank_avg": 0.15845829248428345, "step": 1730, "valid_targets_mean": 11769.6, "valid_targets_min": 993 }, { "epoch": 1.023598820058997, "grad_norm": 0.21102734058214348, "learning_rate": 3.868285326187549e-05, "loss": 0.4087, "loss_nan_ranks": 0, "loss_rank_avg": 0.15515300631523132, "step": 1735, "valid_targets_mean": 12242.0, "valid_targets_min": 1933 }, { "epoch": 1.0265486725663717, "grad_norm": 0.21414046560162203, "learning_rate": 3.8668112798951186e-05, "loss": 0.4084, "loss_nan_ranks": 0, "loss_rank_avg": 0.11055143177509308, "step": 1740, "valid_targets_mean": 8613.3, "valid_targets_min": 1326 }, { "epoch": 1.0294985250737463, "grad_norm": 0.3490042762055538, "learning_rate": 3.865329315292253e-05, "loss": 0.4143, "loss_nan_ranks": 0, "loss_rank_avg": 0.15151363611221313, "step": 1745, "valid_targets_mean": 10904.8, "valid_targets_min": 2374 }, { "epoch": 1.0324483775811208, "grad_norm": 0.19879886174283662, "learning_rate": 3.863839438664888e-05, "loss": 0.4077, "loss_nan_ranks": 0, "loss_rank_avg": 0.11457093805074692, "step": 1750, "valid_targets_mean": 9075.7, "valid_targets_min": 1929 }, { "epoch": 1.0353982300884956, "grad_norm": 0.22408334317438344, "learning_rate": 3.862341656332519e-05, "loss": 0.4094, "loss_nan_ranks": 0, "loss_rank_avg": 0.12300422042608261, "step": 1755, "valid_targets_mean": 9564.1, "valid_targets_min": 1758 }, { "epoch": 1.0383480825958702, "grad_norm": 0.20190523650308992, "learning_rate": 3.8608359746481757e-05, "loss": 0.4062, "loss_nan_ranks": 0, "loss_rank_avg": 0.12284660339355469, "step": 1760, "valid_targets_mean": 9423.4, "valid_targets_min": 1229 }, { "epoch": 1.0412979351032448, "grad_norm": 0.1889811146160302, "learning_rate": 3.859322399998391e-05, "loss": 0.411, "loss_nan_ranks": 0, "loss_rank_avg": 0.11543569713830948, "step": 1765, "valid_targets_mean": 8829.8, "valid_targets_min": 1326 }, { "epoch": 1.0442477876106195, "grad_norm": 0.20750598590889113, "learning_rate": 3.85780093880318e-05, "loss": 0.4168, "loss_nan_ranks": 0, "loss_rank_avg": 0.12260887026786804, "step": 1770, "valid_targets_mean": 9662.1, "valid_targets_min": 1275 }, { "epoch": 1.047197640117994, "grad_norm": 0.22141314053223685, "learning_rate": 3.856271597516007e-05, "loss": 0.4148, "loss_nan_ranks": 0, "loss_rank_avg": 0.14068543910980225, "step": 1775, "valid_targets_mean": 10959.3, "valid_targets_min": 638 }, { "epoch": 1.0501474926253687, "grad_norm": 0.21606621123216593, "learning_rate": 3.8547343826237625e-05, "loss": 0.4082, "loss_nan_ranks": 0, "loss_rank_avg": 0.1010463610291481, "step": 1780, "valid_targets_mean": 7978.1, "valid_targets_min": 766 }, { "epoch": 1.0530973451327434, "grad_norm": 0.21156952456065437, "learning_rate": 3.853189300646733e-05, "loss": 0.4096, "loss_nan_ranks": 0, "loss_rank_avg": 0.12438692152500153, "step": 1785, "valid_targets_mean": 10245.8, "valid_targets_min": 1763 }, { "epoch": 1.056047197640118, "grad_norm": 0.19194806585850302, "learning_rate": 3.8516363581385744e-05, "loss": 0.4219, "loss_nan_ranks": 0, "loss_rank_avg": 0.15674549341201782, "step": 1790, "valid_targets_mean": 11258.5, "valid_targets_min": 1816 }, { "epoch": 1.0589970501474926, "grad_norm": 0.2107193241639981, "learning_rate": 3.850075561686284e-05, "loss": 0.4077, "loss_nan_ranks": 0, "loss_rank_avg": 0.1198762059211731, "step": 1795, "valid_targets_mean": 8000.7, "valid_targets_min": 2223 }, { "epoch": 1.0619469026548674, "grad_norm": 0.2148666662551988, "learning_rate": 3.848506917910173e-05, "loss": 0.4149, "loss_nan_ranks": 0, "loss_rank_avg": 0.13810782134532928, "step": 1800, "valid_targets_mean": 10893.6, "valid_targets_min": 1409 }, { "epoch": 1.064896755162242, "grad_norm": 0.19406443957944047, "learning_rate": 3.846930433463837e-05, "loss": 0.4143, "loss_nan_ranks": 0, "loss_rank_avg": 0.13573281466960907, "step": 1805, "valid_targets_mean": 10108.5, "valid_targets_min": 1004 }, { "epoch": 1.0678466076696165, "grad_norm": 0.23058912274050483, "learning_rate": 3.84534611503413e-05, "loss": 0.4135, "loss_nan_ranks": 0, "loss_rank_avg": 0.1543012261390686, "step": 1810, "valid_targets_mean": 12145.3, "valid_targets_min": 1885 }, { "epoch": 1.0707964601769913, "grad_norm": 0.21404882128297154, "learning_rate": 3.843753969341133e-05, "loss": 0.409, "loss_nan_ranks": 0, "loss_rank_avg": 0.17230772972106934, "step": 1815, "valid_targets_mean": 11707.7, "valid_targets_min": 2484 }, { "epoch": 1.0737463126843658, "grad_norm": 0.21766349751933262, "learning_rate": 3.84215400313813e-05, "loss": 0.4123, "loss_nan_ranks": 0, "loss_rank_avg": 0.16566194593906403, "step": 1820, "valid_targets_mean": 10948.0, "valid_targets_min": 1919 }, { "epoch": 1.0766961651917404, "grad_norm": 0.21941802778104524, "learning_rate": 3.840546223211573e-05, "loss": 0.413, "loss_nan_ranks": 0, "loss_rank_avg": 0.13953745365142822, "step": 1825, "valid_targets_mean": 10782.3, "valid_targets_min": 1761 }, { "epoch": 1.079646017699115, "grad_norm": 0.21274994098907102, "learning_rate": 3.8389306363810603e-05, "loss": 0.4094, "loss_nan_ranks": 0, "loss_rank_avg": 0.12339918315410614, "step": 1830, "valid_targets_mean": 9099.6, "valid_targets_min": 1580 }, { "epoch": 1.0825958702064897, "grad_norm": 0.22377623817685083, "learning_rate": 3.837307249499304e-05, "loss": 0.4092, "loss_nan_ranks": 0, "loss_rank_avg": 0.11521419882774353, "step": 1835, "valid_targets_mean": 9367.8, "valid_targets_min": 1997 }, { "epoch": 1.0855457227138643, "grad_norm": 0.19797643732478384, "learning_rate": 3.835676069452098e-05, "loss": 0.4059, "loss_nan_ranks": 0, "loss_rank_avg": 0.17100510001182556, "step": 1840, "valid_targets_mean": 12947.3, "valid_targets_min": 2121 }, { "epoch": 1.0884955752212389, "grad_norm": 0.21865904068357092, "learning_rate": 3.834037103158294e-05, "loss": 0.4127, "loss_nan_ranks": 0, "loss_rank_avg": 0.11623190343379974, "step": 1845, "valid_targets_mean": 9119.2, "valid_targets_min": 581 }, { "epoch": 1.0914454277286136, "grad_norm": 0.19819166759077297, "learning_rate": 3.832390357569771e-05, "loss": 0.4113, "loss_nan_ranks": 0, "loss_rank_avg": 0.13250255584716797, "step": 1850, "valid_targets_mean": 10413.7, "valid_targets_min": 1747 }, { "epoch": 1.0943952802359882, "grad_norm": 0.2137794724256389, "learning_rate": 3.830735839671402e-05, "loss": 0.414, "loss_nan_ranks": 0, "loss_rank_avg": 0.1471385657787323, "step": 1855, "valid_targets_mean": 10754.2, "valid_targets_min": 2854 }, { "epoch": 1.0973451327433628, "grad_norm": 0.20180269762632919, "learning_rate": 3.829073556481031e-05, "loss": 0.4046, "loss_nan_ranks": 0, "loss_rank_avg": 0.11916483938694, "step": 1860, "valid_targets_mean": 9007.5, "valid_targets_min": 1396 }, { "epoch": 1.1002949852507375, "grad_norm": 0.1967635045770067, "learning_rate": 3.827403515049435e-05, "loss": 0.4079, "loss_nan_ranks": 0, "loss_rank_avg": 0.09877189993858337, "step": 1865, "valid_targets_mean": 8820.8, "valid_targets_min": 1666 }, { "epoch": 1.103244837758112, "grad_norm": 0.21494925676253426, "learning_rate": 3.8257257224603017e-05, "loss": 0.41, "loss_nan_ranks": 0, "loss_rank_avg": 0.13791577517986298, "step": 1870, "valid_targets_mean": 10300.9, "valid_targets_min": 1870 }, { "epoch": 1.1061946902654867, "grad_norm": 0.20240256675457352, "learning_rate": 3.824040185830196e-05, "loss": 0.4183, "loss_nan_ranks": 0, "loss_rank_avg": 0.15127933025360107, "step": 1875, "valid_targets_mean": 10301.0, "valid_targets_min": 1872 }, { "epoch": 1.1091445427728615, "grad_norm": 0.19891739705938485, "learning_rate": 3.82234691230853e-05, "loss": 0.4178, "loss_nan_ranks": 0, "loss_rank_avg": 0.11647451668977737, "step": 1880, "valid_targets_mean": 8726.2, "valid_targets_min": 1376 }, { "epoch": 1.112094395280236, "grad_norm": 0.22683438639070486, "learning_rate": 3.82064590907753e-05, "loss": 0.4165, "loss_nan_ranks": 0, "loss_rank_avg": 0.13766145706176758, "step": 1885, "valid_targets_mean": 9197.0, "valid_targets_min": 1423 }, { "epoch": 1.1150442477876106, "grad_norm": 0.21204497029633457, "learning_rate": 3.818937183352214e-05, "loss": 0.4118, "loss_nan_ranks": 0, "loss_rank_avg": 0.13173851370811462, "step": 1890, "valid_targets_mean": 10090.6, "valid_targets_min": 1763 }, { "epoch": 1.1179941002949851, "grad_norm": 0.2040720064717632, "learning_rate": 3.81722074238035e-05, "loss": 0.4054, "loss_nan_ranks": 0, "loss_rank_avg": 0.14814019203186035, "step": 1895, "valid_targets_mean": 12130.7, "valid_targets_min": 2016 }, { "epoch": 1.12094395280236, "grad_norm": 0.20133866889947288, "learning_rate": 3.815496593442437e-05, "loss": 0.4061, "loss_nan_ranks": 0, "loss_rank_avg": 0.15776057541370392, "step": 1900, "valid_targets_mean": 12728.4, "valid_targets_min": 2160 }, { "epoch": 1.1238938053097345, "grad_norm": 0.20242503749135837, "learning_rate": 3.813764743851665e-05, "loss": 0.4141, "loss_nan_ranks": 0, "loss_rank_avg": 0.15720617771148682, "step": 1905, "valid_targets_mean": 10916.8, "valid_targets_min": 1351 }, { "epoch": 1.1268436578171093, "grad_norm": 0.208072373800863, "learning_rate": 3.812025200953886e-05, "loss": 0.4127, "loss_nan_ranks": 0, "loss_rank_avg": 0.1405029296875, "step": 1910, "valid_targets_mean": 9711.5, "valid_targets_min": 1453 }, { "epoch": 1.1297935103244838, "grad_norm": 0.21335388533193136, "learning_rate": 3.8102779721275876e-05, "loss": 0.4187, "loss_nan_ranks": 0, "loss_rank_avg": 0.11071514338254929, "step": 1915, "valid_targets_mean": 7793.0, "valid_targets_min": 2061 }, { "epoch": 1.1327433628318584, "grad_norm": 0.20639777456737793, "learning_rate": 3.808523064783855e-05, "loss": 0.4093, "loss_nan_ranks": 0, "loss_rank_avg": 0.15259069204330444, "step": 1920, "valid_targets_mean": 10522.3, "valid_targets_min": 2051 }, { "epoch": 1.135693215339233, "grad_norm": 0.20238312463667626, "learning_rate": 3.806760486366346e-05, "loss": 0.4094, "loss_nan_ranks": 0, "loss_rank_avg": 0.12089171260595322, "step": 1925, "valid_targets_mean": 9354.5, "valid_targets_min": 1660 }, { "epoch": 1.1386430678466077, "grad_norm": 0.20356162120879506, "learning_rate": 3.8049902443512545e-05, "loss": 0.4075, "loss_nan_ranks": 0, "loss_rank_avg": 0.11329087615013123, "step": 1930, "valid_targets_mean": 8649.6, "valid_targets_min": 1301 }, { "epoch": 1.1415929203539823, "grad_norm": 0.1804088599383834, "learning_rate": 3.803212346247279e-05, "loss": 0.4055, "loss_nan_ranks": 0, "loss_rank_avg": 0.1426897943019867, "step": 1935, "valid_targets_mean": 10430.0, "valid_targets_min": 880 }, { "epoch": 1.1445427728613569, "grad_norm": 0.2271543333220535, "learning_rate": 3.801426799595594e-05, "loss": 0.4107, "loss_nan_ranks": 0, "loss_rank_avg": 0.14367930591106415, "step": 1940, "valid_targets_mean": 10661.6, "valid_targets_min": 1734 }, { "epoch": 1.1474926253687316, "grad_norm": 0.1928149869518129, "learning_rate": 3.799633611969816e-05, "loss": 0.403, "loss_nan_ranks": 0, "loss_rank_avg": 0.12169966101646423, "step": 1945, "valid_targets_mean": 10279.0, "valid_targets_min": 1395 }, { "epoch": 1.1504424778761062, "grad_norm": 0.21134894803857232, "learning_rate": 3.7978327909759724e-05, "loss": 0.4067, "loss_nan_ranks": 0, "loss_rank_avg": 0.12604662775993347, "step": 1950, "valid_targets_mean": 8528.5, "valid_targets_min": 2313 }, { "epoch": 1.1533923303834808, "grad_norm": 0.20396072826134254, "learning_rate": 3.796024344252468e-05, "loss": 0.4106, "loss_nan_ranks": 0, "loss_rank_avg": 0.1569386124610901, "step": 1955, "valid_targets_mean": 11313.9, "valid_targets_min": 1467 }, { "epoch": 1.1563421828908556, "grad_norm": 0.22194681338512706, "learning_rate": 3.7942082794700515e-05, "loss": 0.4094, "loss_nan_ranks": 0, "loss_rank_avg": 0.1357463002204895, "step": 1960, "valid_targets_mean": 10597.4, "valid_targets_min": 2147 }, { "epoch": 1.1592920353982301, "grad_norm": 0.20539906350360473, "learning_rate": 3.7923846043317865e-05, "loss": 0.4109, "loss_nan_ranks": 0, "loss_rank_avg": 0.1538807451725006, "step": 1965, "valid_targets_mean": 12742.9, "valid_targets_min": 1402 }, { "epoch": 1.1622418879056047, "grad_norm": 0.20120409032277925, "learning_rate": 3.790553326573016e-05, "loss": 0.4127, "loss_nan_ranks": 0, "loss_rank_avg": 0.13526630401611328, "step": 1970, "valid_targets_mean": 10137.4, "valid_targets_min": 1357 }, { "epoch": 1.1651917404129795, "grad_norm": 0.21338986564297552, "learning_rate": 3.788714453961331e-05, "loss": 0.4113, "loss_nan_ranks": 0, "loss_rank_avg": 0.13483178615570068, "step": 1975, "valid_targets_mean": 10012.6, "valid_targets_min": 2316 }, { "epoch": 1.168141592920354, "grad_norm": 0.21188408754979535, "learning_rate": 3.786867994296535e-05, "loss": 0.411, "loss_nan_ranks": 0, "loss_rank_avg": 0.1392839252948761, "step": 1980, "valid_targets_mean": 9308.8, "valid_targets_min": 1282 }, { "epoch": 1.1710914454277286, "grad_norm": 0.2039564451558122, "learning_rate": 3.785013955410617e-05, "loss": 0.4065, "loss_nan_ranks": 0, "loss_rank_avg": 0.09764277935028076, "step": 1985, "valid_targets_mean": 8041.7, "valid_targets_min": 1623 }, { "epoch": 1.1740412979351031, "grad_norm": 0.19136114966992632, "learning_rate": 3.783152345167711e-05, "loss": 0.4097, "loss_nan_ranks": 0, "loss_rank_avg": 0.12284572422504425, "step": 1990, "valid_targets_mean": 9104.2, "valid_targets_min": 2701 }, { "epoch": 1.176991150442478, "grad_norm": 0.1916739509383337, "learning_rate": 3.781283171464065e-05, "loss": 0.4158, "loss_nan_ranks": 0, "loss_rank_avg": 0.13541018962860107, "step": 1995, "valid_targets_mean": 9892.2, "valid_targets_min": 1543 }, { "epoch": 1.1799410029498525, "grad_norm": 0.21980881264220392, "learning_rate": 3.779406442228012e-05, "loss": 0.4089, "loss_nan_ranks": 0, "loss_rank_avg": 0.13939528167247772, "step": 2000, "valid_targets_mean": 8413.7, "valid_targets_min": 1348 }, { "epoch": 1.182890855457227, "grad_norm": 0.25391048063546057, "learning_rate": 3.777522165419929e-05, "loss": 0.4147, "loss_nan_ranks": 0, "loss_rank_avg": 0.12453456223011017, "step": 2005, "valid_targets_mean": 9011.9, "valid_targets_min": 1258 }, { "epoch": 1.1858407079646018, "grad_norm": 0.1946857583209541, "learning_rate": 3.77563034903221e-05, "loss": 0.4094, "loss_nan_ranks": 0, "loss_rank_avg": 0.13194556534290314, "step": 2010, "valid_targets_mean": 10724.9, "valid_targets_min": 1737 }, { "epoch": 1.1887905604719764, "grad_norm": 0.19693826294861733, "learning_rate": 3.773731001089227e-05, "loss": 0.4166, "loss_nan_ranks": 0, "loss_rank_avg": 0.14914648234844208, "step": 2015, "valid_targets_mean": 11330.2, "valid_targets_min": 2645 }, { "epoch": 1.191740412979351, "grad_norm": 0.2073049850541922, "learning_rate": 3.771824129647299e-05, "loss": 0.4112, "loss_nan_ranks": 0, "loss_rank_avg": 0.12241712957620621, "step": 2020, "valid_targets_mean": 8752.2, "valid_targets_min": 1943 }, { "epoch": 1.1946902654867257, "grad_norm": 0.2085637489120309, "learning_rate": 3.7699097427946556e-05, "loss": 0.4122, "loss_nan_ranks": 0, "loss_rank_avg": 0.13761894404888153, "step": 2025, "valid_targets_mean": 10287.4, "valid_targets_min": 1357 }, { "epoch": 1.1976401179941003, "grad_norm": 0.222453588302852, "learning_rate": 3.7679878486514066e-05, "loss": 0.4078, "loss_nan_ranks": 0, "loss_rank_avg": 0.14405113458633423, "step": 2030, "valid_targets_mean": 11753.1, "valid_targets_min": 2172 }, { "epoch": 1.2005899705014749, "grad_norm": 0.24169539701661746, "learning_rate": 3.7660584553695015e-05, "loss": 0.4062, "loss_nan_ranks": 0, "loss_rank_avg": 0.13349585235118866, "step": 2035, "valid_targets_mean": 10826.9, "valid_targets_min": 1833 }, { "epoch": 1.2035398230088497, "grad_norm": 0.2108273326549157, "learning_rate": 3.7641215711327016e-05, "loss": 0.4074, "loss_nan_ranks": 0, "loss_rank_avg": 0.12320627272129059, "step": 2040, "valid_targets_mean": 8298.7, "valid_targets_min": 2118 }, { "epoch": 1.2064896755162242, "grad_norm": 0.20442694007571818, "learning_rate": 3.762177204156539e-05, "loss": 0.4084, "loss_nan_ranks": 0, "loss_rank_avg": 0.14502795040607452, "step": 2045, "valid_targets_mean": 10686.5, "valid_targets_min": 1710 }, { "epoch": 1.2094395280235988, "grad_norm": 0.19955409878173785, "learning_rate": 3.760225362688287e-05, "loss": 0.4121, "loss_nan_ranks": 0, "loss_rank_avg": 0.1251523792743683, "step": 2050, "valid_targets_mean": 10852.7, "valid_targets_min": 1179 }, { "epoch": 1.2123893805309733, "grad_norm": 0.2103406530212919, "learning_rate": 3.758266055006922e-05, "loss": 0.4137, "loss_nan_ranks": 0, "loss_rank_avg": 0.1394679844379425, "step": 2055, "valid_targets_mean": 9916.9, "valid_targets_min": 2572 }, { "epoch": 1.2153392330383481, "grad_norm": 0.23099560954553897, "learning_rate": 3.756299289423089e-05, "loss": 0.4115, "loss_nan_ranks": 0, "loss_rank_avg": 0.13078881800174713, "step": 2060, "valid_targets_mean": 9324.3, "valid_targets_min": 2445 }, { "epoch": 1.2182890855457227, "grad_norm": 0.20192145184305313, "learning_rate": 3.7543250742790676e-05, "loss": 0.4105, "loss_nan_ranks": 0, "loss_rank_avg": 0.13179230690002441, "step": 2065, "valid_targets_mean": 9231.1, "valid_targets_min": 1873 }, { "epoch": 1.2212389380530975, "grad_norm": 0.2248883000903419, "learning_rate": 3.752343417948734e-05, "loss": 0.4097, "loss_nan_ranks": 0, "loss_rank_avg": 0.14653357863426208, "step": 2070, "valid_targets_mean": 10349.4, "valid_targets_min": 898 }, { "epoch": 1.224188790560472, "grad_norm": 0.19674161802721363, "learning_rate": 3.750354328837529e-05, "loss": 0.4045, "loss_nan_ranks": 0, "loss_rank_avg": 0.12419191002845764, "step": 2075, "valid_targets_mean": 9958.1, "valid_targets_min": 2833 }, { "epoch": 1.2271386430678466, "grad_norm": 0.2040519297416266, "learning_rate": 3.748357815382419e-05, "loss": 0.4061, "loss_nan_ranks": 0, "loss_rank_avg": 0.13978463411331177, "step": 2080, "valid_targets_mean": 9267.8, "valid_targets_min": 1924 }, { "epoch": 1.2300884955752212, "grad_norm": 0.1935700879911901, "learning_rate": 3.746353886051862e-05, "loss": 0.4131, "loss_nan_ranks": 0, "loss_rank_avg": 0.14617498219013214, "step": 2085, "valid_targets_mean": 11356.9, "valid_targets_min": 1715 }, { "epoch": 1.233038348082596, "grad_norm": 0.20323760274797556, "learning_rate": 3.7443425493457735e-05, "loss": 0.4028, "loss_nan_ranks": 0, "loss_rank_avg": 0.15078863501548767, "step": 2090, "valid_targets_mean": 9942.5, "valid_targets_min": 2202 }, { "epoch": 1.2359882005899705, "grad_norm": 0.19237355834888428, "learning_rate": 3.7423238137954835e-05, "loss": 0.4027, "loss_nan_ranks": 0, "loss_rank_avg": 0.12100933492183685, "step": 2095, "valid_targets_mean": 9043.8, "valid_targets_min": 2039 }, { "epoch": 1.238938053097345, "grad_norm": 0.19405452277576316, "learning_rate": 3.74029768796371e-05, "loss": 0.4126, "loss_nan_ranks": 0, "loss_rank_avg": 0.12515579164028168, "step": 2100, "valid_targets_mean": 10029.0, "valid_targets_min": 2074 }, { "epoch": 1.2418879056047198, "grad_norm": 0.1918975786310472, "learning_rate": 3.7382641804445136e-05, "loss": 0.4101, "loss_nan_ranks": 0, "loss_rank_avg": 0.13490715622901917, "step": 2105, "valid_targets_mean": 12080.2, "valid_targets_min": 1794 }, { "epoch": 1.2448377581120944, "grad_norm": 0.22948564571877864, "learning_rate": 3.73622329986327e-05, "loss": 0.4081, "loss_nan_ranks": 0, "loss_rank_avg": 0.14957517385482788, "step": 2110, "valid_targets_mean": 10673.3, "valid_targets_min": 1919 }, { "epoch": 1.247787610619469, "grad_norm": 0.1956858906108937, "learning_rate": 3.734175054876626e-05, "loss": 0.4018, "loss_nan_ranks": 0, "loss_rank_avg": 0.13325190544128418, "step": 2115, "valid_targets_mean": 10177.9, "valid_targets_min": 816 }, { "epoch": 1.2507374631268435, "grad_norm": 0.20690628762099494, "learning_rate": 3.7321194541724625e-05, "loss": 0.4055, "loss_nan_ranks": 0, "loss_rank_avg": 0.1585572063922882, "step": 2120, "valid_targets_mean": 11231.2, "valid_targets_min": 2275 }, { "epoch": 1.2536873156342183, "grad_norm": 0.1958247690154711, "learning_rate": 3.7300565064698664e-05, "loss": 0.4057, "loss_nan_ranks": 0, "loss_rank_avg": 0.11031612753868103, "step": 2125, "valid_targets_mean": 8387.8, "valid_targets_min": 1395 }, { "epoch": 1.2566371681415929, "grad_norm": 0.2249780519965779, "learning_rate": 3.727986220519085e-05, "loss": 0.4014, "loss_nan_ranks": 0, "loss_rank_avg": 0.15190738439559937, "step": 2130, "valid_targets_mean": 10092.2, "valid_targets_min": 1533 }, { "epoch": 1.2595870206489677, "grad_norm": 0.19232542968979785, "learning_rate": 3.7259086051014896e-05, "loss": 0.4125, "loss_nan_ranks": 0, "loss_rank_avg": 0.13802318274974823, "step": 2135, "valid_targets_mean": 11030.4, "valid_targets_min": 1781 }, { "epoch": 1.2625368731563422, "grad_norm": 0.21055352053943993, "learning_rate": 3.7238236690295433e-05, "loss": 0.4106, "loss_nan_ranks": 0, "loss_rank_avg": 0.12079479545354843, "step": 2140, "valid_targets_mean": 8386.0, "valid_targets_min": 1623 }, { "epoch": 1.2654867256637168, "grad_norm": 0.21340054364438876, "learning_rate": 3.7217314211467615e-05, "loss": 0.4113, "loss_nan_ranks": 0, "loss_rank_avg": 0.1280185729265213, "step": 2145, "valid_targets_mean": 9386.7, "valid_targets_min": 2248 }, { "epoch": 1.2684365781710913, "grad_norm": 0.19654827232796557, "learning_rate": 3.7196318703276695e-05, "loss": 0.412, "loss_nan_ranks": 0, "loss_rank_avg": 0.12935896217823029, "step": 2150, "valid_targets_mean": 10851.2, "valid_targets_min": 1999 }, { "epoch": 1.2713864306784661, "grad_norm": 0.18684413906547542, "learning_rate": 3.717525025477772e-05, "loss": 0.4107, "loss_nan_ranks": 0, "loss_rank_avg": 0.12971490621566772, "step": 2155, "valid_targets_mean": 10156.7, "valid_targets_min": 1575 }, { "epoch": 1.2743362831858407, "grad_norm": 0.20131635339460882, "learning_rate": 3.715410895533511e-05, "loss": 0.4128, "loss_nan_ranks": 0, "loss_rank_avg": 0.1318942904472351, "step": 2160, "valid_targets_mean": 9176.0, "valid_targets_min": 1819 }, { "epoch": 1.2772861356932155, "grad_norm": 0.20005532418427976, "learning_rate": 3.713289489462231e-05, "loss": 0.4093, "loss_nan_ranks": 0, "loss_rank_avg": 0.12302594631910324, "step": 2165, "valid_targets_mean": 9579.9, "valid_targets_min": 1936 }, { "epoch": 1.28023598820059, "grad_norm": 0.1987319890122761, "learning_rate": 3.711160816262136e-05, "loss": 0.4038, "loss_nan_ranks": 0, "loss_rank_avg": 0.13187222182750702, "step": 2170, "valid_targets_mean": 10588.2, "valid_targets_min": 2210 }, { "epoch": 1.2831858407079646, "grad_norm": 0.20569943718314818, "learning_rate": 3.7090248849622575e-05, "loss": 0.4108, "loss_nan_ranks": 0, "loss_rank_avg": 0.1288871467113495, "step": 2175, "valid_targets_mean": 9435.7, "valid_targets_min": 1343 }, { "epoch": 1.2861356932153392, "grad_norm": 0.19481024413783074, "learning_rate": 3.7068817046224106e-05, "loss": 0.4121, "loss_nan_ranks": 0, "loss_rank_avg": 0.1117725670337677, "step": 2180, "valid_targets_mean": 8765.1, "valid_targets_min": 2181 }, { "epoch": 1.289085545722714, "grad_norm": 0.2075955871038273, "learning_rate": 3.7047312843331596e-05, "loss": 0.4058, "loss_nan_ranks": 0, "loss_rank_avg": 0.13937462866306305, "step": 2185, "valid_targets_mean": 11306.6, "valid_targets_min": 1251 }, { "epoch": 1.2920353982300885, "grad_norm": 0.1966624832512414, "learning_rate": 3.702573633215778e-05, "loss": 0.4082, "loss_nan_ranks": 0, "loss_rank_avg": 0.1228807345032692, "step": 2190, "valid_targets_mean": 8945.6, "valid_targets_min": 2289 }, { "epoch": 1.294985250737463, "grad_norm": 0.17735257514071073, "learning_rate": 3.700408760422209e-05, "loss": 0.4114, "loss_nan_ranks": 0, "loss_rank_avg": 0.13248281180858612, "step": 2195, "valid_targets_mean": 10275.5, "valid_targets_min": 2173 }, { "epoch": 1.2979351032448379, "grad_norm": 0.20566850050832683, "learning_rate": 3.698236675135027e-05, "loss": 0.4068, "loss_nan_ranks": 0, "loss_rank_avg": 0.12011992931365967, "step": 2200, "valid_targets_mean": 9283.0, "valid_targets_min": 1861 }, { "epoch": 1.3008849557522124, "grad_norm": 0.19471925424106384, "learning_rate": 3.696057386567401e-05, "loss": 0.4039, "loss_nan_ranks": 0, "loss_rank_avg": 0.11719102412462234, "step": 2205, "valid_targets_mean": 8844.1, "valid_targets_min": 1562 }, { "epoch": 1.303834808259587, "grad_norm": 0.20677025054702694, "learning_rate": 3.6938709039630514e-05, "loss": 0.4088, "loss_nan_ranks": 0, "loss_rank_avg": 0.11571133136749268, "step": 2210, "valid_targets_mean": 9628.9, "valid_targets_min": 2723 }, { "epoch": 1.3067846607669615, "grad_norm": 0.19386983627829316, "learning_rate": 3.6916772365962146e-05, "loss": 0.4071, "loss_nan_ranks": 0, "loss_rank_avg": 0.14339354634284973, "step": 2215, "valid_targets_mean": 9824.7, "valid_targets_min": 2124 }, { "epoch": 1.3097345132743363, "grad_norm": 0.20733483530915647, "learning_rate": 3.689476393771601e-05, "loss": 0.4087, "loss_nan_ranks": 0, "loss_rank_avg": 0.16114959120750427, "step": 2220, "valid_targets_mean": 10805.5, "valid_targets_min": 1645 }, { "epoch": 1.3126843657817109, "grad_norm": 0.2074662286669484, "learning_rate": 3.687268384824358e-05, "loss": 0.4065, "loss_nan_ranks": 0, "loss_rank_avg": 0.1201554462313652, "step": 2225, "valid_targets_mean": 8827.6, "valid_targets_min": 1488 }, { "epoch": 1.3156342182890857, "grad_norm": 0.20787590103008372, "learning_rate": 3.685053219120027e-05, "loss": 0.4076, "loss_nan_ranks": 0, "loss_rank_avg": 0.1468854397535324, "step": 2230, "valid_targets_mean": 9714.4, "valid_targets_min": 1897 }, { "epoch": 1.3185840707964602, "grad_norm": 0.2130181150365414, "learning_rate": 3.682830906054508e-05, "loss": 0.4033, "loss_nan_ranks": 0, "loss_rank_avg": 0.13946279883384705, "step": 2235, "valid_targets_mean": 10670.6, "valid_targets_min": 1889 }, { "epoch": 1.3215339233038348, "grad_norm": 0.19106711316771613, "learning_rate": 3.680601455054015e-05, "loss": 0.4112, "loss_nan_ranks": 0, "loss_rank_avg": 0.15019375085830688, "step": 2240, "valid_targets_mean": 10592.3, "valid_targets_min": 2458 }, { "epoch": 1.3244837758112094, "grad_norm": 0.19726641284267823, "learning_rate": 3.6783648755750384e-05, "loss": 0.4007, "loss_nan_ranks": 0, "loss_rank_avg": 0.17111629247665405, "step": 2245, "valid_targets_mean": 13763.0, "valid_targets_min": 1776 }, { "epoch": 1.3274336283185841, "grad_norm": 0.18422082465731265, "learning_rate": 3.6761211771043094e-05, "loss": 0.4085, "loss_nan_ranks": 0, "loss_rank_avg": 0.12834113836288452, "step": 2250, "valid_targets_mean": 10454.7, "valid_targets_min": 1719 }, { "epoch": 1.3303834808259587, "grad_norm": 0.18180812278892167, "learning_rate": 3.673870369158749e-05, "loss": 0.4103, "loss_nan_ranks": 0, "loss_rank_avg": 0.14465734362602234, "step": 2255, "valid_targets_mean": 9654.4, "valid_targets_min": 1351 }, { "epoch": 1.3333333333333333, "grad_norm": 0.1895037587937176, "learning_rate": 3.671612461285439e-05, "loss": 0.4026, "loss_nan_ranks": 0, "loss_rank_avg": 0.13590912520885468, "step": 2260, "valid_targets_mean": 10966.7, "valid_targets_min": 1919 }, { "epoch": 1.336283185840708, "grad_norm": 0.18289571304655325, "learning_rate": 3.6693474630615723e-05, "loss": 0.4093, "loss_nan_ranks": 0, "loss_rank_avg": 0.14450351893901825, "step": 2265, "valid_targets_mean": 10623.2, "valid_targets_min": 2312 }, { "epoch": 1.3392330383480826, "grad_norm": 0.19387794145565707, "learning_rate": 3.6670753840944196e-05, "loss": 0.4113, "loss_nan_ranks": 0, "loss_rank_avg": 0.14855991303920746, "step": 2270, "valid_targets_mean": 11599.1, "valid_targets_min": 1690 }, { "epoch": 1.3421828908554572, "grad_norm": 0.2129132270060968, "learning_rate": 3.6647962340212845e-05, "loss": 0.4001, "loss_nan_ranks": 0, "loss_rank_avg": 0.12970374524593353, "step": 2275, "valid_targets_mean": 10497.8, "valid_targets_min": 1494 }, { "epoch": 1.3451327433628317, "grad_norm": 0.20779965227080616, "learning_rate": 3.6625100225094624e-05, "loss": 0.4107, "loss_nan_ranks": 0, "loss_rank_avg": 0.1262437105178833, "step": 2280, "valid_targets_mean": 9126.5, "valid_targets_min": 2499 }, { "epoch": 1.3480825958702065, "grad_norm": 0.2017390741108949, "learning_rate": 3.660216759256202e-05, "loss": 0.4135, "loss_nan_ranks": 0, "loss_rank_avg": 0.14283165335655212, "step": 2285, "valid_targets_mean": 10106.3, "valid_targets_min": 1729 }, { "epoch": 1.351032448377581, "grad_norm": 0.18994227000395517, "learning_rate": 3.657916453988663e-05, "loss": 0.4039, "loss_nan_ranks": 0, "loss_rank_avg": 0.12617641687393188, "step": 2290, "valid_targets_mean": 10339.8, "valid_targets_min": 1135 }, { "epoch": 1.3539823008849559, "grad_norm": 0.2119826690671679, "learning_rate": 3.655609116463874e-05, "loss": 0.3999, "loss_nan_ranks": 0, "loss_rank_avg": 0.15031850337982178, "step": 2295, "valid_targets_mean": 10505.3, "valid_targets_min": 1982 }, { "epoch": 1.3569321533923304, "grad_norm": 0.21767299900598155, "learning_rate": 3.65329475646869e-05, "loss": 0.4034, "loss_nan_ranks": 0, "loss_rank_avg": 0.11701009422540665, "step": 2300, "valid_targets_mean": 8692.3, "valid_targets_min": 2029 }, { "epoch": 1.359882005899705, "grad_norm": 0.2183834292919999, "learning_rate": 3.6509733838197564e-05, "loss": 0.4101, "loss_nan_ranks": 0, "loss_rank_avg": 0.16395114362239838, "step": 2305, "valid_targets_mean": 11298.5, "valid_targets_min": 2026 }, { "epoch": 1.3628318584070795, "grad_norm": 0.18901010572773513, "learning_rate": 3.648645008363462e-05, "loss": 0.4063, "loss_nan_ranks": 0, "loss_rank_avg": 0.13451609015464783, "step": 2310, "valid_targets_mean": 11260.0, "valid_targets_min": 1881 }, { "epoch": 1.3657817109144543, "grad_norm": 0.2048497137635517, "learning_rate": 3.646309639975897e-05, "loss": 0.4068, "loss_nan_ranks": 0, "loss_rank_avg": 0.13462871313095093, "step": 2315, "valid_targets_mean": 8625.0, "valid_targets_min": 1667 }, { "epoch": 1.368731563421829, "grad_norm": 0.19236734583414303, "learning_rate": 3.6439672885628166e-05, "loss": 0.4088, "loss_nan_ranks": 0, "loss_rank_avg": 0.13107746839523315, "step": 2320, "valid_targets_mean": 9656.2, "valid_targets_min": 934 }, { "epoch": 1.3716814159292037, "grad_norm": 0.19053766648018297, "learning_rate": 3.6416179640595915e-05, "loss": 0.4053, "loss_nan_ranks": 0, "loss_rank_avg": 0.13497191667556763, "step": 2325, "valid_targets_mean": 9664.0, "valid_targets_min": 1144 }, { "epoch": 1.3746312684365782, "grad_norm": 0.19300409834685217, "learning_rate": 3.639261676431173e-05, "loss": 0.409, "loss_nan_ranks": 0, "loss_rank_avg": 0.1307114213705063, "step": 2330, "valid_targets_mean": 9555.0, "valid_targets_min": 1431 }, { "epoch": 1.3775811209439528, "grad_norm": 0.1915293402622118, "learning_rate": 3.636898435672045e-05, "loss": 0.4086, "loss_nan_ranks": 0, "loss_rank_avg": 0.14565394818782806, "step": 2335, "valid_targets_mean": 11355.8, "valid_targets_min": 1551 }, { "epoch": 1.3805309734513274, "grad_norm": 0.18757009262408111, "learning_rate": 3.6345282518061854e-05, "loss": 0.4081, "loss_nan_ranks": 0, "loss_rank_avg": 0.13044847548007965, "step": 2340, "valid_targets_mean": 9336.7, "valid_targets_min": 1510 }, { "epoch": 1.3834808259587021, "grad_norm": 0.21574355726659275, "learning_rate": 3.6321511348870216e-05, "loss": 0.4108, "loss_nan_ranks": 0, "loss_rank_avg": 0.14156800508499146, "step": 2345, "valid_targets_mean": 10439.0, "valid_targets_min": 950 }, { "epoch": 1.3864306784660767, "grad_norm": 0.2220379252664554, "learning_rate": 3.629767094997387e-05, "loss": 0.4085, "loss_nan_ranks": 0, "loss_rank_avg": 0.1283535361289978, "step": 2350, "valid_targets_mean": 9239.7, "valid_targets_min": 1882 }, { "epoch": 1.3893805309734513, "grad_norm": 0.20889828514195585, "learning_rate": 3.6273761422494835e-05, "loss": 0.4069, "loss_nan_ranks": 0, "loss_rank_avg": 0.11462993174791336, "step": 2355, "valid_targets_mean": 8878.3, "valid_targets_min": 1276 }, { "epoch": 1.392330383480826, "grad_norm": 0.1971508256806736, "learning_rate": 3.6249782867848305e-05, "loss": 0.414, "loss_nan_ranks": 0, "loss_rank_avg": 0.12239646911621094, "step": 2360, "valid_targets_mean": 9431.4, "valid_targets_min": 1698 }, { "epoch": 1.3952802359882006, "grad_norm": 0.20606399593524655, "learning_rate": 3.622573538774227e-05, "loss": 0.4012, "loss_nan_ranks": 0, "loss_rank_avg": 0.1392350047826767, "step": 2365, "valid_targets_mean": 9600.9, "valid_targets_min": 2070 }, { "epoch": 1.3982300884955752, "grad_norm": 0.2006887696751807, "learning_rate": 3.620161908417711e-05, "loss": 0.413, "loss_nan_ranks": 0, "loss_rank_avg": 0.13277579843997955, "step": 2370, "valid_targets_mean": 9258.9, "valid_targets_min": 2322 }, { "epoch": 1.4011799410029497, "grad_norm": 0.2143607038766854, "learning_rate": 3.6177434059445094e-05, "loss": 0.4103, "loss_nan_ranks": 0, "loss_rank_avg": 0.14542219042778015, "step": 2375, "valid_targets_mean": 11005.1, "valid_targets_min": 1545 }, { "epoch": 1.4041297935103245, "grad_norm": 0.19051154679740112, "learning_rate": 3.615318041612998e-05, "loss": 0.4, "loss_nan_ranks": 0, "loss_rank_avg": 0.1375996470451355, "step": 2380, "valid_targets_mean": 10616.3, "valid_targets_min": 1536 }, { "epoch": 1.407079646017699, "grad_norm": 0.18605652703530892, "learning_rate": 3.612885825710659e-05, "loss": 0.4071, "loss_nan_ranks": 0, "loss_rank_avg": 0.16152793169021606, "step": 2385, "valid_targets_mean": 11486.4, "valid_targets_min": 518 }, { "epoch": 1.4100294985250739, "grad_norm": 0.1952639376391805, "learning_rate": 3.610446768554037e-05, "loss": 0.409, "loss_nan_ranks": 0, "loss_rank_avg": 0.13920962810516357, "step": 2390, "valid_targets_mean": 9616.6, "valid_targets_min": 1230 }, { "epoch": 1.4129793510324484, "grad_norm": 0.18753466403054453, "learning_rate": 3.608000880488694e-05, "loss": 0.403, "loss_nan_ranks": 0, "loss_rank_avg": 0.12460490316152573, "step": 2395, "valid_targets_mean": 8952.7, "valid_targets_min": 1587 }, { "epoch": 1.415929203539823, "grad_norm": 0.20751763054816902, "learning_rate": 3.6055481718891664e-05, "loss": 0.406, "loss_nan_ranks": 0, "loss_rank_avg": 0.15804365277290344, "step": 2400, "valid_targets_mean": 11414.2, "valid_targets_min": 3387 }, { "epoch": 1.4188790560471976, "grad_norm": 0.22456567480775044, "learning_rate": 3.603088653158919e-05, "loss": 0.4021, "loss_nan_ranks": 0, "loss_rank_avg": 0.18407636880874634, "step": 2405, "valid_targets_mean": 12465.5, "valid_targets_min": 1710 }, { "epoch": 1.4218289085545723, "grad_norm": 0.1897115624902503, "learning_rate": 3.6006223347303055e-05, "loss": 0.3964, "loss_nan_ranks": 0, "loss_rank_avg": 0.15461409091949463, "step": 2410, "valid_targets_mean": 10231.8, "valid_targets_min": 2259 }, { "epoch": 1.424778761061947, "grad_norm": 0.18663608515655314, "learning_rate": 3.5981492270645186e-05, "loss": 0.3995, "loss_nan_ranks": 0, "loss_rank_avg": 0.14762979745864868, "step": 2415, "valid_targets_mean": 13320.7, "valid_targets_min": 1376 }, { "epoch": 1.4277286135693215, "grad_norm": 0.18670962136513533, "learning_rate": 3.5956693406515514e-05, "loss": 0.3911, "loss_nan_ranks": 0, "loss_rank_avg": 0.10723703354597092, "step": 2420, "valid_targets_mean": 8426.0, "valid_targets_min": 1654 }, { "epoch": 1.4306784660766962, "grad_norm": 0.21110550552454987, "learning_rate": 3.5931826860101464e-05, "loss": 0.3964, "loss_nan_ranks": 0, "loss_rank_avg": 0.11997527629137039, "step": 2425, "valid_targets_mean": 8610.3, "valid_targets_min": 2335 }, { "epoch": 1.4336283185840708, "grad_norm": 0.1927862790503147, "learning_rate": 3.590689273687757e-05, "loss": 0.3953, "loss_nan_ranks": 0, "loss_rank_avg": 0.12968887388706207, "step": 2430, "valid_targets_mean": 9733.9, "valid_targets_min": 2604 }, { "epoch": 1.4365781710914454, "grad_norm": 0.18845839982483642, "learning_rate": 3.588189114260499e-05, "loss": 0.3929, "loss_nan_ranks": 0, "loss_rank_avg": 0.10686099529266357, "step": 2435, "valid_targets_mean": 7887.3, "valid_targets_min": 961 }, { "epoch": 1.43952802359882, "grad_norm": 0.1913639955229515, "learning_rate": 3.585682218333108e-05, "loss": 0.3973, "loss_nan_ranks": 0, "loss_rank_avg": 0.1498546153306961, "step": 2440, "valid_targets_mean": 12008.4, "valid_targets_min": 3631 }, { "epoch": 1.4424778761061947, "grad_norm": 0.19182583587682012, "learning_rate": 3.583168596538891e-05, "loss": 0.4034, "loss_nan_ranks": 0, "loss_rank_avg": 0.14093820750713348, "step": 2445, "valid_targets_mean": 11155.2, "valid_targets_min": 2731 }, { "epoch": 1.4454277286135693, "grad_norm": 0.20882085785585852, "learning_rate": 3.580648259539686e-05, "loss": 0.3912, "loss_nan_ranks": 0, "loss_rank_avg": 0.13466665148735046, "step": 2450, "valid_targets_mean": 10674.4, "valid_targets_min": 1317 }, { "epoch": 1.448377581120944, "grad_norm": 0.1999862673806767, "learning_rate": 3.578121218025814e-05, "loss": 0.395, "loss_nan_ranks": 0, "loss_rank_avg": 0.15615367889404297, "step": 2455, "valid_targets_mean": 11136.4, "valid_targets_min": 1890 }, { "epoch": 1.4513274336283186, "grad_norm": 0.21154653827787115, "learning_rate": 3.5755874827160324e-05, "loss": 0.3973, "loss_nan_ranks": 0, "loss_rank_avg": 0.16489741206169128, "step": 2460, "valid_targets_mean": 12538.8, "valid_targets_min": 1856 }, { "epoch": 1.4542772861356932, "grad_norm": 0.20865259658756602, "learning_rate": 3.573047064357492e-05, "loss": 0.4061, "loss_nan_ranks": 0, "loss_rank_avg": 0.15276436507701874, "step": 2465, "valid_targets_mean": 11351.3, "valid_targets_min": 1738 }, { "epoch": 1.4572271386430677, "grad_norm": 0.21166081933048564, "learning_rate": 3.5704999737256923e-05, "loss": 0.3961, "loss_nan_ranks": 0, "loss_rank_avg": 0.10980367660522461, "step": 2470, "valid_targets_mean": 9638.6, "valid_targets_min": 2769 }, { "epoch": 1.4601769911504425, "grad_norm": 0.20547766161198802, "learning_rate": 3.567946221624431e-05, "loss": 0.3965, "loss_nan_ranks": 0, "loss_rank_avg": 0.13496387004852295, "step": 2475, "valid_targets_mean": 10217.3, "valid_targets_min": 1867 }, { "epoch": 1.463126843657817, "grad_norm": 0.20272356539276168, "learning_rate": 3.5653858188857637e-05, "loss": 0.3933, "loss_nan_ranks": 0, "loss_rank_avg": 0.13152998685836792, "step": 2480, "valid_targets_mean": 10830.1, "valid_targets_min": 2056 }, { "epoch": 1.4660766961651919, "grad_norm": 0.1928236170984883, "learning_rate": 3.5628187763699545e-05, "loss": 0.3916, "loss_nan_ranks": 0, "loss_rank_avg": 0.10376954078674316, "step": 2485, "valid_targets_mean": 8065.7, "valid_targets_min": 2250 }, { "epoch": 1.4690265486725664, "grad_norm": 0.20906690195005687, "learning_rate": 3.560245104965431e-05, "loss": 0.3981, "loss_nan_ranks": 0, "loss_rank_avg": 0.1269378960132599, "step": 2490, "valid_targets_mean": 10655.2, "valid_targets_min": 2555 }, { "epoch": 1.471976401179941, "grad_norm": 0.2046303448144277, "learning_rate": 3.5576648155887366e-05, "loss": 0.395, "loss_nan_ranks": 0, "loss_rank_avg": 0.14142167568206787, "step": 2495, "valid_targets_mean": 11071.5, "valid_targets_min": 860 }, { "epoch": 1.4749262536873156, "grad_norm": 0.20599363038669596, "learning_rate": 3.555077919184489e-05, "loss": 0.3894, "loss_nan_ranks": 0, "loss_rank_avg": 0.15158352255821228, "step": 2500, "valid_targets_mean": 11408.9, "valid_targets_min": 2015 }, { "epoch": 1.4778761061946903, "grad_norm": 0.1788204164478249, "learning_rate": 3.552484426725329e-05, "loss": 0.3966, "loss_nan_ranks": 0, "loss_rank_avg": 0.10846086591482162, "step": 2505, "valid_targets_mean": 9568.1, "valid_targets_min": 1913 }, { "epoch": 1.480825958702065, "grad_norm": 0.1923751273446749, "learning_rate": 3.549884349211874e-05, "loss": 0.4, "loss_nan_ranks": 0, "loss_rank_avg": 0.12155988812446594, "step": 2510, "valid_targets_mean": 9056.0, "valid_targets_min": 1585 }, { "epoch": 1.4837758112094395, "grad_norm": 0.20639266762873654, "learning_rate": 3.5472776976726734e-05, "loss": 0.393, "loss_nan_ranks": 0, "loss_rank_avg": 0.15222719311714172, "step": 2515, "valid_targets_mean": 13044.3, "valid_targets_min": 2160 }, { "epoch": 1.4867256637168142, "grad_norm": 0.22266275834029062, "learning_rate": 3.5446644831641614e-05, "loss": 0.3987, "loss_nan_ranks": 0, "loss_rank_avg": 0.10895134508609772, "step": 2520, "valid_targets_mean": 9486.9, "valid_targets_min": 1543 }, { "epoch": 1.4896755162241888, "grad_norm": 0.21384271957343456, "learning_rate": 3.54204471677061e-05, "loss": 0.3968, "loss_nan_ranks": 0, "loss_rank_avg": 0.11045604944229126, "step": 2525, "valid_targets_mean": 9637.9, "valid_targets_min": 1453 }, { "epoch": 1.4926253687315634, "grad_norm": 0.21759058269956286, "learning_rate": 3.539418409604082e-05, "loss": 0.3988, "loss_nan_ranks": 0, "loss_rank_avg": 0.1656768023967743, "step": 2530, "valid_targets_mean": 11221.1, "valid_targets_min": 1861 }, { "epoch": 1.495575221238938, "grad_norm": 0.22306265795961336, "learning_rate": 3.536785572804383e-05, "loss": 0.3984, "loss_nan_ranks": 0, "loss_rank_avg": 0.11005926877260208, "step": 2535, "valid_targets_mean": 7896.7, "valid_targets_min": 1601 }, { "epoch": 1.4985250737463127, "grad_norm": 0.18758579596156683, "learning_rate": 3.534146217539016e-05, "loss": 0.3996, "loss_nan_ranks": 0, "loss_rank_avg": 0.14364221692085266, "step": 2540, "valid_targets_mean": 11206.3, "valid_targets_min": 2567 }, { "epoch": 1.5014749262536873, "grad_norm": 0.2141138193508478, "learning_rate": 3.531500355003131e-05, "loss": 0.3885, "loss_nan_ranks": 0, "loss_rank_avg": 0.13702622056007385, "step": 2545, "valid_targets_mean": 9940.7, "valid_targets_min": 1487 }, { "epoch": 1.504424778761062, "grad_norm": 0.20617771305195218, "learning_rate": 3.528847996419481e-05, "loss": 0.3954, "loss_nan_ranks": 0, "loss_rank_avg": 0.1305457502603531, "step": 2550, "valid_targets_mean": 9426.9, "valid_targets_min": 1920 }, { "epoch": 1.5073746312684366, "grad_norm": 0.22125729323813947, "learning_rate": 3.526189153038372e-05, "loss": 0.3979, "loss_nan_ranks": 0, "loss_rank_avg": 0.11197060346603394, "step": 2555, "valid_targets_mean": 7889.9, "valid_targets_min": 1997 }, { "epoch": 1.5103244837758112, "grad_norm": 0.20228311822774708, "learning_rate": 3.523523836137617e-05, "loss": 0.3895, "loss_nan_ranks": 0, "loss_rank_avg": 0.10877414047718048, "step": 2560, "valid_targets_mean": 8702.3, "valid_targets_min": 2150 }, { "epoch": 1.5132743362831858, "grad_norm": 0.1924749677621517, "learning_rate": 3.5208520570224865e-05, "loss": 0.3871, "loss_nan_ranks": 0, "loss_rank_avg": 0.15349164605140686, "step": 2565, "valid_targets_mean": 11533.9, "valid_targets_min": 1871 }, { "epoch": 1.5162241887905603, "grad_norm": 0.22515634811956609, "learning_rate": 3.5181738270256595e-05, "loss": 0.3818, "loss_nan_ranks": 0, "loss_rank_avg": 0.12597164511680603, "step": 2570, "valid_targets_mean": 10099.0, "valid_targets_min": 2449 }, { "epoch": 1.519174041297935, "grad_norm": 0.20497870920040415, "learning_rate": 3.5154891575071816e-05, "loss": 0.3881, "loss_nan_ranks": 0, "loss_rank_avg": 0.1445295214653015, "step": 2575, "valid_targets_mean": 10613.0, "valid_targets_min": 1767 }, { "epoch": 1.5221238938053099, "grad_norm": 0.19355635363854126, "learning_rate": 3.512798059854409e-05, "loss": 0.3984, "loss_nan_ranks": 0, "loss_rank_avg": 0.132507786154747, "step": 2580, "valid_targets_mean": 9735.8, "valid_targets_min": 1444 }, { "epoch": 1.5250737463126844, "grad_norm": 0.19422329710559866, "learning_rate": 3.510100545481964e-05, "loss": 0.4035, "loss_nan_ranks": 0, "loss_rank_avg": 0.1423739790916443, "step": 2585, "valid_targets_mean": 12089.4, "valid_targets_min": 1483 }, { "epoch": 1.528023598820059, "grad_norm": 0.20363806304130708, "learning_rate": 3.507396625831687e-05, "loss": 0.3989, "loss_nan_ranks": 0, "loss_rank_avg": 0.1374133825302124, "step": 2590, "valid_targets_mean": 9522.6, "valid_targets_min": 747 }, { "epoch": 1.5309734513274336, "grad_norm": 0.20209241704309913, "learning_rate": 3.504686312372587e-05, "loss": 0.3859, "loss_nan_ranks": 0, "loss_rank_avg": 0.09004460275173187, "step": 2595, "valid_targets_mean": 6589.8, "valid_targets_min": 1001 }, { "epoch": 1.5339233038348081, "grad_norm": 0.20549443606621662, "learning_rate": 3.5019696166007936e-05, "loss": 0.4004, "loss_nan_ranks": 0, "loss_rank_avg": 0.1255984753370285, "step": 2600, "valid_targets_mean": 8307.7, "valid_targets_min": 1442 }, { "epoch": 1.536873156342183, "grad_norm": 0.189294083469522, "learning_rate": 3.499246550039506e-05, "loss": 0.3899, "loss_nan_ranks": 0, "loss_rank_avg": 0.12242449820041656, "step": 2605, "valid_targets_mean": 9174.5, "valid_targets_min": 2099 }, { "epoch": 1.5398230088495575, "grad_norm": 0.223437837939735, "learning_rate": 3.4965171242389485e-05, "loss": 0.3918, "loss_nan_ranks": 0, "loss_rank_avg": 0.13413646817207336, "step": 2610, "valid_targets_mean": 9977.2, "valid_targets_min": 1385 }, { "epoch": 1.5427728613569323, "grad_norm": 0.1946804583428626, "learning_rate": 3.4937813507763155e-05, "loss": 0.3947, "loss_nan_ranks": 0, "loss_rank_avg": 0.10855253040790558, "step": 2615, "valid_targets_mean": 8322.1, "valid_targets_min": 2131 }, { "epoch": 1.5457227138643068, "grad_norm": 0.1996768663383723, "learning_rate": 3.491039241255729e-05, "loss": 0.4003, "loss_nan_ranks": 0, "loss_rank_avg": 0.13678157329559326, "step": 2620, "valid_targets_mean": 10406.2, "valid_targets_min": 1407 }, { "epoch": 1.5486725663716814, "grad_norm": 0.19472478670325657, "learning_rate": 3.488290807308186e-05, "loss": 0.3882, "loss_nan_ranks": 0, "loss_rank_avg": 0.14884641766548157, "step": 2625, "valid_targets_mean": 12493.9, "valid_targets_min": 2457 }, { "epoch": 1.551622418879056, "grad_norm": 0.19161386368368877, "learning_rate": 3.485536060591507e-05, "loss": 0.3876, "loss_nan_ranks": 0, "loss_rank_avg": 0.11435461044311523, "step": 2630, "valid_targets_mean": 9960.1, "valid_targets_min": 2052 }, { "epoch": 1.5545722713864307, "grad_norm": 0.2149406169132456, "learning_rate": 3.482775012790289e-05, "loss": 0.4006, "loss_nan_ranks": 0, "loss_rank_avg": 0.11524064838886261, "step": 2635, "valid_targets_mean": 8378.8, "valid_targets_min": 1560 }, { "epoch": 1.5575221238938053, "grad_norm": 0.1976686009933042, "learning_rate": 3.48000767561586e-05, "loss": 0.3914, "loss_nan_ranks": 0, "loss_rank_avg": 0.11932376027107239, "step": 2640, "valid_targets_mean": 9472.5, "valid_targets_min": 2484 }, { "epoch": 1.56047197640118, "grad_norm": 0.1986083979866418, "learning_rate": 3.47723406080622e-05, "loss": 0.3959, "loss_nan_ranks": 0, "loss_rank_avg": 0.12804947793483734, "step": 2645, "valid_targets_mean": 10299.2, "valid_targets_min": 878 }, { "epoch": 1.5634218289085546, "grad_norm": 0.19875678796513913, "learning_rate": 3.474454180125998e-05, "loss": 0.3951, "loss_nan_ranks": 0, "loss_rank_avg": 0.138924703001976, "step": 2650, "valid_targets_mean": 10887.9, "valid_targets_min": 2125 }, { "epoch": 1.5663716814159292, "grad_norm": 0.208010638626533, "learning_rate": 3.4716680453664034e-05, "loss": 0.3918, "loss_nan_ranks": 0, "loss_rank_avg": 0.16505074501037598, "step": 2655, "valid_targets_mean": 12573.0, "valid_targets_min": 2048 }, { "epoch": 1.5693215339233038, "grad_norm": 0.2113806560061952, "learning_rate": 3.4688756683451687e-05, "loss": 0.3976, "loss_nan_ranks": 0, "loss_rank_avg": 0.1205722764134407, "step": 2660, "valid_targets_mean": 9179.3, "valid_targets_min": 1147 }, { "epoch": 1.5722713864306783, "grad_norm": 0.19990820921293187, "learning_rate": 3.466077060906507e-05, "loss": 0.3867, "loss_nan_ranks": 0, "loss_rank_avg": 0.13424262404441833, "step": 2665, "valid_targets_mean": 10706.8, "valid_targets_min": 1593 }, { "epoch": 1.575221238938053, "grad_norm": 0.2035721175968825, "learning_rate": 3.4632722349210554e-05, "loss": 0.3915, "loss_nan_ranks": 0, "loss_rank_avg": 0.1269957721233368, "step": 2670, "valid_targets_mean": 9218.1, "valid_targets_min": 2137 }, { "epoch": 1.5781710914454279, "grad_norm": 0.19354321221920615, "learning_rate": 3.4604612022858306e-05, "loss": 0.3947, "loss_nan_ranks": 0, "loss_rank_avg": 0.14735949039459229, "step": 2675, "valid_targets_mean": 11224.7, "valid_targets_min": 1822 }, { "epoch": 1.5811209439528024, "grad_norm": 0.23544262059333004, "learning_rate": 3.457643974924174e-05, "loss": 0.3909, "loss_nan_ranks": 0, "loss_rank_avg": 0.1378946602344513, "step": 2680, "valid_targets_mean": 11156.6, "valid_targets_min": 1606 }, { "epoch": 1.584070796460177, "grad_norm": 0.20303218282604443, "learning_rate": 3.4548205647857035e-05, "loss": 0.3902, "loss_nan_ranks": 0, "loss_rank_avg": 0.1464405059814453, "step": 2685, "valid_targets_mean": 10960.1, "valid_targets_min": 1556 }, { "epoch": 1.5870206489675516, "grad_norm": 0.19961288753135736, "learning_rate": 3.451990983846262e-05, "loss": 0.3945, "loss_nan_ranks": 0, "loss_rank_avg": 0.11880732327699661, "step": 2690, "valid_targets_mean": 9461.7, "valid_targets_min": 1929 }, { "epoch": 1.5899705014749261, "grad_norm": 0.22630238402236566, "learning_rate": 3.4491552441078654e-05, "loss": 0.3995, "loss_nan_ranks": 0, "loss_rank_avg": 0.13695894181728363, "step": 2695, "valid_targets_mean": 9745.5, "valid_targets_min": 1581 }, { "epoch": 1.592920353982301, "grad_norm": 0.22240211592749506, "learning_rate": 3.446313357598655e-05, "loss": 0.3871, "loss_nan_ranks": 0, "loss_rank_avg": 0.13270913064479828, "step": 2700, "valid_targets_mean": 10080.6, "valid_targets_min": 2923 }, { "epoch": 1.5958702064896755, "grad_norm": 0.20453988006624954, "learning_rate": 3.443465336372842e-05, "loss": 0.3861, "loss_nan_ranks": 0, "loss_rank_avg": 0.12554414570331573, "step": 2705, "valid_targets_mean": 8127.2, "valid_targets_min": 1571 }, { "epoch": 1.5988200589970503, "grad_norm": 0.19769030059580794, "learning_rate": 3.4406111925106596e-05, "loss": 0.3961, "loss_nan_ranks": 0, "loss_rank_avg": 0.12743881344795227, "step": 2710, "valid_targets_mean": 10449.8, "valid_targets_min": 1912 }, { "epoch": 1.6017699115044248, "grad_norm": 0.21819544409639086, "learning_rate": 3.437750938118312e-05, "loss": 0.3941, "loss_nan_ranks": 0, "loss_rank_avg": 0.11632522940635681, "step": 2715, "valid_targets_mean": 8532.2, "valid_targets_min": 1791 }, { "epoch": 1.6047197640117994, "grad_norm": 0.19796092409366658, "learning_rate": 3.434884585327922e-05, "loss": 0.3957, "loss_nan_ranks": 0, "loss_rank_avg": 0.13927127420902252, "step": 2720, "valid_targets_mean": 11387.8, "valid_targets_min": 2003 }, { "epoch": 1.607669616519174, "grad_norm": 0.20029936745164265, "learning_rate": 3.4320121462974766e-05, "loss": 0.3955, "loss_nan_ranks": 0, "loss_rank_avg": 0.12672072649002075, "step": 2725, "valid_targets_mean": 9229.9, "valid_targets_min": 2522 }, { "epoch": 1.6106194690265485, "grad_norm": 0.1872592104723706, "learning_rate": 3.429133633210782e-05, "loss": 0.392, "loss_nan_ranks": 0, "loss_rank_avg": 0.1504121869802475, "step": 2730, "valid_targets_mean": 12198.8, "valid_targets_min": 1675 }, { "epoch": 1.6135693215339233, "grad_norm": 0.186467265613796, "learning_rate": 3.426249058277407e-05, "loss": 0.3946, "loss_nan_ranks": 0, "loss_rank_avg": 0.12724050879478455, "step": 2735, "valid_targets_mean": 10017.0, "valid_targets_min": 1776 }, { "epoch": 1.616519174041298, "grad_norm": 0.17773999259250345, "learning_rate": 3.423358433732631e-05, "loss": 0.3929, "loss_nan_ranks": 0, "loss_rank_avg": 0.1229085773229599, "step": 2740, "valid_targets_mean": 10342.0, "valid_targets_min": 1961 }, { "epoch": 1.6194690265486726, "grad_norm": 0.17658621399418326, "learning_rate": 3.420461771837396e-05, "loss": 0.3936, "loss_nan_ranks": 0, "loss_rank_avg": 0.12835684418678284, "step": 2745, "valid_targets_mean": 9962.6, "valid_targets_min": 2405 }, { "epoch": 1.6224188790560472, "grad_norm": 0.20031625945910475, "learning_rate": 3.4175590848782495e-05, "loss": 0.3938, "loss_nan_ranks": 0, "loss_rank_avg": 0.1081707626581192, "step": 2750, "valid_targets_mean": 8304.7, "valid_targets_min": 1978 }, { "epoch": 1.6253687315634218, "grad_norm": 0.20896474694567252, "learning_rate": 3.414650385167298e-05, "loss": 0.3912, "loss_nan_ranks": 0, "loss_rank_avg": 0.14379850029945374, "step": 2755, "valid_targets_mean": 12342.4, "valid_targets_min": 2187 }, { "epoch": 1.6283185840707963, "grad_norm": 0.20182015995158958, "learning_rate": 3.4117356850421485e-05, "loss": 0.3922, "loss_nan_ranks": 0, "loss_rank_avg": 0.12928926944732666, "step": 2760, "valid_targets_mean": 9165.0, "valid_targets_min": 832 }, { "epoch": 1.631268436578171, "grad_norm": 0.20103812781549815, "learning_rate": 3.408814996865863e-05, "loss": 0.3928, "loss_nan_ranks": 0, "loss_rank_avg": 0.1281728893518448, "step": 2765, "valid_targets_mean": 10573.9, "valid_targets_min": 2386 }, { "epoch": 1.6342182890855457, "grad_norm": 0.18029541909036872, "learning_rate": 3.4058883330268995e-05, "loss": 0.4005, "loss_nan_ranks": 0, "loss_rank_avg": 0.1050175353884697, "step": 2770, "valid_targets_mean": 8261.4, "valid_targets_min": 1439 }, { "epoch": 1.6371681415929205, "grad_norm": 0.2012413957828967, "learning_rate": 3.402955705939065e-05, "loss": 0.4041, "loss_nan_ranks": 0, "loss_rank_avg": 0.14012792706489563, "step": 2775, "valid_targets_mean": 9847.7, "valid_targets_min": 1767 }, { "epoch": 1.640117994100295, "grad_norm": 0.19178800924013567, "learning_rate": 3.400017128041459e-05, "loss": 0.3934, "loss_nan_ranks": 0, "loss_rank_avg": 0.15238690376281738, "step": 2780, "valid_targets_mean": 13030.2, "valid_targets_min": 2483 }, { "epoch": 1.6430678466076696, "grad_norm": 0.19419884624460312, "learning_rate": 3.397072611798421e-05, "loss": 0.3903, "loss_nan_ranks": 0, "loss_rank_avg": 0.11771540343761444, "step": 2785, "valid_targets_mean": 9731.1, "valid_targets_min": 1703 }, { "epoch": 1.6460176991150441, "grad_norm": 0.19910500058317934, "learning_rate": 3.394122169699482e-05, "loss": 0.3925, "loss_nan_ranks": 0, "loss_rank_avg": 0.13526403903961182, "step": 2790, "valid_targets_mean": 10780.1, "valid_targets_min": 1649 }, { "epoch": 1.648967551622419, "grad_norm": 0.18202549756014805, "learning_rate": 3.3911658142593044e-05, "loss": 0.3993, "loss_nan_ranks": 0, "loss_rank_avg": 0.13593779504299164, "step": 2795, "valid_targets_mean": 10743.4, "valid_targets_min": 1801 }, { "epoch": 1.6519174041297935, "grad_norm": 0.19194239646892167, "learning_rate": 3.388203558017636e-05, "loss": 0.4012, "loss_nan_ranks": 0, "loss_rank_avg": 0.10597368329763412, "step": 2800, "valid_targets_mean": 9102.6, "valid_targets_min": 1830 }, { "epoch": 1.6548672566371683, "grad_norm": 0.1852839602364545, "learning_rate": 3.3852354135392534e-05, "loss": 0.3906, "loss_nan_ranks": 0, "loss_rank_avg": 0.11317931115627289, "step": 2805, "valid_targets_mean": 9400.9, "valid_targets_min": 1853 }, { "epoch": 1.6578171091445428, "grad_norm": 0.19090895235342278, "learning_rate": 3.382261393413905e-05, "loss": 0.3841, "loss_nan_ranks": 0, "loss_rank_avg": 0.1284770369529724, "step": 2810, "valid_targets_mean": 10114.0, "valid_targets_min": 2144 }, { "epoch": 1.6607669616519174, "grad_norm": 0.2029009930014119, "learning_rate": 3.3792815102562646e-05, "loss": 0.3825, "loss_nan_ranks": 0, "loss_rank_avg": 0.13038460910320282, "step": 2815, "valid_targets_mean": 9553.2, "valid_targets_min": 2181 }, { "epoch": 1.663716814159292, "grad_norm": 0.20663093892181367, "learning_rate": 3.3762957767058764e-05, "loss": 0.3948, "loss_nan_ranks": 0, "loss_rank_avg": 0.13431856036186218, "step": 2820, "valid_targets_mean": 9748.7, "valid_targets_min": 856 }, { "epoch": 1.6666666666666665, "grad_norm": 0.18749624837860834, "learning_rate": 3.373304205427096e-05, "loss": 0.3959, "loss_nan_ranks": 0, "loss_rank_avg": 0.14476144313812256, "step": 2825, "valid_targets_mean": 12207.3, "valid_targets_min": 2941 }, { "epoch": 1.6696165191740413, "grad_norm": 0.188979400398134, "learning_rate": 3.370306809109043e-05, "loss": 0.3919, "loss_nan_ranks": 0, "loss_rank_avg": 0.11705923080444336, "step": 2830, "valid_targets_mean": 9607.7, "valid_targets_min": 1480 }, { "epoch": 1.672566371681416, "grad_norm": 0.1822789862555373, "learning_rate": 3.367303600465543e-05, "loss": 0.4009, "loss_nan_ranks": 0, "loss_rank_avg": 0.12379142642021179, "step": 2835, "valid_targets_mean": 10516.6, "valid_targets_min": 1750 }, { "epoch": 1.6755162241887906, "grad_norm": 0.19514377116590026, "learning_rate": 3.364294592235077e-05, "loss": 0.393, "loss_nan_ranks": 0, "loss_rank_avg": 0.1143941879272461, "step": 2840, "valid_targets_mean": 9166.2, "valid_targets_min": 2342 }, { "epoch": 1.6784660766961652, "grad_norm": 0.1995337838648031, "learning_rate": 3.361279797180724e-05, "loss": 0.3945, "loss_nan_ranks": 0, "loss_rank_avg": 0.15227705240249634, "step": 2845, "valid_targets_mean": 10198.2, "valid_targets_min": 1888 }, { "epoch": 1.6814159292035398, "grad_norm": 0.19203783654469914, "learning_rate": 3.358259228090109e-05, "loss": 0.3936, "loss_nan_ranks": 0, "loss_rank_avg": 0.13235729932785034, "step": 2850, "valid_targets_mean": 9976.0, "valid_targets_min": 1591 }, { "epoch": 1.6843657817109143, "grad_norm": 0.1976180105398448, "learning_rate": 3.3552328977753506e-05, "loss": 0.3903, "loss_nan_ranks": 0, "loss_rank_avg": 0.1187744140625, "step": 2855, "valid_targets_mean": 8667.3, "valid_targets_min": 1636 }, { "epoch": 1.6873156342182891, "grad_norm": 0.19202804434606036, "learning_rate": 3.3522008190730004e-05, "loss": 0.394, "loss_nan_ranks": 0, "loss_rank_avg": 0.15723806619644165, "step": 2860, "valid_targets_mean": 11671.9, "valid_targets_min": 1372 }, { "epoch": 1.6902654867256637, "grad_norm": 0.19925777636796418, "learning_rate": 3.349163004843995e-05, "loss": 0.3946, "loss_nan_ranks": 0, "loss_rank_avg": 0.11505947262048721, "step": 2865, "valid_targets_mean": 8705.5, "valid_targets_min": 788 }, { "epoch": 1.6932153392330385, "grad_norm": 0.20575461925435287, "learning_rate": 3.346119467973598e-05, "loss": 0.3958, "loss_nan_ranks": 0, "loss_rank_avg": 0.13286572694778442, "step": 2870, "valid_targets_mean": 10789.9, "valid_targets_min": 1629 }, { "epoch": 1.696165191740413, "grad_norm": 0.195789852899565, "learning_rate": 3.343070221371347e-05, "loss": 0.3993, "loss_nan_ranks": 0, "loss_rank_avg": 0.12431154400110245, "step": 2875, "valid_targets_mean": 9820.9, "valid_targets_min": 2079 }, { "epoch": 1.6991150442477876, "grad_norm": 0.19085369231753674, "learning_rate": 3.340015277970998e-05, "loss": 0.3911, "loss_nan_ranks": 0, "loss_rank_avg": 0.11652038991451263, "step": 2880, "valid_targets_mean": 9519.0, "valid_targets_min": 1443 }, { "epoch": 1.7020648967551621, "grad_norm": 0.18434544444359915, "learning_rate": 3.33695465073047e-05, "loss": 0.3913, "loss_nan_ranks": 0, "loss_rank_avg": 0.12810981273651123, "step": 2885, "valid_targets_mean": 11148.6, "valid_targets_min": 2844 }, { "epoch": 1.7050147492625367, "grad_norm": 0.19182102586594751, "learning_rate": 3.3338883526317915e-05, "loss": 0.3953, "loss_nan_ranks": 0, "loss_rank_avg": 0.16361527144908905, "step": 2890, "valid_targets_mean": 11772.3, "valid_targets_min": 2041 }, { "epoch": 1.7079646017699115, "grad_norm": 0.18685253615301253, "learning_rate": 3.3308163966810446e-05, "loss": 0.3908, "loss_nan_ranks": 0, "loss_rank_avg": 0.12067534029483795, "step": 2895, "valid_targets_mean": 9464.2, "valid_targets_min": 2006 }, { "epoch": 1.7109144542772863, "grad_norm": 0.18789090242459708, "learning_rate": 3.3277387959083086e-05, "loss": 0.3959, "loss_nan_ranks": 0, "loss_rank_avg": 0.11749487370252609, "step": 2900, "valid_targets_mean": 10115.8, "valid_targets_min": 2033 }, { "epoch": 1.7138643067846608, "grad_norm": 0.19142845485695198, "learning_rate": 3.324655563367608e-05, "loss": 0.3865, "loss_nan_ranks": 0, "loss_rank_avg": 0.10298315435647964, "step": 2905, "valid_targets_mean": 8914.2, "valid_targets_min": 1829 }, { "epoch": 1.7168141592920354, "grad_norm": 0.19266959518709054, "learning_rate": 3.3215667121368536e-05, "loss": 0.3883, "loss_nan_ranks": 0, "loss_rank_avg": 0.14745637774467468, "step": 2910, "valid_targets_mean": 11594.1, "valid_targets_min": 1466 }, { "epoch": 1.71976401179941, "grad_norm": 0.19916980056432732, "learning_rate": 3.3184722553177886e-05, "loss": 0.3887, "loss_nan_ranks": 0, "loss_rank_avg": 0.13046494126319885, "step": 2915, "valid_targets_mean": 10735.3, "valid_targets_min": 1786 }, { "epoch": 1.7227138643067845, "grad_norm": 0.18897005780526288, "learning_rate": 3.3153722060359345e-05, "loss": 0.3903, "loss_nan_ranks": 0, "loss_rank_avg": 0.13529415428638458, "step": 2920, "valid_targets_mean": 11454.9, "valid_targets_min": 2305 }, { "epoch": 1.7256637168141593, "grad_norm": 0.19134823925494687, "learning_rate": 3.312266577440533e-05, "loss": 0.3965, "loss_nan_ranks": 0, "loss_rank_avg": 0.11531375348567963, "step": 2925, "valid_targets_mean": 9119.2, "valid_targets_min": 933 }, { "epoch": 1.7286135693215339, "grad_norm": 0.2730744331613668, "learning_rate": 3.30915538270449e-05, "loss": 0.3965, "loss_nan_ranks": 0, "loss_rank_avg": 0.11113665252923965, "step": 2930, "valid_targets_mean": 9410.8, "valid_targets_min": 1837 }, { "epoch": 1.7315634218289087, "grad_norm": 0.1840969708035178, "learning_rate": 3.306038635024323e-05, "loss": 0.3881, "loss_nan_ranks": 0, "loss_rank_avg": 0.1135941594839096, "step": 2935, "valid_targets_mean": 9461.3, "valid_targets_min": 1841 }, { "epoch": 1.7345132743362832, "grad_norm": 0.19348029772223146, "learning_rate": 3.302916347620102e-05, "loss": 0.393, "loss_nan_ranks": 0, "loss_rank_avg": 0.1548248678445816, "step": 2940, "valid_targets_mean": 12400.2, "valid_targets_min": 2042 }, { "epoch": 1.7374631268436578, "grad_norm": 0.18252156946800238, "learning_rate": 3.299788533735393e-05, "loss": 0.3936, "loss_nan_ranks": 0, "loss_rank_avg": 0.15255288779735565, "step": 2945, "valid_targets_mean": 12530.3, "valid_targets_min": 2926 }, { "epoch": 1.7404129793510323, "grad_norm": 0.18125067932284578, "learning_rate": 3.296655206637205e-05, "loss": 0.3924, "loss_nan_ranks": 0, "loss_rank_avg": 0.1404009312391281, "step": 2950, "valid_targets_mean": 10509.6, "valid_targets_min": 649 }, { "epoch": 1.7433628318584071, "grad_norm": 0.17493040232422627, "learning_rate": 3.293516379615933e-05, "loss": 0.3896, "loss_nan_ranks": 0, "loss_rank_avg": 0.12707272171974182, "step": 2955, "valid_targets_mean": 9454.0, "valid_targets_min": 2003 }, { "epoch": 1.7463126843657817, "grad_norm": 0.19612154842958732, "learning_rate": 3.2903720659852973e-05, "loss": 0.3929, "loss_nan_ranks": 0, "loss_rank_avg": 0.12193826586008072, "step": 2960, "valid_targets_mean": 9103.6, "valid_targets_min": 1608 }, { "epoch": 1.7492625368731565, "grad_norm": 0.18257690930740766, "learning_rate": 3.287222279082294e-05, "loss": 0.3893, "loss_nan_ranks": 0, "loss_rank_avg": 0.12374929338693619, "step": 2965, "valid_targets_mean": 9436.6, "valid_targets_min": 2137 }, { "epoch": 1.752212389380531, "grad_norm": 0.18167704644036603, "learning_rate": 3.2840670322671316e-05, "loss": 0.3882, "loss_nan_ranks": 0, "loss_rank_avg": 0.12390658259391785, "step": 2970, "valid_targets_mean": 9747.0, "valid_targets_min": 1135 }, { "epoch": 1.7551622418879056, "grad_norm": 0.1965094558740685, "learning_rate": 3.28090633892318e-05, "loss": 0.3937, "loss_nan_ranks": 0, "loss_rank_avg": 0.1370033472776413, "step": 2975, "valid_targets_mean": 10079.6, "valid_targets_min": 2286 }, { "epoch": 1.7581120943952802, "grad_norm": 0.19269690309905338, "learning_rate": 3.277740212456909e-05, "loss": 0.3996, "loss_nan_ranks": 0, "loss_rank_avg": 0.1356833130121231, "step": 2980, "valid_targets_mean": 10582.6, "valid_targets_min": 1657 }, { "epoch": 1.7610619469026547, "grad_norm": 0.1952694338389336, "learning_rate": 3.2745686662978355e-05, "loss": 0.3977, "loss_nan_ranks": 0, "loss_rank_avg": 0.1223859190940857, "step": 2985, "valid_targets_mean": 8869.7, "valid_targets_min": 1883 }, { "epoch": 1.7640117994100295, "grad_norm": 0.20350950152630534, "learning_rate": 3.2713917138984634e-05, "loss": 0.3838, "loss_nan_ranks": 0, "loss_rank_avg": 0.13408294320106506, "step": 2990, "valid_targets_mean": 10999.8, "valid_targets_min": 1608 }, { "epoch": 1.7669616519174043, "grad_norm": 0.19334915963802546, "learning_rate": 3.268209368734229e-05, "loss": 0.392, "loss_nan_ranks": 0, "loss_rank_avg": 0.129969522356987, "step": 2995, "valid_targets_mean": 10845.2, "valid_targets_min": 1769 }, { "epoch": 1.7699115044247788, "grad_norm": 0.18099169248601887, "learning_rate": 3.265021644303441e-05, "loss": 0.3905, "loss_nan_ranks": 0, "loss_rank_avg": 0.13780558109283447, "step": 3000, "valid_targets_mean": 11583.4, "valid_targets_min": 2726 }, { "epoch": 1.7728613569321534, "grad_norm": 0.1896969180469815, "learning_rate": 3.261828554127227e-05, "loss": 0.3881, "loss_nan_ranks": 0, "loss_rank_avg": 0.11599138379096985, "step": 3005, "valid_targets_mean": 9023.2, "valid_targets_min": 1719 }, { "epoch": 1.775811209439528, "grad_norm": 0.19063468212727738, "learning_rate": 3.258630111749474e-05, "loss": 0.3905, "loss_nan_ranks": 0, "loss_rank_avg": 0.15030834078788757, "step": 3010, "valid_targets_mean": 11621.1, "valid_targets_min": 1627 }, { "epoch": 1.7787610619469025, "grad_norm": 0.20924962814002224, "learning_rate": 3.255426330736768e-05, "loss": 0.3865, "loss_nan_ranks": 0, "loss_rank_avg": 0.15606912970542908, "step": 3015, "valid_targets_mean": 10227.8, "valid_targets_min": 2542 }, { "epoch": 1.7817109144542773, "grad_norm": 0.18928326396508474, "learning_rate": 3.252217224678342e-05, "loss": 0.3839, "loss_nan_ranks": 0, "loss_rank_avg": 0.12054719030857086, "step": 3020, "valid_targets_mean": 8847.1, "valid_targets_min": 2962 }, { "epoch": 1.7846607669616519, "grad_norm": 0.20098696420819967, "learning_rate": 3.249002807186016e-05, "loss": 0.3922, "loss_nan_ranks": 0, "loss_rank_avg": 0.137400820851326, "step": 3025, "valid_targets_mean": 11824.5, "valid_targets_min": 2336 }, { "epoch": 1.7876106194690267, "grad_norm": 0.19025621382762697, "learning_rate": 3.2457830918941384e-05, "loss": 0.3943, "loss_nan_ranks": 0, "loss_rank_avg": 0.1631835699081421, "step": 3030, "valid_targets_mean": 13422.8, "valid_targets_min": 2469 }, { "epoch": 1.7905604719764012, "grad_norm": 0.1774868607110602, "learning_rate": 3.242558092459529e-05, "loss": 0.3915, "loss_nan_ranks": 0, "loss_rank_avg": 0.09473612904548645, "step": 3035, "valid_targets_mean": 8039.5, "valid_targets_min": 1011 }, { "epoch": 1.7935103244837758, "grad_norm": 0.18665228670374476, "learning_rate": 3.2393278225614205e-05, "loss": 0.3901, "loss_nan_ranks": 0, "loss_rank_avg": 0.10702696442604065, "step": 3040, "valid_targets_mean": 8162.9, "valid_targets_min": 1768 }, { "epoch": 1.7964601769911503, "grad_norm": 0.2199654108080235, "learning_rate": 3.2360922959014014e-05, "loss": 0.3902, "loss_nan_ranks": 0, "loss_rank_avg": 0.1379621922969818, "step": 3045, "valid_targets_mean": 9680.6, "valid_targets_min": 1517 }, { "epoch": 1.799410029498525, "grad_norm": 0.22475118561788887, "learning_rate": 3.232851526203359e-05, "loss": 0.3902, "loss_nan_ranks": 0, "loss_rank_avg": 0.1337410807609558, "step": 3050, "valid_targets_mean": 10204.0, "valid_targets_min": 1856 }, { "epoch": 1.8023598820058997, "grad_norm": 0.21577531073711217, "learning_rate": 3.229605527213415e-05, "loss": 0.3882, "loss_nan_ranks": 0, "loss_rank_avg": 0.1492527723312378, "step": 3055, "valid_targets_mean": 11088.9, "valid_targets_min": 3033 }, { "epoch": 1.8053097345132745, "grad_norm": 0.1905308663972179, "learning_rate": 3.2263543126998765e-05, "loss": 0.3956, "loss_nan_ranks": 0, "loss_rank_avg": 0.11409647762775421, "step": 3060, "valid_targets_mean": 8808.9, "valid_targets_min": 1628 }, { "epoch": 1.808259587020649, "grad_norm": 0.19650377661381702, "learning_rate": 3.223097896453171e-05, "loss": 0.3887, "loss_nan_ranks": 0, "loss_rank_avg": 0.13997744023799896, "step": 3065, "valid_targets_mean": 10004.9, "valid_targets_min": 2090 }, { "epoch": 1.8112094395280236, "grad_norm": 0.2027973299079048, "learning_rate": 3.2198362922857896e-05, "loss": 0.3927, "loss_nan_ranks": 0, "loss_rank_avg": 0.13658654689788818, "step": 3070, "valid_targets_mean": 11585.9, "valid_targets_min": 1578 }, { "epoch": 1.8141592920353982, "grad_norm": 0.20214465917193142, "learning_rate": 3.216569514032229e-05, "loss": 0.3878, "loss_nan_ranks": 0, "loss_rank_avg": 0.1428215205669403, "step": 3075, "valid_targets_mean": 10658.7, "valid_targets_min": 1712 }, { "epoch": 1.8171091445427727, "grad_norm": 0.20351093437896298, "learning_rate": 3.213297575548932e-05, "loss": 0.3895, "loss_nan_ranks": 0, "loss_rank_avg": 0.14719177782535553, "step": 3080, "valid_targets_mean": 11714.4, "valid_targets_min": 2874 }, { "epoch": 1.8200589970501475, "grad_norm": 0.2021762199445001, "learning_rate": 3.210020490714231e-05, "loss": 0.386, "loss_nan_ranks": 0, "loss_rank_avg": 0.10983000695705414, "step": 3085, "valid_targets_mean": 9205.3, "valid_targets_min": 2733 }, { "epoch": 1.823008849557522, "grad_norm": 0.2079297438681715, "learning_rate": 3.206738273428284e-05, "loss": 0.3852, "loss_nan_ranks": 0, "loss_rank_avg": 0.10927362740039825, "step": 3090, "valid_targets_mean": 8837.8, "valid_targets_min": 2032 }, { "epoch": 1.8259587020648969, "grad_norm": 0.2086646841099004, "learning_rate": 3.2034509376130216e-05, "loss": 0.3861, "loss_nan_ranks": 0, "loss_rank_avg": 0.1262950301170349, "step": 3095, "valid_targets_mean": 10313.7, "valid_targets_min": 2037 }, { "epoch": 1.8289085545722714, "grad_norm": 0.1892482439759891, "learning_rate": 3.200158497212083e-05, "loss": 0.3928, "loss_nan_ranks": 0, "loss_rank_avg": 0.10493605583906174, "step": 3100, "valid_targets_mean": 8079.2, "valid_targets_min": 1799 }, { "epoch": 1.831858407079646, "grad_norm": 0.20237233479384295, "learning_rate": 3.1968609661907624e-05, "loss": 0.3828, "loss_nan_ranks": 0, "loss_rank_avg": 0.15934070944786072, "step": 3105, "valid_targets_mean": 11687.4, "valid_targets_min": 1660 }, { "epoch": 1.8348082595870205, "grad_norm": 0.19728440008329404, "learning_rate": 3.193558358535944e-05, "loss": 0.3953, "loss_nan_ranks": 0, "loss_rank_avg": 0.12290243059396744, "step": 3110, "valid_targets_mean": 9689.1, "valid_targets_min": 1213 }, { "epoch": 1.8377581120943953, "grad_norm": 0.18298811670162993, "learning_rate": 3.190250688256045e-05, "loss": 0.391, "loss_nan_ranks": 0, "loss_rank_avg": 0.1717981994152069, "step": 3115, "valid_targets_mean": 13727.9, "valid_targets_min": 2019 }, { "epoch": 1.8407079646017699, "grad_norm": 0.18698664444995303, "learning_rate": 3.186937969380957e-05, "loss": 0.3901, "loss_nan_ranks": 0, "loss_rank_avg": 0.10982745885848999, "step": 3120, "valid_targets_mean": 8408.8, "valid_targets_min": 1770 }, { "epoch": 1.8436578171091447, "grad_norm": 0.20456556558122935, "learning_rate": 3.183620215961987e-05, "loss": 0.3943, "loss_nan_ranks": 0, "loss_rank_avg": 0.14105704426765442, "step": 3125, "valid_targets_mean": 10496.0, "valid_targets_min": 1924 }, { "epoch": 1.8466076696165192, "grad_norm": 0.19477584095116424, "learning_rate": 3.180297442071796e-05, "loss": 0.3895, "loss_nan_ranks": 0, "loss_rank_avg": 0.119300976395607, "step": 3130, "valid_targets_mean": 9131.2, "valid_targets_min": 2712 }, { "epoch": 1.8495575221238938, "grad_norm": 0.20615521662254552, "learning_rate": 3.176969661804338e-05, "loss": 0.3902, "loss_nan_ranks": 0, "loss_rank_avg": 0.128769189119339, "step": 3135, "valid_targets_mean": 8391.5, "valid_targets_min": 1896 }, { "epoch": 1.8525073746312684, "grad_norm": 0.18706097563298538, "learning_rate": 3.173636889274804e-05, "loss": 0.3845, "loss_nan_ranks": 0, "loss_rank_avg": 0.12298412621021271, "step": 3140, "valid_targets_mean": 9973.9, "valid_targets_min": 1874 }, { "epoch": 1.855457227138643, "grad_norm": 0.18296786256497324, "learning_rate": 3.170299138619561e-05, "loss": 0.3883, "loss_nan_ranks": 0, "loss_rank_avg": 0.13840444386005402, "step": 3145, "valid_targets_mean": 11387.2, "valid_targets_min": 2079 }, { "epoch": 1.8584070796460177, "grad_norm": 0.18750099633802875, "learning_rate": 3.16695642399609e-05, "loss": 0.3885, "loss_nan_ranks": 0, "loss_rank_avg": 0.13286367058753967, "step": 3150, "valid_targets_mean": 9381.8, "valid_targets_min": 1708 }, { "epoch": 1.8613569321533925, "grad_norm": 0.18499110557748116, "learning_rate": 3.1636087595829265e-05, "loss": 0.3942, "loss_nan_ranks": 0, "loss_rank_avg": 0.12365491688251495, "step": 3155, "valid_targets_mean": 8509.3, "valid_targets_min": 1118 }, { "epoch": 1.864306784660767, "grad_norm": 0.1832860638035741, "learning_rate": 3.160256159579604e-05, "loss": 0.3941, "loss_nan_ranks": 0, "loss_rank_avg": 0.12997931241989136, "step": 3160, "valid_targets_mean": 10374.7, "valid_targets_min": 2011 }, { "epoch": 1.8672566371681416, "grad_norm": 0.18516569508028138, "learning_rate": 3.156898638206588e-05, "loss": 0.3916, "loss_nan_ranks": 0, "loss_rank_avg": 0.15980814397335052, "step": 3165, "valid_targets_mean": 12519.0, "valid_targets_min": 1887 }, { "epoch": 1.8702064896755162, "grad_norm": 0.19172567895750345, "learning_rate": 3.153536209705219e-05, "loss": 0.3863, "loss_nan_ranks": 0, "loss_rank_avg": 0.1256943941116333, "step": 3170, "valid_targets_mean": 9916.1, "valid_targets_min": 1793 }, { "epoch": 1.8731563421828907, "grad_norm": 0.30905823355413986, "learning_rate": 3.150168888337654e-05, "loss": 0.3964, "loss_nan_ranks": 0, "loss_rank_avg": 0.14326061308383942, "step": 3175, "valid_targets_mean": 10340.9, "valid_targets_min": 1125 }, { "epoch": 1.8761061946902655, "grad_norm": 0.18744713637296262, "learning_rate": 3.1467966883868016e-05, "loss": 0.3875, "loss_nan_ranks": 0, "loss_rank_avg": 0.13681210577487946, "step": 3180, "valid_targets_mean": 9584.5, "valid_targets_min": 2028 }, { "epoch": 1.87905604719764, "grad_norm": 0.18734267628944543, "learning_rate": 3.143419624156264e-05, "loss": 0.3951, "loss_nan_ranks": 0, "loss_rank_avg": 0.14888234436511993, "step": 3185, "valid_targets_mean": 11590.9, "valid_targets_min": 2261 }, { "epoch": 1.8820058997050149, "grad_norm": 0.19649116485647783, "learning_rate": 3.140037709970277e-05, "loss": 0.3897, "loss_nan_ranks": 0, "loss_rank_avg": 0.1408083736896515, "step": 3190, "valid_targets_mean": 11354.4, "valid_targets_min": 1773 }, { "epoch": 1.8849557522123894, "grad_norm": 0.17818662817613437, "learning_rate": 3.136650960173645e-05, "loss": 0.3918, "loss_nan_ranks": 0, "loss_rank_avg": 0.12512937188148499, "step": 3195, "valid_targets_mean": 9635.8, "valid_targets_min": 2187 }, { "epoch": 1.887905604719764, "grad_norm": 0.18895452708671834, "learning_rate": 3.1332593891316866e-05, "loss": 0.3846, "loss_nan_ranks": 0, "loss_rank_avg": 0.13278134167194366, "step": 3200, "valid_targets_mean": 10532.5, "valid_targets_min": 1940 }, { "epoch": 1.8908554572271385, "grad_norm": 0.18407399327994156, "learning_rate": 3.129863011230168e-05, "loss": 0.3889, "loss_nan_ranks": 0, "loss_rank_avg": 0.13952814042568207, "step": 3205, "valid_targets_mean": 11384.6, "valid_targets_min": 2096 }, { "epoch": 1.893805309734513, "grad_norm": 0.2037091941871826, "learning_rate": 3.126461840875247e-05, "loss": 0.3864, "loss_nan_ranks": 0, "loss_rank_avg": 0.12919670343399048, "step": 3210, "valid_targets_mean": 10272.5, "valid_targets_min": 2815 }, { "epoch": 1.896755162241888, "grad_norm": 0.22168382970996411, "learning_rate": 3.1230558924934056e-05, "loss": 0.3926, "loss_nan_ranks": 0, "loss_rank_avg": 0.14533631503582, "step": 3215, "valid_targets_mean": 11145.4, "valid_targets_min": 818 }, { "epoch": 1.8997050147492627, "grad_norm": 0.18055963902795616, "learning_rate": 3.119645180531395e-05, "loss": 0.3849, "loss_nan_ranks": 0, "loss_rank_avg": 0.115432009100914, "step": 3220, "valid_targets_mean": 9275.6, "valid_targets_min": 1757 }, { "epoch": 1.9026548672566372, "grad_norm": 0.20541231868387194, "learning_rate": 3.11622971945617e-05, "loss": 0.3895, "loss_nan_ranks": 0, "loss_rank_avg": 0.13783042132854462, "step": 3225, "valid_targets_mean": 10562.0, "valid_targets_min": 1778 }, { "epoch": 1.9056047197640118, "grad_norm": 0.19273506769296583, "learning_rate": 3.112809523754832e-05, "loss": 0.3872, "loss_nan_ranks": 0, "loss_rank_avg": 0.12814044952392578, "step": 3230, "valid_targets_mean": 9969.5, "valid_targets_min": 1957 }, { "epoch": 1.9085545722713864, "grad_norm": 0.18530212003507177, "learning_rate": 3.109384607934562e-05, "loss": 0.389, "loss_nan_ranks": 0, "loss_rank_avg": 0.14377827942371368, "step": 3235, "valid_targets_mean": 10153.2, "valid_targets_min": 2191 }, { "epoch": 1.911504424778761, "grad_norm": 0.18959418284382742, "learning_rate": 3.105954986522563e-05, "loss": 0.3961, "loss_nan_ranks": 0, "loss_rank_avg": 0.10337518155574799, "step": 3240, "valid_targets_mean": 8849.2, "valid_targets_min": 324 }, { "epoch": 1.9144542772861357, "grad_norm": 0.19079851081682211, "learning_rate": 3.102520674065998e-05, "loss": 0.3897, "loss_nan_ranks": 0, "loss_rank_avg": 0.13874873518943787, "step": 3245, "valid_targets_mean": 10924.6, "valid_targets_min": 2710 }, { "epoch": 1.9174041297935103, "grad_norm": 0.1961476176724746, "learning_rate": 3.099081685131927e-05, "loss": 0.3918, "loss_nan_ranks": 0, "loss_rank_avg": 0.14250710606575012, "step": 3250, "valid_targets_mean": 11752.3, "valid_targets_min": 1969 }, { "epoch": 1.920353982300885, "grad_norm": 0.1958977931346944, "learning_rate": 3.0956380343072466e-05, "loss": 0.3915, "loss_nan_ranks": 0, "loss_rank_avg": 0.15353846549987793, "step": 3255, "valid_targets_mean": 12698.6, "valid_targets_min": 2768 }, { "epoch": 1.9233038348082596, "grad_norm": 0.1997870314794016, "learning_rate": 3.092189736198625e-05, "loss": 0.3929, "loss_nan_ranks": 0, "loss_rank_avg": 0.12486180663108826, "step": 3260, "valid_targets_mean": 10104.6, "valid_targets_min": 1652 }, { "epoch": 1.9262536873156342, "grad_norm": 0.20616461880710768, "learning_rate": 3.0887368054324456e-05, "loss": 0.3939, "loss_nan_ranks": 0, "loss_rank_avg": 0.13557863235473633, "step": 3265, "valid_targets_mean": 11014.7, "valid_targets_min": 1872 }, { "epoch": 1.9292035398230087, "grad_norm": 0.2131487654674189, "learning_rate": 3.08527925665474e-05, "loss": 0.3868, "loss_nan_ranks": 0, "loss_rank_avg": 0.13005343079566956, "step": 3270, "valid_targets_mean": 10039.7, "valid_targets_min": 2777 }, { "epoch": 1.9321533923303835, "grad_norm": 0.19008851385831405, "learning_rate": 3.081817104531129e-05, "loss": 0.3936, "loss_nan_ranks": 0, "loss_rank_avg": 0.14494222402572632, "step": 3275, "valid_targets_mean": 11453.5, "valid_targets_min": 1275 }, { "epoch": 1.935103244837758, "grad_norm": 0.19372049268738326, "learning_rate": 3.078350363746756e-05, "loss": 0.3956, "loss_nan_ranks": 0, "loss_rank_avg": 0.11742343753576279, "step": 3280, "valid_targets_mean": 8932.7, "valid_targets_min": 1791 }, { "epoch": 1.9380530973451329, "grad_norm": 0.1779269365091446, "learning_rate": 3.074879049006232e-05, "loss": 0.3814, "loss_nan_ranks": 0, "loss_rank_avg": 0.13389301300048828, "step": 3285, "valid_targets_mean": 11101.6, "valid_targets_min": 2707 }, { "epoch": 1.9410029498525074, "grad_norm": 0.19998320668730726, "learning_rate": 3.0714031750335655e-05, "loss": 0.3896, "loss_nan_ranks": 0, "loss_rank_avg": 0.1562095731496811, "step": 3290, "valid_targets_mean": 10862.0, "valid_targets_min": 1591 }, { "epoch": 1.943952802359882, "grad_norm": 0.18309893130019378, "learning_rate": 3.067922756572106e-05, "loss": 0.3891, "loss_nan_ranks": 0, "loss_rank_avg": 0.14485730230808258, "step": 3295, "valid_targets_mean": 10801.4, "valid_targets_min": 1421 }, { "epoch": 1.9469026548672566, "grad_norm": 0.19390454376598912, "learning_rate": 3.064437808384477e-05, "loss": 0.3907, "loss_nan_ranks": 0, "loss_rank_avg": 0.12800556421279907, "step": 3300, "valid_targets_mean": 8929.9, "valid_targets_min": 1203 }, { "epoch": 1.9498525073746311, "grad_norm": 0.179528235286811, "learning_rate": 3.0609483452525176e-05, "loss": 0.3962, "loss_nan_ranks": 0, "loss_rank_avg": 0.13554666936397552, "step": 3305, "valid_targets_mean": 10474.6, "valid_targets_min": 1041 }, { "epoch": 1.952802359882006, "grad_norm": 0.19683332955124822, "learning_rate": 3.057454381977214e-05, "loss": 0.3916, "loss_nan_ranks": 0, "loss_rank_avg": 0.11626716703176498, "step": 3310, "valid_targets_mean": 8967.3, "valid_targets_min": 2401 }, { "epoch": 1.9557522123893807, "grad_norm": 0.18365947696319398, "learning_rate": 3.053955933378645e-05, "loss": 0.3869, "loss_nan_ranks": 0, "loss_rank_avg": 0.137057363986969, "step": 3315, "valid_targets_mean": 10507.0, "valid_targets_min": 1811 }, { "epoch": 1.9587020648967552, "grad_norm": 0.1869865865059805, "learning_rate": 3.0504530142959105e-05, "loss": 0.3932, "loss_nan_ranks": 0, "loss_rank_avg": 0.11256128549575806, "step": 3320, "valid_targets_mean": 9101.4, "valid_targets_min": 1896 }, { "epoch": 1.9616519174041298, "grad_norm": 0.19801017724283992, "learning_rate": 3.046945639587075e-05, "loss": 0.3885, "loss_nan_ranks": 0, "loss_rank_avg": 0.14004410803318024, "step": 3325, "valid_targets_mean": 11740.2, "valid_targets_min": 1329 }, { "epoch": 1.9646017699115044, "grad_norm": 0.18975756312038314, "learning_rate": 3.0434338241291015e-05, "loss": 0.3898, "loss_nan_ranks": 0, "loss_rank_avg": 0.11776711046695709, "step": 3330, "valid_targets_mean": 8273.8, "valid_targets_min": 1581 }, { "epoch": 1.967551622418879, "grad_norm": 0.18066282594029207, "learning_rate": 3.0399175828177872e-05, "loss": 0.3918, "loss_nan_ranks": 0, "loss_rank_avg": 0.14526595175266266, "step": 3335, "valid_targets_mean": 10531.7, "valid_targets_min": 2030 }, { "epoch": 1.9705014749262537, "grad_norm": 0.24555864656109105, "learning_rate": 3.036396930567705e-05, "loss": 0.3849, "loss_nan_ranks": 0, "loss_rank_avg": 0.11780230700969696, "step": 3340, "valid_targets_mean": 8572.2, "valid_targets_min": 1302 }, { "epoch": 1.9734513274336283, "grad_norm": 0.1929888138428312, "learning_rate": 3.0328718823121355e-05, "loss": 0.3942, "loss_nan_ranks": 0, "loss_rank_avg": 0.13801506161689758, "step": 3345, "valid_targets_mean": 10365.0, "valid_targets_min": 1880 }, { "epoch": 1.976401179941003, "grad_norm": 0.19478904054138915, "learning_rate": 3.0293424530030056e-05, "loss": 0.3963, "loss_nan_ranks": 0, "loss_rank_avg": 0.15185290575027466, "step": 3350, "valid_targets_mean": 11930.6, "valid_targets_min": 1431 }, { "epoch": 1.9793510324483776, "grad_norm": 0.19519690417624672, "learning_rate": 3.0258086576108262e-05, "loss": 0.3882, "loss_nan_ranks": 0, "loss_rank_avg": 0.12830832600593567, "step": 3355, "valid_targets_mean": 10015.8, "valid_targets_min": 1439 }, { "epoch": 1.9823008849557522, "grad_norm": 0.1883692069344865, "learning_rate": 3.0222705111246253e-05, "loss": 0.3895, "loss_nan_ranks": 0, "loss_rank_avg": 0.13900379836559296, "step": 3360, "valid_targets_mean": 10110.8, "valid_targets_min": 2130 }, { "epoch": 1.9852507374631267, "grad_norm": 0.18813353910541836, "learning_rate": 3.0187280285518886e-05, "loss": 0.3918, "loss_nan_ranks": 0, "loss_rank_avg": 0.12365911900997162, "step": 3365, "valid_targets_mean": 9938.6, "valid_targets_min": 1395 }, { "epoch": 1.9882005899705013, "grad_norm": 0.5636207002863355, "learning_rate": 3.015181224918493e-05, "loss": 0.3968, "loss_nan_ranks": 0, "loss_rank_avg": 0.15566903352737427, "step": 3370, "valid_targets_mean": 11508.6, "valid_targets_min": 1832 }, { "epoch": 1.991150442477876, "grad_norm": 0.19814675061839912, "learning_rate": 3.011630115268644e-05, "loss": 0.3862, "loss_nan_ranks": 0, "loss_rank_avg": 0.11800093948841095, "step": 3375, "valid_targets_mean": 9993.5, "valid_targets_min": 2294 }, { "epoch": 1.9941002949852509, "grad_norm": 0.19741184278201546, "learning_rate": 3.008074714664812e-05, "loss": 0.3918, "loss_nan_ranks": 0, "loss_rank_avg": 0.1500239372253418, "step": 3380, "valid_targets_mean": 11300.2, "valid_targets_min": 1578 }, { "epoch": 1.9970501474926254, "grad_norm": 0.20703640740260867, "learning_rate": 3.0045150381876654e-05, "loss": 0.3829, "loss_nan_ranks": 0, "loss_rank_avg": 0.1278185397386551, "step": 3385, "valid_targets_mean": 10239.3, "valid_targets_min": 1636 }, { "epoch": 2.0, "grad_norm": 0.1889992510723016, "learning_rate": 3.0009511009360132e-05, "loss": 0.3875, "loss_nan_ranks": 0, "loss_rank_avg": 0.11499617993831635, "step": 3390, "valid_targets_mean": 9906.2, "valid_targets_min": 1715 }, { "epoch": 2.0029498525073746, "grad_norm": 0.21278107260553616, "learning_rate": 2.9973829180267344e-05, "loss": 0.3862, "loss_nan_ranks": 0, "loss_rank_avg": 0.11433631181716919, "step": 3395, "valid_targets_mean": 8588.9, "valid_targets_min": 1332 }, { "epoch": 2.005899705014749, "grad_norm": 0.1803230580174313, "learning_rate": 2.993810504594717e-05, "loss": 0.3779, "loss_nan_ranks": 0, "loss_rank_avg": 0.1344345510005951, "step": 3400, "valid_targets_mean": 11002.7, "valid_targets_min": 2057 }, { "epoch": 2.0088495575221237, "grad_norm": 0.19004812139972974, "learning_rate": 2.9902338757927945e-05, "loss": 0.3787, "loss_nan_ranks": 0, "loss_rank_avg": 0.1447649896144867, "step": 3405, "valid_targets_mean": 10779.6, "valid_targets_min": 1624 }, { "epoch": 2.0117994100294987, "grad_norm": 0.1754994480283632, "learning_rate": 2.9866530467916783e-05, "loss": 0.3837, "loss_nan_ranks": 0, "loss_rank_avg": 0.11555009335279465, "step": 3410, "valid_targets_mean": 9960.4, "valid_targets_min": 934 }, { "epoch": 2.0147492625368733, "grad_norm": 0.2008870048940001, "learning_rate": 2.983068032779897e-05, "loss": 0.3813, "loss_nan_ranks": 0, "loss_rank_avg": 0.1313355714082718, "step": 3415, "valid_targets_mean": 10384.6, "valid_targets_min": 1938 }, { "epoch": 2.017699115044248, "grad_norm": 0.17804754922004767, "learning_rate": 2.97947884896373e-05, "loss": 0.3821, "loss_nan_ranks": 0, "loss_rank_avg": 0.1404610574245453, "step": 3420, "valid_targets_mean": 12087.9, "valid_targets_min": 1363 }, { "epoch": 2.0206489675516224, "grad_norm": 0.2177881217184323, "learning_rate": 2.975885510567143e-05, "loss": 0.3887, "loss_nan_ranks": 0, "loss_rank_avg": 0.10633949935436249, "step": 3425, "valid_targets_mean": 9539.9, "valid_targets_min": 2274 }, { "epoch": 2.023598820058997, "grad_norm": 0.18809039627040855, "learning_rate": 2.9722880328317246e-05, "loss": 0.3785, "loss_nan_ranks": 0, "loss_rank_avg": 0.12327896058559418, "step": 3430, "valid_targets_mean": 9841.0, "valid_targets_min": 2940 }, { "epoch": 2.0265486725663715, "grad_norm": 0.17916281339730925, "learning_rate": 2.9686864310166206e-05, "loss": 0.3806, "loss_nan_ranks": 0, "loss_rank_avg": 0.12415190786123276, "step": 3435, "valid_targets_mean": 10737.5, "valid_targets_min": 2207 }, { "epoch": 2.0294985250737465, "grad_norm": 0.1843528188235671, "learning_rate": 2.965080720398469e-05, "loss": 0.379, "loss_nan_ranks": 0, "loss_rank_avg": 0.10842064023017883, "step": 3440, "valid_targets_mean": 10486.7, "valid_targets_min": 2517 }, { "epoch": 2.032448377581121, "grad_norm": 0.19308551789685657, "learning_rate": 2.9614709162713377e-05, "loss": 0.3886, "loss_nan_ranks": 0, "loss_rank_avg": 0.10595126450061798, "step": 3445, "valid_targets_mean": 8381.7, "valid_targets_min": 1327 }, { "epoch": 2.0353982300884956, "grad_norm": 0.19204697437288043, "learning_rate": 2.9578570339466553e-05, "loss": 0.3831, "loss_nan_ranks": 0, "loss_rank_avg": 0.1404932737350464, "step": 3450, "valid_targets_mean": 10446.8, "valid_targets_min": 1143 }, { "epoch": 2.03834808259587, "grad_norm": 0.1789574739748446, "learning_rate": 2.95423908875315e-05, "loss": 0.3817, "loss_nan_ranks": 0, "loss_rank_avg": 0.10503190755844116, "step": 3455, "valid_targets_mean": 8746.9, "valid_targets_min": 1190 }, { "epoch": 2.0412979351032448, "grad_norm": 0.18398589452173997, "learning_rate": 2.9506170960367826e-05, "loss": 0.3832, "loss_nan_ranks": 0, "loss_rank_avg": 0.124261774122715, "step": 3460, "valid_targets_mean": 10087.5, "valid_targets_min": 1183 }, { "epoch": 2.0442477876106193, "grad_norm": 0.19056300671049287, "learning_rate": 2.9469910711606827e-05, "loss": 0.3837, "loss_nan_ranks": 0, "loss_rank_avg": 0.12515035271644592, "step": 3465, "valid_targets_mean": 10579.7, "valid_targets_min": 1933 }, { "epoch": 2.047197640117994, "grad_norm": 0.19450910448739192, "learning_rate": 2.9433610295050825e-05, "loss": 0.3938, "loss_nan_ranks": 0, "loss_rank_avg": 0.12465958297252655, "step": 3470, "valid_targets_mean": 8302.7, "valid_targets_min": 1372 }, { "epoch": 2.050147492625369, "grad_norm": 0.1845326161792297, "learning_rate": 2.9397269864672502e-05, "loss": 0.3901, "loss_nan_ranks": 0, "loss_rank_avg": 0.133334219455719, "step": 3475, "valid_targets_mean": 9780.0, "valid_targets_min": 2871 }, { "epoch": 2.0530973451327434, "grad_norm": 0.17669162571743713, "learning_rate": 2.93608895746143e-05, "loss": 0.3817, "loss_nan_ranks": 0, "loss_rank_avg": 0.13513781130313873, "step": 3480, "valid_targets_mean": 11931.6, "valid_targets_min": 2711 }, { "epoch": 2.056047197640118, "grad_norm": 0.17475474879616718, "learning_rate": 2.9324469579187687e-05, "loss": 0.3813, "loss_nan_ranks": 0, "loss_rank_avg": 0.14042824506759644, "step": 3485, "valid_targets_mean": 11337.6, "valid_targets_min": 2230 }, { "epoch": 2.0589970501474926, "grad_norm": 0.1770599580241005, "learning_rate": 2.928801003287259e-05, "loss": 0.3909, "loss_nan_ranks": 0, "loss_rank_avg": 0.1170044094324112, "step": 3490, "valid_targets_mean": 8988.7, "valid_targets_min": 1903 }, { "epoch": 2.061946902654867, "grad_norm": 0.18907281322057007, "learning_rate": 2.9251511090316653e-05, "loss": 0.3863, "loss_nan_ranks": 0, "loss_rank_avg": 0.13288113474845886, "step": 3495, "valid_targets_mean": 9600.8, "valid_targets_min": 1444 }, { "epoch": 2.0648967551622417, "grad_norm": 0.19113320061416877, "learning_rate": 2.9214972906334663e-05, "loss": 0.3836, "loss_nan_ranks": 0, "loss_rank_avg": 0.1208382397890091, "step": 3500, "valid_targets_mean": 9575.3, "valid_targets_min": 1520 }, { "epoch": 2.0678466076696167, "grad_norm": 0.18227771976678786, "learning_rate": 2.917839563590783e-05, "loss": 0.3808, "loss_nan_ranks": 0, "loss_rank_avg": 0.11254595965147018, "step": 3505, "valid_targets_mean": 9455.3, "valid_targets_min": 1637 }, { "epoch": 2.0707964601769913, "grad_norm": 0.18929906045231637, "learning_rate": 2.914177943418316e-05, "loss": 0.3854, "loss_nan_ranks": 0, "loss_rank_avg": 0.12085720151662827, "step": 3510, "valid_targets_mean": 10024.9, "valid_targets_min": 1887 }, { "epoch": 2.073746312684366, "grad_norm": 0.17363504832025936, "learning_rate": 2.9105124456472797e-05, "loss": 0.3863, "loss_nan_ranks": 0, "loss_rank_avg": 0.11590196192264557, "step": 3515, "valid_targets_mean": 9300.0, "valid_targets_min": 1605 }, { "epoch": 2.0766961651917404, "grad_norm": 0.17322065693898156, "learning_rate": 2.9068430858253335e-05, "loss": 0.3837, "loss_nan_ranks": 0, "loss_rank_avg": 0.10647255182266235, "step": 3520, "valid_targets_mean": 9143.5, "valid_targets_min": 1876 }, { "epoch": 2.079646017699115, "grad_norm": 0.2131679266056025, "learning_rate": 2.9031698795165223e-05, "loss": 0.3847, "loss_nan_ranks": 0, "loss_rank_avg": 0.144773468375206, "step": 3525, "valid_targets_mean": 11088.1, "valid_targets_min": 2465 }, { "epoch": 2.0825958702064895, "grad_norm": 0.18575805832779857, "learning_rate": 2.8994928423012027e-05, "loss": 0.3858, "loss_nan_ranks": 0, "loss_rank_avg": 0.11051160842180252, "step": 3530, "valid_targets_mean": 9622.8, "valid_targets_min": 1275 }, { "epoch": 2.0855457227138645, "grad_norm": 0.19586130635929078, "learning_rate": 2.895811989775982e-05, "loss": 0.383, "loss_nan_ranks": 0, "loss_rank_avg": 0.15362785756587982, "step": 3535, "valid_targets_mean": 11946.5, "valid_targets_min": 1343 }, { "epoch": 2.088495575221239, "grad_norm": 0.20219771286262053, "learning_rate": 2.8921273375536506e-05, "loss": 0.3781, "loss_nan_ranks": 0, "loss_rank_avg": 0.15547239780426025, "step": 3540, "valid_targets_mean": 11678.9, "valid_targets_min": 1990 }, { "epoch": 2.0914454277286136, "grad_norm": 0.1936160339229126, "learning_rate": 2.888438901263115e-05, "loss": 0.3811, "loss_nan_ranks": 0, "loss_rank_avg": 0.1208762675523758, "step": 3545, "valid_targets_mean": 9289.3, "valid_targets_min": 1483 }, { "epoch": 2.094395280235988, "grad_norm": 0.17413806399911613, "learning_rate": 2.884746696549334e-05, "loss": 0.3808, "loss_nan_ranks": 0, "loss_rank_avg": 0.1528923362493515, "step": 3550, "valid_targets_mean": 12582.7, "valid_targets_min": 2283 }, { "epoch": 2.0973451327433628, "grad_norm": 0.17194009034507063, "learning_rate": 2.8810507390732487e-05, "loss": 0.3839, "loss_nan_ranks": 0, "loss_rank_avg": 0.12632685899734497, "step": 3555, "valid_targets_mean": 10105.1, "valid_targets_min": 1272 }, { "epoch": 2.1002949852507373, "grad_norm": 0.19009776249260985, "learning_rate": 2.8773510445117195e-05, "loss": 0.3803, "loss_nan_ranks": 0, "loss_rank_avg": 0.11879489570856094, "step": 3560, "valid_targets_mean": 7560.3, "valid_targets_min": 1859 }, { "epoch": 2.103244837758112, "grad_norm": 0.17211994107816161, "learning_rate": 2.873647628557457e-05, "loss": 0.3782, "loss_nan_ranks": 0, "loss_rank_avg": 0.12576919794082642, "step": 3565, "valid_targets_mean": 9344.3, "valid_targets_min": 2537 }, { "epoch": 2.106194690265487, "grad_norm": 0.17305575511305302, "learning_rate": 2.8699405069189573e-05, "loss": 0.3801, "loss_nan_ranks": 0, "loss_rank_avg": 0.1216350868344307, "step": 3570, "valid_targets_mean": 10676.6, "valid_targets_min": 2376 }, { "epoch": 2.1091445427728615, "grad_norm": 0.17356172191088662, "learning_rate": 2.866229695320434e-05, "loss": 0.3827, "loss_nan_ranks": 0, "loss_rank_avg": 0.1366838812828064, "step": 3575, "valid_targets_mean": 10206.7, "valid_targets_min": 1930 }, { "epoch": 2.112094395280236, "grad_norm": 0.2080655561460447, "learning_rate": 2.862515209501753e-05, "loss": 0.3778, "loss_nan_ranks": 0, "loss_rank_avg": 0.11368487775325775, "step": 3580, "valid_targets_mean": 9517.6, "valid_targets_min": 1673 }, { "epoch": 2.1150442477876106, "grad_norm": 0.19332899914412788, "learning_rate": 2.8587970652183642e-05, "loss": 0.3803, "loss_nan_ranks": 0, "loss_rank_avg": 0.13519152998924255, "step": 3585, "valid_targets_mean": 10623.7, "valid_targets_min": 2951 }, { "epoch": 2.117994100294985, "grad_norm": 0.18213962512925527, "learning_rate": 2.8550752782412353e-05, "loss": 0.3853, "loss_nan_ranks": 0, "loss_rank_avg": 0.13883964717388153, "step": 3590, "valid_targets_mean": 11495.6, "valid_targets_min": 1657 }, { "epoch": 2.1209439528023597, "grad_norm": 0.21689471255079432, "learning_rate": 2.8513498643567853e-05, "loss": 0.3875, "loss_nan_ranks": 0, "loss_rank_avg": 0.12648020684719086, "step": 3595, "valid_targets_mean": 8984.3, "valid_targets_min": 2901 }, { "epoch": 2.1238938053097347, "grad_norm": 0.18398713084327645, "learning_rate": 2.847620839366816e-05, "loss": 0.3867, "loss_nan_ranks": 0, "loss_rank_avg": 0.11699029058218002, "step": 3600, "valid_targets_mean": 9561.6, "valid_targets_min": 1535 }, { "epoch": 2.1268436578171093, "grad_norm": 0.19909313835659861, "learning_rate": 2.8438882190884483e-05, "loss": 0.3983, "loss_nan_ranks": 0, "loss_rank_avg": 0.12598690390586853, "step": 3605, "valid_targets_mean": 9382.0, "valid_targets_min": 1289 }, { "epoch": 2.129793510324484, "grad_norm": 0.19239468673634438, "learning_rate": 2.8401520193540514e-05, "loss": 0.4, "loss_nan_ranks": 0, "loss_rank_avg": 0.1419348418712616, "step": 3610, "valid_targets_mean": 9724.2, "valid_targets_min": 2358 }, { "epoch": 2.1327433628318584, "grad_norm": 0.18329010429612305, "learning_rate": 2.836412256011177e-05, "loss": 0.3984, "loss_nan_ranks": 0, "loss_rank_avg": 0.13659611344337463, "step": 3615, "valid_targets_mean": 11027.6, "valid_targets_min": 1069 }, { "epoch": 2.135693215339233, "grad_norm": 0.1783365761769347, "learning_rate": 2.8326689449224938e-05, "loss": 0.3975, "loss_nan_ranks": 0, "loss_rank_avg": 0.11838910728693008, "step": 3620, "valid_targets_mean": 9196.5, "valid_targets_min": 536 }, { "epoch": 2.1386430678466075, "grad_norm": 0.18628293289232864, "learning_rate": 2.8289221019657172e-05, "loss": 0.3981, "loss_nan_ranks": 0, "loss_rank_avg": 0.12682795524597168, "step": 3625, "valid_targets_mean": 9754.9, "valid_targets_min": 1806 }, { "epoch": 2.1415929203539825, "grad_norm": 0.1819512424595782, "learning_rate": 2.8251717430335444e-05, "loss": 0.4009, "loss_nan_ranks": 0, "loss_rank_avg": 0.12250994890928268, "step": 3630, "valid_targets_mean": 9171.2, "valid_targets_min": 1140 }, { "epoch": 2.144542772861357, "grad_norm": 0.17284428231008353, "learning_rate": 2.8214178840335852e-05, "loss": 0.3997, "loss_nan_ranks": 0, "loss_rank_avg": 0.1340324878692627, "step": 3635, "valid_targets_mean": 9798.3, "valid_targets_min": 1344 }, { "epoch": 2.1474926253687316, "grad_norm": 0.19470660392467842, "learning_rate": 2.8176605408882957e-05, "loss": 0.4013, "loss_nan_ranks": 0, "loss_rank_avg": 0.12144613265991211, "step": 3640, "valid_targets_mean": 8997.8, "valid_targets_min": 2398 }, { "epoch": 2.150442477876106, "grad_norm": 0.18160998479053364, "learning_rate": 2.813899729534911e-05, "loss": 0.402, "loss_nan_ranks": 0, "loss_rank_avg": 0.1443384438753128, "step": 3645, "valid_targets_mean": 10034.7, "valid_targets_min": 1739 }, { "epoch": 2.1533923303834808, "grad_norm": 0.17558747890590443, "learning_rate": 2.8101354659253765e-05, "loss": 0.3993, "loss_nan_ranks": 0, "loss_rank_avg": 0.11908899247646332, "step": 3650, "valid_targets_mean": 9813.8, "valid_targets_min": 1050 }, { "epoch": 2.1563421828908553, "grad_norm": 0.16794874388601116, "learning_rate": 2.806367766026281e-05, "loss": 0.4, "loss_nan_ranks": 0, "loss_rank_avg": 0.1262470781803131, "step": 3655, "valid_targets_mean": 10142.0, "valid_targets_min": 2362 }, { "epoch": 2.15929203539823, "grad_norm": 0.18623675332508144, "learning_rate": 2.8025966458187886e-05, "loss": 0.3971, "loss_nan_ranks": 0, "loss_rank_avg": 0.1318787783384323, "step": 3660, "valid_targets_mean": 10334.2, "valid_targets_min": 1215 }, { "epoch": 2.162241887905605, "grad_norm": 0.17693481520897764, "learning_rate": 2.7988221212985708e-05, "loss": 0.3986, "loss_nan_ranks": 0, "loss_rank_avg": 0.11097447574138641, "step": 3665, "valid_targets_mean": 7946.3, "valid_targets_min": 1646 }, { "epoch": 2.1651917404129795, "grad_norm": 0.18784856297361613, "learning_rate": 2.7950442084757394e-05, "loss": 0.3985, "loss_nan_ranks": 0, "loss_rank_avg": 0.13702723383903503, "step": 3670, "valid_targets_mean": 10197.9, "valid_targets_min": 2517 }, { "epoch": 2.168141592920354, "grad_norm": 0.1827780965965856, "learning_rate": 2.791262923374778e-05, "loss": 0.4084, "loss_nan_ranks": 0, "loss_rank_avg": 0.1261982023715973, "step": 3675, "valid_targets_mean": 9506.9, "valid_targets_min": 2134 }, { "epoch": 2.1710914454277286, "grad_norm": 0.1859839322818085, "learning_rate": 2.787478282034473e-05, "loss": 0.3978, "loss_nan_ranks": 0, "loss_rank_avg": 0.1325964778661728, "step": 3680, "valid_targets_mean": 10417.7, "valid_targets_min": 1786 }, { "epoch": 2.174041297935103, "grad_norm": 0.1639518540971534, "learning_rate": 2.783690300507849e-05, "loss": 0.3852, "loss_nan_ranks": 0, "loss_rank_avg": 0.1373385339975357, "step": 3685, "valid_targets_mean": 10820.2, "valid_targets_min": 2213 }, { "epoch": 2.1769911504424777, "grad_norm": 0.17159152749861892, "learning_rate": 2.7798989948620962e-05, "loss": 0.3962, "loss_nan_ranks": 0, "loss_rank_avg": 0.14926663041114807, "step": 3690, "valid_targets_mean": 12955.4, "valid_targets_min": 1467 }, { "epoch": 2.1799410029498527, "grad_norm": 0.18047206481601527, "learning_rate": 2.7761043811785065e-05, "loss": 0.4003, "loss_nan_ranks": 0, "loss_rank_avg": 0.12459855526685715, "step": 3695, "valid_targets_mean": 10078.7, "valid_targets_min": 1501 }, { "epoch": 2.1828908554572273, "grad_norm": 0.19306413780026327, "learning_rate": 2.7723064755524018e-05, "loss": 0.3979, "loss_nan_ranks": 0, "loss_rank_avg": 0.11301134526729584, "step": 3700, "valid_targets_mean": 8772.9, "valid_targets_min": 1174 }, { "epoch": 2.185840707964602, "grad_norm": 0.18676754801787854, "learning_rate": 2.768505294093067e-05, "loss": 0.3947, "loss_nan_ranks": 0, "loss_rank_avg": 0.13223782181739807, "step": 3705, "valid_targets_mean": 10604.9, "valid_targets_min": 1801 }, { "epoch": 2.1887905604719764, "grad_norm": 0.1762536216691242, "learning_rate": 2.764700852923682e-05, "loss": 0.3908, "loss_nan_ranks": 0, "loss_rank_avg": 0.12154674530029297, "step": 3710, "valid_targets_mean": 8825.4, "valid_targets_min": 2007 }, { "epoch": 2.191740412979351, "grad_norm": 0.17120906094368002, "learning_rate": 2.7608931681812548e-05, "loss": 0.3907, "loss_nan_ranks": 0, "loss_rank_avg": 0.1289297640323639, "step": 3715, "valid_targets_mean": 10086.0, "valid_targets_min": 2308 }, { "epoch": 2.1946902654867255, "grad_norm": 0.17585644290659275, "learning_rate": 2.7570822560165494e-05, "loss": 0.3934, "loss_nan_ranks": 0, "loss_rank_avg": 0.11464974284172058, "step": 3720, "valid_targets_mean": 9196.3, "valid_targets_min": 2358 }, { "epoch": 2.1976401179941005, "grad_norm": 0.17193676556874152, "learning_rate": 2.75326813259402e-05, "loss": 0.4006, "loss_nan_ranks": 0, "loss_rank_avg": 0.10923153162002563, "step": 3725, "valid_targets_mean": 8499.4, "valid_targets_min": 1309 }, { "epoch": 2.200589970501475, "grad_norm": 0.17740306662737546, "learning_rate": 2.7494508140917423e-05, "loss": 0.3979, "loss_nan_ranks": 0, "loss_rank_avg": 0.13836762309074402, "step": 3730, "valid_targets_mean": 9956.7, "valid_targets_min": 1540 }, { "epoch": 2.2035398230088497, "grad_norm": 0.18082605228455478, "learning_rate": 2.7456303167013435e-05, "loss": 0.3932, "loss_nan_ranks": 0, "loss_rank_avg": 0.14022909104824066, "step": 3735, "valid_targets_mean": 10383.4, "valid_targets_min": 2501 }, { "epoch": 2.206489675516224, "grad_norm": 0.1783469044956506, "learning_rate": 2.7418066566279348e-05, "loss": 0.398, "loss_nan_ranks": 0, "loss_rank_avg": 0.1336425542831421, "step": 3740, "valid_targets_mean": 9967.4, "valid_targets_min": 1821 }, { "epoch": 2.2094395280235988, "grad_norm": 0.1691487313763563, "learning_rate": 2.7379798500900424e-05, "loss": 0.3939, "loss_nan_ranks": 0, "loss_rank_avg": 0.1256037950515747, "step": 3745, "valid_targets_mean": 9924.0, "valid_targets_min": 1816 }, { "epoch": 2.2123893805309733, "grad_norm": 0.18101957895595286, "learning_rate": 2.7341499133195385e-05, "loss": 0.3891, "loss_nan_ranks": 0, "loss_rank_avg": 0.13777321577072144, "step": 3750, "valid_targets_mean": 10049.2, "valid_targets_min": 1217 }, { "epoch": 2.215339233038348, "grad_norm": 0.17450735843383483, "learning_rate": 2.7303168625615718e-05, "loss": 0.401, "loss_nan_ranks": 0, "loss_rank_avg": 0.14749610424041748, "step": 3755, "valid_targets_mean": 12419.6, "valid_targets_min": 2271 }, { "epoch": 2.218289085545723, "grad_norm": 0.1845441504660646, "learning_rate": 2.7264807140745017e-05, "loss": 0.3884, "loss_nan_ranks": 0, "loss_rank_avg": 0.14936435222625732, "step": 3760, "valid_targets_mean": 10423.2, "valid_targets_min": 1900 }, { "epoch": 2.2212389380530975, "grad_norm": 0.18470787390804666, "learning_rate": 2.722641484129825e-05, "loss": 0.3896, "loss_nan_ranks": 0, "loss_rank_avg": 0.12111598998308182, "step": 3765, "valid_targets_mean": 8453.0, "valid_targets_min": 1408 }, { "epoch": 2.224188790560472, "grad_norm": 0.17056997100554727, "learning_rate": 2.7187991890121076e-05, "loss": 0.4008, "loss_nan_ranks": 0, "loss_rank_avg": 0.12580421566963196, "step": 3770, "valid_targets_mean": 9931.7, "valid_targets_min": 2305 }, { "epoch": 2.2271386430678466, "grad_norm": 0.18783881320534634, "learning_rate": 2.7149538450189204e-05, "loss": 0.3915, "loss_nan_ranks": 0, "loss_rank_avg": 0.1510670930147171, "step": 3775, "valid_targets_mean": 10178.9, "valid_targets_min": 1039 }, { "epoch": 2.230088495575221, "grad_norm": 0.1739931085046215, "learning_rate": 2.7111054684607644e-05, "loss": 0.3951, "loss_nan_ranks": 0, "loss_rank_avg": 0.14426995813846588, "step": 3780, "valid_targets_mean": 10581.9, "valid_targets_min": 1697 }, { "epoch": 2.2330383480825957, "grad_norm": 0.17254501855584767, "learning_rate": 2.7072540756610027e-05, "loss": 0.4058, "loss_nan_ranks": 0, "loss_rank_avg": 0.14102444052696228, "step": 3785, "valid_targets_mean": 10485.4, "valid_targets_min": 2081 }, { "epoch": 2.2359882005899703, "grad_norm": 0.16449191575448785, "learning_rate": 2.703399682955794e-05, "loss": 0.3961, "loss_nan_ranks": 0, "loss_rank_avg": 0.13488492369651794, "step": 3790, "valid_targets_mean": 10634.4, "valid_targets_min": 1494 }, { "epoch": 2.2389380530973453, "grad_norm": 0.1764118124541508, "learning_rate": 2.6995423066940206e-05, "loss": 0.3864, "loss_nan_ranks": 0, "loss_rank_avg": 0.12274979054927826, "step": 3795, "valid_targets_mean": 9134.9, "valid_targets_min": 1983 }, { "epoch": 2.24188790560472, "grad_norm": 0.18680929847990685, "learning_rate": 2.6956819632372194e-05, "loss": 0.4, "loss_nan_ranks": 0, "loss_rank_avg": 0.10951778292655945, "step": 3800, "valid_targets_mean": 7631.4, "valid_targets_min": 1308 }, { "epoch": 2.2448377581120944, "grad_norm": 0.20523570522718323, "learning_rate": 2.6918186689595134e-05, "loss": 0.3947, "loss_nan_ranks": 0, "loss_rank_avg": 0.1293448507785797, "step": 3805, "valid_targets_mean": 11488.8, "valid_targets_min": 3111 }, { "epoch": 2.247787610619469, "grad_norm": 0.17597635789172644, "learning_rate": 2.687952440247543e-05, "loss": 0.3926, "loss_nan_ranks": 0, "loss_rank_avg": 0.1164768636226654, "step": 3810, "valid_targets_mean": 9848.1, "valid_targets_min": 1539 }, { "epoch": 2.2507374631268435, "grad_norm": 0.18144303661230346, "learning_rate": 2.6840832935003942e-05, "loss": 0.3915, "loss_nan_ranks": 0, "loss_rank_avg": 0.15120357275009155, "step": 3815, "valid_targets_mean": 12024.1, "valid_targets_min": 2727 }, { "epoch": 2.2536873156342185, "grad_norm": 0.1847443407254508, "learning_rate": 2.68021124512953e-05, "loss": 0.3937, "loss_nan_ranks": 0, "loss_rank_avg": 0.12879443168640137, "step": 3820, "valid_targets_mean": 9545.0, "valid_targets_min": 1882 }, { "epoch": 2.256637168141593, "grad_norm": 0.18701048508634804, "learning_rate": 2.6763363115587218e-05, "loss": 0.3954, "loss_nan_ranks": 0, "loss_rank_avg": 0.11498545110225677, "step": 3825, "valid_targets_mean": 8259.6, "valid_targets_min": 1045 }, { "epoch": 2.2595870206489677, "grad_norm": 0.18824323332335477, "learning_rate": 2.6724585092239784e-05, "loss": 0.3932, "loss_nan_ranks": 0, "loss_rank_avg": 0.13292992115020752, "step": 3830, "valid_targets_mean": 10127.1, "valid_targets_min": 1797 }, { "epoch": 2.262536873156342, "grad_norm": 0.20140870554938575, "learning_rate": 2.668577854573477e-05, "loss": 0.3964, "loss_nan_ranks": 0, "loss_rank_avg": 0.12686914205551147, "step": 3835, "valid_targets_mean": 8850.4, "valid_targets_min": 1524 }, { "epoch": 2.265486725663717, "grad_norm": 0.17288624780173162, "learning_rate": 2.6646943640674937e-05, "loss": 0.3963, "loss_nan_ranks": 0, "loss_rank_avg": 0.1073978841304779, "step": 3840, "valid_targets_mean": 8547.2, "valid_targets_min": 1657 }, { "epoch": 2.2684365781710913, "grad_norm": 0.18135599145281248, "learning_rate": 2.6608080541783316e-05, "loss": 0.3905, "loss_nan_ranks": 0, "loss_rank_avg": 0.11137989163398743, "step": 3845, "valid_targets_mean": 7498.9, "valid_targets_min": 2006 }, { "epoch": 2.271386430678466, "grad_norm": 0.1858489858186105, "learning_rate": 2.6569189413902544e-05, "loss": 0.3944, "loss_nan_ranks": 0, "loss_rank_avg": 0.13760294020175934, "step": 3850, "valid_targets_mean": 10987.5, "valid_targets_min": 2508 }, { "epoch": 2.274336283185841, "grad_norm": 0.17666569108019423, "learning_rate": 2.6530270421994146e-05, "loss": 0.3992, "loss_nan_ranks": 0, "loss_rank_avg": 0.1223081648349762, "step": 3855, "valid_targets_mean": 10292.0, "valid_targets_min": 2280 }, { "epoch": 2.2772861356932155, "grad_norm": 0.18248461786488382, "learning_rate": 2.6491323731137818e-05, "loss": 0.3945, "loss_nan_ranks": 0, "loss_rank_avg": 0.13024061918258667, "step": 3860, "valid_targets_mean": 10601.8, "valid_targets_min": 1396 }, { "epoch": 2.28023598820059, "grad_norm": 0.18453098272423848, "learning_rate": 2.6452349506530762e-05, "loss": 0.3897, "loss_nan_ranks": 0, "loss_rank_avg": 0.1465938836336136, "step": 3865, "valid_targets_mean": 9942.6, "valid_targets_min": 2133 }, { "epoch": 2.2831858407079646, "grad_norm": 0.1800510324678868, "learning_rate": 2.6413347913486967e-05, "loss": 0.3993, "loss_nan_ranks": 0, "loss_rank_avg": 0.15016867220401764, "step": 3870, "valid_targets_mean": 9759.4, "valid_targets_min": 1581 }, { "epoch": 2.286135693215339, "grad_norm": 0.1840760855307141, "learning_rate": 2.637431911743649e-05, "loss": 0.3936, "loss_nan_ranks": 0, "loss_rank_avg": 0.1509101539850235, "step": 3875, "valid_targets_mean": 10620.5, "valid_targets_min": 1461 }, { "epoch": 2.2890855457227137, "grad_norm": 0.20046019039716598, "learning_rate": 2.63352632839248e-05, "loss": 0.3994, "loss_nan_ranks": 0, "loss_rank_avg": 0.11841368675231934, "step": 3880, "valid_targets_mean": 8787.5, "valid_targets_min": 2197 }, { "epoch": 2.2920353982300883, "grad_norm": 0.17185687883942527, "learning_rate": 2.629618057861202e-05, "loss": 0.3971, "loss_nan_ranks": 0, "loss_rank_avg": 0.11624648422002792, "step": 3885, "valid_targets_mean": 9077.8, "valid_targets_min": 2800 }, { "epoch": 2.2949852507374633, "grad_norm": 0.1740597178196862, "learning_rate": 2.625707116727228e-05, "loss": 0.3939, "loss_nan_ranks": 0, "loss_rank_avg": 0.13334083557128906, "step": 3890, "valid_targets_mean": 9941.8, "valid_targets_min": 2260 }, { "epoch": 2.297935103244838, "grad_norm": 0.17155366850277412, "learning_rate": 2.6217935215792967e-05, "loss": 0.3987, "loss_nan_ranks": 0, "loss_rank_avg": 0.13235624134540558, "step": 3895, "valid_targets_mean": 10138.6, "valid_targets_min": 1655 }, { "epoch": 2.3008849557522124, "grad_norm": 0.18246331548218217, "learning_rate": 2.6178772890174057e-05, "loss": 0.3885, "loss_nan_ranks": 0, "loss_rank_avg": 0.14090922474861145, "step": 3900, "valid_targets_mean": 9809.2, "valid_targets_min": 1817 }, { "epoch": 2.303834808259587, "grad_norm": 0.18779345629629093, "learning_rate": 2.6139584356527385e-05, "loss": 0.3968, "loss_nan_ranks": 0, "loss_rank_avg": 0.15629766881465912, "step": 3905, "valid_targets_mean": 11053.2, "valid_targets_min": 1891 }, { "epoch": 2.3067846607669615, "grad_norm": 0.17739964048057022, "learning_rate": 2.610036978107595e-05, "loss": 0.3874, "loss_nan_ranks": 0, "loss_rank_avg": 0.15338581800460815, "step": 3910, "valid_targets_mean": 10950.2, "valid_targets_min": 2265 }, { "epoch": 2.309734513274336, "grad_norm": 0.19609733988432582, "learning_rate": 2.6061129330153212e-05, "loss": 0.3941, "loss_nan_ranks": 0, "loss_rank_avg": 0.12699197232723236, "step": 3915, "valid_targets_mean": 9727.5, "valid_targets_min": 1294 }, { "epoch": 2.312684365781711, "grad_norm": 0.18288278960145077, "learning_rate": 2.602186317020239e-05, "loss": 0.3978, "loss_nan_ranks": 0, "loss_rank_avg": 0.13509252667427063, "step": 3920, "valid_targets_mean": 10823.4, "valid_targets_min": 2542 }, { "epoch": 2.3156342182890857, "grad_norm": 0.19152225870964204, "learning_rate": 2.598257146777575e-05, "loss": 0.3921, "loss_nan_ranks": 0, "loss_rank_avg": 0.1314992904663086, "step": 3925, "valid_targets_mean": 10381.6, "valid_targets_min": 1504 }, { "epoch": 2.3185840707964602, "grad_norm": 0.17075307828765438, "learning_rate": 2.5943254389533888e-05, "loss": 0.3903, "loss_nan_ranks": 0, "loss_rank_avg": 0.1531062126159668, "step": 3930, "valid_targets_mean": 10812.6, "valid_targets_min": 1055 }, { "epoch": 2.321533923303835, "grad_norm": 0.17132496778995138, "learning_rate": 2.5903912102245053e-05, "loss": 0.3961, "loss_nan_ranks": 0, "loss_rank_avg": 0.11895540356636047, "step": 3935, "valid_targets_mean": 9040.8, "valid_targets_min": 1130 }, { "epoch": 2.3244837758112094, "grad_norm": 0.18685408915114127, "learning_rate": 2.5864544772784407e-05, "loss": 0.3918, "loss_nan_ranks": 0, "loss_rank_avg": 0.11604495346546173, "step": 3940, "valid_targets_mean": 9655.9, "valid_targets_min": 1410 }, { "epoch": 2.327433628318584, "grad_norm": 0.16879584787533836, "learning_rate": 2.5825152568133343e-05, "loss": 0.3924, "loss_nan_ranks": 0, "loss_rank_avg": 0.11255620419979095, "step": 3945, "valid_targets_mean": 8905.6, "valid_targets_min": 1830 }, { "epoch": 2.330383480825959, "grad_norm": 0.1864666442297191, "learning_rate": 2.5785735655378745e-05, "loss": 0.3919, "loss_nan_ranks": 0, "loss_rank_avg": 0.11839946359395981, "step": 3950, "valid_targets_mean": 9882.5, "valid_targets_min": 2408 }, { "epoch": 2.3333333333333335, "grad_norm": 0.23730696535755824, "learning_rate": 2.5746294201712326e-05, "loss": 0.3934, "loss_nan_ranks": 0, "loss_rank_avg": 0.12219962477684021, "step": 3955, "valid_targets_mean": 9463.4, "valid_targets_min": 1659 }, { "epoch": 2.336283185840708, "grad_norm": 0.16420168897254991, "learning_rate": 2.5706828374429873e-05, "loss": 0.3949, "loss_nan_ranks": 0, "loss_rank_avg": 0.11978039145469666, "step": 3960, "valid_targets_mean": 11038.2, "valid_targets_min": 1531 }, { "epoch": 2.3392330383480826, "grad_norm": 0.18849127213452108, "learning_rate": 2.5667338340930563e-05, "loss": 0.3915, "loss_nan_ranks": 0, "loss_rank_avg": 0.1379072070121765, "step": 3965, "valid_targets_mean": 10074.7, "valid_targets_min": 2085 }, { "epoch": 2.342182890855457, "grad_norm": 0.171765781113225, "learning_rate": 2.5627824268716247e-05, "loss": 0.3955, "loss_nan_ranks": 0, "loss_rank_avg": 0.11300992965698242, "step": 3970, "valid_targets_mean": 10108.6, "valid_targets_min": 1642 }, { "epoch": 2.3451327433628317, "grad_norm": 0.17177249459813396, "learning_rate": 2.5588286325390744e-05, "loss": 0.3961, "loss_nan_ranks": 0, "loss_rank_avg": 0.12897521257400513, "step": 3975, "valid_targets_mean": 9673.6, "valid_targets_min": 997 }, { "epoch": 2.3480825958702063, "grad_norm": 0.17701611497782288, "learning_rate": 2.5548724678659115e-05, "loss": 0.3926, "loss_nan_ranks": 0, "loss_rank_avg": 0.11329556256532669, "step": 3980, "valid_targets_mean": 8708.4, "valid_targets_min": 1573 }, { "epoch": 2.3510324483775813, "grad_norm": 0.25579883316916374, "learning_rate": 2.550913949632697e-05, "loss": 0.3938, "loss_nan_ranks": 0, "loss_rank_avg": 0.14847159385681152, "step": 3985, "valid_targets_mean": 12304.2, "valid_targets_min": 1814 }, { "epoch": 2.353982300884956, "grad_norm": 0.16613061378431035, "learning_rate": 2.5469530946299746e-05, "loss": 0.3985, "loss_nan_ranks": 0, "loss_rank_avg": 0.13126221299171448, "step": 3990, "valid_targets_mean": 11132.8, "valid_targets_min": 1200 }, { "epoch": 2.3569321533923304, "grad_norm": 0.17686783624732347, "learning_rate": 2.542989919658199e-05, "loss": 0.4007, "loss_nan_ranks": 0, "loss_rank_avg": 0.14059323072433472, "step": 3995, "valid_targets_mean": 10237.6, "valid_targets_min": 950 }, { "epoch": 2.359882005899705, "grad_norm": 0.20215416996696808, "learning_rate": 2.5390244415276666e-05, "loss": 0.3939, "loss_nan_ranks": 0, "loss_rank_avg": 0.1143152043223381, "step": 4000, "valid_targets_mean": 10417.7, "valid_targets_min": 2034 }, { "epoch": 2.3628318584070795, "grad_norm": 0.17655569706363347, "learning_rate": 2.5350566770584423e-05, "loss": 0.3846, "loss_nan_ranks": 0, "loss_rank_avg": 0.13264046609401703, "step": 4005, "valid_targets_mean": 11726.6, "valid_targets_min": 1312 }, { "epoch": 2.365781710914454, "grad_norm": 0.17920640711803199, "learning_rate": 2.5310866430802877e-05, "loss": 0.391, "loss_nan_ranks": 0, "loss_rank_avg": 0.11140947043895721, "step": 4010, "valid_targets_mean": 8954.2, "valid_targets_min": 1876 }, { "epoch": 2.3687315634218287, "grad_norm": 0.2076440770678389, "learning_rate": 2.527114356432593e-05, "loss": 0.3953, "loss_nan_ranks": 0, "loss_rank_avg": 0.15259167551994324, "step": 4015, "valid_targets_mean": 10257.4, "valid_targets_min": 2939 }, { "epoch": 2.3716814159292037, "grad_norm": 0.1884915676583662, "learning_rate": 2.5231398339643022e-05, "loss": 0.3907, "loss_nan_ranks": 0, "loss_rank_avg": 0.12428969889879227, "step": 4020, "valid_targets_mean": 9281.1, "valid_targets_min": 2123 }, { "epoch": 2.3746312684365782, "grad_norm": 0.18874802459911955, "learning_rate": 2.519163092533843e-05, "loss": 0.3912, "loss_nan_ranks": 0, "loss_rank_avg": 0.14149920642375946, "step": 4025, "valid_targets_mean": 9339.8, "valid_targets_min": 2558 }, { "epoch": 2.377581120943953, "grad_norm": 0.17723065208387231, "learning_rate": 2.5151841490090537e-05, "loss": 0.3936, "loss_nan_ranks": 0, "loss_rank_avg": 0.1307816505432129, "step": 4030, "valid_targets_mean": 9360.2, "valid_targets_min": 2415 }, { "epoch": 2.3805309734513274, "grad_norm": 0.17421579470262544, "learning_rate": 2.5112030202671154e-05, "loss": 0.3906, "loss_nan_ranks": 0, "loss_rank_avg": 0.11921098828315735, "step": 4035, "valid_targets_mean": 8395.6, "valid_targets_min": 1630 }, { "epoch": 2.383480825958702, "grad_norm": 0.17031332521729364, "learning_rate": 2.507219723194477e-05, "loss": 0.3844, "loss_nan_ranks": 0, "loss_rank_avg": 0.14918190240859985, "step": 4040, "valid_targets_mean": 12708.2, "valid_targets_min": 3373 }, { "epoch": 2.386430678466077, "grad_norm": 0.17823669644393042, "learning_rate": 2.5032342746867844e-05, "loss": 0.3827, "loss_nan_ranks": 0, "loss_rank_avg": 0.1188630759716034, "step": 4045, "valid_targets_mean": 11102.9, "valid_targets_min": 2383 }, { "epoch": 2.3893805309734515, "grad_norm": 0.17538450361576227, "learning_rate": 2.49924669164881e-05, "loss": 0.3935, "loss_nan_ranks": 0, "loss_rank_avg": 0.12793388962745667, "step": 4050, "valid_targets_mean": 9429.2, "valid_targets_min": 1243 }, { "epoch": 2.392330383480826, "grad_norm": 0.17032901916386253, "learning_rate": 2.495256990994378e-05, "loss": 0.389, "loss_nan_ranks": 0, "loss_rank_avg": 0.15003778040409088, "step": 4055, "valid_targets_mean": 12589.8, "valid_targets_min": 1293 }, { "epoch": 2.3952802359882006, "grad_norm": 0.17182426265268705, "learning_rate": 2.4912651896462967e-05, "loss": 0.3893, "loss_nan_ranks": 0, "loss_rank_avg": 0.12547190487384796, "step": 4060, "valid_targets_mean": 9731.8, "valid_targets_min": 1129 }, { "epoch": 2.398230088495575, "grad_norm": 0.17298035699811434, "learning_rate": 2.487271304536284e-05, "loss": 0.3879, "loss_nan_ranks": 0, "loss_rank_avg": 0.101053886115551, "step": 4065, "valid_targets_mean": 8218.8, "valid_targets_min": 595 }, { "epoch": 2.4011799410029497, "grad_norm": 0.16731123092758138, "learning_rate": 2.4832753526048977e-05, "loss": 0.3937, "loss_nan_ranks": 0, "loss_rank_avg": 0.12202181667089462, "step": 4070, "valid_targets_mean": 9081.4, "valid_targets_min": 888 }, { "epoch": 2.4041297935103243, "grad_norm": 0.17594985833188911, "learning_rate": 2.4792773508014597e-05, "loss": 0.3858, "loss_nan_ranks": 0, "loss_rank_avg": 0.13053381443023682, "step": 4075, "valid_targets_mean": 10127.8, "valid_targets_min": 1547 }, { "epoch": 2.4070796460176993, "grad_norm": 0.1725954639777345, "learning_rate": 2.4752773160839885e-05, "loss": 0.388, "loss_nan_ranks": 0, "loss_rank_avg": 0.12309059500694275, "step": 4080, "valid_targets_mean": 9777.3, "valid_targets_min": 1666 }, { "epoch": 2.410029498525074, "grad_norm": 0.17639722633497423, "learning_rate": 2.4712752654191254e-05, "loss": 0.3893, "loss_nan_ranks": 0, "loss_rank_avg": 0.11810016632080078, "step": 4085, "valid_targets_mean": 8813.1, "valid_targets_min": 2184 }, { "epoch": 2.4129793510324484, "grad_norm": 0.1845806404741444, "learning_rate": 2.467271215782061e-05, "loss": 0.3947, "loss_nan_ranks": 0, "loss_rank_avg": 0.12740883231163025, "step": 4090, "valid_targets_mean": 9679.6, "valid_targets_min": 2445 }, { "epoch": 2.415929203539823, "grad_norm": 0.18118441307550773, "learning_rate": 2.4632651841564673e-05, "loss": 0.3929, "loss_nan_ranks": 0, "loss_rank_avg": 0.12179508060216904, "step": 4095, "valid_targets_mean": 10510.3, "valid_targets_min": 1998 }, { "epoch": 2.4188790560471976, "grad_norm": 0.18764285880053957, "learning_rate": 2.4592571875344217e-05, "loss": 0.3786, "loss_nan_ranks": 0, "loss_rank_avg": 0.1726941615343094, "step": 4100, "valid_targets_mean": 12465.5, "valid_targets_min": 1710 }, { "epoch": 2.421828908554572, "grad_norm": 0.18199183358032803, "learning_rate": 2.4552472429163357e-05, "loss": 0.3711, "loss_nan_ranks": 0, "loss_rank_avg": 0.14343643188476562, "step": 4105, "valid_targets_mean": 10231.8, "valid_targets_min": 2259 }, { "epoch": 2.4247787610619467, "grad_norm": 0.1725750391349139, "learning_rate": 2.4512353673108847e-05, "loss": 0.3753, "loss_nan_ranks": 0, "loss_rank_avg": 0.1398804783821106, "step": 4110, "valid_targets_mean": 13320.7, "valid_targets_min": 1376 }, { "epoch": 2.4277286135693217, "grad_norm": 0.18305122770334165, "learning_rate": 2.4472215777349346e-05, "loss": 0.3667, "loss_nan_ranks": 0, "loss_rank_avg": 0.10101216286420822, "step": 4115, "valid_targets_mean": 8426.0, "valid_targets_min": 1654 }, { "epoch": 2.4306784660766962, "grad_norm": 0.1926083380216005, "learning_rate": 2.4432058912134695e-05, "loss": 0.3714, "loss_nan_ranks": 0, "loss_rank_avg": 0.11317503452301025, "step": 4120, "valid_targets_mean": 8610.3, "valid_targets_min": 2335 }, { "epoch": 2.433628318584071, "grad_norm": 0.2196195456089233, "learning_rate": 2.439188324779518e-05, "loss": 0.3709, "loss_nan_ranks": 0, "loss_rank_avg": 0.12208309769630432, "step": 4125, "valid_targets_mean": 9733.9, "valid_targets_min": 2604 }, { "epoch": 2.4365781710914454, "grad_norm": 0.2002734068453938, "learning_rate": 2.435168895474085e-05, "loss": 0.3679, "loss_nan_ranks": 0, "loss_rank_avg": 0.09944422543048859, "step": 4130, "valid_targets_mean": 7887.3, "valid_targets_min": 961 }, { "epoch": 2.43952802359882, "grad_norm": 0.1974919985284759, "learning_rate": 2.4311476203460753e-05, "loss": 0.3722, "loss_nan_ranks": 0, "loss_rank_avg": 0.14025208353996277, "step": 4135, "valid_targets_mean": 12008.4, "valid_targets_min": 3631 }, { "epoch": 2.442477876106195, "grad_norm": 0.1992481010119958, "learning_rate": 2.4271245164522244e-05, "loss": 0.3792, "loss_nan_ranks": 0, "loss_rank_avg": 0.13258278369903564, "step": 4140, "valid_targets_mean": 11155.2, "valid_targets_min": 2731 }, { "epoch": 2.4454277286135695, "grad_norm": 0.18912241428488177, "learning_rate": 2.4230996008570237e-05, "loss": 0.367, "loss_nan_ranks": 0, "loss_rank_avg": 0.1264360398054123, "step": 4145, "valid_targets_mean": 10674.4, "valid_targets_min": 1317 }, { "epoch": 2.448377581120944, "grad_norm": 0.18223546620888548, "learning_rate": 2.4190728906326496e-05, "loss": 0.3698, "loss_nan_ranks": 0, "loss_rank_avg": 0.14574602246284485, "step": 4150, "valid_targets_mean": 11136.4, "valid_targets_min": 1890 }, { "epoch": 2.4513274336283186, "grad_norm": 0.20209171805214524, "learning_rate": 2.4150444028588896e-05, "loss": 0.3723, "loss_nan_ranks": 0, "loss_rank_avg": 0.15436725318431854, "step": 4155, "valid_targets_mean": 12538.8, "valid_targets_min": 1856 }, { "epoch": 2.454277286135693, "grad_norm": 0.1981802269778582, "learning_rate": 2.411014154623073e-05, "loss": 0.3809, "loss_nan_ranks": 0, "loss_rank_avg": 0.14357636868953705, "step": 4160, "valid_targets_mean": 11351.3, "valid_targets_min": 1738 }, { "epoch": 2.4572271386430677, "grad_norm": 0.18767130154313147, "learning_rate": 2.4069821630199938e-05, "loss": 0.3727, "loss_nan_ranks": 0, "loss_rank_avg": 0.10319440811872482, "step": 4165, "valid_targets_mean": 9638.6, "valid_targets_min": 2769 }, { "epoch": 2.4601769911504423, "grad_norm": 0.20106308424588426, "learning_rate": 2.402948445151843e-05, "loss": 0.3709, "loss_nan_ranks": 0, "loss_rank_avg": 0.12477102875709534, "step": 4170, "valid_targets_mean": 10217.3, "valid_targets_min": 1867 }, { "epoch": 2.4631268436578173, "grad_norm": 0.1878349564170574, "learning_rate": 2.3989130181281323e-05, "loss": 0.3686, "loss_nan_ranks": 0, "loss_rank_avg": 0.12376038730144501, "step": 4175, "valid_targets_mean": 10830.1, "valid_targets_min": 2056 }, { "epoch": 2.466076696165192, "grad_norm": 0.182326417226956, "learning_rate": 2.3948758990656232e-05, "loss": 0.3666, "loss_nan_ranks": 0, "loss_rank_avg": 0.09735498577356339, "step": 4180, "valid_targets_mean": 8065.7, "valid_targets_min": 2250 }, { "epoch": 2.4690265486725664, "grad_norm": 0.17881624649061542, "learning_rate": 2.3908371050882554e-05, "loss": 0.3733, "loss_nan_ranks": 0, "loss_rank_avg": 0.11818811297416687, "step": 4185, "valid_targets_mean": 10655.2, "valid_targets_min": 2555 }, { "epoch": 2.471976401179941, "grad_norm": 0.2015720023458747, "learning_rate": 2.3867966533270716e-05, "loss": 0.3695, "loss_nan_ranks": 0, "loss_rank_avg": 0.1320725679397583, "step": 4190, "valid_targets_mean": 11071.5, "valid_targets_min": 860 }, { "epoch": 2.4749262536873156, "grad_norm": 0.19971733040726514, "learning_rate": 2.3827545609201462e-05, "loss": 0.3641, "loss_nan_ranks": 0, "loss_rank_avg": 0.14172565937042236, "step": 4195, "valid_targets_mean": 11408.9, "valid_targets_min": 2015 }, { "epoch": 2.47787610619469, "grad_norm": 0.1895322692289199, "learning_rate": 2.3787108450125133e-05, "loss": 0.372, "loss_nan_ranks": 0, "loss_rank_avg": 0.10191375017166138, "step": 4200, "valid_targets_mean": 9568.1, "valid_targets_min": 1913 }, { "epoch": 2.4808259587020647, "grad_norm": 0.189797790905414, "learning_rate": 2.3746655227560932e-05, "loss": 0.3743, "loss_nan_ranks": 0, "loss_rank_avg": 0.11338387429714203, "step": 4205, "valid_targets_mean": 9056.0, "valid_targets_min": 1585 }, { "epoch": 2.4837758112094397, "grad_norm": 0.19042071073474165, "learning_rate": 2.3706186113096187e-05, "loss": 0.3688, "loss_nan_ranks": 0, "loss_rank_avg": 0.1429302990436554, "step": 4210, "valid_targets_mean": 13044.3, "valid_targets_min": 2160 }, { "epoch": 2.4867256637168142, "grad_norm": 0.194122243175992, "learning_rate": 2.366570127838564e-05, "loss": 0.3738, "loss_nan_ranks": 0, "loss_rank_avg": 0.10320837795734406, "step": 4215, "valid_targets_mean": 9486.9, "valid_targets_min": 1543 }, { "epoch": 2.489675516224189, "grad_norm": 0.17235334362756774, "learning_rate": 2.362520089515073e-05, "loss": 0.374, "loss_nan_ranks": 0, "loss_rank_avg": 0.10433302819728851, "step": 4220, "valid_targets_mean": 9637.9, "valid_targets_min": 1453 }, { "epoch": 2.4926253687315634, "grad_norm": 0.17737199801949888, "learning_rate": 2.358468513517882e-05, "loss": 0.3744, "loss_nan_ranks": 0, "loss_rank_avg": 0.1555056869983673, "step": 4225, "valid_targets_mean": 11221.1, "valid_targets_min": 1861 }, { "epoch": 2.495575221238938, "grad_norm": 0.1776538389094094, "learning_rate": 2.35441541703225e-05, "loss": 0.3734, "loss_nan_ranks": 0, "loss_rank_avg": 0.10380370914936066, "step": 4230, "valid_targets_mean": 7896.7, "valid_targets_min": 1601 }, { "epoch": 2.4985250737463125, "grad_norm": 0.16806275136850427, "learning_rate": 2.3503608172498878e-05, "loss": 0.3737, "loss_nan_ranks": 0, "loss_rank_avg": 0.1344701498746872, "step": 4235, "valid_targets_mean": 11206.3, "valid_targets_min": 2567 }, { "epoch": 2.501474926253687, "grad_norm": 0.1838042863563555, "learning_rate": 2.346304731368879e-05, "loss": 0.3638, "loss_nan_ranks": 0, "loss_rank_avg": 0.12868273258209229, "step": 4240, "valid_targets_mean": 9940.7, "valid_targets_min": 1487 }, { "epoch": 2.504424778761062, "grad_norm": 0.1882399630093764, "learning_rate": 2.3422471765936124e-05, "loss": 0.3703, "loss_nan_ranks": 0, "loss_rank_avg": 0.12242631614208221, "step": 4245, "valid_targets_mean": 9426.9, "valid_targets_min": 1920 }, { "epoch": 2.5073746312684366, "grad_norm": 0.1927731789030749, "learning_rate": 2.338188170134709e-05, "loss": 0.3738, "loss_nan_ranks": 0, "loss_rank_avg": 0.1051219254732132, "step": 4250, "valid_targets_mean": 7889.9, "valid_targets_min": 1997 }, { "epoch": 2.510324483775811, "grad_norm": 0.19010092340967272, "learning_rate": 2.3341277292089446e-05, "loss": 0.3655, "loss_nan_ranks": 0, "loss_rank_avg": 0.10231277346611023, "step": 4255, "valid_targets_mean": 8702.3, "valid_targets_min": 2150 }, { "epoch": 2.5132743362831858, "grad_norm": 0.18926011510358104, "learning_rate": 2.33006587103918e-05, "loss": 0.362, "loss_nan_ranks": 0, "loss_rank_avg": 0.14327773451805115, "step": 4260, "valid_targets_mean": 11533.9, "valid_targets_min": 1871 }, { "epoch": 2.5162241887905603, "grad_norm": 0.19331180232935863, "learning_rate": 2.3260026128542886e-05, "loss": 0.3586, "loss_nan_ranks": 0, "loss_rank_avg": 0.11851916462182999, "step": 4265, "valid_targets_mean": 10099.0, "valid_targets_min": 2449 }, { "epoch": 2.5191740412979353, "grad_norm": 0.19110202290037573, "learning_rate": 2.3219379718890814e-05, "loss": 0.3637, "loss_nan_ranks": 0, "loss_rank_avg": 0.13638907670974731, "step": 4270, "valid_targets_mean": 10613.0, "valid_targets_min": 1767 }, { "epoch": 2.52212389380531, "grad_norm": 0.18240060005875852, "learning_rate": 2.317871965384235e-05, "loss": 0.3725, "loss_nan_ranks": 0, "loss_rank_avg": 0.12266083061695099, "step": 4275, "valid_targets_mean": 9735.8, "valid_targets_min": 1444 }, { "epoch": 2.5250737463126844, "grad_norm": 0.19650112914503412, "learning_rate": 2.3138046105862175e-05, "loss": 0.3779, "loss_nan_ranks": 0, "loss_rank_avg": 0.13388144969940186, "step": 4280, "valid_targets_mean": 12089.4, "valid_targets_min": 1483 }, { "epoch": 2.528023598820059, "grad_norm": 0.18887624139751505, "learning_rate": 2.3097359247472156e-05, "loss": 0.3742, "loss_nan_ranks": 0, "loss_rank_avg": 0.12826773524284363, "step": 4285, "valid_targets_mean": 9522.6, "valid_targets_min": 747 }, { "epoch": 2.5309734513274336, "grad_norm": 0.1966567564253813, "learning_rate": 2.3056659251250637e-05, "loss": 0.3618, "loss_nan_ranks": 0, "loss_rank_avg": 0.08406929671764374, "step": 4290, "valid_targets_mean": 6589.8, "valid_targets_min": 1001 }, { "epoch": 2.533923303834808, "grad_norm": 0.18282408339040876, "learning_rate": 2.301594628983166e-05, "loss": 0.3742, "loss_nan_ranks": 0, "loss_rank_avg": 0.11688566207885742, "step": 4295, "valid_targets_mean": 8307.7, "valid_targets_min": 1442 }, { "epoch": 2.5368731563421827, "grad_norm": 0.1875617083131164, "learning_rate": 2.2975220535904286e-05, "loss": 0.3645, "loss_nan_ranks": 0, "loss_rank_avg": 0.11464380472898483, "step": 4300, "valid_targets_mean": 9174.5, "valid_targets_min": 2099 }, { "epoch": 2.5398230088495577, "grad_norm": 0.1882850853875356, "learning_rate": 2.2934482162211827e-05, "loss": 0.3674, "loss_nan_ranks": 0, "loss_rank_avg": 0.127057284116745, "step": 4305, "valid_targets_mean": 9977.2, "valid_targets_min": 1385 }, { "epoch": 2.5427728613569323, "grad_norm": 0.1889501349131273, "learning_rate": 2.2893731341551117e-05, "loss": 0.3695, "loss_nan_ranks": 0, "loss_rank_avg": 0.10239008069038391, "step": 4310, "valid_targets_mean": 8322.1, "valid_targets_min": 2131 }, { "epoch": 2.545722713864307, "grad_norm": 0.17697629988020622, "learning_rate": 2.285296824677179e-05, "loss": 0.3745, "loss_nan_ranks": 0, "loss_rank_avg": 0.12793973088264465, "step": 4315, "valid_targets_mean": 10406.2, "valid_targets_min": 1407 }, { "epoch": 2.5486725663716814, "grad_norm": 0.19561789633386095, "learning_rate": 2.2812193050775552e-05, "loss": 0.3625, "loss_nan_ranks": 0, "loss_rank_avg": 0.140027716755867, "step": 4320, "valid_targets_mean": 12493.9, "valid_targets_min": 2457 }, { "epoch": 2.551622418879056, "grad_norm": 0.1802313241831928, "learning_rate": 2.2771405926515423e-05, "loss": 0.363, "loss_nan_ranks": 0, "loss_rank_avg": 0.10761629045009613, "step": 4325, "valid_targets_mean": 9960.1, "valid_targets_min": 2052 }, { "epoch": 2.554572271386431, "grad_norm": 0.1751657945259594, "learning_rate": 2.2730607046995026e-05, "loss": 0.3738, "loss_nan_ranks": 0, "loss_rank_avg": 0.10588338226079941, "step": 4330, "valid_targets_mean": 8378.8, "valid_targets_min": 1560 }, { "epoch": 2.557522123893805, "grad_norm": 0.19248830700949682, "learning_rate": 2.2689796585267843e-05, "loss": 0.3674, "loss_nan_ranks": 0, "loss_rank_avg": 0.11182724684476852, "step": 4335, "valid_targets_mean": 9472.5, "valid_targets_min": 2484 }, { "epoch": 2.56047197640118, "grad_norm": 0.18435708690786634, "learning_rate": 2.2648974714436473e-05, "loss": 0.3712, "loss_nan_ranks": 0, "loss_rank_avg": 0.11992965638637543, "step": 4340, "valid_targets_mean": 10299.2, "valid_targets_min": 878 }, { "epoch": 2.5634218289085546, "grad_norm": 0.17894693429898967, "learning_rate": 2.260814160765194e-05, "loss": 0.3693, "loss_nan_ranks": 0, "loss_rank_avg": 0.13005350530147552, "step": 4345, "valid_targets_mean": 10887.9, "valid_targets_min": 2125 }, { "epoch": 2.566371681415929, "grad_norm": 0.17833561968446868, "learning_rate": 2.2567297438112896e-05, "loss": 0.3667, "loss_nan_ranks": 0, "loss_rank_avg": 0.15313655138015747, "step": 4350, "valid_targets_mean": 12573.0, "valid_targets_min": 2048 }, { "epoch": 2.5693215339233038, "grad_norm": 0.18379146848722314, "learning_rate": 2.2526442379064926e-05, "loss": 0.371, "loss_nan_ranks": 0, "loss_rank_avg": 0.11305586993694305, "step": 4355, "valid_targets_mean": 9179.3, "valid_targets_min": 1147 }, { "epoch": 2.5722713864306783, "grad_norm": 0.1753040455053401, "learning_rate": 2.2485576603799804e-05, "loss": 0.3628, "loss_nan_ranks": 0, "loss_rank_avg": 0.1262725293636322, "step": 4360, "valid_targets_mean": 10706.8, "valid_targets_min": 1593 }, { "epoch": 2.5752212389380533, "grad_norm": 0.18485595887788345, "learning_rate": 2.2444700285654765e-05, "loss": 0.3662, "loss_nan_ranks": 0, "loss_rank_avg": 0.11888639628887177, "step": 4365, "valid_targets_mean": 9218.1, "valid_targets_min": 2137 }, { "epoch": 2.578171091445428, "grad_norm": 0.19103757174545843, "learning_rate": 2.240381359801175e-05, "loss": 0.3709, "loss_nan_ranks": 0, "loss_rank_avg": 0.13815957307815552, "step": 4370, "valid_targets_mean": 11224.7, "valid_targets_min": 1822 }, { "epoch": 2.5811209439528024, "grad_norm": 0.18190256491713522, "learning_rate": 2.236291671429669e-05, "loss": 0.367, "loss_nan_ranks": 0, "loss_rank_avg": 0.1305564045906067, "step": 4375, "valid_targets_mean": 11156.6, "valid_targets_min": 1606 }, { "epoch": 2.584070796460177, "grad_norm": 0.1912488927143699, "learning_rate": 2.232200980797877e-05, "loss": 0.3663, "loss_nan_ranks": 0, "loss_rank_avg": 0.13565358519554138, "step": 4380, "valid_targets_mean": 10960.1, "valid_targets_min": 1556 }, { "epoch": 2.5870206489675516, "grad_norm": 0.19092041778251356, "learning_rate": 2.2281093052569677e-05, "loss": 0.3701, "loss_nan_ranks": 0, "loss_rank_avg": 0.1110101193189621, "step": 4385, "valid_targets_mean": 9461.7, "valid_targets_min": 1929 }, { "epoch": 2.589970501474926, "grad_norm": 0.1909995367933586, "learning_rate": 2.224016662162289e-05, "loss": 0.3754, "loss_nan_ranks": 0, "loss_rank_avg": 0.1283772736787796, "step": 4390, "valid_targets_mean": 9745.5, "valid_targets_min": 1581 }, { "epoch": 2.5929203539823007, "grad_norm": 0.1875279301690173, "learning_rate": 2.2199230688732906e-05, "loss": 0.3641, "loss_nan_ranks": 0, "loss_rank_avg": 0.12525217235088348, "step": 4395, "valid_targets_mean": 10080.6, "valid_targets_min": 2923 }, { "epoch": 2.5958702064896757, "grad_norm": 0.20272720547415712, "learning_rate": 2.2158285427534537e-05, "loss": 0.3613, "loss_nan_ranks": 0, "loss_rank_avg": 0.11715195327997208, "step": 4400, "valid_targets_mean": 8127.2, "valid_targets_min": 1571 }, { "epoch": 2.5988200589970503, "grad_norm": 0.17990153107875204, "learning_rate": 2.2117331011702164e-05, "loss": 0.3716, "loss_nan_ranks": 0, "loss_rank_avg": 0.11927230656147003, "step": 4405, "valid_targets_mean": 10449.8, "valid_targets_min": 1912 }, { "epoch": 2.601769911504425, "grad_norm": 0.18373357287582748, "learning_rate": 2.2076367614948997e-05, "loss": 0.3698, "loss_nan_ranks": 0, "loss_rank_avg": 0.10929173231124878, "step": 4410, "valid_targets_mean": 8532.2, "valid_targets_min": 1791 }, { "epoch": 2.6047197640117994, "grad_norm": 0.18399152008258768, "learning_rate": 2.2035395411026338e-05, "loss": 0.3719, "loss_nan_ranks": 0, "loss_rank_avg": 0.1311100572347641, "step": 4415, "valid_targets_mean": 11387.8, "valid_targets_min": 2003 }, { "epoch": 2.607669616519174, "grad_norm": 0.18439145618369485, "learning_rate": 2.1994414573722834e-05, "loss": 0.3709, "loss_nan_ranks": 0, "loss_rank_avg": 0.11850002408027649, "step": 4420, "valid_targets_mean": 9229.9, "valid_targets_min": 2522 }, { "epoch": 2.6106194690265485, "grad_norm": 0.18488957845098064, "learning_rate": 2.195342527686379e-05, "loss": 0.3673, "loss_nan_ranks": 0, "loss_rank_avg": 0.14204034209251404, "step": 4425, "valid_targets_mean": 12198.8, "valid_targets_min": 1675 }, { "epoch": 2.613569321533923, "grad_norm": 0.19286103565402618, "learning_rate": 2.191242769431035e-05, "loss": 0.369, "loss_nan_ranks": 0, "loss_rank_avg": 0.1183563768863678, "step": 4430, "valid_targets_mean": 10017.0, "valid_targets_min": 1776 }, { "epoch": 2.616519174041298, "grad_norm": 0.17380589005055547, "learning_rate": 2.1871421999958823e-05, "loss": 0.3673, "loss_nan_ranks": 0, "loss_rank_avg": 0.11534374952316284, "step": 4435, "valid_targets_mean": 10342.0, "valid_targets_min": 1961 }, { "epoch": 2.6194690265486726, "grad_norm": 0.18262589410060973, "learning_rate": 2.1830408367739922e-05, "loss": 0.3679, "loss_nan_ranks": 0, "loss_rank_avg": 0.11956163495779037, "step": 4440, "valid_targets_mean": 9962.6, "valid_targets_min": 2405 }, { "epoch": 2.622418879056047, "grad_norm": 0.18353878588806358, "learning_rate": 2.1789386971618033e-05, "loss": 0.3693, "loss_nan_ranks": 0, "loss_rank_avg": 0.10075725615024567, "step": 4445, "valid_targets_mean": 8304.7, "valid_targets_min": 1978 }, { "epoch": 2.6253687315634218, "grad_norm": 0.18338574101129995, "learning_rate": 2.1748357985590464e-05, "loss": 0.3663, "loss_nan_ranks": 0, "loss_rank_avg": 0.13569006323814392, "step": 4450, "valid_targets_mean": 12342.4, "valid_targets_min": 2187 }, { "epoch": 2.6283185840707963, "grad_norm": 0.18731950611432518, "learning_rate": 2.1707321583686723e-05, "loss": 0.3677, "loss_nan_ranks": 0, "loss_rank_avg": 0.11985199898481369, "step": 4455, "valid_targets_mean": 9165.0, "valid_targets_min": 832 }, { "epoch": 2.6312684365781713, "grad_norm": 0.18179109075455493, "learning_rate": 2.166627793996778e-05, "loss": 0.3687, "loss_nan_ranks": 0, "loss_rank_avg": 0.11996208131313324, "step": 4460, "valid_targets_mean": 10573.9, "valid_targets_min": 2386 }, { "epoch": 2.6342182890855455, "grad_norm": 0.17639732749552067, "learning_rate": 2.162522722852531e-05, "loss": 0.3753, "loss_nan_ranks": 0, "loss_rank_avg": 0.09830086678266525, "step": 4465, "valid_targets_mean": 8261.4, "valid_targets_min": 1439 }, { "epoch": 2.6371681415929205, "grad_norm": 0.18624863734756492, "learning_rate": 2.1584169623480977e-05, "loss": 0.3793, "loss_nan_ranks": 0, "loss_rank_avg": 0.1318359673023224, "step": 4470, "valid_targets_mean": 9847.7, "valid_targets_min": 1767 }, { "epoch": 2.640117994100295, "grad_norm": 0.18671149749630092, "learning_rate": 2.1543105298985677e-05, "loss": 0.3677, "loss_nan_ranks": 0, "loss_rank_avg": 0.142843559384346, "step": 4475, "valid_targets_mean": 13030.2, "valid_targets_min": 2483 }, { "epoch": 2.6430678466076696, "grad_norm": 0.17576915778049942, "learning_rate": 2.150203442921881e-05, "loss": 0.3656, "loss_nan_ranks": 0, "loss_rank_avg": 0.11096139997243881, "step": 4480, "valid_targets_mean": 9731.1, "valid_targets_min": 1703 }, { "epoch": 2.646017699115044, "grad_norm": 0.19021455051682687, "learning_rate": 2.146095718838754e-05, "loss": 0.3673, "loss_nan_ranks": 0, "loss_rank_avg": 0.1263219118118286, "step": 4485, "valid_targets_mean": 10780.1, "valid_targets_min": 1649 }, { "epoch": 2.6489675516224187, "grad_norm": 0.25149441730176714, "learning_rate": 2.1419873750726047e-05, "loss": 0.3745, "loss_nan_ranks": 0, "loss_rank_avg": 0.12710106372833252, "step": 4490, "valid_targets_mean": 10743.4, "valid_targets_min": 1801 }, { "epoch": 2.6519174041297937, "grad_norm": 0.19309226911864125, "learning_rate": 2.137878429049481e-05, "loss": 0.3757, "loss_nan_ranks": 0, "loss_rank_avg": 0.09978538751602173, "step": 4495, "valid_targets_mean": 9102.6, "valid_targets_min": 1830 }, { "epoch": 2.6548672566371683, "grad_norm": 0.187598366499337, "learning_rate": 2.133768898197984e-05, "loss": 0.3647, "loss_nan_ranks": 0, "loss_rank_avg": 0.10561759769916534, "step": 4500, "valid_targets_mean": 9400.9, "valid_targets_min": 1853 }, { "epoch": 2.657817109144543, "grad_norm": 0.18176956089972085, "learning_rate": 2.129658799949197e-05, "loss": 0.3588, "loss_nan_ranks": 0, "loss_rank_avg": 0.11985710263252258, "step": 4505, "valid_targets_mean": 10114.0, "valid_targets_min": 2144 }, { "epoch": 2.6607669616519174, "grad_norm": 0.19152705920323992, "learning_rate": 2.1255481517366076e-05, "loss": 0.3588, "loss_nan_ranks": 0, "loss_rank_avg": 0.12177897989749908, "step": 4510, "valid_targets_mean": 9553.2, "valid_targets_min": 2181 }, { "epoch": 2.663716814159292, "grad_norm": 0.20006455174532503, "learning_rate": 2.1214369709960384e-05, "loss": 0.3698, "loss_nan_ranks": 0, "loss_rank_avg": 0.12645691633224487, "step": 4515, "valid_targets_mean": 9748.7, "valid_targets_min": 856 }, { "epoch": 2.6666666666666665, "grad_norm": 0.1951469538446342, "learning_rate": 2.1173252751655697e-05, "loss": 0.3723, "loss_nan_ranks": 0, "loss_rank_avg": 0.1358049213886261, "step": 4520, "valid_targets_mean": 12207.3, "valid_targets_min": 2941 }, { "epoch": 2.669616519174041, "grad_norm": 0.17741183567028762, "learning_rate": 2.113213081685466e-05, "loss": 0.3678, "loss_nan_ranks": 0, "loss_rank_avg": 0.1099037230014801, "step": 4525, "valid_targets_mean": 9607.7, "valid_targets_min": 1480 }, { "epoch": 2.672566371681416, "grad_norm": 0.17114246748827758, "learning_rate": 2.109100407998105e-05, "loss": 0.3756, "loss_nan_ranks": 0, "loss_rank_avg": 0.1161927580833435, "step": 4530, "valid_targets_mean": 10516.6, "valid_targets_min": 1750 }, { "epoch": 2.6755162241887906, "grad_norm": 0.1736298535501412, "learning_rate": 2.104987271547899e-05, "loss": 0.3685, "loss_nan_ranks": 0, "loss_rank_avg": 0.10709735751152039, "step": 4535, "valid_targets_mean": 9166.2, "valid_targets_min": 2342 }, { "epoch": 2.678466076696165, "grad_norm": 0.18858861763150891, "learning_rate": 2.1008736897812233e-05, "loss": 0.3703, "loss_nan_ranks": 0, "loss_rank_avg": 0.14287090301513672, "step": 4540, "valid_targets_mean": 10198.2, "valid_targets_min": 1888 }, { "epoch": 2.6814159292035398, "grad_norm": 0.20388340088823198, "learning_rate": 2.0967596801463433e-05, "loss": 0.3695, "loss_nan_ranks": 0, "loss_rank_avg": 0.12462417036294937, "step": 4545, "valid_targets_mean": 9976.0, "valid_targets_min": 1591 }, { "epoch": 2.6843657817109143, "grad_norm": 0.18788704479085547, "learning_rate": 2.0926452600933388e-05, "loss": 0.3652, "loss_nan_ranks": 0, "loss_rank_avg": 0.11166876554489136, "step": 4550, "valid_targets_mean": 8667.3, "valid_targets_min": 1636 }, { "epoch": 2.6873156342182893, "grad_norm": 0.18354787267923775, "learning_rate": 2.0885304470740294e-05, "loss": 0.3691, "loss_nan_ranks": 0, "loss_rank_avg": 0.14732298254966736, "step": 4555, "valid_targets_mean": 11671.9, "valid_targets_min": 1372 }, { "epoch": 2.6902654867256635, "grad_norm": 0.1982192113522515, "learning_rate": 2.084415258541903e-05, "loss": 0.3702, "loss_nan_ranks": 0, "loss_rank_avg": 0.10863981395959854, "step": 4560, "valid_targets_mean": 8705.5, "valid_targets_min": 788 }, { "epoch": 2.6932153392330385, "grad_norm": 0.18149704019737828, "learning_rate": 2.0802997119520393e-05, "loss": 0.3706, "loss_nan_ranks": 0, "loss_rank_avg": 0.12404702603816986, "step": 4565, "valid_targets_mean": 10789.9, "valid_targets_min": 1629 }, { "epoch": 2.696165191740413, "grad_norm": 0.1792480079906465, "learning_rate": 2.0761838247610372e-05, "loss": 0.3748, "loss_nan_ranks": 0, "loss_rank_avg": 0.11676395684480667, "step": 4570, "valid_targets_mean": 9820.9, "valid_targets_min": 2079 }, { "epoch": 2.6991150442477876, "grad_norm": 0.16606762751806176, "learning_rate": 2.0720676144269407e-05, "loss": 0.3665, "loss_nan_ranks": 0, "loss_rank_avg": 0.11027930676937103, "step": 4575, "valid_targets_mean": 9519.0, "valid_targets_min": 1443 }, { "epoch": 2.702064896755162, "grad_norm": 0.16722925771852787, "learning_rate": 2.067951098409162e-05, "loss": 0.3671, "loss_nan_ranks": 0, "loss_rank_avg": 0.1202898919582367, "step": 4580, "valid_targets_mean": 11148.6, "valid_targets_min": 2844 }, { "epoch": 2.7050147492625367, "grad_norm": 0.18963004352089147, "learning_rate": 2.0638342941684146e-05, "loss": 0.3704, "loss_nan_ranks": 0, "loss_rank_avg": 0.15341144800186157, "step": 4585, "valid_targets_mean": 11772.3, "valid_targets_min": 2041 }, { "epoch": 2.7079646017699117, "grad_norm": 0.1807969224641405, "learning_rate": 2.0597172191666304e-05, "loss": 0.3662, "loss_nan_ranks": 0, "loss_rank_avg": 0.1127198189496994, "step": 4590, "valid_targets_mean": 9464.2, "valid_targets_min": 2006 }, { "epoch": 2.7109144542772863, "grad_norm": 0.1765733977482184, "learning_rate": 2.05559989086689e-05, "loss": 0.3723, "loss_nan_ranks": 0, "loss_rank_avg": 0.11121810972690582, "step": 4595, "valid_targets_mean": 10115.8, "valid_targets_min": 2033 }, { "epoch": 2.713864306784661, "grad_norm": 0.18313305838435828, "learning_rate": 2.0514823267333517e-05, "loss": 0.3622, "loss_nan_ranks": 0, "loss_rank_avg": 0.09712762385606766, "step": 4600, "valid_targets_mean": 8914.2, "valid_targets_min": 1829 }, { "epoch": 2.7168141592920354, "grad_norm": 0.19119710102039167, "learning_rate": 2.0473645442311704e-05, "loss": 0.3644, "loss_nan_ranks": 0, "loss_rank_avg": 0.1367199420928955, "step": 4605, "valid_targets_mean": 11594.1, "valid_targets_min": 1466 }, { "epoch": 2.71976401179941, "grad_norm": 0.17179732392777203, "learning_rate": 2.04324656082643e-05, "loss": 0.3664, "loss_nan_ranks": 0, "loss_rank_avg": 0.12338307499885559, "step": 4610, "valid_targets_mean": 10735.3, "valid_targets_min": 1786 }, { "epoch": 2.7227138643067845, "grad_norm": 0.19797993394417737, "learning_rate": 2.0391283939860642e-05, "loss": 0.3654, "loss_nan_ranks": 0, "loss_rank_avg": 0.12678474187850952, "step": 4615, "valid_targets_mean": 11454.9, "valid_targets_min": 2305 }, { "epoch": 2.725663716814159, "grad_norm": 0.18470224773039076, "learning_rate": 2.0350100611777857e-05, "loss": 0.3727, "loss_nan_ranks": 0, "loss_rank_avg": 0.10877864062786102, "step": 4620, "valid_targets_mean": 9119.2, "valid_targets_min": 933 }, { "epoch": 2.728613569321534, "grad_norm": 0.18900877777413866, "learning_rate": 2.0308915798700125e-05, "loss": 0.3718, "loss_nan_ranks": 0, "loss_rank_avg": 0.10504063218832016, "step": 4625, "valid_targets_mean": 9410.8, "valid_targets_min": 1837 }, { "epoch": 2.7315634218289087, "grad_norm": 0.17971348147208774, "learning_rate": 2.0267729675317907e-05, "loss": 0.3628, "loss_nan_ranks": 0, "loss_rank_avg": 0.10653070360422134, "step": 4630, "valid_targets_mean": 9461.3, "valid_targets_min": 1841 }, { "epoch": 2.734513274336283, "grad_norm": 0.17252415962273776, "learning_rate": 2.022654241632723e-05, "loss": 0.3677, "loss_nan_ranks": 0, "loss_rank_avg": 0.14466625452041626, "step": 4635, "valid_targets_mean": 12400.2, "valid_targets_min": 2042 }, { "epoch": 2.737463126843658, "grad_norm": 0.17425963981703763, "learning_rate": 2.018535419642894e-05, "loss": 0.3686, "loss_nan_ranks": 0, "loss_rank_avg": 0.14283370971679688, "step": 4640, "valid_targets_mean": 12530.3, "valid_targets_min": 2926 }, { "epoch": 2.7404129793510323, "grad_norm": 0.23167496325337464, "learning_rate": 2.0144165190327944e-05, "loss": 0.3661, "loss_nan_ranks": 0, "loss_rank_avg": 0.131038635969162, "step": 4645, "valid_targets_mean": 10509.6, "valid_targets_min": 649 }, { "epoch": 2.7433628318584073, "grad_norm": 0.17833373920160922, "learning_rate": 2.0102975572732503e-05, "loss": 0.3643, "loss_nan_ranks": 0, "loss_rank_avg": 0.11860808730125427, "step": 4650, "valid_targets_mean": 9454.0, "valid_targets_min": 2003 }, { "epoch": 2.7463126843657815, "grad_norm": 0.17324651993806348, "learning_rate": 2.0061785518353468e-05, "loss": 0.3676, "loss_nan_ranks": 0, "loss_rank_avg": 0.11439033597707748, "step": 4655, "valid_targets_mean": 9103.6, "valid_targets_min": 1608 }, { "epoch": 2.7492625368731565, "grad_norm": 0.19583402036382658, "learning_rate": 2.002059520190352e-05, "loss": 0.3644, "loss_nan_ranks": 0, "loss_rank_avg": 0.11621478199958801, "step": 4660, "valid_targets_mean": 9436.6, "valid_targets_min": 2137 }, { "epoch": 2.752212389380531, "grad_norm": 0.19255695069921716, "learning_rate": 1.9979404798096488e-05, "loss": 0.3654, "loss_nan_ranks": 0, "loss_rank_avg": 0.11613614857196808, "step": 4665, "valid_targets_mean": 9747.0, "valid_targets_min": 1135 }, { "epoch": 2.7551622418879056, "grad_norm": 0.18838882767985898, "learning_rate": 1.9938214481646542e-05, "loss": 0.3693, "loss_nan_ranks": 0, "loss_rank_avg": 0.12855328619480133, "step": 4670, "valid_targets_mean": 10079.6, "valid_targets_min": 2286 }, { "epoch": 2.75811209439528, "grad_norm": 0.18275839926832513, "learning_rate": 1.9897024427267503e-05, "loss": 0.3736, "loss_nan_ranks": 0, "loss_rank_avg": 0.12765586376190186, "step": 4675, "valid_targets_mean": 10582.6, "valid_targets_min": 1657 }, { "epoch": 2.7610619469026547, "grad_norm": 0.1834833774953928, "learning_rate": 1.9855834809672062e-05, "loss": 0.3721, "loss_nan_ranks": 0, "loss_rank_avg": 0.11331748217344284, "step": 4680, "valid_targets_mean": 8869.7, "valid_targets_min": 1883 }, { "epoch": 2.7640117994100297, "grad_norm": 0.19381022380541693, "learning_rate": 1.981464580357107e-05, "loss": 0.3595, "loss_nan_ranks": 0, "loss_rank_avg": 0.12564757466316223, "step": 4685, "valid_targets_mean": 10999.8, "valid_targets_min": 1608 }, { "epoch": 2.7669616519174043, "grad_norm": 0.18231953861993394, "learning_rate": 1.9773457583672774e-05, "loss": 0.3688, "loss_nan_ranks": 0, "loss_rank_avg": 0.12267229706048965, "step": 4690, "valid_targets_mean": 10845.2, "valid_targets_min": 1769 }, { "epoch": 2.769911504424779, "grad_norm": 0.1755478274789862, "learning_rate": 1.9732270324682096e-05, "loss": 0.366, "loss_nan_ranks": 0, "loss_rank_avg": 0.12882521748542786, "step": 4695, "valid_targets_mean": 11583.4, "valid_targets_min": 2726 }, { "epoch": 2.7728613569321534, "grad_norm": 0.17971417614952098, "learning_rate": 1.9691084201299882e-05, "loss": 0.3635, "loss_nan_ranks": 0, "loss_rank_avg": 0.10892309248447418, "step": 4700, "valid_targets_mean": 9023.2, "valid_targets_min": 1719 }, { "epoch": 2.775811209439528, "grad_norm": 0.19549557753074975, "learning_rate": 1.9649899388222146e-05, "loss": 0.367, "loss_nan_ranks": 0, "loss_rank_avg": 0.14118340611457825, "step": 4705, "valid_targets_mean": 11621.1, "valid_targets_min": 1627 }, { "epoch": 2.7787610619469025, "grad_norm": 0.19667987961284608, "learning_rate": 1.9608716060139364e-05, "loss": 0.3628, "loss_nan_ranks": 0, "loss_rank_avg": 0.14556458592414856, "step": 4710, "valid_targets_mean": 10227.8, "valid_targets_min": 2542 }, { "epoch": 2.781710914454277, "grad_norm": 0.19029304074955575, "learning_rate": 1.9567534391735704e-05, "loss": 0.3596, "loss_nan_ranks": 0, "loss_rank_avg": 0.11205069720745087, "step": 4715, "valid_targets_mean": 8847.1, "valid_targets_min": 2962 }, { "epoch": 2.784660766961652, "grad_norm": 0.19017228149174456, "learning_rate": 1.95263545576883e-05, "loss": 0.3688, "loss_nan_ranks": 0, "loss_rank_avg": 0.12900149822235107, "step": 4720, "valid_targets_mean": 11824.5, "valid_targets_min": 2336 }, { "epoch": 2.7876106194690267, "grad_norm": 0.17552727463563755, "learning_rate": 1.9485176732666483e-05, "loss": 0.3699, "loss_nan_ranks": 0, "loss_rank_avg": 0.15375812351703644, "step": 4725, "valid_targets_mean": 13422.8, "valid_targets_min": 2469 }, { "epoch": 2.7905604719764012, "grad_norm": 0.17668174384809351, "learning_rate": 1.9444001091331106e-05, "loss": 0.3663, "loss_nan_ranks": 0, "loss_rank_avg": 0.0886571928858757, "step": 4730, "valid_targets_mean": 8039.5, "valid_targets_min": 1011 }, { "epoch": 2.793510324483776, "grad_norm": 0.18169782556029626, "learning_rate": 1.9402827808333703e-05, "loss": 0.365, "loss_nan_ranks": 0, "loss_rank_avg": 0.09978793561458588, "step": 4735, "valid_targets_mean": 8162.9, "valid_targets_min": 1768 }, { "epoch": 2.7964601769911503, "grad_norm": 0.19792473116928858, "learning_rate": 1.936165705831586e-05, "loss": 0.366, "loss_nan_ranks": 0, "loss_rank_avg": 0.1303151547908783, "step": 4740, "valid_targets_mean": 9680.6, "valid_targets_min": 1517 }, { "epoch": 2.799410029498525, "grad_norm": 0.19539839901298892, "learning_rate": 1.9320489015908382e-05, "loss": 0.3673, "loss_nan_ranks": 0, "loss_rank_avg": 0.12567034363746643, "step": 4745, "valid_targets_mean": 10204.0, "valid_targets_min": 1856 }, { "epoch": 2.8023598820058995, "grad_norm": 0.18421451976344766, "learning_rate": 1.9279323855730607e-05, "loss": 0.3644, "loss_nan_ranks": 0, "loss_rank_avg": 0.1409921497106552, "step": 4750, "valid_targets_mean": 11088.9, "valid_targets_min": 3033 }, { "epoch": 2.8053097345132745, "grad_norm": 0.1832810400326197, "learning_rate": 1.923816175238963e-05, "loss": 0.3712, "loss_nan_ranks": 0, "loss_rank_avg": 0.10676514357328415, "step": 4755, "valid_targets_mean": 8808.9, "valid_targets_min": 1628 }, { "epoch": 2.808259587020649, "grad_norm": 0.1810538852883411, "learning_rate": 1.9197002880479617e-05, "loss": 0.3641, "loss_nan_ranks": 0, "loss_rank_avg": 0.12992864847183228, "step": 4760, "valid_targets_mean": 10004.9, "valid_targets_min": 2090 }, { "epoch": 2.8112094395280236, "grad_norm": 0.1738368857577118, "learning_rate": 1.9155847414580976e-05, "loss": 0.3703, "loss_nan_ranks": 0, "loss_rank_avg": 0.12918700277805328, "step": 4765, "valid_targets_mean": 11585.9, "valid_targets_min": 1578 }, { "epoch": 2.814159292035398, "grad_norm": 0.18899097255754913, "learning_rate": 1.911469552925971e-05, "loss": 0.3648, "loss_nan_ranks": 0, "loss_rank_avg": 0.13440260291099548, "step": 4770, "valid_targets_mean": 10658.7, "valid_targets_min": 1712 }, { "epoch": 2.8171091445427727, "grad_norm": 0.1795972722764541, "learning_rate": 1.9073547399066622e-05, "loss": 0.3669, "loss_nan_ranks": 0, "loss_rank_avg": 0.1385485976934433, "step": 4775, "valid_targets_mean": 11714.4, "valid_targets_min": 2874 }, { "epoch": 2.8200589970501477, "grad_norm": 0.18542696771062736, "learning_rate": 1.903240319853657e-05, "loss": 0.3627, "loss_nan_ranks": 0, "loss_rank_avg": 0.10369464010000229, "step": 4780, "valid_targets_mean": 9205.3, "valid_targets_min": 2733 }, { "epoch": 2.823008849557522, "grad_norm": 0.1781187344729139, "learning_rate": 1.899126310218777e-05, "loss": 0.3615, "loss_nan_ranks": 0, "loss_rank_avg": 0.10259953886270523, "step": 4785, "valid_targets_mean": 8837.8, "valid_targets_min": 2032 }, { "epoch": 2.825958702064897, "grad_norm": 0.17727229452137436, "learning_rate": 1.8950127284521017e-05, "loss": 0.363, "loss_nan_ranks": 0, "loss_rank_avg": 0.11819326877593994, "step": 4790, "valid_targets_mean": 10313.7, "valid_targets_min": 2037 }, { "epoch": 2.8289085545722714, "grad_norm": 0.18090764145907315, "learning_rate": 1.890899592001895e-05, "loss": 0.3676, "loss_nan_ranks": 0, "loss_rank_avg": 0.09841946512460709, "step": 4795, "valid_targets_mean": 8079.2, "valid_targets_min": 1799 }, { "epoch": 2.831858407079646, "grad_norm": 0.17355190974088425, "learning_rate": 1.886786918314534e-05, "loss": 0.3596, "loss_nan_ranks": 0, "loss_rank_avg": 0.14969128370285034, "step": 4800, "valid_targets_mean": 11687.4, "valid_targets_min": 1660 }, { "epoch": 2.8348082595870205, "grad_norm": 0.17647187850701593, "learning_rate": 1.8826747248344313e-05, "loss": 0.372, "loss_nan_ranks": 0, "loss_rank_avg": 0.11566095054149628, "step": 4805, "valid_targets_mean": 9689.1, "valid_targets_min": 1213 }, { "epoch": 2.837758112094395, "grad_norm": 0.17722114617807447, "learning_rate": 1.8785630290039623e-05, "loss": 0.3669, "loss_nan_ranks": 0, "loss_rank_avg": 0.1614227592945099, "step": 4810, "valid_targets_mean": 13727.9, "valid_targets_min": 2019 }, { "epoch": 2.84070796460177, "grad_norm": 0.1773785236767756, "learning_rate": 1.8744518482633934e-05, "loss": 0.3651, "loss_nan_ranks": 0, "loss_rank_avg": 0.10308026522397995, "step": 4815, "valid_targets_mean": 8408.8, "valid_targets_min": 1770 }, { "epoch": 2.8436578171091447, "grad_norm": 0.17990207506219663, "learning_rate": 1.8703412000508038e-05, "loss": 0.37, "loss_nan_ranks": 0, "loss_rank_avg": 0.13289114832878113, "step": 4820, "valid_targets_mean": 10496.0, "valid_targets_min": 1924 }, { "epoch": 2.8466076696165192, "grad_norm": 0.1775576622667924, "learning_rate": 1.8662311018020164e-05, "loss": 0.3654, "loss_nan_ranks": 0, "loss_rank_avg": 0.1118200272321701, "step": 4825, "valid_targets_mean": 9131.2, "valid_targets_min": 2712 }, { "epoch": 2.849557522123894, "grad_norm": 0.19810895558544087, "learning_rate": 1.8621215709505193e-05, "loss": 0.3661, "loss_nan_ranks": 0, "loss_rank_avg": 0.12048914283514023, "step": 4830, "valid_targets_mean": 8391.5, "valid_targets_min": 1896 }, { "epoch": 2.8525073746312684, "grad_norm": 0.17216688915829712, "learning_rate": 1.8580126249273963e-05, "loss": 0.361, "loss_nan_ranks": 0, "loss_rank_avg": 0.11605193465948105, "step": 4835, "valid_targets_mean": 9973.9, "valid_targets_min": 1874 }, { "epoch": 2.855457227138643, "grad_norm": 0.16684034444297652, "learning_rate": 1.853904281161247e-05, "loss": 0.3649, "loss_nan_ranks": 0, "loss_rank_avg": 0.12890911102294922, "step": 4840, "valid_targets_mean": 11387.2, "valid_targets_min": 2079 }, { "epoch": 2.8584070796460175, "grad_norm": 0.1778916844191916, "learning_rate": 1.8497965570781194e-05, "loss": 0.3644, "loss_nan_ranks": 0, "loss_rank_avg": 0.12453418970108032, "step": 4845, "valid_targets_mean": 9381.8, "valid_targets_min": 1708 }, { "epoch": 2.8613569321533925, "grad_norm": 0.180746525736262, "learning_rate": 1.845689470101433e-05, "loss": 0.3692, "loss_nan_ranks": 0, "loss_rank_avg": 0.11520042270421982, "step": 4850, "valid_targets_mean": 8509.3, "valid_targets_min": 1118 }, { "epoch": 2.864306784660767, "grad_norm": 0.17748264133156372, "learning_rate": 1.8415830376519023e-05, "loss": 0.3698, "loss_nan_ranks": 0, "loss_rank_avg": 0.12190565466880798, "step": 4855, "valid_targets_mean": 10374.7, "valid_targets_min": 2011 }, { "epoch": 2.8672566371681416, "grad_norm": 0.17404569841144527, "learning_rate": 1.8374772771474697e-05, "loss": 0.368, "loss_nan_ranks": 0, "loss_rank_avg": 0.1507178097963333, "step": 4860, "valid_targets_mean": 12519.0, "valid_targets_min": 1887 }, { "epoch": 2.870206489675516, "grad_norm": 0.17223673440063744, "learning_rate": 1.8333722060032224e-05, "loss": 0.3614, "loss_nan_ranks": 0, "loss_rank_avg": 0.11666902899742126, "step": 4865, "valid_targets_mean": 9916.1, "valid_targets_min": 1793 }, { "epoch": 2.8731563421828907, "grad_norm": 0.18930517136336042, "learning_rate": 1.8292678416313283e-05, "loss": 0.3735, "loss_nan_ranks": 0, "loss_rank_avg": 0.1369718611240387, "step": 4870, "valid_targets_mean": 10340.9, "valid_targets_min": 1125 }, { "epoch": 2.8761061946902657, "grad_norm": 0.18700065727926024, "learning_rate": 1.8251642014409543e-05, "loss": 0.3634, "loss_nan_ranks": 0, "loss_rank_avg": 0.12782393395900726, "step": 4875, "valid_targets_mean": 9584.5, "valid_targets_min": 2028 }, { "epoch": 2.87905604719764, "grad_norm": 0.18553220648070542, "learning_rate": 1.821061302838198e-05, "loss": 0.371, "loss_nan_ranks": 0, "loss_rank_avg": 0.13950929045677185, "step": 4880, "valid_targets_mean": 11590.9, "valid_targets_min": 2261 }, { "epoch": 2.882005899705015, "grad_norm": 0.17299523715979212, "learning_rate": 1.8169591632260085e-05, "loss": 0.3667, "loss_nan_ranks": 0, "loss_rank_avg": 0.13274073600769043, "step": 4885, "valid_targets_mean": 11354.4, "valid_targets_min": 1773 }, { "epoch": 2.8849557522123894, "grad_norm": 0.17027993458233717, "learning_rate": 1.8128578000041187e-05, "loss": 0.3674, "loss_nan_ranks": 0, "loss_rank_avg": 0.11688661575317383, "step": 4890, "valid_targets_mean": 9635.8, "valid_targets_min": 2187 }, { "epoch": 2.887905604719764, "grad_norm": 0.3110297576805822, "learning_rate": 1.8087572305689657e-05, "loss": 0.3608, "loss_nan_ranks": 0, "loss_rank_avg": 0.12430237233638763, "step": 4895, "valid_targets_mean": 10532.5, "valid_targets_min": 1940 }, { "epoch": 2.8908554572271385, "grad_norm": 0.17883439437077342, "learning_rate": 1.8046574723136218e-05, "loss": 0.3655, "loss_nan_ranks": 0, "loss_rank_avg": 0.13129037618637085, "step": 4900, "valid_targets_mean": 11384.6, "valid_targets_min": 2096 }, { "epoch": 2.893805309734513, "grad_norm": 0.18072943139923472, "learning_rate": 1.800558542627717e-05, "loss": 0.3623, "loss_nan_ranks": 0, "loss_rank_avg": 0.12233418971300125, "step": 4905, "valid_targets_mean": 10272.5, "valid_targets_min": 2815 }, { "epoch": 2.896755162241888, "grad_norm": 0.17850264298888707, "learning_rate": 1.7964604588973672e-05, "loss": 0.369, "loss_nan_ranks": 0, "loss_rank_avg": 0.13789036870002747, "step": 4910, "valid_targets_mean": 11145.4, "valid_targets_min": 818 }, { "epoch": 2.8997050147492627, "grad_norm": 0.17401095636087435, "learning_rate": 1.792363238505101e-05, "loss": 0.3614, "loss_nan_ranks": 0, "loss_rank_avg": 0.10849230736494064, "step": 4915, "valid_targets_mean": 9275.6, "valid_targets_min": 1757 }, { "epoch": 2.9026548672566372, "grad_norm": 0.16868747509879806, "learning_rate": 1.788266898829784e-05, "loss": 0.3658, "loss_nan_ranks": 0, "loss_rank_avg": 0.12984463572502136, "step": 4920, "valid_targets_mean": 10562.0, "valid_targets_min": 1778 }, { "epoch": 2.905604719764012, "grad_norm": 0.1713118209228475, "learning_rate": 1.784171457246547e-05, "loss": 0.364, "loss_nan_ranks": 0, "loss_rank_avg": 0.11977224051952362, "step": 4925, "valid_targets_mean": 9969.5, "valid_targets_min": 1957 }, { "epoch": 2.9085545722713864, "grad_norm": 0.2051711163286173, "learning_rate": 1.7800769311267097e-05, "loss": 0.3661, "loss_nan_ranks": 0, "loss_rank_avg": 0.13498347997665405, "step": 4930, "valid_targets_mean": 10153.2, "valid_targets_min": 2191 }, { "epoch": 2.911504424778761, "grad_norm": 0.182851398303451, "learning_rate": 1.7759833378377115e-05, "loss": 0.3723, "loss_nan_ranks": 0, "loss_rank_avg": 0.0971779078245163, "step": 4935, "valid_targets_mean": 8849.2, "valid_targets_min": 324 }, { "epoch": 2.9144542772861355, "grad_norm": 0.16859808466952741, "learning_rate": 1.771890694743032e-05, "loss": 0.3673, "loss_nan_ranks": 0, "loss_rank_avg": 0.13063043355941772, "step": 4940, "valid_targets_mean": 10924.6, "valid_targets_min": 2710 }, { "epoch": 2.9174041297935105, "grad_norm": 0.17589862305516682, "learning_rate": 1.7677990192021233e-05, "loss": 0.3691, "loss_nan_ranks": 0, "loss_rank_avg": 0.13488222658634186, "step": 4945, "valid_targets_mean": 11752.3, "valid_targets_min": 1969 }, { "epoch": 2.920353982300885, "grad_norm": 0.19190635425255817, "learning_rate": 1.7637083285703316e-05, "loss": 0.3684, "loss_nan_ranks": 0, "loss_rank_avg": 0.14491617679595947, "step": 4950, "valid_targets_mean": 12698.6, "valid_targets_min": 2768 }, { "epoch": 2.9233038348082596, "grad_norm": 0.17127630744296202, "learning_rate": 1.759618640198826e-05, "loss": 0.3706, "loss_nan_ranks": 0, "loss_rank_avg": 0.1178339272737503, "step": 4955, "valid_targets_mean": 10104.6, "valid_targets_min": 1652 }, { "epoch": 2.926253687315634, "grad_norm": 0.17277595293584214, "learning_rate": 1.755529971434524e-05, "loss": 0.3713, "loss_nan_ranks": 0, "loss_rank_avg": 0.12804704904556274, "step": 4960, "valid_targets_mean": 11014.7, "valid_targets_min": 1872 }, { "epoch": 2.9292035398230087, "grad_norm": 0.186889514672382, "learning_rate": 1.7514423396200206e-05, "loss": 0.3642, "loss_nan_ranks": 0, "loss_rank_avg": 0.12300354987382889, "step": 4965, "valid_targets_mean": 10039.7, "valid_targets_min": 2777 }, { "epoch": 2.9321533923303837, "grad_norm": 0.1736172015814307, "learning_rate": 1.7473557620935077e-05, "loss": 0.3705, "loss_nan_ranks": 0, "loss_rank_avg": 0.13639748096466064, "step": 4970, "valid_targets_mean": 11453.5, "valid_targets_min": 1275 }, { "epoch": 2.935103244837758, "grad_norm": 0.1787502910261031, "learning_rate": 1.7432702561887114e-05, "loss": 0.3719, "loss_nan_ranks": 0, "loss_rank_avg": 0.11030873656272888, "step": 4975, "valid_targets_mean": 8932.7, "valid_targets_min": 1791 }, { "epoch": 2.938053097345133, "grad_norm": 0.18325247424037175, "learning_rate": 1.7391858392348064e-05, "loss": 0.3582, "loss_nan_ranks": 0, "loss_rank_avg": 0.12594400346279144, "step": 4980, "valid_targets_mean": 11101.6, "valid_targets_min": 2707 }, { "epoch": 2.9410029498525074, "grad_norm": 0.1737878744545687, "learning_rate": 1.7351025285563526e-05, "loss": 0.3653, "loss_nan_ranks": 0, "loss_rank_avg": 0.1459430754184723, "step": 4985, "valid_targets_mean": 10862.0, "valid_targets_min": 1591 }, { "epoch": 2.943952802359882, "grad_norm": 0.17763844955193459, "learning_rate": 1.7310203414732167e-05, "loss": 0.3653, "loss_nan_ranks": 0, "loss_rank_avg": 0.1361452341079712, "step": 4990, "valid_targets_mean": 10801.4, "valid_targets_min": 1421 }, { "epoch": 2.9469026548672566, "grad_norm": 0.19567527222659836, "learning_rate": 1.726939295300498e-05, "loss": 0.3661, "loss_nan_ranks": 0, "loss_rank_avg": 0.11888530105352402, "step": 4995, "valid_targets_mean": 8929.9, "valid_targets_min": 1203 }, { "epoch": 2.949852507374631, "grad_norm": 0.1729651318808521, "learning_rate": 1.7228594073484584e-05, "loss": 0.3722, "loss_nan_ranks": 0, "loss_rank_avg": 0.12663039565086365, "step": 5000, "valid_targets_mean": 10474.6, "valid_targets_min": 1041 }, { "epoch": 2.952802359882006, "grad_norm": 0.177560869754914, "learning_rate": 1.718780694922445e-05, "loss": 0.3678, "loss_nan_ranks": 0, "loss_rank_avg": 0.10894748568534851, "step": 5005, "valid_targets_mean": 8967.3, "valid_targets_min": 2401 }, { "epoch": 2.9557522123893807, "grad_norm": 0.1874803467578325, "learning_rate": 1.7147031753228218e-05, "loss": 0.3637, "loss_nan_ranks": 0, "loss_rank_avg": 0.1277991235256195, "step": 5010, "valid_targets_mean": 10507.0, "valid_targets_min": 1811 }, { "epoch": 2.9587020648967552, "grad_norm": 0.2360296953225136, "learning_rate": 1.7106268658448886e-05, "loss": 0.3695, "loss_nan_ranks": 0, "loss_rank_avg": 0.10516766458749771, "step": 5015, "valid_targets_mean": 9101.4, "valid_targets_min": 1896 }, { "epoch": 2.96165191740413, "grad_norm": 0.1951433840169243, "learning_rate": 1.7065517837788183e-05, "loss": 0.3655, "loss_nan_ranks": 0, "loss_rank_avg": 0.13209852576255798, "step": 5020, "valid_targets_mean": 11740.2, "valid_targets_min": 1329 }, { "epoch": 2.9646017699115044, "grad_norm": 0.17905616793607196, "learning_rate": 1.7024779464095717e-05, "loss": 0.3664, "loss_nan_ranks": 0, "loss_rank_avg": 0.11057194322347641, "step": 5025, "valid_targets_mean": 8273.8, "valid_targets_min": 1581 }, { "epoch": 2.967551622418879, "grad_norm": 0.18826370887418117, "learning_rate": 1.6984053710168348e-05, "loss": 0.368, "loss_nan_ranks": 0, "loss_rank_avg": 0.13581299781799316, "step": 5030, "valid_targets_mean": 10531.7, "valid_targets_min": 2030 }, { "epoch": 2.9705014749262535, "grad_norm": 0.20867348643719316, "learning_rate": 1.6943340748749367e-05, "loss": 0.3617, "loss_nan_ranks": 0, "loss_rank_avg": 0.11186973750591278, "step": 5035, "valid_targets_mean": 8572.2, "valid_targets_min": 1302 }, { "epoch": 2.9734513274336285, "grad_norm": 0.17361471549307683, "learning_rate": 1.690264075252785e-05, "loss": 0.3712, "loss_nan_ranks": 0, "loss_rank_avg": 0.12840047478675842, "step": 5040, "valid_targets_mean": 10365.0, "valid_targets_min": 1880 }, { "epoch": 2.976401179941003, "grad_norm": 0.1737568252146911, "learning_rate": 1.6861953894137832e-05, "loss": 0.3733, "loss_nan_ranks": 0, "loss_rank_avg": 0.14282283186912537, "step": 5045, "valid_targets_mean": 11930.6, "valid_targets_min": 1431 }, { "epoch": 2.9793510324483776, "grad_norm": 0.1905453510522682, "learning_rate": 1.682128034615765e-05, "loss": 0.3659, "loss_nan_ranks": 0, "loss_rank_avg": 0.12144088000059128, "step": 5050, "valid_targets_mean": 10015.8, "valid_targets_min": 1439 }, { "epoch": 2.982300884955752, "grad_norm": 0.18806211439617518, "learning_rate": 1.678062028110919e-05, "loss": 0.3661, "loss_nan_ranks": 0, "loss_rank_avg": 0.13041338324546814, "step": 5055, "valid_targets_mean": 10110.8, "valid_targets_min": 2130 }, { "epoch": 2.9852507374631267, "grad_norm": 0.17057233696793214, "learning_rate": 1.6739973871457117e-05, "loss": 0.3694, "loss_nan_ranks": 0, "loss_rank_avg": 0.11651427298784256, "step": 5060, "valid_targets_mean": 9938.6, "valid_targets_min": 1395 }, { "epoch": 2.9882005899705013, "grad_norm": 0.19975824600519373, "learning_rate": 1.6699341289608208e-05, "loss": 0.3757, "loss_nan_ranks": 0, "loss_rank_avg": 0.15038277208805084, "step": 5065, "valid_targets_mean": 11508.6, "valid_targets_min": 1832 }, { "epoch": 2.991150442477876, "grad_norm": 0.197023590973958, "learning_rate": 1.665872270791056e-05, "loss": 0.3635, "loss_nan_ranks": 0, "loss_rank_avg": 0.11097166687250137, "step": 5070, "valid_targets_mean": 9993.5, "valid_targets_min": 2294 }, { "epoch": 2.994100294985251, "grad_norm": 0.18671541620967982, "learning_rate": 1.6618118298652916e-05, "loss": 0.3687, "loss_nan_ranks": 0, "loss_rank_avg": 0.14129869639873505, "step": 5075, "valid_targets_mean": 11300.2, "valid_targets_min": 1578 }, { "epoch": 2.9970501474926254, "grad_norm": 0.18303216917284046, "learning_rate": 1.6577528234063875e-05, "loss": 0.3605, "loss_nan_ranks": 0, "loss_rank_avg": 0.12070619314908981, "step": 5080, "valid_targets_mean": 10239.3, "valid_targets_min": 1636 }, { "epoch": 3.0, "grad_norm": 0.16870803400701356, "learning_rate": 1.6536952686311224e-05, "loss": 0.3644, "loss_nan_ranks": 0, "loss_rank_avg": 0.1085338443517685, "step": 5085, "valid_targets_mean": 9906.2, "valid_targets_min": 1715 }, { "epoch": 3.0029498525073746, "grad_norm": 0.18072419280153204, "learning_rate": 1.649639182750113e-05, "loss": 0.3615, "loss_nan_ranks": 0, "loss_rank_avg": 0.1007838100194931, "step": 5090, "valid_targets_mean": 8127.4, "valid_targets_min": 1551 }, { "epoch": 3.005899705014749, "grad_norm": 0.15411803854002304, "learning_rate": 1.6455845829677505e-05, "loss": 0.3554, "loss_nan_ranks": 0, "loss_rank_avg": 0.10417066514492035, "step": 5095, "valid_targets_mean": 11154.4, "valid_targets_min": 1853 }, { "epoch": 3.0088495575221237, "grad_norm": 0.16448402874286094, "learning_rate": 1.6415314864821188e-05, "loss": 0.3669, "loss_nan_ranks": 0, "loss_rank_avg": 0.11009702831506729, "step": 5100, "valid_targets_mean": 10077.0, "valid_targets_min": 2839 }, { "epoch": 3.0117994100294987, "grad_norm": 0.1629342663277792, "learning_rate": 1.6374799104849277e-05, "loss": 0.3632, "loss_nan_ranks": 0, "loss_rank_avg": 0.1320076584815979, "step": 5105, "valid_targets_mean": 11536.6, "valid_targets_min": 1416 }, { "epoch": 3.0147492625368733, "grad_norm": 0.17706779013507282, "learning_rate": 1.6334298721614366e-05, "loss": 0.3679, "loss_nan_ranks": 0, "loss_rank_avg": 0.11719324439764023, "step": 5110, "valid_targets_mean": 9054.6, "valid_targets_min": 2757 }, { "epoch": 3.017699115044248, "grad_norm": 0.16250629050829413, "learning_rate": 1.6293813886903823e-05, "loss": 0.3653, "loss_nan_ranks": 0, "loss_rank_avg": 0.08248552680015564, "step": 5115, "valid_targets_mean": 7162.3, "valid_targets_min": 1845 }, { "epoch": 3.0206489675516224, "grad_norm": 0.1673905828249734, "learning_rate": 1.6253344772439078e-05, "loss": 0.3559, "loss_nan_ranks": 0, "loss_rank_avg": 0.12373922765254974, "step": 5120, "valid_targets_mean": 9473.3, "valid_targets_min": 1920 }, { "epoch": 3.023598820058997, "grad_norm": 0.17125857977161707, "learning_rate": 1.6212891549874867e-05, "loss": 0.3592, "loss_nan_ranks": 0, "loss_rank_avg": 0.12039509415626526, "step": 5125, "valid_targets_mean": 9270.4, "valid_targets_min": 1592 }, { "epoch": 3.0265486725663715, "grad_norm": 0.172291439074316, "learning_rate": 1.617245439079854e-05, "loss": 0.3698, "loss_nan_ranks": 0, "loss_rank_avg": 0.13650575280189514, "step": 5130, "valid_targets_mean": 11259.1, "valid_targets_min": 1297 }, { "epoch": 3.0294985250737465, "grad_norm": 0.16609076305046538, "learning_rate": 1.6132033466729283e-05, "loss": 0.3598, "loss_nan_ranks": 0, "loss_rank_avg": 0.13094520568847656, "step": 5135, "valid_targets_mean": 10381.7, "valid_targets_min": 2567 }, { "epoch": 3.032448377581121, "grad_norm": 0.18662285949967705, "learning_rate": 1.609162894911745e-05, "loss": 0.3679, "loss_nan_ranks": 0, "loss_rank_avg": 0.11098338663578033, "step": 5140, "valid_targets_mean": 8885.5, "valid_targets_min": 2312 }, { "epoch": 3.0353982300884956, "grad_norm": 0.1648803495007328, "learning_rate": 1.6051241009343765e-05, "loss": 0.3706, "loss_nan_ranks": 0, "loss_rank_avg": 0.13519926369190216, "step": 5145, "valid_targets_mean": 11761.5, "valid_targets_min": 2617 }, { "epoch": 3.03834808259587, "grad_norm": 0.1687028365758394, "learning_rate": 1.601086981871868e-05, "loss": 0.3624, "loss_nan_ranks": 0, "loss_rank_avg": 0.12321673333644867, "step": 5150, "valid_targets_mean": 10408.8, "valid_targets_min": 1710 }, { "epoch": 3.0412979351032448, "grad_norm": 0.17926476212590314, "learning_rate": 1.597051554848158e-05, "loss": 0.3652, "loss_nan_ranks": 0, "loss_rank_avg": 0.12310653924942017, "step": 5155, "valid_targets_mean": 9813.8, "valid_targets_min": 2186 }, { "epoch": 3.0442477876106193, "grad_norm": 0.16155502872177424, "learning_rate": 1.593017836980007e-05, "loss": 0.3637, "loss_nan_ranks": 0, "loss_rank_avg": 0.10764841735363007, "step": 5160, "valid_targets_mean": 9058.5, "valid_targets_min": 2561 }, { "epoch": 3.047197640117994, "grad_norm": 0.16579859522052634, "learning_rate": 1.588985845376928e-05, "loss": 0.3695, "loss_nan_ranks": 0, "loss_rank_avg": 0.14767128229141235, "step": 5165, "valid_targets_mean": 12223.3, "valid_targets_min": 2051 }, { "epoch": 3.050147492625369, "grad_norm": 0.1855108695222736, "learning_rate": 1.584955597141111e-05, "loss": 0.3609, "loss_nan_ranks": 0, "loss_rank_avg": 0.13401386141777039, "step": 5170, "valid_targets_mean": 11200.6, "valid_targets_min": 1879 }, { "epoch": 3.0530973451327434, "grad_norm": 0.17007622797255426, "learning_rate": 1.580927109367351e-05, "loss": 0.3683, "loss_nan_ranks": 0, "loss_rank_avg": 0.11102022230625153, "step": 5175, "valid_targets_mean": 10038.4, "valid_targets_min": 2566 }, { "epoch": 3.056047197640118, "grad_norm": 0.19256034755210089, "learning_rate": 1.5769003991429773e-05, "loss": 0.3672, "loss_nan_ranks": 0, "loss_rank_avg": 0.1243845671415329, "step": 5180, "valid_targets_mean": 9665.2, "valid_targets_min": 1763 }, { "epoch": 3.0589970501474926, "grad_norm": 0.18192539127795151, "learning_rate": 1.5728754835477763e-05, "loss": 0.3602, "loss_nan_ranks": 0, "loss_rank_avg": 0.12346881628036499, "step": 5185, "valid_targets_mean": 9427.3, "valid_targets_min": 1939 }, { "epoch": 3.061946902654867, "grad_norm": 0.18276321434981857, "learning_rate": 1.568852379653925e-05, "loss": 0.3655, "loss_nan_ranks": 0, "loss_rank_avg": 0.13931599259376526, "step": 5190, "valid_targets_mean": 10823.2, "valid_targets_min": 1001 }, { "epoch": 3.0648967551622417, "grad_norm": 0.18096595886413822, "learning_rate": 1.5648311045259156e-05, "loss": 0.3661, "loss_nan_ranks": 0, "loss_rank_avg": 0.11066380143165588, "step": 5195, "valid_targets_mean": 8042.4, "valid_targets_min": 1638 }, { "epoch": 3.0678466076696167, "grad_norm": 0.18094107164281462, "learning_rate": 1.5608116752204828e-05, "loss": 0.3594, "loss_nan_ranks": 0, "loss_rank_avg": 0.11712948232889175, "step": 5200, "valid_targets_mean": 9074.4, "valid_targets_min": 1475 }, { "epoch": 3.0707964601769913, "grad_norm": 0.17043468207653303, "learning_rate": 1.5567941087865315e-05, "loss": 0.3698, "loss_nan_ranks": 0, "loss_rank_avg": 0.14815612137317657, "step": 5205, "valid_targets_mean": 11863.6, "valid_targets_min": 2660 }, { "epoch": 3.073746312684366, "grad_norm": 0.16707843868690472, "learning_rate": 1.5527784222650654e-05, "loss": 0.3714, "loss_nan_ranks": 0, "loss_rank_avg": 0.10225613415241241, "step": 5210, "valid_targets_mean": 8764.0, "valid_targets_min": 1401 }, { "epoch": 3.0766961651917404, "grad_norm": 0.17086362845957914, "learning_rate": 1.5487646326891156e-05, "loss": 0.3603, "loss_nan_ranks": 0, "loss_rank_avg": 0.11746655404567719, "step": 5215, "valid_targets_mean": 8993.1, "valid_targets_min": 1661 }, { "epoch": 3.079646017699115, "grad_norm": 0.17306648583138773, "learning_rate": 1.5447527570836646e-05, "loss": 0.3699, "loss_nan_ranks": 0, "loss_rank_avg": 0.16646556556224823, "step": 5220, "valid_targets_mean": 12450.0, "valid_targets_min": 2341 }, { "epoch": 3.0825958702064895, "grad_norm": 0.2517036739097649, "learning_rate": 1.5407428124655793e-05, "loss": 0.3662, "loss_nan_ranks": 0, "loss_rank_avg": 0.11005858331918716, "step": 5225, "valid_targets_mean": 9356.4, "valid_targets_min": 2251 }, { "epoch": 3.0855457227138645, "grad_norm": 0.17036008905978894, "learning_rate": 1.536734815843533e-05, "loss": 0.3562, "loss_nan_ranks": 0, "loss_rank_avg": 0.13720500469207764, "step": 5230, "valid_targets_mean": 10593.5, "valid_targets_min": 2311 }, { "epoch": 3.088495575221239, "grad_norm": 0.1741623626944122, "learning_rate": 1.5327287842179393e-05, "loss": 0.3631, "loss_nan_ranks": 0, "loss_rank_avg": 0.12113802134990692, "step": 5235, "valid_targets_mean": 11272.2, "valid_targets_min": 2072 }, { "epoch": 3.0914454277286136, "grad_norm": 0.16679691239324818, "learning_rate": 1.5287247345808753e-05, "loss": 0.3684, "loss_nan_ranks": 0, "loss_rank_avg": 0.11631931364536285, "step": 5240, "valid_targets_mean": 10755.2, "valid_targets_min": 2573 }, { "epoch": 3.094395280235988, "grad_norm": 0.17445815348061394, "learning_rate": 1.5247226839160123e-05, "loss": 0.3662, "loss_nan_ranks": 0, "loss_rank_avg": 0.13419607281684875, "step": 5245, "valid_targets_mean": 11588.6, "valid_targets_min": 1224 }, { "epoch": 3.0973451327433628, "grad_norm": 0.19235039716576158, "learning_rate": 1.5207226491985408e-05, "loss": 0.3673, "loss_nan_ranks": 0, "loss_rank_avg": 0.12204791605472565, "step": 5250, "valid_targets_mean": 10232.4, "valid_targets_min": 1085 }, { "epoch": 3.1002949852507373, "grad_norm": 0.16580047720364316, "learning_rate": 1.5167246473951033e-05, "loss": 0.3685, "loss_nan_ranks": 0, "loss_rank_avg": 0.12935838103294373, "step": 5255, "valid_targets_mean": 11208.1, "valid_targets_min": 1385 }, { "epoch": 3.103244837758112, "grad_norm": 0.16982903541829203, "learning_rate": 1.5127286954637162e-05, "loss": 0.369, "loss_nan_ranks": 0, "loss_rank_avg": 0.1330590546131134, "step": 5260, "valid_targets_mean": 11080.8, "valid_targets_min": 1637 }, { "epoch": 3.106194690265487, "grad_norm": 0.17281557035552203, "learning_rate": 1.5087348103537037e-05, "loss": 0.3564, "loss_nan_ranks": 0, "loss_rank_avg": 0.10759001970291138, "step": 5265, "valid_targets_mean": 9888.8, "valid_targets_min": 2043 }, { "epoch": 3.1091445427728615, "grad_norm": 0.1761369685053977, "learning_rate": 1.504743009005623e-05, "loss": 0.3682, "loss_nan_ranks": 0, "loss_rank_avg": 0.14634013175964355, "step": 5270, "valid_targets_mean": 11535.3, "valid_targets_min": 2343 }, { "epoch": 3.112094395280236, "grad_norm": 0.16417048428949194, "learning_rate": 1.5007533083511907e-05, "loss": 0.3659, "loss_nan_ranks": 0, "loss_rank_avg": 0.1197446882724762, "step": 5275, "valid_targets_mean": 9942.7, "valid_targets_min": 1725 }, { "epoch": 3.1150442477876106, "grad_norm": 0.15378812401178915, "learning_rate": 1.4967657253132157e-05, "loss": 0.3585, "loss_nan_ranks": 0, "loss_rank_avg": 0.10902900993824005, "step": 5280, "valid_targets_mean": 9485.1, "valid_targets_min": 2381 }, { "epoch": 3.117994100294985, "grad_norm": 0.16069117781194026, "learning_rate": 1.4927802768055228e-05, "loss": 0.363, "loss_nan_ranks": 0, "loss_rank_avg": 0.13259164988994598, "step": 5285, "valid_targets_mean": 11853.2, "valid_targets_min": 2085 }, { "epoch": 3.1209439528023597, "grad_norm": 0.1694320573562657, "learning_rate": 1.488796979732885e-05, "loss": 0.3666, "loss_nan_ranks": 0, "loss_rank_avg": 0.12871789932250977, "step": 5290, "valid_targets_mean": 11962.8, "valid_targets_min": 2572 }, { "epoch": 3.1238938053097347, "grad_norm": 0.16505966881946538, "learning_rate": 1.4848158509909465e-05, "loss": 0.3687, "loss_nan_ranks": 0, "loss_rank_avg": 0.15198102593421936, "step": 5295, "valid_targets_mean": 13259.6, "valid_targets_min": 1574 }, { "epoch": 3.1268436578171093, "grad_norm": 0.17879388520449493, "learning_rate": 1.480836907466158e-05, "loss": 0.3652, "loss_nan_ranks": 0, "loss_rank_avg": 0.10954461991786957, "step": 5300, "valid_targets_mean": 8538.3, "valid_targets_min": 3063 }, { "epoch": 3.129793510324484, "grad_norm": 0.19905872823764165, "learning_rate": 1.4768601660356981e-05, "loss": 0.3666, "loss_nan_ranks": 0, "loss_rank_avg": 0.11861936748027802, "step": 5305, "valid_targets_mean": 9845.7, "valid_targets_min": 1576 }, { "epoch": 3.1327433628318584, "grad_norm": 0.17338452190584372, "learning_rate": 1.4728856435674073e-05, "loss": 0.3606, "loss_nan_ranks": 0, "loss_rank_avg": 0.1204066053032875, "step": 5310, "valid_targets_mean": 10769.1, "valid_targets_min": 1379 }, { "epoch": 3.135693215339233, "grad_norm": 0.1665094296724231, "learning_rate": 1.468913356919713e-05, "loss": 0.3681, "loss_nan_ranks": 0, "loss_rank_avg": 0.12827160954475403, "step": 5315, "valid_targets_mean": 11192.5, "valid_targets_min": 2772 }, { "epoch": 3.1386430678466075, "grad_norm": 0.17163264744974516, "learning_rate": 1.4649433229415588e-05, "loss": 0.365, "loss_nan_ranks": 0, "loss_rank_avg": 0.12414673715829849, "step": 5320, "valid_targets_mean": 10055.3, "valid_targets_min": 2891 }, { "epoch": 3.1415929203539825, "grad_norm": 0.16476755230856108, "learning_rate": 1.4609755584723337e-05, "loss": 0.3693, "loss_nan_ranks": 0, "loss_rank_avg": 0.12396431714296341, "step": 5325, "valid_targets_mean": 10126.3, "valid_targets_min": 2399 }, { "epoch": 3.144542772861357, "grad_norm": 0.16898117291359036, "learning_rate": 1.4570100803418007e-05, "loss": 0.3643, "loss_nan_ranks": 0, "loss_rank_avg": 0.11845681071281433, "step": 5330, "valid_targets_mean": 10440.6, "valid_targets_min": 2024 }, { "epoch": 3.1474926253687316, "grad_norm": 0.19387693997806396, "learning_rate": 1.453046905370026e-05, "loss": 0.3637, "loss_nan_ranks": 0, "loss_rank_avg": 0.125502347946167, "step": 5335, "valid_targets_mean": 9680.2, "valid_targets_min": 2135 }, { "epoch": 3.150442477876106, "grad_norm": 0.16587740191579503, "learning_rate": 1.449086050367303e-05, "loss": 0.3668, "loss_nan_ranks": 0, "loss_rank_avg": 0.11140230298042297, "step": 5340, "valid_targets_mean": 10028.0, "valid_targets_min": 2571 }, { "epoch": 3.1533923303834808, "grad_norm": 0.17288688854657777, "learning_rate": 1.445127532134089e-05, "loss": 0.3575, "loss_nan_ranks": 0, "loss_rank_avg": 0.12293601781129837, "step": 5345, "valid_targets_mean": 9146.0, "valid_targets_min": 1782 }, { "epoch": 3.1563421828908553, "grad_norm": 0.16196207264850515, "learning_rate": 1.4411713674609257e-05, "loss": 0.3626, "loss_nan_ranks": 0, "loss_rank_avg": 0.10983482003211975, "step": 5350, "valid_targets_mean": 10024.1, "valid_targets_min": 1820 }, { "epoch": 3.15929203539823, "grad_norm": 0.17745654941894476, "learning_rate": 1.4372175731283755e-05, "loss": 0.3706, "loss_nan_ranks": 0, "loss_rank_avg": 0.10657268762588501, "step": 5355, "valid_targets_mean": 9066.4, "valid_targets_min": 1758 }, { "epoch": 3.162241887905605, "grad_norm": 0.17093813404945338, "learning_rate": 1.4332661659069444e-05, "loss": 0.3617, "loss_nan_ranks": 0, "loss_rank_avg": 0.11457949876785278, "step": 5360, "valid_targets_mean": 11200.9, "valid_targets_min": 1825 }, { "epoch": 3.1651917404129795, "grad_norm": 0.16284984460105134, "learning_rate": 1.4293171625570135e-05, "loss": 0.3633, "loss_nan_ranks": 0, "loss_rank_avg": 0.10767051577568054, "step": 5365, "valid_targets_mean": 9578.0, "valid_targets_min": 969 }, { "epoch": 3.168141592920354, "grad_norm": 0.1672772887572211, "learning_rate": 1.4253705798287677e-05, "loss": 0.3673, "loss_nan_ranks": 0, "loss_rank_avg": 0.10364119708538055, "step": 5370, "valid_targets_mean": 8988.4, "valid_targets_min": 1622 }, { "epoch": 3.1710914454277286, "grad_norm": 0.1716741515555153, "learning_rate": 1.4214264344621262e-05, "loss": 0.3659, "loss_nan_ranks": 0, "loss_rank_avg": 0.11365842074155807, "step": 5375, "valid_targets_mean": 8939.7, "valid_targets_min": 2704 }, { "epoch": 3.174041297935103, "grad_norm": 0.1756823532541479, "learning_rate": 1.4174847431866665e-05, "loss": 0.3599, "loss_nan_ranks": 0, "loss_rank_avg": 0.11407135426998138, "step": 5380, "valid_targets_mean": 11132.0, "valid_targets_min": 1617 }, { "epoch": 3.1769911504424777, "grad_norm": 0.16762380566161988, "learning_rate": 1.4135455227215603e-05, "loss": 0.369, "loss_nan_ranks": 0, "loss_rank_avg": 0.11980577558279037, "step": 5385, "valid_targets_mean": 10267.6, "valid_targets_min": 2290 }, { "epoch": 3.1799410029498527, "grad_norm": 0.16270258722311065, "learning_rate": 1.4096087897754954e-05, "loss": 0.365, "loss_nan_ranks": 0, "loss_rank_avg": 0.10883092880249023, "step": 5390, "valid_targets_mean": 11235.0, "valid_targets_min": 1714 }, { "epoch": 3.1828908554572273, "grad_norm": 0.19664867619345416, "learning_rate": 1.4056745610466119e-05, "loss": 0.3709, "loss_nan_ranks": 0, "loss_rank_avg": 0.1180739551782608, "step": 5395, "valid_targets_mean": 9939.6, "valid_targets_min": 1119 }, { "epoch": 3.185840707964602, "grad_norm": 0.16986561951035176, "learning_rate": 1.4017428532224256e-05, "loss": 0.3702, "loss_nan_ranks": 0, "loss_rank_avg": 0.12023471295833588, "step": 5400, "valid_targets_mean": 9699.6, "valid_targets_min": 1382 }, { "epoch": 3.1887905604719764, "grad_norm": 0.16401247342669617, "learning_rate": 1.3978136829797615e-05, "loss": 0.3654, "loss_nan_ranks": 0, "loss_rank_avg": 0.11187541484832764, "step": 5405, "valid_targets_mean": 9500.3, "valid_targets_min": 2101 }, { "epoch": 3.191740412979351, "grad_norm": 0.17203129490880129, "learning_rate": 1.3938870669846793e-05, "loss": 0.3661, "loss_nan_ranks": 0, "loss_rank_avg": 0.11447340250015259, "step": 5410, "valid_targets_mean": 10089.6, "valid_targets_min": 2019 }, { "epoch": 3.1946902654867255, "grad_norm": 0.16112318127681288, "learning_rate": 1.3899630218924055e-05, "loss": 0.3652, "loss_nan_ranks": 0, "loss_rank_avg": 0.12341278791427612, "step": 5415, "valid_targets_mean": 11681.5, "valid_targets_min": 2765 }, { "epoch": 3.1976401179941005, "grad_norm": 0.1652986251915982, "learning_rate": 1.3860415643472625e-05, "loss": 0.3672, "loss_nan_ranks": 0, "loss_rank_avg": 0.09924346208572388, "step": 5420, "valid_targets_mean": 9450.3, "valid_targets_min": 1236 }, { "epoch": 3.200589970501475, "grad_norm": 0.17009722063486218, "learning_rate": 1.3821227109825946e-05, "loss": 0.3645, "loss_nan_ranks": 0, "loss_rank_avg": 0.12092237919569016, "step": 5425, "valid_targets_mean": 10375.5, "valid_targets_min": 1709 }, { "epoch": 3.2035398230088497, "grad_norm": 0.18484989650554937, "learning_rate": 1.3782064784207041e-05, "loss": 0.3638, "loss_nan_ranks": 0, "loss_rank_avg": 0.10624641180038452, "step": 5430, "valid_targets_mean": 7647.3, "valid_targets_min": 1474 }, { "epoch": 3.206489675516224, "grad_norm": 0.15974643344864622, "learning_rate": 1.3742928832727726e-05, "loss": 0.3648, "loss_nan_ranks": 0, "loss_rank_avg": 0.09058540314435959, "step": 5435, "valid_targets_mean": 7829.2, "valid_targets_min": 1407 }, { "epoch": 3.2094395280235988, "grad_norm": 0.18499061576038137, "learning_rate": 1.3703819421387988e-05, "loss": 0.3669, "loss_nan_ranks": 0, "loss_rank_avg": 0.10127178579568863, "step": 5440, "valid_targets_mean": 8146.3, "valid_targets_min": 2212 }, { "epoch": 3.2123893805309733, "grad_norm": 0.17670280789378795, "learning_rate": 1.366473671607521e-05, "loss": 0.3657, "loss_nan_ranks": 0, "loss_rank_avg": 0.14998787641525269, "step": 5445, "valid_targets_mean": 12941.1, "valid_targets_min": 1757 }, { "epoch": 3.215339233038348, "grad_norm": 0.17641480449937122, "learning_rate": 1.3625680882563517e-05, "loss": 0.3726, "loss_nan_ranks": 0, "loss_rank_avg": 0.11825121939182281, "step": 5450, "valid_targets_mean": 10206.6, "valid_targets_min": 2056 }, { "epoch": 3.218289085545723, "grad_norm": 0.17433353100016663, "learning_rate": 1.3586652086513038e-05, "loss": 0.359, "loss_nan_ranks": 0, "loss_rank_avg": 0.12670403718948364, "step": 5455, "valid_targets_mean": 9321.0, "valid_targets_min": 2443 }, { "epoch": 3.2212389380530975, "grad_norm": 0.17405182564049818, "learning_rate": 1.3547650493469244e-05, "loss": 0.3658, "loss_nan_ranks": 0, "loss_rank_avg": 0.14105822145938873, "step": 5460, "valid_targets_mean": 11845.5, "valid_targets_min": 1503 }, { "epoch": 3.224188790560472, "grad_norm": 0.17630323471438666, "learning_rate": 1.3508676268862187e-05, "loss": 0.3679, "loss_nan_ranks": 0, "loss_rank_avg": 0.12641315162181854, "step": 5465, "valid_targets_mean": 10094.4, "valid_targets_min": 1091 }, { "epoch": 3.2271386430678466, "grad_norm": 0.17724466941372247, "learning_rate": 1.3469729578005858e-05, "loss": 0.3672, "loss_nan_ranks": 0, "loss_rank_avg": 0.12962406873703003, "step": 5470, "valid_targets_mean": 9290.2, "valid_targets_min": 2482 }, { "epoch": 3.230088495575221, "grad_norm": 0.17295330887453264, "learning_rate": 1.3430810586097462e-05, "loss": 0.368, "loss_nan_ranks": 0, "loss_rank_avg": 0.12997081875801086, "step": 5475, "valid_targets_mean": 10670.7, "valid_targets_min": 1532 }, { "epoch": 3.2330383480825957, "grad_norm": 0.1868078668062745, "learning_rate": 1.339191945821669e-05, "loss": 0.3635, "loss_nan_ranks": 0, "loss_rank_avg": 0.13852176070213318, "step": 5480, "valid_targets_mean": 11688.2, "valid_targets_min": 1261 }, { "epoch": 3.2359882005899703, "grad_norm": 0.15959566606879444, "learning_rate": 1.3353056359325072e-05, "loss": 0.3648, "loss_nan_ranks": 0, "loss_rank_avg": 0.12794829905033112, "step": 5485, "valid_targets_mean": 10035.3, "valid_targets_min": 1364 }, { "epoch": 3.2389380530973453, "grad_norm": 0.1671205820811924, "learning_rate": 1.3314221454265233e-05, "loss": 0.3675, "loss_nan_ranks": 0, "loss_rank_avg": 0.10383822023868561, "step": 5490, "valid_targets_mean": 8238.5, "valid_targets_min": 1363 }, { "epoch": 3.24188790560472, "grad_norm": 0.1768265159476027, "learning_rate": 1.3275414907760222e-05, "loss": 0.3706, "loss_nan_ranks": 0, "loss_rank_avg": 0.13004903495311737, "step": 5495, "valid_targets_mean": 10542.8, "valid_targets_min": 1877 }, { "epoch": 3.2448377581120944, "grad_norm": 0.1695460964551601, "learning_rate": 1.3236636884412785e-05, "loss": 0.3613, "loss_nan_ranks": 0, "loss_rank_avg": 0.10654259473085403, "step": 5500, "valid_targets_mean": 10243.8, "valid_targets_min": 2529 }, { "epoch": 3.247787610619469, "grad_norm": 0.15806011542943854, "learning_rate": 1.3197887548704706e-05, "loss": 0.3662, "loss_nan_ranks": 0, "loss_rank_avg": 0.10573803633451462, "step": 5505, "valid_targets_mean": 9045.6, "valid_targets_min": 2196 }, { "epoch": 3.2507374631268435, "grad_norm": 0.16394676727838023, "learning_rate": 1.3159167064996064e-05, "loss": 0.3623, "loss_nan_ranks": 0, "loss_rank_avg": 0.14225220680236816, "step": 5510, "valid_targets_mean": 10520.3, "valid_targets_min": 2974 }, { "epoch": 3.2536873156342185, "grad_norm": 0.17557994335059957, "learning_rate": 1.3120475597524575e-05, "loss": 0.3615, "loss_nan_ranks": 0, "loss_rank_avg": 0.1023373156785965, "step": 5515, "valid_targets_mean": 8490.1, "valid_targets_min": 1698 }, { "epoch": 3.256637168141593, "grad_norm": 0.1772121802620938, "learning_rate": 1.3081813310404872e-05, "loss": 0.3621, "loss_nan_ranks": 0, "loss_rank_avg": 0.12516672909259796, "step": 5520, "valid_targets_mean": 10266.6, "valid_targets_min": 2086 }, { "epoch": 3.2595870206489677, "grad_norm": 0.16860638201476127, "learning_rate": 1.3043180367627816e-05, "loss": 0.3628, "loss_nan_ranks": 0, "loss_rank_avg": 0.10529131442308426, "step": 5525, "valid_targets_mean": 8899.9, "valid_targets_min": 1091 }, { "epoch": 3.262536873156342, "grad_norm": 0.16809946742678483, "learning_rate": 1.30045769330598e-05, "loss": 0.3631, "loss_nan_ranks": 0, "loss_rank_avg": 0.13498874008655548, "step": 5530, "valid_targets_mean": 12777.8, "valid_targets_min": 2085 }, { "epoch": 3.265486725663717, "grad_norm": 0.1664783405579296, "learning_rate": 1.2966003170442068e-05, "loss": 0.368, "loss_nan_ranks": 0, "loss_rank_avg": 0.10611608624458313, "step": 5535, "valid_targets_mean": 8542.1, "valid_targets_min": 1275 }, { "epoch": 3.2684365781710913, "grad_norm": 0.17522851488020888, "learning_rate": 1.2927459243389976e-05, "loss": 0.3725, "loss_nan_ranks": 0, "loss_rank_avg": 0.11877696961164474, "step": 5540, "valid_targets_mean": 9471.2, "valid_targets_min": 1875 }, { "epoch": 3.271386430678466, "grad_norm": 0.1740811217541218, "learning_rate": 1.2888945315392358e-05, "loss": 0.3589, "loss_nan_ranks": 0, "loss_rank_avg": 0.12354566901922226, "step": 5545, "valid_targets_mean": 9979.3, "valid_targets_min": 2317 }, { "epoch": 3.274336283185841, "grad_norm": 0.1855988907885218, "learning_rate": 1.28504615498108e-05, "loss": 0.3668, "loss_nan_ranks": 0, "loss_rank_avg": 0.10054697096347809, "step": 5550, "valid_targets_mean": 7764.0, "valid_targets_min": 1398 }, { "epoch": 3.2772861356932155, "grad_norm": 0.17877226686806805, "learning_rate": 1.2812008109878925e-05, "loss": 0.3634, "loss_nan_ranks": 0, "loss_rank_avg": 0.11428143084049225, "step": 5555, "valid_targets_mean": 8935.4, "valid_targets_min": 1626 }, { "epoch": 3.28023598820059, "grad_norm": 0.16683919827362095, "learning_rate": 1.277358515870176e-05, "loss": 0.3571, "loss_nan_ranks": 0, "loss_rank_avg": 0.1391943246126175, "step": 5560, "valid_targets_mean": 11983.7, "valid_targets_min": 2161 }, { "epoch": 3.2831858407079646, "grad_norm": 0.18749132103457708, "learning_rate": 1.2735192859254988e-05, "loss": 0.3655, "loss_nan_ranks": 0, "loss_rank_avg": 0.12208181619644165, "step": 5565, "valid_targets_mean": 9960.0, "valid_targets_min": 1896 }, { "epoch": 3.286135693215339, "grad_norm": 0.17707993776381883, "learning_rate": 1.2696831374384287e-05, "loss": 0.3644, "loss_nan_ranks": 0, "loss_rank_avg": 0.11540719121694565, "step": 5570, "valid_targets_mean": 9256.6, "valid_targets_min": 1791 }, { "epoch": 3.2890855457227137, "grad_norm": 0.16692477088106328, "learning_rate": 1.2658500866804622e-05, "loss": 0.3675, "loss_nan_ranks": 0, "loss_rank_avg": 0.12894247472286224, "step": 5575, "valid_targets_mean": 10841.3, "valid_targets_min": 1796 }, { "epoch": 3.2920353982300883, "grad_norm": 0.15885310521115004, "learning_rate": 1.2620201499099588e-05, "loss": 0.3636, "loss_nan_ranks": 0, "loss_rank_avg": 0.1357426792383194, "step": 5580, "valid_targets_mean": 11841.5, "valid_targets_min": 2575 }, { "epoch": 3.2949852507374633, "grad_norm": 0.18151023028453872, "learning_rate": 1.2581933433720658e-05, "loss": 0.3636, "loss_nan_ranks": 0, "loss_rank_avg": 0.1206400990486145, "step": 5585, "valid_targets_mean": 9533.8, "valid_targets_min": 1760 }, { "epoch": 3.297935103244838, "grad_norm": 0.1576662184734288, "learning_rate": 1.2543696832986577e-05, "loss": 0.3555, "loss_nan_ranks": 0, "loss_rank_avg": 0.12325617671012878, "step": 5590, "valid_targets_mean": 11093.8, "valid_targets_min": 2478 }, { "epoch": 3.3008849557522124, "grad_norm": 0.16248650260323072, "learning_rate": 1.2505491859082585e-05, "loss": 0.364, "loss_nan_ranks": 0, "loss_rank_avg": 0.14523741602897644, "step": 5595, "valid_targets_mean": 12308.4, "valid_targets_min": 2441 }, { "epoch": 3.303834808259587, "grad_norm": 0.1697568324931673, "learning_rate": 1.2467318674059808e-05, "loss": 0.3645, "loss_nan_ranks": 0, "loss_rank_avg": 0.13691668212413788, "step": 5600, "valid_targets_mean": 10976.5, "valid_targets_min": 2610 }, { "epoch": 3.3067846607669615, "grad_norm": 0.1561936447555479, "learning_rate": 1.2429177439834512e-05, "loss": 0.3678, "loss_nan_ranks": 0, "loss_rank_avg": 0.1259647160768509, "step": 5605, "valid_targets_mean": 10802.3, "valid_targets_min": 1914 }, { "epoch": 3.309734513274336, "grad_norm": 0.15423817220564448, "learning_rate": 1.2391068318187459e-05, "loss": 0.3627, "loss_nan_ranks": 0, "loss_rank_avg": 0.12037042528390884, "step": 5610, "valid_targets_mean": 11692.9, "valid_targets_min": 2256 }, { "epoch": 3.312684365781711, "grad_norm": 0.16888848959955774, "learning_rate": 1.2352991470763184e-05, "loss": 0.3637, "loss_nan_ranks": 0, "loss_rank_avg": 0.09414775669574738, "step": 5615, "valid_targets_mean": 7951.5, "valid_targets_min": 2257 }, { "epoch": 3.3156342182890857, "grad_norm": 0.16908333147958188, "learning_rate": 1.2314947059069335e-05, "loss": 0.3617, "loss_nan_ranks": 0, "loss_rank_avg": 0.11395449936389923, "step": 5620, "valid_targets_mean": 8913.4, "valid_targets_min": 2553 }, { "epoch": 3.3185840707964602, "grad_norm": 0.1651710524663912, "learning_rate": 1.227693524447599e-05, "loss": 0.3657, "loss_nan_ranks": 0, "loss_rank_avg": 0.11249791085720062, "step": 5625, "valid_targets_mean": 10005.8, "valid_targets_min": 1375 }, { "epoch": 3.321533923303835, "grad_norm": 0.17144720901775296, "learning_rate": 1.2238956188214936e-05, "loss": 0.3596, "loss_nan_ranks": 0, "loss_rank_avg": 0.14235293865203857, "step": 5630, "valid_targets_mean": 11095.1, "valid_targets_min": 3126 }, { "epoch": 3.3244837758112094, "grad_norm": 0.16362249587364253, "learning_rate": 1.2201010051379043e-05, "loss": 0.3694, "loss_nan_ranks": 0, "loss_rank_avg": 0.12004884332418442, "step": 5635, "valid_targets_mean": 9365.7, "valid_targets_min": 1396 }, { "epoch": 3.327433628318584, "grad_norm": 0.16857686837608443, "learning_rate": 1.2163096994921518e-05, "loss": 0.3696, "loss_nan_ranks": 0, "loss_rank_avg": 0.1059444323182106, "step": 5640, "valid_targets_mean": 9492.3, "valid_targets_min": 1480 }, { "epoch": 3.330383480825959, "grad_norm": 0.1597626038930533, "learning_rate": 1.2125217179655278e-05, "loss": 0.3644, "loss_nan_ranks": 0, "loss_rank_avg": 0.11164246499538422, "step": 5645, "valid_targets_mean": 9468.8, "valid_targets_min": 1678 }, { "epoch": 3.3333333333333335, "grad_norm": 0.1792298222255779, "learning_rate": 1.2087370766252228e-05, "loss": 0.3655, "loss_nan_ranks": 0, "loss_rank_avg": 0.13133028149604797, "step": 5650, "valid_targets_mean": 10842.1, "valid_targets_min": 1206 }, { "epoch": 3.336283185840708, "grad_norm": 0.18065578316617883, "learning_rate": 1.2049557915242616e-05, "loss": 0.3627, "loss_nan_ranks": 0, "loss_rank_avg": 0.13570484519004822, "step": 5655, "valid_targets_mean": 10905.9, "valid_targets_min": 1230 }, { "epoch": 3.3392330383480826, "grad_norm": 0.16218754902076543, "learning_rate": 1.2011778787014297e-05, "loss": 0.3666, "loss_nan_ranks": 0, "loss_rank_avg": 0.10976435244083405, "step": 5660, "valid_targets_mean": 9180.0, "valid_targets_min": 1869 }, { "epoch": 3.342182890855457, "grad_norm": 0.16358824521292456, "learning_rate": 1.1974033541812124e-05, "loss": 0.3594, "loss_nan_ranks": 0, "loss_rank_avg": 0.13786596059799194, "step": 5665, "valid_targets_mean": 11668.7, "valid_targets_min": 2090 }, { "epoch": 3.3451327433628317, "grad_norm": 0.17494440281924994, "learning_rate": 1.1936322339737193e-05, "loss": 0.3629, "loss_nan_ranks": 0, "loss_rank_avg": 0.13460367918014526, "step": 5670, "valid_targets_mean": 10886.5, "valid_targets_min": 2834 }, { "epoch": 3.3480825958702063, "grad_norm": 0.18096806292604525, "learning_rate": 1.1898645340746242e-05, "loss": 0.3557, "loss_nan_ranks": 0, "loss_rank_avg": 0.1231859102845192, "step": 5675, "valid_targets_mean": 9843.6, "valid_targets_min": 1609 }, { "epoch": 3.3510324483775813, "grad_norm": 0.1659915993499302, "learning_rate": 1.1861002704650897e-05, "loss": 0.3689, "loss_nan_ranks": 0, "loss_rank_avg": 0.11928001046180725, "step": 5680, "valid_targets_mean": 10241.2, "valid_targets_min": 2562 }, { "epoch": 3.353982300884956, "grad_norm": 0.1735036326764437, "learning_rate": 1.1823394591117048e-05, "loss": 0.3613, "loss_nan_ranks": 0, "loss_rank_avg": 0.12572640180587769, "step": 5685, "valid_targets_mean": 10534.2, "valid_targets_min": 1480 }, { "epoch": 3.3569321533923304, "grad_norm": 0.16324620999370973, "learning_rate": 1.1785821159664158e-05, "loss": 0.3595, "loss_nan_ranks": 0, "loss_rank_avg": 0.12011720985174179, "step": 5690, "valid_targets_mean": 11762.8, "valid_targets_min": 2092 }, { "epoch": 3.359882005899705, "grad_norm": 0.1612218314865116, "learning_rate": 1.174828256966456e-05, "loss": 0.3553, "loss_nan_ranks": 0, "loss_rank_avg": 0.11624462157487869, "step": 5695, "valid_targets_mean": 11185.9, "valid_targets_min": 1579 }, { "epoch": 3.3628318584070795, "grad_norm": 0.16525818633723133, "learning_rate": 1.1710778980342834e-05, "loss": 0.3725, "loss_nan_ranks": 0, "loss_rank_avg": 0.12180322408676147, "step": 5700, "valid_targets_mean": 9581.1, "valid_targets_min": 2162 }, { "epoch": 3.365781710914454, "grad_norm": 0.17000114316124038, "learning_rate": 1.1673310550775066e-05, "loss": 0.3652, "loss_nan_ranks": 0, "loss_rank_avg": 0.11625468730926514, "step": 5705, "valid_targets_mean": 10227.8, "valid_targets_min": 832 }, { "epoch": 3.3687315634218287, "grad_norm": 0.16674908078453304, "learning_rate": 1.1635877439888232e-05, "loss": 0.3649, "loss_nan_ranks": 0, "loss_rank_avg": 0.15849077701568604, "step": 5710, "valid_targets_mean": 11126.4, "valid_targets_min": 1768 }, { "epoch": 3.3716814159292037, "grad_norm": 0.16244915053131123, "learning_rate": 1.1598479806459493e-05, "loss": 0.3708, "loss_nan_ranks": 0, "loss_rank_avg": 0.11129726469516754, "step": 5715, "valid_targets_mean": 10253.1, "valid_targets_min": 2074 }, { "epoch": 3.3746312684365782, "grad_norm": 0.1720907804169401, "learning_rate": 1.1561117809115522e-05, "loss": 0.3603, "loss_nan_ranks": 0, "loss_rank_avg": 0.12222810089588165, "step": 5720, "valid_targets_mean": 10034.1, "valid_targets_min": 2135 }, { "epoch": 3.377581120943953, "grad_norm": 0.16006227650596366, "learning_rate": 1.1523791606331844e-05, "loss": 0.3722, "loss_nan_ranks": 0, "loss_rank_avg": 0.12712764739990234, "step": 5725, "valid_targets_mean": 11439.1, "valid_targets_min": 1921 }, { "epoch": 3.3805309734513274, "grad_norm": 0.1844916337446282, "learning_rate": 1.1486501356432157e-05, "loss": 0.3576, "loss_nan_ranks": 0, "loss_rank_avg": 0.12447535246610641, "step": 5730, "valid_targets_mean": 9926.1, "valid_targets_min": 2217 }, { "epoch": 3.383480825958702, "grad_norm": 0.17250265514425828, "learning_rate": 1.1449247217587654e-05, "loss": 0.363, "loss_nan_ranks": 0, "loss_rank_avg": 0.12348814308643341, "step": 5735, "valid_targets_mean": 10439.4, "valid_targets_min": 2181 }, { "epoch": 3.386430678466077, "grad_norm": 0.17414640085174973, "learning_rate": 1.1412029347816364e-05, "loss": 0.3656, "loss_nan_ranks": 0, "loss_rank_avg": 0.12620124220848083, "step": 5740, "valid_targets_mean": 10171.7, "valid_targets_min": 1676 }, { "epoch": 3.3893805309734515, "grad_norm": 0.17188785739593934, "learning_rate": 1.1374847904982476e-05, "loss": 0.3629, "loss_nan_ranks": 0, "loss_rank_avg": 0.11639649420976639, "step": 5745, "valid_targets_mean": 9770.0, "valid_targets_min": 1417 }, { "epoch": 3.392330383480826, "grad_norm": 0.16379536749749107, "learning_rate": 1.1337703046795658e-05, "loss": 0.3645, "loss_nan_ranks": 0, "loss_rank_avg": 0.13657310605049133, "step": 5750, "valid_targets_mean": 11708.1, "valid_targets_min": 1751 }, { "epoch": 3.3952802359882006, "grad_norm": 0.1835047259245895, "learning_rate": 1.1300594930810428e-05, "loss": 0.3668, "loss_nan_ranks": 0, "loss_rank_avg": 0.1326453983783722, "step": 5755, "valid_targets_mean": 10102.0, "valid_targets_min": 1956 }, { "epoch": 3.398230088495575, "grad_norm": 0.1606630887122043, "learning_rate": 1.1263523714425433e-05, "loss": 0.3671, "loss_nan_ranks": 0, "loss_rank_avg": 0.11090432107448578, "step": 5760, "valid_targets_mean": 10676.0, "valid_targets_min": 805 }, { "epoch": 3.4011799410029497, "grad_norm": 0.17060284412602886, "learning_rate": 1.1226489554882808e-05, "loss": 0.3663, "loss_nan_ranks": 0, "loss_rank_avg": 0.12317381799221039, "step": 5765, "valid_targets_mean": 11039.3, "valid_targets_min": 2536 }, { "epoch": 3.4041297935103243, "grad_norm": 0.18149054238359424, "learning_rate": 1.1189492609267518e-05, "loss": 0.3661, "loss_nan_ranks": 0, "loss_rank_avg": 0.12160060554742813, "step": 5770, "valid_targets_mean": 9479.5, "valid_targets_min": 1980 }, { "epoch": 3.4070796460176993, "grad_norm": 0.15777568100406267, "learning_rate": 1.1152533034506668e-05, "loss": 0.3693, "loss_nan_ranks": 0, "loss_rank_avg": 0.12296357750892639, "step": 5775, "valid_targets_mean": 10496.0, "valid_targets_min": 2590 }, { "epoch": 3.410029498525074, "grad_norm": 0.17773974058522804, "learning_rate": 1.1115610987368858e-05, "loss": 0.3677, "loss_nan_ranks": 0, "loss_rank_avg": 0.1567886620759964, "step": 5780, "valid_targets_mean": 11851.6, "valid_targets_min": 1998 }, { "epoch": 3.4129793510324484, "grad_norm": 0.15238485468696308, "learning_rate": 1.1078726624463504e-05, "loss": 0.3595, "loss_nan_ranks": 0, "loss_rank_avg": 0.10325300693511963, "step": 5785, "valid_targets_mean": 9576.4, "valid_targets_min": 1763 }, { "epoch": 3.415929203539823, "grad_norm": 0.15714087387831013, "learning_rate": 1.1041880102240184e-05, "loss": 0.3658, "loss_nan_ranks": 0, "loss_rank_avg": 0.10524867475032806, "step": 5790, "valid_targets_mean": 8958.1, "valid_targets_min": 1310 }, { "epoch": 3.4188790560471976, "grad_norm": 0.16033185917374054, "learning_rate": 1.1005071576987984e-05, "loss": 0.3631, "loss_nan_ranks": 0, "loss_rank_avg": 0.12304713577032089, "step": 5795, "valid_targets_mean": 10463.5, "valid_targets_min": 2114 }, { "epoch": 3.421828908554572, "grad_norm": 0.1873816855988947, "learning_rate": 1.096830120483478e-05, "loss": 0.3641, "loss_nan_ranks": 0, "loss_rank_avg": 0.11564882099628448, "step": 5800, "valid_targets_mean": 9729.3, "valid_targets_min": 1082 }, { "epoch": 3.4247787610619467, "grad_norm": 0.1607099901079245, "learning_rate": 1.0931569141746672e-05, "loss": 0.363, "loss_nan_ranks": 0, "loss_rank_avg": 0.13356913626194, "step": 5805, "valid_targets_mean": 12371.8, "valid_targets_min": 2109 }, { "epoch": 3.4277286135693217, "grad_norm": 0.1665172667935528, "learning_rate": 1.089487554352721e-05, "loss": 0.3635, "loss_nan_ranks": 0, "loss_rank_avg": 0.11274045705795288, "step": 5810, "valid_targets_mean": 9811.8, "valid_targets_min": 2354 }, { "epoch": 3.4306784660766962, "grad_norm": 0.1516818925090918, "learning_rate": 1.085822056581685e-05, "loss": 0.3654, "loss_nan_ranks": 0, "loss_rank_avg": 0.11470094323158264, "step": 5815, "valid_targets_mean": 10083.3, "valid_targets_min": 1855 }, { "epoch": 3.433628318584071, "grad_norm": 0.16050534256161125, "learning_rate": 1.0821604364092173e-05, "loss": 0.3598, "loss_nan_ranks": 0, "loss_rank_avg": 0.10790784657001495, "step": 5820, "valid_targets_mean": 8987.7, "valid_targets_min": 1528 }, { "epoch": 3.4365781710914454, "grad_norm": 0.15780365845904865, "learning_rate": 1.0785027093665338e-05, "loss": 0.3686, "loss_nan_ranks": 0, "loss_rank_avg": 0.11171510070562363, "step": 5825, "valid_targets_mean": 9973.6, "valid_targets_min": 2086 }, { "epoch": 3.43952802359882, "grad_norm": 0.15230714390743114, "learning_rate": 1.074848890968335e-05, "loss": 0.3665, "loss_nan_ranks": 0, "loss_rank_avg": 0.13318592309951782, "step": 5830, "valid_targets_mean": 11855.9, "valid_targets_min": 1948 }, { "epoch": 3.442477876106195, "grad_norm": 0.16470290904412074, "learning_rate": 1.0711989967127411e-05, "loss": 0.3618, "loss_nan_ranks": 0, "loss_rank_avg": 0.11730567365884781, "step": 5835, "valid_targets_mean": 10060.4, "valid_targets_min": 1194 }, { "epoch": 3.4454277286135695, "grad_norm": 0.18454157641952232, "learning_rate": 1.067553042081232e-05, "loss": 0.3655, "loss_nan_ranks": 0, "loss_rank_avg": 0.1288733184337616, "step": 5840, "valid_targets_mean": 10188.3, "valid_targets_min": 1425 }, { "epoch": 3.448377581120944, "grad_norm": 0.16574266792943357, "learning_rate": 1.0639110425385706e-05, "loss": 0.3678, "loss_nan_ranks": 0, "loss_rank_avg": 0.14179229736328125, "step": 5845, "valid_targets_mean": 10892.8, "valid_targets_min": 2394 }, { "epoch": 3.4513274336283186, "grad_norm": 0.16678421583777908, "learning_rate": 1.0602730135327506e-05, "loss": 0.3624, "loss_nan_ranks": 0, "loss_rank_avg": 0.1217309832572937, "step": 5850, "valid_targets_mean": 11444.2, "valid_targets_min": 1168 }, { "epoch": 3.454277286135693, "grad_norm": 0.16968315847539236, "learning_rate": 1.0566389704949182e-05, "loss": 0.3638, "loss_nan_ranks": 0, "loss_rank_avg": 0.1125468909740448, "step": 5855, "valid_targets_mean": 8869.1, "valid_targets_min": 1835 }, { "epoch": 3.4572271386430677, "grad_norm": 0.1627605634002582, "learning_rate": 1.0530089288393186e-05, "loss": 0.3608, "loss_nan_ranks": 0, "loss_rank_avg": 0.12059512734413147, "step": 5860, "valid_targets_mean": 10218.8, "valid_targets_min": 1490 }, { "epoch": 3.4601769911504423, "grad_norm": 0.16403510964024512, "learning_rate": 1.0493829039632177e-05, "loss": 0.3621, "loss_nan_ranks": 0, "loss_rank_avg": 0.1418202966451645, "step": 5865, "valid_targets_mean": 12011.1, "valid_targets_min": 1228 }, { "epoch": 3.4631268436578173, "grad_norm": 0.17134085314800312, "learning_rate": 1.0457609112468505e-05, "loss": 0.3669, "loss_nan_ranks": 0, "loss_rank_avg": 0.13072720170021057, "step": 5870, "valid_targets_mean": 9414.9, "valid_targets_min": 2166 }, { "epoch": 3.466076696165192, "grad_norm": 0.17700321377311182, "learning_rate": 1.0421429660533456e-05, "loss": 0.3669, "loss_nan_ranks": 0, "loss_rank_avg": 0.10390730202198029, "step": 5875, "valid_targets_mean": 8437.3, "valid_targets_min": 2591 }, { "epoch": 3.4690265486725664, "grad_norm": 0.16339951264714045, "learning_rate": 1.038529083728663e-05, "loss": 0.3691, "loss_nan_ranks": 0, "loss_rank_avg": 0.1167861744761467, "step": 5880, "valid_targets_mean": 10423.9, "valid_targets_min": 1563 }, { "epoch": 3.471976401179941, "grad_norm": 0.15604649534709167, "learning_rate": 1.0349192796015315e-05, "loss": 0.3599, "loss_nan_ranks": 0, "loss_rank_avg": 0.11106991767883301, "step": 5885, "valid_targets_mean": 10573.0, "valid_targets_min": 1979 }, { "epoch": 3.4749262536873156, "grad_norm": 0.16586097181275214, "learning_rate": 1.0313135689833795e-05, "loss": 0.3665, "loss_nan_ranks": 0, "loss_rank_avg": 0.11501479148864746, "step": 5890, "valid_targets_mean": 9576.9, "valid_targets_min": 1775 }, { "epoch": 3.47787610619469, "grad_norm": 0.1676293724345518, "learning_rate": 1.0277119671682762e-05, "loss": 0.3714, "loss_nan_ranks": 0, "loss_rank_avg": 0.14278097450733185, "step": 5895, "valid_targets_mean": 12086.6, "valid_targets_min": 2387 }, { "epoch": 3.4808259587020647, "grad_norm": 0.18486186420421635, "learning_rate": 1.0241144894328571e-05, "loss": 0.3604, "loss_nan_ranks": 0, "loss_rank_avg": 0.10634157061576843, "step": 5900, "valid_targets_mean": 9452.8, "valid_targets_min": 1872 }, { "epoch": 3.4837758112094397, "grad_norm": 0.1606984225160234, "learning_rate": 1.0205211510362711e-05, "loss": 0.3651, "loss_nan_ranks": 0, "loss_rank_avg": 0.13014531135559082, "step": 5905, "valid_targets_mean": 10363.9, "valid_targets_min": 2676 }, { "epoch": 3.4867256637168142, "grad_norm": 0.16521860033718624, "learning_rate": 1.0169319672201032e-05, "loss": 0.3594, "loss_nan_ranks": 0, "loss_rank_avg": 0.10334562510251999, "step": 5910, "valid_targets_mean": 8599.8, "valid_targets_min": 1704 }, { "epoch": 3.489675516224189, "grad_norm": 0.17246533091080463, "learning_rate": 1.013346953208322e-05, "loss": 0.3706, "loss_nan_ranks": 0, "loss_rank_avg": 0.12668567895889282, "step": 5915, "valid_targets_mean": 9828.8, "valid_targets_min": 1672 }, { "epoch": 3.4926253687315634, "grad_norm": 0.17718900262395443, "learning_rate": 1.0097661242072058e-05, "loss": 0.3621, "loss_nan_ranks": 0, "loss_rank_avg": 0.10251834243535995, "step": 5920, "valid_targets_mean": 9252.2, "valid_targets_min": 1382 }, { "epoch": 3.495575221238938, "grad_norm": 0.1706768671141397, "learning_rate": 1.006189495405283e-05, "loss": 0.3657, "loss_nan_ranks": 0, "loss_rank_avg": 0.13219738006591797, "step": 5925, "valid_targets_mean": 9495.1, "valid_targets_min": 872 }, { "epoch": 3.4985250737463125, "grad_norm": 0.16744200861029962, "learning_rate": 1.0026170819732664e-05, "loss": 0.3666, "loss_nan_ranks": 0, "loss_rank_avg": 0.12546458840370178, "step": 5930, "valid_targets_mean": 10810.9, "valid_targets_min": 1698 }, { "epoch": 3.501474926253687, "grad_norm": 0.19280117217492482, "learning_rate": 9.990488990639878e-06, "loss": 0.3672, "loss_nan_ranks": 0, "loss_rank_avg": 0.10583603382110596, "step": 5935, "valid_targets_mean": 9692.6, "valid_targets_min": 2361 }, { "epoch": 3.504424778761062, "grad_norm": 0.17427047444951693, "learning_rate": 9.954849618123354e-06, "loss": 0.3686, "loss_nan_ranks": 0, "loss_rank_avg": 0.12246609479188919, "step": 5940, "valid_targets_mean": 10629.6, "valid_targets_min": 861 }, { "epoch": 3.5073746312684366, "grad_norm": 0.16144722770141756, "learning_rate": 9.919252853351895e-06, "loss": 0.362, "loss_nan_ranks": 0, "loss_rank_avg": 0.12689387798309326, "step": 5945, "valid_targets_mean": 11336.1, "valid_targets_min": 1485 }, { "epoch": 3.510324483775811, "grad_norm": 0.17751770876828085, "learning_rate": 9.883698847313567e-06, "loss": 0.3606, "loss_nan_ranks": 0, "loss_rank_avg": 0.1402921825647354, "step": 5950, "valid_targets_mean": 10965.7, "valid_targets_min": 1453 }, { "epoch": 3.5132743362831858, "grad_norm": 0.16111628346749318, "learning_rate": 9.848187750815078e-06, "loss": 0.3699, "loss_nan_ranks": 0, "loss_rank_avg": 0.10104361176490784, "step": 5955, "valid_targets_mean": 9067.2, "valid_targets_min": 1415 }, { "epoch": 3.5162241887905603, "grad_norm": 0.17491887195807487, "learning_rate": 9.812719714481116e-06, "loss": 0.3615, "loss_nan_ranks": 0, "loss_rank_avg": 0.10616336017847061, "step": 5960, "valid_targets_mean": 8690.3, "valid_targets_min": 1929 }, { "epoch": 3.5191740412979353, "grad_norm": 0.16660955612607778, "learning_rate": 9.77729488875375e-06, "loss": 0.3664, "loss_nan_ranks": 0, "loss_rank_avg": 0.11444689333438873, "step": 5965, "valid_targets_mean": 9147.6, "valid_targets_min": 2141 }, { "epoch": 3.52212389380531, "grad_norm": 0.16246815509165646, "learning_rate": 9.741913423891743e-06, "loss": 0.3612, "loss_nan_ranks": 0, "loss_rank_avg": 0.1039552316069603, "step": 5970, "valid_targets_mean": 8341.9, "valid_targets_min": 1249 }, { "epoch": 3.5250737463126844, "grad_norm": 0.161823649040674, "learning_rate": 9.706575469969945e-06, "loss": 0.3628, "loss_nan_ranks": 0, "loss_rank_avg": 0.11723171174526215, "step": 5975, "valid_targets_mean": 10117.9, "valid_targets_min": 2552 }, { "epoch": 3.528023598820059, "grad_norm": 0.14801245024385287, "learning_rate": 9.671281176878648e-06, "loss": 0.3606, "loss_nan_ranks": 0, "loss_rank_avg": 0.10321583598852158, "step": 5980, "valid_targets_mean": 9323.1, "valid_targets_min": 2004 }, { "epoch": 3.5309734513274336, "grad_norm": 0.16517006713119983, "learning_rate": 9.636030694322954e-06, "loss": 0.3647, "loss_nan_ranks": 0, "loss_rank_avg": 0.1235896423459053, "step": 5985, "valid_targets_mean": 9358.4, "valid_targets_min": 2727 }, { "epoch": 3.533923303834808, "grad_norm": 0.15787575860756062, "learning_rate": 9.600824171822131e-06, "loss": 0.3698, "loss_nan_ranks": 0, "loss_rank_avg": 0.14009323716163635, "step": 5990, "valid_targets_mean": 10875.3, "valid_targets_min": 1560 }, { "epoch": 3.5368731563421827, "grad_norm": 0.16337294055437676, "learning_rate": 9.565661758708989e-06, "loss": 0.3685, "loss_nan_ranks": 0, "loss_rank_avg": 0.13032642006874084, "step": 5995, "valid_targets_mean": 10745.1, "valid_targets_min": 2356 }, { "epoch": 3.5398230088495577, "grad_norm": 0.1644220317684143, "learning_rate": 9.530543604129257e-06, "loss": 0.3657, "loss_nan_ranks": 0, "loss_rank_avg": 0.10932029783725739, "step": 6000, "valid_targets_mean": 9117.4, "valid_targets_min": 2033 }, { "epoch": 3.5427728613569323, "grad_norm": 0.19450356644800085, "learning_rate": 9.495469857040895e-06, "loss": 0.347, "loss_nan_ranks": 0, "loss_rank_avg": 0.09607994556427002, "step": 6005, "valid_targets_mean": 8322.1, "valid_targets_min": 2131 }, { "epoch": 3.545722713864307, "grad_norm": 0.17538929126825079, "learning_rate": 9.460440666213564e-06, "loss": 0.3515, "loss_nan_ranks": 0, "loss_rank_avg": 0.11947473138570786, "step": 6010, "valid_targets_mean": 10406.2, "valid_targets_min": 1407 }, { "epoch": 3.5486725663716814, "grad_norm": 0.1664245322565486, "learning_rate": 9.425456180227863e-06, "loss": 0.3398, "loss_nan_ranks": 0, "loss_rank_avg": 0.1309795081615448, "step": 6015, "valid_targets_mean": 12493.9, "valid_targets_min": 2457 }, { "epoch": 3.551622418879056, "grad_norm": 0.15993576182334512, "learning_rate": 9.390516547474841e-06, "loss": 0.3399, "loss_nan_ranks": 0, "loss_rank_avg": 0.10049040615558624, "step": 6020, "valid_targets_mean": 9960.1, "valid_targets_min": 2052 }, { "epoch": 3.554572271386431, "grad_norm": 0.1703810082388185, "learning_rate": 9.355621916155233e-06, "loss": 0.3497, "loss_nan_ranks": 0, "loss_rank_avg": 0.09826871007680893, "step": 6025, "valid_targets_mean": 8378.8, "valid_targets_min": 1560 }, { "epoch": 3.557522123893805, "grad_norm": 0.17052371007062495, "learning_rate": 9.320772434278944e-06, "loss": 0.3446, "loss_nan_ranks": 0, "loss_rank_avg": 0.10447744280099869, "step": 6030, "valid_targets_mean": 9472.5, "valid_targets_min": 2484 }, { "epoch": 3.56047197640118, "grad_norm": 0.1740402728099229, "learning_rate": 9.285968249664348e-06, "loss": 0.3474, "loss_nan_ranks": 0, "loss_rank_avg": 0.11183241754770279, "step": 6035, "valid_targets_mean": 10299.2, "valid_targets_min": 878 }, { "epoch": 3.5634218289085546, "grad_norm": 0.1727260880217204, "learning_rate": 9.251209509937678e-06, "loss": 0.3449, "loss_nan_ranks": 0, "loss_rank_avg": 0.12178777903318405, "step": 6040, "valid_targets_mean": 10887.9, "valid_targets_min": 2125 }, { "epoch": 3.566371681415929, "grad_norm": 0.1664269769495361, "learning_rate": 9.216496362532444e-06, "loss": 0.3427, "loss_nan_ranks": 0, "loss_rank_avg": 0.14320679008960724, "step": 6045, "valid_targets_mean": 12573.0, "valid_targets_min": 2048 }, { "epoch": 3.5693215339233038, "grad_norm": 0.20720455649601438, "learning_rate": 9.181828954688711e-06, "loss": 0.3466, "loss_nan_ranks": 0, "loss_rank_avg": 0.10612769424915314, "step": 6050, "valid_targets_mean": 9179.3, "valid_targets_min": 1147 }, { "epoch": 3.5722713864306783, "grad_norm": 0.17616659494798745, "learning_rate": 9.147207433452606e-06, "loss": 0.3405, "loss_nan_ranks": 0, "loss_rank_avg": 0.1183801218867302, "step": 6055, "valid_targets_mean": 10706.8, "valid_targets_min": 1593 }, { "epoch": 3.5752212389380533, "grad_norm": 0.19353117371557066, "learning_rate": 9.112631945675543e-06, "loss": 0.3415, "loss_nan_ranks": 0, "loss_rank_avg": 0.11053000390529633, "step": 6060, "valid_targets_mean": 9218.1, "valid_targets_min": 2137 }, { "epoch": 3.578171091445428, "grad_norm": 0.1824706599342028, "learning_rate": 9.07810263801376e-06, "loss": 0.3482, "loss_nan_ranks": 0, "loss_rank_avg": 0.12948954105377197, "step": 6065, "valid_targets_mean": 11224.7, "valid_targets_min": 1822 }, { "epoch": 3.5811209439528024, "grad_norm": 0.17690069727924032, "learning_rate": 9.04361965692754e-06, "loss": 0.3438, "loss_nan_ranks": 0, "loss_rank_avg": 0.12248221039772034, "step": 6070, "valid_targets_mean": 11156.6, "valid_targets_min": 1606 }, { "epoch": 3.584070796460177, "grad_norm": 0.1808717891925985, "learning_rate": 9.009183148680732e-06, "loss": 0.3436, "loss_nan_ranks": 0, "loss_rank_avg": 0.12746146321296692, "step": 6075, "valid_targets_mean": 10960.1, "valid_targets_min": 1556 }, { "epoch": 3.5870206489675516, "grad_norm": 0.17184531748341997, "learning_rate": 8.97479325934002e-06, "loss": 0.3471, "loss_nan_ranks": 0, "loss_rank_avg": 0.10450553894042969, "step": 6080, "valid_targets_mean": 9461.7, "valid_targets_min": 1929 }, { "epoch": 3.589970501474926, "grad_norm": 0.173522586995958, "learning_rate": 8.940450134774372e-06, "loss": 0.3533, "loss_nan_ranks": 0, "loss_rank_avg": 0.11991443485021591, "step": 6085, "valid_targets_mean": 9745.5, "valid_targets_min": 1581 }, { "epoch": 3.5929203539823007, "grad_norm": 0.17891278385912598, "learning_rate": 8.906153920654386e-06, "loss": 0.3418, "loss_nan_ranks": 0, "loss_rank_avg": 0.1171131432056427, "step": 6090, "valid_targets_mean": 10080.6, "valid_targets_min": 2923 }, { "epoch": 3.5958702064896757, "grad_norm": 0.1727148337513361, "learning_rate": 8.871904762451684e-06, "loss": 0.3376, "loss_nan_ranks": 0, "loss_rank_avg": 0.10876183956861496, "step": 6095, "valid_targets_mean": 8127.2, "valid_targets_min": 1571 }, { "epoch": 3.5988200589970503, "grad_norm": 0.16448376053014324, "learning_rate": 8.837702805438302e-06, "loss": 0.3489, "loss_nan_ranks": 0, "loss_rank_avg": 0.11159020662307739, "step": 6100, "valid_targets_mean": 10449.8, "valid_targets_min": 1912 }, { "epoch": 3.601769911504425, "grad_norm": 0.17316648159091635, "learning_rate": 8.803548194686052e-06, "loss": 0.3465, "loss_nan_ranks": 0, "loss_rank_avg": 0.10270095616579056, "step": 6105, "valid_targets_mean": 8532.2, "valid_targets_min": 1791 }, { "epoch": 3.6047197640117994, "grad_norm": 0.1648039518875971, "learning_rate": 8.769441075065952e-06, "loss": 0.3486, "loss_nan_ranks": 0, "loss_rank_avg": 0.12315913289785385, "step": 6110, "valid_targets_mean": 11387.8, "valid_targets_min": 2003 }, { "epoch": 3.607669616519174, "grad_norm": 0.1700750326347402, "learning_rate": 8.735381591247531e-06, "loss": 0.3482, "loss_nan_ranks": 0, "loss_rank_avg": 0.11073935031890869, "step": 6115, "valid_targets_mean": 9229.9, "valid_targets_min": 2522 }, { "epoch": 3.6106194690265485, "grad_norm": 0.1650958529279955, "learning_rate": 8.701369887698316e-06, "loss": 0.3442, "loss_nan_ranks": 0, "loss_rank_avg": 0.132333442568779, "step": 6120, "valid_targets_mean": 12198.8, "valid_targets_min": 1675 }, { "epoch": 3.613569321533923, "grad_norm": 0.17293858668863504, "learning_rate": 8.667406108683139e-06, "loss": 0.3462, "loss_nan_ranks": 0, "loss_rank_avg": 0.1118520200252533, "step": 6125, "valid_targets_mean": 10017.0, "valid_targets_min": 1776 }, { "epoch": 3.616519174041298, "grad_norm": 0.16660377768247725, "learning_rate": 8.633490398263554e-06, "loss": 0.3444, "loss_nan_ranks": 0, "loss_rank_avg": 0.10835165530443192, "step": 6130, "valid_targets_mean": 10342.0, "valid_targets_min": 1961 }, { "epoch": 3.6194690265486726, "grad_norm": 0.16884560005763607, "learning_rate": 8.599622900297237e-06, "loss": 0.3436, "loss_nan_ranks": 0, "loss_rank_avg": 0.11159470677375793, "step": 6135, "valid_targets_mean": 9962.6, "valid_targets_min": 2405 }, { "epoch": 3.622418879056047, "grad_norm": 0.1759270006257247, "learning_rate": 8.565803758437362e-06, "loss": 0.3459, "loss_nan_ranks": 0, "loss_rank_avg": 0.09441868960857391, "step": 6140, "valid_targets_mean": 8304.7, "valid_targets_min": 1978 }, { "epoch": 3.6253687315634218, "grad_norm": 0.18070673900085818, "learning_rate": 8.53203311613199e-06, "loss": 0.3427, "loss_nan_ranks": 0, "loss_rank_avg": 0.12781083583831787, "step": 6145, "valid_targets_mean": 12342.4, "valid_targets_min": 2187 }, { "epoch": 3.6283185840707963, "grad_norm": 0.17753626529384683, "learning_rate": 8.498311116623468e-06, "loss": 0.3441, "loss_nan_ranks": 0, "loss_rank_avg": 0.11087179183959961, "step": 6150, "valid_targets_mean": 9165.0, "valid_targets_min": 832 }, { "epoch": 3.6312684365781713, "grad_norm": 0.1646166036937146, "learning_rate": 8.46463790294782e-06, "loss": 0.3452, "loss_nan_ranks": 0, "loss_rank_avg": 0.11283563077449799, "step": 6155, "valid_targets_mean": 10573.9, "valid_targets_min": 2386 }, { "epoch": 3.6342182890855455, "grad_norm": 0.16202203309587745, "learning_rate": 8.431013617934137e-06, "loss": 0.352, "loss_nan_ranks": 0, "loss_rank_avg": 0.0927003026008606, "step": 6160, "valid_targets_mean": 8261.4, "valid_targets_min": 1439 }, { "epoch": 3.6371681415929205, "grad_norm": 0.17678122262561619, "learning_rate": 8.397438404203967e-06, "loss": 0.3558, "loss_nan_ranks": 0, "loss_rank_avg": 0.12316885590553284, "step": 6165, "valid_targets_mean": 9847.7, "valid_targets_min": 1767 }, { "epoch": 3.640117994100295, "grad_norm": 0.1680766739382681, "learning_rate": 8.363912404170738e-06, "loss": 0.3456, "loss_nan_ranks": 0, "loss_rank_avg": 0.1343480795621872, "step": 6170, "valid_targets_mean": 13030.2, "valid_targets_min": 2483 }, { "epoch": 3.6430678466076696, "grad_norm": 0.18380350198660017, "learning_rate": 8.330435760039106e-06, "loss": 0.343, "loss_nan_ranks": 0, "loss_rank_avg": 0.104166179895401, "step": 6175, "valid_targets_mean": 9731.1, "valid_targets_min": 1703 }, { "epoch": 3.646017699115044, "grad_norm": 0.16599997979774428, "learning_rate": 8.297008613804391e-06, "loss": 0.3452, "loss_nan_ranks": 0, "loss_rank_avg": 0.11891473829746246, "step": 6180, "valid_targets_mean": 10780.1, "valid_targets_min": 1649 }, { "epoch": 3.6489675516224187, "grad_norm": 0.167945203058584, "learning_rate": 8.263631107251959e-06, "loss": 0.3517, "loss_nan_ranks": 0, "loss_rank_avg": 0.12040609866380692, "step": 6185, "valid_targets_mean": 10743.4, "valid_targets_min": 1801 }, { "epoch": 3.6519174041297937, "grad_norm": 0.16579591867118337, "learning_rate": 8.230303381956626e-06, "loss": 0.3533, "loss_nan_ranks": 0, "loss_rank_avg": 0.09442141652107239, "step": 6190, "valid_targets_mean": 9102.6, "valid_targets_min": 1830 }, { "epoch": 3.6548672566371683, "grad_norm": 0.16262630444579598, "learning_rate": 8.197025579282048e-06, "loss": 0.3421, "loss_nan_ranks": 0, "loss_rank_avg": 0.0995297059416771, "step": 6195, "valid_targets_mean": 9400.9, "valid_targets_min": 1853 }, { "epoch": 3.657817109144543, "grad_norm": 0.16235716247631857, "learning_rate": 8.163797840380123e-06, "loss": 0.337, "loss_nan_ranks": 0, "loss_rank_avg": 0.11255133152008057, "step": 6200, "valid_targets_mean": 10114.0, "valid_targets_min": 2144 }, { "epoch": 3.6607669616519174, "grad_norm": 0.1754927540173778, "learning_rate": 8.130620306190433e-06, "loss": 0.3372, "loss_nan_ranks": 0, "loss_rank_avg": 0.11358267068862915, "step": 6205, "valid_targets_mean": 9553.2, "valid_targets_min": 2181 }, { "epoch": 3.663716814159292, "grad_norm": 0.17062171541474505, "learning_rate": 8.097493117439554e-06, "loss": 0.3471, "loss_nan_ranks": 0, "loss_rank_avg": 0.11900287866592407, "step": 6210, "valid_targets_mean": 9748.7, "valid_targets_min": 856 }, { "epoch": 3.6666666666666665, "grad_norm": 0.16773458814080258, "learning_rate": 8.064416414640572e-06, "loss": 0.3501, "loss_nan_ranks": 0, "loss_rank_avg": 0.12731051445007324, "step": 6215, "valid_targets_mean": 12207.3, "valid_targets_min": 2941 }, { "epoch": 3.669616519174041, "grad_norm": 0.168416961836028, "learning_rate": 8.031390338092378e-06, "loss": 0.3455, "loss_nan_ranks": 0, "loss_rank_avg": 0.10286203026771545, "step": 6220, "valid_targets_mean": 9607.7, "valid_targets_min": 1480 }, { "epoch": 3.672566371681416, "grad_norm": 0.16945037472215474, "learning_rate": 7.998415027879179e-06, "loss": 0.3532, "loss_nan_ranks": 0, "loss_rank_avg": 0.10942085087299347, "step": 6225, "valid_targets_mean": 10516.6, "valid_targets_min": 1750 }, { "epoch": 3.6755162241887906, "grad_norm": 0.17600897641430144, "learning_rate": 7.965490623869794e-06, "loss": 0.3459, "loss_nan_ranks": 0, "loss_rank_avg": 0.1005764976143837, "step": 6230, "valid_targets_mean": 9166.2, "valid_targets_min": 2342 }, { "epoch": 3.678466076696165, "grad_norm": 0.17173774425396918, "learning_rate": 7.932617265717167e-06, "loss": 0.3479, "loss_nan_ranks": 0, "loss_rank_avg": 0.13368156552314758, "step": 6235, "valid_targets_mean": 10198.2, "valid_targets_min": 1888 }, { "epoch": 3.6814159292035398, "grad_norm": 0.1745358047065503, "learning_rate": 7.899795092857696e-06, "loss": 0.3476, "loss_nan_ranks": 0, "loss_rank_avg": 0.11775140464305878, "step": 6240, "valid_targets_mean": 9976.0, "valid_targets_min": 1591 }, { "epoch": 3.6843657817109143, "grad_norm": 0.17554957959750347, "learning_rate": 7.867024244510673e-06, "loss": 0.342, "loss_nan_ranks": 0, "loss_rank_avg": 0.10555160790681839, "step": 6245, "valid_targets_mean": 8667.3, "valid_targets_min": 1636 }, { "epoch": 3.6873156342182893, "grad_norm": 0.17524218274714723, "learning_rate": 7.834304859677716e-06, "loss": 0.3472, "loss_nan_ranks": 0, "loss_rank_avg": 0.13906937837600708, "step": 6250, "valid_targets_mean": 11671.9, "valid_targets_min": 1372 }, { "epoch": 3.6902654867256635, "grad_norm": 0.17554401621953275, "learning_rate": 7.801637077142104e-06, "loss": 0.3483, "loss_nan_ranks": 0, "loss_rank_avg": 0.1021658331155777, "step": 6255, "valid_targets_mean": 8705.5, "valid_targets_min": 788 }, { "epoch": 3.6932153392330385, "grad_norm": 0.16643085352425324, "learning_rate": 7.769021035468299e-06, "loss": 0.3481, "loss_nan_ranks": 0, "loss_rank_avg": 0.11641626060009003, "step": 6260, "valid_targets_mean": 10789.9, "valid_targets_min": 1629 }, { "epoch": 3.696165191740413, "grad_norm": 0.16909368644232686, "learning_rate": 7.736456873001237e-06, "loss": 0.3524, "loss_nan_ranks": 0, "loss_rank_avg": 0.10872875154018402, "step": 6265, "valid_targets_mean": 9820.9, "valid_targets_min": 2079 }, { "epoch": 3.6991150442477876, "grad_norm": 0.15963667721381897, "learning_rate": 7.703944727865862e-06, "loss": 0.3442, "loss_nan_ranks": 0, "loss_rank_avg": 0.10363304615020752, "step": 6270, "valid_targets_mean": 9519.0, "valid_targets_min": 1443 }, { "epoch": 3.702064896755162, "grad_norm": 0.16511138622677904, "learning_rate": 7.671484737966419e-06, "loss": 0.3454, "loss_nan_ranks": 0, "loss_rank_avg": 0.11367395520210266, "step": 6275, "valid_targets_mean": 11148.6, "valid_targets_min": 2844 }, { "epoch": 3.7050147492625367, "grad_norm": 0.18024864216215955, "learning_rate": 7.639077040985988e-06, "loss": 0.3476, "loss_nan_ranks": 0, "loss_rank_avg": 0.14413657784461975, "step": 6280, "valid_targets_mean": 11772.3, "valid_targets_min": 2041 }, { "epoch": 3.7079646017699117, "grad_norm": 0.1715775268186753, "learning_rate": 7.606721774385799e-06, "loss": 0.3434, "loss_nan_ranks": 0, "loss_rank_avg": 0.10575740039348602, "step": 6285, "valid_targets_mean": 9464.2, "valid_targets_min": 2006 }, { "epoch": 3.7109144542772863, "grad_norm": 0.178496726739179, "learning_rate": 7.574419075404718e-06, "loss": 0.3503, "loss_nan_ranks": 0, "loss_rank_avg": 0.10551615059375763, "step": 6290, "valid_targets_mean": 10115.8, "valid_targets_min": 2033 }, { "epoch": 3.713864306784661, "grad_norm": 0.16922995334986288, "learning_rate": 7.5421690810586235e-06, "loss": 0.3408, "loss_nan_ranks": 0, "loss_rank_avg": 0.09147170186042786, "step": 6295, "valid_targets_mean": 8914.2, "valid_targets_min": 1829 }, { "epoch": 3.7168141592920354, "grad_norm": 0.1698282291677968, "learning_rate": 7.509971928139848e-06, "loss": 0.3426, "loss_nan_ranks": 0, "loss_rank_avg": 0.12778304517269135, "step": 6300, "valid_targets_mean": 11594.1, "valid_targets_min": 1466 }, { "epoch": 3.71976401179941, "grad_norm": 0.16512789906024777, "learning_rate": 7.477827753216589e-06, "loss": 0.3437, "loss_nan_ranks": 0, "loss_rank_avg": 0.11623457819223404, "step": 6305, "valid_targets_mean": 10735.3, "valid_targets_min": 1786 }, { "epoch": 3.7227138643067845, "grad_norm": 0.17231015736096786, "learning_rate": 7.445736692632326e-06, "loss": 0.3435, "loss_nan_ranks": 0, "loss_rank_avg": 0.11947697401046753, "step": 6310, "valid_targets_mean": 11454.9, "valid_targets_min": 2305 }, { "epoch": 3.725663716814159, "grad_norm": 0.1641230791590994, "learning_rate": 7.413698882505271e-06, "loss": 0.3512, "loss_nan_ranks": 0, "loss_rank_avg": 0.10247132927179337, "step": 6315, "valid_targets_mean": 9119.2, "valid_targets_min": 933 }, { "epoch": 3.728613569321534, "grad_norm": 0.16978357719585283, "learning_rate": 7.381714458727726e-06, "loss": 0.3496, "loss_nan_ranks": 0, "loss_rank_avg": 0.09884299337863922, "step": 6320, "valid_targets_mean": 9410.8, "valid_targets_min": 1837 }, { "epoch": 3.7315634218289087, "grad_norm": 0.15757721589249796, "learning_rate": 7.349783556965588e-06, "loss": 0.34, "loss_nan_ranks": 0, "loss_rank_avg": 0.0996585488319397, "step": 6325, "valid_targets_mean": 9461.3, "valid_targets_min": 1841 }, { "epoch": 3.734513274336283, "grad_norm": 0.16646465943939942, "learning_rate": 7.317906312657714e-06, "loss": 0.3452, "loss_nan_ranks": 0, "loss_rank_avg": 0.1353026032447815, "step": 6330, "valid_targets_mean": 12400.2, "valid_targets_min": 2042 }, { "epoch": 3.737463126843658, "grad_norm": 0.1554771877383893, "learning_rate": 7.286082861015371e-06, "loss": 0.3467, "loss_nan_ranks": 0, "loss_rank_avg": 0.13425269722938538, "step": 6335, "valid_targets_mean": 12530.3, "valid_targets_min": 2926 }, { "epoch": 3.7404129793510323, "grad_norm": 0.181300037618926, "learning_rate": 7.25431333702165e-06, "loss": 0.3442, "loss_nan_ranks": 0, "loss_rank_avg": 0.12450385838747025, "step": 6340, "valid_targets_mean": 10509.6, "valid_targets_min": 649 }, { "epoch": 3.7433628318584073, "grad_norm": 0.1640895467509584, "learning_rate": 7.222597875430915e-06, "loss": 0.3422, "loss_nan_ranks": 0, "loss_rank_avg": 0.11129672080278397, "step": 6345, "valid_targets_mean": 9454.0, "valid_targets_min": 2003 }, { "epoch": 3.7463126843657815, "grad_norm": 0.16861575775932142, "learning_rate": 7.190936610768207e-06, "loss": 0.3453, "loss_nan_ranks": 0, "loss_rank_avg": 0.10709446668624878, "step": 6350, "valid_targets_mean": 9103.6, "valid_targets_min": 1608 }, { "epoch": 3.7492625368731565, "grad_norm": 0.17534385015787332, "learning_rate": 7.159329677328688e-06, "loss": 0.3421, "loss_nan_ranks": 0, "loss_rank_avg": 0.10979295521974564, "step": 6355, "valid_targets_mean": 9436.6, "valid_targets_min": 2137 }, { "epoch": 3.752212389380531, "grad_norm": 0.1709407442953378, "learning_rate": 7.127777209177067e-06, "loss": 0.3442, "loss_nan_ranks": 0, "loss_rank_avg": 0.10932078212499619, "step": 6360, "valid_targets_mean": 9747.0, "valid_targets_min": 1135 }, { "epoch": 3.7551622418879056, "grad_norm": 0.1692586176282364, "learning_rate": 7.096279340147032e-06, "loss": 0.347, "loss_nan_ranks": 0, "loss_rank_avg": 0.11985991895198822, "step": 6365, "valid_targets_mean": 10079.6, "valid_targets_min": 2286 }, { "epoch": 3.75811209439528, "grad_norm": 0.16424785026958424, "learning_rate": 7.064836203840675e-06, "loss": 0.3516, "loss_nan_ranks": 0, "loss_rank_avg": 0.11962170153856277, "step": 6370, "valid_targets_mean": 10582.6, "valid_targets_min": 1657 }, { "epoch": 3.7610619469026547, "grad_norm": 0.17826076992497336, "learning_rate": 7.033447933627959e-06, "loss": 0.3511, "loss_nan_ranks": 0, "loss_rank_avg": 0.10628711432218552, "step": 6375, "valid_targets_mean": 8869.7, "valid_targets_min": 1883 }, { "epoch": 3.7640117994100297, "grad_norm": 0.18140433917301785, "learning_rate": 7.002114662646078e-06, "loss": 0.3386, "loss_nan_ranks": 0, "loss_rank_avg": 0.1187339499592781, "step": 6380, "valid_targets_mean": 10999.8, "valid_targets_min": 1608 }, { "epoch": 3.7669616519174043, "grad_norm": 0.16342405697264487, "learning_rate": 6.970836523798992e-06, "loss": 0.3479, "loss_nan_ranks": 0, "loss_rank_avg": 0.11724892258644104, "step": 6385, "valid_targets_mean": 10845.2, "valid_targets_min": 1769 }, { "epoch": 3.769911504424779, "grad_norm": 0.1769109723907381, "learning_rate": 6.939613649756773e-06, "loss": 0.3443, "loss_nan_ranks": 0, "loss_rank_avg": 0.12063444405794144, "step": 6390, "valid_targets_mean": 11583.4, "valid_targets_min": 2726 }, { "epoch": 3.7728613569321534, "grad_norm": 0.16774493767056747, "learning_rate": 6.908446172955103e-06, "loss": 0.3414, "loss_nan_ranks": 0, "loss_rank_avg": 0.1022709459066391, "step": 6395, "valid_targets_mean": 9023.2, "valid_targets_min": 1719 }, { "epoch": 3.775811209439528, "grad_norm": 0.16532399248445567, "learning_rate": 6.877334225594677e-06, "loss": 0.3455, "loss_nan_ranks": 0, "loss_rank_avg": 0.1327495276927948, "step": 6400, "valid_targets_mean": 11621.1, "valid_targets_min": 1627 }, { "epoch": 3.7787610619469025, "grad_norm": 0.17263632707334922, "learning_rate": 6.846277939640653e-06, "loss": 0.3407, "loss_nan_ranks": 0, "loss_rank_avg": 0.13509851694107056, "step": 6405, "valid_targets_mean": 10227.8, "valid_targets_min": 2542 }, { "epoch": 3.781710914454277, "grad_norm": 0.1668878067844066, "learning_rate": 6.8152774468221195e-06, "loss": 0.3381, "loss_nan_ranks": 0, "loss_rank_avg": 0.10570927709341049, "step": 6410, "valid_targets_mean": 8847.1, "valid_targets_min": 2962 }, { "epoch": 3.784660766961652, "grad_norm": 0.17606729721917502, "learning_rate": 6.78433287863147e-06, "loss": 0.3471, "loss_nan_ranks": 0, "loss_rank_avg": 0.12169715762138367, "step": 6415, "valid_targets_mean": 11824.5, "valid_targets_min": 2336 }, { "epoch": 3.7876106194690267, "grad_norm": 0.174587558240972, "learning_rate": 6.7534443663239314e-06, "loss": 0.3478, "loss_nan_ranks": 0, "loss_rank_avg": 0.14479205012321472, "step": 6420, "valid_targets_mean": 13422.8, "valid_targets_min": 2469 }, { "epoch": 3.7905604719764012, "grad_norm": 0.16719235317425998, "learning_rate": 6.7226120409169185e-06, "loss": 0.3447, "loss_nan_ranks": 0, "loss_rank_avg": 0.08362986892461777, "step": 6425, "valid_targets_mean": 8039.5, "valid_targets_min": 1011 }, { "epoch": 3.793510324483776, "grad_norm": 0.16546216405386466, "learning_rate": 6.6918360331895674e-06, "loss": 0.3438, "loss_nan_ranks": 0, "loss_rank_avg": 0.09400837868452072, "step": 6430, "valid_targets_mean": 8162.9, "valid_targets_min": 1768 }, { "epoch": 3.7964601769911503, "grad_norm": 0.17191373561059659, "learning_rate": 6.661116473682088e-06, "loss": 0.3432, "loss_nan_ranks": 0, "loss_rank_avg": 0.122324638068676, "step": 6435, "valid_targets_mean": 9680.6, "valid_targets_min": 1517 }, { "epoch": 3.799410029498525, "grad_norm": 0.16322793961765103, "learning_rate": 6.630453492695304e-06, "loss": 0.346, "loss_nan_ranks": 0, "loss_rank_avg": 0.11813613772392273, "step": 6440, "valid_targets_mean": 10204.0, "valid_targets_min": 1856 }, { "epoch": 3.8023598820058995, "grad_norm": 0.1652451657616475, "learning_rate": 6.5998472202900254e-06, "loss": 0.3427, "loss_nan_ranks": 0, "loss_rank_avg": 0.13308531045913696, "step": 6445, "valid_targets_mean": 11088.9, "valid_targets_min": 3033 }, { "epoch": 3.8053097345132745, "grad_norm": 0.16790780251020782, "learning_rate": 6.5692977862865285e-06, "loss": 0.3496, "loss_nan_ranks": 0, "loss_rank_avg": 0.10099241137504578, "step": 6450, "valid_targets_mean": 8808.9, "valid_targets_min": 1628 }, { "epoch": 3.808259587020649, "grad_norm": 0.17544823543649818, "learning_rate": 6.538805320264028e-06, "loss": 0.3418, "loss_nan_ranks": 0, "loss_rank_avg": 0.1215641126036644, "step": 6455, "valid_targets_mean": 10004.9, "valid_targets_min": 2090 }, { "epoch": 3.8112094395280236, "grad_norm": 0.15764389972156023, "learning_rate": 6.508369951560054e-06, "loss": 0.3497, "loss_nan_ranks": 0, "loss_rank_avg": 0.12080827355384827, "step": 6460, "valid_targets_mean": 11585.9, "valid_targets_min": 1578 }, { "epoch": 3.814159292035398, "grad_norm": 0.18037623858830892, "learning_rate": 6.477991809270005e-06, "loss": 0.3441, "loss_nan_ranks": 0, "loss_rank_avg": 0.12614494562149048, "step": 6465, "valid_targets_mean": 10658.7, "valid_targets_min": 1712 }, { "epoch": 3.8171091445427727, "grad_norm": 0.16246465667800158, "learning_rate": 6.447671022246495e-06, "loss": 0.3465, "loss_nan_ranks": 0, "loss_rank_avg": 0.1316598355770111, "step": 6470, "valid_targets_mean": 11714.4, "valid_targets_min": 2874 }, { "epoch": 3.8200589970501477, "grad_norm": 0.1671932168668726, "learning_rate": 6.4174077190989134e-06, "loss": 0.3416, "loss_nan_ranks": 0, "loss_rank_avg": 0.09807242453098297, "step": 6475, "valid_targets_mean": 9205.3, "valid_targets_min": 2733 }, { "epoch": 3.823008849557522, "grad_norm": 0.1558550238873647, "learning_rate": 6.387202028192765e-06, "loss": 0.3411, "loss_nan_ranks": 0, "loss_rank_avg": 0.09681665897369385, "step": 6480, "valid_targets_mean": 8837.8, "valid_targets_min": 2032 }, { "epoch": 3.825958702064897, "grad_norm": 0.1599149693693091, "learning_rate": 6.357054077649236e-06, "loss": 0.3426, "loss_nan_ranks": 0, "loss_rank_avg": 0.1108127236366272, "step": 6485, "valid_targets_mean": 10313.7, "valid_targets_min": 2037 }, { "epoch": 3.8289085545722714, "grad_norm": 0.2814540103412294, "learning_rate": 6.326963995344575e-06, "loss": 0.3456, "loss_nan_ranks": 0, "loss_rank_avg": 0.09222610294818878, "step": 6490, "valid_targets_mean": 8079.2, "valid_targets_min": 1799 }, { "epoch": 3.831858407079646, "grad_norm": 0.16787270480252503, "learning_rate": 6.296931908909578e-06, "loss": 0.3386, "loss_nan_ranks": 0, "loss_rank_avg": 0.14041510224342346, "step": 6495, "valid_targets_mean": 11687.4, "valid_targets_min": 1660 }, { "epoch": 3.8348082595870205, "grad_norm": 0.16222885250068517, "learning_rate": 6.266957945729044e-06, "loss": 0.3508, "loss_nan_ranks": 0, "loss_rank_avg": 0.10812919586896896, "step": 6500, "valid_targets_mean": 9689.1, "valid_targets_min": 1213 }, { "epoch": 3.837758112094395, "grad_norm": 0.1619680212917784, "learning_rate": 6.237042232941241e-06, "loss": 0.3452, "loss_nan_ranks": 0, "loss_rank_avg": 0.15254142880439758, "step": 6505, "valid_targets_mean": 13727.9, "valid_targets_min": 2019 }, { "epoch": 3.84070796460177, "grad_norm": 0.16666940188615342, "learning_rate": 6.207184897437355e-06, "loss": 0.343, "loss_nan_ranks": 0, "loss_rank_avg": 0.09690691530704498, "step": 6510, "valid_targets_mean": 8408.8, "valid_targets_min": 1770 }, { "epoch": 3.8436578171091447, "grad_norm": 0.1653920328156485, "learning_rate": 6.17738606586096e-06, "loss": 0.348, "loss_nan_ranks": 0, "loss_rank_avg": 0.12510699033737183, "step": 6515, "valid_targets_mean": 10496.0, "valid_targets_min": 1924 }, { "epoch": 3.8466076696165192, "grad_norm": 0.17052174641185705, "learning_rate": 6.1476458646074765e-06, "loss": 0.3445, "loss_nan_ranks": 0, "loss_rank_avg": 0.10477550327777863, "step": 6520, "valid_targets_mean": 9131.2, "valid_targets_min": 2712 }, { "epoch": 3.849557522123894, "grad_norm": 0.17419686871265677, "learning_rate": 6.117964419823632e-06, "loss": 0.3451, "loss_nan_ranks": 0, "loss_rank_avg": 0.11350217461585999, "step": 6525, "valid_targets_mean": 8391.5, "valid_targets_min": 1896 }, { "epoch": 3.8525073746312684, "grad_norm": 0.16258801176668275, "learning_rate": 6.088341857406952e-06, "loss": 0.3404, "loss_nan_ranks": 0, "loss_rank_avg": 0.10940175503492355, "step": 6530, "valid_targets_mean": 9973.9, "valid_targets_min": 1874 }, { "epoch": 3.855457227138643, "grad_norm": 0.15465794427933052, "learning_rate": 6.058778303005184e-06, "loss": 0.3439, "loss_nan_ranks": 0, "loss_rank_avg": 0.11987055838108063, "step": 6535, "valid_targets_mean": 11387.2, "valid_targets_min": 2079 }, { "epoch": 3.8584070796460175, "grad_norm": 0.16673934443470403, "learning_rate": 6.029273882015794e-06, "loss": 0.3433, "loss_nan_ranks": 0, "loss_rank_avg": 0.11683391779661179, "step": 6540, "valid_targets_mean": 9381.8, "valid_targets_min": 1708 }, { "epoch": 3.8613569321533925, "grad_norm": 0.17985237846474775, "learning_rate": 5.999828719585419e-06, "loss": 0.3478, "loss_nan_ranks": 0, "loss_rank_avg": 0.1079455316066742, "step": 6545, "valid_targets_mean": 8509.3, "valid_targets_min": 1118 }, { "epoch": 3.864306784660767, "grad_norm": 0.16617501395918077, "learning_rate": 5.9704429406093555e-06, "loss": 0.3484, "loss_nan_ranks": 0, "loss_rank_avg": 0.11439075320959091, "step": 6550, "valid_targets_mean": 10374.7, "valid_targets_min": 2011 }, { "epoch": 3.8672566371681416, "grad_norm": 0.1659912761912214, "learning_rate": 5.941116669731011e-06, "loss": 0.3478, "loss_nan_ranks": 0, "loss_rank_avg": 0.14208897948265076, "step": 6555, "valid_targets_mean": 12519.0, "valid_targets_min": 1887 }, { "epoch": 3.870206489675516, "grad_norm": 0.17092514673071188, "learning_rate": 5.9118500313413795e-06, "loss": 0.3396, "loss_nan_ranks": 0, "loss_rank_avg": 0.10985920578241348, "step": 6560, "valid_targets_mean": 9916.1, "valid_targets_min": 1793 }, { "epoch": 3.8731563421828907, "grad_norm": 0.1747700268580997, "learning_rate": 5.882643149578522e-06, "loss": 0.3527, "loss_nan_ranks": 0, "loss_rank_avg": 0.12933915853500366, "step": 6565, "valid_targets_mean": 10340.9, "valid_targets_min": 1125 }, { "epoch": 3.8761061946902657, "grad_norm": 0.1701245952171269, "learning_rate": 5.853496148327032e-06, "loss": 0.3427, "loss_nan_ranks": 0, "loss_rank_avg": 0.12071774899959564, "step": 6570, "valid_targets_mean": 9584.5, "valid_targets_min": 2028 }, { "epoch": 3.87905604719764, "grad_norm": 0.17367176274171137, "learning_rate": 5.824409151217507e-06, "loss": 0.3505, "loss_nan_ranks": 0, "loss_rank_avg": 0.13250917196273804, "step": 6575, "valid_targets_mean": 11590.9, "valid_targets_min": 2261 }, { "epoch": 3.882005899705015, "grad_norm": 0.16070228970994752, "learning_rate": 5.79538228162605e-06, "loss": 0.3456, "loss_nan_ranks": 0, "loss_rank_avg": 0.12515580654144287, "step": 6580, "valid_targets_mean": 11354.4, "valid_targets_min": 1773 }, { "epoch": 3.8849557522123894, "grad_norm": 0.16170822860983441, "learning_rate": 5.76641566267369e-06, "loss": 0.3461, "loss_nan_ranks": 0, "loss_rank_avg": 0.11002568900585175, "step": 6585, "valid_targets_mean": 9635.8, "valid_targets_min": 2187 }, { "epoch": 3.887905604719764, "grad_norm": 0.1722451727249354, "learning_rate": 5.737509417225933e-06, "loss": 0.3404, "loss_nan_ranks": 0, "loss_rank_avg": 0.11824969947338104, "step": 6590, "valid_targets_mean": 10532.5, "valid_targets_min": 1940 }, { "epoch": 3.8908554572271385, "grad_norm": 0.1556413370229152, "learning_rate": 5.70866366789218e-06, "loss": 0.3453, "loss_nan_ranks": 0, "loss_rank_avg": 0.12434402853250504, "step": 6595, "valid_targets_mean": 11384.6, "valid_targets_min": 2096 }, { "epoch": 3.893805309734513, "grad_norm": 0.1656739848194637, "learning_rate": 5.679878537025238e-06, "loss": 0.3415, "loss_nan_ranks": 0, "loss_rank_avg": 0.11528940498828888, "step": 6600, "valid_targets_mean": 10272.5, "valid_targets_min": 2815 }, { "epoch": 3.896755162241888, "grad_norm": 0.1618610591918246, "learning_rate": 5.65115414672079e-06, "loss": 0.3487, "loss_nan_ranks": 0, "loss_rank_avg": 0.13066346943378448, "step": 6605, "valid_targets_mean": 11145.4, "valid_targets_min": 818 }, { "epoch": 3.8997050147492627, "grad_norm": 0.16099503298446652, "learning_rate": 5.622490618816881e-06, "loss": 0.3409, "loss_nan_ranks": 0, "loss_rank_avg": 0.10254774987697601, "step": 6610, "valid_targets_mean": 9275.6, "valid_targets_min": 1757 }, { "epoch": 3.9026548672566372, "grad_norm": 0.16139572620781348, "learning_rate": 5.5938880748934144e-06, "loss": 0.3459, "loss_nan_ranks": 0, "loss_rank_avg": 0.12209212779998779, "step": 6615, "valid_targets_mean": 10562.0, "valid_targets_min": 1778 }, { "epoch": 3.905604719764012, "grad_norm": 0.16912364039387326, "learning_rate": 5.565346636271587e-06, "loss": 0.3434, "loss_nan_ranks": 0, "loss_rank_avg": 0.11217247694730759, "step": 6620, "valid_targets_mean": 9969.5, "valid_targets_min": 1957 }, { "epoch": 3.9085545722713864, "grad_norm": 0.16403825414110845, "learning_rate": 5.536866424013463e-06, "loss": 0.3457, "loss_nan_ranks": 0, "loss_rank_avg": 0.1278546005487442, "step": 6625, "valid_targets_mean": 10153.2, "valid_targets_min": 2191 }, { "epoch": 3.911504424778761, "grad_norm": 0.16830399382047592, "learning_rate": 5.508447558921346e-06, "loss": 0.3522, "loss_nan_ranks": 0, "loss_rank_avg": 0.09282360225915909, "step": 6630, "valid_targets_mean": 8849.2, "valid_targets_min": 324 }, { "epoch": 3.9144542772861355, "grad_norm": 0.15924541084825097, "learning_rate": 5.480090161537388e-06, "loss": 0.3464, "loss_nan_ranks": 0, "loss_rank_avg": 0.12358694523572922, "step": 6635, "valid_targets_mean": 10924.6, "valid_targets_min": 2710 }, { "epoch": 3.9174041297935105, "grad_norm": 0.15560194458761062, "learning_rate": 5.451794352142965e-06, "loss": 0.3491, "loss_nan_ranks": 0, "loss_rank_avg": 0.1277778148651123, "step": 6640, "valid_targets_mean": 11752.3, "valid_targets_min": 1969 }, { "epoch": 3.920353982300885, "grad_norm": 0.16863501499682176, "learning_rate": 5.423560250758264e-06, "loss": 0.3485, "loss_nan_ranks": 0, "loss_rank_avg": 0.13744091987609863, "step": 6645, "valid_targets_mean": 12698.6, "valid_targets_min": 2768 }, { "epoch": 3.9233038348082596, "grad_norm": 0.16556811433623927, "learning_rate": 5.395387977141702e-06, "loss": 0.3506, "loss_nan_ranks": 0, "loss_rank_avg": 0.11003266274929047, "step": 6650, "valid_targets_mean": 10104.6, "valid_targets_min": 1652 }, { "epoch": 3.926253687315634, "grad_norm": 0.1566548731455713, "learning_rate": 5.367277650789455e-06, "loss": 0.3502, "loss_nan_ranks": 0, "loss_rank_avg": 0.12147540599107742, "step": 6655, "valid_targets_mean": 11014.7, "valid_targets_min": 1872 }, { "epoch": 3.9292035398230087, "grad_norm": 0.16800747281497158, "learning_rate": 5.339229390934941e-06, "loss": 0.3444, "loss_nan_ranks": 0, "loss_rank_avg": 0.11620292067527771, "step": 6660, "valid_targets_mean": 10039.7, "valid_targets_min": 2777 }, { "epoch": 3.9321533923303837, "grad_norm": 0.16958647093311707, "learning_rate": 5.311243316548312e-06, "loss": 0.3503, "loss_nan_ranks": 0, "loss_rank_avg": 0.12884800136089325, "step": 6665, "valid_targets_mean": 11453.5, "valid_targets_min": 1275 }, { "epoch": 3.935103244837758, "grad_norm": 0.16445607485119396, "learning_rate": 5.2833195463359725e-06, "loss": 0.351, "loss_nan_ranks": 0, "loss_rank_avg": 0.10376372933387756, "step": 6670, "valid_targets_mean": 8932.7, "valid_targets_min": 1791 }, { "epoch": 3.938053097345133, "grad_norm": 0.17134724997512896, "learning_rate": 5.2554581987400155e-06, "loss": 0.3381, "loss_nan_ranks": 0, "loss_rank_avg": 0.11989767104387283, "step": 6675, "valid_targets_mean": 11101.6, "valid_targets_min": 2707 }, { "epoch": 3.9410029498525074, "grad_norm": 0.1715643102378431, "learning_rate": 5.227659391937812e-06, "loss": 0.3446, "loss_nan_ranks": 0, "loss_rank_avg": 0.13737812638282776, "step": 6680, "valid_targets_mean": 10862.0, "valid_targets_min": 1591 }, { "epoch": 3.943952802359882, "grad_norm": 0.16952566207322528, "learning_rate": 5.199923243841402e-06, "loss": 0.3454, "loss_nan_ranks": 0, "loss_rank_avg": 0.12849953770637512, "step": 6685, "valid_targets_mean": 10801.4, "valid_targets_min": 1421 }, { "epoch": 3.9469026548672566, "grad_norm": 0.1717652002538149, "learning_rate": 5.172249872097108e-06, "loss": 0.3449, "loss_nan_ranks": 0, "loss_rank_avg": 0.11228206753730774, "step": 6690, "valid_targets_mean": 8929.9, "valid_targets_min": 1203 }, { "epoch": 3.949852507374631, "grad_norm": 0.16253902540810058, "learning_rate": 5.144639394084938e-06, "loss": 0.3516, "loss_nan_ranks": 0, "loss_rank_avg": 0.11897753924131393, "step": 6695, "valid_targets_mean": 10474.6, "valid_targets_min": 1041 }, { "epoch": 3.952802359882006, "grad_norm": 0.16657433949683387, "learning_rate": 5.117091926918145e-06, "loss": 0.3474, "loss_nan_ranks": 0, "loss_rank_avg": 0.10188919305801392, "step": 6700, "valid_targets_mean": 8967.3, "valid_targets_min": 2401 }, { "epoch": 3.9557522123893807, "grad_norm": 0.1673520592720761, "learning_rate": 5.089607587442709e-06, "loss": 0.3444, "loss_nan_ranks": 0, "loss_rank_avg": 0.12093910574913025, "step": 6705, "valid_targets_mean": 10507.0, "valid_targets_min": 1811 }, { "epoch": 3.9587020648967552, "grad_norm": 0.16051963913152287, "learning_rate": 5.062186492236849e-06, "loss": 0.35, "loss_nan_ranks": 0, "loss_rank_avg": 0.1005478948354721, "step": 6710, "valid_targets_mean": 9101.4, "valid_targets_min": 1896 }, { "epoch": 3.96165191740413, "grad_norm": 0.1567988848736846, "learning_rate": 5.034828757610526e-06, "loss": 0.3461, "loss_nan_ranks": 0, "loss_rank_avg": 0.12492018938064575, "step": 6715, "valid_targets_mean": 11740.2, "valid_targets_min": 1329 }, { "epoch": 3.9646017699115044, "grad_norm": 0.16986019942555441, "learning_rate": 5.007534499604945e-06, "loss": 0.3467, "loss_nan_ranks": 0, "loss_rank_avg": 0.1041763573884964, "step": 6720, "valid_targets_mean": 8273.8, "valid_targets_min": 1581 }, { "epoch": 3.967551622418879, "grad_norm": 0.16521714927339842, "learning_rate": 4.980303833992073e-06, "loss": 0.3486, "loss_nan_ranks": 0, "loss_rank_avg": 0.1275613158941269, "step": 6725, "valid_targets_mean": 10531.7, "valid_targets_min": 2030 }, { "epoch": 3.9705014749262535, "grad_norm": 0.16816919039174055, "learning_rate": 4.953136876274129e-06, "loss": 0.3414, "loss_nan_ranks": 0, "loss_rank_avg": 0.10549589991569519, "step": 6730, "valid_targets_mean": 8572.2, "valid_targets_min": 1302 }, { "epoch": 3.9734513274336285, "grad_norm": 0.16156063084133174, "learning_rate": 4.9260337416831315e-06, "loss": 0.3505, "loss_nan_ranks": 0, "loss_rank_avg": 0.12027633190155029, "step": 6735, "valid_targets_mean": 10365.0, "valid_targets_min": 1880 }, { "epoch": 3.976401179941003, "grad_norm": 0.16418086724764425, "learning_rate": 4.898994545180362e-06, "loss": 0.3524, "loss_nan_ranks": 0, "loss_rank_avg": 0.135321706533432, "step": 6740, "valid_targets_mean": 11930.6, "valid_targets_min": 1431 }, { "epoch": 3.9793510324483776, "grad_norm": 0.16120879940989763, "learning_rate": 4.872019401455914e-06, "loss": 0.3457, "loss_nan_ranks": 0, "loss_rank_avg": 0.11530904471874237, "step": 6745, "valid_targets_mean": 10015.8, "valid_targets_min": 1439 }, { "epoch": 3.982300884955752, "grad_norm": 0.16461230557595902, "learning_rate": 4.845108424928187e-06, "loss": 0.3457, "loss_nan_ranks": 0, "loss_rank_avg": 0.12305441498756409, "step": 6750, "valid_targets_mean": 10110.8, "valid_targets_min": 2130 }, { "epoch": 3.9852507374631267, "grad_norm": 0.16618178125583494, "learning_rate": 4.8182617297434074e-06, "loss": 0.3492, "loss_nan_ranks": 0, "loss_rank_avg": 0.11000995337963104, "step": 6755, "valid_targets_mean": 9938.6, "valid_targets_min": 1395 }, { "epoch": 3.9882005899705013, "grad_norm": 0.17046042797200478, "learning_rate": 4.791479429775147e-06, "loss": 0.3555, "loss_nan_ranks": 0, "loss_rank_avg": 0.14216330647468567, "step": 6760, "valid_targets_mean": 11508.6, "valid_targets_min": 1832 }, { "epoch": 3.991150442477876, "grad_norm": 0.1518400194788491, "learning_rate": 4.764761638623836e-06, "loss": 0.3439, "loss_nan_ranks": 0, "loss_rank_avg": 0.10530564188957214, "step": 6765, "valid_targets_mean": 9993.5, "valid_targets_min": 2294 }, { "epoch": 3.994100294985251, "grad_norm": 0.1665719804740287, "learning_rate": 4.738108469616285e-06, "loss": 0.3493, "loss_nan_ranks": 0, "loss_rank_avg": 0.1330103576183319, "step": 6770, "valid_targets_mean": 11300.2, "valid_targets_min": 1578 }, { "epoch": 3.9970501474926254, "grad_norm": 0.163422115739297, "learning_rate": 4.711520035805197e-06, "loss": 0.3414, "loss_nan_ranks": 0, "loss_rank_avg": 0.11337786912918091, "step": 6775, "valid_targets_mean": 10239.3, "valid_targets_min": 1636 }, { "epoch": 4.0, "grad_norm": 0.17143272673619384, "learning_rate": 4.6849964499686925e-06, "loss": 0.3446, "loss_nan_ranks": 0, "loss_rank_avg": 0.10329215228557587, "step": 6780, "valid_targets_mean": 9906.2, "valid_targets_min": 1715 }, { "epoch": 4.002949852507375, "grad_norm": 0.16365821049173732, "learning_rate": 4.65853782460985e-06, "loss": 0.348, "loss_nan_ranks": 0, "loss_rank_avg": 0.09373873472213745, "step": 6785, "valid_targets_mean": 7547.9, "valid_targets_min": 1398 }, { "epoch": 4.005899705014749, "grad_norm": 0.164443088571593, "learning_rate": 4.632144271956169e-06, "loss": 0.3509, "loss_nan_ranks": 0, "loss_rank_avg": 0.1149953305721283, "step": 6790, "valid_targets_mean": 9679.5, "valid_targets_min": 2137 }, { "epoch": 4.008849557522124, "grad_norm": 0.16651425905881423, "learning_rate": 4.6058159039591875e-06, "loss": 0.3539, "loss_nan_ranks": 0, "loss_rank_avg": 0.10481321811676025, "step": 6795, "valid_targets_mean": 8938.5, "valid_targets_min": 2170 }, { "epoch": 4.011799410029498, "grad_norm": 0.15841736021868594, "learning_rate": 4.579552832293903e-06, "loss": 0.3539, "loss_nan_ranks": 0, "loss_rank_avg": 0.1180085763335228, "step": 6800, "valid_targets_mean": 10395.2, "valid_targets_min": 2412 }, { "epoch": 4.014749262536873, "grad_norm": 0.16169146415784627, "learning_rate": 4.5533551683583935e-06, "loss": 0.3558, "loss_nan_ranks": 0, "loss_rank_avg": 0.12989673018455505, "step": 6805, "valid_targets_mean": 10598.5, "valid_targets_min": 1780 }, { "epoch": 4.017699115044247, "grad_norm": 0.1611965264717543, "learning_rate": 4.527223023273275e-06, "loss": 0.353, "loss_nan_ranks": 0, "loss_rank_avg": 0.12244442850351334, "step": 6810, "valid_targets_mean": 10495.7, "valid_targets_min": 1490 }, { "epoch": 4.020648967551622, "grad_norm": 0.15473504780481703, "learning_rate": 4.501156507881262e-06, "loss": 0.3526, "loss_nan_ranks": 0, "loss_rank_avg": 0.1352512538433075, "step": 6815, "valid_targets_mean": 12575.5, "valid_targets_min": 1549 }, { "epoch": 4.023598820058997, "grad_norm": 0.15054625331409213, "learning_rate": 4.4751557327467145e-06, "loss": 0.3559, "loss_nan_ranks": 0, "loss_rank_avg": 0.13213303685188293, "step": 6820, "valid_targets_mean": 11952.8, "valid_targets_min": 1639 }, { "epoch": 4.0265486725663715, "grad_norm": 0.16572229917038309, "learning_rate": 4.449220808155103e-06, "loss": 0.3582, "loss_nan_ranks": 0, "loss_rank_avg": 0.11531409621238708, "step": 6825, "valid_targets_mean": 10646.2, "valid_targets_min": 1310 }, { "epoch": 4.0294985250737465, "grad_norm": 0.15671781348401131, "learning_rate": 4.42335184411264e-06, "loss": 0.3572, "loss_nan_ranks": 0, "loss_rank_avg": 0.11736129224300385, "step": 6830, "valid_targets_mean": 10609.1, "valid_targets_min": 1471 }, { "epoch": 4.032448377581121, "grad_norm": 0.14812414015958358, "learning_rate": 4.3975489503457e-06, "loss": 0.3496, "loss_nan_ranks": 0, "loss_rank_avg": 0.1351662576198578, "step": 6835, "valid_targets_mean": 12694.0, "valid_targets_min": 1997 }, { "epoch": 4.035398230088496, "grad_norm": 0.1612795719679882, "learning_rate": 4.371812236300468e-06, "loss": 0.3581, "loss_nan_ranks": 0, "loss_rank_avg": 0.12117096781730652, "step": 6840, "valid_targets_mean": 10021.1, "valid_targets_min": 1342 }, { "epoch": 4.038348082595871, "grad_norm": 0.16538082905966264, "learning_rate": 4.346141811142368e-06, "loss": 0.352, "loss_nan_ranks": 0, "loss_rank_avg": 0.12282433360815048, "step": 6845, "valid_targets_mean": 10509.8, "valid_targets_min": 2085 }, { "epoch": 4.041297935103245, "grad_norm": 0.16131890977155694, "learning_rate": 4.320537783755694e-06, "loss": 0.3602, "loss_nan_ranks": 0, "loss_rank_avg": 0.11613143980503082, "step": 6850, "valid_targets_mean": 9730.3, "valid_targets_min": 2631 }, { "epoch": 4.04424778761062, "grad_norm": 0.17654596470525524, "learning_rate": 4.295000262743083e-06, "loss": 0.3502, "loss_nan_ranks": 0, "loss_rank_avg": 0.10903732478618622, "step": 6855, "valid_targets_mean": 9231.4, "valid_targets_min": 2422 }, { "epoch": 4.047197640117994, "grad_norm": 0.17150669044213787, "learning_rate": 4.2695293564250815e-06, "loss": 0.3545, "loss_nan_ranks": 0, "loss_rank_avg": 0.12391988188028336, "step": 6860, "valid_targets_mean": 9515.6, "valid_targets_min": 1609 }, { "epoch": 4.050147492625369, "grad_norm": 0.15235581223553574, "learning_rate": 4.244125172839684e-06, "loss": 0.3496, "loss_nan_ranks": 0, "loss_rank_avg": 0.09287584573030472, "step": 6865, "valid_targets_mean": 9326.3, "valid_targets_min": 1804 }, { "epoch": 4.053097345132743, "grad_norm": 0.14906974124510863, "learning_rate": 4.21878781974186e-06, "loss": 0.3508, "loss_nan_ranks": 0, "loss_rank_avg": 0.09931151568889618, "step": 6870, "valid_targets_mean": 8140.9, "valid_targets_min": 1842 }, { "epoch": 4.056047197640118, "grad_norm": 0.16023146247364678, "learning_rate": 4.193517404603142e-06, "loss": 0.354, "loss_nan_ranks": 0, "loss_rank_avg": 0.10166919231414795, "step": 6875, "valid_targets_mean": 8372.6, "valid_targets_min": 2308 }, { "epoch": 4.058997050147493, "grad_norm": 0.15800640221773357, "learning_rate": 4.168314034611091e-06, "loss": 0.3502, "loss_nan_ranks": 0, "loss_rank_avg": 0.12523864209651947, "step": 6880, "valid_targets_mean": 10681.7, "valid_targets_min": 1131 }, { "epoch": 4.061946902654867, "grad_norm": 0.1654824330981487, "learning_rate": 4.143177816668931e-06, "loss": 0.3506, "loss_nan_ranks": 0, "loss_rank_avg": 0.12416894733905792, "step": 6885, "valid_targets_mean": 9500.6, "valid_targets_min": 2254 }, { "epoch": 4.064896755162242, "grad_norm": 0.1656973469362214, "learning_rate": 4.118108857395011e-06, "loss": 0.3547, "loss_nan_ranks": 0, "loss_rank_avg": 0.12975981831550598, "step": 6890, "valid_targets_mean": 11167.9, "valid_targets_min": 2228 }, { "epoch": 4.067846607669616, "grad_norm": 0.16228434232902877, "learning_rate": 4.093107263122433e-06, "loss": 0.3555, "loss_nan_ranks": 0, "loss_rank_avg": 0.12434341013431549, "step": 6895, "valid_targets_mean": 10814.7, "valid_targets_min": 2296 }, { "epoch": 4.070796460176991, "grad_norm": 0.14909841844413213, "learning_rate": 4.068173139898541e-06, "loss": 0.3511, "loss_nan_ranks": 0, "loss_rank_avg": 0.109537772834301, "step": 6900, "valid_targets_mean": 10893.3, "valid_targets_min": 1884 }, { "epoch": 4.073746312684365, "grad_norm": 0.15803593887854933, "learning_rate": 4.043306593484493e-06, "loss": 0.3544, "loss_nan_ranks": 0, "loss_rank_avg": 0.11893521994352341, "step": 6905, "valid_targets_mean": 11079.8, "valid_targets_min": 3070 }, { "epoch": 4.07669616519174, "grad_norm": 0.1614974693410678, "learning_rate": 4.018507729354815e-06, "loss": 0.3537, "loss_nan_ranks": 0, "loss_rank_avg": 0.09593460708856583, "step": 6910, "valid_targets_mean": 8570.8, "valid_targets_min": 1983 }, { "epoch": 4.079646017699115, "grad_norm": 0.1606360032844375, "learning_rate": 3.99377665269695e-06, "loss": 0.3571, "loss_nan_ranks": 0, "loss_rank_avg": 0.14845268428325653, "step": 6915, "valid_targets_mean": 12068.4, "valid_targets_min": 3185 }, { "epoch": 4.0825958702064895, "grad_norm": 0.14277977783783713, "learning_rate": 3.969113468410813e-06, "loss": 0.3532, "loss_nan_ranks": 0, "loss_rank_avg": 0.10441142320632935, "step": 6920, "valid_targets_mean": 11027.8, "valid_targets_min": 2368 }, { "epoch": 4.0855457227138645, "grad_norm": 0.16483615071706414, "learning_rate": 3.944518281108343e-06, "loss": 0.351, "loss_nan_ranks": 0, "loss_rank_avg": 0.10914063453674316, "step": 6925, "valid_targets_mean": 9420.6, "valid_targets_min": 1195 }, { "epoch": 4.088495575221239, "grad_norm": 0.16405075701609317, "learning_rate": 3.919991195113062e-06, "loss": 0.3583, "loss_nan_ranks": 0, "loss_rank_avg": 0.13144291937351227, "step": 6930, "valid_targets_mean": 10658.9, "valid_targets_min": 1980 }, { "epoch": 4.091445427728614, "grad_norm": 0.15517719230540983, "learning_rate": 3.895532314459631e-06, "loss": 0.3581, "loss_nan_ranks": 0, "loss_rank_avg": 0.13165420293807983, "step": 6935, "valid_targets_mean": 11138.8, "valid_targets_min": 2227 }, { "epoch": 4.094395280235988, "grad_norm": 0.15695515651139186, "learning_rate": 3.87114174289341e-06, "loss": 0.3568, "loss_nan_ranks": 0, "loss_rank_avg": 0.11405207216739655, "step": 6940, "valid_targets_mean": 9765.3, "valid_targets_min": 1932 }, { "epoch": 4.097345132743363, "grad_norm": 0.17367930962714068, "learning_rate": 3.846819583870025e-06, "loss": 0.3563, "loss_nan_ranks": 0, "loss_rank_avg": 0.11271396279335022, "step": 6945, "valid_targets_mean": 9676.6, "valid_targets_min": 1745 }, { "epoch": 4.100294985250738, "grad_norm": 0.17161773141660588, "learning_rate": 3.822565940554912e-06, "loss": 0.3593, "loss_nan_ranks": 0, "loss_rank_avg": 0.11096750199794769, "step": 6950, "valid_targets_mean": 10371.6, "valid_targets_min": 1888 }, { "epoch": 4.103244837758112, "grad_norm": 0.16258274272264253, "learning_rate": 3.7983809158228902e-06, "loss": 0.3592, "loss_nan_ranks": 0, "loss_rank_avg": 0.11564739048480988, "step": 6955, "valid_targets_mean": 8439.3, "valid_targets_min": 1277 }, { "epoch": 4.106194690265487, "grad_norm": 0.1693204121188279, "learning_rate": 3.7742646122577297e-06, "loss": 0.35, "loss_nan_ranks": 0, "loss_rank_avg": 0.1281132996082306, "step": 6960, "valid_targets_mean": 11040.0, "valid_targets_min": 2677 }, { "epoch": 4.109144542772861, "grad_norm": 0.151024673086712, "learning_rate": 3.7502171321517057e-06, "loss": 0.3518, "loss_nan_ranks": 0, "loss_rank_avg": 0.09777649492025375, "step": 6965, "valid_targets_mean": 8500.1, "valid_targets_min": 2033 }, { "epoch": 4.112094395280236, "grad_norm": 0.18444964223806018, "learning_rate": 3.7262385775051722e-06, "loss": 0.3534, "loss_nan_ranks": 0, "loss_rank_avg": 0.11289547383785248, "step": 6970, "valid_targets_mean": 9576.9, "valid_targets_min": 969 }, { "epoch": 4.115044247787611, "grad_norm": 0.1614686465505653, "learning_rate": 3.702329050026132e-06, "loss": 0.3508, "loss_nan_ranks": 0, "loss_rank_avg": 0.11157312244176865, "step": 6975, "valid_targets_mean": 8877.5, "valid_targets_min": 1814 }, { "epoch": 4.117994100294985, "grad_norm": 0.17523462686891175, "learning_rate": 3.6784886511297947e-06, "loss": 0.3516, "loss_nan_ranks": 0, "loss_rank_avg": 0.12200837582349777, "step": 6980, "valid_targets_mean": 9325.3, "valid_targets_min": 1594 }, { "epoch": 4.12094395280236, "grad_norm": 0.1631631704226555, "learning_rate": 3.654717481938148e-06, "loss": 0.3536, "loss_nan_ranks": 0, "loss_rank_avg": 0.10229149460792542, "step": 6985, "valid_targets_mean": 9552.2, "valid_targets_min": 1684 }, { "epoch": 4.123893805309734, "grad_norm": 0.15629991294424075, "learning_rate": 3.631015643279556e-06, "loss": 0.3518, "loss_nan_ranks": 0, "loss_rank_avg": 0.10814925283193588, "step": 6990, "valid_targets_mean": 8981.8, "valid_targets_min": 1527 }, { "epoch": 4.126843657817109, "grad_norm": 0.17070790018436796, "learning_rate": 3.6073832356882734e-06, "loss": 0.3518, "loss_nan_ranks": 0, "loss_rank_avg": 0.1253635287284851, "step": 6995, "valid_targets_mean": 10686.9, "valid_targets_min": 2034 }, { "epoch": 4.129793510324483, "grad_norm": 0.16450992652358207, "learning_rate": 3.5838203594040933e-06, "loss": 0.3579, "loss_nan_ranks": 0, "loss_rank_avg": 0.1320553421974182, "step": 7000, "valid_targets_mean": 10600.8, "valid_targets_min": 489 }, { "epoch": 4.132743362831858, "grad_norm": 0.15081212631556418, "learning_rate": 3.560327114371842e-06, "loss": 0.3504, "loss_nan_ranks": 0, "loss_rank_avg": 0.11111602932214737, "step": 7005, "valid_targets_mean": 9837.0, "valid_targets_min": 2066 }, { "epoch": 4.135693215339233, "grad_norm": 0.14274429369209427, "learning_rate": 3.536903600241033e-06, "loss": 0.3528, "loss_nan_ranks": 0, "loss_rank_avg": 0.11591881513595581, "step": 7010, "valid_targets_mean": 11523.9, "valid_targets_min": 2625 }, { "epoch": 4.1386430678466075, "grad_norm": 0.15333519477139126, "learning_rate": 3.5135499163653885e-06, "loss": 0.353, "loss_nan_ranks": 0, "loss_rank_avg": 0.12132668495178223, "step": 7015, "valid_targets_mean": 11195.9, "valid_targets_min": 3507 }, { "epoch": 4.1415929203539825, "grad_norm": 0.16346855146116562, "learning_rate": 3.4902661618024356e-06, "loss": 0.3543, "loss_nan_ranks": 0, "loss_rank_avg": 0.12647776305675507, "step": 7020, "valid_targets_mean": 9740.0, "valid_targets_min": 1768 }, { "epoch": 4.144542772861357, "grad_norm": 0.15472435020929068, "learning_rate": 3.467052435313105e-06, "loss": 0.3598, "loss_nan_ranks": 0, "loss_rank_avg": 0.0965496152639389, "step": 7025, "valid_targets_mean": 8208.5, "valid_targets_min": 1597 }, { "epoch": 4.147492625368732, "grad_norm": 0.1565591225922802, "learning_rate": 3.443908835361267e-06, "loss": 0.3583, "loss_nan_ranks": 0, "loss_rank_avg": 0.12220700830221176, "step": 7030, "valid_targets_mean": 10105.2, "valid_targets_min": 1622 }, { "epoch": 4.150442477876107, "grad_norm": 0.16216119191777653, "learning_rate": 3.4208354601133764e-06, "loss": 0.3512, "loss_nan_ranks": 0, "loss_rank_avg": 0.10918645560741425, "step": 7035, "valid_targets_mean": 8631.7, "valid_targets_min": 1531 }, { "epoch": 4.153392330383481, "grad_norm": 0.15150502470187602, "learning_rate": 3.3978324074379777e-06, "loss": 0.3546, "loss_nan_ranks": 0, "loss_rank_avg": 0.1369277685880661, "step": 7040, "valid_targets_mean": 12891.5, "valid_targets_min": 2405 }, { "epoch": 4.156342182890856, "grad_norm": 0.15950154019979157, "learning_rate": 3.3748997749053824e-06, "loss": 0.3532, "loss_nan_ranks": 0, "loss_rank_avg": 0.11721132695674896, "step": 7045, "valid_targets_mean": 9850.0, "valid_targets_min": 1924 }, { "epoch": 4.15929203539823, "grad_norm": 0.15273820356160808, "learning_rate": 3.3520376597871572e-06, "loss": 0.352, "loss_nan_ranks": 0, "loss_rank_avg": 0.12347143888473511, "step": 7050, "valid_targets_mean": 11106.8, "valid_targets_min": 1673 }, { "epoch": 4.162241887905605, "grad_norm": 0.15376128423998026, "learning_rate": 3.3292461590558056e-06, "loss": 0.3585, "loss_nan_ranks": 0, "loss_rank_avg": 0.1032019555568695, "step": 7055, "valid_targets_mean": 8959.6, "valid_targets_min": 457 }, { "epoch": 4.165191740412979, "grad_norm": 0.15639978630694426, "learning_rate": 3.3065253693842815e-06, "loss": 0.3482, "loss_nan_ranks": 0, "loss_rank_avg": 0.10558753460645676, "step": 7060, "valid_targets_mean": 8709.6, "valid_targets_min": 2292 }, { "epoch": 4.168141592920354, "grad_norm": 0.1608503151554277, "learning_rate": 3.2838753871456187e-06, "loss": 0.3544, "loss_nan_ranks": 0, "loss_rank_avg": 0.11058098077774048, "step": 7065, "valid_targets_mean": 9885.4, "valid_targets_min": 1487 }, { "epoch": 4.171091445427729, "grad_norm": 0.16021384382226492, "learning_rate": 3.2612963084125116e-06, "loss": 0.3576, "loss_nan_ranks": 0, "loss_rank_avg": 0.12647023797035217, "step": 7070, "valid_targets_mean": 10233.0, "valid_targets_min": 1671 }, { "epoch": 4.174041297935103, "grad_norm": 0.1591375323482639, "learning_rate": 3.238788228956913e-06, "loss": 0.3604, "loss_nan_ranks": 0, "loss_rank_avg": 0.09633976966142654, "step": 7075, "valid_targets_mean": 8591.2, "valid_targets_min": 1590 }, { "epoch": 4.176991150442478, "grad_norm": 0.16074130498635006, "learning_rate": 3.216351244249616e-06, "loss": 0.3519, "loss_nan_ranks": 0, "loss_rank_avg": 0.11467361450195312, "step": 7080, "valid_targets_mean": 10684.5, "valid_targets_min": 1611 }, { "epoch": 4.179941002949852, "grad_norm": 0.153650155824368, "learning_rate": 3.193985449459858e-06, "loss": 0.3526, "loss_nan_ranks": 0, "loss_rank_avg": 0.11654568463563919, "step": 7085, "valid_targets_mean": 10672.2, "valid_targets_min": 1664 }, { "epoch": 4.182890855457227, "grad_norm": 0.15872416144427312, "learning_rate": 3.17169093945493e-06, "loss": 0.3532, "loss_nan_ranks": 0, "loss_rank_avg": 0.09964530169963837, "step": 7090, "valid_targets_mean": 9493.7, "valid_targets_min": 1927 }, { "epoch": 4.185840707964601, "grad_norm": 0.16000582646104505, "learning_rate": 3.149467808799729e-06, "loss": 0.3549, "loss_nan_ranks": 0, "loss_rank_avg": 0.12831947207450867, "step": 7095, "valid_targets_mean": 10516.8, "valid_targets_min": 1508 }, { "epoch": 4.188790560471976, "grad_norm": 0.14935677128155156, "learning_rate": 3.127316151756421e-06, "loss": 0.353, "loss_nan_ranks": 0, "loss_rank_avg": 0.14910808205604553, "step": 7100, "valid_targets_mean": 13157.5, "valid_targets_min": 2815 }, { "epoch": 4.191740412979351, "grad_norm": 0.15483681811534517, "learning_rate": 3.1052360622839895e-06, "loss": 0.3554, "loss_nan_ranks": 0, "loss_rank_avg": 0.12956783175468445, "step": 7105, "valid_targets_mean": 11703.2, "valid_targets_min": 1570 }, { "epoch": 4.1946902654867255, "grad_norm": 0.14466320946338967, "learning_rate": 3.0832276340378573e-06, "loss": 0.363, "loss_nan_ranks": 0, "loss_rank_avg": 0.13992691040039062, "step": 7110, "valid_targets_mean": 12907.7, "valid_targets_min": 1243 }, { "epoch": 4.1976401179941005, "grad_norm": 0.157117658276334, "learning_rate": 3.061290960369492e-06, "loss": 0.3545, "loss_nan_ranks": 0, "loss_rank_avg": 0.13075107336044312, "step": 7115, "valid_targets_mean": 10809.4, "valid_targets_min": 1625 }, { "epoch": 4.200589970501475, "grad_norm": 0.16367009287077325, "learning_rate": 3.0394261343259978e-06, "loss": 0.3533, "loss_nan_ranks": 0, "loss_rank_avg": 0.11082293093204498, "step": 7120, "valid_targets_mean": 9769.5, "valid_targets_min": 2194 }, { "epoch": 4.20353982300885, "grad_norm": 0.161926795541957, "learning_rate": 3.017633248649736e-06, "loss": 0.3598, "loss_nan_ranks": 0, "loss_rank_avg": 0.13230161368846893, "step": 7125, "valid_targets_mean": 10109.1, "valid_targets_min": 1969 }, { "epoch": 4.206489675516224, "grad_norm": 0.1477163900435012, "learning_rate": 2.9959123957779203e-06, "loss": 0.3479, "loss_nan_ranks": 0, "loss_rank_avg": 0.12325777858495712, "step": 7130, "valid_targets_mean": 11069.5, "valid_targets_min": 2258 }, { "epoch": 4.209439528023599, "grad_norm": 0.15506843168361162, "learning_rate": 2.9742636678422253e-06, "loss": 0.3543, "loss_nan_ranks": 0, "loss_rank_avg": 0.11096407473087311, "step": 7135, "valid_targets_mean": 9698.0, "valid_targets_min": 2368 }, { "epoch": 4.212389380530974, "grad_norm": 0.16109254954313149, "learning_rate": 2.952687156668408e-06, "loss": 0.3529, "loss_nan_ranks": 0, "loss_rank_avg": 0.11004975438117981, "step": 7140, "valid_targets_mean": 9400.0, "valid_targets_min": 1805 }, { "epoch": 4.215339233038348, "grad_norm": 0.14890135216272918, "learning_rate": 2.931182953775895e-06, "loss": 0.3534, "loss_nan_ranks": 0, "loss_rank_avg": 0.10987749695777893, "step": 7145, "valid_targets_mean": 11538.3, "valid_targets_min": 2481 }, { "epoch": 4.218289085545723, "grad_norm": 0.15280391232069168, "learning_rate": 2.909751150377429e-06, "loss": 0.3518, "loss_nan_ranks": 0, "loss_rank_avg": 0.11714964359998703, "step": 7150, "valid_targets_mean": 10323.9, "valid_targets_min": 1960 }, { "epoch": 4.221238938053097, "grad_norm": 0.1603710398345934, "learning_rate": 2.888391837378641e-06, "loss": 0.353, "loss_nan_ranks": 0, "loss_rank_avg": 0.13210344314575195, "step": 7155, "valid_targets_mean": 10748.8, "valid_targets_min": 1490 }, { "epoch": 4.224188790560472, "grad_norm": 0.14641270144989635, "learning_rate": 2.8671051053776944e-06, "loss": 0.3561, "loss_nan_ranks": 0, "loss_rank_avg": 0.11850255727767944, "step": 7160, "valid_targets_mean": 11708.2, "valid_targets_min": 2442 }, { "epoch": 4.227138643067847, "grad_norm": 0.16286550427689112, "learning_rate": 2.8458910446648923e-06, "loss": 0.3555, "loss_nan_ranks": 0, "loss_rank_avg": 0.11870785057544708, "step": 7165, "valid_targets_mean": 8852.9, "valid_targets_min": 216 }, { "epoch": 4.230088495575221, "grad_norm": 0.1556260555961893, "learning_rate": 2.8247497452222883e-06, "loss": 0.3578, "loss_nan_ranks": 0, "loss_rank_avg": 0.11046218127012253, "step": 7170, "valid_targets_mean": 9240.8, "valid_targets_min": 1875 }, { "epoch": 4.233038348082596, "grad_norm": 0.1586469227537557, "learning_rate": 2.803681296723313e-06, "loss": 0.3545, "loss_nan_ranks": 0, "loss_rank_avg": 0.10672442615032196, "step": 7175, "valid_targets_mean": 8434.4, "valid_targets_min": 1529 }, { "epoch": 4.23598820058997, "grad_norm": 0.15901563453616538, "learning_rate": 2.7826857885323934e-06, "loss": 0.3611, "loss_nan_ranks": 0, "loss_rank_avg": 0.10011562705039978, "step": 7180, "valid_targets_mean": 8519.2, "valid_targets_min": 1630 }, { "epoch": 4.238938053097345, "grad_norm": 0.15867627879458304, "learning_rate": 2.761763309704568e-06, "loss": 0.3537, "loss_nan_ranks": 0, "loss_rank_avg": 0.11282973736524582, "step": 7185, "valid_targets_mean": 9477.0, "valid_targets_min": 1957 }, { "epoch": 4.241887905604719, "grad_norm": 0.15255571081123262, "learning_rate": 2.7409139489851066e-06, "loss": 0.3559, "loss_nan_ranks": 0, "loss_rank_avg": 0.12214551120996475, "step": 7190, "valid_targets_mean": 10635.3, "valid_targets_min": 2955 }, { "epoch": 4.244837758112094, "grad_norm": 0.15171028129243372, "learning_rate": 2.7201377948091614e-06, "loss": 0.3504, "loss_nan_ranks": 0, "loss_rank_avg": 0.11917664855718613, "step": 7195, "valid_targets_mean": 11111.0, "valid_targets_min": 2898 }, { "epoch": 4.247787610619469, "grad_norm": 0.15175919291626522, "learning_rate": 2.699434935301335e-06, "loss": 0.3516, "loss_nan_ranks": 0, "loss_rank_avg": 0.1180785596370697, "step": 7200, "valid_targets_mean": 10576.7, "valid_targets_min": 2780 }, { "epoch": 4.2507374631268435, "grad_norm": 0.16419494179861108, "learning_rate": 2.67880545827538e-06, "loss": 0.3629, "loss_nan_ranks": 0, "loss_rank_avg": 0.14159059524536133, "step": 7205, "valid_targets_mean": 12024.1, "valid_targets_min": 2727 }, { "epoch": 4.2536873156342185, "grad_norm": 0.15479354424867625, "learning_rate": 2.65824945123375e-06, "loss": 0.3649, "loss_nan_ranks": 0, "loss_rank_avg": 0.11950947344303131, "step": 7210, "valid_targets_mean": 9545.0, "valid_targets_min": 1882 }, { "epoch": 4.256637168141593, "grad_norm": 0.16371358786704585, "learning_rate": 2.6377670013672998e-06, "loss": 0.3678, "loss_nan_ranks": 0, "loss_rank_avg": 0.10644177347421646, "step": 7215, "valid_targets_mean": 8259.6, "valid_targets_min": 1045 }, { "epoch": 4.259587020648968, "grad_norm": 0.15805330816406019, "learning_rate": 2.6173581955548644e-06, "loss": 0.3647, "loss_nan_ranks": 0, "loss_rank_avg": 0.12316429615020752, "step": 7220, "valid_targets_mean": 10127.1, "valid_targets_min": 1797 }, { "epoch": 4.262536873156342, "grad_norm": 0.1595140145705862, "learning_rate": 2.597023120362907e-06, "loss": 0.368, "loss_nan_ranks": 0, "loss_rank_avg": 0.11776896566152573, "step": 7225, "valid_targets_mean": 8850.4, "valid_targets_min": 1524 }, { "epoch": 4.265486725663717, "grad_norm": 0.15507688803698258, "learning_rate": 2.576761862045174e-06, "loss": 0.3685, "loss_nan_ranks": 0, "loss_rank_avg": 0.09920550137758255, "step": 7230, "valid_targets_mean": 8547.2, "valid_targets_min": 1657 }, { "epoch": 4.268436578171092, "grad_norm": 0.1613867067717064, "learning_rate": 2.5565745065422733e-06, "loss": 0.362, "loss_nan_ranks": 0, "loss_rank_avg": 0.10289187729358673, "step": 7235, "valid_targets_mean": 7498.9, "valid_targets_min": 2006 }, { "epoch": 4.271386430678466, "grad_norm": 0.15493360164306041, "learning_rate": 2.536461139481383e-06, "loss": 0.3666, "loss_nan_ranks": 0, "loss_rank_avg": 0.1283939778804779, "step": 7240, "valid_targets_mean": 10987.5, "valid_targets_min": 2508 }, { "epoch": 4.274336283185841, "grad_norm": 0.14748392784313846, "learning_rate": 2.516421846175814e-06, "loss": 0.3698, "loss_nan_ranks": 0, "loss_rank_avg": 0.11385820806026459, "step": 7245, "valid_targets_mean": 10292.0, "valid_targets_min": 2280 }, { "epoch": 4.277286135693215, "grad_norm": 0.1479679407796802, "learning_rate": 2.4964567116247172e-06, "loss": 0.3674, "loss_nan_ranks": 0, "loss_rank_avg": 0.12190468609333038, "step": 7250, "valid_targets_mean": 10601.8, "valid_targets_min": 1396 }, { "epoch": 4.28023598820059, "grad_norm": 0.15897034975450886, "learning_rate": 2.476565820512664e-06, "loss": 0.3618, "loss_nan_ranks": 0, "loss_rank_avg": 0.13549286127090454, "step": 7255, "valid_targets_mean": 9942.6, "valid_targets_min": 2133 }, { "epoch": 4.283185840707965, "grad_norm": 0.1540025059352752, "learning_rate": 2.4567492572093298e-06, "loss": 0.3704, "loss_nan_ranks": 0, "loss_rank_avg": 0.1373451054096222, "step": 7260, "valid_targets_mean": 9759.4, "valid_targets_min": 1581 }, { "epoch": 4.286135693215339, "grad_norm": 0.14967079433299837, "learning_rate": 2.4370071057691135e-06, "loss": 0.3646, "loss_nan_ranks": 0, "loss_rank_avg": 0.13896623253822327, "step": 7265, "valid_targets_mean": 10620.5, "valid_targets_min": 1461 }, { "epoch": 4.289085545722714, "grad_norm": 0.1635262716112185, "learning_rate": 2.4173394499307846e-06, "loss": 0.3727, "loss_nan_ranks": 0, "loss_rank_avg": 0.11073658615350723, "step": 7270, "valid_targets_mean": 8787.5, "valid_targets_min": 2197 }, { "epoch": 4.292035398230088, "grad_norm": 0.15662348738576132, "learning_rate": 2.3977463731171336e-06, "loss": 0.3686, "loss_nan_ranks": 0, "loss_rank_avg": 0.10898212343454361, "step": 7275, "valid_targets_mean": 9077.8, "valid_targets_min": 2800 }, { "epoch": 4.294985250737463, "grad_norm": 0.15856289750370217, "learning_rate": 2.378227958434616e-06, "loss": 0.3665, "loss_nan_ranks": 0, "loss_rank_avg": 0.12312222272157669, "step": 7280, "valid_targets_mean": 9941.8, "valid_targets_min": 2260 }, { "epoch": 4.297935103244837, "grad_norm": 0.14811468463044616, "learning_rate": 2.3587842886729905e-06, "loss": 0.37, "loss_nan_ranks": 0, "loss_rank_avg": 0.12280742079019547, "step": 7285, "valid_targets_mean": 10138.6, "valid_targets_min": 1655 }, { "epoch": 4.300884955752212, "grad_norm": 0.15642409319377618, "learning_rate": 2.3394154463049847e-06, "loss": 0.361, "loss_nan_ranks": 0, "loss_rank_avg": 0.13053852319717407, "step": 7290, "valid_targets_mean": 9809.2, "valid_targets_min": 1817 }, { "epoch": 4.303834808259587, "grad_norm": 0.15905712907842334, "learning_rate": 2.3201215134859424e-06, "loss": 0.3703, "loss_nan_ranks": 0, "loss_rank_avg": 0.14553436636924744, "step": 7295, "valid_targets_mean": 11053.2, "valid_targets_min": 1891 }, { "epoch": 4.3067846607669615, "grad_norm": 0.15633498376543936, "learning_rate": 2.300902572053445e-06, "loss": 0.3599, "loss_nan_ranks": 0, "loss_rank_avg": 0.1423797309398651, "step": 7300, "valid_targets_mean": 10950.2, "valid_targets_min": 2265 }, { "epoch": 4.3097345132743365, "grad_norm": 0.15432556400228098, "learning_rate": 2.281758703527015e-06, "loss": 0.3669, "loss_nan_ranks": 0, "loss_rank_avg": 0.11870302259922028, "step": 7305, "valid_targets_mean": 9727.5, "valid_targets_min": 1294 }, { "epoch": 4.312684365781711, "grad_norm": 0.14855891542283822, "learning_rate": 2.2626899891077337e-06, "loss": 0.3693, "loss_nan_ranks": 0, "loss_rank_avg": 0.1254224181175232, "step": 7310, "valid_targets_mean": 10823.4, "valid_targets_min": 2542 }, { "epoch": 4.315634218289086, "grad_norm": 0.1481578289958286, "learning_rate": 2.243696509677904e-06, "loss": 0.365, "loss_nan_ranks": 0, "loss_rank_avg": 0.12209489196538925, "step": 7315, "valid_targets_mean": 10381.6, "valid_targets_min": 1504 }, { "epoch": 4.31858407079646, "grad_norm": 0.154762941329994, "learning_rate": 2.2247783458007133e-06, "loss": 0.3634, "loss_nan_ranks": 0, "loss_rank_avg": 0.14160534739494324, "step": 7320, "valid_targets_mean": 10812.6, "valid_targets_min": 1055 }, { "epoch": 4.321533923303835, "grad_norm": 0.15270881348781443, "learning_rate": 2.2059355777198888e-06, "loss": 0.3686, "loss_nan_ranks": 0, "loss_rank_avg": 0.11081090569496155, "step": 7325, "valid_targets_mean": 9040.8, "valid_targets_min": 1130 }, { "epoch": 4.32448377581121, "grad_norm": 0.1548144163105394, "learning_rate": 2.1871682853593555e-06, "loss": 0.3647, "loss_nan_ranks": 0, "loss_rank_avg": 0.10774673521518707, "step": 7330, "valid_targets_mean": 9655.9, "valid_targets_min": 1410 }, { "epoch": 4.327433628318584, "grad_norm": 0.1504121646183315, "learning_rate": 2.1684765483228997e-06, "loss": 0.3646, "loss_nan_ranks": 0, "loss_rank_avg": 0.10418853163719177, "step": 7335, "valid_targets_mean": 8905.6, "valid_targets_min": 1830 }, { "epoch": 4.330383480825959, "grad_norm": 0.14775000972766456, "learning_rate": 2.1498604458938344e-06, "loss": 0.3655, "loss_nan_ranks": 0, "loss_rank_avg": 0.11074630171060562, "step": 7340, "valid_targets_mean": 9882.5, "valid_targets_min": 2408 }, { "epoch": 4.333333333333333, "grad_norm": 0.15125604827288272, "learning_rate": 2.1313200570346513e-06, "loss": 0.3665, "loss_nan_ranks": 0, "loss_rank_avg": 0.1144319623708725, "step": 7345, "valid_targets_mean": 9463.4, "valid_targets_min": 1659 }, { "epoch": 4.336283185840708, "grad_norm": 0.15304017102252931, "learning_rate": 2.112855460386698e-06, "loss": 0.368, "loss_nan_ranks": 0, "loss_rank_avg": 0.111595019698143, "step": 7350, "valid_targets_mean": 11038.2, "valid_targets_min": 1531 }, { "epoch": 4.339233038348082, "grad_norm": 0.15292973670461382, "learning_rate": 2.094466734269849e-06, "loss": 0.3639, "loss_nan_ranks": 0, "loss_rank_avg": 0.12869225442409515, "step": 7355, "valid_targets_mean": 10074.7, "valid_targets_min": 2085 }, { "epoch": 4.342182890855457, "grad_norm": 0.14270513753434333, "learning_rate": 2.076153956682139e-06, "loss": 0.3685, "loss_nan_ranks": 0, "loss_rank_avg": 0.10554344952106476, "step": 7360, "valid_targets_mean": 10108.6, "valid_targets_min": 1642 }, { "epoch": 4.345132743362832, "grad_norm": 0.15014445897583023, "learning_rate": 2.057917205299489e-06, "loss": 0.3686, "loss_nan_ranks": 0, "loss_rank_avg": 0.12004509568214417, "step": 7365, "valid_targets_mean": 9673.6, "valid_targets_min": 997 }, { "epoch": 4.348082595870206, "grad_norm": 0.1576340334574788, "learning_rate": 2.0397565574753255e-06, "loss": 0.3653, "loss_nan_ranks": 0, "loss_rank_avg": 0.10483772307634354, "step": 7370, "valid_targets_mean": 8708.4, "valid_targets_min": 1573 }, { "epoch": 4.351032448377581, "grad_norm": 0.148042243945791, "learning_rate": 2.0216720902402764e-06, "loss": 0.3681, "loss_nan_ranks": 0, "loss_rank_avg": 0.13991913199424744, "step": 7375, "valid_targets_mean": 12304.2, "valid_targets_min": 1814 }, { "epoch": 4.353982300884955, "grad_norm": 0.16331630126439883, "learning_rate": 2.0036638803018425e-06, "loss": 0.3716, "loss_nan_ranks": 0, "loss_rank_avg": 0.12212497740983963, "step": 7380, "valid_targets_mean": 11132.8, "valid_targets_min": 1200 }, { "epoch": 4.35693215339233, "grad_norm": 0.15437374905079762, "learning_rate": 1.98573200404407e-06, "loss": 0.3732, "loss_nan_ranks": 0, "loss_rank_avg": 0.13012322783470154, "step": 7385, "valid_targets_mean": 10237.6, "valid_targets_min": 950 }, { "epoch": 4.359882005899705, "grad_norm": 0.15337072869070487, "learning_rate": 1.9678765375272223e-06, "loss": 0.3672, "loss_nan_ranks": 0, "loss_rank_avg": 0.10758992284536362, "step": 7390, "valid_targets_mean": 10417.7, "valid_targets_min": 2034 }, { "epoch": 4.3628318584070795, "grad_norm": 0.14886015288265325, "learning_rate": 1.9500975564874626e-06, "loss": 0.3583, "loss_nan_ranks": 0, "loss_rank_avg": 0.12389254570007324, "step": 7395, "valid_targets_mean": 11726.6, "valid_targets_min": 1312 }, { "epoch": 4.3657817109144545, "grad_norm": 0.1529975346049962, "learning_rate": 1.9323951363365423e-06, "loss": 0.3643, "loss_nan_ranks": 0, "loss_rank_avg": 0.1035454124212265, "step": 7400, "valid_targets_mean": 8954.2, "valid_targets_min": 1876 }, { "epoch": 4.368731563421829, "grad_norm": 0.16267312185022692, "learning_rate": 1.9147693521614475e-06, "loss": 0.3684, "loss_nan_ranks": 0, "loss_rank_avg": 0.1419374942779541, "step": 7405, "valid_targets_mean": 10257.4, "valid_targets_min": 2939 }, { "epoch": 4.371681415929204, "grad_norm": 0.15661576832988683, "learning_rate": 1.8972202787241345e-06, "loss": 0.3634, "loss_nan_ranks": 0, "loss_rank_avg": 0.11530675739049911, "step": 7410, "valid_targets_mean": 9281.1, "valid_targets_min": 2123 }, { "epoch": 4.374631268436578, "grad_norm": 0.16089922557143402, "learning_rate": 1.8797479904611448e-06, "loss": 0.3638, "loss_nan_ranks": 0, "loss_rank_avg": 0.1313277781009674, "step": 7415, "valid_targets_mean": 9339.8, "valid_targets_min": 2558 }, { "epoch": 4.377581120943953, "grad_norm": 0.1719192971303852, "learning_rate": 1.8623525614833582e-06, "loss": 0.3668, "loss_nan_ranks": 0, "loss_rank_avg": 0.1218654215335846, "step": 7420, "valid_targets_mean": 9360.2, "valid_targets_min": 2415 }, { "epoch": 4.380530973451328, "grad_norm": 0.1661511961649541, "learning_rate": 1.8450340655756304e-06, "loss": 0.3632, "loss_nan_ranks": 0, "loss_rank_avg": 0.11054585874080658, "step": 7425, "valid_targets_mean": 8395.6, "valid_targets_min": 1630 }, { "epoch": 4.383480825958702, "grad_norm": 0.15705768164396808, "learning_rate": 1.8277925761964965e-06, "loss": 0.3589, "loss_nan_ranks": 0, "loss_rank_avg": 0.14034216105937958, "step": 7430, "valid_targets_mean": 12708.2, "valid_targets_min": 3373 }, { "epoch": 4.386430678466077, "grad_norm": 0.14410972407670963, "learning_rate": 1.8106281664778701e-06, "loss": 0.3565, "loss_nan_ranks": 0, "loss_rank_avg": 0.1108931228518486, "step": 7435, "valid_targets_mean": 11102.9, "valid_targets_min": 2383 }, { "epoch": 4.389380530973451, "grad_norm": 0.1585707239081277, "learning_rate": 1.7935409092247002e-06, "loss": 0.3662, "loss_nan_ranks": 0, "loss_rank_avg": 0.11846847832202911, "step": 7440, "valid_targets_mean": 9429.2, "valid_targets_min": 1243 }, { "epoch": 4.392330383480826, "grad_norm": 0.15606287790344534, "learning_rate": 1.7765308769147105e-06, "loss": 0.3626, "loss_nan_ranks": 0, "loss_rank_avg": 0.13980810344219208, "step": 7445, "valid_targets_mean": 12589.8, "valid_targets_min": 1293 }, { "epoch": 4.395280235988201, "grad_norm": 0.14761791334704993, "learning_rate": 1.75959814169804e-06, "loss": 0.3622, "loss_nan_ranks": 0, "loss_rank_avg": 0.11588216572999954, "step": 7450, "valid_targets_mean": 9731.8, "valid_targets_min": 1129 }, { "epoch": 4.398230088495575, "grad_norm": 0.1523426665062693, "learning_rate": 1.7427427753969884e-06, "loss": 0.3609, "loss_nan_ranks": 0, "loss_rank_avg": 0.09459323436021805, "step": 7455, "valid_targets_mean": 8218.8, "valid_targets_min": 595 }, { "epoch": 4.40117994100295, "grad_norm": 0.15717516506454268, "learning_rate": 1.7259648495056568e-06, "loss": 0.3659, "loss_nan_ranks": 0, "loss_rank_avg": 0.1137595921754837, "step": 7460, "valid_targets_mean": 9081.4, "valid_targets_min": 888 }, { "epoch": 4.404129793510324, "grad_norm": 0.14821901334735668, "learning_rate": 1.709264435189699e-06, "loss": 0.3596, "loss_nan_ranks": 0, "loss_rank_avg": 0.12101010233163834, "step": 7465, "valid_targets_mean": 10127.8, "valid_targets_min": 1547 }, { "epoch": 4.407079646017699, "grad_norm": 0.14856901343181347, "learning_rate": 1.6926416032859826e-06, "loss": 0.362, "loss_nan_ranks": 0, "loss_rank_avg": 0.11522223055362701, "step": 7470, "valid_targets_mean": 9777.3, "valid_targets_min": 1666 }, { "epoch": 4.410029498525073, "grad_norm": 0.14887002814263378, "learning_rate": 1.676096424302298e-06, "loss": 0.3626, "loss_nan_ranks": 0, "loss_rank_avg": 0.10992522537708282, "step": 7475, "valid_targets_mean": 8813.1, "valid_targets_min": 2184 }, { "epoch": 4.412979351032448, "grad_norm": 0.15536381393469378, "learning_rate": 1.6596289684170642e-06, "loss": 0.3683, "loss_nan_ranks": 0, "loss_rank_avg": 0.11852423846721649, "step": 7480, "valid_targets_mean": 9679.6, "valid_targets_min": 2445 }, { "epoch": 4.415929203539823, "grad_norm": 0.14499491945938592, "learning_rate": 1.6432393054790274e-06, "loss": 0.3668, "loss_nan_ranks": 0, "loss_rank_avg": 0.11371295899152756, "step": 7485, "valid_targets_mean": 10510.3, "valid_targets_min": 1998 }, { "epoch": 4.4188790560471976, "grad_norm": 0.1610486095581393, "learning_rate": 1.6269275050069677e-06, "loss": 0.3527, "loss_nan_ranks": 0, "loss_rank_avg": 0.1595916897058487, "step": 7490, "valid_targets_mean": 12465.5, "valid_targets_min": 1710 }, { "epoch": 4.421828908554573, "grad_norm": 0.16414754925895014, "learning_rate": 1.6106936361893977e-06, "loss": 0.3448, "loss_nan_ranks": 0, "loss_rank_avg": 0.13262584805488586, "step": 7495, "valid_targets_mean": 10231.8, "valid_targets_min": 2259 }, { "epoch": 4.424778761061947, "grad_norm": 0.15688636504001732, "learning_rate": 1.5945377678842766e-06, "loss": 0.3494, "loss_nan_ranks": 0, "loss_rank_avg": 0.13062500953674316, "step": 7500, "valid_targets_mean": 13320.7, "valid_targets_min": 1376 }, { "epoch": 4.427728613569322, "grad_norm": 0.150362961681588, "learning_rate": 1.5784599686187085e-06, "loss": 0.3412, "loss_nan_ranks": 0, "loss_rank_avg": 0.09411562979221344, "step": 7505, "valid_targets_mean": 8426.0, "valid_targets_min": 1654 }, { "epoch": 4.430678466076696, "grad_norm": 0.16055863518167604, "learning_rate": 1.5624603065886734e-06, "loss": 0.3452, "loss_nan_ranks": 0, "loss_rank_avg": 0.10464043915271759, "step": 7510, "valid_targets_mean": 8610.3, "valid_targets_min": 2335 }, { "epoch": 4.433628318584071, "grad_norm": 0.15928012971833783, "learning_rate": 1.5465388496587053e-06, "loss": 0.3457, "loss_nan_ranks": 0, "loss_rank_avg": 0.11390765011310577, "step": 7515, "valid_targets_mean": 9733.9, "valid_targets_min": 2604 }, { "epoch": 4.436578171091446, "grad_norm": 0.15983062111463275, "learning_rate": 1.53069566536163e-06, "loss": 0.3426, "loss_nan_ranks": 0, "loss_rank_avg": 0.09258467704057693, "step": 7520, "valid_targets_mean": 7887.3, "valid_targets_min": 961 }, { "epoch": 4.43952802359882, "grad_norm": 0.1480222383713337, "learning_rate": 1.5149308208982726e-06, "loss": 0.348, "loss_nan_ranks": 0, "loss_rank_avg": 0.1298375427722931, "step": 7525, "valid_targets_mean": 12008.4, "valid_targets_min": 3631 }, { "epoch": 4.442477876106195, "grad_norm": 0.1528172900821816, "learning_rate": 1.4992443831371596e-06, "loss": 0.3543, "loss_nan_ranks": 0, "loss_rank_avg": 0.12460409104824066, "step": 7530, "valid_targets_mean": 11155.2, "valid_targets_min": 2731 }, { "epoch": 4.445427728613569, "grad_norm": 0.15414750220527093, "learning_rate": 1.4836364186142582e-06, "loss": 0.3428, "loss_nan_ranks": 0, "loss_rank_avg": 0.11743897199630737, "step": 7535, "valid_targets_mean": 10674.4, "valid_targets_min": 1317 }, { "epoch": 4.448377581120944, "grad_norm": 0.15382813152212646, "learning_rate": 1.468106993532674e-06, "loss": 0.3451, "loss_nan_ranks": 0, "loss_rank_avg": 0.13689687848091125, "step": 7540, "valid_targets_mean": 11136.4, "valid_targets_min": 1890 }, { "epoch": 4.451327433628318, "grad_norm": 0.15966041725784386, "learning_rate": 1.4526561737623811e-06, "loss": 0.347, "loss_nan_ranks": 0, "loss_rank_avg": 0.14471429586410522, "step": 7545, "valid_targets_mean": 12538.8, "valid_targets_min": 1856 }, { "epoch": 4.454277286135693, "grad_norm": 0.15405263130677785, "learning_rate": 1.4372840248399378e-06, "loss": 0.3552, "loss_nan_ranks": 0, "loss_rank_avg": 0.1332360804080963, "step": 7550, "valid_targets_mean": 11351.3, "valid_targets_min": 1738 }, { "epoch": 4.457227138643068, "grad_norm": 0.1454681616170232, "learning_rate": 1.421990611968207e-06, "loss": 0.348, "loss_nan_ranks": 0, "loss_rank_avg": 0.09641964733600616, "step": 7555, "valid_targets_mean": 9638.6, "valid_targets_min": 2769 }, { "epoch": 4.460176991150442, "grad_norm": 0.15619107717952554, "learning_rate": 1.4067760000160968e-06, "loss": 0.3464, "loss_nan_ranks": 0, "loss_rank_avg": 0.11662718653678894, "step": 7560, "valid_targets_mean": 10217.3, "valid_targets_min": 1867 }, { "epoch": 4.463126843657817, "grad_norm": 0.1643135977247633, "learning_rate": 1.3916402535182494e-06, "loss": 0.3437, "loss_nan_ranks": 0, "loss_rank_avg": 0.1154789924621582, "step": 7565, "valid_targets_mean": 10830.1, "valid_targets_min": 2056 }, { "epoch": 4.466076696165191, "grad_norm": 0.15658719880104097, "learning_rate": 1.37658343667481e-06, "loss": 0.3419, "loss_nan_ranks": 0, "loss_rank_avg": 0.09098144620656967, "step": 7570, "valid_targets_mean": 8065.7, "valid_targets_min": 2250 }, { "epoch": 4.469026548672566, "grad_norm": 0.15305545076889765, "learning_rate": 1.3616056133511245e-06, "loss": 0.3485, "loss_nan_ranks": 0, "loss_rank_avg": 0.10880333185195923, "step": 7575, "valid_targets_mean": 10655.2, "valid_targets_min": 2555 }, { "epoch": 4.4719764011799406, "grad_norm": 0.15316371686221492, "learning_rate": 1.346706847077477e-06, "loss": 0.3448, "loss_nan_ranks": 0, "loss_rank_avg": 0.12371876835823059, "step": 7580, "valid_targets_mean": 11071.5, "valid_targets_min": 860 }, { "epoch": 4.474926253687316, "grad_norm": 0.17027456090998858, "learning_rate": 1.3318872010488227e-06, "loss": 0.3398, "loss_nan_ranks": 0, "loss_rank_avg": 0.13155479729175568, "step": 7585, "valid_targets_mean": 11408.9, "valid_targets_min": 2015 }, { "epoch": 4.477876106194691, "grad_norm": 0.15247149515898822, "learning_rate": 1.3171467381245217e-06, "loss": 0.3479, "loss_nan_ranks": 0, "loss_rank_avg": 0.09567923843860626, "step": 7590, "valid_targets_mean": 9568.1, "valid_targets_min": 1913 }, { "epoch": 4.480825958702065, "grad_norm": 0.1606651379781345, "learning_rate": 1.3024855208280628e-06, "loss": 0.3492, "loss_nan_ranks": 0, "loss_rank_avg": 0.10479949414730072, "step": 7595, "valid_targets_mean": 9056.0, "valid_targets_min": 1585 }, { "epoch": 4.48377581120944, "grad_norm": 0.1511496049987001, "learning_rate": 1.2879036113468103e-06, "loss": 0.3445, "loss_nan_ranks": 0, "loss_rank_avg": 0.1336202174425125, "step": 7600, "valid_targets_mean": 13044.3, "valid_targets_min": 2160 }, { "epoch": 4.486725663716814, "grad_norm": 0.1547336928002793, "learning_rate": 1.273401071531739e-06, "loss": 0.3493, "loss_nan_ranks": 0, "loss_rank_avg": 0.09686368703842163, "step": 7605, "valid_targets_mean": 9486.9, "valid_targets_min": 1543 }, { "epoch": 4.489675516224189, "grad_norm": 0.1499179724291536, "learning_rate": 1.2589779628971498e-06, "loss": 0.3476, "loss_nan_ranks": 0, "loss_rank_avg": 0.09721426665782928, "step": 7610, "valid_targets_mean": 9637.9, "valid_targets_min": 1453 }, { "epoch": 4.492625368731564, "grad_norm": 0.16171085592994147, "learning_rate": 1.2446343466204525e-06, "loss": 0.3493, "loss_nan_ranks": 0, "loss_rank_avg": 0.1449803113937378, "step": 7615, "valid_targets_mean": 11221.1, "valid_targets_min": 1861 }, { "epoch": 4.495575221238938, "grad_norm": 0.1615174407179875, "learning_rate": 1.2303702835418485e-06, "loss": 0.3472, "loss_nan_ranks": 0, "loss_rank_avg": 0.09636390209197998, "step": 7620, "valid_targets_mean": 7896.7, "valid_targets_min": 1601 }, { "epoch": 4.498525073746313, "grad_norm": 0.1515588014050659, "learning_rate": 1.2161858341641342e-06, "loss": 0.348, "loss_nan_ranks": 0, "loss_rank_avg": 0.12471356987953186, "step": 7625, "valid_targets_mean": 11206.3, "valid_targets_min": 2567 }, { "epoch": 4.501474926253687, "grad_norm": 0.15162574672995982, "learning_rate": 1.2020810586524e-06, "loss": 0.3384, "loss_nan_ranks": 0, "loss_rank_avg": 0.12063919007778168, "step": 7630, "valid_targets_mean": 9940.7, "valid_targets_min": 1487 }, { "epoch": 4.504424778761062, "grad_norm": 0.15943299985208736, "learning_rate": 1.1880560168337896e-06, "loss": 0.3441, "loss_nan_ranks": 0, "loss_rank_avg": 0.11519865691661835, "step": 7635, "valid_targets_mean": 9426.9, "valid_targets_min": 1920 }, { "epoch": 4.507374631268437, "grad_norm": 0.1662033503787035, "learning_rate": 1.1741107681972496e-06, "loss": 0.348, "loss_nan_ranks": 0, "loss_rank_avg": 0.09789461642503738, "step": 7640, "valid_targets_mean": 7889.9, "valid_targets_min": 1997 }, { "epoch": 4.510324483775811, "grad_norm": 0.16145641216897003, "learning_rate": 1.1602453718932715e-06, "loss": 0.3413, "loss_nan_ranks": 0, "loss_rank_avg": 0.09589747339487076, "step": 7645, "valid_targets_mean": 8702.3, "valid_targets_min": 2150 }, { "epoch": 4.513274336283186, "grad_norm": 0.15162396305291637, "learning_rate": 1.1464598867336528e-06, "loss": 0.3379, "loss_nan_ranks": 0, "loss_rank_avg": 0.134039506316185, "step": 7650, "valid_targets_mean": 11533.9, "valid_targets_min": 1871 }, { "epoch": 4.51622418879056, "grad_norm": 0.15346636062924254, "learning_rate": 1.132754371191218e-06, "loss": 0.3345, "loss_nan_ranks": 0, "loss_rank_avg": 0.10973073542118073, "step": 7655, "valid_targets_mean": 10099.0, "valid_targets_min": 2449 }, { "epoch": 4.519174041297935, "grad_norm": 0.1559081775420403, "learning_rate": 1.119128883399614e-06, "loss": 0.3403, "loss_nan_ranks": 0, "loss_rank_avg": 0.12783056497573853, "step": 7660, "valid_targets_mean": 10613.0, "valid_targets_min": 1767 }, { "epoch": 4.522123893805309, "grad_norm": 0.20211025090903367, "learning_rate": 1.1055834811530165e-06, "loss": 0.3475, "loss_nan_ranks": 0, "loss_rank_avg": 0.11391949653625488, "step": 7665, "valid_targets_mean": 9735.8, "valid_targets_min": 1444 }, { "epoch": 4.525073746312684, "grad_norm": 0.14976916014788086, "learning_rate": 1.0921182219059335e-06, "loss": 0.353, "loss_nan_ranks": 0, "loss_rank_avg": 0.12497693300247192, "step": 7670, "valid_targets_mean": 12089.4, "valid_targets_min": 1483 }, { "epoch": 4.5280235988200594, "grad_norm": 0.15886160420092751, "learning_rate": 1.0787331627729182e-06, "loss": 0.3496, "loss_nan_ranks": 0, "loss_rank_avg": 0.11860600858926773, "step": 7675, "valid_targets_mean": 9522.6, "valid_targets_min": 747 }, { "epoch": 4.530973451327434, "grad_norm": 0.16522051263967721, "learning_rate": 1.0654283605283488e-06, "loss": 0.3374, "loss_nan_ranks": 0, "loss_rank_avg": 0.07913932204246521, "step": 7680, "valid_targets_mean": 6589.8, "valid_targets_min": 1001 }, { "epoch": 4.533923303834809, "grad_norm": 0.1709157193165234, "learning_rate": 1.05220387160619e-06, "loss": 0.3492, "loss_nan_ranks": 0, "loss_rank_avg": 0.10800658166408539, "step": 7685, "valid_targets_mean": 8307.7, "valid_targets_min": 1442 }, { "epoch": 4.536873156342183, "grad_norm": 0.15626400784626918, "learning_rate": 1.0390597520997426e-06, "loss": 0.3402, "loss_nan_ranks": 0, "loss_rank_avg": 0.1069958508014679, "step": 7690, "valid_targets_mean": 9174.5, "valid_targets_min": 2099 }, { "epoch": 4.539823008849558, "grad_norm": 0.1512271056093135, "learning_rate": 1.0259960577614091e-06, "loss": 0.3421, "loss_nan_ranks": 0, "loss_rank_avg": 0.11784885823726654, "step": 7695, "valid_targets_mean": 9977.2, "valid_targets_min": 1385 }, { "epoch": 4.542772861356932, "grad_norm": 0.1507369858580233, "learning_rate": 1.0130128440024633e-06, "loss": 0.3377, "loss_nan_ranks": 0, "loss_rank_avg": 0.093796007335186, "step": 7700, "valid_targets_mean": 8322.1, "valid_targets_min": 2131 }, { "epoch": 4.545722713864307, "grad_norm": 0.15852677988252023, "learning_rate": 1.0001101658928092e-06, "loss": 0.3412, "loss_nan_ranks": 0, "loss_rank_avg": 0.1161518543958664, "step": 7705, "valid_targets_mean": 10406.2, "valid_targets_min": 1407 }, { "epoch": 4.548672566371682, "grad_norm": 0.1531404932874041, "learning_rate": 9.872880781607463e-07, "loss": 0.3291, "loss_nan_ranks": 0, "loss_rank_avg": 0.12724629044532776, "step": 7710, "valid_targets_mean": 12493.9, "valid_targets_min": 2457 }, { "epoch": 4.551622418879056, "grad_norm": 0.15451521393434178, "learning_rate": 9.745466351927458e-07, "loss": 0.3302, "loss_nan_ranks": 0, "loss_rank_avg": 0.09752607345581055, "step": 7715, "valid_targets_mean": 9960.1, "valid_targets_min": 2052 }, { "epoch": 4.554572271386431, "grad_norm": 0.16431695986849715, "learning_rate": 9.618858910332073e-07, "loss": 0.339, "loss_nan_ranks": 0, "loss_rank_avg": 0.09468859434127808, "step": 7720, "valid_targets_mean": 8378.8, "valid_targets_min": 1560 }, { "epoch": 4.557522123893805, "grad_norm": 0.15548881510456924, "learning_rate": 9.493058993842408e-07, "loss": 0.3348, "loss_nan_ranks": 0, "loss_rank_avg": 0.10117464512586594, "step": 7725, "valid_targets_mean": 9472.5, "valid_targets_min": 2484 }, { "epoch": 4.56047197640118, "grad_norm": 0.15239276402032617, "learning_rate": 9.368067136054337e-07, "loss": 0.3374, "loss_nan_ranks": 0, "loss_rank_avg": 0.1087859570980072, "step": 7730, "valid_targets_mean": 10299.2, "valid_targets_min": 878 }, { "epoch": 4.563421828908554, "grad_norm": 0.15751354324521347, "learning_rate": 9.243883867136239e-07, "loss": 0.335, "loss_nan_ranks": 0, "loss_rank_avg": 0.11837193369865417, "step": 7735, "valid_targets_mean": 10887.9, "valid_targets_min": 2125 }, { "epoch": 4.566371681415929, "grad_norm": 0.1636132491545048, "learning_rate": 9.120509713826786e-07, "loss": 0.3328, "loss_nan_ranks": 0, "loss_rank_avg": 0.1383325159549713, "step": 7740, "valid_targets_mean": 12573.0, "valid_targets_min": 2048 }, { "epoch": 4.569321533923304, "grad_norm": 0.1582734920218057, "learning_rate": 8.997945199432668e-07, "loss": 0.3366, "loss_nan_ranks": 0, "loss_rank_avg": 0.10354599356651306, "step": 7745, "valid_targets_mean": 9179.3, "valid_targets_min": 1147 }, { "epoch": 4.572271386430678, "grad_norm": 0.14978615383191066, "learning_rate": 8.876190843826426e-07, "loss": 0.3309, "loss_nan_ranks": 0, "loss_rank_avg": 0.11529295146465302, "step": 7750, "valid_targets_mean": 10706.8, "valid_targets_min": 1593 }, { "epoch": 4.575221238938053, "grad_norm": 0.163412064717712, "learning_rate": 8.755247163444137e-07, "loss": 0.3319, "loss_nan_ranks": 0, "loss_rank_avg": 0.10770249366760254, "step": 7755, "valid_targets_mean": 9218.1, "valid_targets_min": 2137 }, { "epoch": 4.578171091445427, "grad_norm": 0.15646391023643355, "learning_rate": 8.635114671283351e-07, "loss": 0.3387, "loss_nan_ranks": 0, "loss_rank_avg": 0.1251239776611328, "step": 7760, "valid_targets_mean": 11224.7, "valid_targets_min": 1822 }, { "epoch": 4.5811209439528024, "grad_norm": 0.1583802965925948, "learning_rate": 8.515793876900957e-07, "loss": 0.3343, "loss_nan_ranks": 0, "loss_rank_avg": 0.11912311613559723, "step": 7765, "valid_targets_mean": 11156.6, "valid_targets_min": 1606 }, { "epoch": 4.584070796460177, "grad_norm": 0.15774668340457346, "learning_rate": 8.397285286410683e-07, "loss": 0.3338, "loss_nan_ranks": 0, "loss_rank_avg": 0.12353400886058807, "step": 7770, "valid_targets_mean": 10960.1, "valid_targets_min": 1556 }, { "epoch": 4.587020648967552, "grad_norm": 0.15917041823937758, "learning_rate": 8.279589402481458e-07, "loss": 0.3376, "loss_nan_ranks": 0, "loss_rank_avg": 0.10141907632350922, "step": 7775, "valid_targets_mean": 9461.7, "valid_targets_min": 1929 }, { "epoch": 4.589970501474927, "grad_norm": 0.15450283281262311, "learning_rate": 8.162706724334812e-07, "loss": 0.3433, "loss_nan_ranks": 0, "loss_rank_avg": 0.1162460520863533, "step": 7780, "valid_targets_mean": 9745.5, "valid_targets_min": 1581 }, { "epoch": 4.592920353982301, "grad_norm": 0.1618381177008798, "learning_rate": 8.046637747743125e-07, "loss": 0.3324, "loss_nan_ranks": 0, "loss_rank_avg": 0.11386996507644653, "step": 7785, "valid_targets_mean": 10080.6, "valid_targets_min": 2923 }, { "epoch": 4.595870206489676, "grad_norm": 0.18422670497164972, "learning_rate": 7.931382965027245e-07, "loss": 0.3278, "loss_nan_ranks": 0, "loss_rank_avg": 0.10538017004728317, "step": 7790, "valid_targets_mean": 8127.2, "valid_targets_min": 1571 }, { "epoch": 4.59882005899705, "grad_norm": 0.16123401086696665, "learning_rate": 7.816942865054566e-07, "loss": 0.3385, "loss_nan_ranks": 0, "loss_rank_avg": 0.1084161102771759, "step": 7795, "valid_targets_mean": 10449.8, "valid_targets_min": 1912 }, { "epoch": 4.601769911504425, "grad_norm": 0.16819343140393953, "learning_rate": 7.703317933236886e-07, "loss": 0.3365, "loss_nan_ranks": 0, "loss_rank_avg": 0.09945972263813019, "step": 7800, "valid_targets_mean": 8532.2, "valid_targets_min": 1791 }, { "epoch": 4.604719764011799, "grad_norm": 0.15125655287965598, "learning_rate": 7.590508651528372e-07, "loss": 0.3386, "loss_nan_ranks": 0, "loss_rank_avg": 0.11926385760307312, "step": 7805, "valid_targets_mean": 11387.8, "valid_targets_min": 2003 }, { "epoch": 4.607669616519174, "grad_norm": 0.16124756947368554, "learning_rate": 7.478515498423577e-07, "loss": 0.3381, "loss_nan_ranks": 0, "loss_rank_avg": 0.10725908726453781, "step": 7810, "valid_targets_mean": 9229.9, "valid_targets_min": 2522 }, { "epoch": 4.610619469026549, "grad_norm": 0.1519505295088245, "learning_rate": 7.367338948955183e-07, "loss": 0.3346, "loss_nan_ranks": 0, "loss_rank_avg": 0.12884555757045746, "step": 7815, "valid_targets_mean": 12198.8, "valid_targets_min": 1675 }, { "epoch": 4.613569321533923, "grad_norm": 0.15228717890035376, "learning_rate": 7.256979474692327e-07, "loss": 0.3364, "loss_nan_ranks": 0, "loss_rank_avg": 0.10891731083393097, "step": 7820, "valid_targets_mean": 10017.0, "valid_targets_min": 1776 }, { "epoch": 4.616519174041298, "grad_norm": 0.15429967262842637, "learning_rate": 7.147437543738278e-07, "loss": 0.3352, "loss_nan_ranks": 0, "loss_rank_avg": 0.10560815781354904, "step": 7825, "valid_targets_mean": 10342.0, "valid_targets_min": 1961 }, { "epoch": 4.619469026548672, "grad_norm": 0.16656461258723682, "learning_rate": 7.038713620728699e-07, "loss": 0.3335, "loss_nan_ranks": 0, "loss_rank_avg": 0.10848058760166168, "step": 7830, "valid_targets_mean": 9962.6, "valid_targets_min": 2405 }, { "epoch": 4.622418879056047, "grad_norm": 0.16021833897800697, "learning_rate": 6.930808166829517e-07, "loss": 0.3359, "loss_nan_ranks": 0, "loss_rank_avg": 0.0915953516960144, "step": 7835, "valid_targets_mean": 8304.7, "valid_targets_min": 1978 }, { "epoch": 4.625368731563422, "grad_norm": 0.23996441726172854, "learning_rate": 6.823721639735015e-07, "loss": 0.3332, "loss_nan_ranks": 0, "loss_rank_avg": 0.12475943565368652, "step": 7840, "valid_targets_mean": 12342.4, "valid_targets_min": 2187 }, { "epoch": 4.628318584070796, "grad_norm": 0.16033087598275933, "learning_rate": 6.71745449366592e-07, "loss": 0.3347, "loss_nan_ranks": 0, "loss_rank_avg": 0.10748793929815292, "step": 7845, "valid_targets_mean": 9165.0, "valid_targets_min": 832 }, { "epoch": 4.631268436578171, "grad_norm": 0.15047647806461162, "learning_rate": 6.612007179367452e-07, "loss": 0.3358, "loss_nan_ranks": 0, "loss_rank_avg": 0.10964348912239075, "step": 7850, "valid_targets_mean": 10573.9, "valid_targets_min": 2386 }, { "epoch": 4.6342182890855455, "grad_norm": 0.15419414615308352, "learning_rate": 6.507380144107433e-07, "loss": 0.3424, "loss_nan_ranks": 0, "loss_rank_avg": 0.09014791250228882, "step": 7855, "valid_targets_mean": 8261.4, "valid_targets_min": 1439 }, { "epoch": 4.6371681415929205, "grad_norm": 0.16020362869640542, "learning_rate": 6.403573831674292e-07, "loss": 0.346, "loss_nan_ranks": 0, "loss_rank_avg": 0.11980140209197998, "step": 7860, "valid_targets_mean": 9847.7, "valid_targets_min": 1767 }, { "epoch": 4.6401179941002955, "grad_norm": 0.148405962516986, "learning_rate": 6.300588682375375e-07, "loss": 0.3356, "loss_nan_ranks": 0, "loss_rank_avg": 0.13102710247039795, "step": 7865, "valid_targets_mean": 13030.2, "valid_targets_min": 2483 }, { "epoch": 4.64306784660767, "grad_norm": 0.1548714133654885, "learning_rate": 6.198425133034836e-07, "loss": 0.3338, "loss_nan_ranks": 0, "loss_rank_avg": 0.1018887311220169, "step": 7870, "valid_targets_mean": 9731.1, "valid_targets_min": 1703 }, { "epoch": 4.646017699115045, "grad_norm": 0.1658282019537656, "learning_rate": 6.097083616992039e-07, "loss": 0.3356, "loss_nan_ranks": 0, "loss_rank_avg": 0.1153990775346756, "step": 7875, "valid_targets_mean": 10780.1, "valid_targets_min": 1649 }, { "epoch": 4.648967551622419, "grad_norm": 0.16452590143085927, "learning_rate": 5.996564564099494e-07, "loss": 0.3415, "loss_nan_ranks": 0, "loss_rank_avg": 0.11689519882202148, "step": 7880, "valid_targets_mean": 10743.4, "valid_targets_min": 1801 }, { "epoch": 4.651917404129794, "grad_norm": 0.15959360618773735, "learning_rate": 5.89686840072119e-07, "loss": 0.3437, "loss_nan_ranks": 0, "loss_rank_avg": 0.09219282865524292, "step": 7885, "valid_targets_mean": 9102.6, "valid_targets_min": 1830 }, { "epoch": 4.654867256637168, "grad_norm": 0.15017011191767232, "learning_rate": 5.797995549730684e-07, "loss": 0.3326, "loss_nan_ranks": 0, "loss_rank_avg": 0.09676504135131836, "step": 7890, "valid_targets_mean": 9400.9, "valid_targets_min": 1853 }, { "epoch": 4.657817109144543, "grad_norm": 0.14712118858804588, "learning_rate": 5.699946430509417e-07, "loss": 0.3275, "loss_nan_ranks": 0, "loss_rank_avg": 0.10959380120038986, "step": 7895, "valid_targets_mean": 10114.0, "valid_targets_min": 2144 }, { "epoch": 4.660766961651918, "grad_norm": 0.1667434562433671, "learning_rate": 5.602721458944783e-07, "loss": 0.3277, "loss_nan_ranks": 0, "loss_rank_avg": 0.11018405854701996, "step": 7900, "valid_targets_mean": 9553.2, "valid_targets_min": 2181 }, { "epoch": 4.663716814159292, "grad_norm": 0.15459681678025006, "learning_rate": 5.50632104742852e-07, "loss": 0.3376, "loss_nan_ranks": 0, "loss_rank_avg": 0.11551558971405029, "step": 7905, "valid_targets_mean": 9748.7, "valid_targets_min": 856 }, { "epoch": 4.666666666666667, "grad_norm": 0.16022184516651483, "learning_rate": 5.410745604854861e-07, "loss": 0.3409, "loss_nan_ranks": 0, "loss_rank_avg": 0.12363321334123611, "step": 7910, "valid_targets_mean": 12207.3, "valid_targets_min": 2941 }, { "epoch": 4.669616519174041, "grad_norm": 0.16639336868212634, "learning_rate": 5.315995536618856e-07, "loss": 0.3363, "loss_nan_ranks": 0, "loss_rank_avg": 0.1000465601682663, "step": 7915, "valid_targets_mean": 9607.7, "valid_targets_min": 1480 }, { "epoch": 4.672566371681416, "grad_norm": 0.15139280931936996, "learning_rate": 5.222071244614579e-07, "loss": 0.3436, "loss_nan_ranks": 0, "loss_rank_avg": 0.10658089816570282, "step": 7920, "valid_targets_mean": 10516.6, "valid_targets_min": 1750 }, { "epoch": 4.67551622418879, "grad_norm": 0.15377735360447695, "learning_rate": 5.128973127233572e-07, "loss": 0.3366, "loss_nan_ranks": 0, "loss_rank_avg": 0.09791351854801178, "step": 7925, "valid_targets_mean": 9166.2, "valid_targets_min": 2342 }, { "epoch": 4.678466076696165, "grad_norm": 0.16515324786442742, "learning_rate": 5.036701579362935e-07, "loss": 0.3384, "loss_nan_ranks": 0, "loss_rank_avg": 0.12997247278690338, "step": 7930, "valid_targets_mean": 10198.2, "valid_targets_min": 1888 }, { "epoch": 4.68141592920354, "grad_norm": 0.15525919346374295, "learning_rate": 4.94525699238384e-07, "loss": 0.3382, "loss_nan_ranks": 0, "loss_rank_avg": 0.11433418095111847, "step": 7935, "valid_targets_mean": 9976.0, "valid_targets_min": 1591 }, { "epoch": 4.684365781710914, "grad_norm": 0.1597583329611498, "learning_rate": 4.854639754169776e-07, "loss": 0.3327, "loss_nan_ranks": 0, "loss_rank_avg": 0.10255442559719086, "step": 7940, "valid_targets_mean": 8667.3, "valid_targets_min": 1636 }, { "epoch": 4.687315634218289, "grad_norm": 0.1574500233002011, "learning_rate": 4.7648502490849737e-07, "loss": 0.3375, "loss_nan_ranks": 0, "loss_rank_avg": 0.13483873009681702, "step": 7945, "valid_targets_mean": 11671.9, "valid_targets_min": 1372 }, { "epoch": 4.6902654867256635, "grad_norm": 0.16094356927855527, "learning_rate": 4.675888857982669e-07, "loss": 0.3389, "loss_nan_ranks": 0, "loss_rank_avg": 0.09947562962770462, "step": 7950, "valid_targets_mean": 8705.5, "valid_targets_min": 788 }, { "epoch": 4.6932153392330385, "grad_norm": 0.15295367535591084, "learning_rate": 4.587755958203599e-07, "loss": 0.3385, "loss_nan_ranks": 0, "loss_rank_avg": 0.11330919712781906, "step": 7955, "valid_targets_mean": 10789.9, "valid_targets_min": 1629 }, { "epoch": 4.696165191740413, "grad_norm": 0.15713245388762861, "learning_rate": 4.5004519235743336e-07, "loss": 0.3433, "loss_nan_ranks": 0, "loss_rank_avg": 0.1057049110531807, "step": 7960, "valid_targets_mean": 9820.9, "valid_targets_min": 2079 }, { "epoch": 4.699115044247788, "grad_norm": 0.1474422612887287, "learning_rate": 4.4139771244056993e-07, "loss": 0.3354, "loss_nan_ranks": 0, "loss_rank_avg": 0.10105115175247192, "step": 7965, "valid_targets_mean": 9519.0, "valid_targets_min": 1443 }, { "epoch": 4.702064896755163, "grad_norm": 0.15196052029218166, "learning_rate": 4.328331927491247e-07, "loss": 0.336, "loss_nan_ranks": 0, "loss_rank_avg": 0.11080189794301987, "step": 7970, "valid_targets_mean": 11148.6, "valid_targets_min": 2844 }, { "epoch": 4.705014749262537, "grad_norm": 0.1568521251058333, "learning_rate": 4.243516696105632e-07, "loss": 0.3383, "loss_nan_ranks": 0, "loss_rank_avg": 0.14061200618743896, "step": 7975, "valid_targets_mean": 11772.3, "valid_targets_min": 2041 }, { "epoch": 4.707964601769912, "grad_norm": 0.1545804308119341, "learning_rate": 4.159531790003146e-07, "loss": 0.3344, "loss_nan_ranks": 0, "loss_rank_avg": 0.103056401014328, "step": 7980, "valid_targets_mean": 9464.2, "valid_targets_min": 2006 }, { "epoch": 4.710914454277286, "grad_norm": 0.1503169086247212, "learning_rate": 4.076377565416079e-07, "loss": 0.3416, "loss_nan_ranks": 0, "loss_rank_avg": 0.10284608602523804, "step": 7985, "valid_targets_mean": 10115.8, "valid_targets_min": 2033 }, { "epoch": 4.713864306784661, "grad_norm": 0.1465495169158907, "learning_rate": 3.9940543750534025e-07, "loss": 0.3319, "loss_nan_ranks": 0, "loss_rank_avg": 0.08931340277194977, "step": 7990, "valid_targets_mean": 8914.2, "valid_targets_min": 1829 }, { "epoch": 4.716814159292035, "grad_norm": 0.15023344789396648, "learning_rate": 3.9125625680990876e-07, "loss": 0.3337, "loss_nan_ranks": 0, "loss_rank_avg": 0.12425112724304199, "step": 7995, "valid_targets_mean": 11594.1, "valid_targets_min": 1466 }, { "epoch": 4.71976401179941, "grad_norm": 0.1625604279941507, "learning_rate": 3.8319024902106373e-07, "loss": 0.3349, "loss_nan_ranks": 0, "loss_rank_avg": 0.11338561773300171, "step": 8000, "valid_targets_mean": 10735.3, "valid_targets_min": 1786 }, { "epoch": 4.722713864306785, "grad_norm": 0.1518588563470732, "learning_rate": 3.7520744835177537e-07, "loss": 0.3347, "loss_nan_ranks": 0, "loss_rank_avg": 0.11632370948791504, "step": 8005, "valid_targets_mean": 11454.9, "valid_targets_min": 2305 }, { "epoch": 4.725663716814159, "grad_norm": 0.15237511826928452, "learning_rate": 3.6730788866207847e-07, "loss": 0.3421, "loss_nan_ranks": 0, "loss_rank_avg": 0.09955699741840363, "step": 8010, "valid_targets_mean": 9119.2, "valid_targets_min": 933 }, { "epoch": 4.728613569321534, "grad_norm": 0.14939438036133001, "learning_rate": 3.594916034589324e-07, "loss": 0.3402, "loss_nan_ranks": 0, "loss_rank_avg": 0.09637914597988129, "step": 8015, "valid_targets_mean": 9410.8, "valid_targets_min": 1837 }, { "epoch": 4.731563421828908, "grad_norm": 0.16739548238864774, "learning_rate": 3.5175862589607034e-07, "loss": 0.3306, "loss_nan_ranks": 0, "loss_rank_avg": 0.09700131416320801, "step": 8020, "valid_targets_mean": 9461.3, "valid_targets_min": 1841 }, { "epoch": 4.734513274336283, "grad_norm": 0.15421867043528203, "learning_rate": 3.441089887738769e-07, "loss": 0.3361, "loss_nan_ranks": 0, "loss_rank_avg": 0.13177192211151123, "step": 8025, "valid_targets_mean": 12400.2, "valid_targets_min": 2042 }, { "epoch": 4.737463126843657, "grad_norm": 0.15354486453580096, "learning_rate": 3.365427245392239e-07, "loss": 0.3374, "loss_nan_ranks": 0, "loss_rank_avg": 0.1302848756313324, "step": 8030, "valid_targets_mean": 12530.3, "valid_targets_min": 2926 }, { "epoch": 4.740412979351032, "grad_norm": 0.15922122301009237, "learning_rate": 3.290598652853638e-07, "loss": 0.3351, "loss_nan_ranks": 0, "loss_rank_avg": 0.12136721611022949, "step": 8035, "valid_targets_mean": 10509.6, "valid_targets_min": 649 }, { "epoch": 4.743362831858407, "grad_norm": 0.15200559708461336, "learning_rate": 3.216604427517611e-07, "loss": 0.3332, "loss_nan_ranks": 0, "loss_rank_avg": 0.10849249362945557, "step": 8040, "valid_targets_mean": 9454.0, "valid_targets_min": 2003 }, { "epoch": 4.7463126843657815, "grad_norm": 0.15844438088801377, "learning_rate": 3.1434448832398547e-07, "loss": 0.3361, "loss_nan_ranks": 0, "loss_rank_avg": 0.10437265783548355, "step": 8045, "valid_targets_mean": 9103.6, "valid_targets_min": 1608 }, { "epoch": 4.7492625368731565, "grad_norm": 0.15440075823729557, "learning_rate": 3.0711203303355417e-07, "loss": 0.3329, "loss_nan_ranks": 0, "loss_rank_avg": 0.10706086456775665, "step": 8050, "valid_targets_mean": 9436.6, "valid_targets_min": 2137 }, { "epoch": 4.752212389380531, "grad_norm": 0.15650013232286086, "learning_rate": 2.9996310755782354e-07, "loss": 0.3361, "loss_nan_ranks": 0, "loss_rank_avg": 0.10674930363893509, "step": 8055, "valid_targets_mean": 9747.0, "valid_targets_min": 1135 }, { "epoch": 4.755162241887906, "grad_norm": 0.16010100514936637, "learning_rate": 2.92897742219842e-07, "loss": 0.3379, "loss_nan_ranks": 0, "loss_rank_avg": 0.11662594974040985, "step": 8060, "valid_targets_mean": 10079.6, "valid_targets_min": 2286 }, { "epoch": 4.758112094395281, "grad_norm": 0.18313454619062772, "learning_rate": 2.859159669882261e-07, "loss": 0.3425, "loss_nan_ranks": 0, "loss_rank_avg": 0.11656038463115692, "step": 8065, "valid_targets_mean": 10582.6, "valid_targets_min": 1657 }, { "epoch": 4.761061946902655, "grad_norm": 0.16022588278414174, "learning_rate": 2.7901781147704257e-07, "loss": 0.342, "loss_nan_ranks": 0, "loss_rank_avg": 0.10365186631679535, "step": 8070, "valid_targets_mean": 8869.7, "valid_targets_min": 1883 }, { "epoch": 4.76401179941003, "grad_norm": 0.1541843916278012, "learning_rate": 2.7220330494566404e-07, "loss": 0.33, "loss_nan_ranks": 0, "loss_rank_avg": 0.11602887511253357, "step": 8075, "valid_targets_mean": 10999.8, "valid_targets_min": 1608 }, { "epoch": 4.766961651917404, "grad_norm": 0.1593256933790957, "learning_rate": 2.654724762986649e-07, "loss": 0.3391, "loss_nan_ranks": 0, "loss_rank_avg": 0.1141844168305397, "step": 8080, "valid_targets_mean": 10845.2, "valid_targets_min": 1769 }, { "epoch": 4.769911504424779, "grad_norm": 0.14692227157712975, "learning_rate": 2.588253540856811e-07, "loss": 0.3356, "loss_nan_ranks": 0, "loss_rank_avg": 0.1177644431591034, "step": 8085, "valid_targets_mean": 11583.4, "valid_targets_min": 2726 }, { "epoch": 4.772861356932154, "grad_norm": 0.15635500681838485, "learning_rate": 2.5226196650130596e-07, "loss": 0.3328, "loss_nan_ranks": 0, "loss_rank_avg": 0.09946940094232559, "step": 8090, "valid_targets_mean": 9023.2, "valid_targets_min": 1719 }, { "epoch": 4.775811209439528, "grad_norm": 0.15542240912952268, "learning_rate": 2.4578234138495693e-07, "loss": 0.3367, "loss_nan_ranks": 0, "loss_rank_avg": 0.12937146425247192, "step": 8095, "valid_targets_mean": 11621.1, "valid_targets_min": 1627 }, { "epoch": 4.778761061946903, "grad_norm": 0.1989805763466194, "learning_rate": 2.3938650622076453e-07, "loss": 0.3315, "loss_nan_ranks": 0, "loss_rank_avg": 0.1308184713125229, "step": 8100, "valid_targets_mean": 10227.8, "valid_targets_min": 2542 }, { "epoch": 4.781710914454277, "grad_norm": 0.15854722710821223, "learning_rate": 2.3307448813744805e-07, "loss": 0.3292, "loss_nan_ranks": 0, "loss_rank_avg": 0.1028071716427803, "step": 8105, "valid_targets_mean": 8847.1, "valid_targets_min": 2962 }, { "epoch": 4.784660766961652, "grad_norm": 0.15384075094610822, "learning_rate": 2.2684631390821775e-07, "loss": 0.3386, "loss_nan_ranks": 0, "loss_rank_avg": 0.11849691718816757, "step": 8110, "valid_targets_mean": 11824.5, "valid_targets_min": 2336 }, { "epoch": 4.787610619469026, "grad_norm": 0.15427674682254122, "learning_rate": 2.207020099506374e-07, "loss": 0.3389, "loss_nan_ranks": 0, "loss_rank_avg": 0.14145824313163757, "step": 8115, "valid_targets_mean": 13422.8, "valid_targets_min": 2469 }, { "epoch": 4.790560471976401, "grad_norm": 0.15160113657943072, "learning_rate": 2.1464160232653518e-07, "loss": 0.3367, "loss_nan_ranks": 0, "loss_rank_avg": 0.08148768544197083, "step": 8120, "valid_targets_mean": 8039.5, "valid_targets_min": 1011 }, { "epoch": 4.793510324483776, "grad_norm": 0.15059629364878185, "learning_rate": 2.0866511674187518e-07, "loss": 0.335, "loss_nan_ranks": 0, "loss_rank_avg": 0.09149783104658127, "step": 8125, "valid_targets_mean": 8162.9, "valid_targets_min": 1768 }, { "epoch": 4.79646017699115, "grad_norm": 0.16384131384526676, "learning_rate": 2.0277257854665944e-07, "loss": 0.3343, "loss_nan_ranks": 0, "loss_rank_avg": 0.11894331872463226, "step": 8130, "valid_targets_mean": 9680.6, "valid_targets_min": 1517 }, { "epoch": 4.799410029498525, "grad_norm": 0.1602386352213527, "learning_rate": 1.9696401273481713e-07, "loss": 0.337, "loss_nan_ranks": 0, "loss_rank_avg": 0.11503320187330246, "step": 8135, "valid_targets_mean": 10204.0, "valid_targets_min": 1856 }, { "epoch": 4.8023598820058995, "grad_norm": 0.1545511562562192, "learning_rate": 1.9123944394409567e-07, "loss": 0.3338, "loss_nan_ranks": 0, "loss_rank_avg": 0.12917274236679077, "step": 8140, "valid_targets_mean": 11088.9, "valid_targets_min": 3033 }, { "epoch": 4.8053097345132745, "grad_norm": 0.16017065168337155, "learning_rate": 1.8559889645596073e-07, "loss": 0.341, "loss_nan_ranks": 0, "loss_rank_avg": 0.09840681403875351, "step": 8145, "valid_targets_mean": 8808.9, "valid_targets_min": 1628 }, { "epoch": 4.808259587020649, "grad_norm": 0.16153661164958696, "learning_rate": 1.8004239419548985e-07, "loss": 0.3331, "loss_nan_ranks": 0, "loss_rank_avg": 0.11837130039930344, "step": 8150, "valid_targets_mean": 10004.9, "valid_targets_min": 2090 }, { "epoch": 4.811209439528024, "grad_norm": 0.15843824142798069, "learning_rate": 1.745699607312723e-07, "loss": 0.3412, "loss_nan_ranks": 0, "loss_rank_avg": 0.11763490736484528, "step": 8155, "valid_targets_mean": 11585.9, "valid_targets_min": 1578 }, { "epoch": 4.814159292035399, "grad_norm": 0.15594867162929354, "learning_rate": 1.6918161927531375e-07, "loss": 0.3354, "loss_nan_ranks": 0, "loss_rank_avg": 0.12264040857553482, "step": 8160, "valid_targets_mean": 10658.7, "valid_targets_min": 1712 }, { "epoch": 4.817109144542773, "grad_norm": 0.15355379471150807, "learning_rate": 1.6387739268292513e-07, "loss": 0.3381, "loss_nan_ranks": 0, "loss_rank_avg": 0.12840881943702698, "step": 8165, "valid_targets_mean": 11714.4, "valid_targets_min": 2874 }, { "epoch": 4.820058997050148, "grad_norm": 0.15764893679634057, "learning_rate": 1.5865730345263842e-07, "loss": 0.3332, "loss_nan_ranks": 0, "loss_rank_avg": 0.09563873708248138, "step": 8170, "valid_targets_mean": 9205.3, "valid_targets_min": 2733 }, { "epoch": 4.823008849557522, "grad_norm": 0.15015239794660265, "learning_rate": 1.5352137372611097e-07, "loss": 0.3324, "loss_nan_ranks": 0, "loss_rank_avg": 0.09439783543348312, "step": 8175, "valid_targets_mean": 8837.8, "valid_targets_min": 2032 }, { "epoch": 4.825958702064897, "grad_norm": 0.15549841438969475, "learning_rate": 1.484696252880169e-07, "loss": 0.3342, "loss_nan_ranks": 0, "loss_rank_avg": 0.10786696523427963, "step": 8180, "valid_targets_mean": 10313.7, "valid_targets_min": 2037 }, { "epoch": 4.828908554572271, "grad_norm": 0.15517700272853036, "learning_rate": 1.4350207956597583e-07, "loss": 0.3375, "loss_nan_ranks": 0, "loss_rank_avg": 0.09071081876754761, "step": 8185, "valid_targets_mean": 8079.2, "valid_targets_min": 1799 }, { "epoch": 4.831858407079646, "grad_norm": 0.1551730940635976, "learning_rate": 1.3861875763043987e-07, "loss": 0.3302, "loss_nan_ranks": 0, "loss_rank_avg": 0.1367199718952179, "step": 8190, "valid_targets_mean": 11687.4, "valid_targets_min": 1660 }, { "epoch": 4.834808259587021, "grad_norm": 0.1513284388442919, "learning_rate": 1.3381968019462678e-07, "loss": 0.3426, "loss_nan_ranks": 0, "loss_rank_avg": 0.10539837181568146, "step": 8195, "valid_targets_mean": 9689.1, "valid_targets_min": 1213 }, { "epoch": 4.837758112094395, "grad_norm": 0.1579977975628611, "learning_rate": 1.2910486761441577e-07, "loss": 0.3366, "loss_nan_ranks": 0, "loss_rank_avg": 0.1488528698682785, "step": 8200, "valid_targets_mean": 13727.9, "valid_targets_min": 2019 }, { "epoch": 4.84070796460177, "grad_norm": 0.1645343788926088, "learning_rate": 1.2447433988826306e-07, "loss": 0.3347, "loss_nan_ranks": 0, "loss_rank_avg": 0.09441319108009338, "step": 8205, "valid_targets_mean": 8408.8, "valid_targets_min": 1770 }, { "epoch": 4.843657817109144, "grad_norm": 0.17102694080450573, "learning_rate": 1.1992811665712423e-07, "loss": 0.3395, "loss_nan_ranks": 0, "loss_rank_avg": 0.1222073882818222, "step": 8210, "valid_targets_mean": 10496.0, "valid_targets_min": 1924 }, { "epoch": 4.846607669616519, "grad_norm": 0.15282193505100267, "learning_rate": 1.1546621720436745e-07, "loss": 0.3362, "loss_nan_ranks": 0, "loss_rank_avg": 0.10215400159358978, "step": 8215, "valid_targets_mean": 9131.2, "valid_targets_min": 2712 }, { "epoch": 4.849557522123893, "grad_norm": 0.16566507473867742, "learning_rate": 1.1108866045569156e-07, "loss": 0.3366, "loss_nan_ranks": 0, "loss_rank_avg": 0.11062388122081757, "step": 8220, "valid_targets_mean": 8391.5, "valid_targets_min": 1896 }, { "epoch": 4.852507374631268, "grad_norm": 0.1511859347180266, "learning_rate": 1.0679546497903926e-07, "loss": 0.3323, "loss_nan_ranks": 0, "loss_rank_avg": 0.10670909285545349, "step": 8225, "valid_targets_mean": 9973.9, "valid_targets_min": 1874 }, { "epoch": 4.855457227138643, "grad_norm": 0.14973828526729327, "learning_rate": 1.0258664898453507e-07, "loss": 0.3358, "loss_nan_ranks": 0, "loss_rank_avg": 0.11628145724534988, "step": 8230, "valid_targets_mean": 11387.2, "valid_targets_min": 2079 }, { "epoch": 4.8584070796460175, "grad_norm": 0.15653880756528876, "learning_rate": 9.846223032438318e-08, "loss": 0.3352, "loss_nan_ranks": 0, "loss_rank_avg": 0.11390264332294464, "step": 8235, "valid_targets_mean": 9381.8, "valid_targets_min": 1708 }, { "epoch": 4.8613569321533925, "grad_norm": 0.16974042052187077, "learning_rate": 9.442222649282296e-08, "loss": 0.3395, "loss_nan_ranks": 0, "loss_rank_avg": 0.10504934191703796, "step": 8240, "valid_targets_mean": 8509.3, "valid_targets_min": 1118 }, { "epoch": 4.864306784660767, "grad_norm": 0.15268761111173068, "learning_rate": 9.046665462602244e-08, "loss": 0.3402, "loss_nan_ranks": 0, "loss_rank_avg": 0.11172182857990265, "step": 8245, "valid_targets_mean": 10374.7, "valid_targets_min": 2011 }, { "epoch": 4.867256637168142, "grad_norm": 0.16194877779100575, "learning_rate": 8.659553150203392e-08, "loss": 0.3397, "loss_nan_ranks": 0, "loss_rank_avg": 0.13858763873577118, "step": 8250, "valid_targets_mean": 12519.0, "valid_targets_min": 1887 }, { "epoch": 4.870206489675516, "grad_norm": 0.1553367162188952, "learning_rate": 8.280887354069844e-08, "loss": 0.3313, "loss_nan_ranks": 0, "loss_rank_avg": 0.10727658867835999, "step": 8255, "valid_targets_mean": 9916.1, "valid_targets_min": 1793 }, { "epoch": 4.873156342182891, "grad_norm": 0.17928672354183484, "learning_rate": 7.910669680359473e-08, "loss": 0.3446, "loss_nan_ranks": 0, "loss_rank_avg": 0.12614883482456207, "step": 8260, "valid_targets_mean": 10340.9, "valid_targets_min": 1125 }, { "epoch": 4.876106194690266, "grad_norm": 0.16037472573730496, "learning_rate": 7.548901699396372e-08, "loss": 0.3351, "loss_nan_ranks": 0, "loss_rank_avg": 0.11756325513124466, "step": 8265, "valid_targets_mean": 9584.5, "valid_targets_min": 2028 }, { "epoch": 4.87905604719764, "grad_norm": 0.15676084316110542, "learning_rate": 7.195584945663969e-08, "loss": 0.3423, "loss_nan_ranks": 0, "loss_rank_avg": 0.12959174811840057, "step": 8270, "valid_targets_mean": 11590.9, "valid_targets_min": 2261 }, { "epoch": 4.882005899705015, "grad_norm": 0.14981931967427253, "learning_rate": 6.850720917799036e-08, "loss": 0.3378, "loss_nan_ranks": 0, "loss_rank_avg": 0.12228604406118393, "step": 8275, "valid_targets_mean": 11354.4, "valid_targets_min": 1773 }, { "epoch": 4.88495575221239, "grad_norm": 0.1492517770434556, "learning_rate": 6.5143110785848e-08, "loss": 0.3384, "loss_nan_ranks": 0, "loss_rank_avg": 0.1076161116361618, "step": 8280, "valid_targets_mean": 9635.8, "valid_targets_min": 2187 }, { "epoch": 4.887905604719764, "grad_norm": 0.15883459016225324, "learning_rate": 6.186356854944953e-08, "loss": 0.3327, "loss_nan_ranks": 0, "loss_rank_avg": 0.11498965322971344, "step": 8285, "valid_targets_mean": 10532.5, "valid_targets_min": 1940 }, { "epoch": 4.890855457227139, "grad_norm": 0.1512683940726875, "learning_rate": 5.866859637938094e-08, "loss": 0.3371, "loss_nan_ranks": 0, "loss_rank_avg": 0.12131491303443909, "step": 8290, "valid_targets_mean": 11384.6, "valid_targets_min": 2096 }, { "epoch": 4.893805309734513, "grad_norm": 0.16374210576442358, "learning_rate": 5.555820782750854e-08, "loss": 0.3333, "loss_nan_ranks": 0, "loss_rank_avg": 0.11251075565814972, "step": 8295, "valid_targets_mean": 10272.5, "valid_targets_min": 2815 }, { "epoch": 4.896755162241888, "grad_norm": 0.15550531670351886, "learning_rate": 5.253241608693005e-08, "loss": 0.3408, "loss_nan_ranks": 0, "loss_rank_avg": 0.12761548161506653, "step": 8300, "valid_targets_mean": 11145.4, "valid_targets_min": 818 }, { "epoch": 4.899705014749262, "grad_norm": 0.16691708037129438, "learning_rate": 4.959123399191468e-08, "loss": 0.3332, "loss_nan_ranks": 0, "loss_rank_avg": 0.10028710216283798, "step": 8305, "valid_targets_mean": 9275.6, "valid_targets_min": 1757 }, { "epoch": 4.902654867256637, "grad_norm": 0.15042742074564838, "learning_rate": 4.673467401784981e-08, "loss": 0.3382, "loss_nan_ranks": 0, "loss_rank_avg": 0.11940623074769974, "step": 8310, "valid_targets_mean": 10562.0, "valid_targets_min": 1778 }, { "epoch": 4.905604719764012, "grad_norm": 0.15515324897077903, "learning_rate": 4.396274828118774e-08, "loss": 0.3357, "loss_nan_ranks": 0, "loss_rank_avg": 0.10962172597646713, "step": 8315, "valid_targets_mean": 9969.5, "valid_targets_min": 1957 }, { "epoch": 4.908554572271386, "grad_norm": 0.15830692983786696, "learning_rate": 4.127546853939013e-08, "loss": 0.3377, "loss_nan_ranks": 0, "loss_rank_avg": 0.12479501217603683, "step": 8320, "valid_targets_mean": 10153.2, "valid_targets_min": 2191 }, { "epoch": 4.911504424778761, "grad_norm": 0.15919506975556477, "learning_rate": 3.867284619089029e-08, "loss": 0.3443, "loss_nan_ranks": 0, "loss_rank_avg": 0.0909244641661644, "step": 8325, "valid_targets_mean": 8849.2, "valid_targets_min": 324 }, { "epoch": 4.9144542772861355, "grad_norm": 0.1531424595801704, "learning_rate": 3.615489227502877e-08, "loss": 0.3389, "loss_nan_ranks": 0, "loss_rank_avg": 0.12087876349687576, "step": 8330, "valid_targets_mean": 10924.6, "valid_targets_min": 2710 }, { "epoch": 4.9174041297935105, "grad_norm": 0.17922580684050662, "learning_rate": 3.372161747202007e-08, "loss": 0.3411, "loss_nan_ranks": 0, "loss_rank_avg": 0.12497780472040176, "step": 8335, "valid_targets_mean": 11752.3, "valid_targets_min": 1969 }, { "epoch": 4.920353982300885, "grad_norm": 0.15961290538181538, "learning_rate": 3.137303210289711e-08, "loss": 0.3408, "loss_nan_ranks": 0, "loss_rank_avg": 0.13402295112609863, "step": 8340, "valid_targets_mean": 12698.6, "valid_targets_min": 2768 }, { "epoch": 4.92330383480826, "grad_norm": 0.15686414808002838, "learning_rate": 2.9109146129475686e-08, "loss": 0.3432, "loss_nan_ranks": 0, "loss_rank_avg": 0.10782062262296677, "step": 8345, "valid_targets_mean": 10104.6, "valid_targets_min": 1652 }, { "epoch": 4.926253687315635, "grad_norm": 0.1539726659200968, "learning_rate": 2.69299691543079e-08, "loss": 0.3426, "loss_nan_ranks": 0, "loss_rank_avg": 0.11887013912200928, "step": 8350, "valid_targets_mean": 11014.7, "valid_targets_min": 1872 }, { "epoch": 4.929203539823009, "grad_norm": 0.15614057446465482, "learning_rate": 2.483551042064214e-08, "loss": 0.3368, "loss_nan_ranks": 0, "loss_rank_avg": 0.11364469677209854, "step": 8355, "valid_targets_mean": 10039.7, "valid_targets_min": 2777 }, { "epoch": 4.932153392330384, "grad_norm": 0.15395208293261126, "learning_rate": 2.2825778812385347e-08, "loss": 0.3428, "loss_nan_ranks": 0, "loss_rank_avg": 0.12622305750846863, "step": 8360, "valid_targets_mean": 11453.5, "valid_targets_min": 1275 }, { "epoch": 4.935103244837758, "grad_norm": 0.15579370316332758, "learning_rate": 2.090078285405639e-08, "loss": 0.343, "loss_nan_ranks": 0, "loss_rank_avg": 0.10148319602012634, "step": 8365, "valid_targets_mean": 8932.7, "valid_targets_min": 1791 }, { "epoch": 4.938053097345133, "grad_norm": 0.14897559185560402, "learning_rate": 1.90605307107683e-08, "loss": 0.3307, "loss_nan_ranks": 0, "loss_rank_avg": 0.11737137287855148, "step": 8370, "valid_targets_mean": 11101.6, "valid_targets_min": 2707 }, { "epoch": 4.941002949852507, "grad_norm": 0.1593622012689512, "learning_rate": 1.7305030188177195e-08, "loss": 0.3366, "loss_nan_ranks": 0, "loss_rank_avg": 0.13405683636665344, "step": 8375, "valid_targets_mean": 10862.0, "valid_targets_min": 1591 }, { "epoch": 4.943952802359882, "grad_norm": 0.15857040855180185, "learning_rate": 1.563428873245343e-08, "loss": 0.3378, "loss_nan_ranks": 0, "loss_rank_avg": 0.1257179081439972, "step": 8380, "valid_targets_mean": 10801.4, "valid_targets_min": 1421 }, { "epoch": 4.946902654867257, "grad_norm": 0.16797684271769017, "learning_rate": 1.4048313430252702e-08, "loss": 0.3371, "loss_nan_ranks": 0, "loss_rank_avg": 0.10947559773921967, "step": 8385, "valid_targets_mean": 8929.9, "valid_targets_min": 1203 }, { "epoch": 4.949852507374631, "grad_norm": 0.15234476430572783, "learning_rate": 1.2547111008689438e-08, "loss": 0.3441, "loss_nan_ranks": 0, "loss_rank_avg": 0.11667993664741516, "step": 8390, "valid_targets_mean": 10474.6, "valid_targets_min": 1041 }, { "epoch": 4.952802359882006, "grad_norm": 0.16171341308080303, "learning_rate": 1.1130687835292364e-08, "loss": 0.34, "loss_nan_ranks": 0, "loss_rank_avg": 0.0994919091463089, "step": 8395, "valid_targets_mean": 8967.3, "valid_targets_min": 2401 }, { "epoch": 4.95575221238938, "grad_norm": 0.15653748086188524, "learning_rate": 9.79904991800007e-09, "loss": 0.3371, "loss_nan_ranks": 0, "loss_rank_avg": 0.11829991638660431, "step": 8400, "valid_targets_mean": 10507.0, "valid_targets_min": 1811 }, { "epoch": 4.958702064896755, "grad_norm": 0.15627283558458796, "learning_rate": 8.552202905116603e-09, "loss": 0.3423, "loss_nan_ranks": 0, "loss_rank_avg": 0.0984392911195755, "step": 8405, "valid_targets_mean": 9101.4, "valid_targets_min": 1896 }, { "epoch": 4.961651917404129, "grad_norm": 0.15721821511741407, "learning_rate": 7.390152085298141e-09, "loss": 0.3389, "loss_nan_ranks": 0, "loss_rank_avg": 0.12197485566139221, "step": 8410, "valid_targets_mean": 11740.2, "valid_targets_min": 1329 }, { "epoch": 4.964601769911504, "grad_norm": 0.16234745408852572, "learning_rate": 6.312902387526354e-09, "loss": 0.3395, "loss_nan_ranks": 0, "loss_rank_avg": 0.10215374082326889, "step": 8415, "valid_targets_mean": 8273.8, "valid_targets_min": 1581 }, { "epoch": 4.967551622418879, "grad_norm": 0.15791372499868073, "learning_rate": 5.320458381090632e-09, "loss": 0.3412, "loss_nan_ranks": 0, "loss_rank_avg": 0.12479733675718307, "step": 8420, "valid_targets_mean": 10531.7, "valid_targets_min": 2030 }, { "epoch": 4.9705014749262535, "grad_norm": 0.1578360190843846, "learning_rate": 4.412824275563665e-09, "loss": 0.3345, "loss_nan_ranks": 0, "loss_rank_avg": 0.10316172242164612, "step": 8425, "valid_targets_mean": 8572.2, "valid_targets_min": 1302 }, { "epoch": 4.9734513274336285, "grad_norm": 0.15983241448664054, "learning_rate": 3.5900039207859005e-09, "loss": 0.3433, "loss_nan_ranks": 0, "loss_rank_avg": 0.11723663657903671, "step": 8430, "valid_targets_mean": 10365.0, "valid_targets_min": 1880 }, { "epoch": 4.976401179941003, "grad_norm": 0.1625826476293185, "learning_rate": 2.852000806854438e-09, "loss": 0.3449, "loss_nan_ranks": 0, "loss_rank_avg": 0.13278573751449585, "step": 8435, "valid_targets_mean": 11930.6, "valid_targets_min": 1431 }, { "epoch": 4.979351032448378, "grad_norm": 0.14992069896746002, "learning_rate": 2.198818064098607e-09, "loss": 0.3388, "loss_nan_ranks": 0, "loss_rank_avg": 0.11306165158748627, "step": 8440, "valid_targets_mean": 10015.8, "valid_targets_min": 1439 }, { "epoch": 4.982300884955752, "grad_norm": 0.16714353240958918, "learning_rate": 1.6304584630733033e-09, "loss": 0.3386, "loss_nan_ranks": 0, "loss_rank_avg": 0.12046494334936142, "step": 8445, "valid_targets_mean": 10110.8, "valid_targets_min": 2130 }, { "epoch": 4.985250737463127, "grad_norm": 0.15472606493144128, "learning_rate": 1.1469244145456693e-09, "loss": 0.3421, "loss_nan_ranks": 0, "loss_rank_avg": 0.10794627666473389, "step": 8450, "valid_targets_mean": 9938.6, "valid_targets_min": 1395 }, { "epoch": 4.988200589970502, "grad_norm": 0.17796065764885294, "learning_rate": 7.482179694884295e-10, "loss": 0.3484, "loss_nan_ranks": 0, "loss_rank_avg": 0.13961243629455566, "step": 8455, "valid_targets_mean": 11508.6, "valid_targets_min": 1832 }, { "epoch": 4.991150442477876, "grad_norm": 0.1512951487988943, "learning_rate": 4.3434081905990857e-10, "loss": 0.3371, "loss_nan_ranks": 0, "loss_rank_avg": 0.1032632440328598, "step": 8460, "valid_targets_mean": 9993.5, "valid_targets_min": 2294 }, { "epoch": 4.994100294985251, "grad_norm": 0.16434925179454232, "learning_rate": 2.0529429461069174e-10, "loss": 0.3423, "loss_nan_ranks": 0, "loss_rank_avg": 0.13042443990707397, "step": 8465, "valid_targets_mean": 11300.2, "valid_targets_min": 1578 }, { "epoch": 4.997050147492625, "grad_norm": 0.1540038581679221, "learning_rate": 6.107936766808209e-11, "loss": 0.3344, "loss_nan_ranks": 0, "loss_rank_avg": 0.11116141080856323, "step": 8470, "valid_targets_mean": 10239.3, "valid_targets_min": 1636 }, { "epoch": 5.0, "grad_norm": 0.1529484565508345, "learning_rate": 1.6966499405413062e-12, "loss": 0.3381, "loss_nan_ranks": 0, "loss_rank_avg": 0.10146471858024597, "step": 8475, "valid_targets_mean": 9906.2, "valid_targets_min": 1715 }, { "epoch": 5.0, "loss_nan_ranks": 0, "loss_rank_avg": 0.10146471858024597, "step": 8475, "total_flos": 2.892950530069994e+19, "train_loss": 0.05187808655707885, "train_runtime": 37600.0558, "train_samples_per_second": 21.635, "train_steps_per_second": 0.225, "valid_targets_mean": 9906.2, "valid_targets_min": 1715 } ], "logging_steps": 5, "max_steps": 8475, "num_input_tokens_seen": 0, "num_train_epochs": 5, "save_steps": 300, "stateful_callbacks": { "TrainerControl": { "args": { "should_epoch_stop": false, "should_evaluate": false, "should_log": false, "should_save": true, "should_training_stop": true }, "attributes": {} } }, "total_flos": 2.892950530069994e+19, "train_batch_size": 1, "trial_name": null, "trial_params": null }