{ "best_global_step": null, "best_metric": null, "best_model_checkpoint": null, "epoch": 5.0, "eval_steps": 500, "global_step": 5210, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.0048, "grad_norm": 10.636854244202556, "learning_rate": 3.071017274472169e-07, "loss": 0.9544, "loss_nan_ranks": 0, "loss_rank_avg": 0.3281858265399933, "step": 5, "valid_targets_mean": 10263.1, "valid_targets_min": 1622 }, { "epoch": 0.0096, "grad_norm": 8.705611775216052, "learning_rate": 6.909788867562381e-07, "loss": 0.9596, "loss_nan_ranks": 0, "loss_rank_avg": 0.33007457852363586, "step": 10, "valid_targets_mean": 12424.5, "valid_targets_min": 2066 }, { "epoch": 0.0144, "grad_norm": 7.625331316286804, "learning_rate": 1.074856046065259e-06, "loss": 0.9453, "loss_nan_ranks": 0, "loss_rank_avg": 0.30262356996536255, "step": 15, "valid_targets_mean": 10207.7, "valid_targets_min": 1992 }, { "epoch": 0.0192, "grad_norm": 5.53278243942875, "learning_rate": 1.4587332053742803e-06, "loss": 0.9187, "loss_nan_ranks": 0, "loss_rank_avg": 0.32896602153778076, "step": 20, "valid_targets_mean": 12274.8, "valid_targets_min": 1016 }, { "epoch": 0.024, "grad_norm": 2.925539335155935, "learning_rate": 1.8426103646833015e-06, "loss": 0.8497, "loss_nan_ranks": 0, "loss_rank_avg": 0.3109387755393982, "step": 25, "valid_targets_mean": 12681.8, "valid_targets_min": 1505 }, { "epoch": 0.0288, "grad_norm": 1.8422083015449056, "learning_rate": 2.2264875239923228e-06, "loss": 0.8137, "loss_nan_ranks": 0, "loss_rank_avg": 0.27611488103866577, "step": 30, "valid_targets_mean": 12296.9, "valid_targets_min": 1668 }, { "epoch": 0.0336, "grad_norm": 1.5441559016293185, "learning_rate": 2.6103646833013433e-06, "loss": 0.7877, "loss_nan_ranks": 0, "loss_rank_avg": 0.30650392174720764, "step": 35, "valid_targets_mean": 12300.1, "valid_targets_min": 1479 }, { "epoch": 0.0384, "grad_norm": 1.1621222136438034, "learning_rate": 2.9942418426103648e-06, "loss": 0.7642, "loss_nan_ranks": 0, "loss_rank_avg": 0.2344341278076172, "step": 40, "valid_targets_mean": 10216.6, "valid_targets_min": 3242 }, { "epoch": 0.0432, "grad_norm": 0.7785445251214029, "learning_rate": 3.378119001919386e-06, "loss": 0.7259, "loss_nan_ranks": 0, "loss_rank_avg": 0.22525399923324585, "step": 45, "valid_targets_mean": 9436.8, "valid_targets_min": 1761 }, { "epoch": 0.048, "grad_norm": 0.6851609239554484, "learning_rate": 3.761996161228407e-06, "loss": 0.7095, "loss_nan_ranks": 0, "loss_rank_avg": 0.22096958756446838, "step": 50, "valid_targets_mean": 8893.3, "valid_targets_min": 1935 }, { "epoch": 0.0528, "grad_norm": 0.47600710001942337, "learning_rate": 4.145873320537428e-06, "loss": 0.6931, "loss_nan_ranks": 0, "loss_rank_avg": 0.22855256497859955, "step": 55, "valid_targets_mean": 10395.9, "valid_targets_min": 1283 }, { "epoch": 0.0576, "grad_norm": 0.4444504600275988, "learning_rate": 4.52975047984645e-06, "loss": 0.6716, "loss_nan_ranks": 0, "loss_rank_avg": 0.20247305929660797, "step": 60, "valid_targets_mean": 9470.6, "valid_targets_min": 2067 }, { "epoch": 0.0624, "grad_norm": 0.3880399717802379, "learning_rate": 4.91362763915547e-06, "loss": 0.6494, "loss_nan_ranks": 0, "loss_rank_avg": 0.2117888331413269, "step": 65, "valid_targets_mean": 10791.5, "valid_targets_min": 4875 }, { "epoch": 0.0672, "grad_norm": 0.3032827664070752, "learning_rate": 5.297504798464492e-06, "loss": 0.6435, "loss_nan_ranks": 0, "loss_rank_avg": 0.20708134770393372, "step": 70, "valid_targets_mean": 10440.2, "valid_targets_min": 2638 }, { "epoch": 0.072, "grad_norm": 0.28159068782522545, "learning_rate": 5.681381957773513e-06, "loss": 0.6349, "loss_nan_ranks": 0, "loss_rank_avg": 0.23973067104816437, "step": 75, "valid_targets_mean": 12223.6, "valid_targets_min": 1619 }, { "epoch": 0.0768, "grad_norm": 0.2719001663622767, "learning_rate": 6.065259117082534e-06, "loss": 0.613, "loss_nan_ranks": 0, "loss_rank_avg": 0.19408732652664185, "step": 80, "valid_targets_mean": 10384.3, "valid_targets_min": 1608 }, { "epoch": 0.0816, "grad_norm": 0.23703867977781148, "learning_rate": 6.449136276391556e-06, "loss": 0.6057, "loss_nan_ranks": 0, "loss_rank_avg": 0.19000616669654846, "step": 85, "valid_targets_mean": 11075.1, "valid_targets_min": 2097 }, { "epoch": 0.0864, "grad_norm": 0.22992604502698233, "learning_rate": 6.833013435700576e-06, "loss": 0.5832, "loss_nan_ranks": 0, "loss_rank_avg": 0.20729880034923553, "step": 90, "valid_targets_mean": 10286.8, "valid_targets_min": 253 }, { "epoch": 0.0912, "grad_norm": 0.22062818252236446, "learning_rate": 7.216890595009598e-06, "loss": 0.5787, "loss_nan_ranks": 0, "loss_rank_avg": 0.2066301703453064, "step": 95, "valid_targets_mean": 11090.3, "valid_targets_min": 2975 }, { "epoch": 0.096, "grad_norm": 0.24007612411052925, "learning_rate": 7.600767754318619e-06, "loss": 0.5724, "loss_nan_ranks": 0, "loss_rank_avg": 0.1960715353488922, "step": 100, "valid_targets_mean": 10440.2, "valid_targets_min": 1703 }, { "epoch": 0.1008, "grad_norm": 0.2364846800541795, "learning_rate": 7.98464491362764e-06, "loss": 0.5643, "loss_nan_ranks": 0, "loss_rank_avg": 0.183235764503479, "step": 105, "valid_targets_mean": 10720.9, "valid_targets_min": 1279 }, { "epoch": 0.1056, "grad_norm": 0.22116407241128727, "learning_rate": 8.368522072936662e-06, "loss": 0.5524, "loss_nan_ranks": 0, "loss_rank_avg": 0.15857258439064026, "step": 110, "valid_targets_mean": 8602.8, "valid_targets_min": 1405 }, { "epoch": 0.1104, "grad_norm": 0.24251627783577479, "learning_rate": 8.752399232245682e-06, "loss": 0.5528, "loss_nan_ranks": 0, "loss_rank_avg": 0.20528832077980042, "step": 115, "valid_targets_mean": 11334.2, "valid_targets_min": 2159 }, { "epoch": 0.1152, "grad_norm": 0.22397511123215, "learning_rate": 9.136276391554704e-06, "loss": 0.5436, "loss_nan_ranks": 0, "loss_rank_avg": 0.1935373693704605, "step": 120, "valid_targets_mean": 11852.4, "valid_targets_min": 2174 }, { "epoch": 0.12, "grad_norm": 0.24271342022992784, "learning_rate": 9.520153550863724e-06, "loss": 0.5472, "loss_nan_ranks": 0, "loss_rank_avg": 0.19181078672409058, "step": 125, "valid_targets_mean": 10768.0, "valid_targets_min": 1942 }, { "epoch": 0.1248, "grad_norm": 0.2172967997455667, "learning_rate": 9.904030710172746e-06, "loss": 0.5468, "loss_nan_ranks": 0, "loss_rank_avg": 0.1923825442790985, "step": 130, "valid_targets_mean": 11106.3, "valid_targets_min": 1863 }, { "epoch": 0.1296, "grad_norm": 0.2357587155660315, "learning_rate": 1.0287907869481766e-05, "loss": 0.5344, "loss_nan_ranks": 0, "loss_rank_avg": 0.16063986718654633, "step": 135, "valid_targets_mean": 9855.5, "valid_targets_min": 2389 }, { "epoch": 0.1344, "grad_norm": 0.22906584573702501, "learning_rate": 1.067178502879079e-05, "loss": 0.5344, "loss_nan_ranks": 0, "loss_rank_avg": 0.19566833972930908, "step": 140, "valid_targets_mean": 11456.1, "valid_targets_min": 2336 }, { "epoch": 0.1392, "grad_norm": 0.25114235107383526, "learning_rate": 1.105566218809981e-05, "loss": 0.5285, "loss_nan_ranks": 0, "loss_rank_avg": 0.19265873730182648, "step": 145, "valid_targets_mean": 9929.8, "valid_targets_min": 2020 }, { "epoch": 0.144, "grad_norm": 0.23750880102943095, "learning_rate": 1.143953934740883e-05, "loss": 0.5231, "loss_nan_ranks": 0, "loss_rank_avg": 0.20383387804031372, "step": 150, "valid_targets_mean": 11054.2, "valid_targets_min": 1049 }, { "epoch": 0.1488, "grad_norm": 0.23692985297514224, "learning_rate": 1.182341650671785e-05, "loss": 0.5245, "loss_nan_ranks": 0, "loss_rank_avg": 0.17097380757331848, "step": 155, "valid_targets_mean": 11116.3, "valid_targets_min": 641 }, { "epoch": 0.1536, "grad_norm": 0.24339076517066405, "learning_rate": 1.2207293666026872e-05, "loss": 0.5104, "loss_nan_ranks": 0, "loss_rank_avg": 0.17967820167541504, "step": 160, "valid_targets_mean": 11142.9, "valid_targets_min": 2725 }, { "epoch": 0.1584, "grad_norm": 0.2558192460223346, "learning_rate": 1.2591170825335894e-05, "loss": 0.5194, "loss_nan_ranks": 0, "loss_rank_avg": 0.16853728890419006, "step": 165, "valid_targets_mean": 10722.9, "valid_targets_min": 3225 }, { "epoch": 0.1632, "grad_norm": 0.24528680520963095, "learning_rate": 1.2975047984644915e-05, "loss": 0.517, "loss_nan_ranks": 0, "loss_rank_avg": 0.16261857748031616, "step": 170, "valid_targets_mean": 9597.3, "valid_targets_min": 2714 }, { "epoch": 0.168, "grad_norm": 0.2330765401016573, "learning_rate": 1.3358925143953936e-05, "loss": 0.5123, "loss_nan_ranks": 0, "loss_rank_avg": 0.1625608503818512, "step": 175, "valid_targets_mean": 9343.4, "valid_targets_min": 1455 }, { "epoch": 0.1728, "grad_norm": 0.2662782596501721, "learning_rate": 1.3742802303262956e-05, "loss": 0.5099, "loss_nan_ranks": 0, "loss_rank_avg": 0.15402890741825104, "step": 180, "valid_targets_mean": 9405.9, "valid_targets_min": 2750 }, { "epoch": 0.1776, "grad_norm": 0.23548854171410669, "learning_rate": 1.4126679462571978e-05, "loss": 0.5082, "loss_nan_ranks": 0, "loss_rank_avg": 0.15284034609794617, "step": 185, "valid_targets_mean": 10169.3, "valid_targets_min": 2559 }, { "epoch": 0.1824, "grad_norm": 0.2493807137284219, "learning_rate": 1.4510556621881e-05, "loss": 0.5078, "loss_nan_ranks": 0, "loss_rank_avg": 0.224237859249115, "step": 190, "valid_targets_mean": 13936.2, "valid_targets_min": 1967 }, { "epoch": 0.1872, "grad_norm": 0.23080076777747327, "learning_rate": 1.4894433781190021e-05, "loss": 0.4977, "loss_nan_ranks": 0, "loss_rank_avg": 0.18542718887329102, "step": 195, "valid_targets_mean": 11386.7, "valid_targets_min": 1049 }, { "epoch": 0.192, "grad_norm": 0.24356875674311323, "learning_rate": 1.527831094049904e-05, "loss": 0.4938, "loss_nan_ranks": 0, "loss_rank_avg": 0.15462642908096313, "step": 200, "valid_targets_mean": 9353.9, "valid_targets_min": 1881 }, { "epoch": 0.1968, "grad_norm": 0.21231400448563495, "learning_rate": 1.566218809980806e-05, "loss": 0.497, "loss_nan_ranks": 0, "loss_rank_avg": 0.19362452626228333, "step": 205, "valid_targets_mean": 13543.5, "valid_targets_min": 3151 }, { "epoch": 0.2016, "grad_norm": 0.22632075151001788, "learning_rate": 1.6046065259117082e-05, "loss": 0.4923, "loss_nan_ranks": 0, "loss_rank_avg": 0.17729297280311584, "step": 210, "valid_targets_mean": 11808.5, "valid_targets_min": 3102 }, { "epoch": 0.2064, "grad_norm": 0.27758108971137807, "learning_rate": 1.6429942418426105e-05, "loss": 0.4899, "loss_nan_ranks": 0, "loss_rank_avg": 0.17895910143852234, "step": 215, "valid_targets_mean": 11082.8, "valid_targets_min": 3656 }, { "epoch": 0.2112, "grad_norm": 0.28957622378218517, "learning_rate": 1.6813819577735126e-05, "loss": 0.4913, "loss_nan_ranks": 0, "loss_rank_avg": 0.14970815181732178, "step": 220, "valid_targets_mean": 9667.3, "valid_targets_min": 1173 }, { "epoch": 0.216, "grad_norm": 0.27937879612714905, "learning_rate": 1.7197696737044146e-05, "loss": 0.5047, "loss_nan_ranks": 0, "loss_rank_avg": 0.14511623978614807, "step": 225, "valid_targets_mean": 9465.0, "valid_targets_min": 2634 }, { "epoch": 0.2208, "grad_norm": 0.24089811245385753, "learning_rate": 1.758157389635317e-05, "loss": 0.4966, "loss_nan_ranks": 0, "loss_rank_avg": 0.16545206308364868, "step": 230, "valid_targets_mean": 11997.9, "valid_targets_min": 2677 }, { "epoch": 0.2256, "grad_norm": 0.2578591546428462, "learning_rate": 1.796545105566219e-05, "loss": 0.4873, "loss_nan_ranks": 0, "loss_rank_avg": 0.2065517008304596, "step": 235, "valid_targets_mean": 13886.1, "valid_targets_min": 2298 }, { "epoch": 0.2304, "grad_norm": 0.24203958143555748, "learning_rate": 1.8349328214971213e-05, "loss": 0.4971, "loss_nan_ranks": 0, "loss_rank_avg": 0.17147715389728546, "step": 240, "valid_targets_mean": 11135.5, "valid_targets_min": 2340 }, { "epoch": 0.2352, "grad_norm": 0.23970277281734395, "learning_rate": 1.8733205374280233e-05, "loss": 0.4825, "loss_nan_ranks": 0, "loss_rank_avg": 0.1593427062034607, "step": 245, "valid_targets_mean": 9909.9, "valid_targets_min": 4293 }, { "epoch": 0.24, "grad_norm": 0.31598621631855395, "learning_rate": 1.9117082533589253e-05, "loss": 0.4898, "loss_nan_ranks": 0, "loss_rank_avg": 0.18410634994506836, "step": 250, "valid_targets_mean": 12043.8, "valid_targets_min": 1907 }, { "epoch": 0.2448, "grad_norm": 0.27841537067755107, "learning_rate": 1.9500959692898273e-05, "loss": 0.4934, "loss_nan_ranks": 0, "loss_rank_avg": 0.15667122602462769, "step": 255, "valid_targets_mean": 9791.7, "valid_targets_min": 1688 }, { "epoch": 0.2496, "grad_norm": 0.27493246532697335, "learning_rate": 1.9884836852207294e-05, "loss": 0.5018, "loss_nan_ranks": 0, "loss_rank_avg": 0.15299372375011444, "step": 260, "valid_targets_mean": 9514.1, "valid_targets_min": 301 }, { "epoch": 0.2544, "grad_norm": 0.266140461511119, "learning_rate": 2.0268714011516314e-05, "loss": 0.4811, "loss_nan_ranks": 0, "loss_rank_avg": 0.15985918045043945, "step": 265, "valid_targets_mean": 10259.5, "valid_targets_min": 2847 }, { "epoch": 0.2592, "grad_norm": 0.2544591628433433, "learning_rate": 2.0652591170825337e-05, "loss": 0.4853, "loss_nan_ranks": 0, "loss_rank_avg": 0.17325814068317413, "step": 270, "valid_targets_mean": 10599.2, "valid_targets_min": 1957 }, { "epoch": 0.264, "grad_norm": 0.2550761566659248, "learning_rate": 2.103646833013436e-05, "loss": 0.4838, "loss_nan_ranks": 0, "loss_rank_avg": 0.18994951248168945, "step": 275, "valid_targets_mean": 12406.7, "valid_targets_min": 1763 }, { "epoch": 0.2688, "grad_norm": 0.2648060038919729, "learning_rate": 2.142034548944338e-05, "loss": 0.4877, "loss_nan_ranks": 0, "loss_rank_avg": 0.17854821681976318, "step": 280, "valid_targets_mean": 12377.0, "valid_targets_min": 3205 }, { "epoch": 0.2736, "grad_norm": 0.2892489787345957, "learning_rate": 2.18042226487524e-05, "loss": 0.485, "loss_nan_ranks": 0, "loss_rank_avg": 0.15922245383262634, "step": 285, "valid_targets_mean": 10091.9, "valid_targets_min": 1776 }, { "epoch": 0.2784, "grad_norm": 0.27182050087807624, "learning_rate": 2.218809980806142e-05, "loss": 0.4832, "loss_nan_ranks": 0, "loss_rank_avg": 0.18173915147781372, "step": 290, "valid_targets_mean": 11485.0, "valid_targets_min": 2412 }, { "epoch": 0.2832, "grad_norm": 0.29753560881114305, "learning_rate": 2.2571976967370445e-05, "loss": 0.4876, "loss_nan_ranks": 0, "loss_rank_avg": 0.15241312980651855, "step": 295, "valid_targets_mean": 10455.7, "valid_targets_min": 1760 }, { "epoch": 0.288, "grad_norm": 0.2920243091279055, "learning_rate": 2.2955854126679465e-05, "loss": 0.4809, "loss_nan_ranks": 0, "loss_rank_avg": 0.17634551227092743, "step": 300, "valid_targets_mean": 11262.6, "valid_targets_min": 2395 }, { "epoch": 0.2928, "grad_norm": 0.3068931126861716, "learning_rate": 2.3339731285988485e-05, "loss": 0.4787, "loss_nan_ranks": 0, "loss_rank_avg": 0.16455751657485962, "step": 305, "valid_targets_mean": 10402.1, "valid_targets_min": 1814 }, { "epoch": 0.2976, "grad_norm": 0.29189757761278545, "learning_rate": 2.372360844529751e-05, "loss": 0.4849, "loss_nan_ranks": 0, "loss_rank_avg": 0.14844027161598206, "step": 310, "valid_targets_mean": 10187.0, "valid_targets_min": 1855 }, { "epoch": 0.3024, "grad_norm": 0.29114274622108255, "learning_rate": 2.4107485604606525e-05, "loss": 0.4819, "loss_nan_ranks": 0, "loss_rank_avg": 0.1699836403131485, "step": 315, "valid_targets_mean": 11114.6, "valid_targets_min": 1042 }, { "epoch": 0.3072, "grad_norm": 0.2954997654982877, "learning_rate": 2.449136276391555e-05, "loss": 0.4742, "loss_nan_ranks": 0, "loss_rank_avg": 0.16469603776931763, "step": 320, "valid_targets_mean": 9133.3, "valid_targets_min": 1297 }, { "epoch": 0.312, "grad_norm": 0.2773131204544206, "learning_rate": 2.4875239923224573e-05, "loss": 0.4866, "loss_nan_ranks": 0, "loss_rank_avg": 0.15901392698287964, "step": 325, "valid_targets_mean": 10840.6, "valid_targets_min": 1563 }, { "epoch": 0.3168, "grad_norm": 0.25978690369987806, "learning_rate": 2.525911708253359e-05, "loss": 0.483, "loss_nan_ranks": 0, "loss_rank_avg": 0.17150971293449402, "step": 330, "valid_targets_mean": 12225.6, "valid_targets_min": 2997 }, { "epoch": 0.3216, "grad_norm": 0.2534243499422545, "learning_rate": 2.5642994241842613e-05, "loss": 0.4759, "loss_nan_ranks": 0, "loss_rank_avg": 0.1597476452589035, "step": 335, "valid_targets_mean": 10479.3, "valid_targets_min": 979 }, { "epoch": 0.3264, "grad_norm": 0.2609983072842597, "learning_rate": 2.6026871401151633e-05, "loss": 0.4812, "loss_nan_ranks": 0, "loss_rank_avg": 0.16786131262779236, "step": 340, "valid_targets_mean": 10247.2, "valid_targets_min": 3687 }, { "epoch": 0.3312, "grad_norm": 0.2539569867124708, "learning_rate": 2.6410748560460657e-05, "loss": 0.4854, "loss_nan_ranks": 0, "loss_rank_avg": 0.17365418374538422, "step": 345, "valid_targets_mean": 11493.6, "valid_targets_min": 1776 }, { "epoch": 0.336, "grad_norm": 0.24499201124304537, "learning_rate": 2.6794625719769677e-05, "loss": 0.4805, "loss_nan_ranks": 0, "loss_rank_avg": 0.1610392928123474, "step": 350, "valid_targets_mean": 11080.4, "valid_targets_min": 885 }, { "epoch": 0.3408, "grad_norm": 0.3168783571987516, "learning_rate": 2.7178502879078697e-05, "loss": 0.4777, "loss_nan_ranks": 0, "loss_rank_avg": 0.1885453164577484, "step": 355, "valid_targets_mean": 11284.8, "valid_targets_min": 2053 }, { "epoch": 0.3456, "grad_norm": 0.29757777058122253, "learning_rate": 2.756238003838772e-05, "loss": 0.4757, "loss_nan_ranks": 0, "loss_rank_avg": 0.12922048568725586, "step": 360, "valid_targets_mean": 9008.3, "valid_targets_min": 2069 }, { "epoch": 0.3504, "grad_norm": 0.29845542522302926, "learning_rate": 2.7946257197696737e-05, "loss": 0.4738, "loss_nan_ranks": 0, "loss_rank_avg": 0.1480693519115448, "step": 365, "valid_targets_mean": 9970.8, "valid_targets_min": 2240 }, { "epoch": 0.3552, "grad_norm": 0.2607162119403624, "learning_rate": 2.833013435700576e-05, "loss": 0.4573, "loss_nan_ranks": 0, "loss_rank_avg": 0.15535274147987366, "step": 370, "valid_targets_mean": 11197.2, "valid_targets_min": 2704 }, { "epoch": 0.36, "grad_norm": 0.2899828540897501, "learning_rate": 2.8714011516314784e-05, "loss": 0.4684, "loss_nan_ranks": 0, "loss_rank_avg": 0.18022534251213074, "step": 375, "valid_targets_mean": 10962.7, "valid_targets_min": 1224 }, { "epoch": 0.3648, "grad_norm": 0.26481660377161126, "learning_rate": 2.90978886756238e-05, "loss": 0.4698, "loss_nan_ranks": 0, "loss_rank_avg": 0.13400977849960327, "step": 380, "valid_targets_mean": 9079.6, "valid_targets_min": 1891 }, { "epoch": 0.3696, "grad_norm": 0.2617162429432194, "learning_rate": 2.9481765834932825e-05, "loss": 0.4707, "loss_nan_ranks": 0, "loss_rank_avg": 0.13027355074882507, "step": 385, "valid_targets_mean": 8412.9, "valid_targets_min": 1498 }, { "epoch": 0.3744, "grad_norm": 0.2701862190450275, "learning_rate": 2.9865642994241845e-05, "loss": 0.4708, "loss_nan_ranks": 0, "loss_rank_avg": 0.16891103982925415, "step": 390, "valid_targets_mean": 11449.3, "valid_targets_min": 1279 }, { "epoch": 0.3792, "grad_norm": 0.29379480481092074, "learning_rate": 3.0249520153550865e-05, "loss": 0.4707, "loss_nan_ranks": 0, "loss_rank_avg": 0.14961659908294678, "step": 395, "valid_targets_mean": 8604.1, "valid_targets_min": 1994 }, { "epoch": 0.384, "grad_norm": 0.27150103043577656, "learning_rate": 3.063339731285989e-05, "loss": 0.4753, "loss_nan_ranks": 0, "loss_rank_avg": 0.1796588897705078, "step": 400, "valid_targets_mean": 11844.7, "valid_targets_min": 2622 }, { "epoch": 0.3888, "grad_norm": 0.29573597688488124, "learning_rate": 3.101727447216891e-05, "loss": 0.4705, "loss_nan_ranks": 0, "loss_rank_avg": 0.20640979707241058, "step": 405, "valid_targets_mean": 14013.4, "valid_targets_min": 2984 }, { "epoch": 0.3936, "grad_norm": 0.25248186174434967, "learning_rate": 3.140115163147793e-05, "loss": 0.4614, "loss_nan_ranks": 0, "loss_rank_avg": 0.16427947580814362, "step": 410, "valid_targets_mean": 11053.4, "valid_targets_min": 2699 }, { "epoch": 0.3984, "grad_norm": 0.3765832037408977, "learning_rate": 3.178502879078695e-05, "loss": 0.4713, "loss_nan_ranks": 0, "loss_rank_avg": 0.14113269746303558, "step": 415, "valid_targets_mean": 9704.3, "valid_targets_min": 3191 }, { "epoch": 0.4032, "grad_norm": 0.29914718763920833, "learning_rate": 3.216890595009597e-05, "loss": 0.4694, "loss_nan_ranks": 0, "loss_rank_avg": 0.15573322772979736, "step": 420, "valid_targets_mean": 10724.8, "valid_targets_min": 1674 }, { "epoch": 0.408, "grad_norm": 0.28083425113360516, "learning_rate": 3.2552783109404996e-05, "loss": 0.4588, "loss_nan_ranks": 0, "loss_rank_avg": 0.17997148633003235, "step": 425, "valid_targets_mean": 12482.6, "valid_targets_min": 2166 }, { "epoch": 0.4128, "grad_norm": 0.2976974373969709, "learning_rate": 3.2936660268714016e-05, "loss": 0.4657, "loss_nan_ranks": 0, "loss_rank_avg": 0.15475307404994965, "step": 430, "valid_targets_mean": 10911.6, "valid_targets_min": 2009 }, { "epoch": 0.4176, "grad_norm": 0.24542082786514977, "learning_rate": 3.3320537428023036e-05, "loss": 0.4645, "loss_nan_ranks": 0, "loss_rank_avg": 0.1643528938293457, "step": 435, "valid_targets_mean": 12095.1, "valid_targets_min": 4705 }, { "epoch": 0.4224, "grad_norm": 0.29303842872775576, "learning_rate": 3.3704414587332056e-05, "loss": 0.4647, "loss_nan_ranks": 0, "loss_rank_avg": 0.13531912863254547, "step": 440, "valid_targets_mean": 9222.8, "valid_targets_min": 2233 }, { "epoch": 0.4272, "grad_norm": 0.2828869010226847, "learning_rate": 3.4088291746641077e-05, "loss": 0.474, "loss_nan_ranks": 0, "loss_rank_avg": 0.14599958062171936, "step": 445, "valid_targets_mean": 11280.1, "valid_targets_min": 2279 }, { "epoch": 0.432, "grad_norm": 0.29431208133429276, "learning_rate": 3.4472168905950104e-05, "loss": 0.4621, "loss_nan_ranks": 0, "loss_rank_avg": 0.14398963749408722, "step": 450, "valid_targets_mean": 10311.7, "valid_targets_min": 1728 }, { "epoch": 0.4368, "grad_norm": 0.2585227807649877, "learning_rate": 3.485604606525912e-05, "loss": 0.461, "loss_nan_ranks": 0, "loss_rank_avg": 0.1372634768486023, "step": 455, "valid_targets_mean": 8504.6, "valid_targets_min": 1508 }, { "epoch": 0.4416, "grad_norm": 0.29941740189685506, "learning_rate": 3.5239923224568144e-05, "loss": 0.4618, "loss_nan_ranks": 0, "loss_rank_avg": 0.13782289624214172, "step": 460, "valid_targets_mean": 9918.3, "valid_targets_min": 2310 }, { "epoch": 0.4464, "grad_norm": 0.29746723988147145, "learning_rate": 3.5623800383877164e-05, "loss": 0.4669, "loss_nan_ranks": 0, "loss_rank_avg": 0.12251640856266022, "step": 465, "valid_targets_mean": 8674.2, "valid_targets_min": 1732 }, { "epoch": 0.4512, "grad_norm": 0.3516933086901854, "learning_rate": 3.6007677543186184e-05, "loss": 0.4707, "loss_nan_ranks": 0, "loss_rank_avg": 0.18415644764900208, "step": 470, "valid_targets_mean": 12712.0, "valid_targets_min": 1951 }, { "epoch": 0.456, "grad_norm": 0.2704944515833381, "learning_rate": 3.6391554702495204e-05, "loss": 0.4571, "loss_nan_ranks": 0, "loss_rank_avg": 0.15503855049610138, "step": 475, "valid_targets_mean": 10973.3, "valid_targets_min": 2568 }, { "epoch": 0.4608, "grad_norm": 0.2579883782673916, "learning_rate": 3.6775431861804224e-05, "loss": 0.4611, "loss_nan_ranks": 0, "loss_rank_avg": 0.15346036851406097, "step": 480, "valid_targets_mean": 9707.8, "valid_targets_min": 3027 }, { "epoch": 0.4656, "grad_norm": 0.28982082854321284, "learning_rate": 3.7159309021113245e-05, "loss": 0.4471, "loss_nan_ranks": 0, "loss_rank_avg": 0.12727707624435425, "step": 485, "valid_targets_mean": 9593.2, "valid_targets_min": 2884 }, { "epoch": 0.4704, "grad_norm": 0.2646662239031736, "learning_rate": 3.7543186180422265e-05, "loss": 0.459, "loss_nan_ranks": 0, "loss_rank_avg": 0.16413524746894836, "step": 490, "valid_targets_mean": 11934.7, "valid_targets_min": 3560 }, { "epoch": 0.4752, "grad_norm": 0.266665098284034, "learning_rate": 3.792706333973129e-05, "loss": 0.4616, "loss_nan_ranks": 0, "loss_rank_avg": 0.1243312731385231, "step": 495, "valid_targets_mean": 8476.5, "valid_targets_min": 2652 }, { "epoch": 0.48, "grad_norm": 0.28190317886063865, "learning_rate": 3.831094049904031e-05, "loss": 0.4639, "loss_nan_ranks": 0, "loss_rank_avg": 0.16007450222969055, "step": 500, "valid_targets_mean": 9943.0, "valid_targets_min": 2220 }, { "epoch": 0.4848, "grad_norm": 0.29271223570474775, "learning_rate": 3.869481765834933e-05, "loss": 0.4679, "loss_nan_ranks": 0, "loss_rank_avg": 0.1724342703819275, "step": 505, "valid_targets_mean": 11642.2, "valid_targets_min": 1354 }, { "epoch": 0.4896, "grad_norm": 0.26903639753216824, "learning_rate": 3.907869481765835e-05, "loss": 0.449, "loss_nan_ranks": 0, "loss_rank_avg": 0.14683669805526733, "step": 510, "valid_targets_mean": 10091.7, "valid_targets_min": 2840 }, { "epoch": 0.4944, "grad_norm": 0.2559878906486554, "learning_rate": 3.946257197696737e-05, "loss": 0.4672, "loss_nan_ranks": 0, "loss_rank_avg": 0.18146558105945587, "step": 515, "valid_targets_mean": 11818.8, "valid_targets_min": 939 }, { "epoch": 0.4992, "grad_norm": 0.3302113861791353, "learning_rate": 3.984644913627639e-05, "loss": 0.4534, "loss_nan_ranks": 0, "loss_rank_avg": 0.13053454458713531, "step": 520, "valid_targets_mean": 8831.3, "valid_targets_min": 742 }, { "epoch": 0.504, "grad_norm": 0.26972775533524873, "learning_rate": 3.999995959997414e-05, "loss": 0.4643, "loss_nan_ranks": 0, "loss_rank_avg": 0.16849611699581146, "step": 525, "valid_targets_mean": 10903.1, "valid_targets_min": 1886 }, { "epoch": 0.5088, "grad_norm": 0.2603085017747878, "learning_rate": 3.999971271151827e-05, "loss": 0.4612, "loss_nan_ranks": 0, "loss_rank_avg": 0.1302165389060974, "step": 530, "valid_targets_mean": 8817.5, "valid_targets_min": 1843 }, { "epoch": 0.5136, "grad_norm": 0.2858496522578758, "learning_rate": 3.9999241381832614e-05, "loss": 0.4637, "loss_nan_ranks": 0, "loss_rank_avg": 0.14295253157615662, "step": 535, "valid_targets_mean": 10053.8, "valid_targets_min": 2740 }, { "epoch": 0.5184, "grad_norm": 0.26152174514020043, "learning_rate": 3.999854561620655e-05, "loss": 0.4595, "loss_nan_ranks": 0, "loss_rank_avg": 0.14226208627223969, "step": 540, "valid_targets_mean": 11106.9, "valid_targets_min": 1576 }, { "epoch": 0.5232, "grad_norm": 0.26028352862388787, "learning_rate": 3.9997625422448114e-05, "loss": 0.4545, "loss_nan_ranks": 0, "loss_rank_avg": 0.15191048383712769, "step": 545, "valid_targets_mean": 9975.0, "valid_targets_min": 3918 }, { "epoch": 0.528, "grad_norm": 0.252965467893726, "learning_rate": 3.999648081088391e-05, "loss": 0.4534, "loss_nan_ranks": 0, "loss_rank_avg": 0.13953734934329987, "step": 550, "valid_targets_mean": 9347.6, "valid_targets_min": 2024 }, { "epoch": 0.5328, "grad_norm": 0.25661462861347195, "learning_rate": 3.999511179435905e-05, "loss": 0.4592, "loss_nan_ranks": 0, "loss_rank_avg": 0.15799963474273682, "step": 555, "valid_targets_mean": 10477.4, "valid_targets_min": 3319 }, { "epoch": 0.5376, "grad_norm": 0.270288528995941, "learning_rate": 3.999351838823691e-05, "loss": 0.4602, "loss_nan_ranks": 0, "loss_rank_avg": 0.15654206275939941, "step": 560, "valid_targets_mean": 10189.6, "valid_targets_min": 1777 }, { "epoch": 0.5424, "grad_norm": 0.35156440192336935, "learning_rate": 3.999170061039908e-05, "loss": 0.4535, "loss_nan_ranks": 0, "loss_rank_avg": 0.1559731662273407, "step": 565, "valid_targets_mean": 9539.7, "valid_targets_min": 2028 }, { "epoch": 0.5472, "grad_norm": 0.2539828685860791, "learning_rate": 3.998965848124505e-05, "loss": 0.4551, "loss_nan_ranks": 0, "loss_rank_avg": 0.13896337151527405, "step": 570, "valid_targets_mean": 10557.0, "valid_targets_min": 2887 }, { "epoch": 0.552, "grad_norm": 0.2598033898247074, "learning_rate": 3.998739202369205e-05, "loss": 0.4584, "loss_nan_ranks": 0, "loss_rank_avg": 0.1374547779560089, "step": 575, "valid_targets_mean": 10081.8, "valid_targets_min": 1494 }, { "epoch": 0.5568, "grad_norm": 0.30314441059434327, "learning_rate": 3.998490126317477e-05, "loss": 0.4483, "loss_nan_ranks": 0, "loss_rank_avg": 0.16131776571273804, "step": 580, "valid_targets_mean": 10033.4, "valid_targets_min": 1706 }, { "epoch": 0.5616, "grad_norm": 0.22031863670397067, "learning_rate": 3.9982186227645085e-05, "loss": 0.4571, "loss_nan_ranks": 0, "loss_rank_avg": 0.1602936089038849, "step": 585, "valid_targets_mean": 11657.8, "valid_targets_min": 1006 }, { "epoch": 0.5664, "grad_norm": 0.26943631448171856, "learning_rate": 3.9979246947571724e-05, "loss": 0.4517, "loss_nan_ranks": 0, "loss_rank_avg": 0.16911017894744873, "step": 590, "valid_targets_mean": 12263.9, "valid_targets_min": 1702 }, { "epoch": 0.5712, "grad_norm": 0.25061495037382847, "learning_rate": 3.9976083455939945e-05, "loss": 0.4532, "loss_nan_ranks": 0, "loss_rank_avg": 0.15989217162132263, "step": 595, "valid_targets_mean": 11708.3, "valid_targets_min": 1871 }, { "epoch": 0.576, "grad_norm": 0.261621992497104, "learning_rate": 3.9972695788251155e-05, "loss": 0.4401, "loss_nan_ranks": 0, "loss_rank_avg": 0.1598036289215088, "step": 600, "valid_targets_mean": 10135.6, "valid_targets_min": 2569 }, { "epoch": 0.5808, "grad_norm": 0.2808004182619828, "learning_rate": 3.996908398252251e-05, "loss": 0.4541, "loss_nan_ranks": 0, "loss_rank_avg": 0.1376391500234604, "step": 605, "valid_targets_mean": 8971.0, "valid_targets_min": 1025 }, { "epoch": 0.5856, "grad_norm": 0.25161025940924875, "learning_rate": 3.9965248079286505e-05, "loss": 0.4419, "loss_nan_ranks": 0, "loss_rank_avg": 0.15694254636764526, "step": 610, "valid_targets_mean": 11790.6, "valid_targets_min": 2403 }, { "epoch": 0.5904, "grad_norm": 0.391406643033309, "learning_rate": 3.99611881215905e-05, "loss": 0.4492, "loss_nan_ranks": 0, "loss_rank_avg": 0.13714802265167236, "step": 615, "valid_targets_mean": 8819.1, "valid_targets_min": 1645 }, { "epoch": 0.5952, "grad_norm": 0.3027879951842276, "learning_rate": 3.995690415499624e-05, "loss": 0.4483, "loss_nan_ranks": 0, "loss_rank_avg": 0.15102067589759827, "step": 620, "valid_targets_mean": 10631.6, "valid_targets_min": 2143 }, { "epoch": 0.6, "grad_norm": 0.25471127728925685, "learning_rate": 3.995239622757936e-05, "loss": 0.4476, "loss_nan_ranks": 0, "loss_rank_avg": 0.15196582674980164, "step": 625, "valid_targets_mean": 10613.7, "valid_targets_min": 2445 }, { "epoch": 0.6048, "grad_norm": 0.2491408938992097, "learning_rate": 3.994766438992882e-05, "loss": 0.4545, "loss_nan_ranks": 0, "loss_rank_avg": 0.15728193521499634, "step": 630, "valid_targets_mean": 11646.2, "valid_targets_min": 3345 }, { "epoch": 0.6096, "grad_norm": 0.2718517988380648, "learning_rate": 3.994270869514635e-05, "loss": 0.4479, "loss_nan_ranks": 0, "loss_rank_avg": 0.17402216792106628, "step": 635, "valid_targets_mean": 10870.4, "valid_targets_min": 2319 }, { "epoch": 0.6144, "grad_norm": 0.2626639858806631, "learning_rate": 3.9937529198845864e-05, "loss": 0.4471, "loss_nan_ranks": 0, "loss_rank_avg": 0.15539997816085815, "step": 640, "valid_targets_mean": 9441.2, "valid_targets_min": 2925 }, { "epoch": 0.6192, "grad_norm": 0.249237014812052, "learning_rate": 3.9932125959152833e-05, "loss": 0.4508, "loss_nan_ranks": 0, "loss_rank_avg": 0.13891427218914032, "step": 645, "valid_targets_mean": 8957.0, "valid_targets_min": 861 }, { "epoch": 0.624, "grad_norm": 0.25544849188790725, "learning_rate": 3.9926499036703607e-05, "loss": 0.4544, "loss_nan_ranks": 0, "loss_rank_avg": 0.14250892400741577, "step": 650, "valid_targets_mean": 9748.9, "valid_targets_min": 1507 }, { "epoch": 0.6288, "grad_norm": 0.2577063394014419, "learning_rate": 3.992064849464476e-05, "loss": 0.4533, "loss_nan_ranks": 0, "loss_rank_avg": 0.156438410282135, "step": 655, "valid_targets_mean": 10886.6, "valid_targets_min": 1328 }, { "epoch": 0.6336, "grad_norm": 0.26664954451504175, "learning_rate": 3.991457439863238e-05, "loss": 0.4544, "loss_nan_ranks": 0, "loss_rank_avg": 0.16429439187049866, "step": 660, "valid_targets_mean": 11470.5, "valid_targets_min": 1398 }, { "epoch": 0.6384, "grad_norm": 0.2585738675100044, "learning_rate": 3.990827681683133e-05, "loss": 0.4511, "loss_nan_ranks": 0, "loss_rank_avg": 0.1722051352262497, "step": 665, "valid_targets_mean": 11573.3, "valid_targets_min": 274 }, { "epoch": 0.6432, "grad_norm": 0.24473615866589019, "learning_rate": 3.990175581991448e-05, "loss": 0.4536, "loss_nan_ranks": 0, "loss_rank_avg": 0.16524508595466614, "step": 670, "valid_targets_mean": 11921.1, "valid_targets_min": 2460 }, { "epoch": 0.648, "grad_norm": 0.2588924362804296, "learning_rate": 3.989501148106189e-05, "loss": 0.4416, "loss_nan_ranks": 0, "loss_rank_avg": 0.12152011692523956, "step": 675, "valid_targets_mean": 8583.5, "valid_targets_min": 1520 }, { "epoch": 0.6528, "grad_norm": 0.2906148484888001, "learning_rate": 3.988804387596005e-05, "loss": 0.4543, "loss_nan_ranks": 0, "loss_rank_avg": 0.1639477014541626, "step": 680, "valid_targets_mean": 10996.6, "valid_targets_min": 1719 }, { "epoch": 0.6576, "grad_norm": 0.2269520950972862, "learning_rate": 3.9880853082800965e-05, "loss": 0.4538, "loss_nan_ranks": 0, "loss_rank_avg": 0.14809130132198334, "step": 685, "valid_targets_mean": 10731.2, "valid_targets_min": 1983 }, { "epoch": 0.6624, "grad_norm": 0.2878053426516386, "learning_rate": 3.987343918228133e-05, "loss": 0.4439, "loss_nan_ranks": 0, "loss_rank_avg": 0.15128569304943085, "step": 690, "valid_targets_mean": 11356.6, "valid_targets_min": 4547 }, { "epoch": 0.6672, "grad_norm": 0.24198387949329253, "learning_rate": 3.9865802257601584e-05, "loss": 0.4475, "loss_nan_ranks": 0, "loss_rank_avg": 0.1544976532459259, "step": 695, "valid_targets_mean": 10080.2, "valid_targets_min": 1962 }, { "epoch": 0.672, "grad_norm": 0.28830935840143584, "learning_rate": 3.9857942394464976e-05, "loss": 0.4534, "loss_nan_ranks": 0, "loss_rank_avg": 0.13071781396865845, "step": 700, "valid_targets_mean": 8885.0, "valid_targets_min": 1579 }, { "epoch": 0.6768, "grad_norm": 0.2662828860280673, "learning_rate": 3.984985968107667e-05, "loss": 0.4491, "loss_nan_ranks": 0, "loss_rank_avg": 0.15589673817157745, "step": 705, "valid_targets_mean": 11279.5, "valid_targets_min": 1977 }, { "epoch": 0.6816, "grad_norm": 0.2606792021323181, "learning_rate": 3.984155420814266e-05, "loss": 0.4422, "loss_nan_ranks": 0, "loss_rank_avg": 0.14421959221363068, "step": 710, "valid_targets_mean": 10752.7, "valid_targets_min": 2087 }, { "epoch": 0.6864, "grad_norm": 0.28331509780837333, "learning_rate": 3.9833026068868814e-05, "loss": 0.4399, "loss_nan_ranks": 0, "loss_rank_avg": 0.16088783740997314, "step": 715, "valid_targets_mean": 11895.5, "valid_targets_min": 2299 }, { "epoch": 0.6912, "grad_norm": 0.2401398741428507, "learning_rate": 3.982427535895982e-05, "loss": 0.4493, "loss_nan_ranks": 0, "loss_rank_avg": 0.12636323273181915, "step": 720, "valid_targets_mean": 8741.3, "valid_targets_min": 2064 }, { "epoch": 0.696, "grad_norm": 0.24623098098235072, "learning_rate": 3.9815302176618076e-05, "loss": 0.4372, "loss_nan_ranks": 0, "loss_rank_avg": 0.14504778385162354, "step": 725, "valid_targets_mean": 9609.4, "valid_targets_min": 2910 }, { "epoch": 0.7008, "grad_norm": 0.27011416048003173, "learning_rate": 3.980610662254264e-05, "loss": 0.4452, "loss_nan_ranks": 0, "loss_rank_avg": 0.1622447371482849, "step": 730, "valid_targets_mean": 11419.7, "valid_targets_min": 2401 }, { "epoch": 0.7056, "grad_norm": 0.29719134463341074, "learning_rate": 3.9796688799928075e-05, "loss": 0.444, "loss_nan_ranks": 0, "loss_rank_avg": 0.13660922646522522, "step": 735, "valid_targets_mean": 10302.8, "valid_targets_min": 2296 }, { "epoch": 0.7104, "grad_norm": 0.24542996505841894, "learning_rate": 3.978704881446327e-05, "loss": 0.4418, "loss_nan_ranks": 0, "loss_rank_avg": 0.17318297922611237, "step": 740, "valid_targets_mean": 13040.1, "valid_targets_min": 2918 }, { "epoch": 0.7152, "grad_norm": 0.23791161407706576, "learning_rate": 3.9777186774330304e-05, "loss": 0.4415, "loss_nan_ranks": 0, "loss_rank_avg": 0.14803707599639893, "step": 745, "valid_targets_mean": 10797.8, "valid_targets_min": 2483 }, { "epoch": 0.72, "grad_norm": 0.25166109994851354, "learning_rate": 3.976710279020318e-05, "loss": 0.4447, "loss_nan_ranks": 0, "loss_rank_avg": 0.17335036396980286, "step": 750, "valid_targets_mean": 11030.3, "valid_targets_min": 2140 }, { "epoch": 0.7248, "grad_norm": 0.28361399295331674, "learning_rate": 3.975679697524661e-05, "loss": 0.4451, "loss_nan_ranks": 0, "loss_rank_avg": 0.148225799202919, "step": 755, "valid_targets_mean": 11292.8, "valid_targets_min": 1960 }, { "epoch": 0.7296, "grad_norm": 0.24746500944939762, "learning_rate": 3.974626944511475e-05, "loss": 0.4438, "loss_nan_ranks": 0, "loss_rank_avg": 0.16841234266757965, "step": 760, "valid_targets_mean": 12154.3, "valid_targets_min": 2203 }, { "epoch": 0.7344, "grad_norm": 0.2241960168441248, "learning_rate": 3.973552031794988e-05, "loss": 0.4427, "loss_nan_ranks": 0, "loss_rank_avg": 0.14119960367679596, "step": 765, "valid_targets_mean": 9363.3, "valid_targets_min": 2701 }, { "epoch": 0.7392, "grad_norm": 0.23458423848116103, "learning_rate": 3.9724549714381106e-05, "loss": 0.4472, "loss_nan_ranks": 0, "loss_rank_avg": 0.13517552614212036, "step": 770, "valid_targets_mean": 10275.2, "valid_targets_min": 2268 }, { "epoch": 0.744, "grad_norm": 0.24225388329162625, "learning_rate": 3.971335775752298e-05, "loss": 0.4472, "loss_nan_ranks": 0, "loss_rank_avg": 0.17425012588500977, "step": 775, "valid_targets_mean": 11925.4, "valid_targets_min": 3083 }, { "epoch": 0.7488, "grad_norm": 0.2297680649270912, "learning_rate": 3.970194457297414e-05, "loss": 0.4468, "loss_nan_ranks": 0, "loss_rank_avg": 0.15473422408103943, "step": 780, "valid_targets_mean": 10975.8, "valid_targets_min": 1764 }, { "epoch": 0.7536, "grad_norm": 0.27742186379777073, "learning_rate": 3.9690310288815876e-05, "loss": 0.4381, "loss_nan_ranks": 0, "loss_rank_avg": 0.1480221152305603, "step": 785, "valid_targets_mean": 10486.0, "valid_targets_min": 1116 }, { "epoch": 0.7584, "grad_norm": 0.27198081218563974, "learning_rate": 3.967845503561073e-05, "loss": 0.4552, "loss_nan_ranks": 0, "loss_rank_avg": 0.1705826222896576, "step": 790, "valid_targets_mean": 11610.0, "valid_targets_min": 3639 }, { "epoch": 0.7632, "grad_norm": 0.2102169384572373, "learning_rate": 3.9666378946400974e-05, "loss": 0.4484, "loss_nan_ranks": 0, "loss_rank_avg": 0.1382056474685669, "step": 795, "valid_targets_mean": 10808.0, "valid_targets_min": 1630 }, { "epoch": 0.768, "grad_norm": 0.23391900735891194, "learning_rate": 3.965408215670719e-05, "loss": 0.4495, "loss_nan_ranks": 0, "loss_rank_avg": 0.15888884663581848, "step": 800, "valid_targets_mean": 10829.6, "valid_targets_min": 3350 }, { "epoch": 0.7728, "grad_norm": 0.22879398550516797, "learning_rate": 3.964156480452667e-05, "loss": 0.4371, "loss_nan_ranks": 0, "loss_rank_avg": 0.15504437685012817, "step": 805, "valid_targets_mean": 11066.4, "valid_targets_min": 2243 }, { "epoch": 0.7776, "grad_norm": 0.24667088526976355, "learning_rate": 3.962882703033195e-05, "loss": 0.4391, "loss_nan_ranks": 0, "loss_rank_avg": 0.14036577939987183, "step": 810, "valid_targets_mean": 10358.6, "valid_targets_min": 2893 }, { "epoch": 0.7824, "grad_norm": 0.23114425024656984, "learning_rate": 3.961586897706915e-05, "loss": 0.4349, "loss_nan_ranks": 0, "loss_rank_avg": 0.13787609338760376, "step": 815, "valid_targets_mean": 9714.0, "valid_targets_min": 2687 }, { "epoch": 0.7872, "grad_norm": 0.23473702906122673, "learning_rate": 3.960269079015643e-05, "loss": 0.4449, "loss_nan_ranks": 0, "loss_rank_avg": 0.15032735466957092, "step": 820, "valid_targets_mean": 9774.9, "valid_targets_min": 2028 }, { "epoch": 0.792, "grad_norm": 0.2162385966678345, "learning_rate": 3.958929261748236e-05, "loss": 0.4405, "loss_nan_ranks": 0, "loss_rank_avg": 0.14596378803253174, "step": 825, "valid_targets_mean": 10958.2, "valid_targets_min": 2010 }, { "epoch": 0.7968, "grad_norm": 0.24222519458371453, "learning_rate": 3.957567460940419e-05, "loss": 0.4394, "loss_nan_ranks": 0, "loss_rank_avg": 0.12375211715698242, "step": 830, "valid_targets_mean": 8580.5, "valid_targets_min": 1205 }, { "epoch": 0.8016, "grad_norm": 0.2933772610237654, "learning_rate": 3.9561836918746256e-05, "loss": 0.4398, "loss_nan_ranks": 0, "loss_rank_avg": 0.15357926487922668, "step": 835, "valid_targets_mean": 11393.8, "valid_targets_min": 2154 }, { "epoch": 0.8064, "grad_norm": 0.2531199798856708, "learning_rate": 3.95477797007982e-05, "loss": 0.4379, "loss_nan_ranks": 0, "loss_rank_avg": 0.15377768874168396, "step": 840, "valid_targets_mean": 10993.3, "valid_targets_min": 2009 }, { "epoch": 0.8112, "grad_norm": 0.24295989807739177, "learning_rate": 3.953350311331325e-05, "loss": 0.4436, "loss_nan_ranks": 0, "loss_rank_avg": 0.11503560096025467, "step": 845, "valid_targets_mean": 9558.3, "valid_targets_min": 3104 }, { "epoch": 0.816, "grad_norm": 0.3035777048117532, "learning_rate": 3.951900731650645e-05, "loss": 0.4324, "loss_nan_ranks": 0, "loss_rank_avg": 0.1553291380405426, "step": 850, "valid_targets_mean": 9700.8, "valid_targets_min": 1456 }, { "epoch": 0.8208, "grad_norm": 0.2708795633114363, "learning_rate": 3.950429247305286e-05, "loss": 0.4363, "loss_nan_ranks": 0, "loss_rank_avg": 0.15550169348716736, "step": 855, "valid_targets_mean": 11636.9, "valid_targets_min": 1244 }, { "epoch": 0.8256, "grad_norm": 0.2719042040403292, "learning_rate": 3.9489358748085737e-05, "loss": 0.4371, "loss_nan_ranks": 0, "loss_rank_avg": 0.10961782932281494, "step": 860, "valid_targets_mean": 8280.6, "valid_targets_min": 1860 }, { "epoch": 0.8304, "grad_norm": 0.24090820427969437, "learning_rate": 3.947420630919466e-05, "loss": 0.4395, "loss_nan_ranks": 0, "loss_rank_avg": 0.1432057023048401, "step": 865, "valid_targets_mean": 10116.8, "valid_targets_min": 3043 }, { "epoch": 0.8352, "grad_norm": 0.27574496492858264, "learning_rate": 3.9458835326423674e-05, "loss": 0.4404, "loss_nan_ranks": 0, "loss_rank_avg": 0.11399415135383606, "step": 870, "valid_targets_mean": 8621.7, "valid_targets_min": 2606 }, { "epoch": 0.84, "grad_norm": 0.23514909460962988, "learning_rate": 3.9443245972269376e-05, "loss": 0.4385, "loss_nan_ranks": 0, "loss_rank_avg": 0.16591641306877136, "step": 875, "valid_targets_mean": 11010.5, "valid_targets_min": 1678 }, { "epoch": 0.8448, "grad_norm": 0.248267579212623, "learning_rate": 3.942743842167896e-05, "loss": 0.4349, "loss_nan_ranks": 0, "loss_rank_avg": 0.14936822652816772, "step": 880, "valid_targets_mean": 9566.6, "valid_targets_min": 1706 }, { "epoch": 0.8496, "grad_norm": 0.22128202143359202, "learning_rate": 3.941141285204829e-05, "loss": 0.4381, "loss_nan_ranks": 0, "loss_rank_avg": 0.11705336719751358, "step": 885, "valid_targets_mean": 8686.6, "valid_targets_min": 1291 }, { "epoch": 0.8544, "grad_norm": 0.24239550122658543, "learning_rate": 3.939516944321986e-05, "loss": 0.4412, "loss_nan_ranks": 0, "loss_rank_avg": 0.16379308700561523, "step": 890, "valid_targets_mean": 10584.9, "valid_targets_min": 1898 }, { "epoch": 0.8592, "grad_norm": 0.21297377581920748, "learning_rate": 3.937870837748085e-05, "loss": 0.4425, "loss_nan_ranks": 0, "loss_rank_avg": 0.15646252036094666, "step": 895, "valid_targets_mean": 10218.3, "valid_targets_min": 2225 }, { "epoch": 0.864, "grad_norm": 0.271473838990007, "learning_rate": 3.936202983956098e-05, "loss": 0.4401, "loss_nan_ranks": 0, "loss_rank_avg": 0.18577039241790771, "step": 900, "valid_targets_mean": 12629.7, "valid_targets_min": 2401 }, { "epoch": 0.8688, "grad_norm": 0.2347160954091539, "learning_rate": 3.934513401663052e-05, "loss": 0.4322, "loss_nan_ranks": 0, "loss_rank_avg": 0.14884625375270844, "step": 905, "valid_targets_mean": 10616.7, "valid_targets_min": 2416 }, { "epoch": 0.8736, "grad_norm": 0.23617851555656597, "learning_rate": 3.9328021098298164e-05, "loss": 0.4458, "loss_nan_ranks": 0, "loss_rank_avg": 0.18026357889175415, "step": 910, "valid_targets_mean": 13847.2, "valid_targets_min": 2601 }, { "epoch": 0.8784, "grad_norm": 0.23774940308190678, "learning_rate": 3.9310691276608894e-05, "loss": 0.443, "loss_nan_ranks": 0, "loss_rank_avg": 0.1618087887763977, "step": 915, "valid_targets_mean": 9275.4, "valid_targets_min": 1435 }, { "epoch": 0.8832, "grad_norm": 0.2299724409741465, "learning_rate": 3.9293144746041824e-05, "loss": 0.4363, "loss_nan_ranks": 0, "loss_rank_avg": 0.1557924896478653, "step": 920, "valid_targets_mean": 10640.8, "valid_targets_min": 2643 }, { "epoch": 0.888, "grad_norm": 0.20806032544047204, "learning_rate": 3.9275381703508034e-05, "loss": 0.434, "loss_nan_ranks": 0, "loss_rank_avg": 0.14001302421092987, "step": 925, "valid_targets_mean": 10628.8, "valid_targets_min": 4377 }, { "epoch": 0.8928, "grad_norm": 0.20442904327913097, "learning_rate": 3.925740234834833e-05, "loss": 0.4428, "loss_nan_ranks": 0, "loss_rank_avg": 0.1151759922504425, "step": 930, "valid_targets_mean": 9097.5, "valid_targets_min": 2592 }, { "epoch": 0.8976, "grad_norm": 0.2779844590431934, "learning_rate": 3.9239206882331045e-05, "loss": 0.4426, "loss_nan_ranks": 0, "loss_rank_avg": 0.1592455804347992, "step": 935, "valid_targets_mean": 10262.3, "valid_targets_min": 1553 }, { "epoch": 0.9024, "grad_norm": 0.2376479952598136, "learning_rate": 3.922079550964976e-05, "loss": 0.4377, "loss_nan_ranks": 0, "loss_rank_avg": 0.17629006505012512, "step": 940, "valid_targets_mean": 11368.9, "valid_targets_min": 1441 }, { "epoch": 0.9072, "grad_norm": 0.2610581487793073, "learning_rate": 3.920216843692099e-05, "loss": 0.4376, "loss_nan_ranks": 0, "loss_rank_avg": 0.1378932148218155, "step": 945, "valid_targets_mean": 10733.7, "valid_targets_min": 631 }, { "epoch": 0.912, "grad_norm": 0.23384408666927872, "learning_rate": 3.918332587318189e-05, "loss": 0.4332, "loss_nan_ranks": 0, "loss_rank_avg": 0.14836661517620087, "step": 950, "valid_targets_mean": 10466.8, "valid_targets_min": 1466 }, { "epoch": 0.9168, "grad_norm": 0.24291701861640366, "learning_rate": 3.916426802988791e-05, "loss": 0.4426, "loss_nan_ranks": 0, "loss_rank_avg": 0.14258360862731934, "step": 955, "valid_targets_mean": 10359.5, "valid_targets_min": 2176 }, { "epoch": 0.9216, "grad_norm": 0.25156841355285575, "learning_rate": 3.9144995120910414e-05, "loss": 0.4328, "loss_nan_ranks": 0, "loss_rank_avg": 0.13940885663032532, "step": 960, "valid_targets_mean": 9649.2, "valid_targets_min": 1351 }, { "epoch": 0.9264, "grad_norm": 0.23893594978350297, "learning_rate": 3.912550736253428e-05, "loss": 0.4315, "loss_nan_ranks": 0, "loss_rank_avg": 0.14351066946983337, "step": 965, "valid_targets_mean": 9654.1, "valid_targets_min": 2523 }, { "epoch": 0.9312, "grad_norm": 0.21816935655353778, "learning_rate": 3.9105804973455466e-05, "loss": 0.4282, "loss_nan_ranks": 0, "loss_rank_avg": 0.15850083529949188, "step": 970, "valid_targets_mean": 9993.9, "valid_targets_min": 2456 }, { "epoch": 0.936, "grad_norm": 0.21964927011900748, "learning_rate": 3.908588817477858e-05, "loss": 0.4372, "loss_nan_ranks": 0, "loss_rank_avg": 0.1543029099702835, "step": 975, "valid_targets_mean": 10524.8, "valid_targets_min": 2105 }, { "epoch": 0.9408, "grad_norm": 0.2520400609926727, "learning_rate": 3.9065757190014356e-05, "loss": 0.4309, "loss_nan_ranks": 0, "loss_rank_avg": 0.1531248688697815, "step": 980, "valid_targets_mean": 10672.6, "valid_targets_min": 1765 }, { "epoch": 0.9456, "grad_norm": 0.22766144278022285, "learning_rate": 3.90454122450772e-05, "loss": 0.4256, "loss_nan_ranks": 0, "loss_rank_avg": 0.17786508798599243, "step": 985, "valid_targets_mean": 14325.0, "valid_targets_min": 1820 }, { "epoch": 0.9504, "grad_norm": 0.21863446792464766, "learning_rate": 3.9024853568282615e-05, "loss": 0.4301, "loss_nan_ranks": 0, "loss_rank_avg": 0.14357662200927734, "step": 990, "valid_targets_mean": 11311.1, "valid_targets_min": 2214 }, { "epoch": 0.9552, "grad_norm": 0.2722964437044844, "learning_rate": 3.900408139034464e-05, "loss": 0.4387, "loss_nan_ranks": 0, "loss_rank_avg": 0.15044580399990082, "step": 995, "valid_targets_mean": 10024.0, "valid_targets_min": 2247 }, { "epoch": 0.96, "grad_norm": 0.22324695304768527, "learning_rate": 3.89830959443733e-05, "loss": 0.4401, "loss_nan_ranks": 0, "loss_rank_avg": 0.11514655500650406, "step": 1000, "valid_targets_mean": 8407.6, "valid_targets_min": 883 }, { "epoch": 0.9648, "grad_norm": 0.21542830139427063, "learning_rate": 3.896189746587192e-05, "loss": 0.4278, "loss_nan_ranks": 0, "loss_rank_avg": 0.14129936695098877, "step": 1005, "valid_targets_mean": 10078.5, "valid_targets_min": 1519 }, { "epoch": 0.9696, "grad_norm": 0.2051780043293131, "learning_rate": 3.894048619273457e-05, "loss": 0.4368, "loss_nan_ranks": 0, "loss_rank_avg": 0.14626026153564453, "step": 1010, "valid_targets_mean": 11932.6, "valid_targets_min": 1957 }, { "epoch": 0.9744, "grad_norm": 0.2504604799803636, "learning_rate": 3.89188623652433e-05, "loss": 0.4333, "loss_nan_ranks": 0, "loss_rank_avg": 0.1564769744873047, "step": 1015, "valid_targets_mean": 10482.3, "valid_targets_min": 1443 }, { "epoch": 0.9792, "grad_norm": 0.21386579709839965, "learning_rate": 3.889702622606553e-05, "loss": 0.4358, "loss_nan_ranks": 0, "loss_rank_avg": 0.14831697940826416, "step": 1020, "valid_targets_mean": 10429.1, "valid_targets_min": 1235 }, { "epoch": 0.984, "grad_norm": 0.21260607427844888, "learning_rate": 3.887497802025129e-05, "loss": 0.4304, "loss_nan_ranks": 0, "loss_rank_avg": 0.13159194588661194, "step": 1025, "valid_targets_mean": 10932.1, "valid_targets_min": 2067 }, { "epoch": 0.9888, "grad_norm": 0.21391124051203142, "learning_rate": 3.885271799523043e-05, "loss": 0.4355, "loss_nan_ranks": 0, "loss_rank_avg": 0.13605813682079315, "step": 1030, "valid_targets_mean": 10411.8, "valid_targets_min": 1926 }, { "epoch": 0.9936, "grad_norm": 0.23829142954877147, "learning_rate": 3.8830246400809925e-05, "loss": 0.4333, "loss_nan_ranks": 0, "loss_rank_avg": 0.17297562956809998, "step": 1035, "valid_targets_mean": 12221.7, "valid_targets_min": 4900 }, { "epoch": 0.9984, "grad_norm": 0.2160903034725571, "learning_rate": 3.880756348917101e-05, "loss": 0.4387, "loss_nan_ranks": 0, "loss_rank_avg": 0.15260297060012817, "step": 1040, "valid_targets_mean": 11269.4, "valid_targets_min": 1774 }, { "epoch": 1.00288, "grad_norm": 0.2273858654830621, "learning_rate": 3.8784669514866365e-05, "loss": 0.4294, "loss_nan_ranks": 0, "loss_rank_avg": 0.1466825157403946, "step": 1045, "valid_targets_mean": 10658.0, "valid_targets_min": 3956 }, { "epoch": 1.00768, "grad_norm": 0.2315486695024205, "learning_rate": 3.876156473481727e-05, "loss": 0.4192, "loss_nan_ranks": 0, "loss_rank_avg": 0.1460821032524109, "step": 1050, "valid_targets_mean": 10631.7, "valid_targets_min": 2487 }, { "epoch": 1.01248, "grad_norm": 0.20848555300232693, "learning_rate": 3.8738249408310716e-05, "loss": 0.4181, "loss_nan_ranks": 0, "loss_rank_avg": 0.15337705612182617, "step": 1055, "valid_targets_mean": 11120.5, "valid_targets_min": 2295 }, { "epoch": 1.01728, "grad_norm": 0.2340676151350968, "learning_rate": 3.871472379699648e-05, "loss": 0.415, "loss_nan_ranks": 0, "loss_rank_avg": 0.12295055389404297, "step": 1060, "valid_targets_mean": 9224.1, "valid_targets_min": 1906 }, { "epoch": 1.02208, "grad_norm": 0.2432845446630706, "learning_rate": 3.869098816488422e-05, "loss": 0.424, "loss_nan_ranks": 0, "loss_rank_avg": 0.16106806695461273, "step": 1065, "valid_targets_mean": 12667.0, "valid_targets_min": 176 }, { "epoch": 1.02688, "grad_norm": 0.22947146647749891, "learning_rate": 3.866704277834049e-05, "loss": 0.4142, "loss_nan_ranks": 0, "loss_rank_avg": 0.11316105723381042, "step": 1070, "valid_targets_mean": 9858.5, "valid_targets_min": 2145 }, { "epoch": 1.03168, "grad_norm": 0.24700109955600275, "learning_rate": 3.864288790608573e-05, "loss": 0.4215, "loss_nan_ranks": 0, "loss_rank_avg": 0.16960284113883972, "step": 1075, "valid_targets_mean": 12659.7, "valid_targets_min": 3683 }, { "epoch": 1.03648, "grad_norm": 0.2935586573382416, "learning_rate": 3.861852381919132e-05, "loss": 0.4162, "loss_nan_ranks": 0, "loss_rank_avg": 0.12964990735054016, "step": 1080, "valid_targets_mean": 10707.2, "valid_targets_min": 1762 }, { "epoch": 1.04128, "grad_norm": 0.2292250396833103, "learning_rate": 3.8593950791076446e-05, "loss": 0.4173, "loss_nan_ranks": 0, "loss_rank_avg": 0.1273222416639328, "step": 1085, "valid_targets_mean": 10119.5, "valid_targets_min": 2996 }, { "epoch": 1.04608, "grad_norm": 0.23498404250581678, "learning_rate": 3.856916909750512e-05, "loss": 0.4237, "loss_nan_ranks": 0, "loss_rank_avg": 0.13587495684623718, "step": 1090, "valid_targets_mean": 9965.6, "valid_targets_min": 2608 }, { "epoch": 1.05088, "grad_norm": 0.2553523699964282, "learning_rate": 3.854417901658301e-05, "loss": 0.4144, "loss_nan_ranks": 0, "loss_rank_avg": 0.1318424940109253, "step": 1095, "valid_targets_mean": 8775.3, "valid_targets_min": 1827 }, { "epoch": 1.05568, "grad_norm": 0.28410804952434837, "learning_rate": 3.851898082875438e-05, "loss": 0.4127, "loss_nan_ranks": 0, "loss_rank_avg": 0.11669185757637024, "step": 1100, "valid_targets_mean": 9423.7, "valid_targets_min": 1411 }, { "epoch": 1.06048, "grad_norm": 0.21362583920709594, "learning_rate": 3.849357481679891e-05, "loss": 0.4175, "loss_nan_ranks": 0, "loss_rank_avg": 0.13717737793922424, "step": 1105, "valid_targets_mean": 11139.1, "valid_targets_min": 444 }, { "epoch": 1.06528, "grad_norm": 0.21752994977677992, "learning_rate": 3.846796126582851e-05, "loss": 0.4145, "loss_nan_ranks": 0, "loss_rank_avg": 0.13477230072021484, "step": 1110, "valid_targets_mean": 9537.8, "valid_targets_min": 1859 }, { "epoch": 1.07008, "grad_norm": 0.21257443662623238, "learning_rate": 3.844214046328416e-05, "loss": 0.4178, "loss_nan_ranks": 0, "loss_rank_avg": 0.14064884185791016, "step": 1115, "valid_targets_mean": 10565.9, "valid_targets_min": 1678 }, { "epoch": 1.07488, "grad_norm": 0.21862660809429926, "learning_rate": 3.841611269893266e-05, "loss": 0.4145, "loss_nan_ranks": 0, "loss_rank_avg": 0.1589120626449585, "step": 1120, "valid_targets_mean": 12369.5, "valid_targets_min": 2869 }, { "epoch": 1.07968, "grad_norm": 0.23792509429969855, "learning_rate": 3.8389878264863364e-05, "loss": 0.421, "loss_nan_ranks": 0, "loss_rank_avg": 0.15697196125984192, "step": 1125, "valid_targets_mean": 11654.8, "valid_targets_min": 2508 }, { "epoch": 1.08448, "grad_norm": 0.21339081246699299, "learning_rate": 3.836343745548495e-05, "loss": 0.4216, "loss_nan_ranks": 0, "loss_rank_avg": 0.14548815786838531, "step": 1130, "valid_targets_mean": 10870.5, "valid_targets_min": 1455 }, { "epoch": 1.08928, "grad_norm": 0.23060046636231427, "learning_rate": 3.833679056752205e-05, "loss": 0.4127, "loss_nan_ranks": 0, "loss_rank_avg": 0.1275004744529724, "step": 1135, "valid_targets_mean": 10123.6, "valid_targets_min": 1678 }, { "epoch": 1.09408, "grad_norm": 0.2636941558147357, "learning_rate": 3.8309937900012e-05, "loss": 0.4058, "loss_nan_ranks": 0, "loss_rank_avg": 0.12546730041503906, "step": 1140, "valid_targets_mean": 9488.0, "valid_targets_min": 3625 }, { "epoch": 1.09888, "grad_norm": 0.2915428207378038, "learning_rate": 3.8282879754301395e-05, "loss": 0.4152, "loss_nan_ranks": 0, "loss_rank_avg": 0.142788827419281, "step": 1145, "valid_targets_mean": 11112.1, "valid_targets_min": 1347 }, { "epoch": 1.10368, "grad_norm": 0.21952478308998585, "learning_rate": 3.825561643404277e-05, "loss": 0.4125, "loss_nan_ranks": 0, "loss_rank_avg": 0.1304585486650467, "step": 1150, "valid_targets_mean": 10049.1, "valid_targets_min": 2730 }, { "epoch": 1.10848, "grad_norm": 0.25038615090928107, "learning_rate": 3.8228148245191195e-05, "loss": 0.4078, "loss_nan_ranks": 0, "loss_rank_avg": 0.1327395886182785, "step": 1155, "valid_targets_mean": 10158.7, "valid_targets_min": 2185 }, { "epoch": 1.11328, "grad_norm": 0.23435295175638923, "learning_rate": 3.820047549600078e-05, "loss": 0.4206, "loss_nan_ranks": 0, "loss_rank_avg": 0.11310620605945587, "step": 1160, "valid_targets_mean": 8340.7, "valid_targets_min": 3053 }, { "epoch": 1.11808, "grad_norm": 0.29168324649773325, "learning_rate": 3.8172598497021304e-05, "loss": 0.4194, "loss_nan_ranks": 0, "loss_rank_avg": 0.13903772830963135, "step": 1165, "valid_targets_mean": 9254.2, "valid_targets_min": 2835 }, { "epoch": 1.12288, "grad_norm": 0.23637632288605004, "learning_rate": 3.8144517561094635e-05, "loss": 0.41, "loss_nan_ranks": 0, "loss_rank_avg": 0.12995116412639618, "step": 1170, "valid_targets_mean": 9100.4, "valid_targets_min": 1907 }, { "epoch": 1.12768, "grad_norm": 0.25218695892611065, "learning_rate": 3.811623300335129e-05, "loss": 0.4132, "loss_nan_ranks": 0, "loss_rank_avg": 0.14638108015060425, "step": 1175, "valid_targets_mean": 12772.2, "valid_targets_min": 1483 }, { "epoch": 1.13248, "grad_norm": 0.2230090673998303, "learning_rate": 3.808774514120689e-05, "loss": 0.4148, "loss_nan_ranks": 0, "loss_rank_avg": 0.12883812189102173, "step": 1180, "valid_targets_mean": 10551.2, "valid_targets_min": 3589 }, { "epoch": 1.13728, "grad_norm": 0.2309263447970177, "learning_rate": 3.805905429435856e-05, "loss": 0.4188, "loss_nan_ranks": 0, "loss_rank_avg": 0.13861598074436188, "step": 1185, "valid_targets_mean": 10784.2, "valid_targets_min": 1672 }, { "epoch": 1.14208, "grad_norm": 0.20154037362791907, "learning_rate": 3.803016078478137e-05, "loss": 0.4225, "loss_nan_ranks": 0, "loss_rank_avg": 0.13277360796928406, "step": 1190, "valid_targets_mean": 10616.0, "valid_targets_min": 2123 }, { "epoch": 1.14688, "grad_norm": 0.26637911945778125, "learning_rate": 3.800106493672472e-05, "loss": 0.4149, "loss_nan_ranks": 0, "loss_rank_avg": 0.1266065239906311, "step": 1195, "valid_targets_mean": 9035.4, "valid_targets_min": 1418 }, { "epoch": 1.15168, "grad_norm": 0.23840346583222496, "learning_rate": 3.7971767076708704e-05, "loss": 0.4139, "loss_nan_ranks": 0, "loss_rank_avg": 0.14263322949409485, "step": 1200, "valid_targets_mean": 10720.5, "valid_targets_min": 2768 }, { "epoch": 1.15648, "grad_norm": 0.2464513849806541, "learning_rate": 3.794226753352042e-05, "loss": 0.4169, "loss_nan_ranks": 0, "loss_rank_avg": 0.13991528749465942, "step": 1205, "valid_targets_mean": 9465.7, "valid_targets_min": 1860 }, { "epoch": 1.16128, "grad_norm": 0.23364677185568442, "learning_rate": 3.791256663821032e-05, "loss": 0.4252, "loss_nan_ranks": 0, "loss_rank_avg": 0.14799943566322327, "step": 1210, "valid_targets_mean": 10576.1, "valid_targets_min": 1972 }, { "epoch": 1.16608, "grad_norm": 0.2061601497448703, "learning_rate": 3.788266472408846e-05, "loss": 0.4202, "loss_nan_ranks": 0, "loss_rank_avg": 0.14230754971504211, "step": 1215, "valid_targets_mean": 11516.0, "valid_targets_min": 2542 }, { "epoch": 1.17088, "grad_norm": 0.25288643954396195, "learning_rate": 3.785256212672077e-05, "loss": 0.4244, "loss_nan_ranks": 0, "loss_rank_avg": 0.14614298939704895, "step": 1220, "valid_targets_mean": 10024.8, "valid_targets_min": 755 }, { "epoch": 1.17568, "grad_norm": 0.2397437276470604, "learning_rate": 3.7822259183925324e-05, "loss": 0.4195, "loss_nan_ranks": 0, "loss_rank_avg": 0.13796095550060272, "step": 1225, "valid_targets_mean": 9419.6, "valid_targets_min": 3489 }, { "epoch": 1.18048, "grad_norm": 0.20449254174295872, "learning_rate": 3.7791756235768476e-05, "loss": 0.4152, "loss_nan_ranks": 0, "loss_rank_avg": 0.13413485884666443, "step": 1230, "valid_targets_mean": 11258.3, "valid_targets_min": 1243 }, { "epoch": 1.1852800000000001, "grad_norm": 0.24344645692417433, "learning_rate": 3.7761053624561104e-05, "loss": 0.4119, "loss_nan_ranks": 0, "loss_rank_avg": 0.1314702332019806, "step": 1235, "valid_targets_mean": 8748.3, "valid_targets_min": 2184 }, { "epoch": 1.19008, "grad_norm": 0.20991725263743807, "learning_rate": 3.7730151694854757e-05, "loss": 0.4154, "loss_nan_ranks": 0, "loss_rank_avg": 0.14757773280143738, "step": 1240, "valid_targets_mean": 11077.1, "valid_targets_min": 3770 }, { "epoch": 1.19488, "grad_norm": 0.21767909667008972, "learning_rate": 3.769905079343777e-05, "loss": 0.4095, "loss_nan_ranks": 0, "loss_rank_avg": 0.1390220671892166, "step": 1245, "valid_targets_mean": 11480.1, "valid_targets_min": 2477 }, { "epoch": 1.19968, "grad_norm": 0.2257068986303116, "learning_rate": 3.766775126933138e-05, "loss": 0.4125, "loss_nan_ranks": 0, "loss_rank_avg": 0.14113309979438782, "step": 1250, "valid_targets_mean": 10721.3, "valid_targets_min": 3756 }, { "epoch": 1.20448, "grad_norm": 0.21009605592367017, "learning_rate": 3.7636253473785815e-05, "loss": 0.411, "loss_nan_ranks": 0, "loss_rank_avg": 0.13418659567832947, "step": 1255, "valid_targets_mean": 10695.7, "valid_targets_min": 1715 }, { "epoch": 1.20928, "grad_norm": 0.21016348721733408, "learning_rate": 3.760455776027636e-05, "loss": 0.4135, "loss_nan_ranks": 0, "loss_rank_avg": 0.13643574714660645, "step": 1260, "valid_targets_mean": 9691.2, "valid_targets_min": 2566 }, { "epoch": 1.21408, "grad_norm": 0.20524820111349146, "learning_rate": 3.7572664484499365e-05, "loss": 0.4163, "loss_nan_ranks": 0, "loss_rank_avg": 0.1784619688987732, "step": 1265, "valid_targets_mean": 13633.3, "valid_targets_min": 4476 }, { "epoch": 1.21888, "grad_norm": 0.21123899434747842, "learning_rate": 3.7540574004368264e-05, "loss": 0.4215, "loss_nan_ranks": 0, "loss_rank_avg": 0.1381276249885559, "step": 1270, "valid_targets_mean": 10542.8, "valid_targets_min": 929 }, { "epoch": 1.2236799999999999, "grad_norm": 0.21233244655622904, "learning_rate": 3.750828668000959e-05, "loss": 0.4131, "loss_nan_ranks": 0, "loss_rank_avg": 0.13086965680122375, "step": 1275, "valid_targets_mean": 10361.3, "valid_targets_min": 1469 }, { "epoch": 1.22848, "grad_norm": 0.2103899640818159, "learning_rate": 3.747580287375887e-05, "loss": 0.4176, "loss_nan_ranks": 0, "loss_rank_avg": 0.10956547409296036, "step": 1280, "valid_targets_mean": 8526.0, "valid_targets_min": 2046 }, { "epoch": 1.23328, "grad_norm": 0.21594844805715224, "learning_rate": 3.744312295015662e-05, "loss": 0.4115, "loss_nan_ranks": 0, "loss_rank_avg": 0.13053172826766968, "step": 1285, "valid_targets_mean": 9360.7, "valid_targets_min": 832 }, { "epoch": 1.23808, "grad_norm": 0.2109355374562815, "learning_rate": 3.7410247275944223e-05, "loss": 0.4142, "loss_nan_ranks": 0, "loss_rank_avg": 0.14856983721256256, "step": 1290, "valid_targets_mean": 11521.5, "valid_targets_min": 831 }, { "epoch": 1.24288, "grad_norm": 0.2243955319900153, "learning_rate": 3.737717622005981e-05, "loss": 0.4163, "loss_nan_ranks": 0, "loss_rank_avg": 0.14200091361999512, "step": 1295, "valid_targets_mean": 11954.9, "valid_targets_min": 1765 }, { "epoch": 1.24768, "grad_norm": 0.21861344610496983, "learning_rate": 3.734391015363413e-05, "loss": 0.4258, "loss_nan_ranks": 0, "loss_rank_avg": 0.13023564219474792, "step": 1300, "valid_targets_mean": 9402.0, "valid_targets_min": 1620 }, { "epoch": 1.25248, "grad_norm": 0.2048384270850224, "learning_rate": 3.7310449449986404e-05, "loss": 0.4174, "loss_nan_ranks": 0, "loss_rank_avg": 0.13601598143577576, "step": 1305, "valid_targets_mean": 9952.6, "valid_targets_min": 3102 }, { "epoch": 1.25728, "grad_norm": 0.22440521964428292, "learning_rate": 3.727679448462009e-05, "loss": 0.4108, "loss_nan_ranks": 0, "loss_rank_avg": 0.1419730931520462, "step": 1310, "valid_targets_mean": 9742.3, "valid_targets_min": 1035 }, { "epoch": 1.26208, "grad_norm": 0.20132327484258444, "learning_rate": 3.7242945635218696e-05, "loss": 0.4159, "loss_nan_ranks": 0, "loss_rank_avg": 0.16398459672927856, "step": 1315, "valid_targets_mean": 13264.6, "valid_targets_min": 3009 }, { "epoch": 1.26688, "grad_norm": 0.21742026246369942, "learning_rate": 3.720890328164156e-05, "loss": 0.4155, "loss_nan_ranks": 0, "loss_rank_avg": 0.13954755663871765, "step": 1320, "valid_targets_mean": 11703.3, "valid_targets_min": 2602 }, { "epoch": 1.27168, "grad_norm": 0.2232888027873828, "learning_rate": 3.717466780591956e-05, "loss": 0.4116, "loss_nan_ranks": 0, "loss_rank_avg": 0.14647075533866882, "step": 1325, "valid_targets_mean": 11269.9, "valid_targets_min": 2647 }, { "epoch": 1.27648, "grad_norm": 0.21225121412651402, "learning_rate": 3.7140239592250804e-05, "loss": 0.4165, "loss_nan_ranks": 0, "loss_rank_avg": 0.1489778608083725, "step": 1330, "valid_targets_mean": 11695.9, "valid_targets_min": 398 }, { "epoch": 1.28128, "grad_norm": 0.20279925882385536, "learning_rate": 3.71056190269964e-05, "loss": 0.4189, "loss_nan_ranks": 0, "loss_rank_avg": 0.15311786532402039, "step": 1335, "valid_targets_mean": 12422.6, "valid_targets_min": 2518 }, { "epoch": 1.2860800000000001, "grad_norm": 0.2005051063097678, "learning_rate": 3.7070806498676025e-05, "loss": 0.4183, "loss_nan_ranks": 0, "loss_rank_avg": 0.14334993064403534, "step": 1340, "valid_targets_mean": 11061.7, "valid_targets_min": 1411 }, { "epoch": 1.29088, "grad_norm": 0.21303853310340795, "learning_rate": 3.7035802397963625e-05, "loss": 0.4092, "loss_nan_ranks": 0, "loss_rank_avg": 0.11744124442338943, "step": 1345, "valid_targets_mean": 9264.0, "valid_targets_min": 3090 }, { "epoch": 1.29568, "grad_norm": 0.20486927969536597, "learning_rate": 3.700060711768302e-05, "loss": 0.4192, "loss_nan_ranks": 0, "loss_rank_avg": 0.14721707999706268, "step": 1350, "valid_targets_mean": 11086.1, "valid_targets_min": 3188 }, { "epoch": 1.30048, "grad_norm": 0.22248326527528745, "learning_rate": 3.696522105280348e-05, "loss": 0.422, "loss_nan_ranks": 0, "loss_rank_avg": 0.15628677606582642, "step": 1355, "valid_targets_mean": 11830.6, "valid_targets_min": 1827 }, { "epoch": 1.30528, "grad_norm": 0.2024567255287873, "learning_rate": 3.6929644600435303e-05, "loss": 0.4112, "loss_nan_ranks": 0, "loss_rank_avg": 0.11964519321918488, "step": 1360, "valid_targets_mean": 9261.3, "valid_targets_min": 2101 }, { "epoch": 1.3100800000000001, "grad_norm": 0.2386785505217334, "learning_rate": 3.689387815982536e-05, "loss": 0.4086, "loss_nan_ranks": 0, "loss_rank_avg": 0.1595247983932495, "step": 1365, "valid_targets_mean": 11489.6, "valid_targets_min": 1626 }, { "epoch": 1.31488, "grad_norm": 0.20397522674415516, "learning_rate": 3.6857922132352617e-05, "loss": 0.4222, "loss_nan_ranks": 0, "loss_rank_avg": 0.11339862644672394, "step": 1370, "valid_targets_mean": 10194.9, "valid_targets_min": 2049 }, { "epoch": 1.31968, "grad_norm": 0.21700887949212488, "learning_rate": 3.6821776921523615e-05, "loss": 0.4119, "loss_nan_ranks": 0, "loss_rank_avg": 0.13566583395004272, "step": 1375, "valid_targets_mean": 10100.3, "valid_targets_min": 2186 }, { "epoch": 1.3244799999999999, "grad_norm": 0.21424490251596093, "learning_rate": 3.678544293296797e-05, "loss": 0.4181, "loss_nan_ranks": 0, "loss_rank_avg": 0.13172942399978638, "step": 1380, "valid_targets_mean": 10231.2, "valid_targets_min": 1195 }, { "epoch": 1.32928, "grad_norm": 0.24557977923755359, "learning_rate": 3.674892057443378e-05, "loss": 0.4143, "loss_nan_ranks": 0, "loss_rank_avg": 0.15770123898983002, "step": 1385, "valid_targets_mean": 11602.1, "valid_targets_min": 2966 }, { "epoch": 1.33408, "grad_norm": 0.24185457949860034, "learning_rate": 3.671221025578309e-05, "loss": 0.4187, "loss_nan_ranks": 0, "loss_rank_avg": 0.14546245336532593, "step": 1390, "valid_targets_mean": 10557.9, "valid_targets_min": 1920 }, { "epoch": 1.33888, "grad_norm": 0.1999001199945465, "learning_rate": 3.6675312388987274e-05, "loss": 0.4198, "loss_nan_ranks": 0, "loss_rank_avg": 0.12263347208499908, "step": 1395, "valid_targets_mean": 10265.5, "valid_targets_min": 1258 }, { "epoch": 1.34368, "grad_norm": 0.2084056987805099, "learning_rate": 3.663822738812241e-05, "loss": 0.4124, "loss_nan_ranks": 0, "loss_rank_avg": 0.1537923514842987, "step": 1400, "valid_targets_mean": 12081.8, "valid_targets_min": 2073 }, { "epoch": 1.34848, "grad_norm": 0.2411579451936407, "learning_rate": 3.660095566936462e-05, "loss": 0.4164, "loss_nan_ranks": 0, "loss_rank_avg": 0.13250426948070526, "step": 1405, "valid_targets_mean": 10960.7, "valid_targets_min": 1195 }, { "epoch": 1.35328, "grad_norm": 0.229844139672178, "learning_rate": 3.656349765098546e-05, "loss": 0.3969, "loss_nan_ranks": 0, "loss_rank_avg": 0.10777662694454193, "step": 1410, "valid_targets_mean": 8199.8, "valid_targets_min": 1762 }, { "epoch": 1.35808, "grad_norm": 0.2087959755159777, "learning_rate": 3.652585375334714e-05, "loss": 0.4057, "loss_nan_ranks": 0, "loss_rank_avg": 0.17145152390003204, "step": 1415, "valid_targets_mean": 12745.7, "valid_targets_min": 1819 }, { "epoch": 1.36288, "grad_norm": 0.22405679106885293, "learning_rate": 3.648802439889785e-05, "loss": 0.4109, "loss_nan_ranks": 0, "loss_rank_avg": 0.1325543373823166, "step": 1420, "valid_targets_mean": 9900.9, "valid_targets_min": 1880 }, { "epoch": 1.36768, "grad_norm": 0.2691908667273548, "learning_rate": 3.645001001216705e-05, "loss": 0.4063, "loss_nan_ranks": 0, "loss_rank_avg": 0.11722728610038757, "step": 1425, "valid_targets_mean": 9083.3, "valid_targets_min": 1996 }, { "epoch": 1.37248, "grad_norm": 0.19573723387921657, "learning_rate": 3.641181101976065e-05, "loss": 0.4107, "loss_nan_ranks": 0, "loss_rank_avg": 0.11058799177408218, "step": 1430, "valid_targets_mean": 9659.8, "valid_targets_min": 1617 }, { "epoch": 1.37728, "grad_norm": 0.2134623022289432, "learning_rate": 3.637342785035624e-05, "loss": 0.4116, "loss_nan_ranks": 0, "loss_rank_avg": 0.15618430078029633, "step": 1435, "valid_targets_mean": 12706.1, "valid_targets_min": 1818 }, { "epoch": 1.38208, "grad_norm": 0.22397148122572136, "learning_rate": 3.633486093469829e-05, "loss": 0.4123, "loss_nan_ranks": 0, "loss_rank_avg": 0.12754711508750916, "step": 1440, "valid_targets_mean": 9612.8, "valid_targets_min": 2126 }, { "epoch": 1.3868800000000001, "grad_norm": 0.22201805653034568, "learning_rate": 3.629611070559333e-05, "loss": 0.4122, "loss_nan_ranks": 0, "loss_rank_avg": 0.17742006480693817, "step": 1445, "valid_targets_mean": 14002.2, "valid_targets_min": 3607 }, { "epoch": 1.39168, "grad_norm": 0.20713390355062825, "learning_rate": 3.625717759790506e-05, "loss": 0.4046, "loss_nan_ranks": 0, "loss_rank_avg": 0.13317152857780457, "step": 1450, "valid_targets_mean": 10315.7, "valid_targets_min": 2648 }, { "epoch": 1.39648, "grad_norm": 0.20581742916420195, "learning_rate": 3.621806204854947e-05, "loss": 0.4057, "loss_nan_ranks": 0, "loss_rank_avg": 0.12615267932415009, "step": 1455, "valid_targets_mean": 9761.5, "valid_targets_min": 2595 }, { "epoch": 1.40128, "grad_norm": 0.2253326544939486, "learning_rate": 3.617876449648998e-05, "loss": 0.4156, "loss_nan_ranks": 0, "loss_rank_avg": 0.13411745429039001, "step": 1460, "valid_targets_mean": 10907.1, "valid_targets_min": 1940 }, { "epoch": 1.40608, "grad_norm": 0.2158021375696706, "learning_rate": 3.613928538273247e-05, "loss": 0.4045, "loss_nan_ranks": 0, "loss_rank_avg": 0.15256470441818237, "step": 1465, "valid_targets_mean": 11172.7, "valid_targets_min": 2042 }, { "epoch": 1.4108800000000001, "grad_norm": 0.23215844714790715, "learning_rate": 3.609962515032034e-05, "loss": 0.4071, "loss_nan_ranks": 0, "loss_rank_avg": 0.13259349763393402, "step": 1470, "valid_targets_mean": 9956.5, "valid_targets_min": 1151 }, { "epoch": 1.41568, "grad_norm": 0.20191946885445114, "learning_rate": 3.605978424432954e-05, "loss": 0.4086, "loss_nan_ranks": 0, "loss_rank_avg": 0.14187245070934296, "step": 1475, "valid_targets_mean": 11490.5, "valid_targets_min": 2044 }, { "epoch": 1.42048, "grad_norm": 0.2129186932802564, "learning_rate": 3.601976311186361e-05, "loss": 0.4036, "loss_nan_ranks": 0, "loss_rank_avg": 0.15841859579086304, "step": 1480, "valid_targets_mean": 11375.0, "valid_targets_min": 2719 }, { "epoch": 1.4252799999999999, "grad_norm": 0.22986360631556008, "learning_rate": 3.597956220204861e-05, "loss": 0.4159, "loss_nan_ranks": 0, "loss_rank_avg": 0.14085061848163605, "step": 1485, "valid_targets_mean": 11803.7, "valid_targets_min": 2323 }, { "epoch": 1.43008, "grad_norm": 0.23033386303941059, "learning_rate": 3.5939181966028084e-05, "loss": 0.4136, "loss_nan_ranks": 0, "loss_rank_avg": 0.1093810647726059, "step": 1490, "valid_targets_mean": 8520.8, "valid_targets_min": 2352 }, { "epoch": 1.43488, "grad_norm": 0.22690875952678244, "learning_rate": 3.589862285695804e-05, "loss": 0.4072, "loss_nan_ranks": 0, "loss_rank_avg": 0.1403937041759491, "step": 1495, "valid_targets_mean": 10915.5, "valid_targets_min": 2952 }, { "epoch": 1.43968, "grad_norm": 0.20071387459694237, "learning_rate": 3.585788533000184e-05, "loss": 0.4044, "loss_nan_ranks": 0, "loss_rank_avg": 0.12689334154129028, "step": 1500, "valid_targets_mean": 10028.5, "valid_targets_min": 2214 }, { "epoch": 1.44448, "grad_norm": 0.23884170249895356, "learning_rate": 3.581696984232508e-05, "loss": 0.4005, "loss_nan_ranks": 0, "loss_rank_avg": 0.13245141506195068, "step": 1505, "valid_targets_mean": 10572.4, "valid_targets_min": 384 }, { "epoch": 1.44928, "grad_norm": 0.23906878983233132, "learning_rate": 3.5775876853090465e-05, "loss": 0.4137, "loss_nan_ranks": 0, "loss_rank_avg": 0.13135510683059692, "step": 1510, "valid_targets_mean": 10596.6, "valid_targets_min": 2137 }, { "epoch": 1.45408, "grad_norm": 0.21408874742248546, "learning_rate": 3.5734606823452686e-05, "loss": 0.4073, "loss_nan_ranks": 0, "loss_rank_avg": 0.15579737722873688, "step": 1515, "valid_targets_mean": 11520.9, "valid_targets_min": 1168 }, { "epoch": 1.45888, "grad_norm": 0.23082224637767995, "learning_rate": 3.569316021655319e-05, "loss": 0.4074, "loss_nan_ranks": 0, "loss_rank_avg": 0.12368214875459671, "step": 1520, "valid_targets_mean": 9717.6, "valid_targets_min": 3395 }, { "epoch": 1.46368, "grad_norm": 0.23974373684279676, "learning_rate": 3.565153749751505e-05, "loss": 0.3944, "loss_nan_ranks": 0, "loss_rank_avg": 0.1179773360490799, "step": 1525, "valid_targets_mean": 9593.9, "valid_targets_min": 1719 }, { "epoch": 1.46848, "grad_norm": 0.21789884302707357, "learning_rate": 3.5609739133437666e-05, "loss": 0.403, "loss_nan_ranks": 0, "loss_rank_avg": 0.14593097567558289, "step": 1530, "valid_targets_mean": 10919.9, "valid_targets_min": 3251 }, { "epoch": 1.47328, "grad_norm": 0.2684640365660121, "learning_rate": 3.55677655933916e-05, "loss": 0.4021, "loss_nan_ranks": 0, "loss_rank_avg": 0.12168829143047333, "step": 1535, "valid_targets_mean": 9522.3, "valid_targets_min": 724 }, { "epoch": 1.47808, "grad_norm": 0.21931539915256654, "learning_rate": 3.5525617348413265e-05, "loss": 0.4072, "loss_nan_ranks": 0, "loss_rank_avg": 0.12263620644807816, "step": 1540, "valid_targets_mean": 9469.0, "valid_targets_min": 1597 }, { "epoch": 1.48288, "grad_norm": 0.2263527046157457, "learning_rate": 3.5483294871499646e-05, "loss": 0.4099, "loss_nan_ranks": 0, "loss_rank_avg": 0.12820056080818176, "step": 1545, "valid_targets_mean": 9946.8, "valid_targets_min": 2444 }, { "epoch": 1.4876800000000001, "grad_norm": 0.2137941586747305, "learning_rate": 3.544079863760302e-05, "loss": 0.4034, "loss_nan_ranks": 0, "loss_rank_avg": 0.1168578639626503, "step": 1550, "valid_targets_mean": 8876.6, "valid_targets_min": 1681 }, { "epoch": 1.49248, "grad_norm": 0.22498503782561743, "learning_rate": 3.5398129123625565e-05, "loss": 0.4087, "loss_nan_ranks": 0, "loss_rank_avg": 0.163137748837471, "step": 1555, "valid_targets_mean": 11269.5, "valid_targets_min": 1604 }, { "epoch": 1.49728, "grad_norm": 0.2096852182318285, "learning_rate": 3.535528680841408e-05, "loss": 0.4012, "loss_nan_ranks": 0, "loss_rank_avg": 0.1431254893541336, "step": 1560, "valid_targets_mean": 10506.5, "valid_targets_min": 321 }, { "epoch": 1.5020799999999999, "grad_norm": 0.19907417765637198, "learning_rate": 3.5312272172754566e-05, "loss": 0.4059, "loss_nan_ranks": 0, "loss_rank_avg": 0.15149365365505219, "step": 1565, "valid_targets_mean": 12395.6, "valid_targets_min": 1800 }, { "epoch": 1.50688, "grad_norm": 0.21755973079142352, "learning_rate": 3.5269085699366844e-05, "loss": 0.4053, "loss_nan_ranks": 0, "loss_rank_avg": 0.1263016015291214, "step": 1570, "valid_targets_mean": 10658.8, "valid_targets_min": 2443 }, { "epoch": 1.5116800000000001, "grad_norm": 0.24303549201558827, "learning_rate": 3.5225727872899136e-05, "loss": 0.4114, "loss_nan_ranks": 0, "loss_rank_avg": 0.12606140971183777, "step": 1575, "valid_targets_mean": 9330.3, "valid_targets_min": 1058 }, { "epoch": 1.51648, "grad_norm": 0.2835144410727879, "learning_rate": 3.518219917992262e-05, "loss": 0.3976, "loss_nan_ranks": 0, "loss_rank_avg": 0.149481400847435, "step": 1580, "valid_targets_mean": 11042.7, "valid_targets_min": 1431 }, { "epoch": 1.52128, "grad_norm": 0.2441642529443939, "learning_rate": 3.5138500108926e-05, "loss": 0.4075, "loss_nan_ranks": 0, "loss_rank_avg": 0.14199629426002502, "step": 1585, "valid_targets_mean": 10971.2, "valid_targets_min": 2014 }, { "epoch": 1.5260799999999999, "grad_norm": 0.22227721700480615, "learning_rate": 3.509463115030995e-05, "loss": 0.3959, "loss_nan_ranks": 0, "loss_rank_avg": 0.14047616720199585, "step": 1590, "valid_targets_mean": 11059.1, "valid_targets_min": 2218 }, { "epoch": 1.53088, "grad_norm": 0.22052339326979958, "learning_rate": 3.505059279638172e-05, "loss": 0.4033, "loss_nan_ranks": 0, "loss_rank_avg": 0.12846125662326813, "step": 1595, "valid_targets_mean": 9715.1, "valid_targets_min": 2285 }, { "epoch": 1.5356800000000002, "grad_norm": 0.2194673984483837, "learning_rate": 3.500638554134952e-05, "loss": 0.4039, "loss_nan_ranks": 0, "loss_rank_avg": 0.10912424325942993, "step": 1600, "valid_targets_mean": 9214.8, "valid_targets_min": 1891 }, { "epoch": 1.54048, "grad_norm": 0.2177575764877966, "learning_rate": 3.4962009881317005e-05, "loss": 0.4029, "loss_nan_ranks": 0, "loss_rank_avg": 0.14358478784561157, "step": 1605, "valid_targets_mean": 11452.6, "valid_targets_min": 2380 }, { "epoch": 1.54528, "grad_norm": 0.22537318863877479, "learning_rate": 3.491746631427772e-05, "loss": 0.3994, "loss_nan_ranks": 0, "loss_rank_avg": 0.14550143480300903, "step": 1610, "valid_targets_mean": 10776.5, "valid_targets_min": 2025 }, { "epoch": 1.55008, "grad_norm": 0.22553034346150513, "learning_rate": 3.487275534010948e-05, "loss": 0.4053, "loss_nan_ranks": 0, "loss_rank_avg": 0.13195769488811493, "step": 1615, "valid_targets_mean": 9417.9, "valid_targets_min": 2104 }, { "epoch": 1.55488, "grad_norm": 0.2646860204126771, "learning_rate": 3.482787746056881e-05, "loss": 0.4013, "loss_nan_ranks": 0, "loss_rank_avg": 0.13002309203147888, "step": 1620, "valid_targets_mean": 9772.6, "valid_targets_min": 276 }, { "epoch": 1.55968, "grad_norm": 0.19817526014002387, "learning_rate": 3.4782833179285256e-05, "loss": 0.3959, "loss_nan_ranks": 0, "loss_rank_avg": 0.12554329633712769, "step": 1625, "valid_targets_mean": 10098.5, "valid_targets_min": 3998 }, { "epoch": 1.56448, "grad_norm": 0.23265845390648024, "learning_rate": 3.473762300175578e-05, "loss": 0.4055, "loss_nan_ranks": 0, "loss_rank_avg": 0.10745157301425934, "step": 1630, "valid_targets_mean": 8866.5, "valid_targets_min": 2414 }, { "epoch": 1.56928, "grad_norm": 0.21681894549050468, "learning_rate": 3.469224743533906e-05, "loss": 0.3997, "loss_nan_ranks": 0, "loss_rank_avg": 0.14574511349201202, "step": 1635, "valid_targets_mean": 10075.9, "valid_targets_min": 2725 }, { "epoch": 1.57408, "grad_norm": 0.21721065351913352, "learning_rate": 3.464670698924981e-05, "loss": 0.3959, "loss_nan_ranks": 0, "loss_rank_avg": 0.13828513026237488, "step": 1640, "valid_targets_mean": 10433.1, "valid_targets_min": 2115 }, { "epoch": 1.5788799999999998, "grad_norm": 0.2214508043669377, "learning_rate": 3.4601002174553055e-05, "loss": 0.3944, "loss_nan_ranks": 0, "loss_rank_avg": 0.12395211309194565, "step": 1645, "valid_targets_mean": 9867.7, "valid_targets_min": 2175 }, { "epoch": 1.58368, "grad_norm": 0.1976456316917021, "learning_rate": 3.45551335041584e-05, "loss": 0.3996, "loss_nan_ranks": 0, "loss_rank_avg": 0.1447567641735077, "step": 1650, "valid_targets_mean": 10812.8, "valid_targets_min": 1525 }, { "epoch": 1.5884800000000001, "grad_norm": 0.2150887282101477, "learning_rate": 3.4509101492814286e-05, "loss": 0.3936, "loss_nan_ranks": 0, "loss_rank_avg": 0.11536484211683273, "step": 1655, "valid_targets_mean": 8026.8, "valid_targets_min": 1294 }, { "epoch": 1.59328, "grad_norm": 0.2032204949161656, "learning_rate": 3.446290665710219e-05, "loss": 0.3986, "loss_nan_ranks": 0, "loss_rank_avg": 0.13227199018001556, "step": 1660, "valid_targets_mean": 10462.0, "valid_targets_min": 3347 }, { "epoch": 1.59808, "grad_norm": 0.21431437862340466, "learning_rate": 3.441654951543085e-05, "loss": 0.397, "loss_nan_ranks": 0, "loss_rank_avg": 0.12322622537612915, "step": 1665, "valid_targets_mean": 9954.2, "valid_targets_min": 2445 }, { "epoch": 1.6028799999999999, "grad_norm": 0.21808100784816117, "learning_rate": 3.4370030588030425e-05, "loss": 0.4059, "loss_nan_ranks": 0, "loss_rank_avg": 0.1262700855731964, "step": 1670, "valid_targets_mean": 9128.3, "valid_targets_min": 2970 }, { "epoch": 1.60768, "grad_norm": 0.22192127783593246, "learning_rate": 3.432335039694669e-05, "loss": 0.3985, "loss_nan_ranks": 0, "loss_rank_avg": 0.1360887736082077, "step": 1675, "valid_targets_mean": 10192.9, "valid_targets_min": 2388 }, { "epoch": 1.6124800000000001, "grad_norm": 0.2105589706564431, "learning_rate": 3.427650946603513e-05, "loss": 0.3968, "loss_nan_ranks": 0, "loss_rank_avg": 0.14164552092552185, "step": 1680, "valid_targets_mean": 11665.5, "valid_targets_min": 1873 }, { "epoch": 1.61728, "grad_norm": 0.20917890739253076, "learning_rate": 3.422950832095511e-05, "loss": 0.4013, "loss_nan_ranks": 0, "loss_rank_avg": 0.14686794579029083, "step": 1685, "valid_targets_mean": 11836.5, "valid_targets_min": 1526 }, { "epoch": 1.62208, "grad_norm": 0.218689384602607, "learning_rate": 3.418234748916395e-05, "loss": 0.3978, "loss_nan_ranks": 0, "loss_rank_avg": 0.15382401645183563, "step": 1690, "valid_targets_mean": 12671.2, "valid_targets_min": 3689 }, { "epoch": 1.6268799999999999, "grad_norm": 0.20427477458609572, "learning_rate": 3.4135027499911003e-05, "loss": 0.4039, "loss_nan_ranks": 0, "loss_rank_avg": 0.1121823638677597, "step": 1695, "valid_targets_mean": 8827.9, "valid_targets_min": 2336 }, { "epoch": 1.63168, "grad_norm": 0.25324102620237127, "learning_rate": 3.408754888423173e-05, "loss": 0.4016, "loss_nan_ranks": 0, "loss_rank_avg": 0.12924690544605255, "step": 1700, "valid_targets_mean": 9792.0, "valid_targets_min": 1363 }, { "epoch": 1.6364800000000002, "grad_norm": 0.23575060015918897, "learning_rate": 3.403991217494172e-05, "loss": 0.4062, "loss_nan_ranks": 0, "loss_rank_avg": 0.12108415365219116, "step": 1705, "valid_targets_mean": 9316.2, "valid_targets_min": 2950 }, { "epoch": 1.64128, "grad_norm": 0.19785865556687454, "learning_rate": 3.3992117906630744e-05, "loss": 0.4074, "loss_nan_ranks": 0, "loss_rank_avg": 0.1475123167037964, "step": 1710, "valid_targets_mean": 12372.2, "valid_targets_min": 2309 }, { "epoch": 1.64608, "grad_norm": 0.21415769305814603, "learning_rate": 3.394416661565671e-05, "loss": 0.3947, "loss_nan_ranks": 0, "loss_rank_avg": 0.11862894892692566, "step": 1715, "valid_targets_mean": 8912.2, "valid_targets_min": 1675 }, { "epoch": 1.65088, "grad_norm": 0.23826038703312183, "learning_rate": 3.389605884013969e-05, "loss": 0.4033, "loss_nan_ranks": 0, "loss_rank_avg": 0.1426897943019867, "step": 1720, "valid_targets_mean": 10804.0, "valid_targets_min": 2234 }, { "epoch": 1.65568, "grad_norm": 0.24170373795005826, "learning_rate": 3.384779511995587e-05, "loss": 0.4011, "loss_nan_ranks": 0, "loss_rank_avg": 0.13612665235996246, "step": 1725, "valid_targets_mean": 10696.4, "valid_targets_min": 1778 }, { "epoch": 1.66048, "grad_norm": 0.23931550486897354, "learning_rate": 3.379937599673144e-05, "loss": 0.3985, "loss_nan_ranks": 0, "loss_rank_avg": 0.12457090616226196, "step": 1730, "valid_targets_mean": 9632.0, "valid_targets_min": 2851 }, { "epoch": 1.66528, "grad_norm": 0.2061576914555314, "learning_rate": 3.3750802013836596e-05, "loss": 0.4053, "loss_nan_ranks": 0, "loss_rank_avg": 0.11049826443195343, "step": 1735, "valid_targets_mean": 8703.4, "valid_targets_min": 2022 }, { "epoch": 1.67008, "grad_norm": 0.21374204056001617, "learning_rate": 3.370207371637939e-05, "loss": 0.4011, "loss_nan_ranks": 0, "loss_rank_avg": 0.15568511188030243, "step": 1740, "valid_targets_mean": 11633.8, "valid_targets_min": 3684 }, { "epoch": 1.67488, "grad_norm": 0.21337916221726186, "learning_rate": 3.3653191651199635e-05, "loss": 0.4064, "loss_nan_ranks": 0, "loss_rank_avg": 0.15145465731620789, "step": 1745, "valid_targets_mean": 10421.4, "valid_targets_min": 2316 }, { "epoch": 1.6796799999999998, "grad_norm": 0.23004226232229372, "learning_rate": 3.360415636686274e-05, "loss": 0.4024, "loss_nan_ranks": 0, "loss_rank_avg": 0.12970012426376343, "step": 1750, "valid_targets_mean": 9696.3, "valid_targets_min": 2038 }, { "epoch": 1.68448, "grad_norm": 0.20561270288874453, "learning_rate": 3.355496841365359e-05, "loss": 0.3912, "loss_nan_ranks": 0, "loss_rank_avg": 0.12068414688110352, "step": 1755, "valid_targets_mean": 9217.6, "valid_targets_min": 3244 }, { "epoch": 1.6892800000000001, "grad_norm": 0.22563271293316586, "learning_rate": 3.350562834357034e-05, "loss": 0.3937, "loss_nan_ranks": 0, "loss_rank_avg": 0.14101052284240723, "step": 1760, "valid_targets_mean": 10387.0, "valid_targets_min": 3548 }, { "epoch": 1.69408, "grad_norm": 0.24142812450638393, "learning_rate": 3.345613671031827e-05, "loss": 0.3953, "loss_nan_ranks": 0, "loss_rank_avg": 0.13549157977104187, "step": 1765, "valid_targets_mean": 10715.5, "valid_targets_min": 2714 }, { "epoch": 1.69888, "grad_norm": 0.21228849973724254, "learning_rate": 3.340649406930349e-05, "loss": 0.3953, "loss_nan_ranks": 0, "loss_rank_avg": 0.12110074609518051, "step": 1770, "valid_targets_mean": 11074.2, "valid_targets_min": 1359 }, { "epoch": 1.7036799999999999, "grad_norm": 0.2156200959319992, "learning_rate": 3.335670097762677e-05, "loss": 0.3992, "loss_nan_ranks": 0, "loss_rank_avg": 0.1143205314874649, "step": 1775, "valid_targets_mean": 9483.5, "valid_targets_min": 1606 }, { "epoch": 1.70848, "grad_norm": 0.23246732383901142, "learning_rate": 3.330675799407728e-05, "loss": 0.3956, "loss_nan_ranks": 0, "loss_rank_avg": 0.13464942574501038, "step": 1780, "valid_targets_mean": 11230.7, "valid_targets_min": 1710 }, { "epoch": 1.7132800000000001, "grad_norm": 0.22253356811827898, "learning_rate": 3.32566656791263e-05, "loss": 0.3986, "loss_nan_ranks": 0, "loss_rank_avg": 0.12669792771339417, "step": 1785, "valid_targets_mean": 10284.6, "valid_targets_min": 2270 }, { "epoch": 1.71808, "grad_norm": 0.20486126933947996, "learning_rate": 3.320642459492095e-05, "loss": 0.3929, "loss_nan_ranks": 0, "loss_rank_avg": 0.12168687582015991, "step": 1790, "valid_targets_mean": 9668.6, "valid_targets_min": 1877 }, { "epoch": 1.72288, "grad_norm": 0.2502018008883989, "learning_rate": 3.315603530527785e-05, "loss": 0.3987, "loss_nan_ranks": 0, "loss_rank_avg": 0.13025622069835663, "step": 1795, "valid_targets_mean": 10071.4, "valid_targets_min": 1291 }, { "epoch": 1.7276799999999999, "grad_norm": 0.22100999377103495, "learning_rate": 3.310549837567685e-05, "loss": 0.4005, "loss_nan_ranks": 0, "loss_rank_avg": 0.13234061002731323, "step": 1800, "valid_targets_mean": 10166.8, "valid_targets_min": 1177 }, { "epoch": 1.73248, "grad_norm": 0.2129959699349399, "learning_rate": 3.3054814373254615e-05, "loss": 0.3973, "loss_nan_ranks": 0, "loss_rank_avg": 0.1542513072490692, "step": 1805, "valid_targets_mean": 10941.1, "valid_targets_min": 2436 }, { "epoch": 1.7372800000000002, "grad_norm": 0.20978747808047463, "learning_rate": 3.300398386679831e-05, "loss": 0.3999, "loss_nan_ranks": 0, "loss_rank_avg": 0.1411202847957611, "step": 1810, "valid_targets_mean": 11338.0, "valid_targets_min": 2897 }, { "epoch": 1.74208, "grad_norm": 0.21485236379949604, "learning_rate": 3.2953007426739204e-05, "loss": 0.3985, "loss_nan_ranks": 0, "loss_rank_avg": 0.13011616468429565, "step": 1815, "valid_targets_mean": 9627.8, "valid_targets_min": 2142 }, { "epoch": 1.74688, "grad_norm": 0.20840933175004347, "learning_rate": 3.290188562514624e-05, "loss": 0.3981, "loss_nan_ranks": 0, "loss_rank_avg": 0.1490216851234436, "step": 1820, "valid_targets_mean": 11321.6, "valid_targets_min": 2398 }, { "epoch": 1.75168, "grad_norm": 0.20026765690303727, "learning_rate": 3.285061903571968e-05, "loss": 0.3957, "loss_nan_ranks": 0, "loss_rank_avg": 0.13110694289207458, "step": 1825, "valid_targets_mean": 9812.0, "valid_targets_min": 2429 }, { "epoch": 1.75648, "grad_norm": 0.2292840920686858, "learning_rate": 3.27992082337846e-05, "loss": 0.4033, "loss_nan_ranks": 0, "loss_rank_avg": 0.15019527077674866, "step": 1830, "valid_targets_mean": 11044.8, "valid_targets_min": 2095 }, { "epoch": 1.76128, "grad_norm": 0.22099436299927055, "learning_rate": 3.274765379628447e-05, "loss": 0.4065, "loss_nan_ranks": 0, "loss_rank_avg": 0.14847183227539062, "step": 1835, "valid_targets_mean": 11189.2, "valid_targets_min": 1796 }, { "epoch": 1.76608, "grad_norm": 0.20320537061481944, "learning_rate": 3.2695956301774664e-05, "loss": 0.3973, "loss_nan_ranks": 0, "loss_rank_avg": 0.13340553641319275, "step": 1840, "valid_targets_mean": 10326.3, "valid_targets_min": 1462 }, { "epoch": 1.77088, "grad_norm": 0.21167489305289328, "learning_rate": 3.264411633041598e-05, "loss": 0.3987, "loss_nan_ranks": 0, "loss_rank_avg": 0.1621175855398178, "step": 1845, "valid_targets_mean": 11443.7, "valid_targets_min": 1542 }, { "epoch": 1.77568, "grad_norm": 0.2186721440660899, "learning_rate": 3.259213446396812e-05, "loss": 0.3917, "loss_nan_ranks": 0, "loss_rank_avg": 0.1408073753118515, "step": 1850, "valid_targets_mean": 11004.1, "valid_targets_min": 497 }, { "epoch": 1.7804799999999998, "grad_norm": 0.2163856042786629, "learning_rate": 3.254001128578317e-05, "loss": 0.391, "loss_nan_ranks": 0, "loss_rank_avg": 0.1433507800102234, "step": 1855, "valid_targets_mean": 11132.0, "valid_targets_min": 3359 }, { "epoch": 1.78528, "grad_norm": 0.20279384664468394, "learning_rate": 3.2487747380799036e-05, "loss": 0.3979, "loss_nan_ranks": 0, "loss_rank_avg": 0.10963033139705658, "step": 1860, "valid_targets_mean": 8810.3, "valid_targets_min": 2143 }, { "epoch": 1.7900800000000001, "grad_norm": 0.20087820022966488, "learning_rate": 3.243534333553291e-05, "loss": 0.3956, "loss_nan_ranks": 0, "loss_rank_avg": 0.11881513893604279, "step": 1865, "valid_targets_mean": 11328.5, "valid_targets_min": 2388 }, { "epoch": 1.79488, "grad_norm": 0.21398495522011107, "learning_rate": 3.2382799738074635e-05, "loss": 0.3989, "loss_nan_ranks": 0, "loss_rank_avg": 0.14420190453529358, "step": 1870, "valid_targets_mean": 10098.8, "valid_targets_min": 2226 }, { "epoch": 1.79968, "grad_norm": 0.2164572857663917, "learning_rate": 3.2330117178080184e-05, "loss": 0.3961, "loss_nan_ranks": 0, "loss_rank_avg": 0.12767937779426575, "step": 1875, "valid_targets_mean": 9393.9, "valid_targets_min": 2123 }, { "epoch": 1.8044799999999999, "grad_norm": 0.30012965010498455, "learning_rate": 3.227729624676497e-05, "loss": 0.3918, "loss_nan_ranks": 0, "loss_rank_avg": 0.11639062315225601, "step": 1880, "valid_targets_mean": 9530.6, "valid_targets_min": 1401 }, { "epoch": 1.80928, "grad_norm": 0.24176122916815607, "learning_rate": 3.222433753689724e-05, "loss": 0.4003, "loss_nan_ranks": 0, "loss_rank_avg": 0.15518411993980408, "step": 1885, "valid_targets_mean": 10808.2, "valid_targets_min": 1017 }, { "epoch": 1.8140800000000001, "grad_norm": 0.22436718375518214, "learning_rate": 3.2171241642791443e-05, "loss": 0.3946, "loss_nan_ranks": 0, "loss_rank_avg": 0.14497432112693787, "step": 1890, "valid_targets_mean": 11211.7, "valid_targets_min": 1983 }, { "epoch": 1.81888, "grad_norm": 0.23787343944723544, "learning_rate": 3.211800916030152e-05, "loss": 0.3912, "loss_nan_ranks": 0, "loss_rank_avg": 0.1524227112531662, "step": 1895, "valid_targets_mean": 11464.1, "valid_targets_min": 2878 }, { "epoch": 1.82368, "grad_norm": 0.2572060361202662, "learning_rate": 3.206464068681424e-05, "loss": 0.3937, "loss_nan_ranks": 0, "loss_rank_avg": 0.12020900100469589, "step": 1900, "valid_targets_mean": 9636.8, "valid_targets_min": 2548 }, { "epoch": 1.8284799999999999, "grad_norm": 0.21078383512361049, "learning_rate": 3.20111368212425e-05, "loss": 0.3968, "loss_nan_ranks": 0, "loss_rank_avg": 0.11897289752960205, "step": 1905, "valid_targets_mean": 11681.4, "valid_targets_min": 3107 }, { "epoch": 1.83328, "grad_norm": 0.20294316150292713, "learning_rate": 3.19574981640186e-05, "loss": 0.3959, "loss_nan_ranks": 0, "loss_rank_avg": 0.14064642786979675, "step": 1910, "valid_targets_mean": 11299.5, "valid_targets_min": 2709 }, { "epoch": 1.8380800000000002, "grad_norm": 0.18972454533577332, "learning_rate": 3.1903725317087495e-05, "loss": 0.3939, "loss_nan_ranks": 0, "loss_rank_avg": 0.13221979141235352, "step": 1915, "valid_targets_mean": 11891.0, "valid_targets_min": 3651 }, { "epoch": 1.84288, "grad_norm": 0.18943681153553424, "learning_rate": 3.184981888390003e-05, "loss": 0.3957, "loss_nan_ranks": 0, "loss_rank_avg": 0.13814029097557068, "step": 1920, "valid_targets_mean": 11726.5, "valid_targets_min": 2799 }, { "epoch": 1.84768, "grad_norm": 0.20435272678520974, "learning_rate": 3.1795779469406226e-05, "loss": 0.3935, "loss_nan_ranks": 0, "loss_rank_avg": 0.13576734066009521, "step": 1925, "valid_targets_mean": 12009.9, "valid_targets_min": 2840 }, { "epoch": 1.85248, "grad_norm": 0.22181511371074905, "learning_rate": 3.174160768004842e-05, "loss": 0.3921, "loss_nan_ranks": 0, "loss_rank_avg": 0.10999979078769684, "step": 1930, "valid_targets_mean": 8584.6, "valid_targets_min": 1345 }, { "epoch": 1.85728, "grad_norm": 0.20259428439496813, "learning_rate": 3.168730412375449e-05, "loss": 0.3995, "loss_nan_ranks": 0, "loss_rank_avg": 0.14881809055805206, "step": 1935, "valid_targets_mean": 11891.6, "valid_targets_min": 1747 }, { "epoch": 1.86208, "grad_norm": 0.20820724171847152, "learning_rate": 3.1632869409931036e-05, "loss": 0.4036, "loss_nan_ranks": 0, "loss_rank_avg": 0.12483834475278854, "step": 1940, "valid_targets_mean": 10321.6, "valid_targets_min": 2655 }, { "epoch": 1.86688, "grad_norm": 0.2273426621166987, "learning_rate": 3.1578304149456544e-05, "loss": 0.3928, "loss_nan_ranks": 0, "loss_rank_avg": 0.1542552411556244, "step": 1945, "valid_targets_mean": 13354.8, "valid_targets_min": 2049 }, { "epoch": 1.87168, "grad_norm": 0.22508915131462948, "learning_rate": 3.1523608954674524e-05, "loss": 0.3969, "loss_nan_ranks": 0, "loss_rank_avg": 0.14855341613292694, "step": 1950, "valid_targets_mean": 9999.3, "valid_targets_min": 1416 }, { "epoch": 1.87648, "grad_norm": 0.21601715129994264, "learning_rate": 3.1468784439386614e-05, "loss": 0.4013, "loss_nan_ranks": 0, "loss_rank_avg": 0.1591084599494934, "step": 1955, "valid_targets_mean": 11878.5, "valid_targets_min": 719 }, { "epoch": 1.8812799999999998, "grad_norm": 0.23007947368682746, "learning_rate": 3.141383121884576e-05, "loss": 0.3955, "loss_nan_ranks": 0, "loss_rank_avg": 0.12612038850784302, "step": 1960, "valid_targets_mean": 10162.7, "valid_targets_min": 1562 }, { "epoch": 1.88608, "grad_norm": 0.23316297834483646, "learning_rate": 3.1358749909749214e-05, "loss": 0.3952, "loss_nan_ranks": 0, "loss_rank_avg": 0.11835485696792603, "step": 1965, "valid_targets_mean": 9112.8, "valid_targets_min": 2014 }, { "epoch": 1.8908800000000001, "grad_norm": 0.2114115011904651, "learning_rate": 3.1303541130231703e-05, "loss": 0.3911, "loss_nan_ranks": 0, "loss_rank_avg": 0.13895109295845032, "step": 1970, "valid_targets_mean": 11622.1, "valid_targets_min": 1624 }, { "epoch": 1.89568, "grad_norm": 0.22891961421868048, "learning_rate": 3.1248205499858446e-05, "loss": 0.3998, "loss_nan_ranks": 0, "loss_rank_avg": 0.1330220252275467, "step": 1975, "valid_targets_mean": 11612.4, "valid_targets_min": 3255 }, { "epoch": 1.90048, "grad_norm": 0.19639013400517918, "learning_rate": 3.119274363961821e-05, "loss": 0.3964, "loss_nan_ranks": 0, "loss_rank_avg": 0.11368654668331146, "step": 1980, "valid_targets_mean": 10622.1, "valid_targets_min": 1229 }, { "epoch": 1.9052799999999999, "grad_norm": 0.21344525100358355, "learning_rate": 3.113715617191634e-05, "loss": 0.3965, "loss_nan_ranks": 0, "loss_rank_avg": 0.15114393830299377, "step": 1985, "valid_targets_mean": 12539.8, "valid_targets_min": 1786 }, { "epoch": 1.91008, "grad_norm": 0.20445368901845684, "learning_rate": 3.1081443720567785e-05, "loss": 0.3953, "loss_nan_ranks": 0, "loss_rank_avg": 0.15004891157150269, "step": 1990, "valid_targets_mean": 11998.1, "valid_targets_min": 3386 }, { "epoch": 1.9148800000000001, "grad_norm": 0.19929437058584107, "learning_rate": 3.102560691079007e-05, "loss": 0.3915, "loss_nan_ranks": 0, "loss_rank_avg": 0.14125114679336548, "step": 1995, "valid_targets_mean": 9776.0, "valid_targets_min": 3376 }, { "epoch": 1.91968, "grad_norm": 0.22575168479848515, "learning_rate": 3.0969646369196307e-05, "loss": 0.3937, "loss_nan_ranks": 0, "loss_rank_avg": 0.13779957592487335, "step": 2000, "valid_targets_mean": 10278.4, "valid_targets_min": 2325 }, { "epoch": 1.92448, "grad_norm": 0.20409262515285168, "learning_rate": 3.0913562723788174e-05, "loss": 0.3942, "loss_nan_ranks": 0, "loss_rank_avg": 0.1357709765434265, "step": 2005, "valid_targets_mean": 10191.1, "valid_targets_min": 1573 }, { "epoch": 1.9292799999999999, "grad_norm": 0.2352276816410141, "learning_rate": 3.085735660394881e-05, "loss": 0.3905, "loss_nan_ranks": 0, "loss_rank_avg": 0.13631772994995117, "step": 2010, "valid_targets_mean": 10502.3, "valid_targets_min": 322 }, { "epoch": 1.93408, "grad_norm": 0.2109305064204127, "learning_rate": 3.080102864043581e-05, "loss": 0.3884, "loss_nan_ranks": 0, "loss_rank_avg": 0.137748584151268, "step": 2015, "valid_targets_mean": 10613.8, "valid_targets_min": 3961 }, { "epoch": 1.9388800000000002, "grad_norm": 0.2136610461341701, "learning_rate": 3.074457946537413e-05, "loss": 0.3881, "loss_nan_ranks": 0, "loss_rank_avg": 0.09953026473522186, "step": 2020, "valid_targets_mean": 8608.3, "valid_targets_min": 2488 }, { "epoch": 1.94368, "grad_norm": 0.20513829600366332, "learning_rate": 3.068800971224898e-05, "loss": 0.3874, "loss_nan_ranks": 0, "loss_rank_avg": 0.13289940357208252, "step": 2025, "valid_targets_mean": 9401.7, "valid_targets_min": 1490 }, { "epoch": 1.94848, "grad_norm": 0.20197105825927517, "learning_rate": 3.0631320015898735e-05, "loss": 0.3915, "loss_nan_ranks": 0, "loss_rank_avg": 0.12039284408092499, "step": 2030, "valid_targets_mean": 10141.2, "valid_targets_min": 3005 }, { "epoch": 1.95328, "grad_norm": 0.20795752182412858, "learning_rate": 3.057451101250778e-05, "loss": 0.3926, "loss_nan_ranks": 0, "loss_rank_avg": 0.12851007282733917, "step": 2035, "valid_targets_mean": 9688.7, "valid_targets_min": 1591 }, { "epoch": 1.95808, "grad_norm": 0.21314778698152376, "learning_rate": 3.051758333959941e-05, "loss": 0.3962, "loss_nan_ranks": 0, "loss_rank_avg": 0.13587504625320435, "step": 2040, "valid_targets_mean": 9627.9, "valid_targets_min": 2228 }, { "epoch": 1.96288, "grad_norm": 0.20482304692000647, "learning_rate": 3.046053763602865e-05, "loss": 0.3932, "loss_nan_ranks": 0, "loss_rank_avg": 0.12451982498168945, "step": 2045, "valid_targets_mean": 10732.7, "valid_targets_min": 1660 }, { "epoch": 1.96768, "grad_norm": 0.22387606059097612, "learning_rate": 3.0403374541975078e-05, "loss": 0.3872, "loss_nan_ranks": 0, "loss_rank_avg": 0.13428357243537903, "step": 2050, "valid_targets_mean": 10365.8, "valid_targets_min": 2933 }, { "epoch": 1.97248, "grad_norm": 0.1998358036134206, "learning_rate": 3.034609469893567e-05, "loss": 0.3946, "loss_nan_ranks": 0, "loss_rank_avg": 0.11720042675733566, "step": 2055, "valid_targets_mean": 9579.6, "valid_targets_min": 1590 }, { "epoch": 1.97728, "grad_norm": 0.19831729145649243, "learning_rate": 3.028869874971758e-05, "loss": 0.3948, "loss_nan_ranks": 0, "loss_rank_avg": 0.12150508165359497, "step": 2060, "valid_targets_mean": 9771.9, "valid_targets_min": 1538 }, { "epoch": 1.9820799999999998, "grad_norm": 0.21459891896364366, "learning_rate": 3.0231187338430944e-05, "loss": 0.3881, "loss_nan_ranks": 0, "loss_rank_avg": 0.12095307558774948, "step": 2065, "valid_targets_mean": 8782.9, "valid_targets_min": 1729 }, { "epoch": 1.98688, "grad_norm": 0.21508972922553282, "learning_rate": 3.0173561110481606e-05, "loss": 0.3944, "loss_nan_ranks": 0, "loss_rank_avg": 0.142621248960495, "step": 2070, "valid_targets_mean": 11738.8, "valid_targets_min": 2939 }, { "epoch": 1.9916800000000001, "grad_norm": 0.2374644700039593, "learning_rate": 3.011582071256394e-05, "loss": 0.3939, "loss_nan_ranks": 0, "loss_rank_avg": 0.13136368989944458, "step": 2075, "valid_targets_mean": 9781.7, "valid_targets_min": 1517 }, { "epoch": 1.99648, "grad_norm": 0.22812721698709595, "learning_rate": 3.0057966792653547e-05, "loss": 0.3918, "loss_nan_ranks": 0, "loss_rank_avg": 0.16073977947235107, "step": 2080, "valid_targets_mean": 11632.2, "valid_targets_min": 1621 }, { "epoch": 2.00096, "grad_norm": 0.23520090782122327, "learning_rate": 3.0000000000000004e-05, "loss": 0.3982, "loss_nan_ranks": 0, "loss_rank_avg": 0.1233157068490982, "step": 2085, "valid_targets_mean": 9876.7, "valid_targets_min": 1508 }, { "epoch": 2.00576, "grad_norm": 0.2216631791006346, "learning_rate": 2.9941920985119562e-05, "loss": 0.391, "loss_nan_ranks": 0, "loss_rank_avg": 0.13492241501808167, "step": 2090, "valid_targets_mean": 10056.4, "valid_targets_min": 1290 }, { "epoch": 2.01056, "grad_norm": 0.2400982673308614, "learning_rate": 2.988373039978786e-05, "loss": 0.3832, "loss_nan_ranks": 0, "loss_rank_avg": 0.1363467276096344, "step": 2095, "valid_targets_mean": 11063.2, "valid_targets_min": 3770 }, { "epoch": 2.01536, "grad_norm": 0.23156897134336338, "learning_rate": 2.98254288970326e-05, "loss": 0.3775, "loss_nan_ranks": 0, "loss_rank_avg": 0.09604047238826752, "step": 2100, "valid_targets_mean": 7552.9, "valid_targets_min": 2284 }, { "epoch": 2.02016, "grad_norm": 0.20724384057820167, "learning_rate": 2.9767017131126245e-05, "loss": 0.3916, "loss_nan_ranks": 0, "loss_rank_avg": 0.10275719314813614, "step": 2105, "valid_targets_mean": 9190.3, "valid_targets_min": 1996 }, { "epoch": 2.02496, "grad_norm": 0.1961879146915268, "learning_rate": 2.9708495757578633e-05, "loss": 0.3818, "loss_nan_ranks": 0, "loss_rank_avg": 0.14239154756069183, "step": 2110, "valid_targets_mean": 11486.5, "valid_targets_min": 1604 }, { "epoch": 2.02976, "grad_norm": 0.2151407272702704, "learning_rate": 2.964986543312964e-05, "loss": 0.3796, "loss_nan_ranks": 0, "loss_rank_avg": 0.1200903132557869, "step": 2115, "valid_targets_mean": 9579.2, "valid_targets_min": 1869 }, { "epoch": 2.03456, "grad_norm": 0.19765475611331146, "learning_rate": 2.9591126815741832e-05, "loss": 0.38, "loss_nan_ranks": 0, "loss_rank_avg": 0.10982204973697662, "step": 2120, "valid_targets_mean": 9895.5, "valid_targets_min": 1146 }, { "epoch": 2.03936, "grad_norm": 0.2308073882459791, "learning_rate": 2.953228056459305e-05, "loss": 0.3831, "loss_nan_ranks": 0, "loss_rank_avg": 0.13495692610740662, "step": 2125, "valid_targets_mean": 11730.5, "valid_targets_min": 3230 }, { "epoch": 2.04416, "grad_norm": 0.2210810128406193, "learning_rate": 2.947332734006903e-05, "loss": 0.3846, "loss_nan_ranks": 0, "loss_rank_avg": 0.141627237200737, "step": 2130, "valid_targets_mean": 11017.2, "valid_targets_min": 3168 }, { "epoch": 2.04896, "grad_norm": 0.22292894896010498, "learning_rate": 2.9414267803755988e-05, "loss": 0.3744, "loss_nan_ranks": 0, "loss_rank_avg": 0.1303427368402481, "step": 2135, "valid_targets_mean": 10870.1, "valid_targets_min": 1314 }, { "epoch": 2.05376, "grad_norm": 0.21603225038870696, "learning_rate": 2.9355102618433197e-05, "loss": 0.3821, "loss_nan_ranks": 0, "loss_rank_avg": 0.12586045265197754, "step": 2140, "valid_targets_mean": 9648.2, "valid_targets_min": 1780 }, { "epoch": 2.05856, "grad_norm": 0.19143697649106933, "learning_rate": 2.929583244806553e-05, "loss": 0.3827, "loss_nan_ranks": 0, "loss_rank_avg": 0.11953039467334747, "step": 2145, "valid_targets_mean": 10312.8, "valid_targets_min": 1286 }, { "epoch": 2.06336, "grad_norm": 0.1926989550668403, "learning_rate": 2.9236457957796047e-05, "loss": 0.3949, "loss_nan_ranks": 0, "loss_rank_avg": 0.1427406370639801, "step": 2150, "valid_targets_mean": 12204.4, "valid_targets_min": 3038 }, { "epoch": 2.0681599999999998, "grad_norm": 0.20349926888856612, "learning_rate": 2.9176979813938494e-05, "loss": 0.3828, "loss_nan_ranks": 0, "loss_rank_avg": 0.13766226172447205, "step": 2155, "valid_targets_mean": 11886.8, "valid_targets_min": 1810 }, { "epoch": 2.07296, "grad_norm": 0.20794478653140658, "learning_rate": 2.9117398683969857e-05, "loss": 0.3849, "loss_nan_ranks": 0, "loss_rank_avg": 0.1351398229598999, "step": 2160, "valid_targets_mean": 11531.9, "valid_targets_min": 929 }, { "epoch": 2.07776, "grad_norm": 0.19642909203052808, "learning_rate": 2.9057715236522833e-05, "loss": 0.3783, "loss_nan_ranks": 0, "loss_rank_avg": 0.13603469729423523, "step": 2165, "valid_targets_mean": 10830.4, "valid_targets_min": 1968 }, { "epoch": 2.08256, "grad_norm": 0.1924151874734592, "learning_rate": 2.899793014137836e-05, "loss": 0.3846, "loss_nan_ranks": 0, "loss_rank_avg": 0.12676164507865906, "step": 2170, "valid_targets_mean": 10274.2, "valid_targets_min": 1836 }, { "epoch": 2.08736, "grad_norm": 0.20744477541749562, "learning_rate": 2.8938044069458094e-05, "loss": 0.3768, "loss_nan_ranks": 0, "loss_rank_avg": 0.1298026740550995, "step": 2175, "valid_targets_mean": 10860.8, "valid_targets_min": 1674 }, { "epoch": 2.09216, "grad_norm": 0.21185656425668636, "learning_rate": 2.8878057692816877e-05, "loss": 0.3895, "loss_nan_ranks": 0, "loss_rank_avg": 0.13175363838672638, "step": 2180, "valid_targets_mean": 11086.3, "valid_targets_min": 2251 }, { "epoch": 2.09696, "grad_norm": 0.2012977437878008, "learning_rate": 2.8817971684635178e-05, "loss": 0.3836, "loss_nan_ranks": 0, "loss_rank_avg": 0.10911810398101807, "step": 2185, "valid_targets_mean": 9224.0, "valid_targets_min": 1876 }, { "epoch": 2.10176, "grad_norm": 0.20119464174885665, "learning_rate": 2.8757786719211555e-05, "loss": 0.3822, "loss_nan_ranks": 0, "loss_rank_avg": 0.12016467750072479, "step": 2190, "valid_targets_mean": 9766.5, "valid_targets_min": 2315 }, { "epoch": 2.10656, "grad_norm": 0.2103441930729234, "learning_rate": 2.8697503471955106e-05, "loss": 0.3733, "loss_nan_ranks": 0, "loss_rank_avg": 0.10794928669929504, "step": 2195, "valid_targets_mean": 9752.1, "valid_targets_min": 1734 }, { "epoch": 2.11136, "grad_norm": 0.1973128218861176, "learning_rate": 2.8637122619377848e-05, "loss": 0.3805, "loss_nan_ranks": 0, "loss_rank_avg": 0.13639453053474426, "step": 2200, "valid_targets_mean": 10859.4, "valid_targets_min": 374 }, { "epoch": 2.11616, "grad_norm": 0.21955743114852744, "learning_rate": 2.8576644839087152e-05, "loss": 0.3812, "loss_nan_ranks": 0, "loss_rank_avg": 0.13809733092784882, "step": 2205, "valid_targets_mean": 9867.9, "valid_targets_min": 1767 }, { "epoch": 2.12096, "grad_norm": 0.2068750644897939, "learning_rate": 2.8516070809778145e-05, "loss": 0.3814, "loss_nan_ranks": 0, "loss_rank_avg": 0.10828588157892227, "step": 2210, "valid_targets_mean": 10207.7, "valid_targets_min": 2529 }, { "epoch": 2.12576, "grad_norm": 0.20719191927343455, "learning_rate": 2.845540121122607e-05, "loss": 0.385, "loss_nan_ranks": 0, "loss_rank_avg": 0.12375476211309433, "step": 2215, "valid_targets_mean": 10426.1, "valid_targets_min": 1358 }, { "epoch": 2.13056, "grad_norm": 0.2039973480587662, "learning_rate": 2.839463672427867e-05, "loss": 0.3835, "loss_nan_ranks": 0, "loss_rank_avg": 0.1495930552482605, "step": 2220, "valid_targets_mean": 11969.6, "valid_targets_min": 2805 }, { "epoch": 2.13536, "grad_norm": 0.18986775376722906, "learning_rate": 2.833377803084855e-05, "loss": 0.3856, "loss_nan_ranks": 0, "loss_rank_avg": 0.12233369052410126, "step": 2225, "valid_targets_mean": 11053.6, "valid_targets_min": 3083 }, { "epoch": 2.14016, "grad_norm": 0.2278637593281419, "learning_rate": 2.8272825813905522e-05, "loss": 0.3819, "loss_nan_ranks": 0, "loss_rank_avg": 0.1278565227985382, "step": 2230, "valid_targets_mean": 10910.4, "valid_targets_min": 3721 }, { "epoch": 2.14496, "grad_norm": 0.20280471378821244, "learning_rate": 2.8211780757468942e-05, "loss": 0.3809, "loss_nan_ranks": 0, "loss_rank_avg": 0.12041682004928589, "step": 2235, "valid_targets_mean": 10993.0, "valid_targets_min": 2153 }, { "epoch": 2.14976, "grad_norm": 0.19991212575067607, "learning_rate": 2.8150643546600012e-05, "loss": 0.3782, "loss_nan_ranks": 0, "loss_rank_avg": 0.11163853108882904, "step": 2240, "valid_targets_mean": 9899.4, "valid_targets_min": 1843 }, { "epoch": 2.15456, "grad_norm": 0.2632475734932872, "learning_rate": 2.808941486739414e-05, "loss": 0.3811, "loss_nan_ranks": 0, "loss_rank_avg": 0.13694193959236145, "step": 2245, "valid_targets_mean": 11136.0, "valid_targets_min": 2839 }, { "epoch": 2.15936, "grad_norm": 0.21727180359137785, "learning_rate": 2.80280954069732e-05, "loss": 0.3854, "loss_nan_ranks": 0, "loss_rank_avg": 0.11582939326763153, "step": 2250, "valid_targets_mean": 8610.1, "valid_targets_min": 2262 }, { "epoch": 2.16416, "grad_norm": 0.22481090765530318, "learning_rate": 2.7966685853477828e-05, "loss": 0.3782, "loss_nan_ranks": 0, "loss_rank_avg": 0.12704181671142578, "step": 2255, "valid_targets_mean": 10174.8, "valid_targets_min": 2123 }, { "epoch": 2.16896, "grad_norm": 0.19369274940731798, "learning_rate": 2.790518689605971e-05, "loss": 0.3842, "loss_nan_ranks": 0, "loss_rank_avg": 0.12195196747779846, "step": 2260, "valid_targets_mean": 10902.6, "valid_targets_min": 2382 }, { "epoch": 2.17376, "grad_norm": 0.19672184157117886, "learning_rate": 2.7843599224873833e-05, "loss": 0.3836, "loss_nan_ranks": 0, "loss_rank_avg": 0.1163254827260971, "step": 2265, "valid_targets_mean": 9992.1, "valid_targets_min": 2825 }, { "epoch": 2.17856, "grad_norm": 0.19723613015471497, "learning_rate": 2.7781923531070775e-05, "loss": 0.3809, "loss_nan_ranks": 0, "loss_rank_avg": 0.11363483965396881, "step": 2270, "valid_targets_mean": 9348.0, "valid_targets_min": 2631 }, { "epoch": 2.18336, "grad_norm": 0.2116943766512944, "learning_rate": 2.7720160506788896e-05, "loss": 0.3781, "loss_nan_ranks": 0, "loss_rank_avg": 0.11357665807008743, "step": 2275, "valid_targets_mean": 9558.6, "valid_targets_min": 1989 }, { "epoch": 2.18816, "grad_norm": 0.20054780631886765, "learning_rate": 2.7658310845146598e-05, "loss": 0.3808, "loss_nan_ranks": 0, "loss_rank_avg": 0.13914844393730164, "step": 2280, "valid_targets_mean": 11377.4, "valid_targets_min": 4677 }, { "epoch": 2.19296, "grad_norm": 0.22068280866813472, "learning_rate": 2.7596375240234574e-05, "loss": 0.3746, "loss_nan_ranks": 0, "loss_rank_avg": 0.12389899790287018, "step": 2285, "valid_targets_mean": 10821.3, "valid_targets_min": 2024 }, { "epoch": 2.19776, "grad_norm": 0.18781808934850716, "learning_rate": 2.7534354387107975e-05, "loss": 0.3762, "loss_nan_ranks": 0, "loss_rank_avg": 0.11634353548288345, "step": 2290, "valid_targets_mean": 10232.5, "valid_targets_min": 2110 }, { "epoch": 2.20256, "grad_norm": 0.2010597215182537, "learning_rate": 2.747224898177862e-05, "loss": 0.3889, "loss_nan_ranks": 0, "loss_rank_avg": 0.12369689345359802, "step": 2295, "valid_targets_mean": 9952.7, "valid_targets_min": 1838 }, { "epoch": 2.20736, "grad_norm": 0.21868349840227744, "learning_rate": 2.7410059721207187e-05, "loss": 0.3768, "loss_nan_ranks": 0, "loss_rank_avg": 0.11973851174116135, "step": 2300, "valid_targets_mean": 9082.8, "valid_targets_min": 2068 }, { "epoch": 2.21216, "grad_norm": 0.20931814759974568, "learning_rate": 2.734778730329543e-05, "loss": 0.3826, "loss_nan_ranks": 0, "loss_rank_avg": 0.11982230842113495, "step": 2305, "valid_targets_mean": 9954.4, "valid_targets_min": 1498 }, { "epoch": 2.21696, "grad_norm": 0.23696165400189556, "learning_rate": 2.7285432426878275e-05, "loss": 0.3806, "loss_nan_ranks": 0, "loss_rank_avg": 0.12035034596920013, "step": 2310, "valid_targets_mean": 10853.3, "valid_targets_min": 1405 }, { "epoch": 2.22176, "grad_norm": 0.19598291857765024, "learning_rate": 2.7222995791716034e-05, "loss": 0.3816, "loss_nan_ranks": 0, "loss_rank_avg": 0.14030274748802185, "step": 2315, "valid_targets_mean": 11407.2, "valid_targets_min": 1318 }, { "epoch": 2.22656, "grad_norm": 0.21215296796191113, "learning_rate": 2.716047809848653e-05, "loss": 0.3775, "loss_nan_ranks": 0, "loss_rank_avg": 0.13955843448638916, "step": 2320, "valid_targets_mean": 10772.2, "valid_targets_min": 1950 }, { "epoch": 2.23136, "grad_norm": 0.18886797079153328, "learning_rate": 2.7097880048777238e-05, "loss": 0.3865, "loss_nan_ranks": 0, "loss_rank_avg": 0.12690003216266632, "step": 2325, "valid_targets_mean": 10627.6, "valid_targets_min": 2055 }, { "epoch": 2.23616, "grad_norm": 0.19135950944457367, "learning_rate": 2.703520234507742e-05, "loss": 0.3762, "loss_nan_ranks": 0, "loss_rank_avg": 0.1010352373123169, "step": 2330, "valid_targets_mean": 9337.2, "valid_targets_min": 1811 }, { "epoch": 2.24096, "grad_norm": 0.2055854776241585, "learning_rate": 2.697244569077021e-05, "loss": 0.374, "loss_nan_ranks": 0, "loss_rank_avg": 0.13945433497428894, "step": 2335, "valid_targets_mean": 10882.8, "valid_targets_min": 2564 }, { "epoch": 2.24576, "grad_norm": 0.190056204731367, "learning_rate": 2.6909610790124772e-05, "loss": 0.3735, "loss_nan_ranks": 0, "loss_rank_avg": 0.11307604610919952, "step": 2340, "valid_targets_mean": 9797.4, "valid_targets_min": 2176 }, { "epoch": 2.25056, "grad_norm": 0.19722871848427742, "learning_rate": 2.684669834828835e-05, "loss": 0.3751, "loss_nan_ranks": 0, "loss_rank_avg": 0.11232331395149231, "step": 2345, "valid_targets_mean": 10427.9, "valid_targets_min": 1359 }, { "epoch": 2.25536, "grad_norm": 0.20080194987727418, "learning_rate": 2.6783709071278372e-05, "loss": 0.3808, "loss_nan_ranks": 0, "loss_rank_avg": 0.1365032196044922, "step": 2350, "valid_targets_mean": 10621.3, "valid_targets_min": 1238 }, { "epoch": 2.26016, "grad_norm": 0.19001922126213333, "learning_rate": 2.6720643665974522e-05, "loss": 0.3845, "loss_nan_ranks": 0, "loss_rank_avg": 0.12681028246879578, "step": 2355, "valid_targets_mean": 9610.5, "valid_targets_min": 1365 }, { "epoch": 2.26496, "grad_norm": 0.19450897157350197, "learning_rate": 2.665750284011085e-05, "loss": 0.3767, "loss_nan_ranks": 0, "loss_rank_avg": 0.10528913885354996, "step": 2360, "valid_targets_mean": 8842.7, "valid_targets_min": 1482 }, { "epoch": 2.2697599999999998, "grad_norm": 0.20499479594100586, "learning_rate": 2.6594287302267744e-05, "loss": 0.3815, "loss_nan_ranks": 0, "loss_rank_avg": 0.11198015511035919, "step": 2365, "valid_targets_mean": 8527.8, "valid_targets_min": 1726 }, { "epoch": 2.27456, "grad_norm": 0.21729149125673355, "learning_rate": 2.653099776186405e-05, "loss": 0.3853, "loss_nan_ranks": 0, "loss_rank_avg": 0.11937613785266876, "step": 2370, "valid_targets_mean": 10422.3, "valid_targets_min": 2676 }, { "epoch": 2.27936, "grad_norm": 0.23936814043935242, "learning_rate": 2.646763492914908e-05, "loss": 0.3803, "loss_nan_ranks": 0, "loss_rank_avg": 0.1370958685874939, "step": 2375, "valid_targets_mean": 11603.8, "valid_targets_min": 2639 }, { "epoch": 2.28416, "grad_norm": 0.226255238554012, "learning_rate": 2.640419951519467e-05, "loss": 0.3843, "loss_nan_ranks": 0, "loss_rank_avg": 0.13546521961688995, "step": 2380, "valid_targets_mean": 10853.2, "valid_targets_min": 2467 }, { "epoch": 2.28896, "grad_norm": 0.21000459214162845, "learning_rate": 2.634069223188715e-05, "loss": 0.3763, "loss_nan_ranks": 0, "loss_rank_avg": 0.1364605724811554, "step": 2385, "valid_targets_mean": 10490.6, "valid_targets_min": 3184 }, { "epoch": 2.29376, "grad_norm": 0.21053819505844917, "learning_rate": 2.627711379191939e-05, "loss": 0.3796, "loss_nan_ranks": 0, "loss_rank_avg": 0.13308705389499664, "step": 2390, "valid_targets_mean": 10670.0, "valid_targets_min": 2594 }, { "epoch": 2.29856, "grad_norm": 0.1968976461253721, "learning_rate": 2.621346490878281e-05, "loss": 0.3815, "loss_nan_ranks": 0, "loss_rank_avg": 0.12212714552879333, "step": 2395, "valid_targets_mean": 9727.0, "valid_targets_min": 1864 }, { "epoch": 2.30336, "grad_norm": 0.20200418718795113, "learning_rate": 2.614974629675935e-05, "loss": 0.3859, "loss_nan_ranks": 0, "loss_rank_avg": 0.13653194904327393, "step": 2400, "valid_targets_mean": 10758.1, "valid_targets_min": 3469 }, { "epoch": 2.30816, "grad_norm": 0.2133100603107007, "learning_rate": 2.608595867091346e-05, "loss": 0.3715, "loss_nan_ranks": 0, "loss_rank_avg": 0.12559379637241364, "step": 2405, "valid_targets_mean": 10498.1, "valid_targets_min": 1046 }, { "epoch": 2.31296, "grad_norm": 0.2033345530571247, "learning_rate": 2.6022102747084084e-05, "loss": 0.3815, "loss_nan_ranks": 0, "loss_rank_avg": 0.1133851408958435, "step": 2410, "valid_targets_mean": 8877.1, "valid_targets_min": 1354 }, { "epoch": 2.31776, "grad_norm": 0.2152577606604185, "learning_rate": 2.595817924187663e-05, "loss": 0.3734, "loss_nan_ranks": 0, "loss_rank_avg": 0.1213955357670784, "step": 2415, "valid_targets_mean": 10695.1, "valid_targets_min": 3535 }, { "epoch": 2.32256, "grad_norm": 0.22398470485476252, "learning_rate": 2.589418887265489e-05, "loss": 0.3748, "loss_nan_ranks": 0, "loss_rank_avg": 0.11093949526548386, "step": 2420, "valid_targets_mean": 9716.8, "valid_targets_min": 2130 }, { "epoch": 2.32736, "grad_norm": 0.1980562737542359, "learning_rate": 2.5830132357533044e-05, "loss": 0.3764, "loss_nan_ranks": 0, "loss_rank_avg": 0.12728214263916016, "step": 2425, "valid_targets_mean": 10986.3, "valid_targets_min": 2171 }, { "epoch": 2.33216, "grad_norm": 0.22230894654473113, "learning_rate": 2.5766010415367567e-05, "loss": 0.3865, "loss_nan_ranks": 0, "loss_rank_avg": 0.11757129430770874, "step": 2430, "valid_targets_mean": 10236.9, "valid_targets_min": 1959 }, { "epoch": 2.33696, "grad_norm": 0.20767824848398078, "learning_rate": 2.5701823765749187e-05, "loss": 0.3733, "loss_nan_ranks": 0, "loss_rank_avg": 0.10535033047199249, "step": 2435, "valid_targets_mean": 10114.5, "valid_targets_min": 3175 }, { "epoch": 2.34176, "grad_norm": 0.20058624194170693, "learning_rate": 2.563757312899477e-05, "loss": 0.3757, "loss_nan_ranks": 0, "loss_rank_avg": 0.11982904374599457, "step": 2440, "valid_targets_mean": 9704.2, "valid_targets_min": 1319 }, { "epoch": 2.34656, "grad_norm": 0.21452305848338077, "learning_rate": 2.557325922613926e-05, "loss": 0.3742, "loss_nan_ranks": 0, "loss_rank_avg": 0.136878103017807, "step": 2445, "valid_targets_mean": 11417.2, "valid_targets_min": 4316 }, { "epoch": 2.35136, "grad_norm": 0.20622376969404346, "learning_rate": 2.5508882778927615e-05, "loss": 0.3659, "loss_nan_ranks": 0, "loss_rank_avg": 0.09706181287765503, "step": 2450, "valid_targets_mean": 9376.6, "valid_targets_min": 2567 }, { "epoch": 2.35616, "grad_norm": 0.2269780856123984, "learning_rate": 2.5444444509806654e-05, "loss": 0.3619, "loss_nan_ranks": 0, "loss_rank_avg": 0.10020601749420166, "step": 2455, "valid_targets_mean": 8076.2, "valid_targets_min": 2098 }, { "epoch": 2.36096, "grad_norm": 0.20946019964551488, "learning_rate": 2.5379945141916976e-05, "loss": 0.3733, "loss_nan_ranks": 0, "loss_rank_avg": 0.09800328314304352, "step": 2460, "valid_targets_mean": 8551.6, "valid_targets_min": 1660 }, { "epoch": 2.36576, "grad_norm": 0.2008350967896554, "learning_rate": 2.531538539908486e-05, "loss": 0.3679, "loss_nan_ranks": 0, "loss_rank_avg": 0.12654729187488556, "step": 2465, "valid_targets_mean": 10316.7, "valid_targets_min": 1557 }, { "epoch": 2.3705600000000002, "grad_norm": 0.2229363972372055, "learning_rate": 2.5250766005814108e-05, "loss": 0.3686, "loss_nan_ranks": 0, "loss_rank_avg": 0.12344948947429657, "step": 2470, "valid_targets_mean": 10335.5, "valid_targets_min": 2896 }, { "epoch": 2.37536, "grad_norm": 0.21842342622258043, "learning_rate": 2.5186087687277956e-05, "loss": 0.373, "loss_nan_ranks": 0, "loss_rank_avg": 0.11907872557640076, "step": 2475, "valid_targets_mean": 10898.4, "valid_targets_min": 2757 }, { "epoch": 2.38016, "grad_norm": 0.21743760724252226, "learning_rate": 2.5121351169310887e-05, "loss": 0.3763, "loss_nan_ranks": 0, "loss_rank_avg": 0.14003226161003113, "step": 2480, "valid_targets_mean": 11164.4, "valid_targets_min": 2369 }, { "epoch": 2.38496, "grad_norm": 0.254434215027223, "learning_rate": 2.505655717840052e-05, "loss": 0.3738, "loss_nan_ranks": 0, "loss_rank_avg": 0.13954034447669983, "step": 2485, "valid_targets_mean": 11127.9, "valid_targets_min": 2012 }, { "epoch": 2.38976, "grad_norm": 0.23856981677013078, "learning_rate": 2.499170644167946e-05, "loss": 0.3703, "loss_nan_ranks": 0, "loss_rank_avg": 0.11923474073410034, "step": 2490, "valid_targets_mean": 9402.1, "valid_targets_min": 2200 }, { "epoch": 2.3945600000000002, "grad_norm": 0.2042522121463096, "learning_rate": 2.49267996869171e-05, "loss": 0.3666, "loss_nan_ranks": 0, "loss_rank_avg": 0.12613581120967865, "step": 2495, "valid_targets_mean": 11327.1, "valid_targets_min": 2319 }, { "epoch": 2.39936, "grad_norm": 0.2169067842374301, "learning_rate": 2.486183764251151e-05, "loss": 0.376, "loss_nan_ranks": 0, "loss_rank_avg": 0.11283647269010544, "step": 2500, "valid_targets_mean": 10245.0, "valid_targets_min": 316 }, { "epoch": 2.40416, "grad_norm": 0.20640537266510697, "learning_rate": 2.4796821037481215e-05, "loss": 0.3689, "loss_nan_ranks": 0, "loss_rank_avg": 0.11287974566221237, "step": 2505, "valid_targets_mean": 8545.9, "valid_targets_min": 1182 }, { "epoch": 2.40896, "grad_norm": 0.2142294699914048, "learning_rate": 2.473175060145703e-05, "loss": 0.3627, "loss_nan_ranks": 0, "loss_rank_avg": 0.11034555733203888, "step": 2510, "valid_targets_mean": 8637.3, "valid_targets_min": 2107 }, { "epoch": 2.41376, "grad_norm": 0.20836784046085266, "learning_rate": 2.4666627064673892e-05, "loss": 0.3766, "loss_nan_ranks": 0, "loss_rank_avg": 0.12005623430013657, "step": 2515, "valid_targets_mean": 10009.1, "valid_targets_min": 2183 }, { "epoch": 2.41856, "grad_norm": 0.21472818748145794, "learning_rate": 2.4601451157962616e-05, "loss": 0.3703, "loss_nan_ranks": 0, "loss_rank_avg": 0.1286231279373169, "step": 2520, "valid_targets_mean": 11829.6, "valid_targets_min": 3279 }, { "epoch": 2.42336, "grad_norm": 0.20869745151391522, "learning_rate": 2.4536223612741754e-05, "loss": 0.3701, "loss_nan_ranks": 0, "loss_rank_avg": 0.12529705464839935, "step": 2525, "valid_targets_mean": 10626.5, "valid_targets_min": 279 }, { "epoch": 2.42816, "grad_norm": 0.19164417929518518, "learning_rate": 2.447094516100934e-05, "loss": 0.3838, "loss_nan_ranks": 0, "loss_rank_avg": 0.1397651880979538, "step": 2530, "valid_targets_mean": 12536.2, "valid_targets_min": 1225 }, { "epoch": 2.43296, "grad_norm": 0.2036217280117751, "learning_rate": 2.4405616535334695e-05, "loss": 0.3671, "loss_nan_ranks": 0, "loss_rank_avg": 0.12778422236442566, "step": 2535, "valid_targets_mean": 11081.4, "valid_targets_min": 2051 }, { "epoch": 2.43776, "grad_norm": 0.2061723618850725, "learning_rate": 2.43402384688502e-05, "loss": 0.3669, "loss_nan_ranks": 0, "loss_rank_avg": 0.1277051866054535, "step": 2540, "valid_targets_mean": 11323.4, "valid_targets_min": 2471 }, { "epoch": 2.44256, "grad_norm": 0.19889048966025744, "learning_rate": 2.4274811695243085e-05, "loss": 0.3601, "loss_nan_ranks": 0, "loss_rank_avg": 0.11608883738517761, "step": 2545, "valid_targets_mean": 9306.0, "valid_targets_min": 2322 }, { "epoch": 2.4473599999999998, "grad_norm": 0.24626904970503338, "learning_rate": 2.4209336948747168e-05, "loss": 0.3759, "loss_nan_ranks": 0, "loss_rank_avg": 0.12030565738677979, "step": 2550, "valid_targets_mean": 11547.6, "valid_targets_min": 1259 }, { "epoch": 2.45216, "grad_norm": 0.2306461738859341, "learning_rate": 2.414381496413464e-05, "loss": 0.3813, "loss_nan_ranks": 0, "loss_rank_avg": 0.10795653611421585, "step": 2555, "valid_targets_mean": 9398.9, "valid_targets_min": 1431 }, { "epoch": 2.45696, "grad_norm": 0.2080435328672805, "learning_rate": 2.4078246476707793e-05, "loss": 0.3675, "loss_nan_ranks": 0, "loss_rank_avg": 0.12084488570690155, "step": 2560, "valid_targets_mean": 12174.3, "valid_targets_min": 3205 }, { "epoch": 2.46176, "grad_norm": 0.2061173208068871, "learning_rate": 2.4012632222290802e-05, "loss": 0.3625, "loss_nan_ranks": 0, "loss_rank_avg": 0.12514223158359528, "step": 2565, "valid_targets_mean": 9897.4, "valid_targets_min": 1837 }, { "epoch": 2.46656, "grad_norm": 0.20556503982483745, "learning_rate": 2.3946972937221444e-05, "loss": 0.36, "loss_nan_ranks": 0, "loss_rank_avg": 0.11990512907505035, "step": 2570, "valid_targets_mean": 9661.3, "valid_targets_min": 1838 }, { "epoch": 2.47136, "grad_norm": 0.19615449425752077, "learning_rate": 2.3881269358342828e-05, "loss": 0.3701, "loss_nan_ranks": 0, "loss_rank_avg": 0.1309790462255478, "step": 2575, "valid_targets_mean": 12405.8, "valid_targets_min": 3413 }, { "epoch": 2.47616, "grad_norm": 0.20553075982273802, "learning_rate": 2.3815522222995158e-05, "loss": 0.3682, "loss_nan_ranks": 0, "loss_rank_avg": 0.1276824176311493, "step": 2580, "valid_targets_mean": 10941.6, "valid_targets_min": 2899 }, { "epoch": 2.48096, "grad_norm": 0.20756905659976432, "learning_rate": 2.3749732269007427e-05, "loss": 0.371, "loss_nan_ranks": 0, "loss_rank_avg": 0.13721966743469238, "step": 2585, "valid_targets_mean": 11002.2, "valid_targets_min": 3037 }, { "epoch": 2.48576, "grad_norm": 0.2089986855086161, "learning_rate": 2.3683900234689142e-05, "loss": 0.3719, "loss_nan_ranks": 0, "loss_rank_avg": 0.10542646795511246, "step": 2590, "valid_targets_mean": 9137.1, "valid_targets_min": 453 }, { "epoch": 2.49056, "grad_norm": 0.19975431503444246, "learning_rate": 2.3618026858822054e-05, "loss": 0.3645, "loss_nan_ranks": 0, "loss_rank_avg": 0.14532935619354248, "step": 2595, "valid_targets_mean": 11967.5, "valid_targets_min": 2433 }, { "epoch": 2.49536, "grad_norm": 0.20669335366995573, "learning_rate": 2.355211288065187e-05, "loss": 0.3674, "loss_nan_ranks": 0, "loss_rank_avg": 0.12231142818927765, "step": 2600, "valid_targets_mean": 10766.8, "valid_targets_min": 2512 }, { "epoch": 2.50016, "grad_norm": 0.20403508545321805, "learning_rate": 2.348615903987991e-05, "loss": 0.362, "loss_nan_ranks": 0, "loss_rank_avg": 0.11272934824228287, "step": 2605, "valid_targets_mean": 9697.4, "valid_targets_min": 906 }, { "epoch": 2.50496, "grad_norm": 0.19991166546341962, "learning_rate": 2.3420166076654873e-05, "loss": 0.3682, "loss_nan_ranks": 0, "loss_rank_avg": 0.11372819542884827, "step": 2610, "valid_targets_mean": 9772.1, "valid_targets_min": 1562 }, { "epoch": 2.50976, "grad_norm": 0.21927831366966014, "learning_rate": 2.335413473156449e-05, "loss": 0.3752, "loss_nan_ranks": 0, "loss_rank_avg": 0.11094687879085541, "step": 2615, "valid_targets_mean": 9214.7, "valid_targets_min": 1582 }, { "epoch": 2.51456, "grad_norm": 0.2055659911333355, "learning_rate": 2.328806574562722e-05, "loss": 0.3653, "loss_nan_ranks": 0, "loss_rank_avg": 0.1251363754272461, "step": 2620, "valid_targets_mean": 10513.7, "valid_targets_min": 2205 }, { "epoch": 2.51936, "grad_norm": 0.2025013690361369, "learning_rate": 2.322195986028393e-05, "loss": 0.374, "loss_nan_ranks": 0, "loss_rank_avg": 0.13312791287899017, "step": 2625, "valid_targets_mean": 9986.3, "valid_targets_min": 1383 }, { "epoch": 2.52416, "grad_norm": 0.19390979413109546, "learning_rate": 2.315581781738959e-05, "loss": 0.3608, "loss_nan_ranks": 0, "loss_rank_avg": 0.10706675052642822, "step": 2630, "valid_targets_mean": 10572.9, "valid_targets_min": 3387 }, { "epoch": 2.52896, "grad_norm": 0.21748660946987688, "learning_rate": 2.3089640359204937e-05, "loss": 0.3659, "loss_nan_ranks": 0, "loss_rank_avg": 0.12551315128803253, "step": 2635, "valid_targets_mean": 10573.0, "valid_targets_min": 2608 }, { "epoch": 2.53376, "grad_norm": 0.19552172792861605, "learning_rate": 2.3023428228388144e-05, "loss": 0.3645, "loss_nan_ranks": 0, "loss_rank_avg": 0.11490911990404129, "step": 2640, "valid_targets_mean": 9536.7, "valid_targets_min": 1710 }, { "epoch": 2.53856, "grad_norm": 0.2141206136144874, "learning_rate": 2.2957182167986486e-05, "loss": 0.3696, "loss_nan_ranks": 0, "loss_rank_avg": 0.11893200129270554, "step": 2645, "valid_targets_mean": 10167.2, "valid_targets_min": 1590 }, { "epoch": 2.54336, "grad_norm": 0.20927258265813803, "learning_rate": 2.2890902921428004e-05, "loss": 0.3586, "loss_nan_ranks": 0, "loss_rank_avg": 0.11703682690858841, "step": 2650, "valid_targets_mean": 10636.1, "valid_targets_min": 2815 }, { "epoch": 2.54816, "grad_norm": 0.1970167456568604, "learning_rate": 2.2824591232513153e-05, "loss": 0.3678, "loss_nan_ranks": 0, "loss_rank_avg": 0.10874166339635849, "step": 2655, "valid_targets_mean": 10392.5, "valid_targets_min": 2435 }, { "epoch": 2.55296, "grad_norm": 0.20392076385963556, "learning_rate": 2.2758247845406495e-05, "loss": 0.3697, "loss_nan_ranks": 0, "loss_rank_avg": 0.12093451619148254, "step": 2660, "valid_targets_mean": 10889.5, "valid_targets_min": 1734 }, { "epoch": 2.55776, "grad_norm": 0.18913518596868675, "learning_rate": 2.2691873504628282e-05, "loss": 0.3578, "loss_nan_ranks": 0, "loss_rank_avg": 0.10009606927633286, "step": 2665, "valid_targets_mean": 10179.2, "valid_targets_min": 3734 }, { "epoch": 2.56256, "grad_norm": 0.22753404829816876, "learning_rate": 2.2625468955046143e-05, "loss": 0.3733, "loss_nan_ranks": 0, "loss_rank_avg": 0.13020503520965576, "step": 2670, "valid_targets_mean": 10354.9, "valid_targets_min": 2023 }, { "epoch": 2.56736, "grad_norm": 0.2130956888250592, "learning_rate": 2.2559034941866727e-05, "loss": 0.3612, "loss_nan_ranks": 0, "loss_rank_avg": 0.1377410888671875, "step": 2675, "valid_targets_mean": 11961.9, "valid_targets_min": 1854 }, { "epoch": 2.5721600000000002, "grad_norm": 0.23396720104016538, "learning_rate": 2.2492572210627325e-05, "loss": 0.3622, "loss_nan_ranks": 0, "loss_rank_avg": 0.12554751336574554, "step": 2680, "valid_targets_mean": 11309.3, "valid_targets_min": 3110 }, { "epoch": 2.57696, "grad_norm": 0.20949220427342713, "learning_rate": 2.24260815071875e-05, "loss": 0.3553, "loss_nan_ranks": 0, "loss_rank_avg": 0.12479083985090256, "step": 2685, "valid_targets_mean": 11756.3, "valid_targets_min": 2756 }, { "epoch": 2.58176, "grad_norm": 0.22023057058606868, "learning_rate": 2.2359563577720743e-05, "loss": 0.3658, "loss_nan_ranks": 0, "loss_rank_avg": 0.12142911553382874, "step": 2690, "valid_targets_mean": 10502.6, "valid_targets_min": 1432 }, { "epoch": 2.58656, "grad_norm": 0.1960286783235888, "learning_rate": 2.229301916870606e-05, "loss": 0.3579, "loss_nan_ranks": 0, "loss_rank_avg": 0.11783711612224579, "step": 2695, "valid_targets_mean": 10609.1, "valid_targets_min": 1423 }, { "epoch": 2.59136, "grad_norm": 0.196287674533827, "learning_rate": 2.2226449026919637e-05, "loss": 0.3677, "loss_nan_ranks": 0, "loss_rank_avg": 0.13481172919273376, "step": 2700, "valid_targets_mean": 12314.3, "valid_targets_min": 349 }, { "epoch": 2.5961600000000002, "grad_norm": 0.2017354957403159, "learning_rate": 2.2159853899426427e-05, "loss": 0.3597, "loss_nan_ranks": 0, "loss_rank_avg": 0.12297806888818741, "step": 2705, "valid_targets_mean": 11269.6, "valid_targets_min": 921 }, { "epoch": 2.60096, "grad_norm": 0.21504040340795968, "learning_rate": 2.209323453357178e-05, "loss": 0.363, "loss_nan_ranks": 0, "loss_rank_avg": 0.09462332725524902, "step": 2710, "valid_targets_mean": 7711.0, "valid_targets_min": 1260 }, { "epoch": 2.60576, "grad_norm": 0.18774009189829208, "learning_rate": 2.202659167697306e-05, "loss": 0.3665, "loss_nan_ranks": 0, "loss_rank_avg": 0.10885201394557953, "step": 2715, "valid_targets_mean": 10389.9, "valid_targets_min": 2927 }, { "epoch": 2.61056, "grad_norm": 0.20997682496666586, "learning_rate": 2.1959926077511234e-05, "loss": 0.3601, "loss_nan_ranks": 0, "loss_rank_avg": 0.1147003173828125, "step": 2720, "valid_targets_mean": 10074.6, "valid_targets_min": 2761 }, { "epoch": 2.61536, "grad_norm": 0.19602241999739142, "learning_rate": 2.1893238483322512e-05, "loss": 0.3617, "loss_nan_ranks": 0, "loss_rank_avg": 0.13930413126945496, "step": 2725, "valid_targets_mean": 12336.5, "valid_targets_min": 3485 }, { "epoch": 2.6201600000000003, "grad_norm": 0.20225701561452372, "learning_rate": 2.1826529642789923e-05, "loss": 0.3593, "loss_nan_ranks": 0, "loss_rank_avg": 0.11931279301643372, "step": 2730, "valid_targets_mean": 10042.8, "valid_targets_min": 2202 }, { "epoch": 2.6249599999999997, "grad_norm": 0.22142458739273158, "learning_rate": 2.1759800304534936e-05, "loss": 0.3679, "loss_nan_ranks": 0, "loss_rank_avg": 0.14175814390182495, "step": 2735, "valid_targets_mean": 11615.8, "valid_targets_min": 2372 }, { "epoch": 2.62976, "grad_norm": 0.23656684138473588, "learning_rate": 2.1693051217409048e-05, "loss": 0.3728, "loss_nan_ranks": 0, "loss_rank_avg": 0.12897023558616638, "step": 2740, "valid_targets_mean": 11909.6, "valid_targets_min": 1860 }, { "epoch": 2.63456, "grad_norm": 0.20663860230606496, "learning_rate": 2.1626283130485365e-05, "loss": 0.3671, "loss_nan_ranks": 0, "loss_rank_avg": 0.11588485538959503, "step": 2745, "valid_targets_mean": 10080.9, "valid_targets_min": 1081 }, { "epoch": 2.63936, "grad_norm": 0.20655720033130662, "learning_rate": 2.1559496793050235e-05, "loss": 0.3669, "loss_nan_ranks": 0, "loss_rank_avg": 0.11520221084356308, "step": 2750, "valid_targets_mean": 10034.1, "valid_targets_min": 2334 }, { "epoch": 2.64416, "grad_norm": 0.2103206956535719, "learning_rate": 2.1492692954594815e-05, "loss": 0.3669, "loss_nan_ranks": 0, "loss_rank_avg": 0.1502731442451477, "step": 2755, "valid_targets_mean": 12340.9, "valid_targets_min": 1574 }, { "epoch": 2.6489599999999998, "grad_norm": 0.20142551016494148, "learning_rate": 2.1425872364806642e-05, "loss": 0.363, "loss_nan_ranks": 0, "loss_rank_avg": 0.14424043893814087, "step": 2760, "valid_targets_mean": 12143.4, "valid_targets_min": 1267 }, { "epoch": 2.65376, "grad_norm": 0.19957066204774804, "learning_rate": 2.1359035773561275e-05, "loss": 0.3699, "loss_nan_ranks": 0, "loss_rank_avg": 0.1341516673564911, "step": 2765, "valid_targets_mean": 11031.7, "valid_targets_min": 2913 }, { "epoch": 2.65856, "grad_norm": 0.2011661145672297, "learning_rate": 2.1292183930913803e-05, "loss": 0.3716, "loss_nan_ranks": 0, "loss_rank_avg": 0.14259979128837585, "step": 2770, "valid_targets_mean": 12015.1, "valid_targets_min": 1469 }, { "epoch": 2.66336, "grad_norm": 0.21848616875295573, "learning_rate": 2.1225317587090507e-05, "loss": 0.3636, "loss_nan_ranks": 0, "loss_rank_avg": 0.1095510944724083, "step": 2775, "valid_targets_mean": 9779.4, "valid_targets_min": 1433 }, { "epoch": 2.66816, "grad_norm": 0.24628573916420246, "learning_rate": 2.1158437492480384e-05, "loss": 0.3609, "loss_nan_ranks": 0, "loss_rank_avg": 0.1268613338470459, "step": 2780, "valid_targets_mean": 11715.3, "valid_targets_min": 1504 }, { "epoch": 2.67296, "grad_norm": 0.18719854699996888, "learning_rate": 2.1091544397626752e-05, "loss": 0.3726, "loss_nan_ranks": 0, "loss_rank_avg": 0.1171911209821701, "step": 2785, "valid_targets_mean": 10388.6, "valid_targets_min": 2184 }, { "epoch": 2.67776, "grad_norm": 0.2394102887498419, "learning_rate": 2.102463905321881e-05, "loss": 0.3686, "loss_nan_ranks": 0, "loss_rank_avg": 0.13961833715438843, "step": 2790, "valid_targets_mean": 10197.9, "valid_targets_min": 1424 }, { "epoch": 2.68256, "grad_norm": 0.18070241452128152, "learning_rate": 2.095772221008323e-05, "loss": 0.3621, "loss_nan_ranks": 0, "loss_rank_avg": 0.12561923265457153, "step": 2795, "valid_targets_mean": 12434.9, "valid_targets_min": 979 }, { "epoch": 2.68736, "grad_norm": 0.24663833335176194, "learning_rate": 2.0890794619175745e-05, "loss": 0.3566, "loss_nan_ranks": 0, "loss_rank_avg": 0.10567250102758408, "step": 2800, "valid_targets_mean": 8472.5, "valid_targets_min": 1461 }, { "epoch": 2.69216, "grad_norm": 0.20289405773135852, "learning_rate": 2.0823857031572663e-05, "loss": 0.3643, "loss_nan_ranks": 0, "loss_rank_avg": 0.1317484974861145, "step": 2805, "valid_targets_mean": 11333.3, "valid_targets_min": 444 }, { "epoch": 2.69696, "grad_norm": 0.20744664772043325, "learning_rate": 2.0756910198462515e-05, "loss": 0.3602, "loss_nan_ranks": 0, "loss_rank_avg": 0.13761654496192932, "step": 2810, "valid_targets_mean": 10870.6, "valid_targets_min": 1506 }, { "epoch": 2.70176, "grad_norm": 0.21097955156861722, "learning_rate": 2.0689954871137558e-05, "loss": 0.3616, "loss_nan_ranks": 0, "loss_rank_avg": 0.11286822706460953, "step": 2815, "valid_targets_mean": 9823.9, "valid_targets_min": 1617 }, { "epoch": 2.70656, "grad_norm": 0.2110640803089252, "learning_rate": 2.0622991800985398e-05, "loss": 0.3617, "loss_nan_ranks": 0, "loss_rank_avg": 0.11495064944028854, "step": 2820, "valid_targets_mean": 9073.9, "valid_targets_min": 1187 }, { "epoch": 2.71136, "grad_norm": 0.22613715754326771, "learning_rate": 2.055602173948051e-05, "loss": 0.3643, "loss_nan_ranks": 0, "loss_rank_avg": 0.1298108845949173, "step": 2825, "valid_targets_mean": 10639.9, "valid_targets_min": 2426 }, { "epoch": 2.71616, "grad_norm": 0.21676181508143738, "learning_rate": 2.0489045438175842e-05, "loss": 0.3615, "loss_nan_ranks": 0, "loss_rank_avg": 0.0962882786989212, "step": 2830, "valid_targets_mean": 9108.2, "valid_targets_min": 2854 }, { "epoch": 2.72096, "grad_norm": 0.2026053135412824, "learning_rate": 2.042206364869436e-05, "loss": 0.3636, "loss_nan_ranks": 0, "loss_rank_avg": 0.11987446993589401, "step": 2835, "valid_targets_mean": 10001.6, "valid_targets_min": 2254 }, { "epoch": 2.72576, "grad_norm": 0.21857205264961743, "learning_rate": 2.0355077122720625e-05, "loss": 0.3669, "loss_nan_ranks": 0, "loss_rank_avg": 0.11152277886867523, "step": 2840, "valid_targets_mean": 9368.9, "valid_targets_min": 232 }, { "epoch": 2.73056, "grad_norm": 0.2235096544972368, "learning_rate": 2.0288086611992344e-05, "loss": 0.3597, "loss_nan_ranks": 0, "loss_rank_avg": 0.13391023874282837, "step": 2845, "valid_targets_mean": 10348.2, "valid_targets_min": 1288 }, { "epoch": 2.73536, "grad_norm": 0.20288624688622384, "learning_rate": 2.0221092868291953e-05, "loss": 0.3613, "loss_nan_ranks": 0, "loss_rank_avg": 0.11558884382247925, "step": 2850, "valid_targets_mean": 10537.2, "valid_targets_min": 2252 }, { "epoch": 2.74016, "grad_norm": 0.19954417000954933, "learning_rate": 2.0154096643438153e-05, "loss": 0.3658, "loss_nan_ranks": 0, "loss_rank_avg": 0.10435223579406738, "step": 2855, "valid_targets_mean": 9052.9, "valid_targets_min": 175 }, { "epoch": 2.74496, "grad_norm": 0.19802408710823705, "learning_rate": 2.008709868927751e-05, "loss": 0.3646, "loss_nan_ranks": 0, "loss_rank_avg": 0.11530742049217224, "step": 2860, "valid_targets_mean": 9975.5, "valid_targets_min": 2684 }, { "epoch": 2.74976, "grad_norm": 0.2187266128310994, "learning_rate": 2.0020099757675978e-05, "loss": 0.3611, "loss_nan_ranks": 0, "loss_rank_avg": 0.11976270377635956, "step": 2865, "valid_targets_mean": 9873.7, "valid_targets_min": 1817 }, { "epoch": 2.75456, "grad_norm": 0.22996724727881987, "learning_rate": 1.9953100600510487e-05, "loss": 0.3608, "loss_nan_ranks": 0, "loss_rank_avg": 0.11876045167446136, "step": 2870, "valid_targets_mean": 11607.8, "valid_targets_min": 1452 }, { "epoch": 2.75936, "grad_norm": 0.2306692684829691, "learning_rate": 1.9886101969660504e-05, "loss": 0.3778, "loss_nan_ranks": 0, "loss_rank_avg": 0.11759520322084427, "step": 2875, "valid_targets_mean": 9185.2, "valid_targets_min": 1996 }, { "epoch": 2.76416, "grad_norm": 0.2391988826978733, "learning_rate": 1.9819104616999584e-05, "loss": 0.365, "loss_nan_ranks": 0, "loss_rank_avg": 0.12147517502307892, "step": 2880, "valid_targets_mean": 11028.3, "valid_targets_min": 3506 }, { "epoch": 2.76896, "grad_norm": 0.20185735285509163, "learning_rate": 1.975210929438693e-05, "loss": 0.3645, "loss_nan_ranks": 0, "loss_rank_avg": 0.10030334442853928, "step": 2885, "valid_targets_mean": 9568.4, "valid_targets_min": 3429 }, { "epoch": 2.7737600000000002, "grad_norm": 0.19875807889149402, "learning_rate": 1.9685116753658982e-05, "loss": 0.3501, "loss_nan_ranks": 0, "loss_rank_avg": 0.13128820061683655, "step": 2890, "valid_targets_mean": 11010.5, "valid_targets_min": 1659 }, { "epoch": 2.77856, "grad_norm": 0.20966066469853917, "learning_rate": 1.9618127746620944e-05, "loss": 0.3605, "loss_nan_ranks": 0, "loss_rank_avg": 0.0992082953453064, "step": 2895, "valid_targets_mean": 9702.0, "valid_targets_min": 1449 }, { "epoch": 2.78336, "grad_norm": 0.20465611439947812, "learning_rate": 1.9551143025038363e-05, "loss": 0.3602, "loss_nan_ranks": 0, "loss_rank_avg": 0.12780556082725525, "step": 2900, "valid_targets_mean": 10775.2, "valid_targets_min": 2243 }, { "epoch": 2.78816, "grad_norm": 0.19999884250519026, "learning_rate": 1.9484163340628724e-05, "loss": 0.3658, "loss_nan_ranks": 0, "loss_rank_avg": 0.159572571516037, "step": 2905, "valid_targets_mean": 13880.4, "valid_targets_min": 2055 }, { "epoch": 2.79296, "grad_norm": 0.2267797595338644, "learning_rate": 1.941718944505294e-05, "loss": 0.3637, "loss_nan_ranks": 0, "loss_rank_avg": 0.1121618002653122, "step": 2910, "valid_targets_mean": 9450.2, "valid_targets_min": 1890 }, { "epoch": 2.7977600000000002, "grad_norm": 0.20806241852536878, "learning_rate": 1.9350222089906994e-05, "loss": 0.3569, "loss_nan_ranks": 0, "loss_rank_avg": 0.10966132581233978, "step": 2915, "valid_targets_mean": 10078.5, "valid_targets_min": 2442 }, { "epoch": 2.80256, "grad_norm": 0.1901812453004743, "learning_rate": 1.9283262026713456e-05, "loss": 0.3625, "loss_nan_ranks": 0, "loss_rank_avg": 0.1494556963443756, "step": 2920, "valid_targets_mean": 13154.9, "valid_targets_min": 2097 }, { "epoch": 2.80736, "grad_norm": 0.19629416111197162, "learning_rate": 1.9216310006913058e-05, "loss": 0.3632, "loss_nan_ranks": 0, "loss_rank_avg": 0.15318551659584045, "step": 2925, "valid_targets_mean": 12243.2, "valid_targets_min": 2044 }, { "epoch": 2.81216, "grad_norm": 0.22492866436695402, "learning_rate": 1.914936678185629e-05, "loss": 0.3635, "loss_nan_ranks": 0, "loss_rank_avg": 0.10800520330667496, "step": 2930, "valid_targets_mean": 8264.8, "valid_targets_min": 1432 }, { "epoch": 2.81696, "grad_norm": 0.2322759557369981, "learning_rate": 1.9082433102794918e-05, "loss": 0.3562, "loss_nan_ranks": 0, "loss_rank_avg": 0.10694816708564758, "step": 2935, "valid_targets_mean": 8236.9, "valid_targets_min": 1158 }, { "epoch": 2.8217600000000003, "grad_norm": 0.19751066773571385, "learning_rate": 1.9015509720873603e-05, "loss": 0.3618, "loss_nan_ranks": 0, "loss_rank_avg": 0.10615318268537521, "step": 2940, "valid_targets_mean": 9977.6, "valid_targets_min": 2450 }, { "epoch": 2.8265599999999997, "grad_norm": 0.2580598020963001, "learning_rate": 1.894859738712143e-05, "loss": 0.3577, "loss_nan_ranks": 0, "loss_rank_avg": 0.12153971195220947, "step": 2945, "valid_targets_mean": 11254.8, "valid_targets_min": 1980 }, { "epoch": 2.83136, "grad_norm": 0.20053695833514487, "learning_rate": 1.888169685244352e-05, "loss": 0.3664, "loss_nan_ranks": 0, "loss_rank_avg": 0.12622089684009552, "step": 2950, "valid_targets_mean": 11249.8, "valid_targets_min": 3481 }, { "epoch": 2.83616, "grad_norm": 0.22387411298344964, "learning_rate": 1.8814808867612568e-05, "loss": 0.3656, "loss_nan_ranks": 0, "loss_rank_avg": 0.1262330412864685, "step": 2955, "valid_targets_mean": 10618.3, "valid_targets_min": 1324 }, { "epoch": 2.84096, "grad_norm": 0.20084054265106147, "learning_rate": 1.8747934183260427e-05, "loss": 0.3579, "loss_nan_ranks": 0, "loss_rank_avg": 0.12606924772262573, "step": 2960, "valid_targets_mean": 10792.8, "valid_targets_min": 2360 }, { "epoch": 2.84576, "grad_norm": 0.20134811185220372, "learning_rate": 1.868107354986971e-05, "loss": 0.3541, "loss_nan_ranks": 0, "loss_rank_avg": 0.10368680953979492, "step": 2965, "valid_targets_mean": 9323.5, "valid_targets_min": 2257 }, { "epoch": 2.8505599999999998, "grad_norm": 0.21432043298936881, "learning_rate": 1.8614227717765327e-05, "loss": 0.3598, "loss_nan_ranks": 0, "loss_rank_avg": 0.12553778290748596, "step": 2970, "valid_targets_mean": 10495.8, "valid_targets_min": 2166 }, { "epoch": 2.85536, "grad_norm": 0.21010257773368773, "learning_rate": 1.8547397437106084e-05, "loss": 0.3622, "loss_nan_ranks": 0, "loss_rank_avg": 0.10031257569789886, "step": 2975, "valid_targets_mean": 8612.8, "valid_targets_min": 1990 }, { "epoch": 2.86016, "grad_norm": 0.2151100013139827, "learning_rate": 1.848058345787629e-05, "loss": 0.3676, "loss_nan_ranks": 0, "loss_rank_avg": 0.11149641126394272, "step": 2980, "valid_targets_mean": 9591.8, "valid_targets_min": 1578 }, { "epoch": 2.86496, "grad_norm": 0.20690191454976406, "learning_rate": 1.8413786529877288e-05, "loss": 0.3643, "loss_nan_ranks": 0, "loss_rank_avg": 0.11248461902141571, "step": 2985, "valid_targets_mean": 9634.5, "valid_targets_min": 1976 }, { "epoch": 2.86976, "grad_norm": 0.19091194792371544, "learning_rate": 1.8347007402719082e-05, "loss": 0.3626, "loss_nan_ranks": 0, "loss_rank_avg": 0.15383237600326538, "step": 2990, "valid_targets_mean": 13756.3, "valid_targets_min": 3591 }, { "epoch": 2.87456, "grad_norm": 0.25381121983321503, "learning_rate": 1.828024682581191e-05, "loss": 0.3689, "loss_nan_ranks": 0, "loss_rank_avg": 0.12134871631860733, "step": 2995, "valid_targets_mean": 10468.4, "valid_targets_min": 1861 }, { "epoch": 2.87936, "grad_norm": 0.20681853099155056, "learning_rate": 1.8213505548357822e-05, "loss": 0.359, "loss_nan_ranks": 0, "loss_rank_avg": 0.11575278639793396, "step": 3000, "valid_targets_mean": 10195.7, "valid_targets_min": 1365 }, { "epoch": 2.88416, "grad_norm": 0.2586449714167572, "learning_rate": 1.814678431934231e-05, "loss": 0.3637, "loss_nan_ranks": 0, "loss_rank_avg": 0.13470815122127533, "step": 3005, "valid_targets_mean": 10735.1, "valid_targets_min": 1758 }, { "epoch": 2.88896, "grad_norm": 0.19973456872577822, "learning_rate": 1.8080083887525862e-05, "loss": 0.3582, "loss_nan_ranks": 0, "loss_rank_avg": 0.13693934679031372, "step": 3010, "valid_targets_mean": 11732.4, "valid_targets_min": 2603 }, { "epoch": 2.89376, "grad_norm": 0.27571022032343157, "learning_rate": 1.801340500143557e-05, "loss": 0.3672, "loss_nan_ranks": 0, "loss_rank_avg": 0.11827176064252853, "step": 3015, "valid_targets_mean": 9584.5, "valid_targets_min": 1872 }, { "epoch": 2.89856, "grad_norm": 0.20586896983288694, "learning_rate": 1.7946748409356746e-05, "loss": 0.3631, "loss_nan_ranks": 0, "loss_rank_avg": 0.132304847240448, "step": 3020, "valid_targets_mean": 11284.5, "valid_targets_min": 2521 }, { "epoch": 2.90336, "grad_norm": 0.2156847432711145, "learning_rate": 1.788011485932451e-05, "loss": 0.3627, "loss_nan_ranks": 0, "loss_rank_avg": 0.13747841119766235, "step": 3025, "valid_targets_mean": 12327.1, "valid_targets_min": 3063 }, { "epoch": 2.90816, "grad_norm": 0.19504637524682655, "learning_rate": 1.78135050991154e-05, "loss": 0.3601, "loss_nan_ranks": 0, "loss_rank_avg": 0.11804535984992981, "step": 3030, "valid_targets_mean": 9373.9, "valid_targets_min": 1669 }, { "epoch": 2.91296, "grad_norm": 0.2085548541654179, "learning_rate": 1.774691987623898e-05, "loss": 0.3616, "loss_nan_ranks": 0, "loss_rank_avg": 0.11510040611028671, "step": 3035, "valid_targets_mean": 10716.6, "valid_targets_min": 996 }, { "epoch": 2.91776, "grad_norm": 0.21766250562775843, "learning_rate": 1.768035993792944e-05, "loss": 0.3589, "loss_nan_ranks": 0, "loss_rank_avg": 0.13932877779006958, "step": 3040, "valid_targets_mean": 12401.8, "valid_targets_min": 1150 }, { "epoch": 2.92256, "grad_norm": 0.22907780830855445, "learning_rate": 1.7613826031137245e-05, "loss": 0.3592, "loss_nan_ranks": 0, "loss_rank_avg": 0.12984474003314972, "step": 3045, "valid_targets_mean": 9680.3, "valid_targets_min": 3371 }, { "epoch": 2.92736, "grad_norm": 0.19920710075709197, "learning_rate": 1.7547318902520693e-05, "loss": 0.3563, "loss_nan_ranks": 0, "loss_rank_avg": 0.12504421174526215, "step": 3050, "valid_targets_mean": 10457.5, "valid_targets_min": 1864 }, { "epoch": 2.93216, "grad_norm": 0.1863477376482489, "learning_rate": 1.7480839298437612e-05, "loss": 0.3541, "loss_nan_ranks": 0, "loss_rank_avg": 0.1148369163274765, "step": 3055, "valid_targets_mean": 10887.1, "valid_targets_min": 2181 }, { "epoch": 2.93696, "grad_norm": 0.20514036723322157, "learning_rate": 1.7414387964936913e-05, "loss": 0.359, "loss_nan_ranks": 0, "loss_rank_avg": 0.11017856001853943, "step": 3060, "valid_targets_mean": 9396.2, "valid_targets_min": 1286 }, { "epoch": 2.94176, "grad_norm": 0.19968116055603938, "learning_rate": 1.7347965647750264e-05, "loss": 0.3568, "loss_nan_ranks": 0, "loss_rank_avg": 0.11665418744087219, "step": 3065, "valid_targets_mean": 10102.7, "valid_targets_min": 1289 }, { "epoch": 2.94656, "grad_norm": 0.20817684656234767, "learning_rate": 1.7281573092283698e-05, "loss": 0.3486, "loss_nan_ranks": 0, "loss_rank_avg": 0.10370459407567978, "step": 3070, "valid_targets_mean": 9148.8, "valid_targets_min": 2335 }, { "epoch": 2.95136, "grad_norm": 0.1992253544024843, "learning_rate": 1.721521104360925e-05, "loss": 0.3632, "loss_nan_ranks": 0, "loss_rank_avg": 0.12574630975723267, "step": 3075, "valid_targets_mean": 11535.0, "valid_targets_min": 2265 }, { "epoch": 2.95616, "grad_norm": 0.209456797096903, "learning_rate": 1.714888024645662e-05, "loss": 0.3598, "loss_nan_ranks": 0, "loss_rank_avg": 0.09037169814109802, "step": 3080, "valid_targets_mean": 7926.5, "valid_targets_min": 1720 }, { "epoch": 2.96096, "grad_norm": 0.23173634572043963, "learning_rate": 1.708258144520478e-05, "loss": 0.3644, "loss_nan_ranks": 0, "loss_rank_avg": 0.11924492567777634, "step": 3085, "valid_targets_mean": 10889.4, "valid_targets_min": 1408 }, { "epoch": 2.96576, "grad_norm": 0.20975622608835376, "learning_rate": 1.7016315383873637e-05, "loss": 0.354, "loss_nan_ranks": 0, "loss_rank_avg": 0.12030082941055298, "step": 3090, "valid_targets_mean": 10797.7, "valid_targets_min": 3240 }, { "epoch": 2.97056, "grad_norm": 0.21701184668492338, "learning_rate": 1.6950082806115692e-05, "loss": 0.3615, "loss_nan_ranks": 0, "loss_rank_avg": 0.11946055293083191, "step": 3095, "valid_targets_mean": 10773.8, "valid_targets_min": 3241 }, { "epoch": 2.9753600000000002, "grad_norm": 0.19977669409558643, "learning_rate": 1.6883884455207685e-05, "loss": 0.3622, "loss_nan_ranks": 0, "loss_rank_avg": 0.11068576574325562, "step": 3100, "valid_targets_mean": 9751.3, "valid_targets_min": 851 }, { "epoch": 2.98016, "grad_norm": 0.2059080526574065, "learning_rate": 1.6817721074042254e-05, "loss": 0.3565, "loss_nan_ranks": 0, "loss_rank_avg": 0.13456991314888, "step": 3105, "valid_targets_mean": 11390.2, "valid_targets_min": 1956 }, { "epoch": 2.98496, "grad_norm": 0.20080719781787096, "learning_rate": 1.675159340511958e-05, "loss": 0.3586, "loss_nan_ranks": 0, "loss_rank_avg": 0.12177115678787231, "step": 3110, "valid_targets_mean": 11015.5, "valid_targets_min": 2312 }, { "epoch": 2.98976, "grad_norm": 0.22633322795913888, "learning_rate": 1.6685502190539106e-05, "loss": 0.362, "loss_nan_ranks": 0, "loss_rank_avg": 0.14303162693977356, "step": 3115, "valid_targets_mean": 11830.6, "valid_targets_min": 2556 }, { "epoch": 2.99456, "grad_norm": 0.20303697576064644, "learning_rate": 1.6619448171991155e-05, "loss": 0.3622, "loss_nan_ranks": 0, "loss_rank_avg": 0.1473173052072525, "step": 3120, "valid_targets_mean": 12810.6, "valid_targets_min": 2805 }, { "epoch": 2.9993600000000002, "grad_norm": 0.21006741878018884, "learning_rate": 1.6553432090748624e-05, "loss": 0.3636, "loss_nan_ranks": 0, "loss_rank_avg": 0.12304878979921341, "step": 3125, "valid_targets_mean": 10014.9, "valid_targets_min": 352 }, { "epoch": 3.00384, "grad_norm": 0.1911338881768588, "learning_rate": 1.648745468765869e-05, "loss": 0.363, "loss_nan_ranks": 0, "loss_rank_avg": 0.1106758713722229, "step": 3130, "valid_targets_mean": 10679.0, "valid_targets_min": 2647 }, { "epoch": 3.00864, "grad_norm": 0.18503418871632474, "learning_rate": 1.6421516703134463e-05, "loss": 0.3507, "loss_nan_ranks": 0, "loss_rank_avg": 0.10718891024589539, "step": 3135, "valid_targets_mean": 9676.6, "valid_targets_min": 3561 }, { "epoch": 3.01344, "grad_norm": 0.19632597147141265, "learning_rate": 1.6355618877146685e-05, "loss": 0.3577, "loss_nan_ranks": 0, "loss_rank_avg": 0.1160854697227478, "step": 3140, "valid_targets_mean": 10539.7, "valid_targets_min": 2460 }, { "epoch": 3.01824, "grad_norm": 0.18389649394404944, "learning_rate": 1.6289761949215435e-05, "loss": 0.3556, "loss_nan_ranks": 0, "loss_rank_avg": 0.10422074794769287, "step": 3145, "valid_targets_mean": 8746.8, "valid_targets_min": 1724 }, { "epoch": 3.02304, "grad_norm": 0.19428247076021085, "learning_rate": 1.6223946658401818e-05, "loss": 0.3572, "loss_nan_ranks": 0, "loss_rank_avg": 0.11618025600910187, "step": 3150, "valid_targets_mean": 10644.7, "valid_targets_min": 2639 }, { "epoch": 3.02784, "grad_norm": 0.1989538133285283, "learning_rate": 1.6158173743299692e-05, "loss": 0.3535, "loss_nan_ranks": 0, "loss_rank_avg": 0.13024590909481049, "step": 3155, "valid_targets_mean": 11188.2, "valid_targets_min": 2165 }, { "epoch": 3.03264, "grad_norm": 0.1993685753545757, "learning_rate": 1.6092443942027356e-05, "loss": 0.3623, "loss_nan_ranks": 0, "loss_rank_avg": 0.109580397605896, "step": 3160, "valid_targets_mean": 9663.8, "valid_targets_min": 1420 }, { "epoch": 3.03744, "grad_norm": 0.18751059894772873, "learning_rate": 1.602675799221927e-05, "loss": 0.362, "loss_nan_ranks": 0, "loss_rank_avg": 0.12348620593547821, "step": 3165, "valid_targets_mean": 10874.9, "valid_targets_min": 2228 }, { "epoch": 3.04224, "grad_norm": 0.19821491707707475, "learning_rate": 1.59611166310178e-05, "loss": 0.3616, "loss_nan_ranks": 0, "loss_rank_avg": 0.11230102926492691, "step": 3170, "valid_targets_mean": 9740.4, "valid_targets_min": 1925 }, { "epoch": 3.04704, "grad_norm": 0.1944362720163763, "learning_rate": 1.5895520595064913e-05, "loss": 0.3529, "loss_nan_ranks": 0, "loss_rank_avg": 0.1168983057141304, "step": 3175, "valid_targets_mean": 10594.9, "valid_targets_min": 1259 }, { "epoch": 3.05184, "grad_norm": 0.1956092410315661, "learning_rate": 1.5829970620493932e-05, "loss": 0.3559, "loss_nan_ranks": 0, "loss_rank_avg": 0.09523244202136993, "step": 3180, "valid_targets_mean": 8686.4, "valid_targets_min": 1431 }, { "epoch": 3.05664, "grad_norm": 0.18827941293584474, "learning_rate": 1.5764467442921274e-05, "loss": 0.3503, "loss_nan_ranks": 0, "loss_rank_avg": 0.1236504539847374, "step": 3185, "valid_targets_mean": 12017.0, "valid_targets_min": 1252 }, { "epoch": 3.06144, "grad_norm": 0.18656827183872657, "learning_rate": 1.569901179743818e-05, "loss": 0.3605, "loss_nan_ranks": 0, "loss_rank_avg": 0.12331358343362808, "step": 3190, "valid_targets_mean": 11676.1, "valid_targets_min": 2242 }, { "epoch": 3.06624, "grad_norm": 0.19798995046879575, "learning_rate": 1.5633604418602483e-05, "loss": 0.3529, "loss_nan_ranks": 0, "loss_rank_avg": 0.12344086915254593, "step": 3195, "valid_targets_mean": 11296.1, "valid_targets_min": 2591 }, { "epoch": 3.07104, "grad_norm": 0.20696979517957703, "learning_rate": 1.5568246040430343e-05, "loss": 0.3545, "loss_nan_ranks": 0, "loss_rank_avg": 0.1138351783156395, "step": 3200, "valid_targets_mean": 9281.8, "valid_targets_min": 1942 }, { "epoch": 3.07584, "grad_norm": 0.1915849618482703, "learning_rate": 1.5502937396388046e-05, "loss": 0.354, "loss_nan_ranks": 0, "loss_rank_avg": 0.10900023579597473, "step": 3205, "valid_targets_mean": 10877.6, "valid_targets_min": 2699 }, { "epoch": 3.08064, "grad_norm": 0.1827720297353329, "learning_rate": 1.543767921938374e-05, "loss": 0.363, "loss_nan_ranks": 0, "loss_rank_avg": 0.1224978119134903, "step": 3210, "valid_targets_mean": 11502.3, "valid_targets_min": 1838 }, { "epoch": 3.08544, "grad_norm": 0.18647047083470117, "learning_rate": 1.537247224175922e-05, "loss": 0.3567, "loss_nan_ranks": 0, "loss_rank_avg": 0.12575547397136688, "step": 3215, "valid_targets_mean": 10821.2, "valid_targets_min": 2280 }, { "epoch": 3.09024, "grad_norm": 0.20310601224851935, "learning_rate": 1.53073171952817e-05, "loss": 0.3613, "loss_nan_ranks": 0, "loss_rank_avg": 0.09874022006988525, "step": 3220, "valid_targets_mean": 8396.7, "valid_targets_min": 1481 }, { "epoch": 3.09504, "grad_norm": 0.1907050422414701, "learning_rate": 1.5242214811135631e-05, "loss": 0.3564, "loss_nan_ranks": 0, "loss_rank_avg": 0.1317986696958542, "step": 3225, "valid_targets_mean": 11944.2, "valid_targets_min": 1024 }, { "epoch": 3.09984, "grad_norm": 0.23024193549682415, "learning_rate": 1.5177165819914461e-05, "loss": 0.3649, "loss_nan_ranks": 0, "loss_rank_avg": 0.1109505295753479, "step": 3230, "valid_targets_mean": 10249.3, "valid_targets_min": 2751 }, { "epoch": 3.10464, "grad_norm": 0.21783714840986526, "learning_rate": 1.5112170951612455e-05, "loss": 0.3638, "loss_nan_ranks": 0, "loss_rank_avg": 0.128553107380867, "step": 3235, "valid_targets_mean": 9875.0, "valid_targets_min": 1253 }, { "epoch": 3.10944, "grad_norm": 0.1859714790317045, "learning_rate": 1.5047230935616497e-05, "loss": 0.3496, "loss_nan_ranks": 0, "loss_rank_avg": 0.12540477514266968, "step": 3240, "valid_targets_mean": 9422.7, "valid_targets_min": 1985 }, { "epoch": 3.11424, "grad_norm": 0.17930792691047237, "learning_rate": 1.4982346500697916e-05, "loss": 0.3648, "loss_nan_ranks": 0, "loss_rank_avg": 0.1338803768157959, "step": 3245, "valid_targets_mean": 11366.2, "valid_targets_min": 1835 }, { "epoch": 3.11904, "grad_norm": 0.19775983710451614, "learning_rate": 1.4917518375004281e-05, "loss": 0.3565, "loss_nan_ranks": 0, "loss_rank_avg": 0.11442698538303375, "step": 3250, "valid_targets_mean": 9435.9, "valid_targets_min": 2168 }, { "epoch": 3.12384, "grad_norm": 0.18680122426497975, "learning_rate": 1.4852747286051254e-05, "loss": 0.3606, "loss_nan_ranks": 0, "loss_rank_avg": 0.12294398248195648, "step": 3255, "valid_targets_mean": 10353.2, "valid_targets_min": 1413 }, { "epoch": 3.12864, "grad_norm": 0.1925913840839781, "learning_rate": 1.478803396071443e-05, "loss": 0.3591, "loss_nan_ranks": 0, "loss_rank_avg": 0.10112228244543076, "step": 3260, "valid_targets_mean": 9614.4, "valid_targets_min": 2012 }, { "epoch": 3.1334400000000002, "grad_norm": 0.1892566760221108, "learning_rate": 1.472337912522115e-05, "loss": 0.3647, "loss_nan_ranks": 0, "loss_rank_avg": 0.12162721157073975, "step": 3265, "valid_targets_mean": 10449.9, "valid_targets_min": 410 }, { "epoch": 3.13824, "grad_norm": 0.1986424282020148, "learning_rate": 1.4658783505142368e-05, "loss": 0.3534, "loss_nan_ranks": 0, "loss_rank_avg": 0.1560564637184143, "step": 3270, "valid_targets_mean": 12148.1, "valid_targets_min": 979 }, { "epoch": 3.14304, "grad_norm": 0.19036134077024724, "learning_rate": 1.4594247825384529e-05, "loss": 0.3533, "loss_nan_ranks": 0, "loss_rank_avg": 0.10178598761558533, "step": 3275, "valid_targets_mean": 9834.5, "valid_targets_min": 1698 }, { "epoch": 3.14784, "grad_norm": 0.19790264725596374, "learning_rate": 1.4529772810181398e-05, "loss": 0.3541, "loss_nan_ranks": 0, "loss_rank_avg": 0.1019100546836853, "step": 3280, "valid_targets_mean": 9963.8, "valid_targets_min": 1741 }, { "epoch": 3.15264, "grad_norm": 0.18612486364274605, "learning_rate": 1.4465359183085958e-05, "loss": 0.3506, "loss_nan_ranks": 0, "loss_rank_avg": 0.12211617082357407, "step": 3285, "valid_targets_mean": 10298.8, "valid_targets_min": 2362 }, { "epoch": 3.15744, "grad_norm": 0.19467475396240183, "learning_rate": 1.4401007666962276e-05, "loss": 0.3586, "loss_nan_ranks": 0, "loss_rank_avg": 0.120920330286026, "step": 3290, "valid_targets_mean": 10495.0, "valid_targets_min": 2093 }, { "epoch": 3.16224, "grad_norm": 0.1929595161256868, "learning_rate": 1.4336718983977389e-05, "loss": 0.3647, "loss_nan_ranks": 0, "loss_rank_avg": 0.1146123930811882, "step": 3295, "valid_targets_mean": 10586.0, "valid_targets_min": 1173 }, { "epoch": 3.16704, "grad_norm": 0.18264708976721075, "learning_rate": 1.4272493855593222e-05, "loss": 0.3576, "loss_nan_ranks": 0, "loss_rank_avg": 0.13314726948738098, "step": 3300, "valid_targets_mean": 11679.8, "valid_targets_min": 1112 }, { "epoch": 3.17184, "grad_norm": 0.1913530013358868, "learning_rate": 1.4208333002558462e-05, "loss": 0.3583, "loss_nan_ranks": 0, "loss_rank_avg": 0.10753712058067322, "step": 3305, "valid_targets_mean": 9290.6, "valid_targets_min": 1387 }, { "epoch": 3.17664, "grad_norm": 0.20193716674075288, "learning_rate": 1.4144237144900497e-05, "loss": 0.3654, "loss_nan_ranks": 0, "loss_rank_avg": 0.11723098158836365, "step": 3310, "valid_targets_mean": 10084.2, "valid_targets_min": 1711 }, { "epoch": 3.18144, "grad_norm": 0.18684656406178907, "learning_rate": 1.4080207001917302e-05, "loss": 0.3524, "loss_nan_ranks": 0, "loss_rank_avg": 0.11985105276107788, "step": 3315, "valid_targets_mean": 10388.2, "valid_targets_min": 1748 }, { "epoch": 3.18624, "grad_norm": 0.18906821405151913, "learning_rate": 1.4016243292169413e-05, "loss": 0.358, "loss_nan_ranks": 0, "loss_rank_avg": 0.10248436778783798, "step": 3320, "valid_targets_mean": 9951.2, "valid_targets_min": 2571 }, { "epoch": 3.19104, "grad_norm": 0.21691396130072285, "learning_rate": 1.3952346733471822e-05, "loss": 0.3637, "loss_nan_ranks": 0, "loss_rank_avg": 0.13228540122509003, "step": 3325, "valid_targets_mean": 11530.5, "valid_targets_min": 1585 }, { "epoch": 3.19584, "grad_norm": 0.20831678580666343, "learning_rate": 1.3888518042885934e-05, "loss": 0.3606, "loss_nan_ranks": 0, "loss_rank_avg": 0.11678709089756012, "step": 3330, "valid_targets_mean": 9578.8, "valid_targets_min": 2241 }, { "epoch": 3.20064, "grad_norm": 0.22016906998882896, "learning_rate": 1.3824757936711537e-05, "loss": 0.3564, "loss_nan_ranks": 0, "loss_rank_avg": 0.11219100654125214, "step": 3335, "valid_targets_mean": 9951.4, "valid_targets_min": 1808 }, { "epoch": 3.20544, "grad_norm": 0.1737671280514502, "learning_rate": 1.3761067130478738e-05, "loss": 0.3516, "loss_nan_ranks": 0, "loss_rank_avg": 0.12665574252605438, "step": 3340, "valid_targets_mean": 12212.2, "valid_targets_min": 3127 }, { "epoch": 3.21024, "grad_norm": 0.18679582060053115, "learning_rate": 1.3697446338939942e-05, "loss": 0.3587, "loss_nan_ranks": 0, "loss_rank_avg": 0.12244650721549988, "step": 3345, "valid_targets_mean": 10303.5, "valid_targets_min": 3638 }, { "epoch": 3.21504, "grad_norm": 0.18953197574821232, "learning_rate": 1.3633896276061847e-05, "loss": 0.3479, "loss_nan_ranks": 0, "loss_rank_avg": 0.11921748518943787, "step": 3350, "valid_targets_mean": 10747.9, "valid_targets_min": 2550 }, { "epoch": 3.21984, "grad_norm": 0.19332856848026225, "learning_rate": 1.3570417655017405e-05, "loss": 0.366, "loss_nan_ranks": 0, "loss_rank_avg": 0.12070733308792114, "step": 3355, "valid_targets_mean": 10950.4, "valid_targets_min": 1986 }, { "epoch": 3.22464, "grad_norm": 0.17752470811518664, "learning_rate": 1.3507011188177846e-05, "loss": 0.3559, "loss_nan_ranks": 0, "loss_rank_avg": 0.11526253074407578, "step": 3360, "valid_targets_mean": 11321.6, "valid_targets_min": 2605 }, { "epoch": 3.22944, "grad_norm": 0.19017706432063974, "learning_rate": 1.3443677587104655e-05, "loss": 0.3591, "loss_nan_ranks": 0, "loss_rank_avg": 0.08614403009414673, "step": 3365, "valid_targets_mean": 8164.4, "valid_targets_min": 1641 }, { "epoch": 3.23424, "grad_norm": 0.1923946538335053, "learning_rate": 1.3380417562541604e-05, "loss": 0.3678, "loss_nan_ranks": 0, "loss_rank_avg": 0.1379067748785019, "step": 3370, "valid_targets_mean": 11554.5, "valid_targets_min": 274 }, { "epoch": 3.23904, "grad_norm": 0.2183518088024744, "learning_rate": 1.3317231824406783e-05, "loss": 0.3591, "loss_nan_ranks": 0, "loss_rank_avg": 0.12228928506374359, "step": 3375, "valid_targets_mean": 10087.4, "valid_targets_min": 761 }, { "epoch": 3.24384, "grad_norm": 0.1802788340350456, "learning_rate": 1.325412108178461e-05, "loss": 0.3554, "loss_nan_ranks": 0, "loss_rank_avg": 0.11406947672367096, "step": 3380, "valid_targets_mean": 10006.9, "valid_targets_min": 1848 }, { "epoch": 3.24864, "grad_norm": 0.20894077379192982, "learning_rate": 1.3191086042917895e-05, "loss": 0.3582, "loss_nan_ranks": 0, "loss_rank_avg": 0.11614423245191574, "step": 3385, "valid_targets_mean": 9981.8, "valid_targets_min": 1502 }, { "epoch": 3.25344, "grad_norm": 0.19977532613637036, "learning_rate": 1.3128127415199883e-05, "loss": 0.3568, "loss_nan_ranks": 0, "loss_rank_avg": 0.1377061903476715, "step": 3390, "valid_targets_mean": 10633.7, "valid_targets_min": 1012 }, { "epoch": 3.25824, "grad_norm": 0.1901378820426991, "learning_rate": 1.3065245905166316e-05, "loss": 0.3492, "loss_nan_ranks": 0, "loss_rank_avg": 0.12295252829790115, "step": 3395, "valid_targets_mean": 11947.4, "valid_targets_min": 2325 }, { "epoch": 3.26304, "grad_norm": 0.18578663753606683, "learning_rate": 1.30024422184875e-05, "loss": 0.3569, "loss_nan_ranks": 0, "loss_rank_avg": 0.11808900535106659, "step": 3400, "valid_targets_mean": 11162.8, "valid_targets_min": 1875 }, { "epoch": 3.26784, "grad_norm": 0.186713719935275, "learning_rate": 1.2939717059960384e-05, "loss": 0.3525, "loss_nan_ranks": 0, "loss_rank_avg": 0.11969725042581558, "step": 3405, "valid_targets_mean": 10443.7, "valid_targets_min": 1996 }, { "epoch": 3.27264, "grad_norm": 0.17502503273066872, "learning_rate": 1.287707113350068e-05, "loss": 0.3585, "loss_nan_ranks": 0, "loss_rank_avg": 0.11786532402038574, "step": 3410, "valid_targets_mean": 11139.2, "valid_targets_min": 1627 }, { "epoch": 3.27744, "grad_norm": 0.1998399471402172, "learning_rate": 1.2814505142134921e-05, "loss": 0.361, "loss_nan_ranks": 0, "loss_rank_avg": 0.10916991531848907, "step": 3415, "valid_targets_mean": 10066.5, "valid_targets_min": 2648 }, { "epoch": 3.28224, "grad_norm": 0.18258313932232073, "learning_rate": 1.2752019787992587e-05, "loss": 0.3621, "loss_nan_ranks": 0, "loss_rank_avg": 0.12325777858495712, "step": 3420, "valid_targets_mean": 11230.4, "valid_targets_min": 2024 }, { "epoch": 3.28704, "grad_norm": 0.19416187067441554, "learning_rate": 1.268961577229824e-05, "loss": 0.3598, "loss_nan_ranks": 0, "loss_rank_avg": 0.14313529431819916, "step": 3425, "valid_targets_mean": 12805.9, "valid_targets_min": 2969 }, { "epoch": 3.29184, "grad_norm": 0.18140295108808063, "learning_rate": 1.262729379536365e-05, "loss": 0.3566, "loss_nan_ranks": 0, "loss_rank_avg": 0.11013881862163544, "step": 3430, "valid_targets_mean": 9937.2, "valid_targets_min": 1936 }, { "epoch": 3.29664, "grad_norm": 0.199023784044211, "learning_rate": 1.2565054556579917e-05, "loss": 0.3584, "loss_nan_ranks": 0, "loss_rank_avg": 0.13415634632110596, "step": 3435, "valid_targets_mean": 10926.6, "valid_targets_min": 3449 }, { "epoch": 3.30144, "grad_norm": 0.19049442802798405, "learning_rate": 1.2502898754409637e-05, "loss": 0.3575, "loss_nan_ranks": 0, "loss_rank_avg": 0.14396649599075317, "step": 3440, "valid_targets_mean": 12972.6, "valid_targets_min": 811 }, { "epoch": 3.30624, "grad_norm": 0.1885705753589618, "learning_rate": 1.2440827086379055e-05, "loss": 0.3543, "loss_nan_ranks": 0, "loss_rank_avg": 0.12890590727329254, "step": 3445, "valid_targets_mean": 10910.4, "valid_targets_min": 2691 }, { "epoch": 3.31104, "grad_norm": 0.19529808846683833, "learning_rate": 1.2378840249070265e-05, "loss": 0.3583, "loss_nan_ranks": 0, "loss_rank_avg": 0.09891938418149948, "step": 3450, "valid_targets_mean": 7235.0, "valid_targets_min": 1740 }, { "epoch": 3.31584, "grad_norm": 0.19195203994171842, "learning_rate": 1.2316938938113356e-05, "loss": 0.3494, "loss_nan_ranks": 0, "loss_rank_avg": 0.13893388211727142, "step": 3455, "valid_targets_mean": 10672.0, "valid_targets_min": 1852 }, { "epoch": 3.32064, "grad_norm": 0.18938418133544757, "learning_rate": 1.2255123848178619e-05, "loss": 0.3637, "loss_nan_ranks": 0, "loss_rank_avg": 0.14761734008789062, "step": 3460, "valid_targets_mean": 12264.5, "valid_targets_min": 1059 }, { "epoch": 3.32544, "grad_norm": 0.2245840467957242, "learning_rate": 1.2193395672968765e-05, "loss": 0.356, "loss_nan_ranks": 0, "loss_rank_avg": 0.1288203001022339, "step": 3465, "valid_targets_mean": 11682.1, "valid_targets_min": 3245 }, { "epoch": 3.33024, "grad_norm": 0.24566943058202834, "learning_rate": 1.2131755105211118e-05, "loss": 0.3503, "loss_nan_ranks": 0, "loss_rank_avg": 0.12490352988243103, "step": 3470, "valid_targets_mean": 10748.3, "valid_targets_min": 2691 }, { "epoch": 3.3350400000000002, "grad_norm": 0.19570442808701657, "learning_rate": 1.2070202836649855e-05, "loss": 0.3556, "loss_nan_ranks": 0, "loss_rank_avg": 0.11817985028028488, "step": 3475, "valid_targets_mean": 10496.6, "valid_targets_min": 1164 }, { "epoch": 3.33984, "grad_norm": 0.1938457143624076, "learning_rate": 1.2008739558038247e-05, "loss": 0.3576, "loss_nan_ranks": 0, "loss_rank_avg": 0.12001006305217743, "step": 3480, "valid_targets_mean": 10190.2, "valid_targets_min": 1310 }, { "epoch": 3.34464, "grad_norm": 0.19830141758413053, "learning_rate": 1.1947365959130895e-05, "loss": 0.3484, "loss_nan_ranks": 0, "loss_rank_avg": 0.11415542662143707, "step": 3485, "valid_targets_mean": 9767.1, "valid_targets_min": 1479 }, { "epoch": 3.34944, "grad_norm": 0.18805418601396895, "learning_rate": 1.1886082728675984e-05, "loss": 0.3598, "loss_nan_ranks": 0, "loss_rank_avg": 0.10864933580160141, "step": 3490, "valid_targets_mean": 9316.0, "valid_targets_min": 2287 }, { "epoch": 3.35424, "grad_norm": 0.19446719017345912, "learning_rate": 1.1824890554407574e-05, "loss": 0.3672, "loss_nan_ranks": 0, "loss_rank_avg": 0.10024982690811157, "step": 3495, "valid_targets_mean": 9009.9, "valid_targets_min": 263 }, { "epoch": 3.3590400000000002, "grad_norm": 0.18135088395469234, "learning_rate": 1.1763790123037873e-05, "loss": 0.362, "loss_nan_ranks": 0, "loss_rank_avg": 0.14061683416366577, "step": 3500, "valid_targets_mean": 12592.8, "valid_targets_min": 3445 }, { "epoch": 3.36384, "grad_norm": 0.18546771956201968, "learning_rate": 1.1702782120249539e-05, "loss": 0.3538, "loss_nan_ranks": 0, "loss_rank_avg": 0.1133251041173935, "step": 3505, "valid_targets_mean": 10291.1, "valid_targets_min": 1576 }, { "epoch": 3.36864, "grad_norm": 0.19807807518664403, "learning_rate": 1.164186723068795e-05, "loss": 0.361, "loss_nan_ranks": 0, "loss_rank_avg": 0.11753286421298981, "step": 3510, "valid_targets_mean": 10020.5, "valid_targets_min": 1826 }, { "epoch": 3.37344, "grad_norm": 0.2278874445711356, "learning_rate": 1.1581046137953575e-05, "loss": 0.3502, "loss_nan_ranks": 0, "loss_rank_avg": 0.10156413912773132, "step": 3515, "valid_targets_mean": 9347.9, "valid_targets_min": 2769 }, { "epoch": 3.37824, "grad_norm": 0.18710166735457182, "learning_rate": 1.1520319524594256e-05, "loss": 0.3563, "loss_nan_ranks": 0, "loss_rank_avg": 0.12491115182638168, "step": 3520, "valid_targets_mean": 10771.9, "valid_targets_min": 2445 }, { "epoch": 3.38304, "grad_norm": 0.2024893783584319, "learning_rate": 1.1459688072097568e-05, "loss": 0.3569, "loss_nan_ranks": 0, "loss_rank_avg": 0.13399648666381836, "step": 3525, "valid_targets_mean": 9379.2, "valid_targets_min": 2095 }, { "epoch": 3.38784, "grad_norm": 0.1861201118297581, "learning_rate": 1.1399152460883176e-05, "loss": 0.3568, "loss_nan_ranks": 0, "loss_rank_avg": 0.11231739073991776, "step": 3530, "valid_targets_mean": 9798.0, "valid_targets_min": 2038 }, { "epoch": 3.39264, "grad_norm": 0.1966601165631479, "learning_rate": 1.1338713370295189e-05, "loss": 0.3622, "loss_nan_ranks": 0, "loss_rank_avg": 0.117458775639534, "step": 3535, "valid_targets_mean": 10878.8, "valid_targets_min": 2845 }, { "epoch": 3.39744, "grad_norm": 0.2085490830405768, "learning_rate": 1.1278371478594538e-05, "loss": 0.3551, "loss_nan_ranks": 0, "loss_rank_avg": 0.10531540215015411, "step": 3540, "valid_targets_mean": 9678.8, "valid_targets_min": 2667 }, { "epoch": 3.40224, "grad_norm": 0.18946887709543617, "learning_rate": 1.1218127462951367e-05, "loss": 0.3546, "loss_nan_ranks": 0, "loss_rank_avg": 0.1102088987827301, "step": 3545, "valid_targets_mean": 10510.7, "valid_targets_min": 1094 }, { "epoch": 3.40704, "grad_norm": 0.17892277003492862, "learning_rate": 1.1157981999437444e-05, "loss": 0.3499, "loss_nan_ranks": 0, "loss_rank_avg": 0.13594399392604828, "step": 3550, "valid_targets_mean": 12380.1, "valid_targets_min": 2776 }, { "epoch": 3.4118399999999998, "grad_norm": 0.217465251290386, "learning_rate": 1.109793576301855e-05, "loss": 0.3609, "loss_nan_ranks": 0, "loss_rank_avg": 0.13660013675689697, "step": 3555, "valid_targets_mean": 11982.4, "valid_targets_min": 3267 }, { "epoch": 3.41664, "grad_norm": 0.20923061680624425, "learning_rate": 1.1037989427546924e-05, "loss": 0.3538, "loss_nan_ranks": 0, "loss_rank_avg": 0.10261556506156921, "step": 3560, "valid_targets_mean": 9321.8, "valid_targets_min": 1740 }, { "epoch": 3.42144, "grad_norm": 0.18390467258543086, "learning_rate": 1.0978143665753692e-05, "loss": 0.3572, "loss_nan_ranks": 0, "loss_rank_avg": 0.10945111513137817, "step": 3565, "valid_targets_mean": 9768.1, "valid_targets_min": 424 }, { "epoch": 3.42624, "grad_norm": 0.1854201454238558, "learning_rate": 1.0918399149241314e-05, "loss": 0.3556, "loss_nan_ranks": 0, "loss_rank_avg": 0.11244992911815643, "step": 3570, "valid_targets_mean": 9936.3, "valid_targets_min": 1494 }, { "epoch": 3.43104, "grad_norm": 0.19331857879904846, "learning_rate": 1.0858756548476058e-05, "loss": 0.3532, "loss_nan_ranks": 0, "loss_rank_avg": 0.11202079802751541, "step": 3575, "valid_targets_mean": 9803.0, "valid_targets_min": 1987 }, { "epoch": 3.43584, "grad_norm": 0.19396064861205353, "learning_rate": 1.0799216532780478e-05, "loss": 0.3606, "loss_nan_ranks": 0, "loss_rank_avg": 0.12126053869724274, "step": 3580, "valid_targets_mean": 11055.3, "valid_targets_min": 2296 }, { "epoch": 3.44064, "grad_norm": 0.17874507316377455, "learning_rate": 1.0739779770325885e-05, "loss": 0.3495, "loss_nan_ranks": 0, "loss_rank_avg": 0.12120386958122253, "step": 3585, "valid_targets_mean": 10554.2, "valid_targets_min": 2168 }, { "epoch": 3.44544, "grad_norm": 0.19495375081499186, "learning_rate": 1.0680446928124872e-05, "loss": 0.362, "loss_nan_ranks": 0, "loss_rank_avg": 0.12293912470340729, "step": 3590, "valid_targets_mean": 10255.5, "valid_targets_min": 1716 }, { "epoch": 3.45024, "grad_norm": 0.1910897590945172, "learning_rate": 1.06212186720238e-05, "loss": 0.357, "loss_nan_ranks": 0, "loss_rank_avg": 0.1188676506280899, "step": 3595, "valid_targets_mean": 9686.2, "valid_targets_min": 3623 }, { "epoch": 3.45504, "grad_norm": 0.1811992412391965, "learning_rate": 1.0562095666695352e-05, "loss": 0.3511, "loss_nan_ranks": 0, "loss_rank_avg": 0.10783851146697998, "step": 3600, "valid_targets_mean": 9709.2, "valid_targets_min": 1990 }, { "epoch": 3.45984, "grad_norm": 0.19304297830203423, "learning_rate": 1.0503078575631052e-05, "loss": 0.3423, "loss_nan_ranks": 0, "loss_rank_avg": 0.13060978055000305, "step": 3605, "valid_targets_mean": 12093.8, "valid_targets_min": 2563 }, { "epoch": 3.46464, "grad_norm": 0.19848303325348635, "learning_rate": 1.0444168061133846e-05, "loss": 0.3243, "loss_nan_ranks": 0, "loss_rank_avg": 0.11622381210327148, "step": 3610, "valid_targets_mean": 11091.0, "valid_targets_min": 1856 }, { "epoch": 3.46944, "grad_norm": 0.1962983514499632, "learning_rate": 1.0385364784310636e-05, "loss": 0.3369, "loss_nan_ranks": 0, "loss_rank_avg": 0.10630473494529724, "step": 3615, "valid_targets_mean": 9552.4, "valid_targets_min": 1488 }, { "epoch": 3.47424, "grad_norm": 0.18394754371487584, "learning_rate": 1.0326669405064904e-05, "loss": 0.3406, "loss_nan_ranks": 0, "loss_rank_avg": 0.12049125134944916, "step": 3620, "valid_targets_mean": 11530.6, "valid_targets_min": 1867 }, { "epoch": 3.47904, "grad_norm": 0.20134945522749817, "learning_rate": 1.0268082582089263e-05, "loss": 0.3391, "loss_nan_ranks": 0, "loss_rank_avg": 0.09410315752029419, "step": 3625, "valid_targets_mean": 9730.5, "valid_targets_min": 1819 }, { "epoch": 3.48384, "grad_norm": 0.20430868467866287, "learning_rate": 1.0209604972858081e-05, "loss": 0.3446, "loss_nan_ranks": 0, "loss_rank_avg": 0.1092514842748642, "step": 3630, "valid_targets_mean": 10808.2, "valid_targets_min": 932 }, { "epoch": 3.48864, "grad_norm": 0.1923622457140111, "learning_rate": 1.0151237233620115e-05, "loss": 0.3344, "loss_nan_ranks": 0, "loss_rank_avg": 0.10817442834377289, "step": 3635, "valid_targets_mean": 10063.6, "valid_targets_min": 504 }, { "epoch": 3.49344, "grad_norm": 0.1919431133222278, "learning_rate": 1.0092980019391132e-05, "loss": 0.3453, "loss_nan_ranks": 0, "loss_rank_avg": 0.11262176185846329, "step": 3640, "valid_targets_mean": 11249.9, "valid_targets_min": 2827 }, { "epoch": 3.49824, "grad_norm": 0.22049311818233236, "learning_rate": 1.0034833983946561e-05, "loss": 0.3279, "loss_nan_ranks": 0, "loss_rank_avg": 0.09713824093341827, "step": 3645, "valid_targets_mean": 9480.8, "valid_targets_min": 2041 }, { "epoch": 3.50304, "grad_norm": 0.18906192877132377, "learning_rate": 9.976799779814157e-06, "loss": 0.3362, "loss_nan_ranks": 0, "loss_rank_avg": 0.10813942551612854, "step": 3650, "valid_targets_mean": 9799.3, "valid_targets_min": 2045 }, { "epoch": 3.50784, "grad_norm": 0.20056904457870012, "learning_rate": 9.918878058266687e-06, "loss": 0.3413, "loss_nan_ranks": 0, "loss_rank_avg": 0.12527769804000854, "step": 3655, "valid_targets_mean": 11885.8, "valid_targets_min": 2417 }, { "epoch": 3.51264, "grad_norm": 0.20011413770145697, "learning_rate": 9.86106946931462e-06, "loss": 0.342, "loss_nan_ranks": 0, "loss_rank_avg": 0.11193445324897766, "step": 3660, "valid_targets_mean": 9013.2, "valid_targets_min": 1957 }, { "epoch": 3.51744, "grad_norm": 0.25272674369217807, "learning_rate": 9.803374661698802e-06, "loss": 0.3371, "loss_nan_ranks": 0, "loss_rank_avg": 0.1340043842792511, "step": 3665, "valid_targets_mean": 11369.7, "valid_targets_min": 2172 }, { "epoch": 3.52224, "grad_norm": 0.2061921625077728, "learning_rate": 9.745794282883215e-06, "loss": 0.3417, "loss_nan_ranks": 0, "loss_rank_avg": 0.1308523714542389, "step": 3670, "valid_targets_mean": 11718.5, "valid_targets_min": 2566 }, { "epoch": 3.52704, "grad_norm": 0.2140394863007355, "learning_rate": 9.688328979047689e-06, "loss": 0.3339, "loss_nan_ranks": 0, "loss_rank_avg": 0.1149681806564331, "step": 3675, "valid_targets_mean": 10297.6, "valid_targets_min": 2433 }, { "epoch": 3.53184, "grad_norm": 0.20548285119646126, "learning_rate": 9.630979395080667e-06, "loss": 0.3388, "loss_nan_ranks": 0, "loss_rank_avg": 0.10696137696504593, "step": 3680, "valid_targets_mean": 10548.2, "valid_targets_min": 2192 }, { "epoch": 3.5366400000000002, "grad_norm": 0.20553549970341442, "learning_rate": 9.573746174571947e-06, "loss": 0.3372, "loss_nan_ranks": 0, "loss_rank_avg": 0.09759115427732468, "step": 3685, "valid_targets_mean": 9031.1, "valid_targets_min": 394 }, { "epoch": 3.54144, "grad_norm": 0.2451074762204898, "learning_rate": 9.516629959805468e-06, "loss": 0.3333, "loss_nan_ranks": 0, "loss_rank_avg": 0.10014495253562927, "step": 3690, "valid_targets_mean": 9580.7, "valid_targets_min": 1801 }, { "epoch": 3.54624, "grad_norm": 0.21626968302427205, "learning_rate": 9.459631391752126e-06, "loss": 0.337, "loss_nan_ranks": 0, "loss_rank_avg": 0.11678461730480194, "step": 3695, "valid_targets_mean": 10609.9, "valid_targets_min": 1721 }, { "epoch": 3.55104, "grad_norm": 0.19392085602556414, "learning_rate": 9.40275111006254e-06, "loss": 0.3387, "loss_nan_ranks": 0, "loss_rank_avg": 0.08821696043014526, "step": 3700, "valid_targets_mean": 9932.8, "valid_targets_min": 3422 }, { "epoch": 3.55584, "grad_norm": 0.201996804562783, "learning_rate": 9.345989753059895e-06, "loss": 0.3356, "loss_nan_ranks": 0, "loss_rank_avg": 0.1151978075504303, "step": 3705, "valid_targets_mean": 11600.8, "valid_targets_min": 3168 }, { "epoch": 3.5606400000000002, "grad_norm": 0.22336753266344042, "learning_rate": 9.289347957732779e-06, "loss": 0.3374, "loss_nan_ranks": 0, "loss_rank_avg": 0.12304936349391937, "step": 3710, "valid_targets_mean": 10241.5, "valid_targets_min": 2089 }, { "epoch": 3.56544, "grad_norm": 0.19062223595038535, "learning_rate": 9.232826359728034e-06, "loss": 0.3378, "loss_nan_ranks": 0, "loss_rank_avg": 0.11184520274400711, "step": 3715, "valid_targets_mean": 10874.9, "valid_targets_min": 1798 }, { "epoch": 3.57024, "grad_norm": 0.19077344761804907, "learning_rate": 9.17642559334362e-06, "loss": 0.336, "loss_nan_ranks": 0, "loss_rank_avg": 0.12285032868385315, "step": 3720, "valid_targets_mean": 10946.0, "valid_targets_min": 1827 }, { "epoch": 3.57504, "grad_norm": 0.2083508079173029, "learning_rate": 9.120146291521488e-06, "loss": 0.3274, "loss_nan_ranks": 0, "loss_rank_avg": 0.10798792541027069, "step": 3725, "valid_targets_mean": 9431.4, "valid_targets_min": 1744 }, { "epoch": 3.57984, "grad_norm": 0.19931430642605075, "learning_rate": 9.063989085840506e-06, "loss": 0.3345, "loss_nan_ranks": 0, "loss_rank_avg": 0.10994656383991241, "step": 3730, "valid_targets_mean": 10691.3, "valid_targets_min": 3764 }, { "epoch": 3.5846400000000003, "grad_norm": 0.20157589308788418, "learning_rate": 9.007954606509346e-06, "loss": 0.3318, "loss_nan_ranks": 0, "loss_rank_avg": 0.12041280418634415, "step": 3735, "valid_targets_mean": 11329.4, "valid_targets_min": 317 }, { "epoch": 3.5894399999999997, "grad_norm": 0.19739606946409297, "learning_rate": 8.952043482359408e-06, "loss": 0.3333, "loss_nan_ranks": 0, "loss_rank_avg": 0.11637447774410248, "step": 3740, "valid_targets_mean": 10785.2, "valid_targets_min": 2678 }, { "epoch": 3.59424, "grad_norm": 0.19236658753285724, "learning_rate": 8.896256340837779e-06, "loss": 0.3329, "loss_nan_ranks": 0, "loss_rank_avg": 0.10516636818647385, "step": 3745, "valid_targets_mean": 10048.1, "valid_targets_min": 452 }, { "epoch": 3.59904, "grad_norm": 0.22012325224639936, "learning_rate": 8.840593808000182e-06, "loss": 0.3366, "loss_nan_ranks": 0, "loss_rank_avg": 0.11621899902820587, "step": 3750, "valid_targets_mean": 10399.3, "valid_targets_min": 2540 }, { "epoch": 3.60384, "grad_norm": 0.18658943719781973, "learning_rate": 8.785056508503956e-06, "loss": 0.3404, "loss_nan_ranks": 0, "loss_rank_avg": 0.10126075148582458, "step": 3755, "valid_targets_mean": 8977.8, "valid_targets_min": 2025 }, { "epoch": 3.60864, "grad_norm": 0.20321229778516367, "learning_rate": 8.729645065601045e-06, "loss": 0.3321, "loss_nan_ranks": 0, "loss_rank_avg": 0.10659228265285492, "step": 3760, "valid_targets_mean": 9902.1, "valid_targets_min": 1186 }, { "epoch": 3.6134399999999998, "grad_norm": 0.20835216151670474, "learning_rate": 8.674360101130994e-06, "loss": 0.3303, "loss_nan_ranks": 0, "loss_rank_avg": 0.12322533875703812, "step": 3765, "valid_targets_mean": 10761.2, "valid_targets_min": 2155 }, { "epoch": 3.61824, "grad_norm": 0.24853022651912218, "learning_rate": 8.619202235514e-06, "loss": 0.3324, "loss_nan_ranks": 0, "loss_rank_avg": 0.10587123781442642, "step": 3770, "valid_targets_mean": 10205.1, "valid_targets_min": 1463 }, { "epoch": 3.62304, "grad_norm": 0.18590936223050844, "learning_rate": 8.564172087743903e-06, "loss": 0.3368, "loss_nan_ranks": 0, "loss_rank_avg": 0.09855873882770538, "step": 3775, "valid_targets_mean": 10165.1, "valid_targets_min": 1423 }, { "epoch": 3.62784, "grad_norm": 0.19324732375974865, "learning_rate": 8.50927027538128e-06, "loss": 0.3385, "loss_nan_ranks": 0, "loss_rank_avg": 0.11301326006650925, "step": 3780, "valid_targets_mean": 11568.4, "valid_targets_min": 3325 }, { "epoch": 3.63264, "grad_norm": 0.19183324907556853, "learning_rate": 8.454497414546497e-06, "loss": 0.3446, "loss_nan_ranks": 0, "loss_rank_avg": 0.10337097197771072, "step": 3785, "valid_targets_mean": 9855.3, "valid_targets_min": 1252 }, { "epoch": 3.63744, "grad_norm": 0.21893269097934628, "learning_rate": 8.39985411991279e-06, "loss": 0.3404, "loss_nan_ranks": 0, "loss_rank_avg": 0.11065911501646042, "step": 3790, "valid_targets_mean": 8598.5, "valid_targets_min": 2729 }, { "epoch": 3.64224, "grad_norm": 0.2037498536595881, "learning_rate": 8.345341004699386e-06, "loss": 0.3433, "loss_nan_ranks": 0, "loss_rank_avg": 0.10529591143131256, "step": 3795, "valid_targets_mean": 10991.3, "valid_targets_min": 2372 }, { "epoch": 3.64704, "grad_norm": 0.20553055083765032, "learning_rate": 8.290958680664591e-06, "loss": 0.333, "loss_nan_ranks": 0, "loss_rank_avg": 0.11532579362392426, "step": 3800, "valid_targets_mean": 10666.8, "valid_targets_min": 2320 }, { "epoch": 3.65184, "grad_norm": 0.19243076020293992, "learning_rate": 8.236707758098965e-06, "loss": 0.3421, "loss_nan_ranks": 0, "loss_rank_avg": 0.10770958662033081, "step": 3805, "valid_targets_mean": 10406.8, "valid_targets_min": 2341 }, { "epoch": 3.65664, "grad_norm": 0.19327308471343702, "learning_rate": 8.182588845818452e-06, "loss": 0.3407, "loss_nan_ranks": 0, "loss_rank_avg": 0.11743837594985962, "step": 3810, "valid_targets_mean": 11392.2, "valid_targets_min": 778 }, { "epoch": 3.66144, "grad_norm": 0.5322781547709468, "learning_rate": 8.128602551157523e-06, "loss": 0.3377, "loss_nan_ranks": 0, "loss_rank_avg": 0.1046619713306427, "step": 3815, "valid_targets_mean": 9404.5, "valid_targets_min": 1286 }, { "epoch": 3.66624, "grad_norm": 0.18200763770766343, "learning_rate": 8.074749479962407e-06, "loss": 0.3407, "loss_nan_ranks": 0, "loss_rank_avg": 0.10478302091360092, "step": 3820, "valid_targets_mean": 10424.2, "valid_targets_min": 2328 }, { "epoch": 3.67104, "grad_norm": 0.20154542379432241, "learning_rate": 8.021030236584254e-06, "loss": 0.3361, "loss_nan_ranks": 0, "loss_rank_avg": 0.10680904239416122, "step": 3825, "valid_targets_mean": 9686.7, "valid_targets_min": 2481 }, { "epoch": 3.67584, "grad_norm": 0.20471388463535073, "learning_rate": 7.967445423872384e-06, "loss": 0.3486, "loss_nan_ranks": 0, "loss_rank_avg": 0.12352913618087769, "step": 3830, "valid_targets_mean": 10895.8, "valid_targets_min": 2669 }, { "epoch": 3.68064, "grad_norm": 0.19496961604395602, "learning_rate": 7.913995643167494e-06, "loss": 0.3335, "loss_nan_ranks": 0, "loss_rank_avg": 0.10220825672149658, "step": 3835, "valid_targets_mean": 11739.0, "valid_targets_min": 1646 }, { "epoch": 3.68544, "grad_norm": 0.18616220712690562, "learning_rate": 7.860681494294917e-06, "loss": 0.3331, "loss_nan_ranks": 0, "loss_rank_avg": 0.11336371302604675, "step": 3840, "valid_targets_mean": 12121.3, "valid_targets_min": 2219 }, { "epoch": 3.69024, "grad_norm": 0.19672724322192428, "learning_rate": 7.80750357555792e-06, "loss": 0.3332, "loss_nan_ranks": 0, "loss_rank_avg": 0.10641404986381531, "step": 3845, "valid_targets_mean": 9148.8, "valid_targets_min": 1182 }, { "epoch": 3.69504, "grad_norm": 0.18760061959670887, "learning_rate": 7.75446248373094e-06, "loss": 0.3345, "loss_nan_ranks": 0, "loss_rank_avg": 0.09877805411815643, "step": 3850, "valid_targets_mean": 10289.6, "valid_targets_min": 1531 }, { "epoch": 3.69984, "grad_norm": 0.1989894615739904, "learning_rate": 7.701558814052928e-06, "loss": 0.3353, "loss_nan_ranks": 0, "loss_rank_avg": 0.11524476110935211, "step": 3855, "valid_targets_mean": 10849.2, "valid_targets_min": 2253 }, { "epoch": 3.70464, "grad_norm": 0.21263096110802848, "learning_rate": 7.648793160220637e-06, "loss": 0.333, "loss_nan_ranks": 0, "loss_rank_avg": 0.0896211490035057, "step": 3860, "valid_targets_mean": 8943.8, "valid_targets_min": 2080 }, { "epoch": 3.70944, "grad_norm": 0.20660700096766874, "learning_rate": 7.596166114381991e-06, "loss": 0.3375, "loss_nan_ranks": 0, "loss_rank_avg": 0.12305016815662384, "step": 3865, "valid_targets_mean": 11404.3, "valid_targets_min": 2439 }, { "epoch": 3.71424, "grad_norm": 0.1887513060702262, "learning_rate": 7.543678267129408e-06, "loss": 0.3351, "loss_nan_ranks": 0, "loss_rank_avg": 0.10012684017419815, "step": 3870, "valid_targets_mean": 9752.9, "valid_targets_min": 2479 }, { "epoch": 3.71904, "grad_norm": 0.19859233526993486, "learning_rate": 7.491330207493215e-06, "loss": 0.3325, "loss_nan_ranks": 0, "loss_rank_avg": 0.10596565902233124, "step": 3875, "valid_targets_mean": 9964.5, "valid_targets_min": 2429 }, { "epoch": 3.72384, "grad_norm": 0.1926164171143439, "learning_rate": 7.4391225229349785e-06, "loss": 0.3369, "loss_nan_ranks": 0, "loss_rank_avg": 0.11391852796077728, "step": 3880, "valid_targets_mean": 12301.7, "valid_targets_min": 2739 }, { "epoch": 3.72864, "grad_norm": 0.2044202427462678, "learning_rate": 7.387055799340977e-06, "loss": 0.3385, "loss_nan_ranks": 0, "loss_rank_avg": 0.09524258971214294, "step": 3885, "valid_targets_mean": 9396.2, "valid_targets_min": 2039 }, { "epoch": 3.73344, "grad_norm": 0.20832735693973597, "learning_rate": 7.3351306210155645e-06, "loss": 0.3352, "loss_nan_ranks": 0, "loss_rank_avg": 0.12448085099458694, "step": 3890, "valid_targets_mean": 11666.6, "valid_targets_min": 2410 }, { "epoch": 3.7382400000000002, "grad_norm": 0.2012811682766443, "learning_rate": 7.283347570674664e-06, "loss": 0.3376, "loss_nan_ranks": 0, "loss_rank_avg": 0.09556588530540466, "step": 3895, "valid_targets_mean": 8674.2, "valid_targets_min": 2091 }, { "epoch": 3.74304, "grad_norm": 0.1954028099618188, "learning_rate": 7.231707229439191e-06, "loss": 0.3365, "loss_nan_ranks": 0, "loss_rank_avg": 0.11363653838634491, "step": 3900, "valid_targets_mean": 10786.8, "valid_targets_min": 1764 }, { "epoch": 3.74784, "grad_norm": 0.20984038963396634, "learning_rate": 7.180210176828557e-06, "loss": 0.3324, "loss_nan_ranks": 0, "loss_rank_avg": 0.11528477072715759, "step": 3905, "valid_targets_mean": 10695.7, "valid_targets_min": 1713 }, { "epoch": 3.75264, "grad_norm": 0.19426620615010454, "learning_rate": 7.1288569907541495e-06, "loss": 0.3298, "loss_nan_ranks": 0, "loss_rank_avg": 0.09247671067714691, "step": 3910, "valid_targets_mean": 9820.4, "valid_targets_min": 2085 }, { "epoch": 3.75744, "grad_norm": 0.20099406626199876, "learning_rate": 7.0776482475128674e-06, "loss": 0.3455, "loss_nan_ranks": 0, "loss_rank_avg": 0.12034967541694641, "step": 3915, "valid_targets_mean": 11045.9, "valid_targets_min": 2748 }, { "epoch": 3.7622400000000003, "grad_norm": 0.2012651470799037, "learning_rate": 7.026584521780628e-06, "loss": 0.3479, "loss_nan_ranks": 0, "loss_rank_avg": 0.11899619549512863, "step": 3920, "valid_targets_mean": 10818.9, "valid_targets_min": 2197 }, { "epoch": 3.76704, "grad_norm": 0.2170502759681478, "learning_rate": 6.9756663866059324e-06, "loss": 0.3375, "loss_nan_ranks": 0, "loss_rank_avg": 0.10469336807727814, "step": 3925, "valid_targets_mean": 9436.8, "valid_targets_min": 2091 }, { "epoch": 3.77184, "grad_norm": 0.19380358298158798, "learning_rate": 6.924894413403434e-06, "loss": 0.3261, "loss_nan_ranks": 0, "loss_rank_avg": 0.11549240350723267, "step": 3930, "valid_targets_mean": 10453.5, "valid_targets_min": 993 }, { "epoch": 3.77664, "grad_norm": 0.19883634363318978, "learning_rate": 6.874269171947516e-06, "loss": 0.332, "loss_nan_ranks": 0, "loss_rank_avg": 0.09396840631961823, "step": 3935, "valid_targets_mean": 9193.5, "valid_targets_min": 1774 }, { "epoch": 3.78144, "grad_norm": 0.19563421512476295, "learning_rate": 6.8237912303659195e-06, "loss": 0.3306, "loss_nan_ranks": 0, "loss_rank_avg": 0.1019580215215683, "step": 3940, "valid_targets_mean": 8852.4, "valid_targets_min": 406 }, { "epoch": 3.7862400000000003, "grad_norm": 0.1972328228862978, "learning_rate": 6.773461155133334e-06, "loss": 0.3387, "loss_nan_ranks": 0, "loss_rank_avg": 0.11583631485700607, "step": 3945, "valid_targets_mean": 10057.0, "valid_targets_min": 1606 }, { "epoch": 3.7910399999999997, "grad_norm": 0.1779667766611541, "learning_rate": 6.723279511065088e-06, "loss": 0.3358, "loss_nan_ranks": 0, "loss_rank_avg": 0.13784457743167877, "step": 3950, "valid_targets_mean": 12148.1, "valid_targets_min": 1637 }, { "epoch": 3.79584, "grad_norm": 0.24094579223060217, "learning_rate": 6.673246861310751e-06, "loss": 0.3365, "loss_nan_ranks": 0, "loss_rank_avg": 0.09021230041980743, "step": 3955, "valid_targets_mean": 9060.4, "valid_targets_min": 1710 }, { "epoch": 3.80064, "grad_norm": 0.20096836711477922, "learning_rate": 6.623363767347874e-06, "loss": 0.334, "loss_nan_ranks": 0, "loss_rank_avg": 0.11364022642374039, "step": 3960, "valid_targets_mean": 10833.1, "valid_targets_min": 1812 }, { "epoch": 3.80544, "grad_norm": 0.19641419404223437, "learning_rate": 6.5736307889756425e-06, "loss": 0.3352, "loss_nan_ranks": 0, "loss_rank_avg": 0.12811903655529022, "step": 3965, "valid_targets_mean": 11935.5, "valid_targets_min": 3243 }, { "epoch": 3.81024, "grad_norm": 0.2088422125497686, "learning_rate": 6.5240484843086095e-06, "loss": 0.3381, "loss_nan_ranks": 0, "loss_rank_avg": 0.11009708046913147, "step": 3970, "valid_targets_mean": 9540.8, "valid_targets_min": 2491 }, { "epoch": 3.8150399999999998, "grad_norm": 0.17629238607105105, "learning_rate": 6.474617409770441e-06, "loss": 0.3335, "loss_nan_ranks": 0, "loss_rank_avg": 0.08507069945335388, "step": 3975, "valid_targets_mean": 8515.1, "valid_targets_min": 1979 }, { "epoch": 3.81984, "grad_norm": 0.20252130389575573, "learning_rate": 6.425338120087665e-06, "loss": 0.3345, "loss_nan_ranks": 0, "loss_rank_avg": 0.1134904995560646, "step": 3980, "valid_targets_mean": 10508.7, "valid_targets_min": 893 }, { "epoch": 3.82464, "grad_norm": 0.1879269492686956, "learning_rate": 6.3762111682834374e-06, "loss": 0.3318, "loss_nan_ranks": 0, "loss_rank_avg": 0.09007836878299713, "step": 3985, "valid_targets_mean": 8626.4, "valid_targets_min": 1175 }, { "epoch": 3.82944, "grad_norm": 0.176619695453459, "learning_rate": 6.327237105671362e-06, "loss": 0.341, "loss_nan_ranks": 0, "loss_rank_avg": 0.12505346536636353, "step": 3990, "valid_targets_mean": 12297.1, "valid_targets_min": 2315 }, { "epoch": 3.83424, "grad_norm": 0.18064417692761175, "learning_rate": 6.278416481849274e-06, "loss": 0.3388, "loss_nan_ranks": 0, "loss_rank_avg": 0.10311710834503174, "step": 3995, "valid_targets_mean": 10158.5, "valid_targets_min": 2461 }, { "epoch": 3.83904, "grad_norm": 0.19352979258741507, "learning_rate": 6.22974984469308e-06, "loss": 0.3307, "loss_nan_ranks": 0, "loss_rank_avg": 0.10242927074432373, "step": 4000, "valid_targets_mean": 10619.7, "valid_targets_min": 2218 }, { "epoch": 3.84384, "grad_norm": 0.20312962511126573, "learning_rate": 6.181237740350625e-06, "loss": 0.3347, "loss_nan_ranks": 0, "loss_rank_avg": 0.12367504835128784, "step": 4005, "valid_targets_mean": 10997.3, "valid_targets_min": 2039 }, { "epoch": 3.84864, "grad_norm": 0.20281314060838945, "learning_rate": 6.132880713235543e-06, "loss": 0.3308, "loss_nan_ranks": 0, "loss_rank_avg": 0.10259454697370529, "step": 4010, "valid_targets_mean": 10200.3, "valid_targets_min": 1817 }, { "epoch": 3.85344, "grad_norm": 0.19236705300579124, "learning_rate": 6.084679306021162e-06, "loss": 0.3341, "loss_nan_ranks": 0, "loss_rank_avg": 0.11262617260217667, "step": 4015, "valid_targets_mean": 10491.1, "valid_targets_min": 2912 }, { "epoch": 3.85824, "grad_norm": 0.21216763050139026, "learning_rate": 6.036634059634403e-06, "loss": 0.3407, "loss_nan_ranks": 0, "loss_rank_avg": 0.12088140100240707, "step": 4020, "valid_targets_mean": 10524.1, "valid_targets_min": 2892 }, { "epoch": 3.86304, "grad_norm": 0.18810111079172934, "learning_rate": 5.988745513249723e-06, "loss": 0.3415, "loss_nan_ranks": 0, "loss_rank_avg": 0.11481692641973495, "step": 4025, "valid_targets_mean": 11395.9, "valid_targets_min": 2159 }, { "epoch": 3.86784, "grad_norm": 0.18646315134853542, "learning_rate": 5.941014204283065e-06, "loss": 0.3328, "loss_nan_ranks": 0, "loss_rank_avg": 0.12088949233293533, "step": 4030, "valid_targets_mean": 10613.7, "valid_targets_min": 2751 }, { "epoch": 3.87264, "grad_norm": 0.24880825961937425, "learning_rate": 5.893440668385797e-06, "loss": 0.3421, "loss_nan_ranks": 0, "loss_rank_avg": 0.10480111837387085, "step": 4035, "valid_targets_mean": 9637.3, "valid_targets_min": 1479 }, { "epoch": 3.87744, "grad_norm": 0.21853378472081741, "learning_rate": 5.8460254394387335e-06, "loss": 0.3425, "loss_nan_ranks": 0, "loss_rank_avg": 0.10361306369304657, "step": 4040, "valid_targets_mean": 9368.8, "valid_targets_min": 1418 }, { "epoch": 3.88224, "grad_norm": 0.1811642976364691, "learning_rate": 5.798769049546136e-06, "loss": 0.3341, "loss_nan_ranks": 0, "loss_rank_avg": 0.11255176365375519, "step": 4045, "valid_targets_mean": 12307.6, "valid_targets_min": 3160 }, { "epoch": 3.88704, "grad_norm": 0.17835674257256226, "learning_rate": 5.751672029029734e-06, "loss": 0.3347, "loss_nan_ranks": 0, "loss_rank_avg": 0.11680912226438522, "step": 4050, "valid_targets_mean": 11949.1, "valid_targets_min": 2171 }, { "epoch": 3.89184, "grad_norm": 0.2660592016540433, "learning_rate": 5.704734906422775e-06, "loss": 0.3386, "loss_nan_ranks": 0, "loss_rank_avg": 0.09463915973901749, "step": 4055, "valid_targets_mean": 9402.0, "valid_targets_min": 2696 }, { "epoch": 3.89664, "grad_norm": 0.19566691507927225, "learning_rate": 5.657958208464103e-06, "loss": 0.3399, "loss_nan_ranks": 0, "loss_rank_avg": 0.12318737804889679, "step": 4060, "valid_targets_mean": 11424.6, "valid_targets_min": 2863 }, { "epoch": 3.90144, "grad_norm": 0.1844478364760468, "learning_rate": 5.611342460092244e-06, "loss": 0.3359, "loss_nan_ranks": 0, "loss_rank_avg": 0.08694644272327423, "step": 4065, "valid_targets_mean": 9213.2, "valid_targets_min": 1996 }, { "epoch": 3.90624, "grad_norm": 0.1873501610977791, "learning_rate": 5.564888184439505e-06, "loss": 0.3394, "loss_nan_ranks": 0, "loss_rank_avg": 0.1016213595867157, "step": 4070, "valid_targets_mean": 8913.0, "valid_targets_min": 2279 }, { "epoch": 3.91104, "grad_norm": 0.1966574544973596, "learning_rate": 5.5185959028261135e-06, "loss": 0.3359, "loss_nan_ranks": 0, "loss_rank_avg": 0.10623191297054291, "step": 4075, "valid_targets_mean": 10693.3, "valid_targets_min": 2865 }, { "epoch": 3.91584, "grad_norm": 0.1879431423815426, "learning_rate": 5.47246613475436e-06, "loss": 0.3356, "loss_nan_ranks": 0, "loss_rank_avg": 0.12403889000415802, "step": 4080, "valid_targets_mean": 11291.2, "valid_targets_min": 1544 }, { "epoch": 3.92064, "grad_norm": 0.18364320485487998, "learning_rate": 5.4264993979027735e-06, "loss": 0.3292, "loss_nan_ranks": 0, "loss_rank_avg": 0.12664386630058289, "step": 4085, "valid_targets_mean": 12097.9, "valid_targets_min": 2029 }, { "epoch": 3.92544, "grad_norm": 0.19447101711983544, "learning_rate": 5.380696208120315e-06, "loss": 0.332, "loss_nan_ranks": 0, "loss_rank_avg": 0.10284821689128876, "step": 4090, "valid_targets_mean": 10145.8, "valid_targets_min": 1838 }, { "epoch": 3.93024, "grad_norm": 0.18444617156461748, "learning_rate": 5.335057079420571e-06, "loss": 0.3296, "loss_nan_ranks": 0, "loss_rank_avg": 0.10592512786388397, "step": 4095, "valid_targets_mean": 9922.3, "valid_targets_min": 2912 }, { "epoch": 3.93504, "grad_norm": 0.19573933070889935, "learning_rate": 5.289582523976015e-06, "loss": 0.3353, "loss_nan_ranks": 0, "loss_rank_avg": 0.09200359880924225, "step": 4100, "valid_targets_mean": 8765.0, "valid_targets_min": 3189 }, { "epoch": 3.9398400000000002, "grad_norm": 0.21184991033974448, "learning_rate": 5.244273052112241e-06, "loss": 0.3304, "loss_nan_ranks": 0, "loss_rank_avg": 0.11215705424547195, "step": 4105, "valid_targets_mean": 9907.4, "valid_targets_min": 1249 }, { "epoch": 3.94464, "grad_norm": 0.18565904600835953, "learning_rate": 5.199129172302224e-06, "loss": 0.3239, "loss_nan_ranks": 0, "loss_rank_avg": 0.10161211341619492, "step": 4110, "valid_targets_mean": 10105.3, "valid_targets_min": 2284 }, { "epoch": 3.94944, "grad_norm": 0.1772815671503692, "learning_rate": 5.154151391160638e-06, "loss": 0.333, "loss_nan_ranks": 0, "loss_rank_avg": 0.08798927068710327, "step": 4115, "valid_targets_mean": 9611.5, "valid_targets_min": 2646 }, { "epoch": 3.95424, "grad_norm": 0.19590311785568074, "learning_rate": 5.109340213438156e-06, "loss": 0.3329, "loss_nan_ranks": 0, "loss_rank_avg": 0.11088310182094574, "step": 4120, "valid_targets_mean": 10398.2, "valid_targets_min": 2528 }, { "epoch": 3.95904, "grad_norm": 0.18151207861605087, "learning_rate": 5.0646961420157995e-06, "loss": 0.3419, "loss_nan_ranks": 0, "loss_rank_avg": 0.11617287993431091, "step": 4125, "valid_targets_mean": 11599.7, "valid_targets_min": 2772 }, { "epoch": 3.9638400000000003, "grad_norm": 0.19116201774572908, "learning_rate": 5.020219677899276e-06, "loss": 0.3328, "loss_nan_ranks": 0, "loss_rank_avg": 0.10209350287914276, "step": 4130, "valid_targets_mean": 10222.2, "valid_targets_min": 2429 }, { "epoch": 3.9686399999999997, "grad_norm": 0.2024256331856205, "learning_rate": 4.975911320213365e-06, "loss": 0.3299, "loss_nan_ranks": 0, "loss_rank_avg": 0.08789606392383575, "step": 4135, "valid_targets_mean": 8624.2, "valid_targets_min": 1467 }, { "epoch": 3.97344, "grad_norm": 0.19195030700994084, "learning_rate": 4.931771566196332e-06, "loss": 0.3366, "loss_nan_ranks": 0, "loss_rank_avg": 0.10818715393543243, "step": 4140, "valid_targets_mean": 10638.1, "valid_targets_min": 2718 }, { "epoch": 3.97824, "grad_norm": 0.18238669600596105, "learning_rate": 4.887800911194327e-06, "loss": 0.3373, "loss_nan_ranks": 0, "loss_rank_avg": 0.1121128499507904, "step": 4145, "valid_targets_mean": 10199.2, "valid_targets_min": 1693 }, { "epoch": 3.98304, "grad_norm": 0.19665733186907425, "learning_rate": 4.8439998486558246e-06, "loss": 0.3322, "loss_nan_ranks": 0, "loss_rank_avg": 0.11327169835567474, "step": 4150, "valid_targets_mean": 10270.0, "valid_targets_min": 2069 }, { "epoch": 3.9878400000000003, "grad_norm": 0.20032239446085373, "learning_rate": 4.800368870126111e-06, "loss": 0.3392, "loss_nan_ranks": 0, "loss_rank_avg": 0.12412586808204651, "step": 4155, "valid_targets_mean": 9892.8, "valid_targets_min": 1814 }, { "epoch": 3.9926399999999997, "grad_norm": 0.20869919617855076, "learning_rate": 4.756908465241736e-06, "loss": 0.336, "loss_nan_ranks": 0, "loss_rank_avg": 0.12254258990287781, "step": 4160, "valid_targets_mean": 11407.7, "valid_targets_min": 2934 }, { "epoch": 3.99744, "grad_norm": 0.21961616056297487, "learning_rate": 4.713619121725039e-06, "loss": 0.3418, "loss_nan_ranks": 0, "loss_rank_avg": 0.11416822671890259, "step": 4165, "valid_targets_mean": 9896.4, "valid_targets_min": 2042 }, { "epoch": 4.00192, "grad_norm": 0.20465337196618452, "learning_rate": 4.670501325378682e-06, "loss": 0.3423, "loss_nan_ranks": 0, "loss_rank_avg": 0.09974993765354156, "step": 4170, "valid_targets_mean": 9093.5, "valid_targets_min": 2111 }, { "epoch": 4.00672, "grad_norm": 0.18822425307587917, "learning_rate": 4.627555560080173e-06, "loss": 0.3463, "loss_nan_ranks": 0, "loss_rank_avg": 0.11911550164222717, "step": 4175, "valid_targets_mean": 10731.2, "valid_targets_min": 2580 }, { "epoch": 4.01152, "grad_norm": 0.17412564908685052, "learning_rate": 4.5847823077764565e-06, "loss": 0.3483, "loss_nan_ranks": 0, "loss_rank_avg": 0.08448906242847443, "step": 4180, "valid_targets_mean": 8920.5, "valid_targets_min": 1525 }, { "epoch": 4.01632, "grad_norm": 0.20289618242630778, "learning_rate": 4.5421820484784936e-06, "loss": 0.341, "loss_nan_ranks": 0, "loss_rank_avg": 0.0968443751335144, "step": 4185, "valid_targets_mean": 9025.8, "valid_targets_min": 1431 }, { "epoch": 4.02112, "grad_norm": 0.18576117005555698, "learning_rate": 4.499755260255881e-06, "loss": 0.3408, "loss_nan_ranks": 0, "loss_rank_avg": 0.12763839960098267, "step": 4190, "valid_targets_mean": 10916.9, "valid_targets_min": 1377 }, { "epoch": 4.02592, "grad_norm": 0.19396303860305614, "learning_rate": 4.457502419231483e-06, "loss": 0.3499, "loss_nan_ranks": 0, "loss_rank_avg": 0.11627334356307983, "step": 4195, "valid_targets_mean": 10039.9, "valid_targets_min": 2095 }, { "epoch": 4.03072, "grad_norm": 0.17938812248691008, "learning_rate": 4.415423999576091e-06, "loss": 0.3549, "loss_nan_ranks": 0, "loss_rank_avg": 0.11132301390171051, "step": 4200, "valid_targets_mean": 9779.9, "valid_targets_min": 1798 }, { "epoch": 4.03552, "grad_norm": 0.19198874415999007, "learning_rate": 4.373520473503097e-06, "loss": 0.3452, "loss_nan_ranks": 0, "loss_rank_avg": 0.12028753757476807, "step": 4205, "valid_targets_mean": 10074.8, "valid_targets_min": 2026 }, { "epoch": 4.04032, "grad_norm": 0.19108626766525713, "learning_rate": 4.33179231126321e-06, "loss": 0.3394, "loss_nan_ranks": 0, "loss_rank_avg": 0.12190006673336029, "step": 4210, "valid_targets_mean": 10831.8, "valid_targets_min": 1403 }, { "epoch": 4.04512, "grad_norm": 0.17387555307348446, "learning_rate": 4.2902399811391575e-06, "loss": 0.3443, "loss_nan_ranks": 0, "loss_rank_avg": 0.11498603224754333, "step": 4215, "valid_targets_mean": 11074.9, "valid_targets_min": 3269 }, { "epoch": 4.04992, "grad_norm": 0.19072981281428716, "learning_rate": 4.248863949440436e-06, "loss": 0.3406, "loss_nan_ranks": 0, "loss_rank_avg": 0.1275830864906311, "step": 4220, "valid_targets_mean": 11321.0, "valid_targets_min": 2614 }, { "epoch": 4.05472, "grad_norm": 0.17614221224241058, "learning_rate": 4.207664680498094e-06, "loss": 0.3486, "loss_nan_ranks": 0, "loss_rank_avg": 0.10699561983346939, "step": 4225, "valid_targets_mean": 9597.5, "valid_targets_min": 1610 }, { "epoch": 4.05952, "grad_norm": 0.17640127607763398, "learning_rate": 4.166642636659495e-06, "loss": 0.3437, "loss_nan_ranks": 0, "loss_rank_avg": 0.12896181643009186, "step": 4230, "valid_targets_mean": 10785.8, "valid_targets_min": 2068 }, { "epoch": 4.06432, "grad_norm": 0.2190402246225578, "learning_rate": 4.125798278283155e-06, "loss": 0.3467, "loss_nan_ranks": 0, "loss_rank_avg": 0.12219704687595367, "step": 4235, "valid_targets_mean": 11353.1, "valid_targets_min": 1816 }, { "epoch": 4.06912, "grad_norm": 0.18092997420777618, "learning_rate": 4.085132063733554e-06, "loss": 0.3496, "loss_nan_ranks": 0, "loss_rank_avg": 0.11919304728507996, "step": 4240, "valid_targets_mean": 10082.1, "valid_targets_min": 2704 }, { "epoch": 4.07392, "grad_norm": 0.1823612174354958, "learning_rate": 4.0446444493760165e-06, "loss": 0.3487, "loss_nan_ranks": 0, "loss_rank_avg": 0.12384763360023499, "step": 4245, "valid_targets_mean": 10839.3, "valid_targets_min": 1936 }, { "epoch": 4.07872, "grad_norm": 0.20653639568032384, "learning_rate": 4.004335889571556e-06, "loss": 0.3514, "loss_nan_ranks": 0, "loss_rank_avg": 0.11276553571224213, "step": 4250, "valid_targets_mean": 10286.0, "valid_targets_min": 2725 }, { "epoch": 4.08352, "grad_norm": 0.24765300903341972, "learning_rate": 3.96420683667182e-06, "loss": 0.3497, "loss_nan_ranks": 0, "loss_rank_avg": 0.13264083862304688, "step": 4255, "valid_targets_mean": 10544.3, "valid_targets_min": 2485 }, { "epoch": 4.08832, "grad_norm": 0.1854786999415691, "learning_rate": 3.924257741013968e-06, "loss": 0.3472, "loss_nan_ranks": 0, "loss_rank_avg": 0.1216278001666069, "step": 4260, "valid_targets_mean": 11002.3, "valid_targets_min": 2382 }, { "epoch": 4.09312, "grad_norm": 0.1746636739434648, "learning_rate": 3.884489050915652e-06, "loss": 0.3457, "loss_nan_ranks": 0, "loss_rank_avg": 0.10394848883152008, "step": 4265, "valid_targets_mean": 9912.5, "valid_targets_min": 1695 }, { "epoch": 4.09792, "grad_norm": 0.19193550197987494, "learning_rate": 3.844901212669962e-06, "loss": 0.354, "loss_nan_ranks": 0, "loss_rank_avg": 0.10642480850219727, "step": 4270, "valid_targets_mean": 11185.8, "valid_targets_min": 1752 }, { "epoch": 4.10272, "grad_norm": 0.17195296130981225, "learning_rate": 3.8054946705404415e-06, "loss": 0.3454, "loss_nan_ranks": 0, "loss_rank_avg": 0.15103162825107574, "step": 4275, "valid_targets_mean": 13565.3, "valid_targets_min": 2685 }, { "epoch": 4.10752, "grad_norm": 0.18746276379642257, "learning_rate": 3.7662698667560714e-06, "loss": 0.3444, "loss_nan_ranks": 0, "loss_rank_avg": 0.1165471002459526, "step": 4280, "valid_targets_mean": 9233.0, "valid_targets_min": 3457 }, { "epoch": 4.11232, "grad_norm": 0.19394818833899224, "learning_rate": 3.7272272415063484e-06, "loss": 0.3406, "loss_nan_ranks": 0, "loss_rank_avg": 0.10333932936191559, "step": 4285, "valid_targets_mean": 10364.3, "valid_targets_min": 2115 }, { "epoch": 4.11712, "grad_norm": 0.19359491194847078, "learning_rate": 3.6883672329363007e-06, "loss": 0.343, "loss_nan_ranks": 0, "loss_rank_avg": 0.10657678544521332, "step": 4290, "valid_targets_mean": 8299.9, "valid_targets_min": 1375 }, { "epoch": 4.12192, "grad_norm": 0.1932798960704116, "learning_rate": 3.649690277141598e-06, "loss": 0.3469, "loss_nan_ranks": 0, "loss_rank_avg": 0.11276364326477051, "step": 4295, "valid_targets_mean": 8782.7, "valid_targets_min": 2273 }, { "epoch": 4.12672, "grad_norm": 0.19351234269362713, "learning_rate": 3.6111968081636507e-06, "loss": 0.3516, "loss_nan_ranks": 0, "loss_rank_avg": 0.10978444665670395, "step": 4300, "valid_targets_mean": 9584.4, "valid_targets_min": 1770 }, { "epoch": 4.13152, "grad_norm": 0.18945958380808156, "learning_rate": 3.572887257984743e-06, "loss": 0.3409, "loss_nan_ranks": 0, "loss_rank_avg": 0.10315452516078949, "step": 4305, "valid_targets_mean": 9444.8, "valid_targets_min": 2531 }, { "epoch": 4.1363199999999996, "grad_norm": 0.179621377461173, "learning_rate": 3.5347620565231733e-06, "loss": 0.3402, "loss_nan_ranks": 0, "loss_rank_avg": 0.10427289456129074, "step": 4310, "valid_targets_mean": 9924.7, "valid_targets_min": 2863 }, { "epoch": 4.14112, "grad_norm": 0.19555836606663374, "learning_rate": 3.496821631628442e-06, "loss": 0.337, "loss_nan_ranks": 0, "loss_rank_avg": 0.10842613875865936, "step": 4315, "valid_targets_mean": 10095.8, "valid_targets_min": 1958 }, { "epoch": 4.14592, "grad_norm": 0.19157171700505904, "learning_rate": 3.459066409076448e-06, "loss": 0.3552, "loss_nan_ranks": 0, "loss_rank_avg": 0.12181080877780914, "step": 4320, "valid_targets_mean": 10471.4, "valid_targets_min": 3460 }, { "epoch": 4.15072, "grad_norm": 0.18309997648220724, "learning_rate": 3.421496812564713e-06, "loss": 0.3536, "loss_nan_ranks": 0, "loss_rank_avg": 0.11011368781328201, "step": 4325, "valid_targets_mean": 10075.7, "valid_targets_min": 1911 }, { "epoch": 4.15552, "grad_norm": 0.1998393681086798, "learning_rate": 3.384113263707609e-06, "loss": 0.3387, "loss_nan_ranks": 0, "loss_rank_avg": 0.10688625276088715, "step": 4330, "valid_targets_mean": 10504.6, "valid_targets_min": 1870 }, { "epoch": 4.16032, "grad_norm": 0.18024162398203716, "learning_rate": 3.34691618203165e-06, "loss": 0.345, "loss_nan_ranks": 0, "loss_rank_avg": 0.11504953354597092, "step": 4335, "valid_targets_mean": 11245.9, "valid_targets_min": 1556 }, { "epoch": 4.16512, "grad_norm": 0.1937504451913351, "learning_rate": 3.309905984970765e-06, "loss": 0.3436, "loss_nan_ranks": 0, "loss_rank_avg": 0.12348227202892303, "step": 4340, "valid_targets_mean": 11246.7, "valid_targets_min": 1248 }, { "epoch": 4.16992, "grad_norm": 0.17943992287185476, "learning_rate": 3.2730830878616305e-06, "loss": 0.3484, "loss_nan_ranks": 0, "loss_rank_avg": 0.1096753403544426, "step": 4345, "valid_targets_mean": 9908.5, "valid_targets_min": 2863 }, { "epoch": 4.17472, "grad_norm": 0.20407149963617882, "learning_rate": 3.2364479039389973e-06, "loss": 0.3456, "loss_nan_ranks": 0, "loss_rank_avg": 0.1211603581905365, "step": 4350, "valid_targets_mean": 10384.3, "valid_targets_min": 2893 }, { "epoch": 4.17952, "grad_norm": 0.1758432680334536, "learning_rate": 3.2000008443310505e-06, "loss": 0.3444, "loss_nan_ranks": 0, "loss_rank_avg": 0.12273865193128586, "step": 4355, "valid_targets_mean": 11879.3, "valid_targets_min": 210 }, { "epoch": 4.18432, "grad_norm": 0.18831892864707575, "learning_rate": 3.1637423180548232e-06, "loss": 0.3482, "loss_nan_ranks": 0, "loss_rank_avg": 0.07836240530014038, "step": 4360, "valid_targets_mean": 6800.3, "valid_targets_min": 1637 }, { "epoch": 4.18912, "grad_norm": 0.1783636331291251, "learning_rate": 3.127672732011564e-06, "loss": 0.3531, "loss_nan_ranks": 0, "loss_rank_avg": 0.11790993809700012, "step": 4365, "valid_targets_mean": 11705.6, "valid_targets_min": 3960 }, { "epoch": 4.19392, "grad_norm": 0.1805010427405642, "learning_rate": 3.0917924909821993e-06, "loss": 0.3473, "loss_nan_ranks": 0, "loss_rank_avg": 0.13108694553375244, "step": 4370, "valid_targets_mean": 11730.7, "valid_targets_min": 1672 }, { "epoch": 4.19872, "grad_norm": 0.16950549661719758, "learning_rate": 3.0561019976227867e-06, "loss": 0.3353, "loss_nan_ranks": 0, "loss_rank_avg": 0.10931354761123657, "step": 4375, "valid_targets_mean": 11013.4, "valid_targets_min": 2257 }, { "epoch": 4.20352, "grad_norm": 0.171592888138618, "learning_rate": 3.020601652459989e-06, "loss": 0.3489, "loss_nan_ranks": 0, "loss_rank_avg": 0.095522940158844, "step": 4380, "valid_targets_mean": 9442.3, "valid_targets_min": 2247 }, { "epoch": 4.20832, "grad_norm": 0.2140466499221073, "learning_rate": 2.9852918538865847e-06, "loss": 0.3401, "loss_nan_ranks": 0, "loss_rank_avg": 0.09676612168550491, "step": 4385, "valid_targets_mean": 8869.3, "valid_targets_min": 2524 }, { "epoch": 4.21312, "grad_norm": 0.18684710732010837, "learning_rate": 2.950172998156995e-06, "loss": 0.3471, "loss_nan_ranks": 0, "loss_rank_avg": 0.11988385021686554, "step": 4390, "valid_targets_mean": 11438.3, "valid_targets_min": 2188 }, { "epoch": 4.21792, "grad_norm": 0.18184742236751114, "learning_rate": 2.91524547938284e-06, "loss": 0.339, "loss_nan_ranks": 0, "loss_rank_avg": 0.09970283508300781, "step": 4395, "valid_targets_mean": 9403.1, "valid_targets_min": 2697 }, { "epoch": 4.22272, "grad_norm": 0.2114210981320018, "learning_rate": 2.880509689528519e-06, "loss": 0.3379, "loss_nan_ranks": 0, "loss_rank_avg": 0.12056919932365417, "step": 4400, "valid_targets_mean": 10573.0, "valid_targets_min": 1906 }, { "epoch": 4.22752, "grad_norm": 0.18883655838403018, "learning_rate": 2.845966018406796e-06, "loss": 0.3422, "loss_nan_ranks": 0, "loss_rank_avg": 0.10442760586738586, "step": 4405, "valid_targets_mean": 9225.2, "valid_targets_min": 2768 }, { "epoch": 4.23232, "grad_norm": 0.17426172584380423, "learning_rate": 2.8116148536744448e-06, "loss": 0.346, "loss_nan_ranks": 0, "loss_rank_avg": 0.12738531827926636, "step": 4410, "valid_targets_mean": 11602.2, "valid_targets_min": 2304 }, { "epoch": 4.23712, "grad_norm": 0.18410375145788294, "learning_rate": 2.777456580827882e-06, "loss": 0.3439, "loss_nan_ranks": 0, "loss_rank_avg": 0.12198962271213531, "step": 4415, "valid_targets_mean": 11050.6, "valid_targets_min": 2639 }, { "epoch": 4.24192, "grad_norm": 0.18769558990904503, "learning_rate": 2.7434915831988517e-06, "loss": 0.3444, "loss_nan_ranks": 0, "loss_rank_avg": 0.11794613301753998, "step": 4420, "valid_targets_mean": 10889.8, "valid_targets_min": 1751 }, { "epoch": 4.24672, "grad_norm": 0.2338405926765633, "learning_rate": 2.7097202419501246e-06, "loss": 0.3488, "loss_nan_ranks": 0, "loss_rank_avg": 0.11257736384868622, "step": 4425, "valid_targets_mean": 9287.1, "valid_targets_min": 1177 }, { "epoch": 4.25152, "grad_norm": 0.17360265309040923, "learning_rate": 2.6761429360712045e-06, "loss": 0.343, "loss_nan_ranks": 0, "loss_rank_avg": 0.11555704474449158, "step": 4430, "valid_targets_mean": 10002.6, "valid_targets_min": 2074 }, { "epoch": 4.25632, "grad_norm": 0.17568574678772966, "learning_rate": 2.642760042374106e-06, "loss": 0.353, "loss_nan_ranks": 0, "loss_rank_avg": 0.1140856221318245, "step": 4435, "valid_targets_mean": 10473.9, "valid_targets_min": 993 }, { "epoch": 4.26112, "grad_norm": 0.17776634189725837, "learning_rate": 2.6095719354890903e-06, "loss": 0.3406, "loss_nan_ranks": 0, "loss_rank_avg": 0.11473214626312256, "step": 4440, "valid_targets_mean": 10775.9, "valid_targets_min": 3243 }, { "epoch": 4.26592, "grad_norm": 0.1786523752405562, "learning_rate": 2.5765789878604852e-06, "loss": 0.3424, "loss_nan_ranks": 0, "loss_rank_avg": 0.11675288528203964, "step": 4445, "valid_targets_mean": 11546.2, "valid_targets_min": 2326 }, { "epoch": 4.27072, "grad_norm": 0.18468001890763955, "learning_rate": 2.543781569742496e-06, "loss": 0.3322, "loss_nan_ranks": 0, "loss_rank_avg": 0.11585703492164612, "step": 4450, "valid_targets_mean": 10161.7, "valid_targets_min": 2874 }, { "epoch": 4.27552, "grad_norm": 0.16761680409745108, "learning_rate": 2.5111800491950523e-06, "loss": 0.3453, "loss_nan_ranks": 0, "loss_rank_avg": 0.09747034311294556, "step": 4455, "valid_targets_mean": 10170.5, "valid_targets_min": 2789 }, { "epoch": 4.28032, "grad_norm": 0.17728096040510224, "learning_rate": 2.4787747920796723e-06, "loss": 0.3427, "loss_nan_ranks": 0, "loss_rank_avg": 0.1128934770822525, "step": 4460, "valid_targets_mean": 9173.6, "valid_targets_min": 2190 }, { "epoch": 4.28512, "grad_norm": 0.20554125763942052, "learning_rate": 2.446566162055377e-06, "loss": 0.3399, "loss_nan_ranks": 0, "loss_rank_avg": 0.10944950580596924, "step": 4465, "valid_targets_mean": 10507.8, "valid_targets_min": 1729 }, { "epoch": 4.28992, "grad_norm": 0.1758382654598812, "learning_rate": 2.414554520574579e-06, "loss": 0.3433, "loss_nan_ranks": 0, "loss_rank_avg": 0.10320094227790833, "step": 4470, "valid_targets_mean": 10201.0, "valid_targets_min": 3485 }, { "epoch": 4.29472, "grad_norm": 0.17816869342253958, "learning_rate": 2.382740226879052e-06, "loss": 0.3502, "loss_nan_ranks": 0, "loss_rank_avg": 0.10201025754213333, "step": 4475, "valid_targets_mean": 9838.3, "valid_targets_min": 1592 }, { "epoch": 4.29952, "grad_norm": 0.18182023122642407, "learning_rate": 2.3511236379958824e-06, "loss": 0.356, "loss_nan_ranks": 0, "loss_rank_avg": 0.13841117918491364, "step": 4480, "valid_targets_mean": 11641.9, "valid_targets_min": 1969 }, { "epoch": 4.30432, "grad_norm": 0.18550688293565978, "learning_rate": 2.31970510873347e-06, "loss": 0.3447, "loss_nan_ranks": 0, "loss_rank_avg": 0.1117786392569542, "step": 4485, "valid_targets_mean": 9739.4, "valid_targets_min": 3570 }, { "epoch": 4.30912, "grad_norm": 0.1928516912071047, "learning_rate": 2.2884849916775485e-06, "loss": 0.3405, "loss_nan_ranks": 0, "loss_rank_avg": 0.10244566947221756, "step": 4490, "valid_targets_mean": 10692.5, "valid_targets_min": 3162 }, { "epoch": 4.3139199999999995, "grad_norm": 0.16862425883484716, "learning_rate": 2.257463637187225e-06, "loss": 0.3353, "loss_nan_ranks": 0, "loss_rank_avg": 0.11895417422056198, "step": 4495, "valid_targets_mean": 12142.8, "valid_targets_min": 1920 }, { "epoch": 4.31872, "grad_norm": 0.18427884441538028, "learning_rate": 2.2266413933910426e-06, "loss": 0.3379, "loss_nan_ranks": 0, "loss_rank_avg": 0.09559936076402664, "step": 4500, "valid_targets_mean": 8994.3, "valid_targets_min": 1878 }, { "epoch": 4.32352, "grad_norm": 0.18394017197686685, "learning_rate": 2.196018606183088e-06, "loss": 0.3418, "loss_nan_ranks": 0, "loss_rank_avg": 0.11445660144090652, "step": 4505, "valid_targets_mean": 10953.6, "valid_targets_min": 4550 }, { "epoch": 4.32832, "grad_norm": 0.18355428048580366, "learning_rate": 2.1655956192191007e-06, "loss": 0.3462, "loss_nan_ranks": 0, "loss_rank_avg": 0.12067331373691559, "step": 4510, "valid_targets_mean": 10323.3, "valid_targets_min": 1860 }, { "epoch": 4.33312, "grad_norm": 0.1761313915534513, "learning_rate": 2.135372773912614e-06, "loss": 0.341, "loss_nan_ranks": 0, "loss_rank_avg": 0.11238518357276917, "step": 4515, "valid_targets_mean": 11524.8, "valid_targets_min": 1482 }, { "epoch": 4.33792, "grad_norm": 0.18470830979727362, "learning_rate": 2.1053504094311285e-06, "loss": 0.3376, "loss_nan_ranks": 0, "loss_rank_avg": 0.10500926524400711, "step": 4520, "valid_targets_mean": 9474.5, "valid_targets_min": 1961 }, { "epoch": 4.34272, "grad_norm": 0.18970881351612737, "learning_rate": 2.0755288626923022e-06, "loss": 0.3437, "loss_nan_ranks": 0, "loss_rank_avg": 0.12795764207839966, "step": 4525, "valid_targets_mean": 11386.8, "valid_targets_min": 2975 }, { "epoch": 4.34752, "grad_norm": 0.1770264238485995, "learning_rate": 2.0459084683601736e-06, "loss": 0.335, "loss_nan_ranks": 0, "loss_rank_avg": 0.11818675696849823, "step": 4530, "valid_targets_mean": 10696.7, "valid_targets_min": 464 }, { "epoch": 4.35232, "grad_norm": 0.1739206041365824, "learning_rate": 2.0164895588414037e-06, "loss": 0.3453, "loss_nan_ranks": 0, "loss_rank_avg": 0.10573488473892212, "step": 4535, "valid_targets_mean": 10361.7, "valid_targets_min": 1279 }, { "epoch": 4.35712, "grad_norm": 0.18709941006713426, "learning_rate": 1.987272464281551e-06, "loss": 0.3469, "loss_nan_ranks": 0, "loss_rank_avg": 0.11464584618806839, "step": 4540, "valid_targets_mean": 10028.0, "valid_targets_min": 1617 }, { "epoch": 4.36192, "grad_norm": 0.1875055355309111, "learning_rate": 1.95825751256135e-06, "loss": 0.348, "loss_nan_ranks": 0, "loss_rank_avg": 0.1142655611038208, "step": 4545, "valid_targets_mean": 11262.9, "valid_targets_min": 663 }, { "epoch": 4.36672, "grad_norm": 0.17711939064351098, "learning_rate": 1.9294450292930576e-06, "loss": 0.3373, "loss_nan_ranks": 0, "loss_rank_avg": 0.1202390268445015, "step": 4550, "valid_targets_mean": 10644.8, "valid_targets_min": 1748 }, { "epoch": 4.37152, "grad_norm": 0.16979213105299187, "learning_rate": 1.9008353378167755e-06, "loss": 0.3391, "loss_nan_ranks": 0, "loss_rank_avg": 0.09257425367832184, "step": 4555, "valid_targets_mean": 9115.6, "valid_targets_min": 1620 }, { "epoch": 4.37632, "grad_norm": 0.1782408703909472, "learning_rate": 1.8724287591968294e-06, "loss": 0.3465, "loss_nan_ranks": 0, "loss_rank_avg": 0.12132684886455536, "step": 4560, "valid_targets_mean": 9446.9, "valid_targets_min": 1860 }, { "epoch": 4.38112, "grad_norm": 0.17449121941176965, "learning_rate": 1.8442256122181735e-06, "loss": 0.3399, "loss_nan_ranks": 0, "loss_rank_avg": 0.10900422930717468, "step": 4565, "valid_targets_mean": 10929.7, "valid_targets_min": 2945 }, { "epoch": 4.38592, "grad_norm": 0.1737945902259658, "learning_rate": 1.8162262133828013e-06, "loss": 0.3427, "loss_nan_ranks": 0, "loss_rank_avg": 0.08825558423995972, "step": 4570, "valid_targets_mean": 8506.4, "valid_targets_min": 1854 }, { "epoch": 4.39072, "grad_norm": 0.16676669408587796, "learning_rate": 1.7884308769061974e-06, "loss": 0.3375, "loss_nan_ranks": 0, "loss_rank_avg": 0.09462806582450867, "step": 4575, "valid_targets_mean": 9547.1, "valid_targets_min": 2747 }, { "epoch": 4.39552, "grad_norm": 0.16189552847802557, "learning_rate": 1.7608399147138278e-06, "loss": 0.3396, "loss_nan_ranks": 0, "loss_rank_avg": 0.1256551742553711, "step": 4580, "valid_targets_mean": 11958.6, "valid_targets_min": 2896 }, { "epoch": 4.40032, "grad_norm": 0.17469772786856827, "learning_rate": 1.7334536364376075e-06, "loss": 0.352, "loss_nan_ranks": 0, "loss_rank_avg": 0.10779605805873871, "step": 4585, "valid_targets_mean": 10866.5, "valid_targets_min": 2471 }, { "epoch": 4.40512, "grad_norm": 0.1811986214517229, "learning_rate": 1.7062723494124545e-06, "loss": 0.3413, "loss_nan_ranks": 0, "loss_rank_avg": 0.10402344167232513, "step": 4590, "valid_targets_mean": 9006.3, "valid_targets_min": 1845 }, { "epoch": 4.40992, "grad_norm": 0.16980388534020766, "learning_rate": 1.6792963586728195e-06, "loss": 0.3355, "loss_nan_ranks": 0, "loss_rank_avg": 0.0950300395488739, "step": 4595, "valid_targets_mean": 9814.0, "valid_targets_min": 1630 }, { "epoch": 4.41472, "grad_norm": 0.16301035387109108, "learning_rate": 1.6525259669492832e-06, "loss": 0.342, "loss_nan_ranks": 0, "loss_rank_avg": 0.11410839855670929, "step": 4600, "valid_targets_mean": 10504.8, "valid_targets_min": 2394 }, { "epoch": 4.41952, "grad_norm": 0.16745675250061537, "learning_rate": 1.6259614746651364e-06, "loss": 0.344, "loss_nan_ranks": 0, "loss_rank_avg": 0.09161694347858429, "step": 4605, "valid_targets_mean": 9358.8, "valid_targets_min": 1206 }, { "epoch": 4.42432, "grad_norm": 0.17079049191662332, "learning_rate": 1.5996031799330315e-06, "loss": 0.3465, "loss_nan_ranks": 0, "loss_rank_avg": 0.11210022866725922, "step": 4610, "valid_targets_mean": 10135.9, "valid_targets_min": 1119 }, { "epoch": 4.42912, "grad_norm": 0.18208336880669124, "learning_rate": 1.5734513785516227e-06, "loss": 0.3421, "loss_nan_ranks": 0, "loss_rank_avg": 0.13680927455425262, "step": 4615, "valid_targets_mean": 10683.7, "valid_targets_min": 661 }, { "epoch": 4.43392, "grad_norm": 0.17456794356981462, "learning_rate": 1.5475063640022425e-06, "loss": 0.3461, "loss_nan_ranks": 0, "loss_rank_avg": 0.1233920305967331, "step": 4620, "valid_targets_mean": 11128.3, "valid_targets_min": 2410 }, { "epoch": 4.43872, "grad_norm": 0.16623507798468853, "learning_rate": 1.5217684274456314e-06, "loss": 0.3442, "loss_nan_ranks": 0, "loss_rank_avg": 0.1353224217891693, "step": 4625, "valid_targets_mean": 11848.9, "valid_targets_min": 4052 }, { "epoch": 4.44352, "grad_norm": 0.16759933941207006, "learning_rate": 1.496237857718641e-06, "loss": 0.3396, "loss_nan_ranks": 0, "loss_rank_avg": 0.1048666313290596, "step": 4630, "valid_targets_mean": 9752.1, "valid_targets_min": 1334 }, { "epoch": 4.44832, "grad_norm": 0.1731976789468967, "learning_rate": 1.4709149413310076e-06, "loss": 0.3418, "loss_nan_ranks": 0, "loss_rank_avg": 0.10677183419466019, "step": 4635, "valid_targets_mean": 10148.2, "valid_targets_min": 1431 }, { "epoch": 4.45312, "grad_norm": 0.17632086604566713, "learning_rate": 1.445799962462142e-06, "loss": 0.3422, "loss_nan_ranks": 0, "loss_rank_avg": 0.1264108419418335, "step": 4640, "valid_targets_mean": 11090.9, "valid_targets_min": 2144 }, { "epoch": 4.45792, "grad_norm": 0.2015434537773057, "learning_rate": 1.420893202957927e-06, "loss": 0.3393, "loss_nan_ranks": 0, "loss_rank_avg": 0.12211460620164871, "step": 4645, "valid_targets_mean": 10521.4, "valid_targets_min": 1339 }, { "epoch": 4.46272, "grad_norm": 0.19766730718798986, "learning_rate": 1.3961949423275622e-06, "loss": 0.3438, "loss_nan_ranks": 0, "loss_rank_avg": 0.10595884174108505, "step": 4650, "valid_targets_mean": 10818.3, "valid_targets_min": 1780 }, { "epoch": 4.46752, "grad_norm": 0.16173720804735958, "learning_rate": 1.3717054577404331e-06, "loss": 0.3405, "loss_nan_ranks": 0, "loss_rank_avg": 0.11681263148784637, "step": 4655, "valid_targets_mean": 10793.5, "valid_targets_min": 1843 }, { "epoch": 4.47232, "grad_norm": 0.16770635422754943, "learning_rate": 1.347425024022988e-06, "loss": 0.3401, "loss_nan_ranks": 0, "loss_rank_avg": 0.11594116687774658, "step": 4660, "valid_targets_mean": 10751.7, "valid_targets_min": 1547 }, { "epoch": 4.47712, "grad_norm": 0.1653276152734862, "learning_rate": 1.3233539136556606e-06, "loss": 0.3512, "loss_nan_ranks": 0, "loss_rank_avg": 0.11187846958637238, "step": 4665, "valid_targets_mean": 10446.6, "valid_targets_min": 273 }, { "epoch": 4.48192, "grad_norm": 0.16370885544823352, "learning_rate": 1.2994923967698125e-06, "loss": 0.3421, "loss_nan_ranks": 0, "loss_rank_avg": 0.11684323102235794, "step": 4670, "valid_targets_mean": 12331.6, "valid_targets_min": 1289 }, { "epoch": 4.48672, "grad_norm": 0.16981609122208036, "learning_rate": 1.2758407411446982e-06, "loss": 0.3383, "loss_nan_ranks": 0, "loss_rank_avg": 0.11591038107872009, "step": 4675, "valid_targets_mean": 11103.5, "valid_targets_min": 2529 }, { "epoch": 4.49152, "grad_norm": 0.17284755314757133, "learning_rate": 1.252399212204467e-06, "loss": 0.347, "loss_nan_ranks": 0, "loss_rank_avg": 0.13455729186534882, "step": 4680, "valid_targets_mean": 11908.0, "valid_targets_min": 2585 }, { "epoch": 4.49632, "grad_norm": 0.18136262437177075, "learning_rate": 1.22916807301517e-06, "loss": 0.3445, "loss_nan_ranks": 0, "loss_rank_avg": 0.12223325669765472, "step": 4685, "valid_targets_mean": 12023.1, "valid_targets_min": 641 }, { "epoch": 4.50112, "grad_norm": 0.18252354714474517, "learning_rate": 1.2061475842818337e-06, "loss": 0.3485, "loss_nan_ranks": 0, "loss_rank_avg": 0.10622070729732513, "step": 4690, "valid_targets_mean": 8431.8, "valid_targets_min": 1989 }, { "epoch": 4.50592, "grad_norm": 0.18226766259332344, "learning_rate": 1.1833380043455e-06, "loss": 0.3398, "loss_nan_ranks": 0, "loss_rank_avg": 0.11837948113679886, "step": 4695, "valid_targets_mean": 11590.0, "valid_targets_min": 2921 }, { "epoch": 4.51072, "grad_norm": 0.17228749691379655, "learning_rate": 1.1607395891803641e-06, "loss": 0.3399, "loss_nan_ranks": 0, "loss_rank_avg": 0.1034156084060669, "step": 4700, "valid_targets_mean": 8960.0, "valid_targets_min": 798 }, { "epoch": 4.51552, "grad_norm": 0.1674133892638723, "learning_rate": 1.1383525923908678e-06, "loss": 0.3418, "loss_nan_ranks": 0, "loss_rank_avg": 0.1247507631778717, "step": 4705, "valid_targets_mean": 12181.7, "valid_targets_min": 2280 }, { "epoch": 4.52032, "grad_norm": 0.17529666189411555, "learning_rate": 1.1161772652088775e-06, "loss": 0.3546, "loss_nan_ranks": 0, "loss_rank_avg": 0.13458766043186188, "step": 4710, "valid_targets_mean": 12041.3, "valid_targets_min": 1864 }, { "epoch": 4.52512, "grad_norm": 0.17111281681111487, "learning_rate": 1.094213856490849e-06, "loss": 0.3408, "loss_nan_ranks": 0, "loss_rank_avg": 0.10330748558044434, "step": 4715, "valid_targets_mean": 10015.7, "valid_targets_min": 1452 }, { "epoch": 4.52992, "grad_norm": 0.2005388972740762, "learning_rate": 1.0724626127150462e-06, "loss": 0.3433, "loss_nan_ranks": 0, "loss_rank_avg": 0.08862671256065369, "step": 4720, "valid_targets_mean": 8354.8, "valid_targets_min": 3056 }, { "epoch": 4.53472, "grad_norm": 0.17715957408643013, "learning_rate": 1.0509237779787717e-06, "loss": 0.3384, "loss_nan_ranks": 0, "loss_rank_avg": 0.11850816756486893, "step": 4725, "valid_targets_mean": 10371.2, "valid_targets_min": 2187 }, { "epoch": 4.5395199999999996, "grad_norm": 0.17960490638825066, "learning_rate": 1.029597593995626e-06, "loss": 0.3427, "loss_nan_ranks": 0, "loss_rank_avg": 0.08903937041759491, "step": 4730, "valid_targets_mean": 8203.3, "valid_targets_min": 2693 }, { "epoch": 4.54432, "grad_norm": 0.17401873267818355, "learning_rate": 1.008484300092798e-06, "loss": 0.3456, "loss_nan_ranks": 0, "loss_rank_avg": 0.10742789506912231, "step": 4735, "valid_targets_mean": 10027.1, "valid_targets_min": 1839 }, { "epoch": 4.54912, "grad_norm": 0.17464251590964316, "learning_rate": 9.87584133208368e-07, "loss": 0.344, "loss_nan_ranks": 0, "loss_rank_avg": 0.11865642666816711, "step": 4740, "valid_targets_mean": 10533.8, "valid_targets_min": 1782 }, { "epoch": 4.55392, "grad_norm": 0.17735860025401656, "learning_rate": 9.66897327888665e-07, "loss": 0.3431, "loss_nan_ranks": 0, "loss_rank_avg": 0.08903376758098602, "step": 4745, "valid_targets_mean": 7992.7, "valid_targets_min": 1978 }, { "epoch": 4.55872, "grad_norm": 0.1746267689098251, "learning_rate": 9.464241162856269e-07, "loss": 0.3391, "loss_nan_ranks": 0, "loss_rank_avg": 0.11897937208414078, "step": 4750, "valid_targets_mean": 9702.0, "valid_targets_min": 1915 }, { "epoch": 4.5635200000000005, "grad_norm": 0.198861765601018, "learning_rate": 9.261647281541908e-07, "loss": 0.3466, "loss_nan_ranks": 0, "loss_rank_avg": 0.09576556831598282, "step": 4755, "valid_targets_mean": 9174.2, "valid_targets_min": 1621 }, { "epoch": 4.56832, "grad_norm": 0.18337917468789947, "learning_rate": 9.061193908497201e-07, "loss": 0.341, "loss_nan_ranks": 0, "loss_rank_avg": 0.10396026074886322, "step": 4760, "valid_targets_mean": 9406.8, "valid_targets_min": 1230 }, { "epoch": 4.57312, "grad_norm": 0.1808441935327845, "learning_rate": 8.862883293254598e-07, "loss": 0.347, "loss_nan_ranks": 0, "loss_rank_avg": 0.12486404925584793, "step": 4765, "valid_targets_mean": 10789.8, "valid_targets_min": 1360 }, { "epoch": 4.57792, "grad_norm": 0.16657100940314107, "learning_rate": 8.666717661299917e-07, "loss": 0.3419, "loss_nan_ranks": 0, "loss_rank_avg": 0.10040232539176941, "step": 4770, "valid_targets_mean": 9042.8, "valid_targets_min": 1681 }, { "epoch": 4.58272, "grad_norm": 0.1689035714259787, "learning_rate": 8.472699214047652e-07, "loss": 0.3372, "loss_nan_ranks": 0, "loss_rank_avg": 0.10922395437955856, "step": 4775, "valid_targets_mean": 10596.6, "valid_targets_min": 3097 }, { "epoch": 4.58752, "grad_norm": 0.1826428218690589, "learning_rate": 8.280830128815953e-07, "loss": 0.3526, "loss_nan_ranks": 0, "loss_rank_avg": 0.1335485279560089, "step": 4780, "valid_targets_mean": 10975.2, "valid_targets_min": 2341 }, { "epoch": 4.59232, "grad_norm": 0.17116832164377946, "learning_rate": 8.09111255880246e-07, "loss": 0.3437, "loss_nan_ranks": 0, "loss_rank_avg": 0.11295709758996964, "step": 4785, "valid_targets_mean": 10168.0, "valid_targets_min": 2184 }, { "epoch": 4.59712, "grad_norm": 0.17427051060924245, "learning_rate": 7.903548633059955e-07, "loss": 0.3511, "loss_nan_ranks": 0, "loss_rank_avg": 0.12648193538188934, "step": 4790, "valid_targets_mean": 12529.5, "valid_targets_min": 2135 }, { "epoch": 4.60192, "grad_norm": 0.17846209627157872, "learning_rate": 7.718140456472612e-07, "loss": 0.3404, "loss_nan_ranks": 0, "loss_rank_avg": 0.12587639689445496, "step": 4795, "valid_targets_mean": 12501.2, "valid_targets_min": 4045 }, { "epoch": 4.60672, "grad_norm": 0.20330776478305493, "learning_rate": 7.534890109732229e-07, "loss": 0.3438, "loss_nan_ranks": 0, "loss_rank_avg": 0.12395921349525452, "step": 4800, "valid_targets_mean": 10552.5, "valid_targets_min": 2740 }, { "epoch": 4.61152, "grad_norm": 0.2195640643749424, "learning_rate": 7.353799649315085e-07, "loss": 0.3173, "loss_nan_ranks": 0, "loss_rank_avg": 0.10619883239269257, "step": 4805, "valid_targets_mean": 9509.2, "valid_targets_min": 2083 }, { "epoch": 4.61632, "grad_norm": 0.1969968854393267, "learning_rate": 7.174871107458603e-07, "loss": 0.3176, "loss_nan_ranks": 0, "loss_rank_avg": 0.06790103018283844, "step": 4810, "valid_targets_mean": 7099.1, "valid_targets_min": 2387 }, { "epoch": 4.62112, "grad_norm": 0.17970023876518615, "learning_rate": 6.998106492138724e-07, "loss": 0.3184, "loss_nan_ranks": 0, "loss_rank_avg": 0.08052967488765717, "step": 4815, "valid_targets_mean": 8661.2, "valid_targets_min": 1760 }, { "epoch": 4.62592, "grad_norm": 0.2643732118194215, "learning_rate": 6.823507787047346e-07, "loss": 0.3278, "loss_nan_ranks": 0, "loss_rank_avg": 0.11436612904071808, "step": 4820, "valid_targets_mean": 10493.6, "valid_targets_min": 2318 }, { "epoch": 4.63072, "grad_norm": 0.18775742452444713, "learning_rate": 6.65107695156999e-07, "loss": 0.3327, "loss_nan_ranks": 0, "loss_rank_avg": 0.0929485410451889, "step": 4825, "valid_targets_mean": 9043.9, "valid_targets_min": 198 }, { "epoch": 4.63552, "grad_norm": 0.17230531701786073, "learning_rate": 6.480815920763905e-07, "loss": 0.329, "loss_nan_ranks": 0, "loss_rank_avg": 0.11901643872261047, "step": 4830, "valid_targets_mean": 11895.4, "valid_targets_min": 2087 }, { "epoch": 4.64032, "grad_norm": 0.1867088568173494, "learning_rate": 6.312726605336306e-07, "loss": 0.3268, "loss_nan_ranks": 0, "loss_rank_avg": 0.10454428941011429, "step": 4835, "valid_targets_mean": 10254.8, "valid_targets_min": 787 }, { "epoch": 4.64512, "grad_norm": 0.16712749995514461, "learning_rate": 6.146810891622923e-07, "loss": 0.3253, "loss_nan_ranks": 0, "loss_rank_avg": 0.11394192278385162, "step": 4840, "valid_targets_mean": 12640.7, "valid_targets_min": 2962 }, { "epoch": 4.64992, "grad_norm": 0.19618712934379526, "learning_rate": 5.983070641566802e-07, "loss": 0.3262, "loss_nan_ranks": 0, "loss_rank_avg": 0.11127905547618866, "step": 4845, "valid_targets_mean": 10063.4, "valid_targets_min": 2380 }, { "epoch": 4.65472, "grad_norm": 0.16924869165042286, "learning_rate": 5.821507692697537e-07, "loss": 0.3258, "loss_nan_ranks": 0, "loss_rank_avg": 0.11467337608337402, "step": 4850, "valid_targets_mean": 11078.0, "valid_targets_min": 2362 }, { "epoch": 4.65952, "grad_norm": 0.1876290335332049, "learning_rate": 5.662123858110513e-07, "loss": 0.3264, "loss_nan_ranks": 0, "loss_rank_avg": 0.10478425770998001, "step": 4855, "valid_targets_mean": 9512.6, "valid_targets_min": 1837 }, { "epoch": 4.66432, "grad_norm": 0.1766138454915962, "learning_rate": 5.504920926446611e-07, "loss": 0.3296, "loss_nan_ranks": 0, "loss_rank_avg": 0.10728782415390015, "step": 4860, "valid_targets_mean": 9908.5, "valid_targets_min": 1208 }, { "epoch": 4.66912, "grad_norm": 0.2026546604505345, "learning_rate": 5.349900661872132e-07, "loss": 0.3193, "loss_nan_ranks": 0, "loss_rank_avg": 0.10532692074775696, "step": 4865, "valid_targets_mean": 9793.9, "valid_targets_min": 2861 }, { "epoch": 4.67392, "grad_norm": 0.17334646571349133, "learning_rate": 5.197064804058971e-07, "loss": 0.3354, "loss_nan_ranks": 0, "loss_rank_avg": 0.13173431158065796, "step": 4870, "valid_targets_mean": 12489.1, "valid_targets_min": 2679 }, { "epoch": 4.67872, "grad_norm": 0.18757067240596395, "learning_rate": 5.046415068165234e-07, "loss": 0.3272, "loss_nan_ranks": 0, "loss_rank_avg": 0.10075395554304123, "step": 4875, "valid_targets_mean": 9802.2, "valid_targets_min": 485 }, { "epoch": 4.68352, "grad_norm": 0.177281674085286, "learning_rate": 4.897953144815759e-07, "loss": 0.3213, "loss_nan_ranks": 0, "loss_rank_avg": 0.10982857644557953, "step": 4880, "valid_targets_mean": 11444.7, "valid_targets_min": 1799 }, { "epoch": 4.68832, "grad_norm": 0.1934502627098448, "learning_rate": 4.7516807000833165e-07, "loss": 0.3151, "loss_nan_ranks": 0, "loss_rank_avg": 0.12236753851175308, "step": 4885, "valid_targets_mean": 10206.5, "valid_targets_min": 1389 }, { "epoch": 4.69312, "grad_norm": 0.18487124008481706, "learning_rate": 4.6075993754698623e-07, "loss": 0.324, "loss_nan_ranks": 0, "loss_rank_avg": 0.11507151275873184, "step": 4890, "valid_targets_mean": 10522.4, "valid_targets_min": 582 }, { "epoch": 4.69792, "grad_norm": 0.17836285144449607, "learning_rate": 4.4657107878881113e-07, "loss": 0.3182, "loss_nan_ranks": 0, "loss_rank_avg": 0.10496693849563599, "step": 4895, "valid_targets_mean": 11460.4, "valid_targets_min": 2740 }, { "epoch": 4.70272, "grad_norm": 0.17167486779210717, "learning_rate": 4.326016529643351e-07, "loss": 0.3231, "loss_nan_ranks": 0, "loss_rank_avg": 0.11415878683328629, "step": 4900, "valid_targets_mean": 10817.6, "valid_targets_min": 2485 }, { "epoch": 4.70752, "grad_norm": 0.1964776797540304, "learning_rate": 4.1885181684157005e-07, "loss": 0.3199, "loss_nan_ranks": 0, "loss_rank_avg": 0.10461924225091934, "step": 4905, "valid_targets_mean": 8784.8, "valid_targets_min": 282 }, { "epoch": 4.71232, "grad_norm": 0.17362601714443157, "learning_rate": 4.053217247242369e-07, "loss": 0.3238, "loss_nan_ranks": 0, "loss_rank_avg": 0.10980254411697388, "step": 4910, "valid_targets_mean": 11650.2, "valid_targets_min": 2463 }, { "epoch": 4.7171199999999995, "grad_norm": 0.17887761398779373, "learning_rate": 3.9201152845004476e-07, "loss": 0.3233, "loss_nan_ranks": 0, "loss_rank_avg": 0.12469217926263809, "step": 4915, "valid_targets_mean": 10989.0, "valid_targets_min": 2740 }, { "epoch": 4.72192, "grad_norm": 0.16738018734424778, "learning_rate": 3.789213773889744e-07, "loss": 0.3247, "loss_nan_ranks": 0, "loss_rank_avg": 0.13059523701667786, "step": 4920, "valid_targets_mean": 13034.5, "valid_targets_min": 2818 }, { "epoch": 4.72672, "grad_norm": 0.20767029106159066, "learning_rate": 3.6605141844162417e-07, "loss": 0.3255, "loss_nan_ranks": 0, "loss_rank_avg": 0.08879049867391586, "step": 4925, "valid_targets_mean": 8753.4, "valid_targets_min": 1851 }, { "epoch": 4.73152, "grad_norm": 0.1712477054459363, "learning_rate": 3.5340179603753354e-07, "loss": 0.3192, "loss_nan_ranks": 0, "loss_rank_avg": 0.10303573310375214, "step": 4930, "valid_targets_mean": 10877.0, "valid_targets_min": 2178 }, { "epoch": 4.73632, "grad_norm": 0.16736585429671713, "learning_rate": 3.4097265213358435e-07, "loss": 0.3238, "loss_nan_ranks": 0, "loss_rank_avg": 0.09548261761665344, "step": 4935, "valid_targets_mean": 9767.3, "valid_targets_min": 1734 }, { "epoch": 4.7411200000000004, "grad_norm": 0.17681548589034818, "learning_rate": 3.287641262123975e-07, "loss": 0.3283, "loss_nan_ranks": 0, "loss_rank_avg": 0.11017492413520813, "step": 4940, "valid_targets_mean": 11359.5, "valid_targets_min": 2218 }, { "epoch": 4.74592, "grad_norm": 0.17919361359580346, "learning_rate": 3.1677635528076566e-07, "loss": 0.3215, "loss_nan_ranks": 0, "loss_rank_avg": 0.09803116321563721, "step": 4945, "valid_targets_mean": 10205.0, "valid_targets_min": 1498 }, { "epoch": 4.75072, "grad_norm": 0.19010332335370647, "learning_rate": 3.0500947386812973e-07, "loss": 0.3186, "loss_nan_ranks": 0, "loss_rank_avg": 0.10954975336790085, "step": 4950, "valid_targets_mean": 10306.6, "valid_targets_min": 3022 }, { "epoch": 4.75552, "grad_norm": 0.1828282852986503, "learning_rate": 2.934636140250513e-07, "loss": 0.3273, "loss_nan_ranks": 0, "loss_rank_avg": 0.12371116876602173, "step": 4955, "valid_targets_mean": 11596.5, "valid_targets_min": 2277 }, { "epoch": 4.76032, "grad_norm": 0.17838738493258707, "learning_rate": 2.821389053217383e-07, "loss": 0.3355, "loss_nan_ranks": 0, "loss_rank_avg": 0.11714506149291992, "step": 4960, "valid_targets_mean": 10788.5, "valid_targets_min": 2539 }, { "epoch": 4.76512, "grad_norm": 0.1870925307726946, "learning_rate": 2.710354748465949e-07, "loss": 0.3217, "loss_nan_ranks": 0, "loss_rank_avg": 0.0950358510017395, "step": 4965, "valid_targets_mean": 10334.6, "valid_targets_min": 2003 }, { "epoch": 4.76992, "grad_norm": 0.1693238168125335, "learning_rate": 2.6015344720479395e-07, "loss": 0.3245, "loss_nan_ranks": 0, "loss_rank_avg": 0.11703760176897049, "step": 4970, "valid_targets_mean": 11903.3, "valid_targets_min": 1790 }, { "epoch": 4.77472, "grad_norm": 0.20693809617550638, "learning_rate": 2.49492944516867e-07, "loss": 0.3144, "loss_nan_ranks": 0, "loss_rank_avg": 0.14453014731407166, "step": 4975, "valid_targets_mean": 13146.5, "valid_targets_min": 1755 }, { "epoch": 4.77952, "grad_norm": 0.17184835822806188, "learning_rate": 2.3905408641735183e-07, "loss": 0.3195, "loss_nan_ranks": 0, "loss_rank_avg": 0.10461593419313431, "step": 4980, "valid_targets_mean": 10058.9, "valid_targets_min": 1491 }, { "epoch": 4.78432, "grad_norm": 0.16319405021168346, "learning_rate": 2.288369900534404e-07, "loss": 0.326, "loss_nan_ranks": 0, "loss_rank_avg": 0.0974310040473938, "step": 4985, "valid_targets_mean": 10337.2, "valid_targets_min": 2286 }, { "epoch": 4.7891200000000005, "grad_norm": 0.18659021837351797, "learning_rate": 2.1884177008366203e-07, "loss": 0.325, "loss_nan_ranks": 0, "loss_rank_avg": 0.08041709661483765, "step": 4990, "valid_targets_mean": 7788.0, "valid_targets_min": 2433 }, { "epoch": 4.79392, "grad_norm": 0.1798733045442116, "learning_rate": 2.0906853867660004e-07, "loss": 0.3208, "loss_nan_ranks": 0, "loss_rank_avg": 0.10868051648139954, "step": 4995, "valid_targets_mean": 10577.7, "valid_targets_min": 2165 }, { "epoch": 4.79872, "grad_norm": 0.17603612006223165, "learning_rate": 1.9951740550963493e-07, "loss": 0.3249, "loss_nan_ranks": 0, "loss_rank_avg": 0.09991029649972916, "step": 5000, "valid_targets_mean": 9431.1, "valid_targets_min": 1700 }, { "epoch": 4.80352, "grad_norm": 0.18066066507787595, "learning_rate": 1.9018847776770987e-07, "loss": 0.3236, "loss_nan_ranks": 0, "loss_rank_avg": 0.11398864537477493, "step": 5005, "valid_targets_mean": 9737.5, "valid_targets_min": 2127 }, { "epoch": 4.80832, "grad_norm": 0.16844954184287267, "learning_rate": 1.8108186014212935e-07, "loss": 0.3264, "loss_nan_ranks": 0, "loss_rank_avg": 0.11392287909984589, "step": 5010, "valid_targets_mean": 12332.1, "valid_targets_min": 2224 }, { "epoch": 4.81312, "grad_norm": 0.17563215197193438, "learning_rate": 1.7219765482938465e-07, "loss": 0.3265, "loss_nan_ranks": 0, "loss_rank_avg": 0.10459068417549133, "step": 5015, "valid_targets_mean": 8703.7, "valid_targets_min": 1410 }, { "epoch": 4.81792, "grad_norm": 0.1776646013731571, "learning_rate": 1.635359615300036e-07, "loss": 0.3164, "loss_nan_ranks": 0, "loss_rank_avg": 0.09462516754865646, "step": 5020, "valid_targets_mean": 8818.8, "valid_targets_min": 1617 }, { "epoch": 4.82272, "grad_norm": 0.1791496937556602, "learning_rate": 1.5509687744744262e-07, "loss": 0.3228, "loss_nan_ranks": 0, "loss_rank_avg": 0.10216499119997025, "step": 5025, "valid_targets_mean": 9467.8, "valid_targets_min": 2429 }, { "epoch": 4.82752, "grad_norm": 0.16653700292134213, "learning_rate": 1.468804972869786e-07, "loss": 0.3236, "loss_nan_ranks": 0, "loss_rank_avg": 0.12149834632873535, "step": 5030, "valid_targets_mean": 11981.9, "valid_targets_min": 3300 }, { "epoch": 4.83232, "grad_norm": 0.17172327709459417, "learning_rate": 1.3888691325465886e-07, "loss": 0.3264, "loss_nan_ranks": 0, "loss_rank_avg": 0.08818644285202026, "step": 5035, "valid_targets_mean": 8631.6, "valid_targets_min": 1206 }, { "epoch": 4.83712, "grad_norm": 0.18997648114127738, "learning_rate": 1.3111621505626616e-07, "loss": 0.3266, "loss_nan_ranks": 0, "loss_rank_avg": 0.09478943049907684, "step": 5040, "valid_targets_mean": 8689.6, "valid_targets_min": 2156 }, { "epoch": 4.84192, "grad_norm": 0.18259426394205755, "learning_rate": 1.235684898963041e-07, "loss": 0.3211, "loss_nan_ranks": 0, "loss_rank_avg": 0.08341314643621445, "step": 5045, "valid_targets_mean": 8050.8, "valid_targets_min": 2530 }, { "epoch": 4.84672, "grad_norm": 0.17177250528846147, "learning_rate": 1.1624382247702681e-07, "loss": 0.318, "loss_nan_ranks": 0, "loss_rank_avg": 0.11258942633867264, "step": 5050, "valid_targets_mean": 11464.4, "valid_targets_min": 2338 }, { "epoch": 4.85152, "grad_norm": 0.1808670185893642, "learning_rate": 1.0914229499748186e-07, "loss": 0.324, "loss_nan_ranks": 0, "loss_rank_avg": 0.13074561953544617, "step": 5055, "valid_targets_mean": 12076.3, "valid_targets_min": 3777 }, { "epoch": 4.85632, "grad_norm": 0.1819844593461489, "learning_rate": 1.0226398715259322e-07, "loss": 0.3235, "loss_nan_ranks": 0, "loss_rank_avg": 0.08755750954151154, "step": 5060, "valid_targets_mean": 8355.9, "valid_targets_min": 2486 }, { "epoch": 4.86112, "grad_norm": 0.177684711321361, "learning_rate": 9.560897613226205e-08, "loss": 0.3347, "loss_nan_ranks": 0, "loss_rank_avg": 0.11981816589832306, "step": 5065, "valid_targets_mean": 10488.2, "valid_targets_min": 301 }, { "epoch": 4.86592, "grad_norm": 0.18615913929358685, "learning_rate": 8.917733662050287e-08, "loss": 0.3258, "loss_nan_ranks": 0, "loss_rank_avg": 0.1071147471666336, "step": 5070, "valid_targets_mean": 10314.9, "valid_targets_min": 2260 }, { "epoch": 4.87072, "grad_norm": 0.18230202290942948, "learning_rate": 8.296914079461094e-08, "loss": 0.3278, "loss_nan_ranks": 0, "loss_rank_avg": 0.10978755354881287, "step": 5075, "valid_targets_mean": 10930.6, "valid_targets_min": 2365 }, { "epoch": 4.87552, "grad_norm": 0.17407475640883, "learning_rate": 7.698445832433843e-08, "loss": 0.3307, "loss_nan_ranks": 0, "loss_rank_avg": 0.11135123670101166, "step": 5080, "valid_targets_mean": 10441.7, "valid_targets_min": 2090 }, { "epoch": 4.88032, "grad_norm": 0.17657507510506681, "learning_rate": 7.122335637112621e-08, "loss": 0.324, "loss_nan_ranks": 0, "loss_rank_avg": 0.10902173817157745, "step": 5085, "valid_targets_mean": 10547.8, "valid_targets_min": 851 }, { "epoch": 4.88512, "grad_norm": 0.17631444132818108, "learning_rate": 6.568589958734218e-08, "loss": 0.3285, "loss_nan_ranks": 0, "loss_rank_avg": 0.10108692944049835, "step": 5090, "valid_targets_mean": 9943.4, "valid_targets_min": 824 }, { "epoch": 4.88992, "grad_norm": 0.18617727239056273, "learning_rate": 6.037215011556185e-08, "loss": 0.3235, "loss_nan_ranks": 0, "loss_rank_avg": 0.14152035117149353, "step": 5095, "valid_targets_mean": 12125.5, "valid_targets_min": 1758 }, { "epoch": 4.8947199999999995, "grad_norm": 0.17410976874888923, "learning_rate": 5.5282167587862314e-08, "loss": 0.3298, "loss_nan_ranks": 0, "loss_rank_avg": 0.10145286470651627, "step": 5100, "valid_targets_mean": 9976.4, "valid_targets_min": 2352 }, { "epoch": 4.89952, "grad_norm": 0.2115545191279235, "learning_rate": 5.041600912516264e-08, "loss": 0.328, "loss_nan_ranks": 0, "loss_rank_avg": 0.12674742937088013, "step": 5105, "valid_targets_mean": 11855.3, "valid_targets_min": 934 }, { "epoch": 4.90432, "grad_norm": 0.1786956533463368, "learning_rate": 4.5773729336577865e-08, "loss": 0.3279, "loss_nan_ranks": 0, "loss_rank_avg": 0.11230462044477463, "step": 5110, "valid_targets_mean": 10612.1, "valid_targets_min": 1741 }, { "epoch": 4.90912, "grad_norm": 0.16647888826427865, "learning_rate": 4.1355380318803816e-08, "loss": 0.3247, "loss_nan_ranks": 0, "loss_rank_avg": 0.10658138990402222, "step": 5115, "valid_targets_mean": 12273.5, "valid_targets_min": 2656 }, { "epoch": 4.91392, "grad_norm": 0.17235372520662695, "learning_rate": 3.7161011655535425e-08, "loss": 0.3217, "loss_nan_ranks": 0, "loss_rank_avg": 0.1133071631193161, "step": 5120, "valid_targets_mean": 11972.8, "valid_targets_min": 1868 }, { "epoch": 4.91872, "grad_norm": 0.17876628581017168, "learning_rate": 3.319067041691604e-08, "loss": 0.3208, "loss_nan_ranks": 0, "loss_rank_avg": 0.10460739582777023, "step": 5125, "valid_targets_mean": 10743.4, "valid_targets_min": 2740 }, { "epoch": 4.92352, "grad_norm": 0.18160671877566145, "learning_rate": 2.9444401158995606e-08, "loss": 0.3265, "loss_nan_ranks": 0, "loss_rank_avg": 0.1146806925535202, "step": 5130, "valid_targets_mean": 11135.2, "valid_targets_min": 2450 }, { "epoch": 4.92832, "grad_norm": 0.18394946348768662, "learning_rate": 2.5922245923244436e-08, "loss": 0.3152, "loss_nan_ranks": 0, "loss_rank_avg": 0.11141496896743774, "step": 5135, "valid_targets_mean": 10979.2, "valid_targets_min": 3486 }, { "epoch": 4.93312, "grad_norm": 0.17972422728254375, "learning_rate": 2.2624244236071348e-08, "loss": 0.3182, "loss_nan_ranks": 0, "loss_rank_avg": 0.09954261779785156, "step": 5140, "valid_targets_mean": 10688.3, "valid_targets_min": 1839 }, { "epoch": 4.93792, "grad_norm": 0.16849691178434315, "learning_rate": 1.9550433108384005e-08, "loss": 0.3263, "loss_nan_ranks": 0, "loss_rank_avg": 0.10053584724664688, "step": 5145, "valid_targets_mean": 10856.2, "valid_targets_min": 1150 }, { "epoch": 4.94272, "grad_norm": 0.1698003457201187, "learning_rate": 1.6700847035180378e-08, "loss": 0.3197, "loss_nan_ranks": 0, "loss_rank_avg": 0.09409875422716141, "step": 5150, "valid_targets_mean": 9585.8, "valid_targets_min": 1851 }, { "epoch": 4.94752, "grad_norm": 0.1863998752880038, "learning_rate": 1.4075517995146837e-08, "loss": 0.3161, "loss_nan_ranks": 0, "loss_rank_avg": 0.13018685579299927, "step": 5155, "valid_targets_mean": 11728.6, "valid_targets_min": 1242 }, { "epoch": 4.95232, "grad_norm": 0.23040330350119576, "learning_rate": 1.167447545031175e-08, "loss": 0.3255, "loss_nan_ranks": 0, "loss_rank_avg": 0.12115727365016937, "step": 5160, "valid_targets_mean": 13134.6, "valid_targets_min": 2568 }, { "epoch": 4.95712, "grad_norm": 0.17389964545892517, "learning_rate": 9.497746345705772e-09, "loss": 0.3246, "loss_nan_ranks": 0, "loss_rank_avg": 0.09132646024227142, "step": 5165, "valid_targets_mean": 8934.7, "valid_targets_min": 1490 }, { "epoch": 4.96192, "grad_norm": 0.17641121909731672, "learning_rate": 7.545355109073172e-09, "loss": 0.3308, "loss_nan_ranks": 0, "loss_rank_avg": 0.08680982142686844, "step": 5170, "valid_targets_mean": 9088.2, "valid_targets_min": 2406 }, { "epoch": 4.9667200000000005, "grad_norm": 0.18141331963644278, "learning_rate": 5.817323650578743e-09, "loss": 0.3175, "loss_nan_ranks": 0, "loss_rank_avg": 0.10711181163787842, "step": 5175, "valid_targets_mean": 10195.1, "valid_targets_min": 3175 }, { "epoch": 4.97152, "grad_norm": 0.1711797674805141, "learning_rate": 4.313671362576877e-09, "loss": 0.3258, "loss_nan_ranks": 0, "loss_rank_avg": 0.11465975642204285, "step": 5180, "valid_targets_mean": 10932.3, "valid_targets_min": 1807 }, { "epoch": 4.97632, "grad_norm": 0.1710617977047733, "learning_rate": 3.0344151193917316e-09, "loss": 0.3295, "loss_nan_ranks": 0, "loss_rank_avg": 0.09889707714319229, "step": 5185, "valid_targets_mean": 9771.4, "valid_targets_min": 1784 }, { "epoch": 4.98112, "grad_norm": 0.19876991237981612, "learning_rate": 1.979569277117399e-09, "loss": 0.321, "loss_nan_ranks": 0, "loss_rank_avg": 0.09426333010196686, "step": 5190, "valid_targets_mean": 9083.2, "valid_targets_min": 1813 }, { "epoch": 4.98592, "grad_norm": 0.17924834504421394, "learning_rate": 1.1491456734713524e-09, "loss": 0.3258, "loss_nan_ranks": 0, "loss_rank_avg": 0.10984489321708679, "step": 5195, "valid_targets_mean": 10042.7, "valid_targets_min": 3989 }, { "epoch": 4.99072, "grad_norm": 0.1840599715302738, "learning_rate": 5.431536276523375e-10, "loss": 0.3309, "loss_nan_ranks": 0, "loss_rank_avg": 0.10118210315704346, "step": 5200, "valid_targets_mean": 9091.2, "valid_targets_min": 1931 }, { "epoch": 4.99552, "grad_norm": 0.17650718737736182, "learning_rate": 1.6159994023601245e-10, "loss": 0.326, "loss_nan_ranks": 0, "loss_rank_avg": 0.09146692603826523, "step": 5205, "valid_targets_mean": 9079.4, "valid_targets_min": 1583 }, { "epoch": 5.0, "grad_norm": 0.21227037203133356, "learning_rate": 4.488893106113779e-12, "loss": 0.332, "loss_nan_ranks": 0, "loss_rank_avg": 0.15339435636997223, "step": 5210, "valid_targets_mean": 9953.1, "valid_targets_min": 2228 }, { "epoch": 5.0, "step": 5210, "total_flos": 2.038899186550912e+19, "train_loss": 0.0, "train_runtime": 1.0148, "train_samples_per_second": 492687.515, "train_steps_per_second": 5133.804 } ], "logging_steps": 5, "max_steps": 5210, "num_input_tokens_seen": 0, "num_train_epochs": 5, "save_steps": 300, "stateful_callbacks": { "TrainerControl": { "args": { "should_epoch_stop": false, "should_evaluate": false, "should_log": false, "should_save": true, "should_training_stop": true }, "attributes": {} } }, "total_flos": 2.038899186550912e+19, "train_batch_size": 1, "trial_name": null, "trial_params": null }