{ "best_global_step": null, "best_metric": null, "best_model_checkpoint": null, "epoch": 5.0, "eval_steps": 500, "global_step": 5210, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.0048, "grad_norm": 6.937965654420425, "learning_rate": 3.071017274472169e-07, "loss": 0.3626, "loss_nan_ranks": 0, "loss_rank_avg": 0.11469614505767822, "step": 5, "valid_targets_mean": 3499.5, "valid_targets_min": 1863 }, { "epoch": 0.0096, "grad_norm": 6.5863821052475515, "learning_rate": 6.909788867562381e-07, "loss": 0.3637, "loss_nan_ranks": 0, "loss_rank_avg": 0.12012797594070435, "step": 10, "valid_targets_mean": 3721.8, "valid_targets_min": 1764 }, { "epoch": 0.0144, "grad_norm": 5.343535940478726, "learning_rate": 1.074856046065259e-06, "loss": 0.3676, "loss_nan_ranks": 0, "loss_rank_avg": 0.12584523856639862, "step": 15, "valid_targets_mean": 3173.9, "valid_targets_min": 1727 }, { "epoch": 0.0192, "grad_norm": 2.3671652084368016, "learning_rate": 1.4587332053742803e-06, "loss": 0.3302, "loss_nan_ranks": 0, "loss_rank_avg": 0.09593678265810013, "step": 20, "valid_targets_mean": 4235.9, "valid_targets_min": 1930 }, { "epoch": 0.024, "grad_norm": 1.5821432353896931, "learning_rate": 1.8426103646833015e-06, "loss": 0.2912, "loss_nan_ranks": 0, "loss_rank_avg": 0.0928233414888382, "step": 25, "valid_targets_mean": 3918.5, "valid_targets_min": 2012 }, { "epoch": 0.0288, "grad_norm": 1.0466260829406362, "learning_rate": 2.2264875239923228e-06, "loss": 0.2782, "loss_nan_ranks": 0, "loss_rank_avg": 0.09647513926029205, "step": 30, "valid_targets_mean": 3579.7, "valid_targets_min": 1909 }, { "epoch": 0.0336, "grad_norm": 0.7301653193288717, "learning_rate": 2.6103646833013433e-06, "loss": 0.245, "loss_nan_ranks": 0, "loss_rank_avg": 0.09100286662578583, "step": 35, "valid_targets_mean": 3455.0, "valid_targets_min": 2080 }, { "epoch": 0.0384, "grad_norm": 0.5634397105921576, "learning_rate": 2.9942418426103648e-06, "loss": 0.2262, "loss_nan_ranks": 0, "loss_rank_avg": 0.06531375646591187, "step": 40, "valid_targets_mean": 2997.9, "valid_targets_min": 1907 }, { "epoch": 0.0432, "grad_norm": 0.3771989155832216, "learning_rate": 3.378119001919386e-06, "loss": 0.2129, "loss_nan_ranks": 0, "loss_rank_avg": 0.05960608273744583, "step": 45, "valid_targets_mean": 3948.8, "valid_targets_min": 1863 }, { "epoch": 0.048, "grad_norm": 0.2913641430638286, "learning_rate": 3.761996161228407e-06, "loss": 0.1732, "loss_nan_ranks": 0, "loss_rank_avg": 0.05882091447710991, "step": 50, "valid_targets_mean": 4149.5, "valid_targets_min": 2046 }, { "epoch": 0.0528, "grad_norm": 0.2153147490996494, "learning_rate": 4.145873320537428e-06, "loss": 0.1796, "loss_nan_ranks": 0, "loss_rank_avg": 0.04906277358531952, "step": 55, "valid_targets_mean": 4259.8, "valid_targets_min": 1940 }, { "epoch": 0.0576, "grad_norm": 0.20723734858542475, "learning_rate": 4.52975047984645e-06, "loss": 0.1573, "loss_nan_ranks": 0, "loss_rank_avg": 0.050851885229349136, "step": 60, "valid_targets_mean": 3494.0, "valid_targets_min": 2009 }, { "epoch": 0.0624, "grad_norm": 0.17986844485497974, "learning_rate": 4.91362763915547e-06, "loss": 0.1531, "loss_nan_ranks": 0, "loss_rank_avg": 0.048392847180366516, "step": 65, "valid_targets_mean": 4253.8, "valid_targets_min": 1937 }, { "epoch": 0.0672, "grad_norm": 0.17301691819215223, "learning_rate": 5.297504798464492e-06, "loss": 0.1492, "loss_nan_ranks": 0, "loss_rank_avg": 0.046146441251039505, "step": 70, "valid_targets_mean": 3649.2, "valid_targets_min": 1939 }, { "epoch": 0.072, "grad_norm": 0.16766105949933824, "learning_rate": 5.681381957773513e-06, "loss": 0.1422, "loss_nan_ranks": 0, "loss_rank_avg": 0.04667827486991882, "step": 75, "valid_targets_mean": 3832.0, "valid_targets_min": 1995 }, { "epoch": 0.0768, "grad_norm": 0.19338450140560143, "learning_rate": 6.065259117082534e-06, "loss": 0.1347, "loss_nan_ranks": 0, "loss_rank_avg": 0.045901913195848465, "step": 80, "valid_targets_mean": 3223.5, "valid_targets_min": 1930 }, { "epoch": 0.0816, "grad_norm": 0.163903129334992, "learning_rate": 6.449136276391556e-06, "loss": 0.1359, "loss_nan_ranks": 0, "loss_rank_avg": 0.03836950659751892, "step": 85, "valid_targets_mean": 4337.8, "valid_targets_min": 1716 }, { "epoch": 0.0864, "grad_norm": 0.1732436888952196, "learning_rate": 6.833013435700576e-06, "loss": 0.1319, "loss_nan_ranks": 0, "loss_rank_avg": 0.04401613771915436, "step": 90, "valid_targets_mean": 4111.6, "valid_targets_min": 1857 }, { "epoch": 0.0912, "grad_norm": 0.19082139608668852, "learning_rate": 7.216890595009598e-06, "loss": 0.1259, "loss_nan_ranks": 0, "loss_rank_avg": 0.03892116993665695, "step": 95, "valid_targets_mean": 2942.4, "valid_targets_min": 1977 }, { "epoch": 0.096, "grad_norm": 0.17638352231994248, "learning_rate": 7.600767754318619e-06, "loss": 0.1247, "loss_nan_ranks": 0, "loss_rank_avg": 0.0390937514603138, "step": 100, "valid_targets_mean": 3591.5, "valid_targets_min": 1680 }, { "epoch": 0.1008, "grad_norm": 0.1944525138076534, "learning_rate": 7.98464491362764e-06, "loss": 0.1245, "loss_nan_ranks": 0, "loss_rank_avg": 0.048598822206258774, "step": 105, "valid_targets_mean": 3481.1, "valid_targets_min": 1868 }, { "epoch": 0.1056, "grad_norm": 0.22035770940213192, "learning_rate": 8.368522072936662e-06, "loss": 0.117, "loss_nan_ranks": 0, "loss_rank_avg": 0.039973922073841095, "step": 110, "valid_targets_mean": 3435.9, "valid_targets_min": 2010 }, { "epoch": 0.1104, "grad_norm": 0.18001026275208665, "learning_rate": 8.752399232245682e-06, "loss": 0.1129, "loss_nan_ranks": 0, "loss_rank_avg": 0.03717381879687309, "step": 115, "valid_targets_mean": 3578.4, "valid_targets_min": 1929 }, { "epoch": 0.1152, "grad_norm": 0.20166628598885344, "learning_rate": 9.136276391554704e-06, "loss": 0.1142, "loss_nan_ranks": 0, "loss_rank_avg": 0.034547075629234314, "step": 120, "valid_targets_mean": 3295.2, "valid_targets_min": 1662 }, { "epoch": 0.12, "grad_norm": 0.19167865931651773, "learning_rate": 9.520153550863724e-06, "loss": 0.1086, "loss_nan_ranks": 0, "loss_rank_avg": 0.03747241944074631, "step": 125, "valid_targets_mean": 4539.3, "valid_targets_min": 1847 }, { "epoch": 0.1248, "grad_norm": 0.19148980089840842, "learning_rate": 9.904030710172746e-06, "loss": 0.1036, "loss_nan_ranks": 0, "loss_rank_avg": 0.03533416986465454, "step": 130, "valid_targets_mean": 3445.7, "valid_targets_min": 1709 }, { "epoch": 0.1296, "grad_norm": 0.21821353960131265, "learning_rate": 1.0287907869481766e-05, "loss": 0.1072, "loss_nan_ranks": 0, "loss_rank_avg": 0.03997855633497238, "step": 135, "valid_targets_mean": 3530.8, "valid_targets_min": 2027 }, { "epoch": 0.1344, "grad_norm": 0.23048953683917786, "learning_rate": 1.067178502879079e-05, "loss": 0.1059, "loss_nan_ranks": 0, "loss_rank_avg": 0.03685012459754944, "step": 140, "valid_targets_mean": 3553.0, "valid_targets_min": 1820 }, { "epoch": 0.1392, "grad_norm": 0.23561676819347502, "learning_rate": 1.105566218809981e-05, "loss": 0.1037, "loss_nan_ranks": 0, "loss_rank_avg": 0.033116281032562256, "step": 145, "valid_targets_mean": 3572.2, "valid_targets_min": 2180 }, { "epoch": 0.144, "grad_norm": 0.18410766236895754, "learning_rate": 1.143953934740883e-05, "loss": 0.0944, "loss_nan_ranks": 0, "loss_rank_avg": 0.02970690280199051, "step": 150, "valid_targets_mean": 4146.3, "valid_targets_min": 1719 }, { "epoch": 0.1488, "grad_norm": 0.18049019085906956, "learning_rate": 1.182341650671785e-05, "loss": 0.0973, "loss_nan_ranks": 0, "loss_rank_avg": 0.029041530564427376, "step": 155, "valid_targets_mean": 3589.8, "valid_targets_min": 1863 }, { "epoch": 0.1536, "grad_norm": 0.23489464884439978, "learning_rate": 1.2207293666026872e-05, "loss": 0.0924, "loss_nan_ranks": 0, "loss_rank_avg": 0.03265086188912392, "step": 160, "valid_targets_mean": 3268.7, "valid_targets_min": 1847 }, { "epoch": 0.1584, "grad_norm": 0.19835583785764463, "learning_rate": 1.2591170825335894e-05, "loss": 0.0887, "loss_nan_ranks": 0, "loss_rank_avg": 0.029566409066319466, "step": 165, "valid_targets_mean": 4323.8, "valid_targets_min": 1974 }, { "epoch": 0.1632, "grad_norm": 0.24846365725039307, "learning_rate": 1.2975047984644915e-05, "loss": 0.0867, "loss_nan_ranks": 0, "loss_rank_avg": 0.0281932782381773, "step": 170, "valid_targets_mean": 4207.3, "valid_targets_min": 2087 }, { "epoch": 0.168, "grad_norm": 0.22919583334361535, "learning_rate": 1.3358925143953936e-05, "loss": 0.0853, "loss_nan_ranks": 0, "loss_rank_avg": 0.02949838899075985, "step": 175, "valid_targets_mean": 3960.9, "valid_targets_min": 1857 }, { "epoch": 0.1728, "grad_norm": 0.27434533496042574, "learning_rate": 1.3742802303262956e-05, "loss": 0.0821, "loss_nan_ranks": 0, "loss_rank_avg": 0.02647317200899124, "step": 180, "valid_targets_mean": 3963.9, "valid_targets_min": 2022 }, { "epoch": 0.1776, "grad_norm": 0.2554410371258365, "learning_rate": 1.4126679462571978e-05, "loss": 0.0797, "loss_nan_ranks": 0, "loss_rank_avg": 0.028740808367729187, "step": 185, "valid_targets_mean": 3598.1, "valid_targets_min": 1970 }, { "epoch": 0.1824, "grad_norm": 0.22965813069707355, "learning_rate": 1.4510556621881e-05, "loss": 0.0755, "loss_nan_ranks": 0, "loss_rank_avg": 0.022127017378807068, "step": 190, "valid_targets_mean": 4289.5, "valid_targets_min": 1764 }, { "epoch": 0.1872, "grad_norm": 0.2288532296930469, "learning_rate": 1.4894433781190021e-05, "loss": 0.0723, "loss_nan_ranks": 0, "loss_rank_avg": 0.02306653931736946, "step": 195, "valid_targets_mean": 4330.4, "valid_targets_min": 1993 }, { "epoch": 0.192, "grad_norm": 0.27240454535637443, "learning_rate": 1.527831094049904e-05, "loss": 0.0712, "loss_nan_ranks": 0, "loss_rank_avg": 0.025289515033364296, "step": 200, "valid_targets_mean": 2736.6, "valid_targets_min": 1614 }, { "epoch": 0.1968, "grad_norm": 0.242681238840325, "learning_rate": 1.566218809980806e-05, "loss": 0.0697, "loss_nan_ranks": 0, "loss_rank_avg": 0.024639660492539406, "step": 205, "valid_targets_mean": 4075.1, "valid_targets_min": 2080 }, { "epoch": 0.2016, "grad_norm": 0.24849701794363202, "learning_rate": 1.6046065259117082e-05, "loss": 0.0645, "loss_nan_ranks": 0, "loss_rank_avg": 0.01965644210577011, "step": 210, "valid_targets_mean": 3752.0, "valid_targets_min": 1719 }, { "epoch": 0.2064, "grad_norm": 0.27241151966507293, "learning_rate": 1.6429942418426105e-05, "loss": 0.0602, "loss_nan_ranks": 0, "loss_rank_avg": 0.01922878436744213, "step": 215, "valid_targets_mean": 3878.5, "valid_targets_min": 1662 }, { "epoch": 0.2112, "grad_norm": 0.3082022682540152, "learning_rate": 1.6813819577735126e-05, "loss": 0.0607, "loss_nan_ranks": 0, "loss_rank_avg": 0.019677884876728058, "step": 220, "valid_targets_mean": 3743.6, "valid_targets_min": 2048 }, { "epoch": 0.216, "grad_norm": 0.3058526962109295, "learning_rate": 1.7197696737044146e-05, "loss": 0.0583, "loss_nan_ranks": 0, "loss_rank_avg": 0.02079184725880623, "step": 225, "valid_targets_mean": 3293.6, "valid_targets_min": 1662 }, { "epoch": 0.2208, "grad_norm": 0.27962167396369564, "learning_rate": 1.758157389635317e-05, "loss": 0.0544, "loss_nan_ranks": 0, "loss_rank_avg": 0.01946953497827053, "step": 230, "valid_targets_mean": 4708.4, "valid_targets_min": 2046 }, { "epoch": 0.2256, "grad_norm": 0.28869191640978553, "learning_rate": 1.796545105566219e-05, "loss": 0.0519, "loss_nan_ranks": 0, "loss_rank_avg": 0.01823297329246998, "step": 235, "valid_targets_mean": 3593.3, "valid_targets_min": 2081 }, { "epoch": 0.2304, "grad_norm": 0.2898824996991812, "learning_rate": 1.8349328214971213e-05, "loss": 0.0499, "loss_nan_ranks": 0, "loss_rank_avg": 0.016215849667787552, "step": 240, "valid_targets_mean": 4142.3, "valid_targets_min": 2089 }, { "epoch": 0.2352, "grad_norm": 0.30149704768269103, "learning_rate": 1.8733205374280233e-05, "loss": 0.0509, "loss_nan_ranks": 0, "loss_rank_avg": 0.01709664985537529, "step": 245, "valid_targets_mean": 3813.4, "valid_targets_min": 1928 }, { "epoch": 0.24, "grad_norm": 0.2979272115801746, "learning_rate": 1.9117082533589253e-05, "loss": 0.0452, "loss_nan_ranks": 0, "loss_rank_avg": 0.010545975528657436, "step": 250, "valid_targets_mean": 3071.1, "valid_targets_min": 1877 }, { "epoch": 0.2448, "grad_norm": 0.3057707833669144, "learning_rate": 1.9500959692898273e-05, "loss": 0.0424, "loss_nan_ranks": 0, "loss_rank_avg": 0.014655347913503647, "step": 255, "valid_targets_mean": 3741.1, "valid_targets_min": 1763 }, { "epoch": 0.2496, "grad_norm": 0.2995200667585905, "learning_rate": 1.9884836852207294e-05, "loss": 0.0419, "loss_nan_ranks": 0, "loss_rank_avg": 0.01323431171476841, "step": 260, "valid_targets_mean": 4534.5, "valid_targets_min": 1889 }, { "epoch": 0.2544, "grad_norm": 0.3284439605360466, "learning_rate": 2.0268714011516314e-05, "loss": 0.038, "loss_nan_ranks": 0, "loss_rank_avg": 0.013670418411493301, "step": 265, "valid_targets_mean": 3705.1, "valid_targets_min": 1877 }, { "epoch": 0.2592, "grad_norm": 0.28351371383795076, "learning_rate": 2.0652591170825337e-05, "loss": 0.0364, "loss_nan_ranks": 0, "loss_rank_avg": 0.010727550834417343, "step": 270, "valid_targets_mean": 3922.1, "valid_targets_min": 1889 }, { "epoch": 0.264, "grad_norm": 0.3150839446969937, "learning_rate": 2.103646833013436e-05, "loss": 0.0342, "loss_nan_ranks": 0, "loss_rank_avg": 0.011736005544662476, "step": 275, "valid_targets_mean": 3559.4, "valid_targets_min": 1919 }, { "epoch": 0.2688, "grad_norm": 0.2806927089920171, "learning_rate": 2.142034548944338e-05, "loss": 0.0318, "loss_nan_ranks": 0, "loss_rank_avg": 0.013169767335057259, "step": 280, "valid_targets_mean": 4125.0, "valid_targets_min": 1952 }, { "epoch": 0.2736, "grad_norm": 0.2971395106031058, "learning_rate": 2.18042226487524e-05, "loss": 0.0338, "loss_nan_ranks": 0, "loss_rank_avg": 0.009649878367781639, "step": 285, "valid_targets_mean": 3847.2, "valid_targets_min": 1839 }, { "epoch": 0.2784, "grad_norm": 0.30462593223391954, "learning_rate": 2.218809980806142e-05, "loss": 0.0309, "loss_nan_ranks": 0, "loss_rank_avg": 0.007476530969142914, "step": 290, "valid_targets_mean": 4701.7, "valid_targets_min": 1802 }, { "epoch": 0.2832, "grad_norm": 0.30038151573422667, "learning_rate": 2.2571976967370445e-05, "loss": 0.0287, "loss_nan_ranks": 0, "loss_rank_avg": 0.007295252755284309, "step": 295, "valid_targets_mean": 3913.3, "valid_targets_min": 1799 }, { "epoch": 0.288, "grad_norm": 0.29158760056491095, "learning_rate": 2.2955854126679465e-05, "loss": 0.028, "loss_nan_ranks": 0, "loss_rank_avg": 0.009111661463975906, "step": 300, "valid_targets_mean": 3851.0, "valid_targets_min": 1952 }, { "epoch": 0.2928, "grad_norm": 0.29029858315528134, "learning_rate": 2.3339731285988485e-05, "loss": 0.0265, "loss_nan_ranks": 0, "loss_rank_avg": 0.00890104379504919, "step": 305, "valid_targets_mean": 3463.2, "valid_targets_min": 1751 }, { "epoch": 0.2976, "grad_norm": 0.3432214228291009, "learning_rate": 2.372360844529751e-05, "loss": 0.0243, "loss_nan_ranks": 0, "loss_rank_avg": 0.008902271278202534, "step": 310, "valid_targets_mean": 2587.8, "valid_targets_min": 1917 }, { "epoch": 0.3024, "grad_norm": 0.2780773407000986, "learning_rate": 2.4107485604606525e-05, "loss": 0.0231, "loss_nan_ranks": 0, "loss_rank_avg": 0.00839188788086176, "step": 315, "valid_targets_mean": 3983.3, "valid_targets_min": 1601 }, { "epoch": 0.3072, "grad_norm": 0.32885066035163374, "learning_rate": 2.449136276391555e-05, "loss": 0.0233, "loss_nan_ranks": 0, "loss_rank_avg": 0.008772674016654491, "step": 320, "valid_targets_mean": 3652.5, "valid_targets_min": 2008 }, { "epoch": 0.312, "grad_norm": 0.3055398782817974, "learning_rate": 2.4875239923224573e-05, "loss": 0.0233, "loss_nan_ranks": 0, "loss_rank_avg": 0.009282301180064678, "step": 325, "valid_targets_mean": 4054.7, "valid_targets_min": 1716 }, { "epoch": 0.3168, "grad_norm": 0.36149353916895155, "learning_rate": 2.525911708253359e-05, "loss": 0.0224, "loss_nan_ranks": 0, "loss_rank_avg": 0.007749137934297323, "step": 330, "valid_targets_mean": 3019.2, "valid_targets_min": 1939 }, { "epoch": 0.3216, "grad_norm": 0.3228633275486538, "learning_rate": 2.5642994241842613e-05, "loss": 0.0202, "loss_nan_ranks": 0, "loss_rank_avg": 0.007192028686404228, "step": 335, "valid_targets_mean": 3837.0, "valid_targets_min": 1760 }, { "epoch": 0.3264, "grad_norm": 0.25093922169727056, "learning_rate": 2.6026871401151633e-05, "loss": 0.0175, "loss_nan_ranks": 0, "loss_rank_avg": 0.00533191068097949, "step": 340, "valid_targets_mean": 3737.1, "valid_targets_min": 1517 }, { "epoch": 0.3312, "grad_norm": 0.35279337813115486, "learning_rate": 2.6410748560460657e-05, "loss": 0.0175, "loss_nan_ranks": 0, "loss_rank_avg": 0.007894867099821568, "step": 345, "valid_targets_mean": 3601.5, "valid_targets_min": 1907 }, { "epoch": 0.336, "grad_norm": 0.26818158089815164, "learning_rate": 2.6794625719769677e-05, "loss": 0.0173, "loss_nan_ranks": 0, "loss_rank_avg": 0.005505319684743881, "step": 350, "valid_targets_mean": 4927.9, "valid_targets_min": 2030 }, { "epoch": 0.3408, "grad_norm": 0.2897950061058035, "learning_rate": 2.7178502879078697e-05, "loss": 0.0178, "loss_nan_ranks": 0, "loss_rank_avg": 0.005148059222847223, "step": 355, "valid_targets_mean": 3249.0, "valid_targets_min": 2031 }, { "epoch": 0.3456, "grad_norm": 0.29798905792631397, "learning_rate": 2.756238003838772e-05, "loss": 0.0175, "loss_nan_ranks": 0, "loss_rank_avg": 0.005866318475455046, "step": 360, "valid_targets_mean": 3637.2, "valid_targets_min": 2012 }, { "epoch": 0.3504, "grad_norm": 0.23388716919207966, "learning_rate": 2.7946257197696737e-05, "loss": 0.0157, "loss_nan_ranks": 0, "loss_rank_avg": 0.0034332945942878723, "step": 365, "valid_targets_mean": 3665.2, "valid_targets_min": 1562 }, { "epoch": 0.3552, "grad_norm": 0.3144219799825524, "learning_rate": 2.833013435700576e-05, "loss": 0.0165, "loss_nan_ranks": 0, "loss_rank_avg": 0.005330200307071209, "step": 370, "valid_targets_mean": 3714.6, "valid_targets_min": 1918 }, { "epoch": 0.36, "grad_norm": 0.2347921761514834, "learning_rate": 2.8714011516314784e-05, "loss": 0.015, "loss_nan_ranks": 0, "loss_rank_avg": 0.0039110006764531136, "step": 375, "valid_targets_mean": 3327.7, "valid_targets_min": 1764 }, { "epoch": 0.3648, "grad_norm": 0.2904804056955613, "learning_rate": 2.90978886756238e-05, "loss": 0.0151, "loss_nan_ranks": 0, "loss_rank_avg": 0.005027526989579201, "step": 380, "valid_targets_mean": 3128.4, "valid_targets_min": 1868 }, { "epoch": 0.3696, "grad_norm": 0.28700226054014716, "learning_rate": 2.9481765834932825e-05, "loss": 0.016, "loss_nan_ranks": 0, "loss_rank_avg": 0.004024747759103775, "step": 385, "valid_targets_mean": 3588.8, "valid_targets_min": 1601 }, { "epoch": 0.3744, "grad_norm": 0.26884448060402233, "learning_rate": 2.9865642994241845e-05, "loss": 0.0141, "loss_nan_ranks": 0, "loss_rank_avg": 0.004564404953271151, "step": 390, "valid_targets_mean": 3236.8, "valid_targets_min": 1900 }, { "epoch": 0.3792, "grad_norm": 0.24611041897462416, "learning_rate": 3.0249520153550865e-05, "loss": 0.0141, "loss_nan_ranks": 0, "loss_rank_avg": 0.004304606467485428, "step": 395, "valid_targets_mean": 4403.7, "valid_targets_min": 1709 }, { "epoch": 0.384, "grad_norm": 0.48825494706248906, "learning_rate": 3.063339731285989e-05, "loss": 0.012, "loss_nan_ranks": 0, "loss_rank_avg": 0.004420734476298094, "step": 400, "valid_targets_mean": 3538.8, "valid_targets_min": 1614 }, { "epoch": 0.3888, "grad_norm": 0.2792081008190513, "learning_rate": 3.101727447216891e-05, "loss": 0.0144, "loss_nan_ranks": 0, "loss_rank_avg": 0.005862731486558914, "step": 405, "valid_targets_mean": 4681.7, "valid_targets_min": 2091 }, { "epoch": 0.3936, "grad_norm": 0.30743113561108026, "learning_rate": 3.140115163147793e-05, "loss": 0.0142, "loss_nan_ranks": 0, "loss_rank_avg": 0.006006536073982716, "step": 410, "valid_targets_mean": 4158.8, "valid_targets_min": 1906 }, { "epoch": 0.3984, "grad_norm": 0.23617729705125162, "learning_rate": 3.178502879078695e-05, "loss": 0.0112, "loss_nan_ranks": 0, "loss_rank_avg": 0.0039299000054597855, "step": 415, "valid_targets_mean": 5437.2, "valid_targets_min": 2126 }, { "epoch": 0.4032, "grad_norm": 0.24273874285561925, "learning_rate": 3.216890595009597e-05, "loss": 0.0121, "loss_nan_ranks": 0, "loss_rank_avg": 0.002637755125761032, "step": 420, "valid_targets_mean": 4218.1, "valid_targets_min": 1836 }, { "epoch": 0.408, "grad_norm": 0.2571274327476414, "learning_rate": 3.2552783109404996e-05, "loss": 0.0126, "loss_nan_ranks": 0, "loss_rank_avg": 0.004715914838016033, "step": 425, "valid_targets_mean": 3939.8, "valid_targets_min": 2195 }, { "epoch": 0.4128, "grad_norm": 0.2500933896104518, "learning_rate": 3.2936660268714016e-05, "loss": 0.0118, "loss_nan_ranks": 0, "loss_rank_avg": 0.0031941996421664953, "step": 430, "valid_targets_mean": 3576.3, "valid_targets_min": 1705 }, { "epoch": 0.4176, "grad_norm": 0.22701352422866455, "learning_rate": 3.3320537428023036e-05, "loss": 0.0106, "loss_nan_ranks": 0, "loss_rank_avg": 0.003280221950262785, "step": 435, "valid_targets_mean": 3586.2, "valid_targets_min": 1942 }, { "epoch": 0.4224, "grad_norm": 0.2524861159968299, "learning_rate": 3.3704414587332056e-05, "loss": 0.0114, "loss_nan_ranks": 0, "loss_rank_avg": 0.004017299972474575, "step": 440, "valid_targets_mean": 3009.8, "valid_targets_min": 1952 }, { "epoch": 0.4272, "grad_norm": 0.22783228209467407, "learning_rate": 3.4088291746641077e-05, "loss": 0.0109, "loss_nan_ranks": 0, "loss_rank_avg": 0.003924804739654064, "step": 445, "valid_targets_mean": 4031.3, "valid_targets_min": 1906 }, { "epoch": 0.432, "grad_norm": 0.2675229581899117, "learning_rate": 3.4472168905950104e-05, "loss": 0.012, "loss_nan_ranks": 0, "loss_rank_avg": 0.0031715864315629005, "step": 450, "valid_targets_mean": 3449.6, "valid_targets_min": 1942 }, { "epoch": 0.4368, "grad_norm": 0.22212296709946297, "learning_rate": 3.485604606525912e-05, "loss": 0.0109, "loss_nan_ranks": 0, "loss_rank_avg": 0.0034985882230103016, "step": 455, "valid_targets_mean": 4985.9, "valid_targets_min": 1802 }, { "epoch": 0.4416, "grad_norm": 0.22671994440103954, "learning_rate": 3.5239923224568144e-05, "loss": 0.0101, "loss_nan_ranks": 0, "loss_rank_avg": 0.003531843423843384, "step": 460, "valid_targets_mean": 4070.9, "valid_targets_min": 2019 }, { "epoch": 0.4464, "grad_norm": 0.21948437480345728, "learning_rate": 3.5623800383877164e-05, "loss": 0.0101, "loss_nan_ranks": 0, "loss_rank_avg": 0.0022159013897180557, "step": 465, "valid_targets_mean": 4492.9, "valid_targets_min": 1775 }, { "epoch": 0.4512, "grad_norm": 0.25220894753487705, "learning_rate": 3.6007677543186184e-05, "loss": 0.0107, "loss_nan_ranks": 0, "loss_rank_avg": 0.003613119013607502, "step": 470, "valid_targets_mean": 3354.7, "valid_targets_min": 1786 }, { "epoch": 0.456, "grad_norm": 0.2409715853264873, "learning_rate": 3.6391554702495204e-05, "loss": 0.0111, "loss_nan_ranks": 0, "loss_rank_avg": 0.00343118398450315, "step": 475, "valid_targets_mean": 3894.3, "valid_targets_min": 1917 }, { "epoch": 0.4608, "grad_norm": 0.2170729540621222, "learning_rate": 3.6775431861804224e-05, "loss": 0.0092, "loss_nan_ranks": 0, "loss_rank_avg": 0.0030733980238437653, "step": 480, "valid_targets_mean": 4114.4, "valid_targets_min": 1995 }, { "epoch": 0.4656, "grad_norm": 0.21068892921988389, "learning_rate": 3.7159309021113245e-05, "loss": 0.0096, "loss_nan_ranks": 0, "loss_rank_avg": 0.003135197563096881, "step": 485, "valid_targets_mean": 3322.5, "valid_targets_min": 1763 }, { "epoch": 0.4704, "grad_norm": 0.21972566727493456, "learning_rate": 3.7543186180422265e-05, "loss": 0.0094, "loss_nan_ranks": 0, "loss_rank_avg": 0.0030888905748724937, "step": 490, "valid_targets_mean": 3647.6, "valid_targets_min": 1912 }, { "epoch": 0.4752, "grad_norm": 0.2442380917642565, "learning_rate": 3.792706333973129e-05, "loss": 0.0088, "loss_nan_ranks": 0, "loss_rank_avg": 0.0034611904993653297, "step": 495, "valid_targets_mean": 2969.6, "valid_targets_min": 1933 }, { "epoch": 0.48, "grad_norm": 0.19420220971217322, "learning_rate": 3.831094049904031e-05, "loss": 0.0081, "loss_nan_ranks": 0, "loss_rank_avg": 0.003016189206391573, "step": 500, "valid_targets_mean": 4435.8, "valid_targets_min": 1900 }, { "epoch": 0.4848, "grad_norm": 0.22164558812400362, "learning_rate": 3.869481765834933e-05, "loss": 0.0092, "loss_nan_ranks": 0, "loss_rank_avg": 0.0032875773031264544, "step": 505, "valid_targets_mean": 4127.6, "valid_targets_min": 1719 }, { "epoch": 0.4896, "grad_norm": 0.22374906160761918, "learning_rate": 3.907869481765835e-05, "loss": 0.0094, "loss_nan_ranks": 0, "loss_rank_avg": 0.003515136195346713, "step": 510, "valid_targets_mean": 3748.6, "valid_targets_min": 1991 }, { "epoch": 0.4944, "grad_norm": 0.23454630233428864, "learning_rate": 3.946257197696737e-05, "loss": 0.0089, "loss_nan_ranks": 0, "loss_rank_avg": 0.00364376581273973, "step": 515, "valid_targets_mean": 3213.7, "valid_targets_min": 1870 }, { "epoch": 0.4992, "grad_norm": 0.21562525432252683, "learning_rate": 3.984644913627639e-05, "loss": 0.0099, "loss_nan_ranks": 0, "loss_rank_avg": 0.0031704031862318516, "step": 520, "valid_targets_mean": 4295.1, "valid_targets_min": 1719 }, { "epoch": 0.504, "grad_norm": 0.19124689835472855, "learning_rate": 3.999995959997414e-05, "loss": 0.0086, "loss_nan_ranks": 0, "loss_rank_avg": 0.0025279440451413393, "step": 525, "valid_targets_mean": 4059.2, "valid_targets_min": 1949 }, { "epoch": 0.5088, "grad_norm": 0.23017443414998648, "learning_rate": 3.999971271151827e-05, "loss": 0.0094, "loss_nan_ranks": 0, "loss_rank_avg": 0.00394061952829361, "step": 530, "valid_targets_mean": 3380.1, "valid_targets_min": 1716 }, { "epoch": 0.5136, "grad_norm": 0.23319549902718553, "learning_rate": 3.9999241381832614e-05, "loss": 0.0083, "loss_nan_ranks": 0, "loss_rank_avg": 0.0036682155914604664, "step": 535, "valid_targets_mean": 4276.3, "valid_targets_min": 1662 }, { "epoch": 0.5184, "grad_norm": 0.21660253159440473, "learning_rate": 3.999854561620655e-05, "loss": 0.0077, "loss_nan_ranks": 0, "loss_rank_avg": 0.0027715754695236683, "step": 540, "valid_targets_mean": 4977.5, "valid_targets_min": 2008 }, { "epoch": 0.5232, "grad_norm": 0.19912853298801866, "learning_rate": 3.9997625422448114e-05, "loss": 0.0085, "loss_nan_ranks": 0, "loss_rank_avg": 0.0031935221049934626, "step": 545, "valid_targets_mean": 3682.2, "valid_targets_min": 1887 }, { "epoch": 0.528, "grad_norm": 0.23896432906358125, "learning_rate": 3.999648081088391e-05, "loss": 0.0084, "loss_nan_ranks": 0, "loss_rank_avg": 0.0029742794577032328, "step": 550, "valid_targets_mean": 2679.8, "valid_targets_min": 1361 }, { "epoch": 0.5328, "grad_norm": 0.1861883799280027, "learning_rate": 3.999511179435905e-05, "loss": 0.0081, "loss_nan_ranks": 0, "loss_rank_avg": 0.003043075557798147, "step": 555, "valid_targets_mean": 4540.3, "valid_targets_min": 1925 }, { "epoch": 0.5376, "grad_norm": 0.199027392427487, "learning_rate": 3.999351838823691e-05, "loss": 0.0073, "loss_nan_ranks": 0, "loss_rank_avg": 0.0025762999430298805, "step": 560, "valid_targets_mean": 3683.8, "valid_targets_min": 1924 }, { "epoch": 0.5424, "grad_norm": 0.17389819697427045, "learning_rate": 3.999170061039908e-05, "loss": 0.0081, "loss_nan_ranks": 0, "loss_rank_avg": 0.0023557578679174185, "step": 565, "valid_targets_mean": 3989.9, "valid_targets_min": 2056 }, { "epoch": 0.5472, "grad_norm": 0.2334228789161362, "learning_rate": 3.998965848124505e-05, "loss": 0.0078, "loss_nan_ranks": 0, "loss_rank_avg": 0.00438684830442071, "step": 570, "valid_targets_mean": 3362.2, "valid_targets_min": 2027 }, { "epoch": 0.552, "grad_norm": 0.17945821748347074, "learning_rate": 3.998739202369205e-05, "loss": 0.0076, "loss_nan_ranks": 0, "loss_rank_avg": 0.002859172411262989, "step": 575, "valid_targets_mean": 3952.9, "valid_targets_min": 1924 }, { "epoch": 0.5568, "grad_norm": 0.18678690741356818, "learning_rate": 3.998490126317477e-05, "loss": 0.0071, "loss_nan_ranks": 0, "loss_rank_avg": 0.002055731136351824, "step": 580, "valid_targets_mean": 3083.8, "valid_targets_min": 1950 }, { "epoch": 0.5616, "grad_norm": 0.18250900877509713, "learning_rate": 3.9982186227645085e-05, "loss": 0.0065, "loss_nan_ranks": 0, "loss_rank_avg": 0.00249089440330863, "step": 585, "valid_targets_mean": 3829.1, "valid_targets_min": 1829 }, { "epoch": 0.5664, "grad_norm": 0.25762748462961554, "learning_rate": 3.9979246947571724e-05, "loss": 0.0075, "loss_nan_ranks": 0, "loss_rank_avg": 0.00278734159655869, "step": 590, "valid_targets_mean": 3546.0, "valid_targets_min": 1847 }, { "epoch": 0.5712, "grad_norm": 0.16262986702540477, "learning_rate": 3.9976083455939945e-05, "loss": 0.007, "loss_nan_ranks": 0, "loss_rank_avg": 0.0021733571775257587, "step": 595, "valid_targets_mean": 3765.6, "valid_targets_min": 1820 }, { "epoch": 0.576, "grad_norm": 0.15646991186627635, "learning_rate": 3.9972695788251155e-05, "loss": 0.007, "loss_nan_ranks": 0, "loss_rank_avg": 0.0019335944671183825, "step": 600, "valid_targets_mean": 2733.1, "valid_targets_min": 1948 }, { "epoch": 0.5808, "grad_norm": 0.1866634582185585, "learning_rate": 3.996908398252251e-05, "loss": 0.0067, "loss_nan_ranks": 0, "loss_rank_avg": 0.002379871904850006, "step": 605, "valid_targets_mean": 3607.9, "valid_targets_min": 1361 }, { "epoch": 0.5856, "grad_norm": 0.17961524657660505, "learning_rate": 3.9965248079286505e-05, "loss": 0.0065, "loss_nan_ranks": 0, "loss_rank_avg": 0.0021986260544508696, "step": 610, "valid_targets_mean": 3557.2, "valid_targets_min": 1716 }, { "epoch": 0.5904, "grad_norm": 0.17270751315569516, "learning_rate": 3.99611881215905e-05, "loss": 0.0063, "loss_nan_ranks": 0, "loss_rank_avg": 0.001944814925082028, "step": 615, "valid_targets_mean": 3441.6, "valid_targets_min": 1652 }, { "epoch": 0.5952, "grad_norm": 0.16463245499969842, "learning_rate": 3.995690415499624e-05, "loss": 0.0061, "loss_nan_ranks": 0, "loss_rank_avg": 0.002012577373534441, "step": 620, "valid_targets_mean": 4407.1, "valid_targets_min": 1972 }, { "epoch": 0.6, "grad_norm": 0.1498606450916074, "learning_rate": 3.995239622757936e-05, "loss": 0.0059, "loss_nan_ranks": 0, "loss_rank_avg": 0.0020940229296684265, "step": 625, "valid_targets_mean": 3533.7, "valid_targets_min": 1760 }, { "epoch": 0.6048, "grad_norm": 0.16182624313567134, "learning_rate": 3.994766438992882e-05, "loss": 0.0063, "loss_nan_ranks": 0, "loss_rank_avg": 0.002139991382136941, "step": 630, "valid_targets_mean": 3479.1, "valid_targets_min": 1727 }, { "epoch": 0.6096, "grad_norm": 0.16492253100569335, "learning_rate": 3.994270869514635e-05, "loss": 0.0061, "loss_nan_ranks": 0, "loss_rank_avg": 0.0020363912917673588, "step": 635, "valid_targets_mean": 3303.8, "valid_targets_min": 1361 }, { "epoch": 0.6144, "grad_norm": 0.19146820633459416, "learning_rate": 3.9937529198845864e-05, "loss": 0.0057, "loss_nan_ranks": 0, "loss_rank_avg": 0.0017477039946243167, "step": 640, "valid_targets_mean": 4908.4, "valid_targets_min": 1833 }, { "epoch": 0.6192, "grad_norm": 0.16755843461256645, "learning_rate": 3.9932125959152833e-05, "loss": 0.0051, "loss_nan_ranks": 0, "loss_rank_avg": 0.001417946070432663, "step": 645, "valid_targets_mean": 3218.1, "valid_targets_min": 1763 }, { "epoch": 0.624, "grad_norm": 0.1491212416818786, "learning_rate": 3.9926499036703607e-05, "loss": 0.0064, "loss_nan_ranks": 0, "loss_rank_avg": 0.0022455165162682533, "step": 650, "valid_targets_mean": 4048.8, "valid_targets_min": 1930 }, { "epoch": 0.6288, "grad_norm": 0.17871275289420183, "learning_rate": 3.992064849464476e-05, "loss": 0.0056, "loss_nan_ranks": 0, "loss_rank_avg": 0.0021069804206490517, "step": 655, "valid_targets_mean": 3222.5, "valid_targets_min": 1939 }, { "epoch": 0.6336, "grad_norm": 0.15026244145657655, "learning_rate": 3.991457439863238e-05, "loss": 0.0052, "loss_nan_ranks": 0, "loss_rank_avg": 0.0020846365951001644, "step": 660, "valid_targets_mean": 4101.5, "valid_targets_min": 1802 }, { "epoch": 0.6384, "grad_norm": 0.15132033151846047, "learning_rate": 3.990827681683133e-05, "loss": 0.0054, "loss_nan_ranks": 0, "loss_rank_avg": 0.0013402425684034824, "step": 665, "valid_targets_mean": 4053.0, "valid_targets_min": 2089 }, { "epoch": 0.6432, "grad_norm": 0.14291482930175778, "learning_rate": 3.990175581991448e-05, "loss": 0.0052, "loss_nan_ranks": 0, "loss_rank_avg": 0.001968193333595991, "step": 670, "valid_targets_mean": 4646.0, "valid_targets_min": 1716 }, { "epoch": 0.648, "grad_norm": 0.13205771498876573, "learning_rate": 3.989501148106189e-05, "loss": 0.005, "loss_nan_ranks": 0, "loss_rank_avg": 0.0014164431486278772, "step": 675, "valid_targets_mean": 4138.6, "valid_targets_min": 1517 }, { "epoch": 0.6528, "grad_norm": 0.1454241022903471, "learning_rate": 3.988804387596005e-05, "loss": 0.0052, "loss_nan_ranks": 0, "loss_rank_avg": 0.0017517493106424809, "step": 680, "valid_targets_mean": 4377.7, "valid_targets_min": 1925 }, { "epoch": 0.6576, "grad_norm": 0.15080631968356206, "learning_rate": 3.9880853082800965e-05, "loss": 0.0051, "loss_nan_ranks": 0, "loss_rank_avg": 0.002116061747074127, "step": 685, "valid_targets_mean": 3755.3, "valid_targets_min": 1909 }, { "epoch": 0.6624, "grad_norm": 0.1377601399723467, "learning_rate": 3.987343918228133e-05, "loss": 0.0049, "loss_nan_ranks": 0, "loss_rank_avg": 0.0015512771205976605, "step": 690, "valid_targets_mean": 3227.3, "valid_targets_min": 1970 }, { "epoch": 0.6672, "grad_norm": 0.16894800757253736, "learning_rate": 3.9865802257601584e-05, "loss": 0.0051, "loss_nan_ranks": 0, "loss_rank_avg": 0.0015093731926754117, "step": 695, "valid_targets_mean": 3398.4, "valid_targets_min": 2031 }, { "epoch": 0.672, "grad_norm": 0.13885441728364661, "learning_rate": 3.9857942394464976e-05, "loss": 0.005, "loss_nan_ranks": 0, "loss_rank_avg": 0.0017606966430321336, "step": 700, "valid_targets_mean": 3476.6, "valid_targets_min": 1930 }, { "epoch": 0.6768, "grad_norm": 0.1338580199682233, "learning_rate": 3.984985968107667e-05, "loss": 0.0051, "loss_nan_ranks": 0, "loss_rank_avg": 0.001561261946335435, "step": 705, "valid_targets_mean": 4040.5, "valid_targets_min": 1913 }, { "epoch": 0.6816, "grad_norm": 0.1432672149680153, "learning_rate": 3.984155420814266e-05, "loss": 0.0047, "loss_nan_ranks": 0, "loss_rank_avg": 0.0013145990669727325, "step": 710, "valid_targets_mean": 4966.2, "valid_targets_min": 1988 }, { "epoch": 0.6864, "grad_norm": 0.13283116074357573, "learning_rate": 3.9833026068868814e-05, "loss": 0.0048, "loss_nan_ranks": 0, "loss_rank_avg": 0.001742208143696189, "step": 715, "valid_targets_mean": 4114.5, "valid_targets_min": 1914 }, { "epoch": 0.6912, "grad_norm": 0.12495828177583537, "learning_rate": 3.982427535895982e-05, "loss": 0.0043, "loss_nan_ranks": 0, "loss_rank_avg": 0.001497375313192606, "step": 720, "valid_targets_mean": 3872.3, "valid_targets_min": 1942 }, { "epoch": 0.696, "grad_norm": 0.26157930715172134, "learning_rate": 3.9815302176618076e-05, "loss": 0.0045, "loss_nan_ranks": 0, "loss_rank_avg": 0.0012776684015989304, "step": 725, "valid_targets_mean": 3521.8, "valid_targets_min": 1751 }, { "epoch": 0.7008, "grad_norm": 0.1247067429593807, "learning_rate": 3.980610662254264e-05, "loss": 0.0047, "loss_nan_ranks": 0, "loss_rank_avg": 0.0015188871184363961, "step": 730, "valid_targets_mean": 3731.8, "valid_targets_min": 1942 }, { "epoch": 0.7056, "grad_norm": 0.10721609529299062, "learning_rate": 3.9796688799928075e-05, "loss": 0.0044, "loss_nan_ranks": 0, "loss_rank_avg": 0.0013464395888149738, "step": 735, "valid_targets_mean": 4545.2, "valid_targets_min": 2003 }, { "epoch": 0.7104, "grad_norm": 0.14094264977785242, "learning_rate": 3.978704881446327e-05, "loss": 0.0044, "loss_nan_ranks": 0, "loss_rank_avg": 0.0014088444877415895, "step": 740, "valid_targets_mean": 3220.6, "valid_targets_min": 1906 }, { "epoch": 0.7152, "grad_norm": 0.10781543110136461, "learning_rate": 3.9777186774330304e-05, "loss": 0.0044, "loss_nan_ranks": 0, "loss_rank_avg": 0.0012600058689713478, "step": 745, "valid_targets_mean": 4427.3, "valid_targets_min": 2263 }, { "epoch": 0.72, "grad_norm": 0.12029787392855426, "learning_rate": 3.976710279020318e-05, "loss": 0.0043, "loss_nan_ranks": 0, "loss_rank_avg": 0.0010703550651669502, "step": 750, "valid_targets_mean": 4369.5, "valid_targets_min": 2020 }, { "epoch": 0.7248, "grad_norm": 0.15068996687496647, "learning_rate": 3.975679697524661e-05, "loss": 0.0046, "loss_nan_ranks": 0, "loss_rank_avg": 0.0014090463519096375, "step": 755, "valid_targets_mean": 4053.9, "valid_targets_min": 1917 }, { "epoch": 0.7296, "grad_norm": 0.12000665726518672, "learning_rate": 3.974626944511475e-05, "loss": 0.0041, "loss_nan_ranks": 0, "loss_rank_avg": 0.0011800779029726982, "step": 760, "valid_targets_mean": 3526.3, "valid_targets_min": 2033 }, { "epoch": 0.7344, "grad_norm": 0.10875222012783078, "learning_rate": 3.973552031794988e-05, "loss": 0.0042, "loss_nan_ranks": 0, "loss_rank_avg": 0.0012633678270503879, "step": 765, "valid_targets_mean": 5437.8, "valid_targets_min": 1943 }, { "epoch": 0.7392, "grad_norm": 0.11241217686368878, "learning_rate": 3.9724549714381106e-05, "loss": 0.0041, "loss_nan_ranks": 0, "loss_rank_avg": 0.0012497665593400598, "step": 770, "valid_targets_mean": 4326.5, "valid_targets_min": 2002 }, { "epoch": 0.744, "grad_norm": 0.11897759021143543, "learning_rate": 3.971335775752298e-05, "loss": 0.0045, "loss_nan_ranks": 0, "loss_rank_avg": 0.001275674207136035, "step": 775, "valid_targets_mean": 2989.6, "valid_targets_min": 1960 }, { "epoch": 0.7488, "grad_norm": 0.11558986969740365, "learning_rate": 3.970194457297414e-05, "loss": 0.0042, "loss_nan_ranks": 0, "loss_rank_avg": 0.0014982791617512703, "step": 780, "valid_targets_mean": 3710.9, "valid_targets_min": 1908 }, { "epoch": 0.7536, "grad_norm": 0.10741653865582416, "learning_rate": 3.9690310288815876e-05, "loss": 0.004, "loss_nan_ranks": 0, "loss_rank_avg": 0.00115393684245646, "step": 785, "valid_targets_mean": 4165.2, "valid_targets_min": 1775 }, { "epoch": 0.7584, "grad_norm": 0.11516842126720446, "learning_rate": 3.967845503561073e-05, "loss": 0.0043, "loss_nan_ranks": 0, "loss_rank_avg": 0.0013473081635311246, "step": 790, "valid_targets_mean": 4067.3, "valid_targets_min": 1942 }, { "epoch": 0.7632, "grad_norm": 0.11351545091236749, "learning_rate": 3.9666378946400974e-05, "loss": 0.0036, "loss_nan_ranks": 0, "loss_rank_avg": 0.001365464529953897, "step": 795, "valid_targets_mean": 3699.9, "valid_targets_min": 1833 }, { "epoch": 0.768, "grad_norm": 0.12309069150799558, "learning_rate": 3.965408215670719e-05, "loss": 0.004, "loss_nan_ranks": 0, "loss_rank_avg": 0.0013098465278744698, "step": 800, "valid_targets_mean": 3937.4, "valid_targets_min": 1964 }, { "epoch": 0.7728, "grad_norm": 0.12432078035897463, "learning_rate": 3.964156480452667e-05, "loss": 0.0042, "loss_nan_ranks": 0, "loss_rank_avg": 0.0015537126455456018, "step": 805, "valid_targets_mean": 4146.9, "valid_targets_min": 1764 }, { "epoch": 0.7776, "grad_norm": 0.11795652999166656, "learning_rate": 3.962882703033195e-05, "loss": 0.0043, "loss_nan_ranks": 0, "loss_rank_avg": 0.0011664225021377206, "step": 810, "valid_targets_mean": 4204.5, "valid_targets_min": 1939 }, { "epoch": 0.7824, "grad_norm": 0.11091476599630226, "learning_rate": 3.961586897706915e-05, "loss": 0.0036, "loss_nan_ranks": 0, "loss_rank_avg": 0.0015496142441406846, "step": 815, "valid_targets_mean": 4644.7, "valid_targets_min": 1939 }, { "epoch": 0.7872, "grad_norm": 0.10688116342811396, "learning_rate": 3.960269079015643e-05, "loss": 0.0039, "loss_nan_ranks": 0, "loss_rank_avg": 0.001176126068457961, "step": 820, "valid_targets_mean": 4056.7, "valid_targets_min": 1980 }, { "epoch": 0.792, "grad_norm": 0.11642692391730794, "learning_rate": 3.958929261748236e-05, "loss": 0.0036, "loss_nan_ranks": 0, "loss_rank_avg": 0.001297774026170373, "step": 825, "valid_targets_mean": 3668.7, "valid_targets_min": 1614 }, { "epoch": 0.7968, "grad_norm": 0.098807867074682, "learning_rate": 3.957567460940419e-05, "loss": 0.0038, "loss_nan_ranks": 0, "loss_rank_avg": 0.0012444111052900553, "step": 830, "valid_targets_mean": 4412.2, "valid_targets_min": 1763 }, { "epoch": 0.8016, "grad_norm": 0.11412160343259568, "learning_rate": 3.9561836918746256e-05, "loss": 0.0035, "loss_nan_ranks": 0, "loss_rank_avg": 0.0010612367186695337, "step": 835, "valid_targets_mean": 4943.7, "valid_targets_min": 1877 }, { "epoch": 0.8064, "grad_norm": 0.11666792034799639, "learning_rate": 3.95477797007982e-05, "loss": 0.0036, "loss_nan_ranks": 0, "loss_rank_avg": 0.0011054251808673143, "step": 840, "valid_targets_mean": 4050.5, "valid_targets_min": 1937 }, { "epoch": 0.8112, "grad_norm": 0.11538500128726843, "learning_rate": 3.953350311331325e-05, "loss": 0.0037, "loss_nan_ranks": 0, "loss_rank_avg": 0.0011343640508130193, "step": 845, "valid_targets_mean": 4588.8, "valid_targets_min": 1775 }, { "epoch": 0.816, "grad_norm": 0.09364586828014224, "learning_rate": 3.951900731650645e-05, "loss": 0.0034, "loss_nan_ranks": 0, "loss_rank_avg": 0.0010743942111730576, "step": 850, "valid_targets_mean": 4492.2, "valid_targets_min": 1906 }, { "epoch": 0.8208, "grad_norm": 0.11750177774881453, "learning_rate": 3.950429247305286e-05, "loss": 0.0036, "loss_nan_ranks": 0, "loss_rank_avg": 0.0011643307516351342, "step": 855, "valid_targets_mean": 2967.8, "valid_targets_min": 1680 }, { "epoch": 0.8256, "grad_norm": 0.11124286170862023, "learning_rate": 3.9489358748085737e-05, "loss": 0.0034, "loss_nan_ranks": 0, "loss_rank_avg": 0.001344716758467257, "step": 860, "valid_targets_mean": 3575.3, "valid_targets_min": 1771 }, { "epoch": 0.8304, "grad_norm": 0.1084575920874673, "learning_rate": 3.947420630919466e-05, "loss": 0.0034, "loss_nan_ranks": 0, "loss_rank_avg": 0.001134268008172512, "step": 865, "valid_targets_mean": 4376.6, "valid_targets_min": 1891 }, { "epoch": 0.8352, "grad_norm": 0.10852534059779477, "learning_rate": 3.9458835326423674e-05, "loss": 0.0035, "loss_nan_ranks": 0, "loss_rank_avg": 0.001093921484425664, "step": 870, "valid_targets_mean": 3641.3, "valid_targets_min": 1838 }, { "epoch": 0.84, "grad_norm": 0.1079926557884953, "learning_rate": 3.9443245972269376e-05, "loss": 0.0038, "loss_nan_ranks": 0, "loss_rank_avg": 0.0012400320265442133, "step": 875, "valid_targets_mean": 3411.1, "valid_targets_min": 1992 }, { "epoch": 0.8448, "grad_norm": 0.11238022059807141, "learning_rate": 3.942743842167896e-05, "loss": 0.0036, "loss_nan_ranks": 0, "loss_rank_avg": 0.0012292286846786737, "step": 880, "valid_targets_mean": 2977.5, "valid_targets_min": 1877 }, { "epoch": 0.8496, "grad_norm": 0.09672286411873122, "learning_rate": 3.941141285204829e-05, "loss": 0.0032, "loss_nan_ranks": 0, "loss_rank_avg": 0.0007136667263694108, "step": 885, "valid_targets_mean": 3401.6, "valid_targets_min": 1727 }, { "epoch": 0.8544, "grad_norm": 0.108672832404322, "learning_rate": 3.939516944321986e-05, "loss": 0.0031, "loss_nan_ranks": 0, "loss_rank_avg": 0.0014265866484493017, "step": 890, "valid_targets_mean": 5317.2, "valid_targets_min": 2096 }, { "epoch": 0.8592, "grad_norm": 0.08500035385803482, "learning_rate": 3.937870837748085e-05, "loss": 0.0031, "loss_nan_ranks": 0, "loss_rank_avg": 0.0007657730020582676, "step": 895, "valid_targets_mean": 4747.8, "valid_targets_min": 1652 }, { "epoch": 0.864, "grad_norm": 0.12054172577524297, "learning_rate": 3.936202983956098e-05, "loss": 0.0032, "loss_nan_ranks": 0, "loss_rank_avg": 0.0010280468268319964, "step": 900, "valid_targets_mean": 4090.7, "valid_targets_min": 1921 }, { "epoch": 0.8688, "grad_norm": 0.10234250480193231, "learning_rate": 3.934513401663052e-05, "loss": 0.0032, "loss_nan_ranks": 0, "loss_rank_avg": 0.0010562061797827482, "step": 905, "valid_targets_mean": 3031.4, "valid_targets_min": 1991 }, { "epoch": 0.8736, "grad_norm": 0.12774724999406212, "learning_rate": 3.9328021098298164e-05, "loss": 0.0035, "loss_nan_ranks": 0, "loss_rank_avg": 0.001268667634576559, "step": 910, "valid_targets_mean": 3329.1, "valid_targets_min": 2014 }, { "epoch": 0.8784, "grad_norm": 0.10641838411361687, "learning_rate": 3.9310691276608894e-05, "loss": 0.0032, "loss_nan_ranks": 0, "loss_rank_avg": 0.000988850835710764, "step": 915, "valid_targets_mean": 3899.7, "valid_targets_min": 1716 }, { "epoch": 0.8832, "grad_norm": 0.10827132525574004, "learning_rate": 3.9293144746041824e-05, "loss": 0.0031, "loss_nan_ranks": 0, "loss_rank_avg": 0.0011344174854457378, "step": 920, "valid_targets_mean": 3272.9, "valid_targets_min": 1760 }, { "epoch": 0.888, "grad_norm": 0.09513704022755502, "learning_rate": 3.9275381703508034e-05, "loss": 0.0032, "loss_nan_ranks": 0, "loss_rank_avg": 0.0011016558855772018, "step": 925, "valid_targets_mean": 3681.6, "valid_targets_min": 1836 }, { "epoch": 0.8928, "grad_norm": 0.07861451847755797, "learning_rate": 3.925740234834833e-05, "loss": 0.0028, "loss_nan_ranks": 0, "loss_rank_avg": 0.0006670982111245394, "step": 930, "valid_targets_mean": 4255.3, "valid_targets_min": 1361 }, { "epoch": 0.8976, "grad_norm": 0.09716097453724373, "learning_rate": 3.9239206882331045e-05, "loss": 0.0028, "loss_nan_ranks": 0, "loss_rank_avg": 0.0010126556735485792, "step": 935, "valid_targets_mean": 4101.5, "valid_targets_min": 1933 }, { "epoch": 0.9024, "grad_norm": 0.09329297657208854, "learning_rate": 3.922079550964976e-05, "loss": 0.0034, "loss_nan_ranks": 0, "loss_rank_avg": 0.001035340828821063, "step": 940, "valid_targets_mean": 3683.1, "valid_targets_min": 1912 }, { "epoch": 0.9072, "grad_norm": 0.10634525538037214, "learning_rate": 3.920216843692099e-05, "loss": 0.003, "loss_nan_ranks": 0, "loss_rank_avg": 0.0008592663798481226, "step": 945, "valid_targets_mean": 3470.2, "valid_targets_min": 1942 }, { "epoch": 0.912, "grad_norm": 0.09331321143620223, "learning_rate": 3.918332587318189e-05, "loss": 0.0031, "loss_nan_ranks": 0, "loss_rank_avg": 0.0009684814722277224, "step": 950, "valid_targets_mean": 3834.3, "valid_targets_min": 1921 }, { "epoch": 0.9168, "grad_norm": 0.0933007582514206, "learning_rate": 3.916426802988791e-05, "loss": 0.0031, "loss_nan_ranks": 0, "loss_rank_avg": 0.0009699763031676412, "step": 955, "valid_targets_mean": 4792.5, "valid_targets_min": 1802 }, { "epoch": 0.9216, "grad_norm": 0.08822587812104978, "learning_rate": 3.9144995120910414e-05, "loss": 0.0029, "loss_nan_ranks": 0, "loss_rank_avg": 0.001074823783710599, "step": 960, "valid_targets_mean": 4560.1, "valid_targets_min": 2210 }, { "epoch": 0.9264, "grad_norm": 0.10596108991960777, "learning_rate": 3.912550736253428e-05, "loss": 0.0029, "loss_nan_ranks": 0, "loss_rank_avg": 0.0008593408274464309, "step": 965, "valid_targets_mean": 3210.6, "valid_targets_min": 1833 }, { "epoch": 0.9312, "grad_norm": 0.08707190113521034, "learning_rate": 3.9105804973455466e-05, "loss": 0.0031, "loss_nan_ranks": 0, "loss_rank_avg": 0.0010110901203006506, "step": 970, "valid_targets_mean": 4952.5, "valid_targets_min": 1987 }, { "epoch": 0.936, "grad_norm": 0.09171050448973861, "learning_rate": 3.908588817477858e-05, "loss": 0.0028, "loss_nan_ranks": 0, "loss_rank_avg": 0.0010078486520797014, "step": 975, "valid_targets_mean": 5238.2, "valid_targets_min": 1863 }, { "epoch": 0.9408, "grad_norm": 0.09164652188624466, "learning_rate": 3.9065757190014356e-05, "loss": 0.0027, "loss_nan_ranks": 0, "loss_rank_avg": 0.0008506424492225051, "step": 980, "valid_targets_mean": 4875.0, "valid_targets_min": 1925 }, { "epoch": 0.9456, "grad_norm": 0.10980723053180172, "learning_rate": 3.90454122450772e-05, "loss": 0.0027, "loss_nan_ranks": 0, "loss_rank_avg": 0.0008993170922622085, "step": 985, "valid_targets_mean": 3326.2, "valid_targets_min": 1920 }, { "epoch": 0.9504, "grad_norm": 0.08983452553358251, "learning_rate": 3.9024853568282615e-05, "loss": 0.0031, "loss_nan_ranks": 0, "loss_rank_avg": 0.0009225120302289724, "step": 990, "valid_targets_mean": 4108.7, "valid_targets_min": 1975 }, { "epoch": 0.9552, "grad_norm": 0.09169525441917338, "learning_rate": 3.900408139034464e-05, "loss": 0.0028, "loss_nan_ranks": 0, "loss_rank_avg": 0.0007527648704126477, "step": 995, "valid_targets_mean": 3358.1, "valid_targets_min": 1908 }, { "epoch": 0.96, "grad_norm": 0.08231724789721716, "learning_rate": 3.89830959443733e-05, "loss": 0.0028, "loss_nan_ranks": 0, "loss_rank_avg": 0.0007301989244297147, "step": 1000, "valid_targets_mean": 3902.4, "valid_targets_min": 1719 }, { "epoch": 0.9648, "grad_norm": 0.09136251476965629, "learning_rate": 3.896189746587192e-05, "loss": 0.0026, "loss_nan_ranks": 0, "loss_rank_avg": 0.0006765191210433841, "step": 1005, "valid_targets_mean": 3040.7, "valid_targets_min": 1992 }, { "epoch": 0.9696, "grad_norm": 0.0973881927043345, "learning_rate": 3.894048619273457e-05, "loss": 0.0027, "loss_nan_ranks": 0, "loss_rank_avg": 0.0008304090006276965, "step": 1010, "valid_targets_mean": 3484.0, "valid_targets_min": 2008 }, { "epoch": 0.9744, "grad_norm": 0.10329326340033367, "learning_rate": 3.89188623652433e-05, "loss": 0.0027, "loss_nan_ranks": 0, "loss_rank_avg": 0.0010426387889310718, "step": 1015, "valid_targets_mean": 3487.8, "valid_targets_min": 1933 }, { "epoch": 0.9792, "grad_norm": 0.08556444578908518, "learning_rate": 3.889702622606553e-05, "loss": 0.0028, "loss_nan_ranks": 0, "loss_rank_avg": 0.0011887401342391968, "step": 1020, "valid_targets_mean": 4090.1, "valid_targets_min": 1951 }, { "epoch": 0.984, "grad_norm": 0.08515059162016657, "learning_rate": 3.887497802025129e-05, "loss": 0.0024, "loss_nan_ranks": 0, "loss_rank_avg": 0.0007636288064531982, "step": 1025, "valid_targets_mean": 4201.1, "valid_targets_min": 1920 }, { "epoch": 0.9888, "grad_norm": 0.09535626849370749, "learning_rate": 3.885271799523043e-05, "loss": 0.0026, "loss_nan_ranks": 0, "loss_rank_avg": 0.0009697978966869414, "step": 1030, "valid_targets_mean": 3636.8, "valid_targets_min": 1614 }, { "epoch": 0.9936, "grad_norm": 0.0980669848781187, "learning_rate": 3.8830246400809925e-05, "loss": 0.0029, "loss_nan_ranks": 0, "loss_rank_avg": 0.0009542859625071287, "step": 1035, "valid_targets_mean": 3659.2, "valid_targets_min": 1870 }, { "epoch": 0.9984, "grad_norm": 0.08778230952309017, "learning_rate": 3.880756348917101e-05, "loss": 0.003, "loss_nan_ranks": 0, "loss_rank_avg": 0.0012875967659056187, "step": 1040, "valid_targets_mean": 4062.1, "valid_targets_min": 2081 }, { "epoch": 1.00288, "grad_norm": 0.086197700086096, "learning_rate": 3.8784669514866365e-05, "loss": 0.0025, "loss_nan_ranks": 0, "loss_rank_avg": 0.0009929087245836854, "step": 1045, "valid_targets_mean": 3231.5, "valid_targets_min": 1719 }, { "epoch": 1.00768, "grad_norm": 0.08547866320552522, "learning_rate": 3.876156473481727e-05, "loss": 0.0027, "loss_nan_ranks": 0, "loss_rank_avg": 0.000846736365929246, "step": 1050, "valid_targets_mean": 4431.3, "valid_targets_min": 1993 }, { "epoch": 1.01248, "grad_norm": 0.08391253769447353, "learning_rate": 3.8738249408310716e-05, "loss": 0.0024, "loss_nan_ranks": 0, "loss_rank_avg": 0.0007149117300286889, "step": 1055, "valid_targets_mean": 3551.1, "valid_targets_min": 1771 }, { "epoch": 1.01728, "grad_norm": 0.07389756284878693, "learning_rate": 3.871472379699648e-05, "loss": 0.0023, "loss_nan_ranks": 0, "loss_rank_avg": 0.0007226199377328157, "step": 1060, "valid_targets_mean": 3603.4, "valid_targets_min": 2074 }, { "epoch": 1.02208, "grad_norm": 0.08190003923821697, "learning_rate": 3.869098816488422e-05, "loss": 0.0025, "loss_nan_ranks": 0, "loss_rank_avg": 0.0008007280994206667, "step": 1065, "valid_targets_mean": 3631.3, "valid_targets_min": 1970 }, { "epoch": 1.02688, "grad_norm": 0.0953727091278497, "learning_rate": 3.866704277834049e-05, "loss": 0.0025, "loss_nan_ranks": 0, "loss_rank_avg": 0.0009208035771735013, "step": 1070, "valid_targets_mean": 3726.2, "valid_targets_min": 1906 }, { "epoch": 1.03168, "grad_norm": 0.0782930286061942, "learning_rate": 3.864288790608573e-05, "loss": 0.0029, "loss_nan_ranks": 0, "loss_rank_avg": 0.0010479418560862541, "step": 1075, "valid_targets_mean": 4111.3, "valid_targets_min": 2026 }, { "epoch": 1.03648, "grad_norm": 0.08763252794635999, "learning_rate": 3.861852381919132e-05, "loss": 0.0023, "loss_nan_ranks": 0, "loss_rank_avg": 0.0008621154120191932, "step": 1080, "valid_targets_mean": 3631.4, "valid_targets_min": 2011 }, { "epoch": 1.04128, "grad_norm": 0.07975207664420085, "learning_rate": 3.8593950791076446e-05, "loss": 0.0023, "loss_nan_ranks": 0, "loss_rank_avg": 0.0007578890072181821, "step": 1085, "valid_targets_mean": 4506.1, "valid_targets_min": 1838 }, { "epoch": 1.04608, "grad_norm": 0.08519082868687813, "learning_rate": 3.856916909750512e-05, "loss": 0.0024, "loss_nan_ranks": 0, "loss_rank_avg": 0.0008825008408166468, "step": 1090, "valid_targets_mean": 3900.7, "valid_targets_min": 1889 }, { "epoch": 1.05088, "grad_norm": 0.08661350730724589, "learning_rate": 3.854417901658301e-05, "loss": 0.0027, "loss_nan_ranks": 0, "loss_rank_avg": 0.0010637170635163784, "step": 1095, "valid_targets_mean": 3464.5, "valid_targets_min": 1839 }, { "epoch": 1.05568, "grad_norm": 0.0779672388921201, "learning_rate": 3.851898082875438e-05, "loss": 0.0023, "loss_nan_ranks": 0, "loss_rank_avg": 0.0006217740592546761, "step": 1100, "valid_targets_mean": 3628.1, "valid_targets_min": 1802 }, { "epoch": 1.06048, "grad_norm": 0.07394866276608925, "learning_rate": 3.849357481679891e-05, "loss": 0.0023, "loss_nan_ranks": 0, "loss_rank_avg": 0.000598479644395411, "step": 1105, "valid_targets_mean": 3672.1, "valid_targets_min": 1562 }, { "epoch": 1.06528, "grad_norm": 0.08662140030567693, "learning_rate": 3.846796126582851e-05, "loss": 0.0023, "loss_nan_ranks": 0, "loss_rank_avg": 0.0008953436627052724, "step": 1110, "valid_targets_mean": 4051.2, "valid_targets_min": 1740 }, { "epoch": 1.07008, "grad_norm": 0.0823370220101719, "learning_rate": 3.844214046328416e-05, "loss": 0.0023, "loss_nan_ranks": 0, "loss_rank_avg": 0.0006970255635678768, "step": 1115, "valid_targets_mean": 3599.7, "valid_targets_min": 1928 }, { "epoch": 1.07488, "grad_norm": 0.0901193916034131, "learning_rate": 3.841611269893266e-05, "loss": 0.0022, "loss_nan_ranks": 0, "loss_rank_avg": 0.0006074707489460707, "step": 1120, "valid_targets_mean": 3385.9, "valid_targets_min": 1980 }, { "epoch": 1.07968, "grad_norm": 0.0761744661497128, "learning_rate": 3.8389878264863364e-05, "loss": 0.0026, "loss_nan_ranks": 0, "loss_rank_avg": 0.0008789674611762166, "step": 1125, "valid_targets_mean": 3657.1, "valid_targets_min": 1934 }, { "epoch": 1.08448, "grad_norm": 0.08437359007221527, "learning_rate": 3.836343745548495e-05, "loss": 0.0022, "loss_nan_ranks": 0, "loss_rank_avg": 0.0008096237434074283, "step": 1130, "valid_targets_mean": 3535.8, "valid_targets_min": 1906 }, { "epoch": 1.08928, "grad_norm": 0.0919856624688295, "learning_rate": 3.833679056752205e-05, "loss": 0.0023, "loss_nan_ranks": 0, "loss_rank_avg": 0.0010354400146752596, "step": 1135, "valid_targets_mean": 4240.6, "valid_targets_min": 1662 }, { "epoch": 1.09408, "grad_norm": 0.0672698854888288, "learning_rate": 3.8309937900012e-05, "loss": 0.0024, "loss_nan_ranks": 0, "loss_rank_avg": 0.0006182040087878704, "step": 1140, "valid_targets_mean": 5282.5, "valid_targets_min": 1847 }, { "epoch": 1.09888, "grad_norm": 0.09154431881180543, "learning_rate": 3.8282879754301395e-05, "loss": 0.0023, "loss_nan_ranks": 0, "loss_rank_avg": 0.0008248881786130369, "step": 1145, "valid_targets_mean": 3183.1, "valid_targets_min": 1868 }, { "epoch": 1.10368, "grad_norm": 0.08087150149583128, "learning_rate": 3.825561643404277e-05, "loss": 0.0024, "loss_nan_ranks": 0, "loss_rank_avg": 0.0006553860730491579, "step": 1150, "valid_targets_mean": 4181.3, "valid_targets_min": 1838 }, { "epoch": 1.10848, "grad_norm": 0.07350347984015675, "learning_rate": 3.8228148245191195e-05, "loss": 0.0024, "loss_nan_ranks": 0, "loss_rank_avg": 0.0006827219622209668, "step": 1155, "valid_targets_mean": 4734.0, "valid_targets_min": 2008 }, { "epoch": 1.11328, "grad_norm": 0.07091572829462224, "learning_rate": 3.820047549600078e-05, "loss": 0.0027, "loss_nan_ranks": 0, "loss_rank_avg": 0.0006135037983767688, "step": 1160, "valid_targets_mean": 3254.9, "valid_targets_min": 1525 }, { "epoch": 1.11808, "grad_norm": 0.0777569727802482, "learning_rate": 3.8172598497021304e-05, "loss": 0.0022, "loss_nan_ranks": 0, "loss_rank_avg": 0.0010421124752610922, "step": 1165, "valid_targets_mean": 4660.4, "valid_targets_min": 1705 }, { "epoch": 1.12288, "grad_norm": 0.08688863620334608, "learning_rate": 3.8144517561094635e-05, "loss": 0.0022, "loss_nan_ranks": 0, "loss_rank_avg": 0.0008928946917876601, "step": 1170, "valid_targets_mean": 3918.8, "valid_targets_min": 1907 }, { "epoch": 1.12768, "grad_norm": 0.07873600105581716, "learning_rate": 3.811623300335129e-05, "loss": 0.0021, "loss_nan_ranks": 0, "loss_rank_avg": 0.0007803626358509064, "step": 1175, "valid_targets_mean": 3826.0, "valid_targets_min": 1933 }, { "epoch": 1.13248, "grad_norm": 0.07726798965675107, "learning_rate": 3.808774514120689e-05, "loss": 0.0023, "loss_nan_ranks": 0, "loss_rank_avg": 0.0007038116455078125, "step": 1180, "valid_targets_mean": 2743.8, "valid_targets_min": 2007 }, { "epoch": 1.13728, "grad_norm": 0.07403528700578575, "learning_rate": 3.805905429435856e-05, "loss": 0.0021, "loss_nan_ranks": 0, "loss_rank_avg": 0.0009153485298156738, "step": 1185, "valid_targets_mean": 4641.1, "valid_targets_min": 1904 }, { "epoch": 1.14208, "grad_norm": 0.0872290553941291, "learning_rate": 3.803016078478137e-05, "loss": 0.0021, "loss_nan_ranks": 0, "loss_rank_avg": 0.0007584341801702976, "step": 1190, "valid_targets_mean": 3616.6, "valid_targets_min": 1925 }, { "epoch": 1.14688, "grad_norm": 0.0709258238934523, "learning_rate": 3.800106493672472e-05, "loss": 0.0023, "loss_nan_ranks": 0, "loss_rank_avg": 0.0006345144938677549, "step": 1195, "valid_targets_mean": 3609.2, "valid_targets_min": 1786 }, { "epoch": 1.15168, "grad_norm": 0.07801772343781505, "learning_rate": 3.7971767076708704e-05, "loss": 0.0022, "loss_nan_ranks": 0, "loss_rank_avg": 0.0009863885352388024, "step": 1200, "valid_targets_mean": 3440.6, "valid_targets_min": 1614 }, { "epoch": 1.15648, "grad_norm": 0.07389611823346304, "learning_rate": 3.794226753352042e-05, "loss": 0.002, "loss_nan_ranks": 0, "loss_rank_avg": 0.0007948827114887536, "step": 1205, "valid_targets_mean": 3287.3, "valid_targets_min": 1361 }, { "epoch": 1.16128, "grad_norm": 0.06497642766755227, "learning_rate": 3.791256663821032e-05, "loss": 0.0022, "loss_nan_ranks": 0, "loss_rank_avg": 0.0005222467589192092, "step": 1210, "valid_targets_mean": 4036.9, "valid_targets_min": 2034 }, { "epoch": 1.16608, "grad_norm": 0.06299482388250971, "learning_rate": 3.788266472408846e-05, "loss": 0.0021, "loss_nan_ranks": 0, "loss_rank_avg": 0.0005134165403433144, "step": 1215, "valid_targets_mean": 3814.6, "valid_targets_min": 1914 }, { "epoch": 1.17088, "grad_norm": 0.08171326113301111, "learning_rate": 3.785256212672077e-05, "loss": 0.0023, "loss_nan_ranks": 0, "loss_rank_avg": 0.0009849846828728914, "step": 1220, "valid_targets_mean": 3237.6, "valid_targets_min": 2013 }, { "epoch": 1.17568, "grad_norm": 0.0804150430123658, "learning_rate": 3.7822259183925324e-05, "loss": 0.0022, "loss_nan_ranks": 0, "loss_rank_avg": 0.0006895281840115786, "step": 1225, "valid_targets_mean": 3147.6, "valid_targets_min": 2073 }, { "epoch": 1.18048, "grad_norm": 0.07953442754835148, "learning_rate": 3.7791756235768476e-05, "loss": 0.0021, "loss_nan_ranks": 0, "loss_rank_avg": 0.0005019694799557328, "step": 1230, "valid_targets_mean": 4059.0, "valid_targets_min": 1986 }, { "epoch": 1.1852800000000001, "grad_norm": 0.06855513232526653, "learning_rate": 3.7761053624561104e-05, "loss": 0.0023, "loss_nan_ranks": 0, "loss_rank_avg": 0.0006399221601895988, "step": 1235, "valid_targets_mean": 4481.3, "valid_targets_min": 1652 }, { "epoch": 1.19008, "grad_norm": 0.07266331471123853, "learning_rate": 3.7730151694854757e-05, "loss": 0.002, "loss_nan_ranks": 0, "loss_rank_avg": 0.0006030212971381843, "step": 1240, "valid_targets_mean": 3147.8, "valid_targets_min": 2112 }, { "epoch": 1.19488, "grad_norm": 0.07341874027666305, "learning_rate": 3.769905079343777e-05, "loss": 0.0019, "loss_nan_ranks": 0, "loss_rank_avg": 0.0005216033896431327, "step": 1245, "valid_targets_mean": 3752.4, "valid_targets_min": 2000 }, { "epoch": 1.19968, "grad_norm": 0.0772295236927303, "learning_rate": 3.766775126933138e-05, "loss": 0.0023, "loss_nan_ranks": 0, "loss_rank_avg": 0.0007670236518606544, "step": 1250, "valid_targets_mean": 3803.3, "valid_targets_min": 1887 }, { "epoch": 1.20448, "grad_norm": 0.06534912913900263, "learning_rate": 3.7636253473785815e-05, "loss": 0.002, "loss_nan_ranks": 0, "loss_rank_avg": 0.0006711517926305532, "step": 1255, "valid_targets_mean": 3514.3, "valid_targets_min": 1719 }, { "epoch": 1.20928, "grad_norm": 0.06650634860098974, "learning_rate": 3.760455776027636e-05, "loss": 0.0019, "loss_nan_ranks": 0, "loss_rank_avg": 0.000556517974473536, "step": 1260, "valid_targets_mean": 4241.4, "valid_targets_min": 1949 }, { "epoch": 1.21408, "grad_norm": 0.08877250893671114, "learning_rate": 3.7572664484499365e-05, "loss": 0.002, "loss_nan_ranks": 0, "loss_rank_avg": 0.0009134068968705833, "step": 1265, "valid_targets_mean": 2475.9, "valid_targets_min": 1900 }, { "epoch": 1.21888, "grad_norm": 0.07123738698666394, "learning_rate": 3.7540574004368264e-05, "loss": 0.0021, "loss_nan_ranks": 0, "loss_rank_avg": 0.0004884611698798835, "step": 1270, "valid_targets_mean": 4605.3, "valid_targets_min": 1833 }, { "epoch": 1.2236799999999999, "grad_norm": 0.06505623796756807, "learning_rate": 3.750828668000959e-05, "loss": 0.002, "loss_nan_ranks": 0, "loss_rank_avg": 0.0005974129308015108, "step": 1275, "valid_targets_mean": 3525.4, "valid_targets_min": 2047 }, { "epoch": 1.22848, "grad_norm": 0.061783395627733356, "learning_rate": 3.747580287375887e-05, "loss": 0.002, "loss_nan_ranks": 0, "loss_rank_avg": 0.0005115181556902826, "step": 1280, "valid_targets_mean": 4752.2, "valid_targets_min": 2102 }, { "epoch": 1.23328, "grad_norm": 0.06631151827050302, "learning_rate": 3.744312295015662e-05, "loss": 0.0021, "loss_nan_ranks": 0, "loss_rank_avg": 0.0005237223813310266, "step": 1285, "valid_targets_mean": 4775.7, "valid_targets_min": 1933 }, { "epoch": 1.23808, "grad_norm": 0.08273205851761135, "learning_rate": 3.7410247275944223e-05, "loss": 0.0021, "loss_nan_ranks": 0, "loss_rank_avg": 0.0007862814818508923, "step": 1290, "valid_targets_mean": 3475.9, "valid_targets_min": 1771 }, { "epoch": 1.24288, "grad_norm": 0.05896227722198991, "learning_rate": 3.737717622005981e-05, "loss": 0.0019, "loss_nan_ranks": 0, "loss_rank_avg": 0.0005240546306595206, "step": 1295, "valid_targets_mean": 4562.6, "valid_targets_min": 2026 }, { "epoch": 1.24768, "grad_norm": 0.0693995618369498, "learning_rate": 3.734391015363413e-05, "loss": 0.0018, "loss_nan_ranks": 0, "loss_rank_avg": 0.0005423809634521604, "step": 1300, "valid_targets_mean": 4364.8, "valid_targets_min": 1863 }, { "epoch": 1.25248, "grad_norm": 0.07369923985839384, "learning_rate": 3.7310449449986404e-05, "loss": 0.0019, "loss_nan_ranks": 0, "loss_rank_avg": 0.0005977890104986727, "step": 1305, "valid_targets_mean": 3853.8, "valid_targets_min": 1863 }, { "epoch": 1.25728, "grad_norm": 0.07551774484051925, "learning_rate": 3.727679448462009e-05, "loss": 0.0019, "loss_nan_ranks": 0, "loss_rank_avg": 0.0006663898238912225, "step": 1310, "valid_targets_mean": 3010.4, "valid_targets_min": 1912 }, { "epoch": 1.26208, "grad_norm": 0.064694527946226, "learning_rate": 3.7242945635218696e-05, "loss": 0.0019, "loss_nan_ranks": 0, "loss_rank_avg": 0.0006106563378125429, "step": 1315, "valid_targets_mean": 4648.5, "valid_targets_min": 1614 }, { "epoch": 1.26688, "grad_norm": 0.07397659737573328, "learning_rate": 3.720890328164156e-05, "loss": 0.002, "loss_nan_ranks": 0, "loss_rank_avg": 0.0007054214365780354, "step": 1320, "valid_targets_mean": 3650.5, "valid_targets_min": 1525 }, { "epoch": 1.27168, "grad_norm": 0.06335161480174571, "learning_rate": 3.717466780591956e-05, "loss": 0.002, "loss_nan_ranks": 0, "loss_rank_avg": 0.0006929860101081431, "step": 1325, "valid_targets_mean": 5325.5, "valid_targets_min": 2040 }, { "epoch": 1.27648, "grad_norm": 0.06804994355224919, "learning_rate": 3.7140239592250804e-05, "loss": 0.0019, "loss_nan_ranks": 0, "loss_rank_avg": 0.000726754660718143, "step": 1330, "valid_targets_mean": 4236.4, "valid_targets_min": 1877 }, { "epoch": 1.28128, "grad_norm": 0.06480070102782637, "learning_rate": 3.71056190269964e-05, "loss": 0.0018, "loss_nan_ranks": 0, "loss_rank_avg": 0.0006756271468475461, "step": 1335, "valid_targets_mean": 4148.4, "valid_targets_min": 1562 }, { "epoch": 1.2860800000000001, "grad_norm": 0.07074354812550124, "learning_rate": 3.7070806498676025e-05, "loss": 0.0018, "loss_nan_ranks": 0, "loss_rank_avg": 0.0006020993459969759, "step": 1340, "valid_targets_mean": 3465.2, "valid_targets_min": 2013 }, { "epoch": 1.29088, "grad_norm": 0.06503461305315013, "learning_rate": 3.7035802397963625e-05, "loss": 0.0015, "loss_nan_ranks": 0, "loss_rank_avg": 0.0006871588411740959, "step": 1345, "valid_targets_mean": 3813.0, "valid_targets_min": 1614 }, { "epoch": 1.29568, "grad_norm": 0.07401450353104723, "learning_rate": 3.700060711768302e-05, "loss": 0.0018, "loss_nan_ranks": 0, "loss_rank_avg": 0.0006600288324989378, "step": 1350, "valid_targets_mean": 3878.8, "valid_targets_min": 1839 }, { "epoch": 1.30048, "grad_norm": 0.07680667987027859, "learning_rate": 3.696522105280348e-05, "loss": 0.0017, "loss_nan_ranks": 0, "loss_rank_avg": 0.0007312206435017288, "step": 1355, "valid_targets_mean": 4043.9, "valid_targets_min": 1764 }, { "epoch": 1.30528, "grad_norm": 0.06469896222704227, "learning_rate": 3.6929644600435303e-05, "loss": 0.0019, "loss_nan_ranks": 0, "loss_rank_avg": 0.0006350899348035455, "step": 1360, "valid_targets_mean": 4086.7, "valid_targets_min": 1652 }, { "epoch": 1.3100800000000001, "grad_norm": 0.06477008506037779, "learning_rate": 3.689387815982536e-05, "loss": 0.0017, "loss_nan_ranks": 0, "loss_rank_avg": 0.0005677276058122516, "step": 1365, "valid_targets_mean": 4331.5, "valid_targets_min": 2088 }, { "epoch": 1.31488, "grad_norm": 0.06258396354088679, "learning_rate": 3.6857922132352617e-05, "loss": 0.0018, "loss_nan_ranks": 0, "loss_rank_avg": 0.0006163810612633824, "step": 1370, "valid_targets_mean": 4495.3, "valid_targets_min": 1705 }, { "epoch": 1.31968, "grad_norm": 0.07028510535202044, "learning_rate": 3.6821776921523615e-05, "loss": 0.0019, "loss_nan_ranks": 0, "loss_rank_avg": 0.0007107181008905172, "step": 1375, "valid_targets_mean": 3949.4, "valid_targets_min": 2014 }, { "epoch": 1.3244799999999999, "grad_norm": 0.05077976162402836, "learning_rate": 3.678544293296797e-05, "loss": 0.0016, "loss_nan_ranks": 0, "loss_rank_avg": 0.0004410394176375121, "step": 1380, "valid_targets_mean": 4144.0, "valid_targets_min": 1921 }, { "epoch": 1.32928, "grad_norm": 0.07438935849118425, "learning_rate": 3.674892057443378e-05, "loss": 0.0018, "loss_nan_ranks": 0, "loss_rank_avg": 0.0008442823309451342, "step": 1385, "valid_targets_mean": 4133.5, "valid_targets_min": 2143 }, { "epoch": 1.33408, "grad_norm": 0.0682757279109907, "learning_rate": 3.671221025578309e-05, "loss": 0.0018, "loss_nan_ranks": 0, "loss_rank_avg": 0.0007162219844758511, "step": 1390, "valid_targets_mean": 4855.8, "valid_targets_min": 1913 }, { "epoch": 1.33888, "grad_norm": 0.07341922338949, "learning_rate": 3.6675312388987274e-05, "loss": 0.0017, "loss_nan_ranks": 0, "loss_rank_avg": 0.0006667692796327174, "step": 1395, "valid_targets_mean": 3465.5, "valid_targets_min": 2030 }, { "epoch": 1.34368, "grad_norm": 0.07020332214835699, "learning_rate": 3.663822738812241e-05, "loss": 0.0017, "loss_nan_ranks": 0, "loss_rank_avg": 0.0006832577055320144, "step": 1400, "valid_targets_mean": 4072.4, "valid_targets_min": 2007 }, { "epoch": 1.34848, "grad_norm": 0.06099353552564727, "learning_rate": 3.660095566936462e-05, "loss": 0.0018, "loss_nan_ranks": 0, "loss_rank_avg": 0.00047730878577567637, "step": 1405, "valid_targets_mean": 5152.2, "valid_targets_min": 1977 }, { "epoch": 1.35328, "grad_norm": 0.05528893930640278, "learning_rate": 3.656349765098546e-05, "loss": 0.0016, "loss_nan_ranks": 0, "loss_rank_avg": 0.0005526028689928353, "step": 1410, "valid_targets_mean": 4026.0, "valid_targets_min": 2112 }, { "epoch": 1.35808, "grad_norm": 0.06445302958586464, "learning_rate": 3.652585375334714e-05, "loss": 0.0015, "loss_nan_ranks": 0, "loss_rank_avg": 0.0005105407908558846, "step": 1415, "valid_targets_mean": 4236.2, "valid_targets_min": 1662 }, { "epoch": 1.36288, "grad_norm": 0.06802186778046675, "learning_rate": 3.648802439889785e-05, "loss": 0.0016, "loss_nan_ranks": 0, "loss_rank_avg": 0.0005574011011049151, "step": 1420, "valid_targets_mean": 3783.2, "valid_targets_min": 1839 }, { "epoch": 1.36768, "grad_norm": 0.06528073484942466, "learning_rate": 3.645001001216705e-05, "loss": 0.0016, "loss_nan_ranks": 0, "loss_rank_avg": 0.0005780609208159149, "step": 1425, "valid_targets_mean": 2935.5, "valid_targets_min": 1838 }, { "epoch": 1.37248, "grad_norm": 0.05639907531689663, "learning_rate": 3.641181101976065e-05, "loss": 0.0017, "loss_nan_ranks": 0, "loss_rank_avg": 0.0004771294188685715, "step": 1430, "valid_targets_mean": 3967.0, "valid_targets_min": 1904 }, { "epoch": 1.37728, "grad_norm": 0.06966113126336215, "learning_rate": 3.637342785035624e-05, "loss": 0.0017, "loss_nan_ranks": 0, "loss_rank_avg": 0.0004934966564178467, "step": 1435, "valid_targets_mean": 4545.3, "valid_targets_min": 1680 }, { "epoch": 1.38208, "grad_norm": 0.06651395252299827, "learning_rate": 3.633486093469829e-05, "loss": 0.0017, "loss_nan_ranks": 0, "loss_rank_avg": 0.000541509420145303, "step": 1440, "valid_targets_mean": 3806.9, "valid_targets_min": 1907 }, { "epoch": 1.3868800000000001, "grad_norm": 0.06692400353511045, "learning_rate": 3.629611070559333e-05, "loss": 0.0018, "loss_nan_ranks": 0, "loss_rank_avg": 0.000700898002833128, "step": 1445, "valid_targets_mean": 2970.4, "valid_targets_min": 1727 }, { "epoch": 1.39168, "grad_norm": 0.0556009908675102, "learning_rate": 3.625717759790506e-05, "loss": 0.0016, "loss_nan_ranks": 0, "loss_rank_avg": 0.0005732535501010716, "step": 1450, "valid_targets_mean": 3820.5, "valid_targets_min": 1965 }, { "epoch": 1.39648, "grad_norm": 0.06579603095770614, "learning_rate": 3.621806204854947e-05, "loss": 0.0017, "loss_nan_ranks": 0, "loss_rank_avg": 0.0006776693044230342, "step": 1455, "valid_targets_mean": 3576.1, "valid_targets_min": 1719 }, { "epoch": 1.40128, "grad_norm": 0.057150898506148747, "learning_rate": 3.617876449648998e-05, "loss": 0.0016, "loss_nan_ranks": 0, "loss_rank_avg": 0.0006130424444563687, "step": 1460, "valid_targets_mean": 4522.8, "valid_targets_min": 1870 }, { "epoch": 1.40608, "grad_norm": 0.06670784102144113, "learning_rate": 3.613928538273247e-05, "loss": 0.0017, "loss_nan_ranks": 0, "loss_rank_avg": 0.00048188146320171654, "step": 1465, "valid_targets_mean": 3102.2, "valid_targets_min": 1972 }, { "epoch": 1.4108800000000001, "grad_norm": 0.06763203016388951, "learning_rate": 3.609962515032034e-05, "loss": 0.0017, "loss_nan_ranks": 0, "loss_rank_avg": 0.0006231270963326097, "step": 1470, "valid_targets_mean": 2779.9, "valid_targets_min": 1914 }, { "epoch": 1.41568, "grad_norm": 0.06280482861569853, "learning_rate": 3.605978424432954e-05, "loss": 0.0015, "loss_nan_ranks": 0, "loss_rank_avg": 0.0004219388938508928, "step": 1475, "valid_targets_mean": 3924.9, "valid_targets_min": 1984 }, { "epoch": 1.42048, "grad_norm": 0.07020653984883694, "learning_rate": 3.601976311186361e-05, "loss": 0.0016, "loss_nan_ranks": 0, "loss_rank_avg": 0.00041140051325783134, "step": 1480, "valid_targets_mean": 2816.9, "valid_targets_min": 1820 }, { "epoch": 1.4252799999999999, "grad_norm": 0.05898237565692731, "learning_rate": 3.597956220204861e-05, "loss": 0.0019, "loss_nan_ranks": 0, "loss_rank_avg": 0.0005558461998589337, "step": 1485, "valid_targets_mean": 4578.8, "valid_targets_min": 1763 }, { "epoch": 1.43008, "grad_norm": 0.057373824481315346, "learning_rate": 3.5939181966028084e-05, "loss": 0.0016, "loss_nan_ranks": 0, "loss_rank_avg": 0.000512075494043529, "step": 1490, "valid_targets_mean": 3754.1, "valid_targets_min": 1900 }, { "epoch": 1.43488, "grad_norm": 0.07125513076235777, "learning_rate": 3.589862285695804e-05, "loss": 0.0016, "loss_nan_ranks": 0, "loss_rank_avg": 0.0007729599601589143, "step": 1495, "valid_targets_mean": 3450.2, "valid_targets_min": 1705 }, { "epoch": 1.43968, "grad_norm": 0.060930732371940854, "learning_rate": 3.585788533000184e-05, "loss": 0.0015, "loss_nan_ranks": 0, "loss_rank_avg": 0.0006291154422797263, "step": 1500, "valid_targets_mean": 4446.1, "valid_targets_min": 1662 }, { "epoch": 1.44448, "grad_norm": 0.055811659510320806, "learning_rate": 3.581696984232508e-05, "loss": 0.0014, "loss_nan_ranks": 0, "loss_rank_avg": 0.00038417422911152244, "step": 1505, "valid_targets_mean": 3627.4, "valid_targets_min": 1705 }, { "epoch": 1.44928, "grad_norm": 0.061531493977022365, "learning_rate": 3.5775876853090465e-05, "loss": 0.0015, "loss_nan_ranks": 0, "loss_rank_avg": 0.0006389599875546992, "step": 1510, "valid_targets_mean": 3979.2, "valid_targets_min": 2031 }, { "epoch": 1.45408, "grad_norm": 0.0628987310198828, "learning_rate": 3.5734606823452686e-05, "loss": 0.0013, "loss_nan_ranks": 0, "loss_rank_avg": 0.0006298416992649436, "step": 1515, "valid_targets_mean": 3707.5, "valid_targets_min": 1839 }, { "epoch": 1.45888, "grad_norm": 0.06317191831321439, "learning_rate": 3.569316021655319e-05, "loss": 0.0016, "loss_nan_ranks": 0, "loss_rank_avg": 0.0004600128741003573, "step": 1520, "valid_targets_mean": 4283.7, "valid_targets_min": 1833 }, { "epoch": 1.46368, "grad_norm": 0.0568786391414204, "learning_rate": 3.565153749751505e-05, "loss": 0.0014, "loss_nan_ranks": 0, "loss_rank_avg": 0.0005623505567200482, "step": 1525, "valid_targets_mean": 4382.9, "valid_targets_min": 1727 }, { "epoch": 1.46848, "grad_norm": 0.06022997207628912, "learning_rate": 3.5609739133437666e-05, "loss": 0.0014, "loss_nan_ranks": 0, "loss_rank_avg": 0.0004593412159010768, "step": 1530, "valid_targets_mean": 4219.6, "valid_targets_min": 1877 }, { "epoch": 1.47328, "grad_norm": 0.062444717675455196, "learning_rate": 3.55677655933916e-05, "loss": 0.0015, "loss_nan_ranks": 0, "loss_rank_avg": 0.0005715553415939212, "step": 1535, "valid_targets_mean": 3537.5, "valid_targets_min": 1662 }, { "epoch": 1.47808, "grad_norm": 0.0625345202594014, "learning_rate": 3.5525617348413265e-05, "loss": 0.0016, "loss_nan_ranks": 0, "loss_rank_avg": 0.0006118146702647209, "step": 1540, "valid_targets_mean": 3959.2, "valid_targets_min": 1833 }, { "epoch": 1.48288, "grad_norm": 0.0676310496671364, "learning_rate": 3.5483294871499646e-05, "loss": 0.0013, "loss_nan_ranks": 0, "loss_rank_avg": 0.0005530751659534872, "step": 1545, "valid_targets_mean": 3372.5, "valid_targets_min": 1877 }, { "epoch": 1.4876800000000001, "grad_norm": 0.060396214971341365, "learning_rate": 3.544079863760302e-05, "loss": 0.0014, "loss_nan_ranks": 0, "loss_rank_avg": 0.00045702309580519795, "step": 1550, "valid_targets_mean": 4131.5, "valid_targets_min": 1838 }, { "epoch": 1.49248, "grad_norm": 0.054164127702003184, "learning_rate": 3.5398129123625565e-05, "loss": 0.0015, "loss_nan_ranks": 0, "loss_rank_avg": 0.00044832000276073813, "step": 1555, "valid_targets_mean": 3460.3, "valid_targets_min": 1938 }, { "epoch": 1.49728, "grad_norm": 0.04613403287715913, "learning_rate": 3.535528680841408e-05, "loss": 0.0014, "loss_nan_ranks": 0, "loss_rank_avg": 0.0003852218796964735, "step": 1560, "valid_targets_mean": 4295.8, "valid_targets_min": 1662 }, { "epoch": 1.5020799999999999, "grad_norm": 0.0500127512382979, "learning_rate": 3.5312272172754566e-05, "loss": 0.0015, "loss_nan_ranks": 0, "loss_rank_avg": 0.0002881671243812889, "step": 1565, "valid_targets_mean": 4434.7, "valid_targets_min": 2013 }, { "epoch": 1.50688, "grad_norm": 0.04570223243728663, "learning_rate": 3.5269085699366844e-05, "loss": 0.0015, "loss_nan_ranks": 0, "loss_rank_avg": 0.00036125804763287306, "step": 1570, "valid_targets_mean": 3563.8, "valid_targets_min": 1662 }, { "epoch": 1.5116800000000001, "grad_norm": 0.050115443527604414, "learning_rate": 3.5225727872899136e-05, "loss": 0.0014, "loss_nan_ranks": 0, "loss_rank_avg": 0.00035666252369992435, "step": 1575, "valid_targets_mean": 4493.9, "valid_targets_min": 1958 }, { "epoch": 1.51648, "grad_norm": 0.05814250073314437, "learning_rate": 3.518219917992262e-05, "loss": 0.0014, "loss_nan_ranks": 0, "loss_rank_avg": 0.0004859221226070076, "step": 1580, "valid_targets_mean": 3551.9, "valid_targets_min": 1918 }, { "epoch": 1.52128, "grad_norm": 0.06290377895194338, "learning_rate": 3.5138500108926e-05, "loss": 0.0014, "loss_nan_ranks": 0, "loss_rank_avg": 0.0005594316171482205, "step": 1585, "valid_targets_mean": 3467.0, "valid_targets_min": 1907 }, { "epoch": 1.5260799999999999, "grad_norm": 0.05486405846197014, "learning_rate": 3.509463115030995e-05, "loss": 0.0015, "loss_nan_ranks": 0, "loss_rank_avg": 0.0005741740460507572, "step": 1590, "valid_targets_mean": 3229.7, "valid_targets_min": 1908 }, { "epoch": 1.53088, "grad_norm": 0.05481084601712841, "learning_rate": 3.505059279638172e-05, "loss": 0.0015, "loss_nan_ranks": 0, "loss_rank_avg": 0.0004915180034004152, "step": 1595, "valid_targets_mean": 4382.2, "valid_targets_min": 1829 }, { "epoch": 1.5356800000000002, "grad_norm": 0.05643903234898962, "learning_rate": 3.500638554134952e-05, "loss": 0.0014, "loss_nan_ranks": 0, "loss_rank_avg": 0.0005215753335505724, "step": 1600, "valid_targets_mean": 4035.5, "valid_targets_min": 1934 }, { "epoch": 1.54048, "grad_norm": 0.05254977998780307, "learning_rate": 3.4962009881317005e-05, "loss": 0.0014, "loss_nan_ranks": 0, "loss_rank_avg": 0.0003885997866746038, "step": 1605, "valid_targets_mean": 4436.7, "valid_targets_min": 1839 }, { "epoch": 1.54528, "grad_norm": 0.04901711420583684, "learning_rate": 3.491746631427772e-05, "loss": 0.0014, "loss_nan_ranks": 0, "loss_rank_avg": 0.00030224508373066783, "step": 1610, "valid_targets_mean": 4003.0, "valid_targets_min": 1836 }, { "epoch": 1.55008, "grad_norm": 0.06623036966544768, "learning_rate": 3.487275534010948e-05, "loss": 0.0014, "loss_nan_ranks": 0, "loss_rank_avg": 0.00043395202374085784, "step": 1615, "valid_targets_mean": 3309.2, "valid_targets_min": 1964 }, { "epoch": 1.55488, "grad_norm": 0.048836873073373185, "learning_rate": 3.482787746056881e-05, "loss": 0.0012, "loss_nan_ranks": 0, "loss_rank_avg": 0.0002878532977774739, "step": 1620, "valid_targets_mean": 3198.2, "valid_targets_min": 1920 }, { "epoch": 1.55968, "grad_norm": 0.056913745823748994, "learning_rate": 3.4782833179285256e-05, "loss": 0.0014, "loss_nan_ranks": 0, "loss_rank_avg": 0.0003762117703445256, "step": 1625, "valid_targets_mean": 4056.7, "valid_targets_min": 2048 }, { "epoch": 1.56448, "grad_norm": 0.0639777721623604, "learning_rate": 3.473762300175578e-05, "loss": 0.0015, "loss_nan_ranks": 0, "loss_rank_avg": 0.0006554973078891635, "step": 1630, "valid_targets_mean": 4729.8, "valid_targets_min": 1913 }, { "epoch": 1.56928, "grad_norm": 0.051373274326048456, "learning_rate": 3.469224743533906e-05, "loss": 0.0014, "loss_nan_ranks": 0, "loss_rank_avg": 0.0003751883050426841, "step": 1635, "valid_targets_mean": 3390.2, "valid_targets_min": 1719 }, { "epoch": 1.57408, "grad_norm": 0.05691966457897771, "learning_rate": 3.464670698924981e-05, "loss": 0.0013, "loss_nan_ranks": 0, "loss_rank_avg": 0.0004305654438212514, "step": 1640, "valid_targets_mean": 3745.8, "valid_targets_min": 2113 }, { "epoch": 1.5788799999999998, "grad_norm": 0.05813617644285067, "learning_rate": 3.4601002174553055e-05, "loss": 0.0013, "loss_nan_ranks": 0, "loss_rank_avg": 0.0003666894044727087, "step": 1645, "valid_targets_mean": 2813.3, "valid_targets_min": 1716 }, { "epoch": 1.58368, "grad_norm": 0.05612945598126955, "learning_rate": 3.45551335041584e-05, "loss": 0.0014, "loss_nan_ranks": 0, "loss_rank_avg": 0.0006458326242864132, "step": 1650, "valid_targets_mean": 3816.4, "valid_targets_min": 1614 }, { "epoch": 1.5884800000000001, "grad_norm": 0.06049444178287035, "learning_rate": 3.4509101492814286e-05, "loss": 0.0012, "loss_nan_ranks": 0, "loss_rank_avg": 0.0003922865726053715, "step": 1655, "valid_targets_mean": 3021.3, "valid_targets_min": 1517 }, { "epoch": 1.59328, "grad_norm": 0.06005838628831204, "learning_rate": 3.446290665710219e-05, "loss": 0.0013, "loss_nan_ranks": 0, "loss_rank_avg": 0.000557239050976932, "step": 1660, "valid_targets_mean": 3385.1, "valid_targets_min": 1908 }, { "epoch": 1.59808, "grad_norm": 0.057545476191578786, "learning_rate": 3.441654951543085e-05, "loss": 0.0013, "loss_nan_ranks": 0, "loss_rank_avg": 0.0004963584360666573, "step": 1665, "valid_targets_mean": 3562.9, "valid_targets_min": 1937 }, { "epoch": 1.6028799999999999, "grad_norm": 0.0441759887433332, "learning_rate": 3.4370030588030425e-05, "loss": 0.0013, "loss_nan_ranks": 0, "loss_rank_avg": 0.0003990795521531254, "step": 1670, "valid_targets_mean": 4340.4, "valid_targets_min": 2031 }, { "epoch": 1.60768, "grad_norm": 0.06127534174000278, "learning_rate": 3.432335039694669e-05, "loss": 0.0012, "loss_nan_ranks": 0, "loss_rank_avg": 0.0003658411733340472, "step": 1675, "valid_targets_mean": 4327.9, "valid_targets_min": 1917 }, { "epoch": 1.6124800000000001, "grad_norm": 0.058767126137987784, "learning_rate": 3.427650946603513e-05, "loss": 0.0015, "loss_nan_ranks": 0, "loss_rank_avg": 0.0005258081946521997, "step": 1680, "valid_targets_mean": 3368.2, "valid_targets_min": 1966 }, { "epoch": 1.61728, "grad_norm": 0.0449556804757125, "learning_rate": 3.422950832095511e-05, "loss": 0.0013, "loss_nan_ranks": 0, "loss_rank_avg": 0.0003695829655043781, "step": 1685, "valid_targets_mean": 4248.2, "valid_targets_min": 1940 }, { "epoch": 1.62208, "grad_norm": 0.039865055155997225, "learning_rate": 3.418234748916395e-05, "loss": 0.0012, "loss_nan_ranks": 0, "loss_rank_avg": 0.00027950757066719234, "step": 1690, "valid_targets_mean": 4464.6, "valid_targets_min": 1838 }, { "epoch": 1.6268799999999999, "grad_norm": 0.052016803985212814, "learning_rate": 3.4135027499911003e-05, "loss": 0.0013, "loss_nan_ranks": 0, "loss_rank_avg": 0.0003943184856325388, "step": 1695, "valid_targets_mean": 3936.7, "valid_targets_min": 1829 }, { "epoch": 1.63168, "grad_norm": 0.050299889174442704, "learning_rate": 3.408754888423173e-05, "loss": 0.0013, "loss_nan_ranks": 0, "loss_rank_avg": 0.0003132482524961233, "step": 1700, "valid_targets_mean": 4339.2, "valid_targets_min": 1705 }, { "epoch": 1.6364800000000002, "grad_norm": 0.047308777354368184, "learning_rate": 3.403991217494172e-05, "loss": 0.0011, "loss_nan_ranks": 0, "loss_rank_avg": 0.0002561693836469203, "step": 1705, "valid_targets_mean": 3008.0, "valid_targets_min": 1836 }, { "epoch": 1.64128, "grad_norm": 0.05413378126480606, "learning_rate": 3.3992117906630744e-05, "loss": 0.0012, "loss_nan_ranks": 0, "loss_rank_avg": 0.0004959758371114731, "step": 1710, "valid_targets_mean": 4311.6, "valid_targets_min": 2001 }, { "epoch": 1.64608, "grad_norm": 0.04883708091963607, "learning_rate": 3.394416661565671e-05, "loss": 0.0012, "loss_nan_ranks": 0, "loss_rank_avg": 0.0003378509427420795, "step": 1715, "valid_targets_mean": 3893.9, "valid_targets_min": 1517 }, { "epoch": 1.65088, "grad_norm": 0.04414000339277738, "learning_rate": 3.389605884013969e-05, "loss": 0.0011, "loss_nan_ranks": 0, "loss_rank_avg": 0.0003347942838445306, "step": 1720, "valid_targets_mean": 3723.3, "valid_targets_min": 1933 }, { "epoch": 1.65568, "grad_norm": 0.055219278511505654, "learning_rate": 3.384779511995587e-05, "loss": 0.0013, "loss_nan_ranks": 0, "loss_rank_avg": 0.0002406383428024128, "step": 1725, "valid_targets_mean": 3163.8, "valid_targets_min": 1981 }, { "epoch": 1.66048, "grad_norm": 0.05296936286452832, "learning_rate": 3.379937599673144e-05, "loss": 0.0013, "loss_nan_ranks": 0, "loss_rank_avg": 0.00038539827801287174, "step": 1730, "valid_targets_mean": 2922.3, "valid_targets_min": 1525 }, { "epoch": 1.66528, "grad_norm": 0.06301281456735988, "learning_rate": 3.3750802013836596e-05, "loss": 0.0015, "loss_nan_ranks": 0, "loss_rank_avg": 0.0006307390285655856, "step": 1735, "valid_targets_mean": 3184.9, "valid_targets_min": 2030 }, { "epoch": 1.67008, "grad_norm": 0.040991134654555485, "learning_rate": 3.370207371637939e-05, "loss": 0.0011, "loss_nan_ranks": 0, "loss_rank_avg": 0.00027934444369748235, "step": 1740, "valid_targets_mean": 4248.1, "valid_targets_min": 1917 }, { "epoch": 1.67488, "grad_norm": 0.05525964959165724, "learning_rate": 3.3653191651199635e-05, "loss": 0.0012, "loss_nan_ranks": 0, "loss_rank_avg": 0.00043741060653701425, "step": 1745, "valid_targets_mean": 3096.0, "valid_targets_min": 1942 }, { "epoch": 1.6796799999999998, "grad_norm": 0.04948169779465362, "learning_rate": 3.360415636686274e-05, "loss": 0.0011, "loss_nan_ranks": 0, "loss_rank_avg": 0.00034553324803709984, "step": 1750, "valid_targets_mean": 3762.4, "valid_targets_min": 1839 }, { "epoch": 1.68448, "grad_norm": 0.057814928993456416, "learning_rate": 3.355496841365359e-05, "loss": 0.0013, "loss_nan_ranks": 0, "loss_rank_avg": 0.00034999416675418615, "step": 1755, "valid_targets_mean": 3363.3, "valid_targets_min": 1614 }, { "epoch": 1.6892800000000001, "grad_norm": 0.04656009081003181, "learning_rate": 3.350562834357034e-05, "loss": 0.0011, "loss_nan_ranks": 0, "loss_rank_avg": 0.0003240430378355086, "step": 1760, "valid_targets_mean": 4379.7, "valid_targets_min": 1928 }, { "epoch": 1.69408, "grad_norm": 0.04634663217611643, "learning_rate": 3.345613671031827e-05, "loss": 0.0013, "loss_nan_ranks": 0, "loss_rank_avg": 0.0003630942082963884, "step": 1765, "valid_targets_mean": 2665.6, "valid_targets_min": 1829 }, { "epoch": 1.69888, "grad_norm": 0.05389450610622448, "learning_rate": 3.340649406930349e-05, "loss": 0.0011, "loss_nan_ranks": 0, "loss_rank_avg": 0.00042325188405811787, "step": 1770, "valid_targets_mean": 3036.8, "valid_targets_min": 1908 }, { "epoch": 1.7036799999999999, "grad_norm": 0.04054004078806552, "learning_rate": 3.335670097762677e-05, "loss": 0.0012, "loss_nan_ranks": 0, "loss_rank_avg": 0.0003856320690829307, "step": 1775, "valid_targets_mean": 4150.5, "valid_targets_min": 1921 }, { "epoch": 1.70848, "grad_norm": 0.04319122595484807, "learning_rate": 3.330675799407728e-05, "loss": 0.001, "loss_nan_ranks": 0, "loss_rank_avg": 0.0002972689107991755, "step": 1780, "valid_targets_mean": 4059.9, "valid_targets_min": 2010 }, { "epoch": 1.7132800000000001, "grad_norm": 0.0614953115360606, "learning_rate": 3.32566656791263e-05, "loss": 0.0012, "loss_nan_ranks": 0, "loss_rank_avg": 0.00041061831871047616, "step": 1785, "valid_targets_mean": 3852.8, "valid_targets_min": 1820 }, { "epoch": 1.71808, "grad_norm": 0.05093908281170732, "learning_rate": 3.320642459492095e-05, "loss": 0.0012, "loss_nan_ranks": 0, "loss_rank_avg": 0.00046082702465355396, "step": 1790, "valid_targets_mean": 4709.6, "valid_targets_min": 1914 }, { "epoch": 1.72288, "grad_norm": 0.0405281692299427, "learning_rate": 3.315603530527785e-05, "loss": 0.0011, "loss_nan_ranks": 0, "loss_rank_avg": 0.0002832312893588096, "step": 1795, "valid_targets_mean": 4104.4, "valid_targets_min": 1829 }, { "epoch": 1.7276799999999999, "grad_norm": 0.04855015633898981, "learning_rate": 3.310549837567685e-05, "loss": 0.0012, "loss_nan_ranks": 0, "loss_rank_avg": 0.00033870741026476026, "step": 1800, "valid_targets_mean": 2691.3, "valid_targets_min": 2029 }, { "epoch": 1.73248, "grad_norm": 0.047363617105796715, "learning_rate": 3.3054814373254615e-05, "loss": 0.001, "loss_nan_ranks": 0, "loss_rank_avg": 0.0002556862309575081, "step": 1805, "valid_targets_mean": 3560.0, "valid_targets_min": 1974 }, { "epoch": 1.7372800000000002, "grad_norm": 0.06870257527043447, "learning_rate": 3.300398386679831e-05, "loss": 0.0012, "loss_nan_ranks": 0, "loss_rank_avg": 0.0005319949705153704, "step": 1810, "valid_targets_mean": 3655.3, "valid_targets_min": 1928 }, { "epoch": 1.74208, "grad_norm": 0.04543379139820006, "learning_rate": 3.2953007426739204e-05, "loss": 0.0011, "loss_nan_ranks": 0, "loss_rank_avg": 0.0006080212187953293, "step": 1815, "valid_targets_mean": 3771.9, "valid_targets_min": 1950 }, { "epoch": 1.74688, "grad_norm": 0.059110598595154995, "learning_rate": 3.290188562514624e-05, "loss": 0.0011, "loss_nan_ranks": 0, "loss_rank_avg": 0.0004835808358620852, "step": 1820, "valid_targets_mean": 3807.7, "valid_targets_min": 1929 }, { "epoch": 1.75168, "grad_norm": 0.053563524383162094, "learning_rate": 3.285061903571968e-05, "loss": 0.0011, "loss_nan_ranks": 0, "loss_rank_avg": 0.00036704057129099965, "step": 1825, "valid_targets_mean": 3920.9, "valid_targets_min": 1525 }, { "epoch": 1.75648, "grad_norm": 0.04025291938966945, "learning_rate": 3.27992082337846e-05, "loss": 0.0009, "loss_nan_ranks": 0, "loss_rank_avg": 0.0003524449421092868, "step": 1830, "valid_targets_mean": 3674.2, "valid_targets_min": 1775 }, { "epoch": 1.76128, "grad_norm": 0.04632488808634008, "learning_rate": 3.274765379628447e-05, "loss": 0.0011, "loss_nan_ranks": 0, "loss_rank_avg": 0.0003716344363056123, "step": 1835, "valid_targets_mean": 4068.3, "valid_targets_min": 1562 }, { "epoch": 1.76608, "grad_norm": 0.04633480317494468, "learning_rate": 3.2695956301774664e-05, "loss": 0.001, "loss_nan_ranks": 0, "loss_rank_avg": 0.0003534138377290219, "step": 1840, "valid_targets_mean": 4502.1, "valid_targets_min": 1820 }, { "epoch": 1.77088, "grad_norm": 0.05850594818743109, "learning_rate": 3.264411633041598e-05, "loss": 0.0012, "loss_nan_ranks": 0, "loss_rank_avg": 0.00048642410547472537, "step": 1845, "valid_targets_mean": 3579.4, "valid_targets_min": 1836 }, { "epoch": 1.77568, "grad_norm": 0.05387262915143158, "learning_rate": 3.259213446396812e-05, "loss": 0.0012, "loss_nan_ranks": 0, "loss_rank_avg": 0.0004213897336740047, "step": 1850, "valid_targets_mean": 4249.3, "valid_targets_min": 1912 }, { "epoch": 1.7804799999999998, "grad_norm": 0.04971774541588144, "learning_rate": 3.254001128578317e-05, "loss": 0.001, "loss_nan_ranks": 0, "loss_rank_avg": 0.0003937389701604843, "step": 1855, "valid_targets_mean": 4642.7, "valid_targets_min": 2057 }, { "epoch": 1.78528, "grad_norm": 0.05572299073574149, "learning_rate": 3.2487747380799036e-05, "loss": 0.0011, "loss_nan_ranks": 0, "loss_rank_avg": 0.000320199120324105, "step": 1860, "valid_targets_mean": 3592.1, "valid_targets_min": 1361 }, { "epoch": 1.7900800000000001, "grad_norm": 0.04950662800517279, "learning_rate": 3.243534333553291e-05, "loss": 0.0011, "loss_nan_ranks": 0, "loss_rank_avg": 0.0004355285782366991, "step": 1865, "valid_targets_mean": 3426.8, "valid_targets_min": 2025 }, { "epoch": 1.79488, "grad_norm": 0.045827956197243926, "learning_rate": 3.2382799738074635e-05, "loss": 0.001, "loss_nan_ranks": 0, "loss_rank_avg": 0.0002996047551278025, "step": 1870, "valid_targets_mean": 4818.6, "valid_targets_min": 1836 }, { "epoch": 1.79968, "grad_norm": 0.043499031883452915, "learning_rate": 3.2330117178080184e-05, "loss": 0.0012, "loss_nan_ranks": 0, "loss_rank_avg": 0.00030622404301539063, "step": 1875, "valid_targets_mean": 4497.5, "valid_targets_min": 1942 }, { "epoch": 1.8044799999999999, "grad_norm": 0.04161937474381663, "learning_rate": 3.227729624676497e-05, "loss": 0.0011, "loss_nan_ranks": 0, "loss_rank_avg": 0.0002968889311887324, "step": 1880, "valid_targets_mean": 4432.3, "valid_targets_min": 1740 }, { "epoch": 1.80928, "grad_norm": 0.049436031579658306, "learning_rate": 3.222433753689724e-05, "loss": 0.0011, "loss_nan_ranks": 0, "loss_rank_avg": 0.0002810401492752135, "step": 1885, "valid_targets_mean": 3545.3, "valid_targets_min": 2084 }, { "epoch": 1.8140800000000001, "grad_norm": 0.03577910696174026, "learning_rate": 3.2171241642791443e-05, "loss": 0.0011, "loss_nan_ranks": 0, "loss_rank_avg": 0.0002864730195142329, "step": 1890, "valid_targets_mean": 4110.9, "valid_targets_min": 1914 }, { "epoch": 1.81888, "grad_norm": 0.04253383606701866, "learning_rate": 3.211800916030152e-05, "loss": 0.001, "loss_nan_ranks": 0, "loss_rank_avg": 0.00027189357206225395, "step": 1895, "valid_targets_mean": 4199.0, "valid_targets_min": 1908 }, { "epoch": 1.82368, "grad_norm": 0.03981515952280382, "learning_rate": 3.206464068681424e-05, "loss": 0.001, "loss_nan_ranks": 0, "loss_rank_avg": 0.0003700641100294888, "step": 1900, "valid_targets_mean": 4726.0, "valid_targets_min": 1919 }, { "epoch": 1.8284799999999999, "grad_norm": 0.04678756520562075, "learning_rate": 3.20111368212425e-05, "loss": 0.0011, "loss_nan_ranks": 0, "loss_rank_avg": 0.0006207724800333381, "step": 1905, "valid_targets_mean": 4013.5, "valid_targets_min": 1839 }, { "epoch": 1.83328, "grad_norm": 0.042430851523702566, "learning_rate": 3.19574981640186e-05, "loss": 0.0011, "loss_nan_ranks": 0, "loss_rank_avg": 0.00034162524389103055, "step": 1910, "valid_targets_mean": 3786.6, "valid_targets_min": 1908 }, { "epoch": 1.8380800000000002, "grad_norm": 0.05215277248239781, "learning_rate": 3.1903725317087495e-05, "loss": 0.0011, "loss_nan_ranks": 0, "loss_rank_avg": 0.0004819263413082808, "step": 1915, "valid_targets_mean": 3923.4, "valid_targets_min": 1719 }, { "epoch": 1.84288, "grad_norm": 0.044629333978700496, "learning_rate": 3.184981888390003e-05, "loss": 0.001, "loss_nan_ranks": 0, "loss_rank_avg": 0.0003267807769589126, "step": 1920, "valid_targets_mean": 3651.1, "valid_targets_min": 2039 }, { "epoch": 1.84768, "grad_norm": 0.04480507387362986, "learning_rate": 3.1795779469406226e-05, "loss": 0.001, "loss_nan_ranks": 0, "loss_rank_avg": 0.00035782408667728305, "step": 1925, "valid_targets_mean": 3725.5, "valid_targets_min": 1786 }, { "epoch": 1.85248, "grad_norm": 0.041128453478606976, "learning_rate": 3.174160768004842e-05, "loss": 0.001, "loss_nan_ranks": 0, "loss_rank_avg": 0.00022609728330280632, "step": 1930, "valid_targets_mean": 5245.9, "valid_targets_min": 1680 }, { "epoch": 1.85728, "grad_norm": 0.05143151866954522, "learning_rate": 3.168730412375449e-05, "loss": 0.0011, "loss_nan_ranks": 0, "loss_rank_avg": 0.00044801694457419217, "step": 1935, "valid_targets_mean": 3150.0, "valid_targets_min": 1680 }, { "epoch": 1.86208, "grad_norm": 0.04692971584297232, "learning_rate": 3.1632869409931036e-05, "loss": 0.0009, "loss_nan_ranks": 0, "loss_rank_avg": 0.000266010407358408, "step": 1940, "valid_targets_mean": 3319.3, "valid_targets_min": 1775 }, { "epoch": 1.86688, "grad_norm": 0.03787908414763803, "learning_rate": 3.1578304149456544e-05, "loss": 0.0008, "loss_nan_ranks": 0, "loss_rank_avg": 0.00027268845587968826, "step": 1945, "valid_targets_mean": 4960.8, "valid_targets_min": 1829 }, { "epoch": 1.87168, "grad_norm": 0.05436027849322881, "learning_rate": 3.1523608954674524e-05, "loss": 0.0011, "loss_nan_ranks": 0, "loss_rank_avg": 0.00037563478690572083, "step": 1950, "valid_targets_mean": 3414.5, "valid_targets_min": 1958 }, { "epoch": 1.87648, "grad_norm": 0.042774282013460875, "learning_rate": 3.1468784439386614e-05, "loss": 0.0009, "loss_nan_ranks": 0, "loss_rank_avg": 0.0003659092471934855, "step": 1955, "valid_targets_mean": 3620.4, "valid_targets_min": 1904 }, { "epoch": 1.8812799999999998, "grad_norm": 0.04122380272897595, "learning_rate": 3.141383121884576e-05, "loss": 0.0009, "loss_nan_ranks": 0, "loss_rank_avg": 0.00034778908593580127, "step": 1960, "valid_targets_mean": 4347.6, "valid_targets_min": 2039 }, { "epoch": 1.88608, "grad_norm": 0.05330947792411219, "learning_rate": 3.1358749909749214e-05, "loss": 0.001, "loss_nan_ranks": 0, "loss_rank_avg": 0.00034708459861576557, "step": 1965, "valid_targets_mean": 4252.3, "valid_targets_min": 1959 }, { "epoch": 1.8908800000000001, "grad_norm": 0.049483338699360224, "learning_rate": 3.1303541130231703e-05, "loss": 0.0011, "loss_nan_ranks": 0, "loss_rank_avg": 0.0004025818780064583, "step": 1970, "valid_targets_mean": 4020.6, "valid_targets_min": 2012 }, { "epoch": 1.89568, "grad_norm": 0.049351126866147295, "learning_rate": 3.1248205499858446e-05, "loss": 0.0011, "loss_nan_ranks": 0, "loss_rank_avg": 0.0003342171257827431, "step": 1975, "valid_targets_mean": 3042.1, "valid_targets_min": 1943 }, { "epoch": 1.90048, "grad_norm": 0.042954433111331666, "learning_rate": 3.119274363961821e-05, "loss": 0.001, "loss_nan_ranks": 0, "loss_rank_avg": 0.00021361312246881425, "step": 1980, "valid_targets_mean": 3799.3, "valid_targets_min": 1942 }, { "epoch": 1.9052799999999999, "grad_norm": 0.03550201618878598, "learning_rate": 3.113715617191634e-05, "loss": 0.001, "loss_nan_ranks": 0, "loss_rank_avg": 0.0002286080562043935, "step": 1985, "valid_targets_mean": 4318.5, "valid_targets_min": 2010 }, { "epoch": 1.91008, "grad_norm": 0.0512979708140217, "learning_rate": 3.1081443720567785e-05, "loss": 0.001, "loss_nan_ranks": 0, "loss_rank_avg": 0.00040846579940989614, "step": 1990, "valid_targets_mean": 4275.7, "valid_targets_min": 1870 }, { "epoch": 1.9148800000000001, "grad_norm": 0.04322505692818679, "learning_rate": 3.102560691079007e-05, "loss": 0.001, "loss_nan_ranks": 0, "loss_rank_avg": 0.0003856475232169032, "step": 1995, "valid_targets_mean": 3959.7, "valid_targets_min": 1517 }, { "epoch": 1.91968, "grad_norm": 0.037866804711089004, "learning_rate": 3.0969646369196307e-05, "loss": 0.001, "loss_nan_ranks": 0, "loss_rank_avg": 0.00020155790844000876, "step": 2000, "valid_targets_mean": 3651.0, "valid_targets_min": 1906 }, { "epoch": 1.92448, "grad_norm": 0.03520402744171799, "learning_rate": 3.0913562723788174e-05, "loss": 0.0008, "loss_nan_ranks": 0, "loss_rank_avg": 0.00017841681255958974, "step": 2005, "valid_targets_mean": 3097.2, "valid_targets_min": 1900 }, { "epoch": 1.9292799999999999, "grad_norm": 0.04576720772413004, "learning_rate": 3.085735660394881e-05, "loss": 0.0009, "loss_nan_ranks": 0, "loss_rank_avg": 0.0002288795803906396, "step": 2010, "valid_targets_mean": 3696.0, "valid_targets_min": 1987 }, { "epoch": 1.93408, "grad_norm": 0.04933298500996939, "learning_rate": 3.080102864043581e-05, "loss": 0.001, "loss_nan_ranks": 0, "loss_rank_avg": 0.0004367926740087569, "step": 2015, "valid_targets_mean": 3204.1, "valid_targets_min": 2026 }, { "epoch": 1.9388800000000002, "grad_norm": 0.05260798047248693, "learning_rate": 3.074457946537413e-05, "loss": 0.001, "loss_nan_ranks": 0, "loss_rank_avg": 0.0003071989049203694, "step": 2020, "valid_targets_mean": 3134.8, "valid_targets_min": 1525 }, { "epoch": 1.94368, "grad_norm": 0.04380153388399339, "learning_rate": 3.068800971224898e-05, "loss": 0.001, "loss_nan_ranks": 0, "loss_rank_avg": 0.00030949185020290315, "step": 2025, "valid_targets_mean": 3797.7, "valid_targets_min": 1900 }, { "epoch": 1.94848, "grad_norm": 0.046800305647988746, "learning_rate": 3.0631320015898735e-05, "loss": 0.0009, "loss_nan_ranks": 0, "loss_rank_avg": 0.0003367983445059508, "step": 2030, "valid_targets_mean": 4517.7, "valid_targets_min": 1940 }, { "epoch": 1.95328, "grad_norm": 0.040178378749060155, "learning_rate": 3.057451101250778e-05, "loss": 0.001, "loss_nan_ranks": 0, "loss_rank_avg": 0.0002442404511384666, "step": 2035, "valid_targets_mean": 4852.8, "valid_targets_min": 1740 }, { "epoch": 1.95808, "grad_norm": 0.04509788359517867, "learning_rate": 3.051758333959941e-05, "loss": 0.0009, "loss_nan_ranks": 0, "loss_rank_avg": 0.0002550902427174151, "step": 2040, "valid_targets_mean": 3564.3, "valid_targets_min": 1991 }, { "epoch": 1.96288, "grad_norm": 0.03594320942598652, "learning_rate": 3.046053763602865e-05, "loss": 0.0007, "loss_nan_ranks": 0, "loss_rank_avg": 0.0004347126523498446, "step": 2045, "valid_targets_mean": 4681.1, "valid_targets_min": 1802 }, { "epoch": 1.96768, "grad_norm": 0.04263972629270992, "learning_rate": 3.0403374541975078e-05, "loss": 0.0011, "loss_nan_ranks": 0, "loss_rank_avg": 0.0003159629413858056, "step": 2050, "valid_targets_mean": 3935.8, "valid_targets_min": 1981 }, { "epoch": 1.97248, "grad_norm": 0.04122883968158281, "learning_rate": 3.034609469893567e-05, "loss": 0.0009, "loss_nan_ranks": 0, "loss_rank_avg": 0.0003064102493226528, "step": 2055, "valid_targets_mean": 3883.6, "valid_targets_min": 1802 }, { "epoch": 1.97728, "grad_norm": 0.04338278061662454, "learning_rate": 3.028869874971758e-05, "loss": 0.0009, "loss_nan_ranks": 0, "loss_rank_avg": 0.0002915991353802383, "step": 2060, "valid_targets_mean": 3029.1, "valid_targets_min": 1847 }, { "epoch": 1.9820799999999998, "grad_norm": 0.036355028310916124, "learning_rate": 3.0231187338430944e-05, "loss": 0.0008, "loss_nan_ranks": 0, "loss_rank_avg": 0.00035102188121527433, "step": 2065, "valid_targets_mean": 4931.2, "valid_targets_min": 1939 }, { "epoch": 1.98688, "grad_norm": 0.048383914402931466, "learning_rate": 3.0173561110481606e-05, "loss": 0.0008, "loss_nan_ranks": 0, "loss_rank_avg": 0.00023929959570523351, "step": 2070, "valid_targets_mean": 5375.9, "valid_targets_min": 1940 }, { "epoch": 1.9916800000000001, "grad_norm": 0.044115711212949424, "learning_rate": 3.011582071256394e-05, "loss": 0.0009, "loss_nan_ranks": 0, "loss_rank_avg": 0.00032735677086748183, "step": 2075, "valid_targets_mean": 3306.5, "valid_targets_min": 1727 }, { "epoch": 1.99648, "grad_norm": 0.04118373461485346, "learning_rate": 3.0057966792653547e-05, "loss": 0.0008, "loss_nan_ranks": 0, "loss_rank_avg": 0.00026323198108002543, "step": 2080, "valid_targets_mean": 4257.6, "valid_targets_min": 1829 }, { "epoch": 2.00096, "grad_norm": 0.033605720871692286, "learning_rate": 3.0000000000000004e-05, "loss": 0.0009, "loss_nan_ranks": 0, "loss_rank_avg": 0.00023035166668705642, "step": 2085, "valid_targets_mean": 3021.3, "valid_targets_min": 1820 }, { "epoch": 2.00576, "grad_norm": 0.03941509733719802, "learning_rate": 2.9941920985119562e-05, "loss": 0.0008, "loss_nan_ranks": 0, "loss_rank_avg": 0.0002633282565511763, "step": 2090, "valid_targets_mean": 3287.6, "valid_targets_min": 1906 }, { "epoch": 2.01056, "grad_norm": 0.04225606591711965, "learning_rate": 2.988373039978786e-05, "loss": 0.0009, "loss_nan_ranks": 0, "loss_rank_avg": 0.00025588853168301284, "step": 2095, "valid_targets_mean": 2852.6, "valid_targets_min": 1857 }, { "epoch": 2.01536, "grad_norm": 0.03849636401283634, "learning_rate": 2.98254288970326e-05, "loss": 0.0008, "loss_nan_ranks": 0, "loss_rank_avg": 0.0003536568838171661, "step": 2100, "valid_targets_mean": 4180.8, "valid_targets_min": 1802 }, { "epoch": 2.02016, "grad_norm": 0.04407578409722852, "learning_rate": 2.9767017131126245e-05, "loss": 0.0008, "loss_nan_ranks": 0, "loss_rank_avg": 0.00014297438610810786, "step": 2105, "valid_targets_mean": 3781.4, "valid_targets_min": 1919 }, { "epoch": 2.02496, "grad_norm": 0.045494787360105746, "learning_rate": 2.9708495757578633e-05, "loss": 0.0008, "loss_nan_ranks": 0, "loss_rank_avg": 0.00022338703274726868, "step": 2110, "valid_targets_mean": 4300.6, "valid_targets_min": 1942 }, { "epoch": 2.02976, "grad_norm": 0.03789723665227751, "learning_rate": 2.964986543312964e-05, "loss": 0.0008, "loss_nan_ranks": 0, "loss_rank_avg": 0.0002846395072992891, "step": 2115, "valid_targets_mean": 4121.6, "valid_targets_min": 1771 }, { "epoch": 2.03456, "grad_norm": 0.04835105817239923, "learning_rate": 2.9591126815741832e-05, "loss": 0.0009, "loss_nan_ranks": 0, "loss_rank_avg": 0.0004806315992027521, "step": 2120, "valid_targets_mean": 4034.5, "valid_targets_min": 1858 }, { "epoch": 2.03936, "grad_norm": 0.03915872767648746, "learning_rate": 2.953228056459305e-05, "loss": 0.0008, "loss_nan_ranks": 0, "loss_rank_avg": 0.00025110685965046287, "step": 2125, "valid_targets_mean": 4672.4, "valid_targets_min": 1863 }, { "epoch": 2.04416, "grad_norm": 0.04912331091299425, "learning_rate": 2.947332734006903e-05, "loss": 0.001, "loss_nan_ranks": 0, "loss_rank_avg": 0.0004711863584816456, "step": 2130, "valid_targets_mean": 3152.0, "valid_targets_min": 1652 }, { "epoch": 2.04896, "grad_norm": 0.03562616275436536, "learning_rate": 2.9414267803755988e-05, "loss": 0.001, "loss_nan_ranks": 0, "loss_rank_avg": 0.0003120258334092796, "step": 2135, "valid_targets_mean": 4770.2, "valid_targets_min": 1680 }, { "epoch": 2.05376, "grad_norm": 0.03446236345598084, "learning_rate": 2.9355102618433197e-05, "loss": 0.0008, "loss_nan_ranks": 0, "loss_rank_avg": 0.00023818084446247667, "step": 2140, "valid_targets_mean": 3193.0, "valid_targets_min": 1906 }, { "epoch": 2.05856, "grad_norm": 0.03753730116508484, "learning_rate": 2.929583244806553e-05, "loss": 0.0008, "loss_nan_ranks": 0, "loss_rank_avg": 0.0002192890678998083, "step": 2145, "valid_targets_mean": 4480.2, "valid_targets_min": 1960 }, { "epoch": 2.06336, "grad_norm": 0.049491292395218045, "learning_rate": 2.9236457957796047e-05, "loss": 0.0007, "loss_nan_ranks": 0, "loss_rank_avg": 0.0003270478919148445, "step": 2150, "valid_targets_mean": 3365.0, "valid_targets_min": 1877 }, { "epoch": 2.0681599999999998, "grad_norm": 0.04715131351475584, "learning_rate": 2.9176979813938494e-05, "loss": 0.0009, "loss_nan_ranks": 0, "loss_rank_avg": 0.0003005887265317142, "step": 2155, "valid_targets_mean": 3592.0, "valid_targets_min": 1562 }, { "epoch": 2.07296, "grad_norm": 0.045132727411257935, "learning_rate": 2.9117398683969857e-05, "loss": 0.0009, "loss_nan_ranks": 0, "loss_rank_avg": 0.0002569695352576673, "step": 2160, "valid_targets_mean": 4224.3, "valid_targets_min": 1928 }, { "epoch": 2.07776, "grad_norm": 0.045645196767944124, "learning_rate": 2.9057715236522833e-05, "loss": 0.0009, "loss_nan_ranks": 0, "loss_rank_avg": 0.0002819838700816035, "step": 2165, "valid_targets_mean": 3357.2, "valid_targets_min": 1786 }, { "epoch": 2.08256, "grad_norm": 0.047911519242527144, "learning_rate": 2.899793014137836e-05, "loss": 0.0009, "loss_nan_ranks": 0, "loss_rank_avg": 0.00036411883775144815, "step": 2170, "valid_targets_mean": 3320.3, "valid_targets_min": 1909 }, { "epoch": 2.08736, "grad_norm": 0.05180769284537206, "learning_rate": 2.8938044069458094e-05, "loss": 0.0009, "loss_nan_ranks": 0, "loss_rank_avg": 0.00034832872916013, "step": 2175, "valid_targets_mean": 3780.2, "valid_targets_min": 1958 }, { "epoch": 2.09216, "grad_norm": 0.046025193146755725, "learning_rate": 2.8878057692816877e-05, "loss": 0.0009, "loss_nan_ranks": 0, "loss_rank_avg": 0.0005058305687271059, "step": 2180, "valid_targets_mean": 3388.2, "valid_targets_min": 1907 }, { "epoch": 2.09696, "grad_norm": 0.03775721962047528, "learning_rate": 2.8817971684635178e-05, "loss": 0.0008, "loss_nan_ranks": 0, "loss_rank_avg": 0.0001705609611235559, "step": 2185, "valid_targets_mean": 3603.0, "valid_targets_min": 1863 }, { "epoch": 2.10176, "grad_norm": 0.04585119871874699, "learning_rate": 2.8757786719211555e-05, "loss": 0.0007, "loss_nan_ranks": 0, "loss_rank_avg": 0.00020783724903594702, "step": 2190, "valid_targets_mean": 3269.0, "valid_targets_min": 1908 }, { "epoch": 2.10656, "grad_norm": 0.03891090599039738, "learning_rate": 2.8697503471955106e-05, "loss": 0.0008, "loss_nan_ranks": 0, "loss_rank_avg": 0.0001934785395860672, "step": 2195, "valid_targets_mean": 4751.0, "valid_targets_min": 1614 }, { "epoch": 2.11136, "grad_norm": 0.038984861137829015, "learning_rate": 2.8637122619377848e-05, "loss": 0.0008, "loss_nan_ranks": 0, "loss_rank_avg": 0.000268601841526106, "step": 2200, "valid_targets_mean": 3949.3, "valid_targets_min": 1992 }, { "epoch": 2.11616, "grad_norm": 0.04030795470548875, "learning_rate": 2.8576644839087152e-05, "loss": 0.0007, "loss_nan_ranks": 0, "loss_rank_avg": 0.00018950544472318143, "step": 2205, "valid_targets_mean": 3396.4, "valid_targets_min": 1921 }, { "epoch": 2.12096, "grad_norm": 0.04272732693807203, "learning_rate": 2.8516070809778145e-05, "loss": 0.0008, "loss_nan_ranks": 0, "loss_rank_avg": 0.0001538700598757714, "step": 2210, "valid_targets_mean": 3320.9, "valid_targets_min": 1740 }, { "epoch": 2.12576, "grad_norm": 0.03964188235224993, "learning_rate": 2.845540121122607e-05, "loss": 0.0008, "loss_nan_ranks": 0, "loss_rank_avg": 0.0002259221364511177, "step": 2215, "valid_targets_mean": 4208.6, "valid_targets_min": 1887 }, { "epoch": 2.13056, "grad_norm": 0.04272357544341015, "learning_rate": 2.839463672427867e-05, "loss": 0.0009, "loss_nan_ranks": 0, "loss_rank_avg": 0.00033014221116900444, "step": 2220, "valid_targets_mean": 4028.6, "valid_targets_min": 1904 }, { "epoch": 2.13536, "grad_norm": 0.02931611152693843, "learning_rate": 2.833377803084855e-05, "loss": 0.0008, "loss_nan_ranks": 0, "loss_rank_avg": 0.00011045490828109905, "step": 2225, "valid_targets_mean": 3965.6, "valid_targets_min": 1863 }, { "epoch": 2.14016, "grad_norm": 0.03415035693128969, "learning_rate": 2.8272825813905522e-05, "loss": 0.0007, "loss_nan_ranks": 0, "loss_rank_avg": 0.0001376604486722499, "step": 2230, "valid_targets_mean": 3235.6, "valid_targets_min": 1857 }, { "epoch": 2.14496, "grad_norm": 0.03382136920768197, "learning_rate": 2.8211780757468942e-05, "loss": 0.0007, "loss_nan_ranks": 0, "loss_rank_avg": 0.00015516190615016967, "step": 2235, "valid_targets_mean": 3887.8, "valid_targets_min": 1919 }, { "epoch": 2.14976, "grad_norm": 0.044993094399656555, "learning_rate": 2.8150643546600012e-05, "loss": 0.0007, "loss_nan_ranks": 0, "loss_rank_avg": 0.0003087717341259122, "step": 2240, "valid_targets_mean": 3293.2, "valid_targets_min": 1928 }, { "epoch": 2.15456, "grad_norm": 0.03908152875549286, "learning_rate": 2.808941486739414e-05, "loss": 0.0008, "loss_nan_ranks": 0, "loss_rank_avg": 0.0002885219582822174, "step": 2245, "valid_targets_mean": 4638.7, "valid_targets_min": 1900 }, { "epoch": 2.15936, "grad_norm": 0.030928059487089134, "learning_rate": 2.80280954069732e-05, "loss": 0.0008, "loss_nan_ranks": 0, "loss_rank_avg": 0.00023226509802043438, "step": 2250, "valid_targets_mean": 3890.1, "valid_targets_min": 1951 }, { "epoch": 2.16416, "grad_norm": 0.03729014178961917, "learning_rate": 2.7966685853477828e-05, "loss": 0.0007, "loss_nan_ranks": 0, "loss_rank_avg": 0.0003418756532482803, "step": 2255, "valid_targets_mean": 3247.4, "valid_targets_min": 2231 }, { "epoch": 2.16896, "grad_norm": 0.0323102484575263, "learning_rate": 2.790518689605971e-05, "loss": 0.0008, "loss_nan_ranks": 0, "loss_rank_avg": 0.00019071548013016582, "step": 2260, "valid_targets_mean": 3516.8, "valid_targets_min": 1889 }, { "epoch": 2.17376, "grad_norm": 0.04856897361198709, "learning_rate": 2.7843599224873833e-05, "loss": 0.0007, "loss_nan_ranks": 0, "loss_rank_avg": 0.00017041576211340725, "step": 2265, "valid_targets_mean": 4206.8, "valid_targets_min": 1924 }, { "epoch": 2.17856, "grad_norm": 0.03576939276419744, "learning_rate": 2.7781923531070775e-05, "loss": 0.0008, "loss_nan_ranks": 0, "loss_rank_avg": 0.00038324674824252725, "step": 2270, "valid_targets_mean": 2961.4, "valid_targets_min": 1680 }, { "epoch": 2.18336, "grad_norm": 0.030493288750038344, "learning_rate": 2.7720160506788896e-05, "loss": 0.0007, "loss_nan_ranks": 0, "loss_rank_avg": 0.0001243678416358307, "step": 2275, "valid_targets_mean": 3825.0, "valid_targets_min": 1870 }, { "epoch": 2.18816, "grad_norm": 0.0400949924638015, "learning_rate": 2.7658310845146598e-05, "loss": 0.0007, "loss_nan_ranks": 0, "loss_rank_avg": 0.00018578841991256922, "step": 2280, "valid_targets_mean": 4495.0, "valid_targets_min": 2009 }, { "epoch": 2.19296, "grad_norm": 0.037333026714177465, "learning_rate": 2.7596375240234574e-05, "loss": 0.0007, "loss_nan_ranks": 0, "loss_rank_avg": 0.00020659196889027953, "step": 2285, "valid_targets_mean": 3360.5, "valid_targets_min": 1719 }, { "epoch": 2.19776, "grad_norm": 0.045283233017465424, "learning_rate": 2.7534354387107975e-05, "loss": 0.0007, "loss_nan_ranks": 0, "loss_rank_avg": 0.00029020351939834654, "step": 2290, "valid_targets_mean": 4335.8, "valid_targets_min": 1525 }, { "epoch": 2.20256, "grad_norm": 0.0321961691598059, "learning_rate": 2.747224898177862e-05, "loss": 0.0008, "loss_nan_ranks": 0, "loss_rank_avg": 0.0001831486588343978, "step": 2295, "valid_targets_mean": 5505.2, "valid_targets_min": 2074 }, { "epoch": 2.20736, "grad_norm": 0.04479222868751039, "learning_rate": 2.7410059721207187e-05, "loss": 0.0007, "loss_nan_ranks": 0, "loss_rank_avg": 0.00031453612609766424, "step": 2300, "valid_targets_mean": 3296.8, "valid_targets_min": 2041 }, { "epoch": 2.21216, "grad_norm": 0.03396162372941247, "learning_rate": 2.734778730329543e-05, "loss": 0.0007, "loss_nan_ranks": 0, "loss_rank_avg": 0.00024497491540387273, "step": 2305, "valid_targets_mean": 3662.8, "valid_targets_min": 1891 }, { "epoch": 2.21696, "grad_norm": 0.039392580173791665, "learning_rate": 2.7285432426878275e-05, "loss": 0.0006, "loss_nan_ranks": 0, "loss_rank_avg": 0.0002551403595134616, "step": 2310, "valid_targets_mean": 4311.8, "valid_targets_min": 2032 }, { "epoch": 2.22176, "grad_norm": 0.03754119255041813, "learning_rate": 2.7222995791716034e-05, "loss": 0.0007, "loss_nan_ranks": 0, "loss_rank_avg": 0.00019644678104668856, "step": 2315, "valid_targets_mean": 3148.0, "valid_targets_min": 1763 }, { "epoch": 2.22656, "grad_norm": 0.030334413668914074, "learning_rate": 2.716047809848653e-05, "loss": 0.0006, "loss_nan_ranks": 0, "loss_rank_avg": 0.00018585645011626184, "step": 2320, "valid_targets_mean": 3651.1, "valid_targets_min": 1938 }, { "epoch": 2.23136, "grad_norm": 0.04045784912723658, "learning_rate": 2.7097880048777238e-05, "loss": 0.0007, "loss_nan_ranks": 0, "loss_rank_avg": 0.0001915416942210868, "step": 2325, "valid_targets_mean": 3014.8, "valid_targets_min": 1863 }, { "epoch": 2.23616, "grad_norm": 0.04333177506122303, "learning_rate": 2.703520234507742e-05, "loss": 0.0007, "loss_nan_ranks": 0, "loss_rank_avg": 0.00045665091602131724, "step": 2330, "valid_targets_mean": 4318.9, "valid_targets_min": 2056 }, { "epoch": 2.24096, "grad_norm": 0.03739441324826848, "learning_rate": 2.697244569077021e-05, "loss": 0.0006, "loss_nan_ranks": 0, "loss_rank_avg": 0.00020790009875781834, "step": 2335, "valid_targets_mean": 3993.2, "valid_targets_min": 1991 }, { "epoch": 2.24576, "grad_norm": 0.035305305784520465, "learning_rate": 2.6909610790124772e-05, "loss": 0.0008, "loss_nan_ranks": 0, "loss_rank_avg": 0.0003060979361180216, "step": 2340, "valid_targets_mean": 4405.0, "valid_targets_min": 1939 }, { "epoch": 2.25056, "grad_norm": 0.02959348243450873, "learning_rate": 2.684669834828835e-05, "loss": 0.0007, "loss_nan_ranks": 0, "loss_rank_avg": 0.0002234200801467523, "step": 2345, "valid_targets_mean": 4487.1, "valid_targets_min": 1680 }, { "epoch": 2.25536, "grad_norm": 0.04631364254708182, "learning_rate": 2.6783709071278372e-05, "loss": 0.0008, "loss_nan_ranks": 0, "loss_rank_avg": 0.0003990861587226391, "step": 2350, "valid_targets_mean": 3409.9, "valid_targets_min": 2011 }, { "epoch": 2.26016, "grad_norm": 0.036652540579393704, "learning_rate": 2.6720643665974522e-05, "loss": 0.0007, "loss_nan_ranks": 0, "loss_rank_avg": 0.00017286359798163176, "step": 2355, "valid_targets_mean": 4595.0, "valid_targets_min": 2171 }, { "epoch": 2.26496, "grad_norm": 0.031267941336866396, "learning_rate": 2.665750284011085e-05, "loss": 0.0007, "loss_nan_ranks": 0, "loss_rank_avg": 0.00016654253704473376, "step": 2360, "valid_targets_mean": 4046.1, "valid_targets_min": 1920 }, { "epoch": 2.2697599999999998, "grad_norm": 0.036409463244741175, "learning_rate": 2.6594287302267744e-05, "loss": 0.0007, "loss_nan_ranks": 0, "loss_rank_avg": 0.00025828357320278883, "step": 2365, "valid_targets_mean": 5251.3, "valid_targets_min": 1705 }, { "epoch": 2.27456, "grad_norm": 0.03756310563624762, "learning_rate": 2.653099776186405e-05, "loss": 0.0007, "loss_nan_ranks": 0, "loss_rank_avg": 0.0001461548963561654, "step": 2370, "valid_targets_mean": 3591.6, "valid_targets_min": 1662 }, { "epoch": 2.27936, "grad_norm": 0.03467708796327428, "learning_rate": 2.646763492914908e-05, "loss": 0.0008, "loss_nan_ranks": 0, "loss_rank_avg": 0.00026901293313130736, "step": 2375, "valid_targets_mean": 3220.3, "valid_targets_min": 1863 }, { "epoch": 2.28416, "grad_norm": 0.029874949666269978, "learning_rate": 2.640419951519467e-05, "loss": 0.0006, "loss_nan_ranks": 0, "loss_rank_avg": 0.0002025901630986482, "step": 2380, "valid_targets_mean": 3226.0, "valid_targets_min": 1998 }, { "epoch": 2.28896, "grad_norm": 0.03381433751089229, "learning_rate": 2.634069223188715e-05, "loss": 0.0006, "loss_nan_ranks": 0, "loss_rank_avg": 0.00021201377967372537, "step": 2385, "valid_targets_mean": 4461.9, "valid_targets_min": 1917 }, { "epoch": 2.29376, "grad_norm": 0.037794410016097665, "learning_rate": 2.627711379191939e-05, "loss": 0.0007, "loss_nan_ranks": 0, "loss_rank_avg": 0.00022039566829334944, "step": 2390, "valid_targets_mean": 4068.2, "valid_targets_min": 1760 }, { "epoch": 2.29856, "grad_norm": 0.03876776181109457, "learning_rate": 2.621346490878281e-05, "loss": 0.0007, "loss_nan_ranks": 0, "loss_rank_avg": 0.0002503449213691056, "step": 2395, "valid_targets_mean": 3787.4, "valid_targets_min": 1884 }, { "epoch": 2.30336, "grad_norm": 0.04425219517126325, "learning_rate": 2.614974629675935e-05, "loss": 0.0007, "loss_nan_ranks": 0, "loss_rank_avg": 0.0002225804200861603, "step": 2400, "valid_targets_mean": 3016.7, "valid_targets_min": 1877 }, { "epoch": 2.30816, "grad_norm": 0.0332418527626137, "learning_rate": 2.608595867091346e-05, "loss": 0.0007, "loss_nan_ranks": 0, "loss_rank_avg": 0.0001066123804775998, "step": 2405, "valid_targets_mean": 3969.6, "valid_targets_min": 1839 }, { "epoch": 2.31296, "grad_norm": 0.03275117269790793, "learning_rate": 2.6022102747084084e-05, "loss": 0.0006, "loss_nan_ranks": 0, "loss_rank_avg": 0.00014958773681428283, "step": 2410, "valid_targets_mean": 3277.8, "valid_targets_min": 1868 }, { "epoch": 2.31776, "grad_norm": 0.03663969443965277, "learning_rate": 2.595817924187663e-05, "loss": 0.0007, "loss_nan_ranks": 0, "loss_rank_avg": 0.00023177076946012676, "step": 2415, "valid_targets_mean": 4114.9, "valid_targets_min": 1727 }, { "epoch": 2.32256, "grad_norm": 0.03151762456815796, "learning_rate": 2.589418887265489e-05, "loss": 0.0006, "loss_nan_ranks": 0, "loss_rank_avg": 0.0002696237061172724, "step": 2420, "valid_targets_mean": 4500.8, "valid_targets_min": 1942 }, { "epoch": 2.32736, "grad_norm": 0.032831572609185296, "learning_rate": 2.5830132357533044e-05, "loss": 0.0006, "loss_nan_ranks": 0, "loss_rank_avg": 0.0001549628796055913, "step": 2425, "valid_targets_mean": 4774.0, "valid_targets_min": 1925 }, { "epoch": 2.33216, "grad_norm": 0.04240344680707184, "learning_rate": 2.5766010415367567e-05, "loss": 0.0007, "loss_nan_ranks": 0, "loss_rank_avg": 0.00020264976774342358, "step": 2430, "valid_targets_mean": 3075.3, "valid_targets_min": 1908 }, { "epoch": 2.33696, "grad_norm": 0.041500799096206215, "learning_rate": 2.5701823765749187e-05, "loss": 0.0008, "loss_nan_ranks": 0, "loss_rank_avg": 0.00030124446493573487, "step": 2435, "valid_targets_mean": 3322.5, "valid_targets_min": 1614 }, { "epoch": 2.34176, "grad_norm": 0.024132575735248074, "learning_rate": 2.563757312899477e-05, "loss": 0.0006, "loss_nan_ranks": 0, "loss_rank_avg": 0.0001617611851543188, "step": 2440, "valid_targets_mean": 4256.2, "valid_targets_min": 1908 }, { "epoch": 2.34656, "grad_norm": 0.03622168996073483, "learning_rate": 2.557325922613926e-05, "loss": 0.0006, "loss_nan_ranks": 0, "loss_rank_avg": 0.00010978215868817642, "step": 2445, "valid_targets_mean": 4010.4, "valid_targets_min": 1751 }, { "epoch": 2.35136, "grad_norm": 0.035687387011170656, "learning_rate": 2.5508882778927615e-05, "loss": 0.0007, "loss_nan_ranks": 0, "loss_rank_avg": 0.00020305518410168588, "step": 2450, "valid_targets_mean": 5104.2, "valid_targets_min": 2008 }, { "epoch": 2.35616, "grad_norm": 0.03498720529081233, "learning_rate": 2.5444444509806654e-05, "loss": 0.0006, "loss_nan_ranks": 0, "loss_rank_avg": 0.0002204036427428946, "step": 2455, "valid_targets_mean": 3017.6, "valid_targets_min": 1868 }, { "epoch": 2.36096, "grad_norm": 0.033412627570212454, "learning_rate": 2.5379945141916976e-05, "loss": 0.0007, "loss_nan_ranks": 0, "loss_rank_avg": 0.00022408628137782216, "step": 2460, "valid_targets_mean": 3959.5, "valid_targets_min": 1662 }, { "epoch": 2.36576, "grad_norm": 0.03359882263771964, "learning_rate": 2.531538539908486e-05, "loss": 0.0005, "loss_nan_ranks": 0, "loss_rank_avg": 0.0001831240369938314, "step": 2465, "valid_targets_mean": 3663.9, "valid_targets_min": 1889 }, { "epoch": 2.3705600000000002, "grad_norm": 0.03526372615108675, "learning_rate": 2.5250766005814108e-05, "loss": 0.0006, "loss_nan_ranks": 0, "loss_rank_avg": 0.0002579090651124716, "step": 2470, "valid_targets_mean": 3923.1, "valid_targets_min": 1970 }, { "epoch": 2.37536, "grad_norm": 0.033811299894664026, "learning_rate": 2.5186087687277956e-05, "loss": 0.0007, "loss_nan_ranks": 0, "loss_rank_avg": 0.00016862923803273588, "step": 2475, "valid_targets_mean": 3491.5, "valid_targets_min": 1763 }, { "epoch": 2.38016, "grad_norm": 0.035525310974040464, "learning_rate": 2.5121351169310887e-05, "loss": 0.0007, "loss_nan_ranks": 0, "loss_rank_avg": 0.00029478981741704047, "step": 2480, "valid_targets_mean": 3264.8, "valid_targets_min": 1917 }, { "epoch": 2.38496, "grad_norm": 0.027684694690569174, "learning_rate": 2.505655717840052e-05, "loss": 0.0006, "loss_nan_ranks": 0, "loss_rank_avg": 0.00021103810286149383, "step": 2485, "valid_targets_mean": 5089.8, "valid_targets_min": 1820 }, { "epoch": 2.38976, "grad_norm": 0.03143907720270563, "learning_rate": 2.499170644167946e-05, "loss": 0.0005, "loss_nan_ranks": 0, "loss_rank_avg": 0.0002478085516486317, "step": 2490, "valid_targets_mean": 2749.9, "valid_targets_min": 1918 }, { "epoch": 2.3945600000000002, "grad_norm": 0.027614380837816813, "learning_rate": 2.49267996869171e-05, "loss": 0.0006, "loss_nan_ranks": 0, "loss_rank_avg": 0.00014130433555692434, "step": 2495, "valid_targets_mean": 4555.9, "valid_targets_min": 2073 }, { "epoch": 2.39936, "grad_norm": 0.03903812401787511, "learning_rate": 2.486183764251151e-05, "loss": 0.0006, "loss_nan_ranks": 0, "loss_rank_avg": 0.00024015213421080261, "step": 2500, "valid_targets_mean": 3791.2, "valid_targets_min": 1948 }, { "epoch": 2.40416, "grad_norm": 0.028971229010347883, "learning_rate": 2.4796821037481215e-05, "loss": 0.0006, "loss_nan_ranks": 0, "loss_rank_avg": 0.00014903757255524397, "step": 2505, "valid_targets_mean": 3217.3, "valid_targets_min": 1914 }, { "epoch": 2.40896, "grad_norm": 0.035086625043318054, "learning_rate": 2.473175060145703e-05, "loss": 0.0006, "loss_nan_ranks": 0, "loss_rank_avg": 0.0001503221137681976, "step": 2510, "valid_targets_mean": 3694.5, "valid_targets_min": 1951 }, { "epoch": 2.41376, "grad_norm": 0.03784890895425839, "learning_rate": 2.4666627064673892e-05, "loss": 0.0007, "loss_nan_ranks": 0, "loss_rank_avg": 0.0002561969740781933, "step": 2515, "valid_targets_mean": 2764.7, "valid_targets_min": 1930 }, { "epoch": 2.41856, "grad_norm": 0.03502209953746837, "learning_rate": 2.4601451157962616e-05, "loss": 0.0005, "loss_nan_ranks": 0, "loss_rank_avg": 0.00014939287211745977, "step": 2520, "valid_targets_mean": 3019.3, "valid_targets_min": 1763 }, { "epoch": 2.42336, "grad_norm": 0.038579498889326165, "learning_rate": 2.4536223612741754e-05, "loss": 0.0007, "loss_nan_ranks": 0, "loss_rank_avg": 0.00029830800485797226, "step": 2525, "valid_targets_mean": 4642.4, "valid_targets_min": 1361 }, { "epoch": 2.42816, "grad_norm": 0.02719304613035395, "learning_rate": 2.447094516100934e-05, "loss": 0.0006, "loss_nan_ranks": 0, "loss_rank_avg": 0.0001690950448391959, "step": 2530, "valid_targets_mean": 4152.7, "valid_targets_min": 1727 }, { "epoch": 2.43296, "grad_norm": 0.03258199868600974, "learning_rate": 2.4405616535334695e-05, "loss": 0.0006, "loss_nan_ranks": 0, "loss_rank_avg": 0.00020575785310938954, "step": 2535, "valid_targets_mean": 4316.7, "valid_targets_min": 1918 }, { "epoch": 2.43776, "grad_norm": 0.03801298563758932, "learning_rate": 2.43402384688502e-05, "loss": 0.0007, "loss_nan_ranks": 0, "loss_rank_avg": 0.000360257166903466, "step": 2540, "valid_targets_mean": 3739.1, "valid_targets_min": 1998 }, { "epoch": 2.44256, "grad_norm": 0.03621817881967739, "learning_rate": 2.4274811695243085e-05, "loss": 0.0006, "loss_nan_ranks": 0, "loss_rank_avg": 0.00023448243155144155, "step": 2545, "valid_targets_mean": 3347.4, "valid_targets_min": 2119 }, { "epoch": 2.4473599999999998, "grad_norm": 0.02805407299186264, "learning_rate": 2.4209336948747168e-05, "loss": 0.0005, "loss_nan_ranks": 0, "loss_rank_avg": 0.00025352189550176263, "step": 2550, "valid_targets_mean": 3837.3, "valid_targets_min": 1517 }, { "epoch": 2.45216, "grad_norm": 0.03732310069016806, "learning_rate": 2.414381496413464e-05, "loss": 0.0005, "loss_nan_ranks": 0, "loss_rank_avg": 0.00024747985298745334, "step": 2555, "valid_targets_mean": 4331.4, "valid_targets_min": 2008 }, { "epoch": 2.45696, "grad_norm": 0.03456714787592951, "learning_rate": 2.4078246476707793e-05, "loss": 0.0004, "loss_nan_ranks": 0, "loss_rank_avg": 0.000141127486131154, "step": 2560, "valid_targets_mean": 3667.2, "valid_targets_min": 1525 }, { "epoch": 2.46176, "grad_norm": 0.035425591366662346, "learning_rate": 2.4012632222290802e-05, "loss": 0.0007, "loss_nan_ranks": 0, "loss_rank_avg": 0.00029167812317609787, "step": 2565, "valid_targets_mean": 4083.5, "valid_targets_min": 1868 }, { "epoch": 2.46656, "grad_norm": 0.02874013643641384, "learning_rate": 2.3946972937221444e-05, "loss": 0.0005, "loss_nan_ranks": 0, "loss_rank_avg": 0.0001653900253586471, "step": 2570, "valid_targets_mean": 4142.4, "valid_targets_min": 1760 }, { "epoch": 2.47136, "grad_norm": 0.02862784285161512, "learning_rate": 2.3881269358342828e-05, "loss": 0.0006, "loss_nan_ranks": 0, "loss_rank_avg": 0.00020821639918722212, "step": 2575, "valid_targets_mean": 4223.2, "valid_targets_min": 1361 }, { "epoch": 2.47616, "grad_norm": 0.029604293591339006, "learning_rate": 2.3815522222995158e-05, "loss": 0.0006, "loss_nan_ranks": 0, "loss_rank_avg": 0.0001307126512983814, "step": 2580, "valid_targets_mean": 3124.3, "valid_targets_min": 1958 }, { "epoch": 2.48096, "grad_norm": 0.033893385830383684, "learning_rate": 2.3749732269007427e-05, "loss": 0.0005, "loss_nan_ranks": 0, "loss_rank_avg": 0.00016485755622852594, "step": 2585, "valid_targets_mean": 4209.0, "valid_targets_min": 1775 }, { "epoch": 2.48576, "grad_norm": 0.03419392450169646, "learning_rate": 2.3683900234689142e-05, "loss": 0.0006, "loss_nan_ranks": 0, "loss_rank_avg": 0.0002415791677776724, "step": 2590, "valid_targets_mean": 4240.3, "valid_targets_min": 1906 }, { "epoch": 2.49056, "grad_norm": 0.029006117232870755, "learning_rate": 2.3618026858822054e-05, "loss": 0.0005, "loss_nan_ranks": 0, "loss_rank_avg": 0.00023742017219774425, "step": 2595, "valid_targets_mean": 3191.8, "valid_targets_min": 1858 }, { "epoch": 2.49536, "grad_norm": 0.04012111729972718, "learning_rate": 2.355211288065187e-05, "loss": 0.0005, "loss_nan_ranks": 0, "loss_rank_avg": 0.00015978682495187968, "step": 2600, "valid_targets_mean": 3348.3, "valid_targets_min": 2004 }, { "epoch": 2.50016, "grad_norm": 0.04056449581614587, "learning_rate": 2.348615903987991e-05, "loss": 0.0006, "loss_nan_ranks": 0, "loss_rank_avg": 0.00022866785002406687, "step": 2605, "valid_targets_mean": 3626.4, "valid_targets_min": 1995 }, { "epoch": 2.50496, "grad_norm": 0.030585259676019654, "learning_rate": 2.3420166076654873e-05, "loss": 0.0005, "loss_nan_ranks": 0, "loss_rank_avg": 0.00021799776004627347, "step": 2610, "valid_targets_mean": 3237.5, "valid_targets_min": 1763 }, { "epoch": 2.50976, "grad_norm": 0.023930444972562206, "learning_rate": 2.335413473156449e-05, "loss": 0.0006, "loss_nan_ranks": 0, "loss_rank_avg": 0.00022054321016184986, "step": 2615, "valid_targets_mean": 3443.3, "valid_targets_min": 1884 }, { "epoch": 2.51456, "grad_norm": 0.024457278834734187, "learning_rate": 2.328806574562722e-05, "loss": 0.0005, "loss_nan_ranks": 0, "loss_rank_avg": 0.00011868066212628037, "step": 2620, "valid_targets_mean": 4358.3, "valid_targets_min": 1786 }, { "epoch": 2.51936, "grad_norm": 0.031028426914594242, "learning_rate": 2.322195986028393e-05, "loss": 0.0006, "loss_nan_ranks": 0, "loss_rank_avg": 0.00027652987046167254, "step": 2625, "valid_targets_mean": 4464.6, "valid_targets_min": 1601 }, { "epoch": 2.52416, "grad_norm": 0.030577977296404303, "learning_rate": 2.315581781738959e-05, "loss": 0.0006, "loss_nan_ranks": 0, "loss_rank_avg": 0.0001450799172744155, "step": 2630, "valid_targets_mean": 4065.1, "valid_targets_min": 1764 }, { "epoch": 2.52896, "grad_norm": 0.028055994141291358, "learning_rate": 2.3089640359204937e-05, "loss": 0.0004, "loss_nan_ranks": 0, "loss_rank_avg": 0.00018580812320578843, "step": 2635, "valid_targets_mean": 3585.7, "valid_targets_min": 1727 }, { "epoch": 2.53376, "grad_norm": 0.020316911634189153, "learning_rate": 2.3023428228388144e-05, "loss": 0.0005, "loss_nan_ranks": 0, "loss_rank_avg": 0.00015279500803444535, "step": 2640, "valid_targets_mean": 4268.4, "valid_targets_min": 1361 }, { "epoch": 2.53856, "grad_norm": 0.029192677167564848, "learning_rate": 2.2957182167986486e-05, "loss": 0.0005, "loss_nan_ranks": 0, "loss_rank_avg": 0.00016782352759037167, "step": 2645, "valid_targets_mean": 3354.9, "valid_targets_min": 1652 }, { "epoch": 2.54336, "grad_norm": 0.02674573810278128, "learning_rate": 2.2890902921428004e-05, "loss": 0.0004, "loss_nan_ranks": 0, "loss_rank_avg": 0.00011722477211151272, "step": 2650, "valid_targets_mean": 3411.8, "valid_targets_min": 1799 }, { "epoch": 2.54816, "grad_norm": 0.03491667544098721, "learning_rate": 2.2824591232513153e-05, "loss": 0.0005, "loss_nan_ranks": 0, "loss_rank_avg": 0.00017565107555128634, "step": 2655, "valid_targets_mean": 3712.1, "valid_targets_min": 1887 }, { "epoch": 2.55296, "grad_norm": 0.033105604731353114, "learning_rate": 2.2758247845406495e-05, "loss": 0.0005, "loss_nan_ranks": 0, "loss_rank_avg": 0.00023516351939179003, "step": 2660, "valid_targets_mean": 3988.2, "valid_targets_min": 1931 }, { "epoch": 2.55776, "grad_norm": 0.024677789248399855, "learning_rate": 2.2691873504628282e-05, "loss": 0.0005, "loss_nan_ranks": 0, "loss_rank_avg": 0.00013441765622701496, "step": 2665, "valid_targets_mean": 3287.0, "valid_targets_min": 1716 }, { "epoch": 2.56256, "grad_norm": 0.03347135910296354, "learning_rate": 2.2625468955046143e-05, "loss": 0.0005, "loss_nan_ranks": 0, "loss_rank_avg": 0.00016958295600488782, "step": 2670, "valid_targets_mean": 3179.7, "valid_targets_min": 1908 }, { "epoch": 2.56736, "grad_norm": 0.025305271492915622, "learning_rate": 2.2559034941866727e-05, "loss": 0.0005, "loss_nan_ranks": 0, "loss_rank_avg": 0.00017021692474372685, "step": 2675, "valid_targets_mean": 3838.3, "valid_targets_min": 1992 }, { "epoch": 2.5721600000000002, "grad_norm": 0.03054664142249039, "learning_rate": 2.2492572210627325e-05, "loss": 0.0006, "loss_nan_ranks": 0, "loss_rank_avg": 0.0002199383161496371, "step": 2680, "valid_targets_mean": 3718.6, "valid_targets_min": 1771 }, { "epoch": 2.57696, "grad_norm": 0.0295739820670092, "learning_rate": 2.24260815071875e-05, "loss": 0.0005, "loss_nan_ranks": 0, "loss_rank_avg": 0.0002091970236506313, "step": 2685, "valid_targets_mean": 4135.2, "valid_targets_min": 2033 }, { "epoch": 2.58176, "grad_norm": 0.027407367741136335, "learning_rate": 2.2359563577720743e-05, "loss": 0.0005, "loss_nan_ranks": 0, "loss_rank_avg": 0.00015643186634406447, "step": 2690, "valid_targets_mean": 3748.6, "valid_targets_min": 1863 }, { "epoch": 2.58656, "grad_norm": 0.023931228842467126, "learning_rate": 2.229301916870606e-05, "loss": 0.0004, "loss_nan_ranks": 0, "loss_rank_avg": 0.0001017052709357813, "step": 2695, "valid_targets_mean": 4408.4, "valid_targets_min": 1858 }, { "epoch": 2.59136, "grad_norm": 0.016879904184060966, "learning_rate": 2.2226449026919637e-05, "loss": 0.0004, "loss_nan_ranks": 0, "loss_rank_avg": 0.00014124697190709412, "step": 2700, "valid_targets_mean": 4628.8, "valid_targets_min": 1993 }, { "epoch": 2.5961600000000002, "grad_norm": 0.03350887881820371, "learning_rate": 2.2159853899426427e-05, "loss": 0.0005, "loss_nan_ranks": 0, "loss_rank_avg": 0.00019711660570465028, "step": 2705, "valid_targets_mean": 3775.4, "valid_targets_min": 1924 }, { "epoch": 2.60096, "grad_norm": 0.024997563571365917, "learning_rate": 2.209323453357178e-05, "loss": 0.0005, "loss_nan_ranks": 0, "loss_rank_avg": 0.0001128168951254338, "step": 2710, "valid_targets_mean": 2900.3, "valid_targets_min": 1912 }, { "epoch": 2.60576, "grad_norm": 0.02473483219663956, "learning_rate": 2.202659167697306e-05, "loss": 0.0005, "loss_nan_ranks": 0, "loss_rank_avg": 0.00014166333130560815, "step": 2715, "valid_targets_mean": 5047.2, "valid_targets_min": 1858 }, { "epoch": 2.61056, "grad_norm": 0.02695375949945734, "learning_rate": 2.1959926077511234e-05, "loss": 0.0005, "loss_nan_ranks": 0, "loss_rank_avg": 0.00015097047435119748, "step": 2720, "valid_targets_mean": 4527.6, "valid_targets_min": 1925 }, { "epoch": 2.61536, "grad_norm": 0.029313431173201666, "learning_rate": 2.1893238483322512e-05, "loss": 0.0004, "loss_nan_ranks": 0, "loss_rank_avg": 0.00027219983167015016, "step": 2725, "valid_targets_mean": 3846.9, "valid_targets_min": 1764 }, { "epoch": 2.6201600000000003, "grad_norm": 0.0246117813376776, "learning_rate": 2.1826529642789923e-05, "loss": 0.0005, "loss_nan_ranks": 0, "loss_rank_avg": 0.00011438388901297003, "step": 2730, "valid_targets_mean": 4127.7, "valid_targets_min": 1983 }, { "epoch": 2.6249599999999997, "grad_norm": 0.03166261718253728, "learning_rate": 2.1759800304534936e-05, "loss": 0.0005, "loss_nan_ranks": 0, "loss_rank_avg": 0.00030604726634919643, "step": 2735, "valid_targets_mean": 3822.6, "valid_targets_min": 1917 }, { "epoch": 2.62976, "grad_norm": 0.02399486169062025, "learning_rate": 2.1693051217409048e-05, "loss": 0.0005, "loss_nan_ranks": 0, "loss_rank_avg": 0.00017993926303461194, "step": 2740, "valid_targets_mean": 2943.0, "valid_targets_min": 2022 }, { "epoch": 2.63456, "grad_norm": 0.022031983161228993, "learning_rate": 2.1626283130485365e-05, "loss": 0.0004, "loss_nan_ranks": 0, "loss_rank_avg": 0.00015471190272364765, "step": 2745, "valid_targets_mean": 4091.2, "valid_targets_min": 1839 }, { "epoch": 2.63936, "grad_norm": 0.029777655573390297, "learning_rate": 2.1559496793050235e-05, "loss": 0.0004, "loss_nan_ranks": 0, "loss_rank_avg": 0.00022734438243787736, "step": 2750, "valid_targets_mean": 3356.0, "valid_targets_min": 1977 }, { "epoch": 2.64416, "grad_norm": 0.032339263263978055, "learning_rate": 2.1492692954594815e-05, "loss": 0.0005, "loss_nan_ranks": 0, "loss_rank_avg": 0.00016537672490812838, "step": 2755, "valid_targets_mean": 3285.5, "valid_targets_min": 1525 }, { "epoch": 2.6489599999999998, "grad_norm": 0.02041903769719548, "learning_rate": 2.1425872364806642e-05, "loss": 0.0004, "loss_nan_ranks": 0, "loss_rank_avg": 7.491001451853663e-05, "step": 2760, "valid_targets_mean": 3870.9, "valid_targets_min": 1928 }, { "epoch": 2.65376, "grad_norm": 0.02724645730303635, "learning_rate": 2.1359035773561275e-05, "loss": 0.0005, "loss_nan_ranks": 0, "loss_rank_avg": 8.727981185074896e-05, "step": 2765, "valid_targets_mean": 3569.4, "valid_targets_min": 1662 }, { "epoch": 2.65856, "grad_norm": 0.027173048710820033, "learning_rate": 2.1292183930913803e-05, "loss": 0.0005, "loss_nan_ranks": 0, "loss_rank_avg": 0.0002180126029998064, "step": 2770, "valid_targets_mean": 3932.3, "valid_targets_min": 1986 }, { "epoch": 2.66336, "grad_norm": 0.037202649199021574, "learning_rate": 2.1225317587090507e-05, "loss": 0.0005, "loss_nan_ranks": 0, "loss_rank_avg": 0.00015464637544937432, "step": 2775, "valid_targets_mean": 4374.6, "valid_targets_min": 1948 }, { "epoch": 2.66816, "grad_norm": 0.023946900535808578, "learning_rate": 2.1158437492480384e-05, "loss": 0.0004, "loss_nan_ranks": 0, "loss_rank_avg": 8.866835560183972e-05, "step": 2780, "valid_targets_mean": 3508.4, "valid_targets_min": 1972 }, { "epoch": 2.67296, "grad_norm": 0.023323639929458045, "learning_rate": 2.1091544397626752e-05, "loss": 0.0004, "loss_nan_ranks": 0, "loss_rank_avg": 9.227942791767418e-05, "step": 2785, "valid_targets_mean": 3581.1, "valid_targets_min": 1799 }, { "epoch": 2.67776, "grad_norm": 0.0172998031924568, "learning_rate": 2.102463905321881e-05, "loss": 0.0004, "loss_nan_ranks": 0, "loss_rank_avg": 0.00019019619503524154, "step": 2790, "valid_targets_mean": 5262.3, "valid_targets_min": 1993 }, { "epoch": 2.68256, "grad_norm": 0.026339994207665886, "learning_rate": 2.095772221008323e-05, "loss": 0.0004, "loss_nan_ranks": 0, "loss_rank_avg": 0.00015134026762098074, "step": 2795, "valid_targets_mean": 3594.5, "valid_targets_min": 1877 }, { "epoch": 2.68736, "grad_norm": 0.03256359763209226, "learning_rate": 2.0890794619175745e-05, "loss": 0.0006, "loss_nan_ranks": 0, "loss_rank_avg": 0.00018617985188029706, "step": 2800, "valid_targets_mean": 4447.6, "valid_targets_min": 1943 }, { "epoch": 2.69216, "grad_norm": 0.023898664989193522, "learning_rate": 2.0823857031572663e-05, "loss": 0.0004, "loss_nan_ranks": 0, "loss_rank_avg": 7.358520815614611e-05, "step": 2805, "valid_targets_mean": 2726.3, "valid_targets_min": 1771 }, { "epoch": 2.69696, "grad_norm": 0.029494228295745283, "learning_rate": 2.0756910198462515e-05, "loss": 0.0004, "loss_nan_ranks": 0, "loss_rank_avg": 0.0001169008610304445, "step": 2810, "valid_targets_mean": 4072.3, "valid_targets_min": 1942 }, { "epoch": 2.70176, "grad_norm": 0.028854863277279583, "learning_rate": 2.0689954871137558e-05, "loss": 0.0004, "loss_nan_ranks": 0, "loss_rank_avg": 0.00011759097105823457, "step": 2815, "valid_targets_mean": 2916.8, "valid_targets_min": 1877 }, { "epoch": 2.70656, "grad_norm": 0.02416453071586182, "learning_rate": 2.0622991800985398e-05, "loss": 0.0004, "loss_nan_ranks": 0, "loss_rank_avg": 0.0001018679904518649, "step": 2820, "valid_targets_mean": 2619.8, "valid_targets_min": 1833 }, { "epoch": 2.71136, "grad_norm": 0.023490376662988942, "learning_rate": 2.055602173948051e-05, "loss": 0.0005, "loss_nan_ranks": 0, "loss_rank_avg": 0.00013606276479549706, "step": 2825, "valid_targets_mean": 4143.3, "valid_targets_min": 1838 }, { "epoch": 2.71616, "grad_norm": 0.016960972248032263, "learning_rate": 2.0489045438175842e-05, "loss": 0.0004, "loss_nan_ranks": 0, "loss_rank_avg": 0.0001110613375203684, "step": 2830, "valid_targets_mean": 3656.4, "valid_targets_min": 1943 }, { "epoch": 2.72096, "grad_norm": 0.022589070972111297, "learning_rate": 2.042206364869436e-05, "loss": 0.0004, "loss_nan_ranks": 0, "loss_rank_avg": 0.00016260298434644938, "step": 2835, "valid_targets_mean": 3551.5, "valid_targets_min": 1763 }, { "epoch": 2.72576, "grad_norm": 0.02856209557457077, "learning_rate": 2.0355077122720625e-05, "loss": 0.0004, "loss_nan_ranks": 0, "loss_rank_avg": 0.00018720896332524717, "step": 2840, "valid_targets_mean": 3209.6, "valid_targets_min": 1924 }, { "epoch": 2.73056, "grad_norm": 0.021731288713113188, "learning_rate": 2.0288086611992344e-05, "loss": 0.0004, "loss_nan_ranks": 0, "loss_rank_avg": 7.025498052826151e-05, "step": 2845, "valid_targets_mean": 3721.6, "valid_targets_min": 1992 }, { "epoch": 2.73536, "grad_norm": 0.028612983173565747, "learning_rate": 2.0221092868291953e-05, "loss": 0.0004, "loss_nan_ranks": 0, "loss_rank_avg": 8.612230158178136e-05, "step": 2850, "valid_targets_mean": 2944.8, "valid_targets_min": 1836 }, { "epoch": 2.74016, "grad_norm": 0.023600216503969575, "learning_rate": 2.0154096643438153e-05, "loss": 0.0004, "loss_nan_ranks": 0, "loss_rank_avg": 9.917169518303126e-05, "step": 2855, "valid_targets_mean": 4533.1, "valid_targets_min": 1719 }, { "epoch": 2.74496, "grad_norm": 0.025094469370057243, "learning_rate": 2.008709868927751e-05, "loss": 0.0004, "loss_nan_ranks": 0, "loss_rank_avg": 6.150246917968616e-05, "step": 2860, "valid_targets_mean": 3046.2, "valid_targets_min": 2086 }, { "epoch": 2.74976, "grad_norm": 0.019746676801553512, "learning_rate": 2.0020099757675978e-05, "loss": 0.0004, "loss_nan_ranks": 0, "loss_rank_avg": 4.597777297021821e-05, "step": 2865, "valid_targets_mean": 4366.8, "valid_targets_min": 1716 }, { "epoch": 2.75456, "grad_norm": 0.030709152512287757, "learning_rate": 1.9953100600510487e-05, "loss": 0.0004, "loss_nan_ranks": 0, "loss_rank_avg": 9.887020860332996e-05, "step": 2870, "valid_targets_mean": 3165.4, "valid_targets_min": 1970 }, { "epoch": 2.75936, "grad_norm": 0.019782474480980868, "learning_rate": 1.9886101969660504e-05, "loss": 0.0004, "loss_nan_ranks": 0, "loss_rank_avg": 6.534643762279302e-05, "step": 2875, "valid_targets_mean": 3346.6, "valid_targets_min": 1775 }, { "epoch": 2.76416, "grad_norm": 0.023247966487372883, "learning_rate": 1.9819104616999584e-05, "loss": 0.0004, "loss_nan_ranks": 0, "loss_rank_avg": 0.00012664488167501986, "step": 2880, "valid_targets_mean": 3562.3, "valid_targets_min": 1863 }, { "epoch": 2.76896, "grad_norm": 0.026697504425241023, "learning_rate": 1.975210929438693e-05, "loss": 0.0003, "loss_nan_ranks": 0, "loss_rank_avg": 0.00011335482122376561, "step": 2885, "valid_targets_mean": 3805.9, "valid_targets_min": 1877 }, { "epoch": 2.7737600000000002, "grad_norm": 0.024236369610147433, "learning_rate": 1.9685116753658982e-05, "loss": 0.0004, "loss_nan_ranks": 0, "loss_rank_avg": 0.00015188367979135364, "step": 2890, "valid_targets_mean": 4950.4, "valid_targets_min": 1863 }, { "epoch": 2.77856, "grad_norm": 0.024006115720744844, "learning_rate": 1.9618127746620944e-05, "loss": 0.0004, "loss_nan_ranks": 0, "loss_rank_avg": 5.3211351769277826e-05, "step": 2895, "valid_targets_mean": 4628.9, "valid_targets_min": 1839 }, { "epoch": 2.78336, "grad_norm": 0.01828708573325881, "learning_rate": 1.9551143025038363e-05, "loss": 0.0004, "loss_nan_ranks": 0, "loss_rank_avg": 0.00015513661492150277, "step": 2900, "valid_targets_mean": 3301.9, "valid_targets_min": 1361 }, { "epoch": 2.78816, "grad_norm": 0.02452513702064594, "learning_rate": 1.9484163340628724e-05, "loss": 0.0005, "loss_nan_ranks": 0, "loss_rank_avg": 0.0001470555434934795, "step": 2905, "valid_targets_mean": 3966.4, "valid_targets_min": 1802 }, { "epoch": 2.79296, "grad_norm": 0.02162253904665591, "learning_rate": 1.941718944505294e-05, "loss": 0.0004, "loss_nan_ranks": 0, "loss_rank_avg": 6.633297016378492e-05, "step": 2910, "valid_targets_mean": 4646.6, "valid_targets_min": 1929 }, { "epoch": 2.7977600000000002, "grad_norm": 0.02653344462508564, "learning_rate": 1.9350222089906994e-05, "loss": 0.0004, "loss_nan_ranks": 0, "loss_rank_avg": 0.00011425589036662132, "step": 2915, "valid_targets_mean": 3358.9, "valid_targets_min": 1799 }, { "epoch": 2.80256, "grad_norm": 0.020408240597344585, "learning_rate": 1.9283262026713456e-05, "loss": 0.0004, "loss_nan_ranks": 0, "loss_rank_avg": 0.00014473756891675293, "step": 2920, "valid_targets_mean": 3279.9, "valid_targets_min": 2031 }, { "epoch": 2.80736, "grad_norm": 0.021028753731547636, "learning_rate": 1.9216310006913058e-05, "loss": 0.0004, "loss_nan_ranks": 0, "loss_rank_avg": 0.0001147160364780575, "step": 2925, "valid_targets_mean": 4004.2, "valid_targets_min": 1975 }, { "epoch": 2.81216, "grad_norm": 0.02594239060438439, "learning_rate": 1.914936678185629e-05, "loss": 0.0005, "loss_nan_ranks": 0, "loss_rank_avg": 0.00011305462248856202, "step": 2930, "valid_targets_mean": 3485.4, "valid_targets_min": 1614 }, { "epoch": 2.81696, "grad_norm": 0.02964528000434778, "learning_rate": 1.9082433102794918e-05, "loss": 0.0004, "loss_nan_ranks": 0, "loss_rank_avg": 0.0001548744912724942, "step": 2935, "valid_targets_mean": 3928.7, "valid_targets_min": 1933 }, { "epoch": 2.8217600000000003, "grad_norm": 0.017134150188487504, "learning_rate": 1.9015509720873603e-05, "loss": 0.0004, "loss_nan_ranks": 0, "loss_rank_avg": 8.740826888242736e-05, "step": 2940, "valid_targets_mean": 3706.7, "valid_targets_min": 1917 }, { "epoch": 2.8265599999999997, "grad_norm": 0.02180933059470857, "learning_rate": 1.894859738712143e-05, "loss": 0.0003, "loss_nan_ranks": 0, "loss_rank_avg": 9.822335414355621e-05, "step": 2945, "valid_targets_mean": 4252.4, "valid_targets_min": 1562 }, { "epoch": 2.83136, "grad_norm": 0.016218254788160618, "learning_rate": 1.888169685244352e-05, "loss": 0.0005, "loss_nan_ranks": 0, "loss_rank_avg": 0.00016421267355326563, "step": 2950, "valid_targets_mean": 3571.9, "valid_targets_min": 1986 }, { "epoch": 2.83616, "grad_norm": 0.02354906480901788, "learning_rate": 1.8814808867612568e-05, "loss": 0.0004, "loss_nan_ranks": 0, "loss_rank_avg": 6.99763695592992e-05, "step": 2955, "valid_targets_mean": 4399.5, "valid_targets_min": 2088 }, { "epoch": 2.84096, "grad_norm": 0.01971511867464185, "learning_rate": 1.8747934183260427e-05, "loss": 0.0004, "loss_nan_ranks": 0, "loss_rank_avg": 9.124760254053399e-05, "step": 2960, "valid_targets_mean": 3971.2, "valid_targets_min": 1921 }, { "epoch": 2.84576, "grad_norm": 0.0278188576069757, "learning_rate": 1.868107354986971e-05, "loss": 0.0005, "loss_nan_ranks": 0, "loss_rank_avg": 0.0003219933423679322, "step": 2965, "valid_targets_mean": 3617.8, "valid_targets_min": 1982 }, { "epoch": 2.8505599999999998, "grad_norm": 0.026739769872547982, "learning_rate": 1.8614227717765327e-05, "loss": 0.0004, "loss_nan_ranks": 0, "loss_rank_avg": 0.00017199182184413075, "step": 2970, "valid_targets_mean": 3237.1, "valid_targets_min": 1939 }, { "epoch": 2.85536, "grad_norm": 0.03461644008980415, "learning_rate": 1.8547397437106084e-05, "loss": 0.0004, "loss_nan_ranks": 0, "loss_rank_avg": 0.00012064729526173323, "step": 2975, "valid_targets_mean": 3380.6, "valid_targets_min": 1838 }, { "epoch": 2.86016, "grad_norm": 0.02209288532182616, "learning_rate": 1.848058345787629e-05, "loss": 0.0004, "loss_nan_ranks": 0, "loss_rank_avg": 0.0002483898715581745, "step": 2980, "valid_targets_mean": 3540.8, "valid_targets_min": 1709 }, { "epoch": 2.86496, "grad_norm": 0.02714572952475498, "learning_rate": 1.8413786529877288e-05, "loss": 0.0004, "loss_nan_ranks": 0, "loss_rank_avg": 0.0001591041509527713, "step": 2985, "valid_targets_mean": 3801.8, "valid_targets_min": 1833 }, { "epoch": 2.86976, "grad_norm": 0.022040485361692213, "learning_rate": 1.8347007402719082e-05, "loss": 0.0003, "loss_nan_ranks": 0, "loss_rank_avg": 9.611293353373185e-05, "step": 2990, "valid_targets_mean": 2953.5, "valid_targets_min": 2022 }, { "epoch": 2.87456, "grad_norm": 0.022123709290083143, "learning_rate": 1.828024682581191e-05, "loss": 0.0004, "loss_nan_ranks": 0, "loss_rank_avg": 0.00019887229427695274, "step": 2995, "valid_targets_mean": 4369.2, "valid_targets_min": 1959 }, { "epoch": 2.87936, "grad_norm": 0.018819840014296388, "learning_rate": 1.8213505548357822e-05, "loss": 0.0004, "loss_nan_ranks": 0, "loss_rank_avg": 7.32165208319202e-05, "step": 3000, "valid_targets_mean": 3614.1, "valid_targets_min": 1939 }, { "epoch": 2.88416, "grad_norm": 0.017994001101041452, "learning_rate": 1.814678431934231e-05, "loss": 0.0004, "loss_nan_ranks": 0, "loss_rank_avg": 0.00013698008842766285, "step": 3005, "valid_targets_mean": 4487.9, "valid_targets_min": 1972 }, { "epoch": 2.88896, "grad_norm": 0.021592474043977235, "learning_rate": 1.8080083887525862e-05, "loss": 0.0004, "loss_nan_ranks": 0, "loss_rank_avg": 6.77060306770727e-05, "step": 3010, "valid_targets_mean": 3691.1, "valid_targets_min": 1562 }, { "epoch": 2.89376, "grad_norm": 0.018912366380670783, "learning_rate": 1.801340500143557e-05, "loss": 0.0003, "loss_nan_ranks": 0, "loss_rank_avg": 7.287562766578048e-05, "step": 3015, "valid_targets_mean": 3996.4, "valid_targets_min": 2003 }, { "epoch": 2.89856, "grad_norm": 0.018013021378604936, "learning_rate": 1.7946748409356746e-05, "loss": 0.0003, "loss_nan_ranks": 0, "loss_rank_avg": 7.651852502021939e-05, "step": 3020, "valid_targets_mean": 5406.3, "valid_targets_min": 1829 }, { "epoch": 2.90336, "grad_norm": 0.02196142205330078, "learning_rate": 1.788011485932451e-05, "loss": 0.0004, "loss_nan_ranks": 0, "loss_rank_avg": 6.057618884369731e-05, "step": 3025, "valid_targets_mean": 3251.1, "valid_targets_min": 1614 }, { "epoch": 2.90816, "grad_norm": 0.021939180840453026, "learning_rate": 1.78135050991154e-05, "loss": 0.0004, "loss_nan_ranks": 0, "loss_rank_avg": 0.00015023195010144264, "step": 3030, "valid_targets_mean": 3716.9, "valid_targets_min": 1983 }, { "epoch": 2.91296, "grad_norm": 0.023266947785077412, "learning_rate": 1.774691987623898e-05, "loss": 0.0003, "loss_nan_ranks": 0, "loss_rank_avg": 0.00011902107507921755, "step": 3035, "valid_targets_mean": 3432.4, "valid_targets_min": 1877 }, { "epoch": 2.91776, "grad_norm": 0.023820830898385627, "learning_rate": 1.768035993792944e-05, "loss": 0.0004, "loss_nan_ranks": 0, "loss_rank_avg": 0.0002066703309537843, "step": 3040, "valid_targets_mean": 4092.0, "valid_targets_min": 1933 }, { "epoch": 2.92256, "grad_norm": 0.020333880634877222, "learning_rate": 1.7613826031137245e-05, "loss": 0.0004, "loss_nan_ranks": 0, "loss_rank_avg": 0.0002175498811993748, "step": 3045, "valid_targets_mean": 2837.6, "valid_targets_min": 2020 }, { "epoch": 2.92736, "grad_norm": 0.026465596046422065, "learning_rate": 1.7547318902520693e-05, "loss": 0.0004, "loss_nan_ranks": 0, "loss_rank_avg": 8.79285071277991e-05, "step": 3050, "valid_targets_mean": 3790.3, "valid_targets_min": 1986 }, { "epoch": 2.93216, "grad_norm": 0.018649197132876022, "learning_rate": 1.7480839298437612e-05, "loss": 0.0003, "loss_nan_ranks": 0, "loss_rank_avg": 8.114524825941771e-05, "step": 3055, "valid_targets_mean": 3331.4, "valid_targets_min": 1760 }, { "epoch": 2.93696, "grad_norm": 0.020148453199511775, "learning_rate": 1.7414387964936913e-05, "loss": 0.0003, "loss_nan_ranks": 0, "loss_rank_avg": 6.896800186950713e-05, "step": 3060, "valid_targets_mean": 4374.5, "valid_targets_min": 1949 }, { "epoch": 2.94176, "grad_norm": 0.021423561052568516, "learning_rate": 1.7347965647750264e-05, "loss": 0.0004, "loss_nan_ranks": 0, "loss_rank_avg": 0.00014279386959969997, "step": 3065, "valid_targets_mean": 4296.7, "valid_targets_min": 1998 }, { "epoch": 2.94656, "grad_norm": 0.02528519196710435, "learning_rate": 1.7281573092283698e-05, "loss": 0.0004, "loss_nan_ranks": 0, "loss_rank_avg": 8.968213660409674e-05, "step": 3070, "valid_targets_mean": 3194.3, "valid_targets_min": 1727 }, { "epoch": 2.95136, "grad_norm": 0.07048429228721245, "learning_rate": 1.721521104360925e-05, "loss": 0.0003, "loss_nan_ranks": 0, "loss_rank_avg": 9.62947669904679e-05, "step": 3075, "valid_targets_mean": 3045.7, "valid_targets_min": 1839 }, { "epoch": 2.95616, "grad_norm": 0.0222354184644874, "learning_rate": 1.714888024645662e-05, "loss": 0.0003, "loss_nan_ranks": 0, "loss_rank_avg": 0.0001516393676865846, "step": 3080, "valid_targets_mean": 2978.5, "valid_targets_min": 1887 }, { "epoch": 2.96096, "grad_norm": 0.01555733846454575, "learning_rate": 1.708258144520478e-05, "loss": 0.0003, "loss_nan_ranks": 0, "loss_rank_avg": 5.9606034483294934e-05, "step": 3085, "valid_targets_mean": 4811.8, "valid_targets_min": 2343 }, { "epoch": 2.96576, "grad_norm": 0.02232143567928934, "learning_rate": 1.7016315383873637e-05, "loss": 0.0003, "loss_nan_ranks": 0, "loss_rank_avg": 0.000159605493536219, "step": 3090, "valid_targets_mean": 4230.9, "valid_targets_min": 1786 }, { "epoch": 2.97056, "grad_norm": 0.026488500145509335, "learning_rate": 1.6950082806115692e-05, "loss": 0.0004, "loss_nan_ranks": 0, "loss_rank_avg": 7.544553227489814e-05, "step": 3095, "valid_targets_mean": 3597.1, "valid_targets_min": 1958 }, { "epoch": 2.9753600000000002, "grad_norm": 0.018457072570227887, "learning_rate": 1.6883884455207685e-05, "loss": 0.0003, "loss_nan_ranks": 0, "loss_rank_avg": 5.865214916411787e-05, "step": 3100, "valid_targets_mean": 2762.7, "valid_targets_min": 1727 }, { "epoch": 2.98016, "grad_norm": 0.023355245345469806, "learning_rate": 1.6817721074042254e-05, "loss": 0.0004, "loss_nan_ranks": 0, "loss_rank_avg": 0.0001550887682242319, "step": 3105, "valid_targets_mean": 2952.7, "valid_targets_min": 2094 }, { "epoch": 2.98496, "grad_norm": 0.026488279295259706, "learning_rate": 1.675159340511958e-05, "loss": 0.0003, "loss_nan_ranks": 0, "loss_rank_avg": 0.00013377467985264957, "step": 3110, "valid_targets_mean": 5067.9, "valid_targets_min": 1919 }, { "epoch": 2.98976, "grad_norm": 0.020655150651040233, "learning_rate": 1.6685502190539106e-05, "loss": 0.0004, "loss_nan_ranks": 0, "loss_rank_avg": 8.466073632007465e-05, "step": 3115, "valid_targets_mean": 3763.2, "valid_targets_min": 2112 }, { "epoch": 2.99456, "grad_norm": 0.019096184065461538, "learning_rate": 1.6619448171991155e-05, "loss": 0.0003, "loss_nan_ranks": 0, "loss_rank_avg": 8.77012571436353e-05, "step": 3120, "valid_targets_mean": 5052.1, "valid_targets_min": 1884 }, { "epoch": 2.9993600000000002, "grad_norm": 0.021052484889835625, "learning_rate": 1.6553432090748624e-05, "loss": 0.0003, "loss_nan_ranks": 0, "loss_rank_avg": 7.409695535898209e-05, "step": 3125, "valid_targets_mean": 3870.3, "valid_targets_min": 1970 }, { "epoch": 3.00384, "grad_norm": 0.018453110841428155, "learning_rate": 1.648745468765869e-05, "loss": 0.0003, "loss_nan_ranks": 0, "loss_rank_avg": 7.791754615027457e-05, "step": 3130, "valid_targets_mean": 4342.5, "valid_targets_min": 1775 }, { "epoch": 3.00864, "grad_norm": 0.02047687885648728, "learning_rate": 1.6421516703134463e-05, "loss": 0.0003, "loss_nan_ranks": 0, "loss_rank_avg": 4.985905979992822e-05, "step": 3135, "valid_targets_mean": 3566.9, "valid_targets_min": 1934 }, { "epoch": 3.01344, "grad_norm": 0.024891596375059534, "learning_rate": 1.6355618877146685e-05, "loss": 0.0003, "loss_nan_ranks": 0, "loss_rank_avg": 0.00016949682321865112, "step": 3140, "valid_targets_mean": 3200.6, "valid_targets_min": 1786 }, { "epoch": 3.01824, "grad_norm": 0.017850108146377348, "learning_rate": 1.6289761949215435e-05, "loss": 0.0003, "loss_nan_ranks": 0, "loss_rank_avg": 0.00014728600217495114, "step": 3145, "valid_targets_mean": 3193.5, "valid_targets_min": 1930 }, { "epoch": 3.02304, "grad_norm": 0.018909473518080613, "learning_rate": 1.6223946658401818e-05, "loss": 0.0003, "loss_nan_ranks": 0, "loss_rank_avg": 0.00021030849893577397, "step": 3150, "valid_targets_mean": 4067.7, "valid_targets_min": 1829 }, { "epoch": 3.02784, "grad_norm": 0.020871319993280343, "learning_rate": 1.6158173743299692e-05, "loss": 0.0003, "loss_nan_ranks": 0, "loss_rank_avg": 9.983018389903009e-05, "step": 3155, "valid_targets_mean": 4353.8, "valid_targets_min": 1763 }, { "epoch": 3.03264, "grad_norm": 0.021660620992697086, "learning_rate": 1.6092443942027356e-05, "loss": 0.0003, "loss_nan_ranks": 0, "loss_rank_avg": 0.00011195616389159113, "step": 3160, "valid_targets_mean": 2911.7, "valid_targets_min": 1839 }, { "epoch": 3.03744, "grad_norm": 0.020135937308117555, "learning_rate": 1.602675799221927e-05, "loss": 0.0003, "loss_nan_ranks": 0, "loss_rank_avg": 5.299851545714773e-05, "step": 3165, "valid_targets_mean": 3422.8, "valid_targets_min": 1839 }, { "epoch": 3.04224, "grad_norm": 0.018431276886312412, "learning_rate": 1.59611166310178e-05, "loss": 0.0003, "loss_nan_ranks": 0, "loss_rank_avg": 5.2702886023325846e-05, "step": 3170, "valid_targets_mean": 4471.5, "valid_targets_min": 2132 }, { "epoch": 3.04704, "grad_norm": 0.015155951409860745, "learning_rate": 1.5895520595064913e-05, "loss": 0.0003, "loss_nan_ranks": 0, "loss_rank_avg": 8.149896893883124e-05, "step": 3175, "valid_targets_mean": 3422.6, "valid_targets_min": 1909 }, { "epoch": 3.05184, "grad_norm": 0.019233986447757676, "learning_rate": 1.5829970620493932e-05, "loss": 0.0003, "loss_nan_ranks": 0, "loss_rank_avg": 8.23982700239867e-05, "step": 3180, "valid_targets_mean": 3077.1, "valid_targets_min": 1858 }, { "epoch": 3.05664, "grad_norm": 0.014451754392294036, "learning_rate": 1.5764467442921274e-05, "loss": 0.0003, "loss_nan_ranks": 0, "loss_rank_avg": 7.17826042091474e-05, "step": 3185, "valid_targets_mean": 3522.6, "valid_targets_min": 1614 }, { "epoch": 3.06144, "grad_norm": 0.018898138961676178, "learning_rate": 1.569901179743818e-05, "loss": 0.0003, "loss_nan_ranks": 0, "loss_rank_avg": 0.00011060632095905021, "step": 3190, "valid_targets_mean": 3454.0, "valid_targets_min": 1517 }, { "epoch": 3.06624, "grad_norm": 0.027683453283868373, "learning_rate": 1.5633604418602483e-05, "loss": 0.0003, "loss_nan_ranks": 0, "loss_rank_avg": 0.00011033978807972744, "step": 3195, "valid_targets_mean": 4021.5, "valid_targets_min": 1680 }, { "epoch": 3.07104, "grad_norm": 0.018878947618359634, "learning_rate": 1.5568246040430343e-05, "loss": 0.0003, "loss_nan_ranks": 0, "loss_rank_avg": 0.00010039303742814809, "step": 3200, "valid_targets_mean": 4480.4, "valid_targets_min": 1933 }, { "epoch": 3.07584, "grad_norm": 0.02031318192479438, "learning_rate": 1.5502937396388046e-05, "loss": 0.0004, "loss_nan_ranks": 0, "loss_rank_avg": 9.601862984709442e-05, "step": 3205, "valid_targets_mean": 3242.5, "valid_targets_min": 1740 }, { "epoch": 3.08064, "grad_norm": 0.02253989554735354, "learning_rate": 1.543767921938374e-05, "loss": 0.0003, "loss_nan_ranks": 0, "loss_rank_avg": 0.00014390042633749545, "step": 3210, "valid_targets_mean": 3770.4, "valid_targets_min": 1836 }, { "epoch": 3.08544, "grad_norm": 0.013587452354707022, "learning_rate": 1.537247224175922e-05, "loss": 0.0003, "loss_nan_ranks": 0, "loss_rank_avg": 7.746569463051856e-05, "step": 3215, "valid_targets_mean": 3409.2, "valid_targets_min": 2039 }, { "epoch": 3.09024, "grad_norm": 0.028111652441311752, "learning_rate": 1.53073171952817e-05, "loss": 0.0003, "loss_nan_ranks": 0, "loss_rank_avg": 7.700549031142145e-05, "step": 3220, "valid_targets_mean": 3577.5, "valid_targets_min": 1929 }, { "epoch": 3.09504, "grad_norm": 0.01708144063100646, "learning_rate": 1.5242214811135631e-05, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 8.06500029284507e-05, "step": 3225, "valid_targets_mean": 4140.8, "valid_targets_min": 1912 }, { "epoch": 3.09984, "grad_norm": 0.0226372066028227, "learning_rate": 1.5177165819914461e-05, "loss": 0.0003, "loss_nan_ranks": 0, "loss_rank_avg": 0.00012216181494295597, "step": 3230, "valid_targets_mean": 4149.2, "valid_targets_min": 1709 }, { "epoch": 3.10464, "grad_norm": 0.024965359579690115, "learning_rate": 1.5112170951612455e-05, "loss": 0.0003, "loss_nan_ranks": 0, "loss_rank_avg": 5.1957376854261383e-05, "step": 3235, "valid_targets_mean": 3129.3, "valid_targets_min": 1863 }, { "epoch": 3.10944, "grad_norm": 0.013437951112882224, "learning_rate": 1.5047230935616497e-05, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 8.271107799373567e-05, "step": 3240, "valid_targets_mean": 3610.1, "valid_targets_min": 1786 }, { "epoch": 3.11424, "grad_norm": 0.014237700182485939, "learning_rate": 1.4982346500697916e-05, "loss": 0.0003, "loss_nan_ranks": 0, "loss_rank_avg": 4.194388020550832e-05, "step": 3245, "valid_targets_mean": 3825.3, "valid_targets_min": 1775 }, { "epoch": 3.11904, "grad_norm": 0.014111540907084268, "learning_rate": 1.4917518375004281e-05, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 6.379166734404862e-05, "step": 3250, "valid_targets_mean": 3649.8, "valid_targets_min": 1914 }, { "epoch": 3.12384, "grad_norm": 0.018824156129808443, "learning_rate": 1.4852747286051254e-05, "loss": 0.0003, "loss_nan_ranks": 0, "loss_rank_avg": 6.309389573289081e-05, "step": 3255, "valid_targets_mean": 4722.3, "valid_targets_min": 1680 }, { "epoch": 3.12864, "grad_norm": 0.018101010313748535, "learning_rate": 1.478803396071443e-05, "loss": 0.0003, "loss_nan_ranks": 0, "loss_rank_avg": 7.809472299413756e-05, "step": 3260, "valid_targets_mean": 3089.8, "valid_targets_min": 1838 }, { "epoch": 3.1334400000000002, "grad_norm": 0.016178134459373116, "learning_rate": 1.472337912522115e-05, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 7.876890595071018e-05, "step": 3265, "valid_targets_mean": 2934.6, "valid_targets_min": 1361 }, { "epoch": 3.13824, "grad_norm": 0.017702747159018806, "learning_rate": 1.4658783505142368e-05, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 0.00010421761544421315, "step": 3270, "valid_targets_mean": 3497.0, "valid_targets_min": 1949 }, { "epoch": 3.14304, "grad_norm": 0.015629467170666565, "learning_rate": 1.4594247825384529e-05, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 4.373621413833462e-05, "step": 3275, "valid_targets_mean": 4290.9, "valid_targets_min": 1993 }, { "epoch": 3.14784, "grad_norm": 0.018221576270069557, "learning_rate": 1.4529772810181398e-05, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 5.873098416486755e-05, "step": 3280, "valid_targets_mean": 3406.2, "valid_targets_min": 1870 }, { "epoch": 3.15264, "grad_norm": 0.018884144359542467, "learning_rate": 1.4465359183085958e-05, "loss": 0.0003, "loss_nan_ranks": 0, "loss_rank_avg": 0.00010781181481434032, "step": 3285, "valid_targets_mean": 4543.2, "valid_targets_min": 1786 }, { "epoch": 3.15744, "grad_norm": 0.024798991362972755, "learning_rate": 1.4401007666962276e-05, "loss": 0.0003, "loss_nan_ranks": 0, "loss_rank_avg": 8.871503814589232e-05, "step": 3290, "valid_targets_mean": 3411.8, "valid_targets_min": 1906 }, { "epoch": 3.16224, "grad_norm": 0.026289618162018507, "learning_rate": 1.4336718983977389e-05, "loss": 0.0003, "loss_nan_ranks": 0, "loss_rank_avg": 0.00014063461276236922, "step": 3295, "valid_targets_mean": 2952.9, "valid_targets_min": 2059 }, { "epoch": 3.16704, "grad_norm": 0.02087911055323807, "learning_rate": 1.4272493855593222e-05, "loss": 0.0003, "loss_nan_ranks": 0, "loss_rank_avg": 0.00011406857811380178, "step": 3300, "valid_targets_mean": 3903.2, "valid_targets_min": 1933 }, { "epoch": 3.17184, "grad_norm": 0.025864926194416736, "learning_rate": 1.4208333002558462e-05, "loss": 0.0003, "loss_nan_ranks": 0, "loss_rank_avg": 0.00012150718248449266, "step": 3305, "valid_targets_mean": 4186.3, "valid_targets_min": 1863 }, { "epoch": 3.17664, "grad_norm": 0.005925121943421106, "learning_rate": 1.4144237144900497e-05, "loss": 0.0003, "loss_nan_ranks": 0, "loss_rank_avg": 4.7987763537094e-05, "step": 3310, "valid_targets_mean": 3257.3, "valid_targets_min": 1877 }, { "epoch": 3.18144, "grad_norm": 0.0203610177094657, "learning_rate": 1.4080207001917302e-05, "loss": 0.0003, "loss_nan_ranks": 0, "loss_rank_avg": 9.982845222111791e-05, "step": 3315, "valid_targets_mean": 2632.5, "valid_targets_min": 1863 }, { "epoch": 3.18624, "grad_norm": 0.02013249654553658, "learning_rate": 1.4016243292169413e-05, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 0.0001017134272842668, "step": 3320, "valid_targets_mean": 3098.9, "valid_targets_min": 1562 }, { "epoch": 3.19104, "grad_norm": 0.014150560479732852, "learning_rate": 1.3952346733471822e-05, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 3.7287460145307705e-05, "step": 3325, "valid_targets_mean": 3468.7, "valid_targets_min": 1361 }, { "epoch": 3.19584, "grad_norm": 0.01247748935676924, "learning_rate": 1.3888518042885934e-05, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 6.918737199157476e-05, "step": 3330, "valid_targets_mean": 3426.5, "valid_targets_min": 1992 }, { "epoch": 3.20064, "grad_norm": 0.009828455444539298, "learning_rate": 1.3824757936711537e-05, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 3.947080404032022e-05, "step": 3335, "valid_targets_mean": 3553.8, "valid_targets_min": 1933 }, { "epoch": 3.20544, "grad_norm": 0.012686422174234565, "learning_rate": 1.3761067130478738e-05, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 4.460604031919502e-05, "step": 3340, "valid_targets_mean": 3819.8, "valid_targets_min": 1942 }, { "epoch": 3.21024, "grad_norm": 0.01654103079369527, "learning_rate": 1.3697446338939942e-05, "loss": 0.0003, "loss_nan_ranks": 0, "loss_rank_avg": 6.0112899518571794e-05, "step": 3345, "valid_targets_mean": 3277.4, "valid_targets_min": 1562 }, { "epoch": 3.21504, "grad_norm": 0.0194091521016171, "learning_rate": 1.3633896276061847e-05, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 0.00011460959649411961, "step": 3350, "valid_targets_mean": 3927.5, "valid_targets_min": 1833 }, { "epoch": 3.21984, "grad_norm": 0.016517976307009564, "learning_rate": 1.3570417655017405e-05, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 6.381390267051756e-05, "step": 3355, "valid_targets_mean": 4070.7, "valid_targets_min": 1614 }, { "epoch": 3.22464, "grad_norm": 0.010600916211686231, "learning_rate": 1.3507011188177846e-05, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 9.461009904043749e-05, "step": 3360, "valid_targets_mean": 3980.2, "valid_targets_min": 1928 }, { "epoch": 3.22944, "grad_norm": 0.016976292352953615, "learning_rate": 1.3443677587104655e-05, "loss": 0.0003, "loss_nan_ranks": 0, "loss_rank_avg": 8.451566827716306e-05, "step": 3365, "valid_targets_mean": 3608.3, "valid_targets_min": 1928 }, { "epoch": 3.23424, "grad_norm": 0.012813626401298798, "learning_rate": 1.3380417562541604e-05, "loss": 0.0003, "loss_nan_ranks": 0, "loss_rank_avg": 5.145267641637474e-05, "step": 3370, "valid_targets_mean": 4600.5, "valid_targets_min": 1909 }, { "epoch": 3.23904, "grad_norm": 0.010829071491700365, "learning_rate": 1.3317231824406783e-05, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 4.345774505054578e-05, "step": 3375, "valid_targets_mean": 4325.6, "valid_targets_min": 1868 }, { "epoch": 3.24384, "grad_norm": 0.01041182604349842, "learning_rate": 1.325412108178461e-05, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 7.307223131647334e-05, "step": 3380, "valid_targets_mean": 3372.8, "valid_targets_min": 1361 }, { "epoch": 3.24864, "grad_norm": 0.01526890053285902, "learning_rate": 1.3191086042917895e-05, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 6.071500320103951e-05, "step": 3385, "valid_targets_mean": 5381.7, "valid_targets_min": 1863 }, { "epoch": 3.25344, "grad_norm": 0.015370550532819507, "learning_rate": 1.3128127415199883e-05, "loss": 0.0003, "loss_nan_ranks": 0, "loss_rank_avg": 7.260534766828641e-05, "step": 3390, "valid_targets_mean": 3824.7, "valid_targets_min": 2121 }, { "epoch": 3.25824, "grad_norm": 0.01190987235181321, "learning_rate": 1.3065245905166316e-05, "loss": 0.0003, "loss_nan_ranks": 0, "loss_rank_avg": 5.562914157053456e-05, "step": 3395, "valid_targets_mean": 4362.4, "valid_targets_min": 1998 }, { "epoch": 3.26304, "grad_norm": 0.0050532178122862466, "learning_rate": 1.30024422184875e-05, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 5.3684292652178556e-05, "step": 3400, "valid_targets_mean": 3969.5, "valid_targets_min": 1914 }, { "epoch": 3.26784, "grad_norm": 0.011786071851466207, "learning_rate": 1.2939717059960384e-05, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 5.181220330996439e-05, "step": 3405, "valid_targets_mean": 3020.6, "valid_targets_min": 1361 }, { "epoch": 3.27264, "grad_norm": 0.01729739851008109, "learning_rate": 1.287707113350068e-05, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 6.659601058345288e-05, "step": 3410, "valid_targets_mean": 5125.4, "valid_targets_min": 2072 }, { "epoch": 3.27744, "grad_norm": 0.01670211062110001, "learning_rate": 1.2814505142134921e-05, "loss": 0.0003, "loss_nan_ranks": 0, "loss_rank_avg": 6.324228161247447e-05, "step": 3415, "valid_targets_mean": 3899.4, "valid_targets_min": 2013 }, { "epoch": 3.28224, "grad_norm": 0.01914716601442075, "learning_rate": 1.2752019787992587e-05, "loss": 0.0003, "loss_nan_ranks": 0, "loss_rank_avg": 7.421004556817934e-05, "step": 3420, "valid_targets_mean": 3452.8, "valid_targets_min": 1847 }, { "epoch": 3.28704, "grad_norm": 0.015196263944313884, "learning_rate": 1.268961577229824e-05, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 6.754793867003173e-05, "step": 3425, "valid_targets_mean": 4664.8, "valid_targets_min": 1933 }, { "epoch": 3.29184, "grad_norm": 0.009801501966872886, "learning_rate": 1.262729379536365e-05, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 8.6651009041816e-05, "step": 3430, "valid_targets_mean": 3303.6, "valid_targets_min": 1931 }, { "epoch": 3.29664, "grad_norm": 0.018792435761741236, "learning_rate": 1.2565054556579917e-05, "loss": 0.0003, "loss_nan_ranks": 0, "loss_rank_avg": 5.3184681746643037e-05, "step": 3435, "valid_targets_mean": 3715.3, "valid_targets_min": 1716 }, { "epoch": 3.30144, "grad_norm": 0.02123827971481195, "learning_rate": 1.2502898754409637e-05, "loss": 0.0003, "loss_nan_ranks": 0, "loss_rank_avg": 7.16395370545797e-05, "step": 3440, "valid_targets_mean": 4315.2, "valid_targets_min": 1829 }, { "epoch": 3.30624, "grad_norm": 0.016955050967706747, "learning_rate": 1.2440827086379055e-05, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 7.558079232694581e-05, "step": 3445, "valid_targets_mean": 3924.2, "valid_targets_min": 1680 }, { "epoch": 3.31104, "grad_norm": 0.011393580150245596, "learning_rate": 1.2378840249070265e-05, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 8.816037006909028e-05, "step": 3450, "valid_targets_mean": 4042.6, "valid_targets_min": 1993 }, { "epoch": 3.31584, "grad_norm": 0.014021469513832098, "learning_rate": 1.2316938938113356e-05, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 5.988252451061271e-05, "step": 3455, "valid_targets_mean": 3272.9, "valid_targets_min": 1919 }, { "epoch": 3.32064, "grad_norm": 0.021608841881745316, "learning_rate": 1.2255123848178619e-05, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 7.891654968261719e-05, "step": 3460, "valid_targets_mean": 2683.6, "valid_targets_min": 1839 }, { "epoch": 3.32544, "grad_norm": 0.01594098999699228, "learning_rate": 1.2193395672968765e-05, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 5.743696237914264e-05, "step": 3465, "valid_targets_mean": 4081.6, "valid_targets_min": 1839 }, { "epoch": 3.33024, "grad_norm": 0.017982113832719027, "learning_rate": 1.2131755105211118e-05, "loss": 0.0003, "loss_nan_ranks": 0, "loss_rank_avg": 6.675477197859436e-05, "step": 3470, "valid_targets_mean": 3484.5, "valid_targets_min": 1763 }, { "epoch": 3.3350400000000002, "grad_norm": 0.012091989839522792, "learning_rate": 1.2070202836649855e-05, "loss": 0.0003, "loss_nan_ranks": 0, "loss_rank_avg": 6.264718831516802e-05, "step": 3475, "valid_targets_mean": 3723.5, "valid_targets_min": 2106 }, { "epoch": 3.33984, "grad_norm": 0.016693800580166875, "learning_rate": 1.2008739558038247e-05, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 8.9205801486969e-05, "step": 3480, "valid_targets_mean": 4107.0, "valid_targets_min": 1887 }, { "epoch": 3.34464, "grad_norm": 0.020245961840814296, "learning_rate": 1.1947365959130895e-05, "loss": 0.0003, "loss_nan_ranks": 0, "loss_rank_avg": 5.409671939560212e-05, "step": 3485, "valid_targets_mean": 3815.5, "valid_targets_min": 1942 }, { "epoch": 3.34944, "grad_norm": 0.009696441130015688, "learning_rate": 1.1886082728675984e-05, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 6.198530172696337e-05, "step": 3490, "valid_targets_mean": 3173.8, "valid_targets_min": 1662 }, { "epoch": 3.35424, "grad_norm": 0.008070751492922062, "learning_rate": 1.1824890554407574e-05, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 4.529598663793877e-05, "step": 3495, "valid_targets_mean": 3571.8, "valid_targets_min": 1601 }, { "epoch": 3.3590400000000002, "grad_norm": 0.016893770420853417, "learning_rate": 1.1763790123037873e-05, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 8.078791142906994e-05, "step": 3500, "valid_targets_mean": 3549.1, "valid_targets_min": 1930 }, { "epoch": 3.36384, "grad_norm": 0.010611619676596679, "learning_rate": 1.1702782120249539e-05, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 5.067165693617426e-05, "step": 3505, "valid_targets_mean": 2994.8, "valid_targets_min": 1921 }, { "epoch": 3.36864, "grad_norm": 0.012227824476474919, "learning_rate": 1.164186723068795e-05, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 0.00010194306378252804, "step": 3510, "valid_targets_mean": 3324.2, "valid_targets_min": 1952 }, { "epoch": 3.37344, "grad_norm": 0.018233151037207677, "learning_rate": 1.1581046137953575e-05, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 7.322602323256433e-05, "step": 3515, "valid_targets_mean": 3473.9, "valid_targets_min": 1525 }, { "epoch": 3.37824, "grad_norm": 0.008027450910334806, "learning_rate": 1.1520319524594256e-05, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 5.367275662138127e-05, "step": 3520, "valid_targets_mean": 3441.0, "valid_targets_min": 1820 }, { "epoch": 3.38304, "grad_norm": 0.016385156735597293, "learning_rate": 1.1459688072097568e-05, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 0.00011734359577530995, "step": 3525, "valid_targets_mean": 4226.1, "valid_targets_min": 1525 }, { "epoch": 3.38784, "grad_norm": 0.0067915094576856535, "learning_rate": 1.1399152460883176e-05, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 4.4733271352015436e-05, "step": 3530, "valid_targets_mean": 3731.2, "valid_targets_min": 1829 }, { "epoch": 3.39264, "grad_norm": 0.00892211548509811, "learning_rate": 1.1338713370295189e-05, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 4.814416024601087e-05, "step": 3535, "valid_targets_mean": 3858.1, "valid_targets_min": 1983 }, { "epoch": 3.39744, "grad_norm": 0.008159206891878339, "learning_rate": 1.1278371478594538e-05, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 4.263151640770957e-05, "step": 3540, "valid_targets_mean": 3644.7, "valid_targets_min": 1972 }, { "epoch": 3.40224, "grad_norm": 0.0067195504898440485, "learning_rate": 1.1218127462951367e-05, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 3.700961678987369e-05, "step": 3545, "valid_targets_mean": 3890.9, "valid_targets_min": 1525 }, { "epoch": 3.40704, "grad_norm": 0.007884157725395604, "learning_rate": 1.1157981999437444e-05, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 4.053674638271332e-05, "step": 3550, "valid_targets_mean": 4305.6, "valid_targets_min": 1836 }, { "epoch": 3.4118399999999998, "grad_norm": 0.015000201204561208, "learning_rate": 1.109793576301855e-05, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 4.019015250378288e-05, "step": 3555, "valid_targets_mean": 4950.6, "valid_targets_min": 1680 }, { "epoch": 3.41664, "grad_norm": 0.016970726415525852, "learning_rate": 1.1037989427546924e-05, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 0.00012615707237273455, "step": 3560, "valid_targets_mean": 3820.9, "valid_targets_min": 1662 }, { "epoch": 3.42144, "grad_norm": 0.008553481869326631, "learning_rate": 1.0978143665753692e-05, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 4.730415821541101e-05, "step": 3565, "valid_targets_mean": 4176.1, "valid_targets_min": 1991 }, { "epoch": 3.42624, "grad_norm": 0.020611764051659598, "learning_rate": 1.0918399149241314e-05, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 5.6515218602726236e-05, "step": 3570, "valid_targets_mean": 3387.0, "valid_targets_min": 1908 }, { "epoch": 3.43104, "grad_norm": 0.03254530583537241, "learning_rate": 1.0858756548476058e-05, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 0.0001125583949033171, "step": 3575, "valid_targets_mean": 2906.8, "valid_targets_min": 1934 }, { "epoch": 3.43584, "grad_norm": 0.014829373122733618, "learning_rate": 1.0799216532780478e-05, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 4.488798003876582e-05, "step": 3580, "valid_targets_mean": 3507.2, "valid_targets_min": 1716 }, { "epoch": 3.44064, "grad_norm": 0.025957320437693793, "learning_rate": 1.0739779770325885e-05, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 0.00013226433657109737, "step": 3585, "valid_targets_mean": 3937.9, "valid_targets_min": 2115 }, { "epoch": 3.44544, "grad_norm": 0.011198146121762398, "learning_rate": 1.0680446928124872e-05, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 5.750825221184641e-05, "step": 3590, "valid_targets_mean": 5197.8, "valid_targets_min": 1900 }, { "epoch": 3.45024, "grad_norm": 0.013783909187565497, "learning_rate": 1.06212186720238e-05, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 3.546361404005438e-05, "step": 3595, "valid_targets_mean": 3067.2, "valid_targets_min": 2012 }, { "epoch": 3.45504, "grad_norm": 0.008523171197014895, "learning_rate": 1.0562095666695352e-05, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 4.496578185353428e-05, "step": 3600, "valid_targets_mean": 4060.1, "valid_targets_min": 1906 }, { "epoch": 3.45984, "grad_norm": 0.013801175341468335, "learning_rate": 1.0503078575631052e-05, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 6.477723945863545e-05, "step": 3605, "valid_targets_mean": 3305.2, "valid_targets_min": 2000 }, { "epoch": 3.46464, "grad_norm": 0.014959764009151036, "learning_rate": 1.0444168061133846e-05, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 0.00012726544809993356, "step": 3610, "valid_targets_mean": 4484.9, "valid_targets_min": 1763 }, { "epoch": 3.46944, "grad_norm": 0.01139425598770555, "learning_rate": 1.0385364784310636e-05, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 4.298814383218996e-05, "step": 3615, "valid_targets_mean": 3759.6, "valid_targets_min": 1361 }, { "epoch": 3.47424, "grad_norm": 0.015011712005345224, "learning_rate": 1.0326669405064904e-05, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 0.0001424011425115168, "step": 3620, "valid_targets_mean": 3863.2, "valid_targets_min": 1727 }, { "epoch": 3.47904, "grad_norm": 0.006988112883670556, "learning_rate": 1.0268082582089263e-05, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 3.663314419100061e-05, "step": 3625, "valid_targets_mean": 5181.8, "valid_targets_min": 1972 }, { "epoch": 3.48384, "grad_norm": 0.016204945933502923, "learning_rate": 1.0209604972858081e-05, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 5.9584206610452384e-05, "step": 3630, "valid_targets_mean": 4587.8, "valid_targets_min": 1799 }, { "epoch": 3.48864, "grad_norm": 0.006836549926723057, "learning_rate": 1.0151237233620115e-05, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 4.5423868868965656e-05, "step": 3635, "valid_targets_mean": 4556.9, "valid_targets_min": 2020 }, { "epoch": 3.49344, "grad_norm": 0.01047918810880494, "learning_rate": 1.0092980019391132e-05, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 0.00011410897423047572, "step": 3640, "valid_targets_mean": 3896.4, "valid_targets_min": 1939 }, { "epoch": 3.49824, "grad_norm": 0.014652018259616206, "learning_rate": 1.0034833983946561e-05, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 0.00010652582568582147, "step": 3645, "valid_targets_mean": 2887.8, "valid_targets_min": 1829 }, { "epoch": 3.50304, "grad_norm": 0.010669898087313332, "learning_rate": 9.976799779814157e-06, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 7.363785698544234e-05, "step": 3650, "valid_targets_mean": 3741.1, "valid_targets_min": 1763 }, { "epoch": 3.50784, "grad_norm": 0.01150859791625705, "learning_rate": 9.918878058266687e-06, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 5.623920151265338e-05, "step": 3655, "valid_targets_mean": 3809.2, "valid_targets_min": 1939 }, { "epoch": 3.51264, "grad_norm": 0.003478644304975548, "learning_rate": 9.86106946931462e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.717148138093762e-05, "step": 3660, "valid_targets_mean": 4336.8, "valid_targets_min": 1974 }, { "epoch": 3.51744, "grad_norm": 0.01237512729854138, "learning_rate": 9.803374661698802e-06, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 5.4668777011102065e-05, "step": 3665, "valid_targets_mean": 3139.4, "valid_targets_min": 1938 }, { "epoch": 3.52224, "grad_norm": 0.009173018328596294, "learning_rate": 9.745794282883215e-06, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 3.844043749268167e-05, "step": 3670, "valid_targets_mean": 4644.7, "valid_targets_min": 2029 }, { "epoch": 3.52704, "grad_norm": 0.012126353551714644, "learning_rate": 9.688328979047689e-06, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 3.3574360713828355e-05, "step": 3675, "valid_targets_mean": 4152.6, "valid_targets_min": 1983 }, { "epoch": 3.53184, "grad_norm": 0.00974942484547369, "learning_rate": 9.630979395080667e-06, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 3.9589365769643337e-05, "step": 3680, "valid_targets_mean": 4399.3, "valid_targets_min": 1933 }, { "epoch": 3.5366400000000002, "grad_norm": 0.007448900727798668, "learning_rate": 9.573746174571947e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 7.012276182649657e-05, "step": 3685, "valid_targets_mean": 3892.2, "valid_targets_min": 1771 }, { "epoch": 3.54144, "grad_norm": 0.009998416704858777, "learning_rate": 9.516629959805468e-06, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 5.176214472157881e-05, "step": 3690, "valid_targets_mean": 3584.5, "valid_targets_min": 1525 }, { "epoch": 3.54624, "grad_norm": 0.013292503205467973, "learning_rate": 9.459631391752126e-06, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 4.5208176743471995e-05, "step": 3695, "valid_targets_mean": 5094.4, "valid_targets_min": 2136 }, { "epoch": 3.55104, "grad_norm": 0.008334331712158317, "learning_rate": 9.40275111006254e-06, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 5.263483035378158e-05, "step": 3700, "valid_targets_mean": 4102.0, "valid_targets_min": 1887 }, { "epoch": 3.55584, "grad_norm": 0.007827281873180344, "learning_rate": 9.345989753059895e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 6.234985630726442e-05, "step": 3705, "valid_targets_mean": 4199.7, "valid_targets_min": 2105 }, { "epoch": 3.5606400000000002, "grad_norm": 0.010974477469488148, "learning_rate": 9.289347957732779e-06, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 6.0864338593091816e-05, "step": 3710, "valid_targets_mean": 3562.9, "valid_targets_min": 2091 }, { "epoch": 3.56544, "grad_norm": 0.007061621309209828, "learning_rate": 9.232826359728034e-06, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 3.380605630809441e-05, "step": 3715, "valid_targets_mean": 4573.4, "valid_targets_min": 1820 }, { "epoch": 3.57024, "grad_norm": 0.006768925158879715, "learning_rate": 9.17642559334362e-06, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 4.614176577888429e-05, "step": 3720, "valid_targets_mean": 3561.2, "valid_targets_min": 1716 }, { "epoch": 3.57504, "grad_norm": 0.005606648088124625, "learning_rate": 9.120146291521488e-06, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 0.00015613154391758144, "step": 3725, "valid_targets_mean": 3199.8, "valid_targets_min": 1977 }, { "epoch": 3.57984, "grad_norm": 0.009401345215855002, "learning_rate": 9.063989085840506e-06, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 6.945084169274196e-05, "step": 3730, "valid_targets_mean": 3199.3, "valid_targets_min": 1970 }, { "epoch": 3.5846400000000003, "grad_norm": 0.014559174559493274, "learning_rate": 9.007954606509346e-06, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 7.059839845169336e-05, "step": 3735, "valid_targets_mean": 4898.0, "valid_targets_min": 1833 }, { "epoch": 3.5894399999999997, "grad_norm": 0.01712977436721481, "learning_rate": 8.952043482359408e-06, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 9.897394193103537e-05, "step": 3740, "valid_targets_mean": 4177.9, "valid_targets_min": 1942 }, { "epoch": 3.59424, "grad_norm": 0.01897818953911394, "learning_rate": 8.896256340837779e-06, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 4.639182225218974e-05, "step": 3745, "valid_targets_mean": 3746.3, "valid_targets_min": 2007 }, { "epoch": 3.59904, "grad_norm": 0.008696730760610802, "learning_rate": 8.840593808000182e-06, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 7.316093251574785e-05, "step": 3750, "valid_targets_mean": 3307.4, "valid_targets_min": 1884 }, { "epoch": 3.60384, "grad_norm": 0.00752523752718718, "learning_rate": 8.785056508503956e-06, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 7.271009963005781e-05, "step": 3755, "valid_targets_mean": 4282.9, "valid_targets_min": 1943 }, { "epoch": 3.60864, "grad_norm": 0.017446379775524528, "learning_rate": 8.729645065601045e-06, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 4.897156759398058e-05, "step": 3760, "valid_targets_mean": 3718.6, "valid_targets_min": 1870 }, { "epoch": 3.6134399999999998, "grad_norm": 0.008082161778407785, "learning_rate": 8.674360101130994e-06, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 4.3372128857299685e-05, "step": 3765, "valid_targets_mean": 3104.3, "valid_targets_min": 1601 }, { "epoch": 3.61824, "grad_norm": 0.007773752201751082, "learning_rate": 8.619202235514e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.664046016638167e-05, "step": 3770, "valid_targets_mean": 4204.1, "valid_targets_min": 1877 }, { "epoch": 3.62304, "grad_norm": 0.011724108974262567, "learning_rate": 8.564172087743903e-06, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 8.043753041420132e-05, "step": 3775, "valid_targets_mean": 4841.0, "valid_targets_min": 1919 }, { "epoch": 3.62784, "grad_norm": 0.014603234371469162, "learning_rate": 8.50927027538128e-06, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 3.7259538657963276e-05, "step": 3780, "valid_targets_mean": 4642.8, "valid_targets_min": 1960 }, { "epoch": 3.63264, "grad_norm": 0.00800559357448803, "learning_rate": 8.454497414546497e-06, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 4.628532406059094e-05, "step": 3785, "valid_targets_mean": 3900.8, "valid_targets_min": 1906 }, { "epoch": 3.63744, "grad_norm": 0.009760845212688286, "learning_rate": 8.39985411991279e-06, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 4.497586633078754e-05, "step": 3790, "valid_targets_mean": 3523.5, "valid_targets_min": 1614 }, { "epoch": 3.64224, "grad_norm": 0.009892739360240588, "learning_rate": 8.345341004699386e-06, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 3.6855250073131174e-05, "step": 3795, "valid_targets_mean": 4958.9, "valid_targets_min": 1740 }, { "epoch": 3.64704, "grad_norm": 0.022126997467983734, "learning_rate": 8.290958680664591e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.7001504097133875e-05, "step": 3800, "valid_targets_mean": 5003.7, "valid_targets_min": 1601 }, { "epoch": 3.65184, "grad_norm": 0.006207067260963997, "learning_rate": 8.236707758098965e-06, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 7.68956306274049e-05, "step": 3805, "valid_targets_mean": 4634.0, "valid_targets_min": 1829 }, { "epoch": 3.65664, "grad_norm": 0.009933222541426298, "learning_rate": 8.182588845818452e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 5.3912557632429525e-05, "step": 3810, "valid_targets_mean": 3370.8, "valid_targets_min": 1931 }, { "epoch": 3.66144, "grad_norm": 0.005083907207555841, "learning_rate": 8.128602551157523e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.829049819614738e-05, "step": 3815, "valid_targets_mean": 3926.0, "valid_targets_min": 1998 }, { "epoch": 3.66624, "grad_norm": 0.003423366499798073, "learning_rate": 8.074749479962407e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 4.400216857902706e-05, "step": 3820, "valid_targets_mean": 3917.4, "valid_targets_min": 1904 }, { "epoch": 3.67104, "grad_norm": 0.00822734919109149, "learning_rate": 8.021030236584254e-06, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 5.029735984862782e-05, "step": 3825, "valid_targets_mean": 4000.3, "valid_targets_min": 1361 }, { "epoch": 3.67584, "grad_norm": 0.00811845623327458, "learning_rate": 7.967445423872384e-06, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 5.5101038014981896e-05, "step": 3830, "valid_targets_mean": 3887.2, "valid_targets_min": 1858 }, { "epoch": 3.68064, "grad_norm": 0.008909582138274898, "learning_rate": 7.913995643167494e-06, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 6.464569742092863e-05, "step": 3835, "valid_targets_mean": 4139.8, "valid_targets_min": 1799 }, { "epoch": 3.68544, "grad_norm": 0.005082007045025474, "learning_rate": 7.860681494294917e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 4.289662683731876e-05, "step": 3840, "valid_targets_mean": 5383.5, "valid_targets_min": 1877 }, { "epoch": 3.69024, "grad_norm": 0.028567503324743313, "learning_rate": 7.80750357555792e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 6.482819298980758e-05, "step": 3845, "valid_targets_mean": 4351.8, "valid_targets_min": 2010 }, { "epoch": 3.69504, "grad_norm": 0.008312164085289285, "learning_rate": 7.75446248373094e-06, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 3.698741420521401e-05, "step": 3850, "valid_targets_mean": 4194.5, "valid_targets_min": 1925 }, { "epoch": 3.69984, "grad_norm": 0.013534579590798691, "learning_rate": 7.701558814052928e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 5.3835676226299256e-05, "step": 3855, "valid_targets_mean": 3634.8, "valid_targets_min": 1786 }, { "epoch": 3.70464, "grad_norm": 0.00720602048189928, "learning_rate": 7.648793160220637e-06, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 2.953006151074078e-05, "step": 3860, "valid_targets_mean": 4952.3, "valid_targets_min": 1919 }, { "epoch": 3.70944, "grad_norm": 0.008449956594170478, "learning_rate": 7.596166114381991e-06, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 3.4673154004849494e-05, "step": 3865, "valid_targets_mean": 3438.7, "valid_targets_min": 1939 }, { "epoch": 3.71424, "grad_norm": 0.005375083760714377, "learning_rate": 7.543678267129408e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.617395123001188e-05, "step": 3870, "valid_targets_mean": 4350.7, "valid_targets_min": 1847 }, { "epoch": 3.71904, "grad_norm": 0.009037269182640846, "learning_rate": 7.491330207493215e-06, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 4.979194272891618e-05, "step": 3875, "valid_targets_mean": 3996.6, "valid_targets_min": 1909 }, { "epoch": 3.72384, "grad_norm": 0.008946248984604825, "learning_rate": 7.4391225229349785e-06, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 3.837323311017826e-05, "step": 3880, "valid_targets_mean": 3842.8, "valid_targets_min": 2083 }, { "epoch": 3.72864, "grad_norm": 0.006741545487650149, "learning_rate": 7.387055799340977e-06, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 3.537091106409207e-05, "step": 3885, "valid_targets_mean": 3515.7, "valid_targets_min": 2084 }, { "epoch": 3.73344, "grad_norm": 0.009958719900647239, "learning_rate": 7.3351306210155645e-06, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 7.938116323202848e-05, "step": 3890, "valid_targets_mean": 4039.8, "valid_targets_min": 1727 }, { "epoch": 3.7382400000000002, "grad_norm": 0.004166899002692281, "learning_rate": 7.283347570674664e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 5.300503835314885e-05, "step": 3895, "valid_targets_mean": 4780.2, "valid_targets_min": 1914 }, { "epoch": 3.74304, "grad_norm": 0.0055545578726656705, "learning_rate": 7.231707229439191e-06, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 4.4573745981324464e-05, "step": 3900, "valid_targets_mean": 2902.8, "valid_targets_min": 1838 }, { "epoch": 3.74784, "grad_norm": 0.011400834486338789, "learning_rate": 7.180210176828557e-06, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 5.124083691043779e-05, "step": 3905, "valid_targets_mean": 4634.8, "valid_targets_min": 1838 }, { "epoch": 3.75264, "grad_norm": 0.00841332841155176, "learning_rate": 7.1288569907541495e-06, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 0.00010382626351201907, "step": 3910, "valid_targets_mean": 3998.2, "valid_targets_min": 1836 }, { "epoch": 3.75744, "grad_norm": 0.008771579099235028, "learning_rate": 7.0776482475128674e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.999216642114334e-05, "step": 3915, "valid_targets_mean": 3358.6, "valid_targets_min": 1930 }, { "epoch": 3.7622400000000003, "grad_norm": 0.01653968115841514, "learning_rate": 7.026584521780628e-06, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 6.055902485968545e-05, "step": 3920, "valid_targets_mean": 3337.5, "valid_targets_min": 1940 }, { "epoch": 3.76704, "grad_norm": 0.0020106714719736176, "learning_rate": 6.9756663866059324e-06, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 5.6483760999981314e-05, "step": 3925, "valid_targets_mean": 3525.4, "valid_targets_min": 1921 }, { "epoch": 3.77184, "grad_norm": 0.009353143146674505, "learning_rate": 6.924894413403434e-06, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 4.59437542303931e-05, "step": 3930, "valid_targets_mean": 3793.8, "valid_targets_min": 1986 }, { "epoch": 3.77664, "grad_norm": 0.0016988195482671596, "learning_rate": 6.874269171947516e-06, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 3.4710130421444774e-05, "step": 3935, "valid_targets_mean": 4158.0, "valid_targets_min": 1991 }, { "epoch": 3.78144, "grad_norm": 0.011525809325227182, "learning_rate": 6.8237912303659195e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.272616959293373e-05, "step": 3940, "valid_targets_mean": 4315.2, "valid_targets_min": 2040 }, { "epoch": 3.7862400000000003, "grad_norm": 0.01327437986216609, "learning_rate": 6.773461155133334e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 4.483360316953622e-05, "step": 3945, "valid_targets_mean": 4166.3, "valid_targets_min": 2041 }, { "epoch": 3.7910399999999997, "grad_norm": 0.01155061809019346, "learning_rate": 6.723279511065088e-06, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 0.00010878659668378532, "step": 3950, "valid_targets_mean": 3971.8, "valid_targets_min": 1751 }, { "epoch": 3.79584, "grad_norm": 0.008489470823871952, "learning_rate": 6.673246861310751e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 4.032125070807524e-05, "step": 3955, "valid_targets_mean": 3081.6, "valid_targets_min": 1993 }, { "epoch": 3.80064, "grad_norm": 0.004944406539400989, "learning_rate": 6.623363767347874e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.2762374758021906e-05, "step": 3960, "valid_targets_mean": 3511.7, "valid_targets_min": 2034 }, { "epoch": 3.80544, "grad_norm": 0.0015531554707660037, "learning_rate": 6.5736307889756425e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.0193985367077403e-05, "step": 3965, "valid_targets_mean": 4271.0, "valid_targets_min": 1771 }, { "epoch": 3.81024, "grad_norm": 0.002938449796497635, "learning_rate": 6.5240484843086095e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.3413271012250334e-05, "step": 3970, "valid_targets_mean": 3733.8, "valid_targets_min": 1740 }, { "epoch": 3.8150399999999998, "grad_norm": 0.0051302286350760245, "learning_rate": 6.474617409770441e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.9273050788324326e-05, "step": 3975, "valid_targets_mean": 4800.5, "valid_targets_min": 1833 }, { "epoch": 3.81984, "grad_norm": 0.00431880865043546, "learning_rate": 6.425338120087665e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 5.9392667026259005e-05, "step": 3980, "valid_targets_mean": 3564.1, "valid_targets_min": 1933 }, { "epoch": 3.82464, "grad_norm": 0.0135204569747035, "learning_rate": 6.3762111682834374e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 4.671135684475303e-05, "step": 3985, "valid_targets_mean": 3377.8, "valid_targets_min": 1966 }, { "epoch": 3.82944, "grad_norm": 0.012904633473275234, "learning_rate": 6.327237105671362e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 5.7124419981846586e-05, "step": 3990, "valid_targets_mean": 3646.4, "valid_targets_min": 1931 }, { "epoch": 3.83424, "grad_norm": 0.012677339947563877, "learning_rate": 6.278416481849274e-06, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 5.282880738377571e-05, "step": 3995, "valid_targets_mean": 3834.4, "valid_targets_min": 1517 }, { "epoch": 3.83904, "grad_norm": 0.0027541770656437647, "learning_rate": 6.22974984469308e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 4.0949358663056046e-05, "step": 4000, "valid_targets_mean": 4092.8, "valid_targets_min": 1870 }, { "epoch": 3.84384, "grad_norm": 0.0025121154244893383, "learning_rate": 6.181237740350625e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.9284408558160067e-05, "step": 4005, "valid_targets_mean": 3402.4, "valid_targets_min": 2072 }, { "epoch": 3.84864, "grad_norm": 0.007040691563797863, "learning_rate": 6.132880713235543e-06, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 4.226173768984154e-05, "step": 4010, "valid_targets_mean": 3744.0, "valid_targets_min": 1662 }, { "epoch": 3.85344, "grad_norm": 0.0017011433295406567, "learning_rate": 6.084679306021162e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.698827276821248e-05, "step": 4015, "valid_targets_mean": 4849.4, "valid_targets_min": 1909 }, { "epoch": 3.85824, "grad_norm": 0.010975701606423343, "learning_rate": 6.036634059634403e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 4.6234490582719445e-05, "step": 4020, "valid_targets_mean": 3950.8, "valid_targets_min": 1802 }, { "epoch": 3.86304, "grad_norm": 0.009004613849435001, "learning_rate": 5.988745513249723e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.65586020052433e-05, "step": 4025, "valid_targets_mean": 4084.7, "valid_targets_min": 1987 }, { "epoch": 3.86784, "grad_norm": 0.006895797007772438, "learning_rate": 5.941014204283065e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 5.828316352562979e-05, "step": 4030, "valid_targets_mean": 3135.8, "valid_targets_min": 1857 }, { "epoch": 3.87264, "grad_norm": 0.01178803809355006, "learning_rate": 5.893440668385797e-06, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 3.943587216781452e-05, "step": 4035, "valid_targets_mean": 4593.9, "valid_targets_min": 1908 }, { "epoch": 3.87744, "grad_norm": 0.01132365691364727, "learning_rate": 5.8460254394387335e-06, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 7.603708218084648e-05, "step": 4040, "valid_targets_mean": 2908.2, "valid_targets_min": 1763 }, { "epoch": 3.88224, "grad_norm": 0.0015247764789779767, "learning_rate": 5.798769049546136e-06, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 3.867723353323527e-05, "step": 4045, "valid_targets_mean": 4326.9, "valid_targets_min": 2052 }, { "epoch": 3.88704, "grad_norm": 0.007712351251859507, "learning_rate": 5.751672029029734e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 6.214739551069215e-05, "step": 4050, "valid_targets_mean": 3336.8, "valid_targets_min": 1918 }, { "epoch": 3.89184, "grad_norm": 0.005302270584137382, "learning_rate": 5.704734906422775e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 4.486428952077404e-05, "step": 4055, "valid_targets_mean": 3890.5, "valid_targets_min": 1614 }, { "epoch": 3.89664, "grad_norm": 0.008602600193917502, "learning_rate": 5.657958208464103e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 2.3105505533749238e-05, "step": 4060, "valid_targets_mean": 5310.7, "valid_targets_min": 1868 }, { "epoch": 3.90144, "grad_norm": 0.011762847617699367, "learning_rate": 5.611342460092244e-06, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 3.642755837063305e-05, "step": 4065, "valid_targets_mean": 3324.7, "valid_targets_min": 1763 }, { "epoch": 3.90624, "grad_norm": 0.01025277386741305, "learning_rate": 5.564888184439505e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 8.32563528092578e-05, "step": 4070, "valid_targets_mean": 3358.8, "valid_targets_min": 1987 }, { "epoch": 3.91104, "grad_norm": 0.00826164879811961, "learning_rate": 5.5185959028261135e-06, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 6.293428305070847e-05, "step": 4075, "valid_targets_mean": 3793.2, "valid_targets_min": 1913 }, { "epoch": 3.91584, "grad_norm": 0.0017179245030004447, "learning_rate": 5.47246613475436e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.292598921689205e-05, "step": 4080, "valid_targets_mean": 5032.8, "valid_targets_min": 1764 }, { "epoch": 3.92064, "grad_norm": 0.006387347577353118, "learning_rate": 5.4264993979027735e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 5.276900265016593e-05, "step": 4085, "valid_targets_mean": 4469.8, "valid_targets_min": 1662 }, { "epoch": 3.92544, "grad_norm": 0.0017208693189951672, "learning_rate": 5.380696208120315e-06, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 3.718512016348541e-05, "step": 4090, "valid_targets_mean": 3913.8, "valid_targets_min": 1942 }, { "epoch": 3.93024, "grad_norm": 0.009615232784227547, "learning_rate": 5.335057079420571e-06, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 4.271994475857355e-05, "step": 4095, "valid_targets_mean": 4633.0, "valid_targets_min": 1906 }, { "epoch": 3.93504, "grad_norm": 0.00315117505190966, "learning_rate": 5.289582523976015e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 5.916188092669472e-05, "step": 4100, "valid_targets_mean": 3094.9, "valid_targets_min": 1839 }, { "epoch": 3.9398400000000002, "grad_norm": 0.002341135347296883, "learning_rate": 5.244273052112241e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 4.824275674764067e-05, "step": 4105, "valid_targets_mean": 3952.0, "valid_targets_min": 1820 }, { "epoch": 3.94464, "grad_norm": 0.006120762233210705, "learning_rate": 5.199129172302224e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 2.396788477199152e-05, "step": 4110, "valid_targets_mean": 4057.8, "valid_targets_min": 1652 }, { "epoch": 3.94944, "grad_norm": 0.01147219264594495, "learning_rate": 5.154151391160638e-06, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 5.357105692382902e-05, "step": 4115, "valid_targets_mean": 3406.0, "valid_targets_min": 2061 }, { "epoch": 3.95424, "grad_norm": 0.0043650589223010496, "learning_rate": 5.109340213438156e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 4.6478053263854235e-05, "step": 4120, "valid_targets_mean": 3741.1, "valid_targets_min": 1952 }, { "epoch": 3.95904, "grad_norm": 0.0030919506576588917, "learning_rate": 5.0646961420157995e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.029893741768319e-05, "step": 4125, "valid_targets_mean": 4083.2, "valid_targets_min": 1877 }, { "epoch": 3.9638400000000003, "grad_norm": 0.0030273483345704686, "learning_rate": 5.020219677899276e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.4400916774757206e-05, "step": 4130, "valid_targets_mean": 3293.4, "valid_targets_min": 1760 }, { "epoch": 3.9686399999999997, "grad_norm": 0.0017464199544329963, "learning_rate": 4.975911320213365e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 4.5975579268997535e-05, "step": 4135, "valid_targets_mean": 3433.2, "valid_targets_min": 1705 }, { "epoch": 3.97344, "grad_norm": 0.002077433108478966, "learning_rate": 4.931771566196332e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 4.3588610424194485e-05, "step": 4140, "valid_targets_mean": 3861.1, "valid_targets_min": 1942 }, { "epoch": 3.97824, "grad_norm": 0.002321329052569725, "learning_rate": 4.887800911194327e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 5.014351336285472e-05, "step": 4145, "valid_targets_mean": 3757.0, "valid_targets_min": 1917 }, { "epoch": 3.98304, "grad_norm": 0.0033831803043769893, "learning_rate": 4.8439998486558246e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 2.0929337551933713e-05, "step": 4150, "valid_targets_mean": 4829.0, "valid_targets_min": 1933 }, { "epoch": 3.9878400000000003, "grad_norm": 0.0065384692462405886, "learning_rate": 4.800368870126111e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 4.445397644303739e-05, "step": 4155, "valid_targets_mean": 4013.5, "valid_targets_min": 2008 }, { "epoch": 3.9926399999999997, "grad_norm": 0.007960408672666047, "learning_rate": 4.756908465241736e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 6.532538100145757e-05, "step": 4160, "valid_targets_mean": 2909.1, "valid_targets_min": 1933 }, { "epoch": 3.99744, "grad_norm": 0.002761429608947698, "learning_rate": 4.713619121725039e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 5.965345917502418e-05, "step": 4165, "valid_targets_mean": 3661.7, "valid_targets_min": 1361 }, { "epoch": 4.00192, "grad_norm": 0.00564879768287149, "learning_rate": 4.670501325378682e-06, "loss": 0.0002, "loss_nan_ranks": 0, "loss_rank_avg": 3.989029937656596e-05, "step": 4170, "valid_targets_mean": 4154.5, "valid_targets_min": 1562 }, { "epoch": 4.00672, "grad_norm": 0.0017008982835388347, "learning_rate": 4.627555560080173e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 4.260703281033784e-05, "step": 4175, "valid_targets_mean": 3558.2, "valid_targets_min": 2030 }, { "epoch": 4.01152, "grad_norm": 0.0013598220119315672, "learning_rate": 4.5847823077764565e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.567889507394284e-05, "step": 4180, "valid_targets_mean": 4792.2, "valid_targets_min": 1716 }, { "epoch": 4.01632, "grad_norm": 0.0017277913774604524, "learning_rate": 4.5421820484784936e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.8666614273097366e-05, "step": 4185, "valid_targets_mean": 3129.0, "valid_targets_min": 1680 }, { "epoch": 4.02112, "grad_norm": 0.010995756807561355, "learning_rate": 4.499755260255881e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 4.598851955961436e-05, "step": 4190, "valid_targets_mean": 3880.6, "valid_targets_min": 1887 }, { "epoch": 4.02592, "grad_norm": 0.007874013108371752, "learning_rate": 4.457502419231483e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 6.0256828874116763e-05, "step": 4195, "valid_targets_mean": 3937.4, "valid_targets_min": 1919 }, { "epoch": 4.03072, "grad_norm": 0.005097701158583684, "learning_rate": 4.415423999576091e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 4.7677243856014684e-05, "step": 4200, "valid_targets_mean": 4715.7, "valid_targets_min": 1930 }, { "epoch": 4.03552, "grad_norm": 0.00832156517250208, "learning_rate": 4.373520473503097e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.421106521273032e-05, "step": 4205, "valid_targets_mean": 4367.5, "valid_targets_min": 2220 }, { "epoch": 4.04032, "grad_norm": 0.0013368495812476166, "learning_rate": 4.33179231126321e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.380177804501727e-05, "step": 4210, "valid_targets_mean": 3230.2, "valid_targets_min": 1958 }, { "epoch": 4.04512, "grad_norm": 0.00208369487802161, "learning_rate": 4.2902399811391575e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.897564238286577e-05, "step": 4215, "valid_targets_mean": 3983.1, "valid_targets_min": 1662 }, { "epoch": 4.04992, "grad_norm": 0.001584687114330045, "learning_rate": 4.248863949440436e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.266106068622321e-05, "step": 4220, "valid_targets_mean": 3432.7, "valid_targets_min": 2007 }, { "epoch": 4.05472, "grad_norm": 0.00787766824013007, "learning_rate": 4.207664680498094e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.363234282005578e-05, "step": 4225, "valid_targets_mean": 4572.5, "valid_targets_min": 1839 }, { "epoch": 4.05952, "grad_norm": 0.00205025097170975, "learning_rate": 4.166642636659495e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 2.519926601962652e-05, "step": 4230, "valid_targets_mean": 5066.3, "valid_targets_min": 1786 }, { "epoch": 4.06432, "grad_norm": 0.0016026371988252155, "learning_rate": 4.125798278283155e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.269485750934109e-05, "step": 4235, "valid_targets_mean": 3498.3, "valid_targets_min": 2041 }, { "epoch": 4.06912, "grad_norm": 0.0017439816942912997, "learning_rate": 4.085132063733554e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.675786138046533e-05, "step": 4240, "valid_targets_mean": 3827.7, "valid_targets_min": 2024 }, { "epoch": 4.07392, "grad_norm": 0.0059827154830725034, "learning_rate": 4.0446444493760165e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.55681695509702e-05, "step": 4245, "valid_targets_mean": 4141.8, "valid_targets_min": 1889 }, { "epoch": 4.07872, "grad_norm": 0.0038426262164381678, "learning_rate": 4.004335889571556e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.607972030295059e-05, "step": 4250, "valid_targets_mean": 3393.1, "valid_targets_min": 1950 }, { "epoch": 4.08352, "grad_norm": 0.00491056822089905, "learning_rate": 3.96420683667182e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 5.275919829728082e-05, "step": 4255, "valid_targets_mean": 3971.6, "valid_targets_min": 2020 }, { "epoch": 4.08832, "grad_norm": 0.0028428055872032018, "learning_rate": 3.924257741013968e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 4.72756837552879e-05, "step": 4260, "valid_targets_mean": 3005.8, "valid_targets_min": 1727 }, { "epoch": 4.09312, "grad_norm": 0.002148760727185149, "learning_rate": 3.884489050915652e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 4.0193852328229696e-05, "step": 4265, "valid_targets_mean": 2827.3, "valid_targets_min": 1863 }, { "epoch": 4.09792, "grad_norm": 0.0023335386496191987, "learning_rate": 3.844901212669962e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 2.841453351720702e-05, "step": 4270, "valid_targets_mean": 3088.7, "valid_targets_min": 1930 }, { "epoch": 4.10272, "grad_norm": 0.001286310131837442, "learning_rate": 3.8054946705404415e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.464947803877294e-05, "step": 4275, "valid_targets_mean": 4350.3, "valid_targets_min": 1884 }, { "epoch": 4.10752, "grad_norm": 0.0015531321802579076, "learning_rate": 3.7662698667560714e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.5117111110594124e-05, "step": 4280, "valid_targets_mean": 3142.5, "valid_targets_min": 1942 }, { "epoch": 4.11232, "grad_norm": 0.0016055863187996663, "learning_rate": 3.7272272415063484e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.6740551877301186e-05, "step": 4285, "valid_targets_mean": 3298.3, "valid_targets_min": 2013 }, { "epoch": 4.11712, "grad_norm": 0.0029316369728722416, "learning_rate": 3.6883672329363007e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.9559832657687366e-05, "step": 4290, "valid_targets_mean": 3922.3, "valid_targets_min": 1727 }, { "epoch": 4.12192, "grad_norm": 0.0015623211280171884, "learning_rate": 3.649690277141598e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.7854842958040535e-05, "step": 4295, "valid_targets_mean": 3290.9, "valid_targets_min": 1525 }, { "epoch": 4.12672, "grad_norm": 0.0027055639776239634, "learning_rate": 3.6111968081636507e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 2.4809010938042775e-05, "step": 4300, "valid_targets_mean": 3566.5, "valid_targets_min": 2034 }, { "epoch": 4.13152, "grad_norm": 0.0013377359893271355, "learning_rate": 3.572887257984743e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 4.381590406410396e-05, "step": 4305, "valid_targets_mean": 3170.8, "valid_targets_min": 1987 }, { "epoch": 4.1363199999999996, "grad_norm": 0.003940540400894581, "learning_rate": 3.5347620565231733e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 7.146632560761645e-05, "step": 4310, "valid_targets_mean": 3132.8, "valid_targets_min": 1909 }, { "epoch": 4.14112, "grad_norm": 0.0019501200493331245, "learning_rate": 3.496821631628442e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.4340086131123826e-05, "step": 4315, "valid_targets_mean": 4166.7, "valid_targets_min": 1614 }, { "epoch": 4.14592, "grad_norm": 0.0011369610238447416, "learning_rate": 3.459066409076448e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.429923526709899e-05, "step": 4320, "valid_targets_mean": 4413.0, "valid_targets_min": 1361 }, { "epoch": 4.15072, "grad_norm": 0.0014505389624406707, "learning_rate": 3.421496812564713e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.4482301998650655e-05, "step": 4325, "valid_targets_mean": 5303.1, "valid_targets_min": 2088 }, { "epoch": 4.15552, "grad_norm": 0.004779096813522042, "learning_rate": 3.384113263707609e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.184087836416438e-05, "step": 4330, "valid_targets_mean": 4378.8, "valid_targets_min": 1870 }, { "epoch": 4.16032, "grad_norm": 0.0026258332815263757, "learning_rate": 3.34691618203165e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 6.489974475698546e-05, "step": 4335, "valid_targets_mean": 4047.0, "valid_targets_min": 1920 }, { "epoch": 4.16512, "grad_norm": 0.001816961044617779, "learning_rate": 3.309905984970765e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.8048809074098244e-05, "step": 4340, "valid_targets_mean": 2844.7, "valid_targets_min": 1914 }, { "epoch": 4.16992, "grad_norm": 0.0018025365511840077, "learning_rate": 3.2730830878616305e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.494471457088366e-05, "step": 4345, "valid_targets_mean": 4423.0, "valid_targets_min": 1977 }, { "epoch": 4.17472, "grad_norm": 0.0015254616003019617, "learning_rate": 3.2364479039389973e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.3799573429860175e-05, "step": 4350, "valid_targets_mean": 3975.1, "valid_targets_min": 1601 }, { "epoch": 4.17952, "grad_norm": 0.0013297521092237158, "learning_rate": 3.2000008443310505e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.5375484003452584e-05, "step": 4355, "valid_targets_mean": 3518.4, "valid_targets_min": 1764 }, { "epoch": 4.18432, "grad_norm": 0.0015651851486661397, "learning_rate": 3.1637423180548232e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 2.7060703359893523e-05, "step": 4360, "valid_targets_mean": 4383.7, "valid_targets_min": 2081 }, { "epoch": 4.18912, "grad_norm": 0.0013429520317032584, "learning_rate": 3.127672732011564e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 2.832937752828002e-05, "step": 4365, "valid_targets_mean": 3055.6, "valid_targets_min": 1931 }, { "epoch": 4.19392, "grad_norm": 0.001673435127439738, "learning_rate": 3.0917924909821993e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 4.698914199252613e-05, "step": 4370, "valid_targets_mean": 3913.2, "valid_targets_min": 1925 }, { "epoch": 4.19872, "grad_norm": 0.0017055197505207748, "learning_rate": 3.0561019976227867e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.7643716495949775e-05, "step": 4375, "valid_targets_mean": 4424.2, "valid_targets_min": 1942 }, { "epoch": 4.20352, "grad_norm": 0.001524053630224983, "learning_rate": 3.020601652459989e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 4.057669502799399e-05, "step": 4380, "valid_targets_mean": 3439.1, "valid_targets_min": 2033 }, { "epoch": 4.20832, "grad_norm": 0.0014977455442873465, "learning_rate": 2.9852918538865847e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.6328819987829775e-05, "step": 4385, "valid_targets_mean": 3529.1, "valid_targets_min": 1950 }, { "epoch": 4.21312, "grad_norm": 0.002089373327408226, "learning_rate": 2.950172998156995e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 4.692836955655366e-05, "step": 4390, "valid_targets_mean": 4298.4, "valid_targets_min": 2071 }, { "epoch": 4.21792, "grad_norm": 0.0018448814132004277, "learning_rate": 2.91524547938284e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.71622372767888e-05, "step": 4395, "valid_targets_mean": 4462.7, "valid_targets_min": 1847 }, { "epoch": 4.22272, "grad_norm": 0.0012318653842671413, "learning_rate": 2.880509689528519e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.8981317629804835e-05, "step": 4400, "valid_targets_mean": 4393.9, "valid_targets_min": 1919 }, { "epoch": 4.22752, "grad_norm": 0.0013800529639858145, "learning_rate": 2.845966018406796e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 2.7751670131692663e-05, "step": 4405, "valid_targets_mean": 4296.9, "valid_targets_min": 1914 }, { "epoch": 4.23232, "grad_norm": 0.0022095704660588518, "learning_rate": 2.8116148536744448e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.149065378238447e-05, "step": 4410, "valid_targets_mean": 3783.5, "valid_targets_min": 1951 }, { "epoch": 4.23712, "grad_norm": 0.001829538248299371, "learning_rate": 2.777456580827882e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.5836652386933565e-05, "step": 4415, "valid_targets_mean": 3286.2, "valid_targets_min": 1972 }, { "epoch": 4.24192, "grad_norm": 0.0013569162605098144, "learning_rate": 2.7434915831988517e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 4.01278848585207e-05, "step": 4420, "valid_targets_mean": 5327.2, "valid_targets_min": 1786 }, { "epoch": 4.24672, "grad_norm": 0.0015208666777376662, "learning_rate": 2.7097202419501246e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.3911415812326595e-05, "step": 4425, "valid_targets_mean": 4008.7, "valid_targets_min": 1917 }, { "epoch": 4.25152, "grad_norm": 0.0013156359603355792, "learning_rate": 2.6761429360712045e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 2.497844980098307e-05, "step": 4430, "valid_targets_mean": 4711.8, "valid_targets_min": 1614 }, { "epoch": 4.25632, "grad_norm": 0.0054384452715636345, "learning_rate": 2.642760042374106e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 4.011658165836707e-05, "step": 4435, "valid_targets_mean": 3496.8, "valid_targets_min": 1912 }, { "epoch": 4.26112, "grad_norm": 0.0013737950200195751, "learning_rate": 2.6095719354890903e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.339675458846614e-05, "step": 4440, "valid_targets_mean": 4009.8, "valid_targets_min": 1877 }, { "epoch": 4.26592, "grad_norm": 0.0011869857062110785, "learning_rate": 2.5765789878604852e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 4.306513801566325e-05, "step": 4445, "valid_targets_mean": 3195.0, "valid_targets_min": 1833 }, { "epoch": 4.27072, "grad_norm": 0.002369333683258055, "learning_rate": 2.543781569742496e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 4.995891504222527e-05, "step": 4450, "valid_targets_mean": 4051.5, "valid_targets_min": 1981 }, { "epoch": 4.27552, "grad_norm": 0.0015064551394305126, "learning_rate": 2.5111800491950523e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.0394799978239462e-05, "step": 4455, "valid_targets_mean": 3638.0, "valid_targets_min": 1662 }, { "epoch": 4.28032, "grad_norm": 0.001674277187515422, "learning_rate": 2.4787747920796723e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.41932536684908e-05, "step": 4460, "valid_targets_mean": 4709.2, "valid_targets_min": 1919 }, { "epoch": 4.28512, "grad_norm": 0.0016113360197275133, "learning_rate": 2.446566162055377e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.608020051615313e-05, "step": 4465, "valid_targets_mean": 3064.8, "valid_targets_min": 1906 }, { "epoch": 4.28992, "grad_norm": 0.0017275336703297865, "learning_rate": 2.414554520574579e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 5.0131959142163396e-05, "step": 4470, "valid_targets_mean": 3079.5, "valid_targets_min": 1562 }, { "epoch": 4.29472, "grad_norm": 0.0013714628082071834, "learning_rate": 2.382740226879052e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.390222627785988e-05, "step": 4475, "valid_targets_mean": 4828.3, "valid_targets_min": 1763 }, { "epoch": 4.29952, "grad_norm": 0.0012150699900979316, "learning_rate": 2.3511236379958824e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.9595783164259046e-05, "step": 4480, "valid_targets_mean": 3530.4, "valid_targets_min": 1662 }, { "epoch": 4.30432, "grad_norm": 0.001616671707384578, "learning_rate": 2.31970510873347e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 4.014815203845501e-05, "step": 4485, "valid_targets_mean": 4057.2, "valid_targets_min": 1836 }, { "epoch": 4.30912, "grad_norm": 0.0011221295175201655, "learning_rate": 2.2884849916775485e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.353855572640896e-05, "step": 4490, "valid_targets_mean": 4496.3, "valid_targets_min": 1786 }, { "epoch": 4.3139199999999995, "grad_norm": 0.0017016556243612912, "learning_rate": 2.257463637187225e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 4.1361305193277076e-05, "step": 4495, "valid_targets_mean": 3690.3, "valid_targets_min": 1906 }, { "epoch": 4.31872, "grad_norm": 0.0015121984545869538, "learning_rate": 2.2266413933910426e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.035143527085893e-05, "step": 4500, "valid_targets_mean": 3866.2, "valid_targets_min": 1966 }, { "epoch": 4.32352, "grad_norm": 0.0012856343972766713, "learning_rate": 2.196018606183088e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 2.976351424877066e-05, "step": 4505, "valid_targets_mean": 4928.6, "valid_targets_min": 2030 }, { "epoch": 4.32832, "grad_norm": 0.0014908309871930075, "learning_rate": 2.1655956192191007e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 4.7100074880290776e-05, "step": 4510, "valid_targets_mean": 4195.6, "valid_targets_min": 1884 }, { "epoch": 4.33312, "grad_norm": 0.0016059641687275934, "learning_rate": 2.135372773912614e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 4.639291000785306e-05, "step": 4515, "valid_targets_mean": 3228.2, "valid_targets_min": 1933 }, { "epoch": 4.33792, "grad_norm": 0.002000268968529377, "learning_rate": 2.1053504094311285e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 2.447868973831646e-05, "step": 4520, "valid_targets_mean": 5219.3, "valid_targets_min": 1928 }, { "epoch": 4.34272, "grad_norm": 0.0017280071789846, "learning_rate": 2.0755288626923022e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 4.983695544069633e-05, "step": 4525, "valid_targets_mean": 3567.2, "valid_targets_min": 1999 }, { "epoch": 4.34752, "grad_norm": 0.0015796876911165173, "learning_rate": 2.0459084683601736e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 5.003527257940732e-05, "step": 4530, "valid_targets_mean": 3082.1, "valid_targets_min": 2088 }, { "epoch": 4.35232, "grad_norm": 0.0016431065257554265, "learning_rate": 2.0164895588414037e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 5.4640182497678325e-05, "step": 4535, "valid_targets_mean": 4039.8, "valid_targets_min": 1863 }, { "epoch": 4.35712, "grad_norm": 0.0011173401923015307, "learning_rate": 1.987272464281551e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 2.7552010578801855e-05, "step": 4540, "valid_targets_mean": 3328.8, "valid_targets_min": 1909 }, { "epoch": 4.36192, "grad_norm": 0.0014470057490486652, "learning_rate": 1.95825751256135e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.667410055641085e-05, "step": 4545, "valid_targets_mean": 3116.9, "valid_targets_min": 1740 }, { "epoch": 4.36672, "grad_norm": 0.0011899865608208137, "learning_rate": 1.9294450292930576e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.059140362893231e-05, "step": 4550, "valid_targets_mean": 4447.5, "valid_targets_min": 2136 }, { "epoch": 4.37152, "grad_norm": 0.0014338406740680588, "learning_rate": 1.9008353378167755e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 4.4420336053008214e-05, "step": 4555, "valid_targets_mean": 4507.5, "valid_targets_min": 1949 }, { "epoch": 4.37632, "grad_norm": 0.0016033511510176346, "learning_rate": 1.8724287591968294e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.303139237686992e-05, "step": 4560, "valid_targets_mean": 4461.0, "valid_targets_min": 1958 }, { "epoch": 4.38112, "grad_norm": 0.0016662233139541564, "learning_rate": 1.8442256122181735e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.8418951589846984e-05, "step": 4565, "valid_targets_mean": 4491.6, "valid_targets_min": 2044 }, { "epoch": 4.38592, "grad_norm": 0.00227254489455862, "learning_rate": 1.8162262133828013e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.4018466976704076e-05, "step": 4570, "valid_targets_mean": 4248.5, "valid_targets_min": 1931 }, { "epoch": 4.39072, "grad_norm": 0.0012256581723182494, "learning_rate": 1.7884308769061974e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.6851910408586264e-05, "step": 4575, "valid_targets_mean": 3628.8, "valid_targets_min": 1991 }, { "epoch": 4.39552, "grad_norm": 0.0013118549809077072, "learning_rate": 1.7608399147138278e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 2.930739356088452e-05, "step": 4580, "valid_targets_mean": 4122.8, "valid_targets_min": 1908 }, { "epoch": 4.40032, "grad_norm": 0.0014985345497132527, "learning_rate": 1.7334536364376075e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 4.729587817564607e-05, "step": 4585, "valid_targets_mean": 3863.1, "valid_targets_min": 1751 }, { "epoch": 4.40512, "grad_norm": 0.0016352089801263863, "learning_rate": 1.7062723494124545e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.489490700303577e-05, "step": 4590, "valid_targets_mean": 2983.8, "valid_targets_min": 1900 }, { "epoch": 4.40992, "grad_norm": 0.0012257363638319958, "learning_rate": 1.6792963586728195e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.1652001780457795e-05, "step": 4595, "valid_targets_mean": 3711.4, "valid_targets_min": 2032 }, { "epoch": 4.41472, "grad_norm": 0.0013212030801314416, "learning_rate": 1.6525259669492832e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 2.7446647436590865e-05, "step": 4600, "valid_targets_mean": 4090.9, "valid_targets_min": 1907 }, { "epoch": 4.41952, "grad_norm": 0.0014011914669706318, "learning_rate": 1.6259614746651364e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 2.055836739600636e-05, "step": 4605, "valid_targets_mean": 3449.7, "valid_targets_min": 1764 }, { "epoch": 4.42432, "grad_norm": 0.0014717860429847214, "learning_rate": 1.5996031799330315e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.580058546504006e-05, "step": 4610, "valid_targets_mean": 3305.9, "valid_targets_min": 1802 }, { "epoch": 4.42912, "grad_norm": 0.0016473531059666415, "learning_rate": 1.5734513785516227e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.1261421099770814e-05, "step": 4615, "valid_targets_mean": 3253.5, "valid_targets_min": 1361 }, { "epoch": 4.43392, "grad_norm": 0.001331483103913834, "learning_rate": 1.5475063640022425e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.218392885173671e-05, "step": 4620, "valid_targets_mean": 4387.2, "valid_targets_min": 1943 }, { "epoch": 4.43872, "grad_norm": 0.0015678072884918073, "learning_rate": 1.5217684274456314e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 4.212444764561951e-05, "step": 4625, "valid_targets_mean": 4228.2, "valid_targets_min": 1914 }, { "epoch": 4.44352, "grad_norm": 0.0012720162054364376, "learning_rate": 1.496237857718641e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.2788058888399974e-05, "step": 4630, "valid_targets_mean": 3761.5, "valid_targets_min": 1908 }, { "epoch": 4.44832, "grad_norm": 0.0014693064780329035, "learning_rate": 1.4709149413310076e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 4.5739245251752436e-05, "step": 4635, "valid_targets_mean": 3045.1, "valid_targets_min": 1914 }, { "epoch": 4.45312, "grad_norm": 0.0012759797820861135, "learning_rate": 1.445799962462142e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 4.0074017306324095e-05, "step": 4640, "valid_targets_mean": 4218.8, "valid_targets_min": 1939 }, { "epoch": 4.45792, "grad_norm": 0.0014016504839545346, "learning_rate": 1.420893202957927e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.586061211535707e-05, "step": 4645, "valid_targets_mean": 5258.8, "valid_targets_min": 1763 }, { "epoch": 4.46272, "grad_norm": 0.0013382238846672736, "learning_rate": 1.3961949423275622e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.416348772589117e-05, "step": 4650, "valid_targets_mean": 3336.5, "valid_targets_min": 1917 }, { "epoch": 4.46752, "grad_norm": 0.0010650811370673263, "learning_rate": 1.3717054577404331e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.619651397457346e-05, "step": 4655, "valid_targets_mean": 4939.1, "valid_targets_min": 1942 }, { "epoch": 4.47232, "grad_norm": 0.0015467868997038122, "learning_rate": 1.347425024022988e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 4.186376099823974e-05, "step": 4660, "valid_targets_mean": 3193.4, "valid_targets_min": 1719 }, { "epoch": 4.47712, "grad_norm": 0.001079459379272364, "learning_rate": 1.3233539136556606e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.495600321912207e-05, "step": 4665, "valid_targets_mean": 4908.7, "valid_targets_min": 1525 }, { "epoch": 4.48192, "grad_norm": 0.0016107049369327223, "learning_rate": 1.2994923967698125e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 2.6766832888824865e-05, "step": 4670, "valid_targets_mean": 3231.1, "valid_targets_min": 1918 }, { "epoch": 4.48672, "grad_norm": 0.001295276413290572, "learning_rate": 1.2758407411446982e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 2.188467806263361e-05, "step": 4675, "valid_targets_mean": 3830.6, "valid_targets_min": 1863 }, { "epoch": 4.49152, "grad_norm": 0.0014125030915670483, "learning_rate": 1.252399212204467e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 4.064816312165931e-05, "step": 4680, "valid_targets_mean": 4017.2, "valid_targets_min": 1906 }, { "epoch": 4.49632, "grad_norm": 0.0013458030400534259, "learning_rate": 1.22916807301517e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 4.3533407733775675e-05, "step": 4685, "valid_targets_mean": 3477.4, "valid_targets_min": 1820 }, { "epoch": 4.50112, "grad_norm": 0.0016436112336502518, "learning_rate": 1.2061475842818337e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 5.694011997547932e-05, "step": 4690, "valid_targets_mean": 2803.8, "valid_targets_min": 1771 }, { "epoch": 4.50592, "grad_norm": 0.0014744987333515098, "learning_rate": 1.1833380043455e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.827699401881546e-05, "step": 4695, "valid_targets_mean": 3764.2, "valid_targets_min": 2059 }, { "epoch": 4.51072, "grad_norm": 0.0014523313139412053, "learning_rate": 1.1607395891803641e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 2.0521079932223074e-05, "step": 4700, "valid_targets_mean": 3435.2, "valid_targets_min": 1919 }, { "epoch": 4.51552, "grad_norm": 0.001377506897666381, "learning_rate": 1.1383525923908678e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 4.60075207229238e-05, "step": 4705, "valid_targets_mean": 3290.6, "valid_targets_min": 1966 }, { "epoch": 4.52032, "grad_norm": 0.001252005700755184, "learning_rate": 1.1161772652088775e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.753907003556378e-05, "step": 4710, "valid_targets_mean": 3920.6, "valid_targets_min": 1820 }, { "epoch": 4.52512, "grad_norm": 0.0025620915151801284, "learning_rate": 1.094213856490849e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 4.3474727135617286e-05, "step": 4715, "valid_targets_mean": 3555.8, "valid_targets_min": 1601 }, { "epoch": 4.52992, "grad_norm": 0.001519151744512467, "learning_rate": 1.0724626127150462e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 4.198120950604789e-05, "step": 4720, "valid_targets_mean": 2547.0, "valid_targets_min": 1981 }, { "epoch": 4.53472, "grad_norm": 0.001991121718963719, "learning_rate": 1.0509237779787717e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 4.0243176044896245e-05, "step": 4725, "valid_targets_mean": 3534.3, "valid_targets_min": 2086 }, { "epoch": 4.5395199999999996, "grad_norm": 0.0013389944210247407, "learning_rate": 1.029597593995626e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 4.0416300180368125e-05, "step": 4730, "valid_targets_mean": 3721.5, "valid_targets_min": 1929 }, { "epoch": 4.54432, "grad_norm": 0.0017033067169285275, "learning_rate": 1.008484300092798e-06, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 4.046371759613976e-05, "step": 4735, "valid_targets_mean": 3974.4, "valid_targets_min": 1562 }, { "epoch": 4.54912, "grad_norm": 0.0013382541310036622, "learning_rate": 9.87584133208368e-07, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 4.098331919522025e-05, "step": 4740, "valid_targets_mean": 4250.1, "valid_targets_min": 1934 }, { "epoch": 4.55392, "grad_norm": 0.0014815237161349228, "learning_rate": 9.66897327888665e-07, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.0904986488167197e-05, "step": 4745, "valid_targets_mean": 3927.1, "valid_targets_min": 2136 }, { "epoch": 4.55872, "grad_norm": 0.0012628924512069915, "learning_rate": 9.464241162856269e-07, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 2.71253284154227e-05, "step": 4750, "valid_targets_mean": 3516.2, "valid_targets_min": 1820 }, { "epoch": 4.5635200000000005, "grad_norm": 0.0016096247714936995, "learning_rate": 9.261647281541908e-07, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 4.163005360169336e-05, "step": 4755, "valid_targets_mean": 3711.3, "valid_targets_min": 1786 }, { "epoch": 4.56832, "grad_norm": 0.0011359447908436454, "learning_rate": 9.061193908497201e-07, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 2.9243678000057116e-05, "step": 4760, "valid_targets_mean": 3960.3, "valid_targets_min": 1760 }, { "epoch": 4.57312, "grad_norm": 0.0012325208487944698, "learning_rate": 8.862883293254598e-07, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 2.4878499971237034e-05, "step": 4765, "valid_targets_mean": 3877.7, "valid_targets_min": 1760 }, { "epoch": 4.57792, "grad_norm": 0.0017772163052283724, "learning_rate": 8.666717661299917e-07, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 2.6678311769501306e-05, "step": 4770, "valid_targets_mean": 3336.5, "valid_targets_min": 1727 }, { "epoch": 4.58272, "grad_norm": 0.0012672879514388682, "learning_rate": 8.472699214047652e-07, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.525630381773226e-05, "step": 4775, "valid_targets_mean": 3886.1, "valid_targets_min": 1986 }, { "epoch": 4.58752, "grad_norm": 0.0014442282222083972, "learning_rate": 8.280830128815953e-07, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 4.140436794841662e-05, "step": 4780, "valid_targets_mean": 2852.9, "valid_targets_min": 1601 }, { "epoch": 4.59232, "grad_norm": 0.0013335062943690265, "learning_rate": 8.09111255880246e-07, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 2.9172715585445985e-05, "step": 4785, "valid_targets_mean": 4712.3, "valid_targets_min": 1933 }, { "epoch": 4.59712, "grad_norm": 0.0016073643552779076, "learning_rate": 7.903548633059955e-07, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 2.3097250959835947e-05, "step": 4790, "valid_targets_mean": 3657.0, "valid_targets_min": 2162 }, { "epoch": 4.60192, "grad_norm": 0.0014311250739149058, "learning_rate": 7.718140456472612e-07, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.254737384850159e-05, "step": 4795, "valid_targets_mean": 3186.6, "valid_targets_min": 1857 }, { "epoch": 4.60672, "grad_norm": 0.0014720511963264634, "learning_rate": 7.534890109732229e-07, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.767356975004077e-05, "step": 4800, "valid_targets_mean": 4191.3, "valid_targets_min": 1986 }, { "epoch": 4.61152, "grad_norm": 0.0011422497608168177, "learning_rate": 7.353799649315085e-07, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 2.191369640058838e-05, "step": 4805, "valid_targets_mean": 5858.8, "valid_targets_min": 2177 }, { "epoch": 4.61632, "grad_norm": 0.0015142999837969848, "learning_rate": 7.174871107458603e-07, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.843754166155122e-05, "step": 4810, "valid_targets_mean": 4474.0, "valid_targets_min": 1889 }, { "epoch": 4.62112, "grad_norm": 0.0012380465021728157, "learning_rate": 6.998106492138724e-07, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.2066651328932494e-05, "step": 4815, "valid_targets_mean": 3932.0, "valid_targets_min": 2020 }, { "epoch": 4.62592, "grad_norm": 0.0013493062176373246, "learning_rate": 6.823507787047346e-07, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 2.646211942192167e-05, "step": 4820, "valid_targets_mean": 3945.9, "valid_targets_min": 1525 }, { "epoch": 4.63072, "grad_norm": 0.0013500247168241138, "learning_rate": 6.65107695156999e-07, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.864829341182485e-05, "step": 4825, "valid_targets_mean": 3249.5, "valid_targets_min": 2026 }, { "epoch": 4.63552, "grad_norm": 0.0016728963895163553, "learning_rate": 6.480815920763905e-07, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 4.096078919246793e-05, "step": 4830, "valid_targets_mean": 2811.6, "valid_targets_min": 1680 }, { "epoch": 4.64032, "grad_norm": 0.0013007674582857596, "learning_rate": 6.312726605336306e-07, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 4.305595939513296e-05, "step": 4835, "valid_targets_mean": 3727.9, "valid_targets_min": 1763 }, { "epoch": 4.64512, "grad_norm": 0.001246805819895664, "learning_rate": 6.146810891622923e-07, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.767627276829444e-05, "step": 4840, "valid_targets_mean": 4590.0, "valid_targets_min": 1786 }, { "epoch": 4.64992, "grad_norm": 0.0015306984235042263, "learning_rate": 5.983070641566802e-07, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 4.872297722613439e-05, "step": 4845, "valid_targets_mean": 3660.3, "valid_targets_min": 1909 }, { "epoch": 4.65472, "grad_norm": 0.0013636211473654518, "learning_rate": 5.821507692697537e-07, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.59952864528168e-05, "step": 4850, "valid_targets_mean": 4783.3, "valid_targets_min": 1929 }, { "epoch": 4.65952, "grad_norm": 0.001214169634631268, "learning_rate": 5.662123858110513e-07, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.457337152212858e-05, "step": 4855, "valid_targets_mean": 4948.0, "valid_targets_min": 1981 }, { "epoch": 4.66432, "grad_norm": 0.0013015007668589714, "learning_rate": 5.504920926446611e-07, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 1.846073428168893e-05, "step": 4860, "valid_targets_mean": 4190.8, "valid_targets_min": 2241 }, { "epoch": 4.66912, "grad_norm": 0.0017585809273893223, "learning_rate": 5.349900661872132e-07, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.999376349383965e-05, "step": 4865, "valid_targets_mean": 3302.1, "valid_targets_min": 1940 }, { "epoch": 4.67392, "grad_norm": 0.0014018105059137838, "learning_rate": 5.197064804058971e-07, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.753218334168196e-05, "step": 4870, "valid_targets_mean": 3569.1, "valid_targets_min": 1868 }, { "epoch": 4.67872, "grad_norm": 0.001411049154838511, "learning_rate": 5.046415068165234e-07, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 4.0762810385786e-05, "step": 4875, "valid_targets_mean": 4144.9, "valid_targets_min": 1838 }, { "epoch": 4.68352, "grad_norm": 0.0012325440682396773, "learning_rate": 4.897953144815759e-07, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 4.6161636419128627e-05, "step": 4880, "valid_targets_mean": 4015.3, "valid_targets_min": 1884 }, { "epoch": 4.68832, "grad_norm": 0.001081422749527924, "learning_rate": 4.7516807000833165e-07, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 2.977273652504664e-05, "step": 4885, "valid_targets_mean": 5051.3, "valid_targets_min": 2148 }, { "epoch": 4.69312, "grad_norm": 0.0013326312566954472, "learning_rate": 4.6075993754698623e-07, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.299923992017284e-05, "step": 4890, "valid_targets_mean": 3795.8, "valid_targets_min": 1930 }, { "epoch": 4.69792, "grad_norm": 0.0010834549302240677, "learning_rate": 4.4657107878881113e-07, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.9331695006694645e-05, "step": 4895, "valid_targets_mean": 4620.5, "valid_targets_min": 1940 }, { "epoch": 4.70272, "grad_norm": 0.0009505343422854887, "learning_rate": 4.326016529643351e-07, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 2.737485192483291e-05, "step": 4900, "valid_targets_mean": 5942.9, "valid_targets_min": 1991 }, { "epoch": 4.70752, "grad_norm": 0.0012846898025216246, "learning_rate": 4.1885181684157005e-07, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.654539614217356e-05, "step": 4905, "valid_targets_mean": 3363.9, "valid_targets_min": 1917 }, { "epoch": 4.71232, "grad_norm": 0.0015367895661445351, "learning_rate": 4.053217247242369e-07, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 4.137801442993805e-05, "step": 4910, "valid_targets_mean": 3513.6, "valid_targets_min": 1727 }, { "epoch": 4.7171199999999995, "grad_norm": 0.0015445627771844294, "learning_rate": 3.9201152845004476e-07, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 2.674181087058969e-05, "step": 4915, "valid_targets_mean": 3224.1, "valid_targets_min": 1924 }, { "epoch": 4.72192, "grad_norm": 0.0015343846128040427, "learning_rate": 3.789213773889744e-07, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.526258660713211e-05, "step": 4920, "valid_targets_mean": 2999.2, "valid_targets_min": 1727 }, { "epoch": 4.72672, "grad_norm": 0.001325208866112591, "learning_rate": 3.6605141844162417e-07, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.196104444214143e-05, "step": 4925, "valid_targets_mean": 4132.0, "valid_targets_min": 1912 }, { "epoch": 4.73152, "grad_norm": 0.0018118681699326824, "learning_rate": 3.5340179603753354e-07, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.0053150112507865e-05, "step": 4930, "valid_targets_mean": 3962.4, "valid_targets_min": 1887 }, { "epoch": 4.73632, "grad_norm": 0.0008082094400929223, "learning_rate": 3.4097265213358435e-07, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 1.9822517060674727e-05, "step": 4935, "valid_targets_mean": 4209.6, "valid_targets_min": 1951 }, { "epoch": 4.7411200000000004, "grad_norm": 0.0013943033363122907, "learning_rate": 3.287641262123975e-07, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.594924055505544e-05, "step": 4940, "valid_targets_mean": 3413.5, "valid_targets_min": 1614 }, { "epoch": 4.74592, "grad_norm": 0.0012017603675163208, "learning_rate": 3.1677635528076566e-07, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 2.850576493074186e-05, "step": 4945, "valid_targets_mean": 4258.0, "valid_targets_min": 1917 }, { "epoch": 4.75072, "grad_norm": 0.0014305722242892265, "learning_rate": 3.0500947386812973e-07, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.7447800423251465e-05, "step": 4950, "valid_targets_mean": 4027.3, "valid_targets_min": 1925 }, { "epoch": 4.75552, "grad_norm": 0.0010461845264905828, "learning_rate": 2.934636140250513e-07, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.5297613067086786e-05, "step": 4955, "valid_targets_mean": 4322.1, "valid_targets_min": 1836 }, { "epoch": 4.76032, "grad_norm": 0.001185201140045603, "learning_rate": 2.821389053217383e-07, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 2.970770583488047e-05, "step": 4960, "valid_targets_mean": 4760.2, "valid_targets_min": 1917 }, { "epoch": 4.76512, "grad_norm": 0.0011274151535639705, "learning_rate": 2.710354748465949e-07, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 2.792166924336925e-05, "step": 4965, "valid_targets_mean": 3010.6, "valid_targets_min": 1802 }, { "epoch": 4.76992, "grad_norm": 0.0015942705739524197, "learning_rate": 2.6015344720479395e-07, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 4.446161619853228e-05, "step": 4970, "valid_targets_mean": 3951.6, "valid_targets_min": 1908 }, { "epoch": 4.77472, "grad_norm": 0.0011431533238156495, "learning_rate": 2.49492944516867e-07, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.62203354598023e-05, "step": 4975, "valid_targets_mean": 4022.9, "valid_targets_min": 1991 }, { "epoch": 4.77952, "grad_norm": 0.0013344896167050537, "learning_rate": 2.3905408641735183e-07, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 4.3846070184372365e-05, "step": 4980, "valid_targets_mean": 2981.7, "valid_targets_min": 1764 }, { "epoch": 4.78432, "grad_norm": 0.0011469415623424919, "learning_rate": 2.288369900534404e-07, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.583916986826807e-05, "step": 4985, "valid_targets_mean": 4020.9, "valid_targets_min": 1614 }, { "epoch": 4.7891200000000005, "grad_norm": 0.0015332867881165636, "learning_rate": 2.1884177008366203e-07, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 4.023212022730149e-05, "step": 4990, "valid_targets_mean": 3641.2, "valid_targets_min": 1992 }, { "epoch": 4.79392, "grad_norm": 0.0015958107058125627, "learning_rate": 2.0906853867660004e-07, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 4.5333177695283666e-05, "step": 4995, "valid_targets_mean": 3073.5, "valid_targets_min": 1833 }, { "epoch": 4.79872, "grad_norm": 0.0014088920318571542, "learning_rate": 1.9951740550963493e-07, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.387499236850999e-05, "step": 5000, "valid_targets_mean": 3618.2, "valid_targets_min": 1863 }, { "epoch": 4.80352, "grad_norm": 0.001382017022764611, "learning_rate": 1.9018847776770987e-07, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 2.965832391055301e-05, "step": 5005, "valid_targets_mean": 3913.4, "valid_targets_min": 1680 }, { "epoch": 4.80832, "grad_norm": 0.0009667895381881995, "learning_rate": 1.8108186014212935e-07, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.5687706258613616e-05, "step": 5010, "valid_targets_mean": 3918.7, "valid_targets_min": 1984 }, { "epoch": 4.81312, "grad_norm": 0.001125905574920971, "learning_rate": 1.7219765482938465e-07, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.900204683304764e-05, "step": 5015, "valid_targets_mean": 3905.2, "valid_targets_min": 1614 }, { "epoch": 4.81792, "grad_norm": 0.001735614405714739, "learning_rate": 1.635359615300036e-07, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.774373180931434e-05, "step": 5020, "valid_targets_mean": 3537.9, "valid_targets_min": 2020 }, { "epoch": 4.82272, "grad_norm": 0.00135684272286996, "learning_rate": 1.5509687744744262e-07, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.51240742020309e-05, "step": 5025, "valid_targets_mean": 3842.5, "valid_targets_min": 2001 }, { "epoch": 4.82752, "grad_norm": 0.0014588129404354, "learning_rate": 1.468804972869786e-07, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.749809548025951e-05, "step": 5030, "valid_targets_mean": 4380.7, "valid_targets_min": 1829 }, { "epoch": 4.83232, "grad_norm": 0.0011513349659320153, "learning_rate": 1.3888691325465886e-07, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 2.5042725610546768e-05, "step": 5035, "valid_targets_mean": 4936.8, "valid_targets_min": 1838 }, { "epoch": 4.83712, "grad_norm": 0.0014964758267286004, "learning_rate": 1.3111621505626616e-07, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.30040929839015e-05, "step": 5040, "valid_targets_mean": 3460.6, "valid_targets_min": 1836 }, { "epoch": 4.84192, "grad_norm": 0.0017164816439846106, "learning_rate": 1.235684898963041e-07, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 4.070202703587711e-05, "step": 5045, "valid_targets_mean": 3200.8, "valid_targets_min": 1680 }, { "epoch": 4.84672, "grad_norm": 0.0015533880396124476, "learning_rate": 1.1624382247702681e-07, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.0546980269718915e-05, "step": 5050, "valid_targets_mean": 3411.6, "valid_targets_min": 1719 }, { "epoch": 4.85152, "grad_norm": 0.0010019739894339837, "learning_rate": 1.0914229499748186e-07, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 2.7109126676805317e-05, "step": 5055, "valid_targets_mean": 4662.9, "valid_targets_min": 1918 }, { "epoch": 4.85632, "grad_norm": 0.0012845399103813841, "learning_rate": 1.0226398715259322e-07, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 4.92291510454379e-05, "step": 5060, "valid_targets_mean": 3564.8, "valid_targets_min": 1829 }, { "epoch": 4.86112, "grad_norm": 0.0011385205570641132, "learning_rate": 9.560897613226205e-08, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.4021744795609266e-05, "step": 5065, "valid_targets_mean": 4878.3, "valid_targets_min": 2041 }, { "epoch": 4.86592, "grad_norm": 0.0012616009743158724, "learning_rate": 8.917733662050287e-08, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.472245953162201e-05, "step": 5070, "valid_targets_mean": 5015.9, "valid_targets_min": 1921 }, { "epoch": 4.87072, "grad_norm": 0.001155635403330904, "learning_rate": 8.296914079461094e-08, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 2.9761726182186976e-05, "step": 5075, "valid_targets_mean": 5231.2, "valid_targets_min": 1839 }, { "epoch": 4.87552, "grad_norm": 0.0013659832914605808, "learning_rate": 7.698445832433843e-08, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.441186709096655e-05, "step": 5080, "valid_targets_mean": 4165.3, "valid_targets_min": 1877 }, { "epoch": 4.88032, "grad_norm": 0.0012340347205992707, "learning_rate": 7.122335637112621e-08, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 4.069916030857712e-05, "step": 5085, "valid_targets_mean": 4010.7, "valid_targets_min": 1751 }, { "epoch": 4.88512, "grad_norm": 0.001273691882930067, "learning_rate": 6.568589958734218e-08, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.6386449210112914e-05, "step": 5090, "valid_targets_mean": 3385.9, "valid_targets_min": 1857 }, { "epoch": 4.88992, "grad_norm": 0.001393496913272501, "learning_rate": 6.037215011556185e-08, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 4.061328218085691e-05, "step": 5095, "valid_targets_mean": 4302.8, "valid_targets_min": 1938 }, { "epoch": 4.8947199999999995, "grad_norm": 0.0013498594145078644, "learning_rate": 5.5282167587862314e-08, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.7743702705483884e-05, "step": 5100, "valid_targets_mean": 4179.5, "valid_targets_min": 2008 }, { "epoch": 4.89952, "grad_norm": 0.0014143037065501012, "learning_rate": 5.041600912516264e-08, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 4.063945380039513e-05, "step": 5105, "valid_targets_mean": 3860.1, "valid_targets_min": 1836 }, { "epoch": 4.90432, "grad_norm": 0.0014140500655952196, "learning_rate": 4.5773729336577865e-08, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.08784656226635e-05, "step": 5110, "valid_targets_mean": 3286.4, "valid_targets_min": 2030 }, { "epoch": 4.90912, "grad_norm": 0.0017234645985855681, "learning_rate": 4.1355380318803816e-08, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 4.182319753454067e-05, "step": 5115, "valid_targets_mean": 3396.9, "valid_targets_min": 1601 }, { "epoch": 4.91392, "grad_norm": 0.0011229129262111707, "learning_rate": 3.7161011655535425e-08, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.045425000891555e-05, "step": 5120, "valid_targets_mean": 3276.5, "valid_targets_min": 1914 }, { "epoch": 4.91872, "grad_norm": 0.001192187863420458, "learning_rate": 3.319067041691604e-08, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 2.9014812753302976e-05, "step": 5125, "valid_targets_mean": 3593.7, "valid_targets_min": 1763 }, { "epoch": 4.92352, "grad_norm": 0.0015182017551724832, "learning_rate": 2.9444401158995606e-08, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.1434181437361985e-05, "step": 5130, "valid_targets_mean": 2530.2, "valid_targets_min": 1993 }, { "epoch": 4.92832, "grad_norm": 0.0011932741963916822, "learning_rate": 2.5922245923244436e-08, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 4.078323399880901e-05, "step": 5135, "valid_targets_mean": 3796.1, "valid_targets_min": 1976 }, { "epoch": 4.93312, "grad_norm": 0.001550202425571585, "learning_rate": 2.2624244236071348e-08, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 5.0727601774269715e-05, "step": 5140, "valid_targets_mean": 3348.7, "valid_targets_min": 1829 }, { "epoch": 4.93792, "grad_norm": 0.0013292556967572553, "learning_rate": 1.9550433108384005e-08, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.335079236421734e-05, "step": 5145, "valid_targets_mean": 3704.0, "valid_targets_min": 1877 }, { "epoch": 4.94272, "grad_norm": 0.0014035126325946453, "learning_rate": 1.6700847035180378e-08, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 2.1342160835047252e-05, "step": 5150, "valid_targets_mean": 4230.9, "valid_targets_min": 1786 }, { "epoch": 4.94752, "grad_norm": 0.0014310478819625216, "learning_rate": 1.4075517995146837e-08, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.299306990811601e-05, "step": 5155, "valid_targets_mean": 4439.9, "valid_targets_min": 1949 }, { "epoch": 4.95232, "grad_norm": 0.0015978203559360326, "learning_rate": 1.167447545031175e-08, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.916247806046158e-05, "step": 5160, "valid_targets_mean": 3008.0, "valid_targets_min": 2091 }, { "epoch": 4.95712, "grad_norm": 0.0011164404550244923, "learning_rate": 9.497746345705772e-09, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.2907188142417e-05, "step": 5165, "valid_targets_mean": 4431.3, "valid_targets_min": 1705 }, { "epoch": 4.96192, "grad_norm": 0.0012503279471786264, "learning_rate": 7.545355109073172e-09, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 2.4081882656901143e-05, "step": 5170, "valid_targets_mean": 3681.2, "valid_targets_min": 1727 }, { "epoch": 4.9667200000000005, "grad_norm": 0.001375435267226282, "learning_rate": 5.817323650578743e-09, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 4.076618643011898e-05, "step": 5175, "valid_targets_mean": 3616.1, "valid_targets_min": 2113 }, { "epoch": 4.97152, "grad_norm": 0.0016537587168405621, "learning_rate": 4.313671362576877e-09, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 4.502938827499747e-05, "step": 5180, "valid_targets_mean": 2839.1, "valid_targets_min": 1705 }, { "epoch": 4.97632, "grad_norm": 0.0016762299883309327, "learning_rate": 3.0344151193917316e-09, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 4.7856032324489206e-05, "step": 5185, "valid_targets_mean": 3107.3, "valid_targets_min": 1919 }, { "epoch": 4.98112, "grad_norm": 0.0021278546575005703, "learning_rate": 1.979569277117399e-09, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.744456626009196e-05, "step": 5190, "valid_targets_mean": 3881.2, "valid_targets_min": 2103 }, { "epoch": 4.98592, "grad_norm": 0.00150027232141985, "learning_rate": 1.1491456734713524e-09, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 3.7057245208416134e-05, "step": 5195, "valid_targets_mean": 3717.0, "valid_targets_min": 1838 }, { "epoch": 4.99072, "grad_norm": 0.0010896481788440953, "learning_rate": 5.431536276523375e-10, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 2.905803376052063e-05, "step": 5200, "valid_targets_mean": 4881.5, "valid_targets_min": 1900 }, { "epoch": 4.99552, "grad_norm": 0.001501183108511998, "learning_rate": 1.6159994023601245e-10, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 4.9408565246267244e-05, "step": 5205, "valid_targets_mean": 3176.6, "valid_targets_min": 1952 }, { "epoch": 5.0, "grad_norm": 0.0016249555548919574, "learning_rate": 4.488893106113779e-12, "loss": 0.0001, "loss_nan_ranks": 0, "loss_rank_avg": 5.124273229739629e-05, "step": 5210, "valid_targets_mean": 3937.9, "valid_targets_min": 1868 }, { "epoch": 5.0, "step": 5210, "total_flos": 6.749812417674346e+18, "train_loss": 0.0, "train_runtime": 1.2275, "train_samples_per_second": 407324.551, "train_steps_per_second": 4244.322 } ], "logging_steps": 5, "max_steps": 5210, "num_input_tokens_seen": 0, "num_train_epochs": 5, "save_steps": 300, "stateful_callbacks": { "TrainerControl": { "args": { "should_epoch_stop": false, "should_evaluate": false, "should_log": false, "should_save": true, "should_training_stop": true }, "attributes": {} } }, "total_flos": 6.749812417674346e+18, "train_batch_size": 1, "trial_name": null, "trial_params": null }