Files
r2egym-100000-opt100k__Qwen…/trainer_state.json
ModelHub XC 7d865d342f 初始化项目,由ModelHub XC社区提供模型
Model: laion/r2egym-100000-opt100k__Qwen3-8B
Source: Original Platform
2026-04-18 20:49:39 +08:00

11506 lines
314 KiB
JSON

{
"best_global_step": null,
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 5.0,
"eval_steps": 500,
"global_step": 5210,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.0048,
"grad_norm": 6.937965654420425,
"learning_rate": 3.071017274472169e-07,
"loss": 0.3626,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11469614505767822,
"step": 5,
"valid_targets_mean": 3499.5,
"valid_targets_min": 1863
},
{
"epoch": 0.0096,
"grad_norm": 6.5863821052475515,
"learning_rate": 6.909788867562381e-07,
"loss": 0.3637,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12012797594070435,
"step": 10,
"valid_targets_mean": 3721.8,
"valid_targets_min": 1764
},
{
"epoch": 0.0144,
"grad_norm": 5.343535940478726,
"learning_rate": 1.074856046065259e-06,
"loss": 0.3676,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12584523856639862,
"step": 15,
"valid_targets_mean": 3173.9,
"valid_targets_min": 1727
},
{
"epoch": 0.0192,
"grad_norm": 2.3671652084368016,
"learning_rate": 1.4587332053742803e-06,
"loss": 0.3302,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09593678265810013,
"step": 20,
"valid_targets_mean": 4235.9,
"valid_targets_min": 1930
},
{
"epoch": 0.024,
"grad_norm": 1.5821432353896931,
"learning_rate": 1.8426103646833015e-06,
"loss": 0.2912,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0928233414888382,
"step": 25,
"valid_targets_mean": 3918.5,
"valid_targets_min": 2012
},
{
"epoch": 0.0288,
"grad_norm": 1.0466260829406362,
"learning_rate": 2.2264875239923228e-06,
"loss": 0.2782,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09647513926029205,
"step": 30,
"valid_targets_mean": 3579.7,
"valid_targets_min": 1909
},
{
"epoch": 0.0336,
"grad_norm": 0.7301653193288717,
"learning_rate": 2.6103646833013433e-06,
"loss": 0.245,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09100286662578583,
"step": 35,
"valid_targets_mean": 3455.0,
"valid_targets_min": 2080
},
{
"epoch": 0.0384,
"grad_norm": 0.5634397105921576,
"learning_rate": 2.9942418426103648e-06,
"loss": 0.2262,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06531375646591187,
"step": 40,
"valid_targets_mean": 2997.9,
"valid_targets_min": 1907
},
{
"epoch": 0.0432,
"grad_norm": 0.3771989155832216,
"learning_rate": 3.378119001919386e-06,
"loss": 0.2129,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05960608273744583,
"step": 45,
"valid_targets_mean": 3948.8,
"valid_targets_min": 1863
},
{
"epoch": 0.048,
"grad_norm": 0.2913641430638286,
"learning_rate": 3.761996161228407e-06,
"loss": 0.1732,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05882091447710991,
"step": 50,
"valid_targets_mean": 4149.5,
"valid_targets_min": 2046
},
{
"epoch": 0.0528,
"grad_norm": 0.2153147490996494,
"learning_rate": 4.145873320537428e-06,
"loss": 0.1796,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04906277358531952,
"step": 55,
"valid_targets_mean": 4259.8,
"valid_targets_min": 1940
},
{
"epoch": 0.0576,
"grad_norm": 0.20723734858542475,
"learning_rate": 4.52975047984645e-06,
"loss": 0.1573,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.050851885229349136,
"step": 60,
"valid_targets_mean": 3494.0,
"valid_targets_min": 2009
},
{
"epoch": 0.0624,
"grad_norm": 0.17986844485497974,
"learning_rate": 4.91362763915547e-06,
"loss": 0.1531,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.048392847180366516,
"step": 65,
"valid_targets_mean": 4253.8,
"valid_targets_min": 1937
},
{
"epoch": 0.0672,
"grad_norm": 0.17301691819215223,
"learning_rate": 5.297504798464492e-06,
"loss": 0.1492,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.046146441251039505,
"step": 70,
"valid_targets_mean": 3649.2,
"valid_targets_min": 1939
},
{
"epoch": 0.072,
"grad_norm": 0.16766105949933824,
"learning_rate": 5.681381957773513e-06,
"loss": 0.1422,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04667827486991882,
"step": 75,
"valid_targets_mean": 3832.0,
"valid_targets_min": 1995
},
{
"epoch": 0.0768,
"grad_norm": 0.19338450140560143,
"learning_rate": 6.065259117082534e-06,
"loss": 0.1347,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.045901913195848465,
"step": 80,
"valid_targets_mean": 3223.5,
"valid_targets_min": 1930
},
{
"epoch": 0.0816,
"grad_norm": 0.163903129334992,
"learning_rate": 6.449136276391556e-06,
"loss": 0.1359,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03836950659751892,
"step": 85,
"valid_targets_mean": 4337.8,
"valid_targets_min": 1716
},
{
"epoch": 0.0864,
"grad_norm": 0.1732436888952196,
"learning_rate": 6.833013435700576e-06,
"loss": 0.1319,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04401613771915436,
"step": 90,
"valid_targets_mean": 4111.6,
"valid_targets_min": 1857
},
{
"epoch": 0.0912,
"grad_norm": 0.19082139608668852,
"learning_rate": 7.216890595009598e-06,
"loss": 0.1259,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03892116993665695,
"step": 95,
"valid_targets_mean": 2942.4,
"valid_targets_min": 1977
},
{
"epoch": 0.096,
"grad_norm": 0.17638352231994248,
"learning_rate": 7.600767754318619e-06,
"loss": 0.1247,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0390937514603138,
"step": 100,
"valid_targets_mean": 3591.5,
"valid_targets_min": 1680
},
{
"epoch": 0.1008,
"grad_norm": 0.1944525138076534,
"learning_rate": 7.98464491362764e-06,
"loss": 0.1245,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.048598822206258774,
"step": 105,
"valid_targets_mean": 3481.1,
"valid_targets_min": 1868
},
{
"epoch": 0.1056,
"grad_norm": 0.22035770940213192,
"learning_rate": 8.368522072936662e-06,
"loss": 0.117,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.039973922073841095,
"step": 110,
"valid_targets_mean": 3435.9,
"valid_targets_min": 2010
},
{
"epoch": 0.1104,
"grad_norm": 0.18001026275208665,
"learning_rate": 8.752399232245682e-06,
"loss": 0.1129,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03717381879687309,
"step": 115,
"valid_targets_mean": 3578.4,
"valid_targets_min": 1929
},
{
"epoch": 0.1152,
"grad_norm": 0.20166628598885344,
"learning_rate": 9.136276391554704e-06,
"loss": 0.1142,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.034547075629234314,
"step": 120,
"valid_targets_mean": 3295.2,
"valid_targets_min": 1662
},
{
"epoch": 0.12,
"grad_norm": 0.19167865931651773,
"learning_rate": 9.520153550863724e-06,
"loss": 0.1086,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03747241944074631,
"step": 125,
"valid_targets_mean": 4539.3,
"valid_targets_min": 1847
},
{
"epoch": 0.1248,
"grad_norm": 0.19148980089840842,
"learning_rate": 9.904030710172746e-06,
"loss": 0.1036,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03533416986465454,
"step": 130,
"valid_targets_mean": 3445.7,
"valid_targets_min": 1709
},
{
"epoch": 0.1296,
"grad_norm": 0.21821353960131265,
"learning_rate": 1.0287907869481766e-05,
"loss": 0.1072,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03997855633497238,
"step": 135,
"valid_targets_mean": 3530.8,
"valid_targets_min": 2027
},
{
"epoch": 0.1344,
"grad_norm": 0.23048953683917786,
"learning_rate": 1.067178502879079e-05,
"loss": 0.1059,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03685012459754944,
"step": 140,
"valid_targets_mean": 3553.0,
"valid_targets_min": 1820
},
{
"epoch": 0.1392,
"grad_norm": 0.23561676819347502,
"learning_rate": 1.105566218809981e-05,
"loss": 0.1037,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.033116281032562256,
"step": 145,
"valid_targets_mean": 3572.2,
"valid_targets_min": 2180
},
{
"epoch": 0.144,
"grad_norm": 0.18410766236895754,
"learning_rate": 1.143953934740883e-05,
"loss": 0.0944,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02970690280199051,
"step": 150,
"valid_targets_mean": 4146.3,
"valid_targets_min": 1719
},
{
"epoch": 0.1488,
"grad_norm": 0.18049019085906956,
"learning_rate": 1.182341650671785e-05,
"loss": 0.0973,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.029041530564427376,
"step": 155,
"valid_targets_mean": 3589.8,
"valid_targets_min": 1863
},
{
"epoch": 0.1536,
"grad_norm": 0.23489464884439978,
"learning_rate": 1.2207293666026872e-05,
"loss": 0.0924,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03265086188912392,
"step": 160,
"valid_targets_mean": 3268.7,
"valid_targets_min": 1847
},
{
"epoch": 0.1584,
"grad_norm": 0.19835583785764463,
"learning_rate": 1.2591170825335894e-05,
"loss": 0.0887,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.029566409066319466,
"step": 165,
"valid_targets_mean": 4323.8,
"valid_targets_min": 1974
},
{
"epoch": 0.1632,
"grad_norm": 0.24846365725039307,
"learning_rate": 1.2975047984644915e-05,
"loss": 0.0867,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0281932782381773,
"step": 170,
"valid_targets_mean": 4207.3,
"valid_targets_min": 2087
},
{
"epoch": 0.168,
"grad_norm": 0.22919583334361535,
"learning_rate": 1.3358925143953936e-05,
"loss": 0.0853,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02949838899075985,
"step": 175,
"valid_targets_mean": 3960.9,
"valid_targets_min": 1857
},
{
"epoch": 0.1728,
"grad_norm": 0.27434533496042574,
"learning_rate": 1.3742802303262956e-05,
"loss": 0.0821,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02647317200899124,
"step": 180,
"valid_targets_mean": 3963.9,
"valid_targets_min": 2022
},
{
"epoch": 0.1776,
"grad_norm": 0.2554410371258365,
"learning_rate": 1.4126679462571978e-05,
"loss": 0.0797,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.028740808367729187,
"step": 185,
"valid_targets_mean": 3598.1,
"valid_targets_min": 1970
},
{
"epoch": 0.1824,
"grad_norm": 0.22965813069707355,
"learning_rate": 1.4510556621881e-05,
"loss": 0.0755,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.022127017378807068,
"step": 190,
"valid_targets_mean": 4289.5,
"valid_targets_min": 1764
},
{
"epoch": 0.1872,
"grad_norm": 0.2288532296930469,
"learning_rate": 1.4894433781190021e-05,
"loss": 0.0723,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02306653931736946,
"step": 195,
"valid_targets_mean": 4330.4,
"valid_targets_min": 1993
},
{
"epoch": 0.192,
"grad_norm": 0.27240454535637443,
"learning_rate": 1.527831094049904e-05,
"loss": 0.0712,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.025289515033364296,
"step": 200,
"valid_targets_mean": 2736.6,
"valid_targets_min": 1614
},
{
"epoch": 0.1968,
"grad_norm": 0.242681238840325,
"learning_rate": 1.566218809980806e-05,
"loss": 0.0697,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.024639660492539406,
"step": 205,
"valid_targets_mean": 4075.1,
"valid_targets_min": 2080
},
{
"epoch": 0.2016,
"grad_norm": 0.24849701794363202,
"learning_rate": 1.6046065259117082e-05,
"loss": 0.0645,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.01965644210577011,
"step": 210,
"valid_targets_mean": 3752.0,
"valid_targets_min": 1719
},
{
"epoch": 0.2064,
"grad_norm": 0.27241151966507293,
"learning_rate": 1.6429942418426105e-05,
"loss": 0.0602,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.01922878436744213,
"step": 215,
"valid_targets_mean": 3878.5,
"valid_targets_min": 1662
},
{
"epoch": 0.2112,
"grad_norm": 0.3082022682540152,
"learning_rate": 1.6813819577735126e-05,
"loss": 0.0607,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.019677884876728058,
"step": 220,
"valid_targets_mean": 3743.6,
"valid_targets_min": 2048
},
{
"epoch": 0.216,
"grad_norm": 0.3058526962109295,
"learning_rate": 1.7197696737044146e-05,
"loss": 0.0583,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02079184725880623,
"step": 225,
"valid_targets_mean": 3293.6,
"valid_targets_min": 1662
},
{
"epoch": 0.2208,
"grad_norm": 0.27962167396369564,
"learning_rate": 1.758157389635317e-05,
"loss": 0.0544,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.01946953497827053,
"step": 230,
"valid_targets_mean": 4708.4,
"valid_targets_min": 2046
},
{
"epoch": 0.2256,
"grad_norm": 0.28869191640978553,
"learning_rate": 1.796545105566219e-05,
"loss": 0.0519,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.01823297329246998,
"step": 235,
"valid_targets_mean": 3593.3,
"valid_targets_min": 2081
},
{
"epoch": 0.2304,
"grad_norm": 0.2898824996991812,
"learning_rate": 1.8349328214971213e-05,
"loss": 0.0499,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.016215849667787552,
"step": 240,
"valid_targets_mean": 4142.3,
"valid_targets_min": 2089
},
{
"epoch": 0.2352,
"grad_norm": 0.30149704768269103,
"learning_rate": 1.8733205374280233e-05,
"loss": 0.0509,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.01709664985537529,
"step": 245,
"valid_targets_mean": 3813.4,
"valid_targets_min": 1928
},
{
"epoch": 0.24,
"grad_norm": 0.2979272115801746,
"learning_rate": 1.9117082533589253e-05,
"loss": 0.0452,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.010545975528657436,
"step": 250,
"valid_targets_mean": 3071.1,
"valid_targets_min": 1877
},
{
"epoch": 0.2448,
"grad_norm": 0.3057707833669144,
"learning_rate": 1.9500959692898273e-05,
"loss": 0.0424,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.014655347913503647,
"step": 255,
"valid_targets_mean": 3741.1,
"valid_targets_min": 1763
},
{
"epoch": 0.2496,
"grad_norm": 0.2995200667585905,
"learning_rate": 1.9884836852207294e-05,
"loss": 0.0419,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.01323431171476841,
"step": 260,
"valid_targets_mean": 4534.5,
"valid_targets_min": 1889
},
{
"epoch": 0.2544,
"grad_norm": 0.3284439605360466,
"learning_rate": 2.0268714011516314e-05,
"loss": 0.038,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.013670418411493301,
"step": 265,
"valid_targets_mean": 3705.1,
"valid_targets_min": 1877
},
{
"epoch": 0.2592,
"grad_norm": 0.28351371383795076,
"learning_rate": 2.0652591170825337e-05,
"loss": 0.0364,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.010727550834417343,
"step": 270,
"valid_targets_mean": 3922.1,
"valid_targets_min": 1889
},
{
"epoch": 0.264,
"grad_norm": 0.3150839446969937,
"learning_rate": 2.103646833013436e-05,
"loss": 0.0342,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.011736005544662476,
"step": 275,
"valid_targets_mean": 3559.4,
"valid_targets_min": 1919
},
{
"epoch": 0.2688,
"grad_norm": 0.2806927089920171,
"learning_rate": 2.142034548944338e-05,
"loss": 0.0318,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.013169767335057259,
"step": 280,
"valid_targets_mean": 4125.0,
"valid_targets_min": 1952
},
{
"epoch": 0.2736,
"grad_norm": 0.2971395106031058,
"learning_rate": 2.18042226487524e-05,
"loss": 0.0338,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.009649878367781639,
"step": 285,
"valid_targets_mean": 3847.2,
"valid_targets_min": 1839
},
{
"epoch": 0.2784,
"grad_norm": 0.30462593223391954,
"learning_rate": 2.218809980806142e-05,
"loss": 0.0309,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.007476530969142914,
"step": 290,
"valid_targets_mean": 4701.7,
"valid_targets_min": 1802
},
{
"epoch": 0.2832,
"grad_norm": 0.30038151573422667,
"learning_rate": 2.2571976967370445e-05,
"loss": 0.0287,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.007295252755284309,
"step": 295,
"valid_targets_mean": 3913.3,
"valid_targets_min": 1799
},
{
"epoch": 0.288,
"grad_norm": 0.29158760056491095,
"learning_rate": 2.2955854126679465e-05,
"loss": 0.028,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.009111661463975906,
"step": 300,
"valid_targets_mean": 3851.0,
"valid_targets_min": 1952
},
{
"epoch": 0.2928,
"grad_norm": 0.29029858315528134,
"learning_rate": 2.3339731285988485e-05,
"loss": 0.0265,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00890104379504919,
"step": 305,
"valid_targets_mean": 3463.2,
"valid_targets_min": 1751
},
{
"epoch": 0.2976,
"grad_norm": 0.3432214228291009,
"learning_rate": 2.372360844529751e-05,
"loss": 0.0243,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.008902271278202534,
"step": 310,
"valid_targets_mean": 2587.8,
"valid_targets_min": 1917
},
{
"epoch": 0.3024,
"grad_norm": 0.2780773407000986,
"learning_rate": 2.4107485604606525e-05,
"loss": 0.0231,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00839188788086176,
"step": 315,
"valid_targets_mean": 3983.3,
"valid_targets_min": 1601
},
{
"epoch": 0.3072,
"grad_norm": 0.32885066035163374,
"learning_rate": 2.449136276391555e-05,
"loss": 0.0233,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.008772674016654491,
"step": 320,
"valid_targets_mean": 3652.5,
"valid_targets_min": 2008
},
{
"epoch": 0.312,
"grad_norm": 0.3055398782817974,
"learning_rate": 2.4875239923224573e-05,
"loss": 0.0233,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.009282301180064678,
"step": 325,
"valid_targets_mean": 4054.7,
"valid_targets_min": 1716
},
{
"epoch": 0.3168,
"grad_norm": 0.36149353916895155,
"learning_rate": 2.525911708253359e-05,
"loss": 0.0224,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.007749137934297323,
"step": 330,
"valid_targets_mean": 3019.2,
"valid_targets_min": 1939
},
{
"epoch": 0.3216,
"grad_norm": 0.3228633275486538,
"learning_rate": 2.5642994241842613e-05,
"loss": 0.0202,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.007192028686404228,
"step": 335,
"valid_targets_mean": 3837.0,
"valid_targets_min": 1760
},
{
"epoch": 0.3264,
"grad_norm": 0.25093922169727056,
"learning_rate": 2.6026871401151633e-05,
"loss": 0.0175,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00533191068097949,
"step": 340,
"valid_targets_mean": 3737.1,
"valid_targets_min": 1517
},
{
"epoch": 0.3312,
"grad_norm": 0.35279337813115486,
"learning_rate": 2.6410748560460657e-05,
"loss": 0.0175,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.007894867099821568,
"step": 345,
"valid_targets_mean": 3601.5,
"valid_targets_min": 1907
},
{
"epoch": 0.336,
"grad_norm": 0.26818158089815164,
"learning_rate": 2.6794625719769677e-05,
"loss": 0.0173,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.005505319684743881,
"step": 350,
"valid_targets_mean": 4927.9,
"valid_targets_min": 2030
},
{
"epoch": 0.3408,
"grad_norm": 0.2897950061058035,
"learning_rate": 2.7178502879078697e-05,
"loss": 0.0178,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.005148059222847223,
"step": 355,
"valid_targets_mean": 3249.0,
"valid_targets_min": 2031
},
{
"epoch": 0.3456,
"grad_norm": 0.29798905792631397,
"learning_rate": 2.756238003838772e-05,
"loss": 0.0175,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.005866318475455046,
"step": 360,
"valid_targets_mean": 3637.2,
"valid_targets_min": 2012
},
{
"epoch": 0.3504,
"grad_norm": 0.23388716919207966,
"learning_rate": 2.7946257197696737e-05,
"loss": 0.0157,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0034332945942878723,
"step": 365,
"valid_targets_mean": 3665.2,
"valid_targets_min": 1562
},
{
"epoch": 0.3552,
"grad_norm": 0.3144219799825524,
"learning_rate": 2.833013435700576e-05,
"loss": 0.0165,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.005330200307071209,
"step": 370,
"valid_targets_mean": 3714.6,
"valid_targets_min": 1918
},
{
"epoch": 0.36,
"grad_norm": 0.2347921761514834,
"learning_rate": 2.8714011516314784e-05,
"loss": 0.015,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0039110006764531136,
"step": 375,
"valid_targets_mean": 3327.7,
"valid_targets_min": 1764
},
{
"epoch": 0.3648,
"grad_norm": 0.2904804056955613,
"learning_rate": 2.90978886756238e-05,
"loss": 0.0151,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.005027526989579201,
"step": 380,
"valid_targets_mean": 3128.4,
"valid_targets_min": 1868
},
{
"epoch": 0.3696,
"grad_norm": 0.28700226054014716,
"learning_rate": 2.9481765834932825e-05,
"loss": 0.016,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.004024747759103775,
"step": 385,
"valid_targets_mean": 3588.8,
"valid_targets_min": 1601
},
{
"epoch": 0.3744,
"grad_norm": 0.26884448060402233,
"learning_rate": 2.9865642994241845e-05,
"loss": 0.0141,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.004564404953271151,
"step": 390,
"valid_targets_mean": 3236.8,
"valid_targets_min": 1900
},
{
"epoch": 0.3792,
"grad_norm": 0.24611041897462416,
"learning_rate": 3.0249520153550865e-05,
"loss": 0.0141,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.004304606467485428,
"step": 395,
"valid_targets_mean": 4403.7,
"valid_targets_min": 1709
},
{
"epoch": 0.384,
"grad_norm": 0.48825494706248906,
"learning_rate": 3.063339731285989e-05,
"loss": 0.012,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.004420734476298094,
"step": 400,
"valid_targets_mean": 3538.8,
"valid_targets_min": 1614
},
{
"epoch": 0.3888,
"grad_norm": 0.2792081008190513,
"learning_rate": 3.101727447216891e-05,
"loss": 0.0144,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.005862731486558914,
"step": 405,
"valid_targets_mean": 4681.7,
"valid_targets_min": 2091
},
{
"epoch": 0.3936,
"grad_norm": 0.30743113561108026,
"learning_rate": 3.140115163147793e-05,
"loss": 0.0142,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.006006536073982716,
"step": 410,
"valid_targets_mean": 4158.8,
"valid_targets_min": 1906
},
{
"epoch": 0.3984,
"grad_norm": 0.23617729705125162,
"learning_rate": 3.178502879078695e-05,
"loss": 0.0112,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0039299000054597855,
"step": 415,
"valid_targets_mean": 5437.2,
"valid_targets_min": 2126
},
{
"epoch": 0.4032,
"grad_norm": 0.24273874285561925,
"learning_rate": 3.216890595009597e-05,
"loss": 0.0121,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.002637755125761032,
"step": 420,
"valid_targets_mean": 4218.1,
"valid_targets_min": 1836
},
{
"epoch": 0.408,
"grad_norm": 0.2571274327476414,
"learning_rate": 3.2552783109404996e-05,
"loss": 0.0126,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.004715914838016033,
"step": 425,
"valid_targets_mean": 3939.8,
"valid_targets_min": 2195
},
{
"epoch": 0.4128,
"grad_norm": 0.2500933896104518,
"learning_rate": 3.2936660268714016e-05,
"loss": 0.0118,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0031941996421664953,
"step": 430,
"valid_targets_mean": 3576.3,
"valid_targets_min": 1705
},
{
"epoch": 0.4176,
"grad_norm": 0.22701352422866455,
"learning_rate": 3.3320537428023036e-05,
"loss": 0.0106,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.003280221950262785,
"step": 435,
"valid_targets_mean": 3586.2,
"valid_targets_min": 1942
},
{
"epoch": 0.4224,
"grad_norm": 0.2524861159968299,
"learning_rate": 3.3704414587332056e-05,
"loss": 0.0114,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.004017299972474575,
"step": 440,
"valid_targets_mean": 3009.8,
"valid_targets_min": 1952
},
{
"epoch": 0.4272,
"grad_norm": 0.22783228209467407,
"learning_rate": 3.4088291746641077e-05,
"loss": 0.0109,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.003924804739654064,
"step": 445,
"valid_targets_mean": 4031.3,
"valid_targets_min": 1906
},
{
"epoch": 0.432,
"grad_norm": 0.2675229581899117,
"learning_rate": 3.4472168905950104e-05,
"loss": 0.012,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0031715864315629005,
"step": 450,
"valid_targets_mean": 3449.6,
"valid_targets_min": 1942
},
{
"epoch": 0.4368,
"grad_norm": 0.22212296709946297,
"learning_rate": 3.485604606525912e-05,
"loss": 0.0109,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0034985882230103016,
"step": 455,
"valid_targets_mean": 4985.9,
"valid_targets_min": 1802
},
{
"epoch": 0.4416,
"grad_norm": 0.22671994440103954,
"learning_rate": 3.5239923224568144e-05,
"loss": 0.0101,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.003531843423843384,
"step": 460,
"valid_targets_mean": 4070.9,
"valid_targets_min": 2019
},
{
"epoch": 0.4464,
"grad_norm": 0.21948437480345728,
"learning_rate": 3.5623800383877164e-05,
"loss": 0.0101,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0022159013897180557,
"step": 465,
"valid_targets_mean": 4492.9,
"valid_targets_min": 1775
},
{
"epoch": 0.4512,
"grad_norm": 0.25220894753487705,
"learning_rate": 3.6007677543186184e-05,
"loss": 0.0107,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.003613119013607502,
"step": 470,
"valid_targets_mean": 3354.7,
"valid_targets_min": 1786
},
{
"epoch": 0.456,
"grad_norm": 0.2409715853264873,
"learning_rate": 3.6391554702495204e-05,
"loss": 0.0111,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00343118398450315,
"step": 475,
"valid_targets_mean": 3894.3,
"valid_targets_min": 1917
},
{
"epoch": 0.4608,
"grad_norm": 0.2170729540621222,
"learning_rate": 3.6775431861804224e-05,
"loss": 0.0092,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0030733980238437653,
"step": 480,
"valid_targets_mean": 4114.4,
"valid_targets_min": 1995
},
{
"epoch": 0.4656,
"grad_norm": 0.21068892921988389,
"learning_rate": 3.7159309021113245e-05,
"loss": 0.0096,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.003135197563096881,
"step": 485,
"valid_targets_mean": 3322.5,
"valid_targets_min": 1763
},
{
"epoch": 0.4704,
"grad_norm": 0.21972566727493456,
"learning_rate": 3.7543186180422265e-05,
"loss": 0.0094,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0030888905748724937,
"step": 490,
"valid_targets_mean": 3647.6,
"valid_targets_min": 1912
},
{
"epoch": 0.4752,
"grad_norm": 0.2442380917642565,
"learning_rate": 3.792706333973129e-05,
"loss": 0.0088,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0034611904993653297,
"step": 495,
"valid_targets_mean": 2969.6,
"valid_targets_min": 1933
},
{
"epoch": 0.48,
"grad_norm": 0.19420220971217322,
"learning_rate": 3.831094049904031e-05,
"loss": 0.0081,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.003016189206391573,
"step": 500,
"valid_targets_mean": 4435.8,
"valid_targets_min": 1900
},
{
"epoch": 0.4848,
"grad_norm": 0.22164558812400362,
"learning_rate": 3.869481765834933e-05,
"loss": 0.0092,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0032875773031264544,
"step": 505,
"valid_targets_mean": 4127.6,
"valid_targets_min": 1719
},
{
"epoch": 0.4896,
"grad_norm": 0.22374906160761918,
"learning_rate": 3.907869481765835e-05,
"loss": 0.0094,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.003515136195346713,
"step": 510,
"valid_targets_mean": 3748.6,
"valid_targets_min": 1991
},
{
"epoch": 0.4944,
"grad_norm": 0.23454630233428864,
"learning_rate": 3.946257197696737e-05,
"loss": 0.0089,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00364376581273973,
"step": 515,
"valid_targets_mean": 3213.7,
"valid_targets_min": 1870
},
{
"epoch": 0.4992,
"grad_norm": 0.21562525432252683,
"learning_rate": 3.984644913627639e-05,
"loss": 0.0099,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0031704031862318516,
"step": 520,
"valid_targets_mean": 4295.1,
"valid_targets_min": 1719
},
{
"epoch": 0.504,
"grad_norm": 0.19124689835472855,
"learning_rate": 3.999995959997414e-05,
"loss": 0.0086,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0025279440451413393,
"step": 525,
"valid_targets_mean": 4059.2,
"valid_targets_min": 1949
},
{
"epoch": 0.5088,
"grad_norm": 0.23017443414998648,
"learning_rate": 3.999971271151827e-05,
"loss": 0.0094,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00394061952829361,
"step": 530,
"valid_targets_mean": 3380.1,
"valid_targets_min": 1716
},
{
"epoch": 0.5136,
"grad_norm": 0.23319549902718553,
"learning_rate": 3.9999241381832614e-05,
"loss": 0.0083,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0036682155914604664,
"step": 535,
"valid_targets_mean": 4276.3,
"valid_targets_min": 1662
},
{
"epoch": 0.5184,
"grad_norm": 0.21660253159440473,
"learning_rate": 3.999854561620655e-05,
"loss": 0.0077,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0027715754695236683,
"step": 540,
"valid_targets_mean": 4977.5,
"valid_targets_min": 2008
},
{
"epoch": 0.5232,
"grad_norm": 0.19912853298801866,
"learning_rate": 3.9997625422448114e-05,
"loss": 0.0085,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0031935221049934626,
"step": 545,
"valid_targets_mean": 3682.2,
"valid_targets_min": 1887
},
{
"epoch": 0.528,
"grad_norm": 0.23896432906358125,
"learning_rate": 3.999648081088391e-05,
"loss": 0.0084,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0029742794577032328,
"step": 550,
"valid_targets_mean": 2679.8,
"valid_targets_min": 1361
},
{
"epoch": 0.5328,
"grad_norm": 0.1861883799280027,
"learning_rate": 3.999511179435905e-05,
"loss": 0.0081,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.003043075557798147,
"step": 555,
"valid_targets_mean": 4540.3,
"valid_targets_min": 1925
},
{
"epoch": 0.5376,
"grad_norm": 0.199027392427487,
"learning_rate": 3.999351838823691e-05,
"loss": 0.0073,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0025762999430298805,
"step": 560,
"valid_targets_mean": 3683.8,
"valid_targets_min": 1924
},
{
"epoch": 0.5424,
"grad_norm": 0.17389819697427045,
"learning_rate": 3.999170061039908e-05,
"loss": 0.0081,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0023557578679174185,
"step": 565,
"valid_targets_mean": 3989.9,
"valid_targets_min": 2056
},
{
"epoch": 0.5472,
"grad_norm": 0.2334228789161362,
"learning_rate": 3.998965848124505e-05,
"loss": 0.0078,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00438684830442071,
"step": 570,
"valid_targets_mean": 3362.2,
"valid_targets_min": 2027
},
{
"epoch": 0.552,
"grad_norm": 0.17945821748347074,
"learning_rate": 3.998739202369205e-05,
"loss": 0.0076,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.002859172411262989,
"step": 575,
"valid_targets_mean": 3952.9,
"valid_targets_min": 1924
},
{
"epoch": 0.5568,
"grad_norm": 0.18678690741356818,
"learning_rate": 3.998490126317477e-05,
"loss": 0.0071,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.002055731136351824,
"step": 580,
"valid_targets_mean": 3083.8,
"valid_targets_min": 1950
},
{
"epoch": 0.5616,
"grad_norm": 0.18250900877509713,
"learning_rate": 3.9982186227645085e-05,
"loss": 0.0065,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00249089440330863,
"step": 585,
"valid_targets_mean": 3829.1,
"valid_targets_min": 1829
},
{
"epoch": 0.5664,
"grad_norm": 0.25762748462961554,
"learning_rate": 3.9979246947571724e-05,
"loss": 0.0075,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00278734159655869,
"step": 590,
"valid_targets_mean": 3546.0,
"valid_targets_min": 1847
},
{
"epoch": 0.5712,
"grad_norm": 0.16262986702540477,
"learning_rate": 3.9976083455939945e-05,
"loss": 0.007,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0021733571775257587,
"step": 595,
"valid_targets_mean": 3765.6,
"valid_targets_min": 1820
},
{
"epoch": 0.576,
"grad_norm": 0.15646991186627635,
"learning_rate": 3.9972695788251155e-05,
"loss": 0.007,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0019335944671183825,
"step": 600,
"valid_targets_mean": 2733.1,
"valid_targets_min": 1948
},
{
"epoch": 0.5808,
"grad_norm": 0.1866634582185585,
"learning_rate": 3.996908398252251e-05,
"loss": 0.0067,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.002379871904850006,
"step": 605,
"valid_targets_mean": 3607.9,
"valid_targets_min": 1361
},
{
"epoch": 0.5856,
"grad_norm": 0.17961524657660505,
"learning_rate": 3.9965248079286505e-05,
"loss": 0.0065,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0021986260544508696,
"step": 610,
"valid_targets_mean": 3557.2,
"valid_targets_min": 1716
},
{
"epoch": 0.5904,
"grad_norm": 0.17270751315569516,
"learning_rate": 3.99611881215905e-05,
"loss": 0.0063,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.001944814925082028,
"step": 615,
"valid_targets_mean": 3441.6,
"valid_targets_min": 1652
},
{
"epoch": 0.5952,
"grad_norm": 0.16463245499969842,
"learning_rate": 3.995690415499624e-05,
"loss": 0.0061,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.002012577373534441,
"step": 620,
"valid_targets_mean": 4407.1,
"valid_targets_min": 1972
},
{
"epoch": 0.6,
"grad_norm": 0.1498606450916074,
"learning_rate": 3.995239622757936e-05,
"loss": 0.0059,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0020940229296684265,
"step": 625,
"valid_targets_mean": 3533.7,
"valid_targets_min": 1760
},
{
"epoch": 0.6048,
"grad_norm": 0.16182624313567134,
"learning_rate": 3.994766438992882e-05,
"loss": 0.0063,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.002139991382136941,
"step": 630,
"valid_targets_mean": 3479.1,
"valid_targets_min": 1727
},
{
"epoch": 0.6096,
"grad_norm": 0.16492253100569335,
"learning_rate": 3.994270869514635e-05,
"loss": 0.0061,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0020363912917673588,
"step": 635,
"valid_targets_mean": 3303.8,
"valid_targets_min": 1361
},
{
"epoch": 0.6144,
"grad_norm": 0.19146820633459416,
"learning_rate": 3.9937529198845864e-05,
"loss": 0.0057,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0017477039946243167,
"step": 640,
"valid_targets_mean": 4908.4,
"valid_targets_min": 1833
},
{
"epoch": 0.6192,
"grad_norm": 0.16755843461256645,
"learning_rate": 3.9932125959152833e-05,
"loss": 0.0051,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.001417946070432663,
"step": 645,
"valid_targets_mean": 3218.1,
"valid_targets_min": 1763
},
{
"epoch": 0.624,
"grad_norm": 0.1491212416818786,
"learning_rate": 3.9926499036703607e-05,
"loss": 0.0064,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0022455165162682533,
"step": 650,
"valid_targets_mean": 4048.8,
"valid_targets_min": 1930
},
{
"epoch": 0.6288,
"grad_norm": 0.17871275289420183,
"learning_rate": 3.992064849464476e-05,
"loss": 0.0056,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0021069804206490517,
"step": 655,
"valid_targets_mean": 3222.5,
"valid_targets_min": 1939
},
{
"epoch": 0.6336,
"grad_norm": 0.15026244145657655,
"learning_rate": 3.991457439863238e-05,
"loss": 0.0052,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0020846365951001644,
"step": 660,
"valid_targets_mean": 4101.5,
"valid_targets_min": 1802
},
{
"epoch": 0.6384,
"grad_norm": 0.15132033151846047,
"learning_rate": 3.990827681683133e-05,
"loss": 0.0054,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0013402425684034824,
"step": 665,
"valid_targets_mean": 4053.0,
"valid_targets_min": 2089
},
{
"epoch": 0.6432,
"grad_norm": 0.14291482930175778,
"learning_rate": 3.990175581991448e-05,
"loss": 0.0052,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.001968193333595991,
"step": 670,
"valid_targets_mean": 4646.0,
"valid_targets_min": 1716
},
{
"epoch": 0.648,
"grad_norm": 0.13205771498876573,
"learning_rate": 3.989501148106189e-05,
"loss": 0.005,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0014164431486278772,
"step": 675,
"valid_targets_mean": 4138.6,
"valid_targets_min": 1517
},
{
"epoch": 0.6528,
"grad_norm": 0.1454241022903471,
"learning_rate": 3.988804387596005e-05,
"loss": 0.0052,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0017517493106424809,
"step": 680,
"valid_targets_mean": 4377.7,
"valid_targets_min": 1925
},
{
"epoch": 0.6576,
"grad_norm": 0.15080631968356206,
"learning_rate": 3.9880853082800965e-05,
"loss": 0.0051,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.002116061747074127,
"step": 685,
"valid_targets_mean": 3755.3,
"valid_targets_min": 1909
},
{
"epoch": 0.6624,
"grad_norm": 0.1377601399723467,
"learning_rate": 3.987343918228133e-05,
"loss": 0.0049,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0015512771205976605,
"step": 690,
"valid_targets_mean": 3227.3,
"valid_targets_min": 1970
},
{
"epoch": 0.6672,
"grad_norm": 0.16894800757253736,
"learning_rate": 3.9865802257601584e-05,
"loss": 0.0051,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0015093731926754117,
"step": 695,
"valid_targets_mean": 3398.4,
"valid_targets_min": 2031
},
{
"epoch": 0.672,
"grad_norm": 0.13885441728364661,
"learning_rate": 3.9857942394464976e-05,
"loss": 0.005,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0017606966430321336,
"step": 700,
"valid_targets_mean": 3476.6,
"valid_targets_min": 1930
},
{
"epoch": 0.6768,
"grad_norm": 0.1338580199682233,
"learning_rate": 3.984985968107667e-05,
"loss": 0.0051,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.001561261946335435,
"step": 705,
"valid_targets_mean": 4040.5,
"valid_targets_min": 1913
},
{
"epoch": 0.6816,
"grad_norm": 0.1432672149680153,
"learning_rate": 3.984155420814266e-05,
"loss": 0.0047,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0013145990669727325,
"step": 710,
"valid_targets_mean": 4966.2,
"valid_targets_min": 1988
},
{
"epoch": 0.6864,
"grad_norm": 0.13283116074357573,
"learning_rate": 3.9833026068868814e-05,
"loss": 0.0048,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.001742208143696189,
"step": 715,
"valid_targets_mean": 4114.5,
"valid_targets_min": 1914
},
{
"epoch": 0.6912,
"grad_norm": 0.12495828177583537,
"learning_rate": 3.982427535895982e-05,
"loss": 0.0043,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.001497375313192606,
"step": 720,
"valid_targets_mean": 3872.3,
"valid_targets_min": 1942
},
{
"epoch": 0.696,
"grad_norm": 0.26157930715172134,
"learning_rate": 3.9815302176618076e-05,
"loss": 0.0045,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0012776684015989304,
"step": 725,
"valid_targets_mean": 3521.8,
"valid_targets_min": 1751
},
{
"epoch": 0.7008,
"grad_norm": 0.1247067429593807,
"learning_rate": 3.980610662254264e-05,
"loss": 0.0047,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0015188871184363961,
"step": 730,
"valid_targets_mean": 3731.8,
"valid_targets_min": 1942
},
{
"epoch": 0.7056,
"grad_norm": 0.10721609529299062,
"learning_rate": 3.9796688799928075e-05,
"loss": 0.0044,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0013464395888149738,
"step": 735,
"valid_targets_mean": 4545.2,
"valid_targets_min": 2003
},
{
"epoch": 0.7104,
"grad_norm": 0.14094264977785242,
"learning_rate": 3.978704881446327e-05,
"loss": 0.0044,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0014088444877415895,
"step": 740,
"valid_targets_mean": 3220.6,
"valid_targets_min": 1906
},
{
"epoch": 0.7152,
"grad_norm": 0.10781543110136461,
"learning_rate": 3.9777186774330304e-05,
"loss": 0.0044,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0012600058689713478,
"step": 745,
"valid_targets_mean": 4427.3,
"valid_targets_min": 2263
},
{
"epoch": 0.72,
"grad_norm": 0.12029787392855426,
"learning_rate": 3.976710279020318e-05,
"loss": 0.0043,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0010703550651669502,
"step": 750,
"valid_targets_mean": 4369.5,
"valid_targets_min": 2020
},
{
"epoch": 0.7248,
"grad_norm": 0.15068996687496647,
"learning_rate": 3.975679697524661e-05,
"loss": 0.0046,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0014090463519096375,
"step": 755,
"valid_targets_mean": 4053.9,
"valid_targets_min": 1917
},
{
"epoch": 0.7296,
"grad_norm": 0.12000665726518672,
"learning_rate": 3.974626944511475e-05,
"loss": 0.0041,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0011800779029726982,
"step": 760,
"valid_targets_mean": 3526.3,
"valid_targets_min": 2033
},
{
"epoch": 0.7344,
"grad_norm": 0.10875222012783078,
"learning_rate": 3.973552031794988e-05,
"loss": 0.0042,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0012633678270503879,
"step": 765,
"valid_targets_mean": 5437.8,
"valid_targets_min": 1943
},
{
"epoch": 0.7392,
"grad_norm": 0.11241217686368878,
"learning_rate": 3.9724549714381106e-05,
"loss": 0.0041,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0012497665593400598,
"step": 770,
"valid_targets_mean": 4326.5,
"valid_targets_min": 2002
},
{
"epoch": 0.744,
"grad_norm": 0.11897759021143543,
"learning_rate": 3.971335775752298e-05,
"loss": 0.0045,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.001275674207136035,
"step": 775,
"valid_targets_mean": 2989.6,
"valid_targets_min": 1960
},
{
"epoch": 0.7488,
"grad_norm": 0.11558986969740365,
"learning_rate": 3.970194457297414e-05,
"loss": 0.0042,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0014982791617512703,
"step": 780,
"valid_targets_mean": 3710.9,
"valid_targets_min": 1908
},
{
"epoch": 0.7536,
"grad_norm": 0.10741653865582416,
"learning_rate": 3.9690310288815876e-05,
"loss": 0.004,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00115393684245646,
"step": 785,
"valid_targets_mean": 4165.2,
"valid_targets_min": 1775
},
{
"epoch": 0.7584,
"grad_norm": 0.11516842126720446,
"learning_rate": 3.967845503561073e-05,
"loss": 0.0043,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0013473081635311246,
"step": 790,
"valid_targets_mean": 4067.3,
"valid_targets_min": 1942
},
{
"epoch": 0.7632,
"grad_norm": 0.11351545091236749,
"learning_rate": 3.9666378946400974e-05,
"loss": 0.0036,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.001365464529953897,
"step": 795,
"valid_targets_mean": 3699.9,
"valid_targets_min": 1833
},
{
"epoch": 0.768,
"grad_norm": 0.12309069150799558,
"learning_rate": 3.965408215670719e-05,
"loss": 0.004,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0013098465278744698,
"step": 800,
"valid_targets_mean": 3937.4,
"valid_targets_min": 1964
},
{
"epoch": 0.7728,
"grad_norm": 0.12432078035897463,
"learning_rate": 3.964156480452667e-05,
"loss": 0.0042,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0015537126455456018,
"step": 805,
"valid_targets_mean": 4146.9,
"valid_targets_min": 1764
},
{
"epoch": 0.7776,
"grad_norm": 0.11795652999166656,
"learning_rate": 3.962882703033195e-05,
"loss": 0.0043,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0011664225021377206,
"step": 810,
"valid_targets_mean": 4204.5,
"valid_targets_min": 1939
},
{
"epoch": 0.7824,
"grad_norm": 0.11091476599630226,
"learning_rate": 3.961586897706915e-05,
"loss": 0.0036,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0015496142441406846,
"step": 815,
"valid_targets_mean": 4644.7,
"valid_targets_min": 1939
},
{
"epoch": 0.7872,
"grad_norm": 0.10688116342811396,
"learning_rate": 3.960269079015643e-05,
"loss": 0.0039,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.001176126068457961,
"step": 820,
"valid_targets_mean": 4056.7,
"valid_targets_min": 1980
},
{
"epoch": 0.792,
"grad_norm": 0.11642692391730794,
"learning_rate": 3.958929261748236e-05,
"loss": 0.0036,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.001297774026170373,
"step": 825,
"valid_targets_mean": 3668.7,
"valid_targets_min": 1614
},
{
"epoch": 0.7968,
"grad_norm": 0.098807867074682,
"learning_rate": 3.957567460940419e-05,
"loss": 0.0038,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0012444111052900553,
"step": 830,
"valid_targets_mean": 4412.2,
"valid_targets_min": 1763
},
{
"epoch": 0.8016,
"grad_norm": 0.11412160343259568,
"learning_rate": 3.9561836918746256e-05,
"loss": 0.0035,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0010612367186695337,
"step": 835,
"valid_targets_mean": 4943.7,
"valid_targets_min": 1877
},
{
"epoch": 0.8064,
"grad_norm": 0.11666792034799639,
"learning_rate": 3.95477797007982e-05,
"loss": 0.0036,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0011054251808673143,
"step": 840,
"valid_targets_mean": 4050.5,
"valid_targets_min": 1937
},
{
"epoch": 0.8112,
"grad_norm": 0.11538500128726843,
"learning_rate": 3.953350311331325e-05,
"loss": 0.0037,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0011343640508130193,
"step": 845,
"valid_targets_mean": 4588.8,
"valid_targets_min": 1775
},
{
"epoch": 0.816,
"grad_norm": 0.09364586828014224,
"learning_rate": 3.951900731650645e-05,
"loss": 0.0034,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0010743942111730576,
"step": 850,
"valid_targets_mean": 4492.2,
"valid_targets_min": 1906
},
{
"epoch": 0.8208,
"grad_norm": 0.11750177774881453,
"learning_rate": 3.950429247305286e-05,
"loss": 0.0036,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0011643307516351342,
"step": 855,
"valid_targets_mean": 2967.8,
"valid_targets_min": 1680
},
{
"epoch": 0.8256,
"grad_norm": 0.11124286170862023,
"learning_rate": 3.9489358748085737e-05,
"loss": 0.0034,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.001344716758467257,
"step": 860,
"valid_targets_mean": 3575.3,
"valid_targets_min": 1771
},
{
"epoch": 0.8304,
"grad_norm": 0.1084575920874673,
"learning_rate": 3.947420630919466e-05,
"loss": 0.0034,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.001134268008172512,
"step": 865,
"valid_targets_mean": 4376.6,
"valid_targets_min": 1891
},
{
"epoch": 0.8352,
"grad_norm": 0.10852534059779477,
"learning_rate": 3.9458835326423674e-05,
"loss": 0.0035,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.001093921484425664,
"step": 870,
"valid_targets_mean": 3641.3,
"valid_targets_min": 1838
},
{
"epoch": 0.84,
"grad_norm": 0.1079926557884953,
"learning_rate": 3.9443245972269376e-05,
"loss": 0.0038,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0012400320265442133,
"step": 875,
"valid_targets_mean": 3411.1,
"valid_targets_min": 1992
},
{
"epoch": 0.8448,
"grad_norm": 0.11238022059807141,
"learning_rate": 3.942743842167896e-05,
"loss": 0.0036,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0012292286846786737,
"step": 880,
"valid_targets_mean": 2977.5,
"valid_targets_min": 1877
},
{
"epoch": 0.8496,
"grad_norm": 0.09672286411873122,
"learning_rate": 3.941141285204829e-05,
"loss": 0.0032,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0007136667263694108,
"step": 885,
"valid_targets_mean": 3401.6,
"valid_targets_min": 1727
},
{
"epoch": 0.8544,
"grad_norm": 0.108672832404322,
"learning_rate": 3.939516944321986e-05,
"loss": 0.0031,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0014265866484493017,
"step": 890,
"valid_targets_mean": 5317.2,
"valid_targets_min": 2096
},
{
"epoch": 0.8592,
"grad_norm": 0.08500035385803482,
"learning_rate": 3.937870837748085e-05,
"loss": 0.0031,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0007657730020582676,
"step": 895,
"valid_targets_mean": 4747.8,
"valid_targets_min": 1652
},
{
"epoch": 0.864,
"grad_norm": 0.12054172577524297,
"learning_rate": 3.936202983956098e-05,
"loss": 0.0032,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0010280468268319964,
"step": 900,
"valid_targets_mean": 4090.7,
"valid_targets_min": 1921
},
{
"epoch": 0.8688,
"grad_norm": 0.10234250480193231,
"learning_rate": 3.934513401663052e-05,
"loss": 0.0032,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0010562061797827482,
"step": 905,
"valid_targets_mean": 3031.4,
"valid_targets_min": 1991
},
{
"epoch": 0.8736,
"grad_norm": 0.12774724999406212,
"learning_rate": 3.9328021098298164e-05,
"loss": 0.0035,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.001268667634576559,
"step": 910,
"valid_targets_mean": 3329.1,
"valid_targets_min": 2014
},
{
"epoch": 0.8784,
"grad_norm": 0.10641838411361687,
"learning_rate": 3.9310691276608894e-05,
"loss": 0.0032,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.000988850835710764,
"step": 915,
"valid_targets_mean": 3899.7,
"valid_targets_min": 1716
},
{
"epoch": 0.8832,
"grad_norm": 0.10827132525574004,
"learning_rate": 3.9293144746041824e-05,
"loss": 0.0031,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0011344174854457378,
"step": 920,
"valid_targets_mean": 3272.9,
"valid_targets_min": 1760
},
{
"epoch": 0.888,
"grad_norm": 0.09513704022755502,
"learning_rate": 3.9275381703508034e-05,
"loss": 0.0032,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0011016558855772018,
"step": 925,
"valid_targets_mean": 3681.6,
"valid_targets_min": 1836
},
{
"epoch": 0.8928,
"grad_norm": 0.07861451847755797,
"learning_rate": 3.925740234834833e-05,
"loss": 0.0028,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0006670982111245394,
"step": 930,
"valid_targets_mean": 4255.3,
"valid_targets_min": 1361
},
{
"epoch": 0.8976,
"grad_norm": 0.09716097453724373,
"learning_rate": 3.9239206882331045e-05,
"loss": 0.0028,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0010126556735485792,
"step": 935,
"valid_targets_mean": 4101.5,
"valid_targets_min": 1933
},
{
"epoch": 0.9024,
"grad_norm": 0.09329297657208854,
"learning_rate": 3.922079550964976e-05,
"loss": 0.0034,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.001035340828821063,
"step": 940,
"valid_targets_mean": 3683.1,
"valid_targets_min": 1912
},
{
"epoch": 0.9072,
"grad_norm": 0.10634525538037214,
"learning_rate": 3.920216843692099e-05,
"loss": 0.003,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0008592663798481226,
"step": 945,
"valid_targets_mean": 3470.2,
"valid_targets_min": 1942
},
{
"epoch": 0.912,
"grad_norm": 0.09331321143620223,
"learning_rate": 3.918332587318189e-05,
"loss": 0.0031,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0009684814722277224,
"step": 950,
"valid_targets_mean": 3834.3,
"valid_targets_min": 1921
},
{
"epoch": 0.9168,
"grad_norm": 0.0933007582514206,
"learning_rate": 3.916426802988791e-05,
"loss": 0.0031,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0009699763031676412,
"step": 955,
"valid_targets_mean": 4792.5,
"valid_targets_min": 1802
},
{
"epoch": 0.9216,
"grad_norm": 0.08822587812104978,
"learning_rate": 3.9144995120910414e-05,
"loss": 0.0029,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.001074823783710599,
"step": 960,
"valid_targets_mean": 4560.1,
"valid_targets_min": 2210
},
{
"epoch": 0.9264,
"grad_norm": 0.10596108991960777,
"learning_rate": 3.912550736253428e-05,
"loss": 0.0029,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0008593408274464309,
"step": 965,
"valid_targets_mean": 3210.6,
"valid_targets_min": 1833
},
{
"epoch": 0.9312,
"grad_norm": 0.08707190113521034,
"learning_rate": 3.9105804973455466e-05,
"loss": 0.0031,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0010110901203006506,
"step": 970,
"valid_targets_mean": 4952.5,
"valid_targets_min": 1987
},
{
"epoch": 0.936,
"grad_norm": 0.09171050448973861,
"learning_rate": 3.908588817477858e-05,
"loss": 0.0028,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0010078486520797014,
"step": 975,
"valid_targets_mean": 5238.2,
"valid_targets_min": 1863
},
{
"epoch": 0.9408,
"grad_norm": 0.09164652188624466,
"learning_rate": 3.9065757190014356e-05,
"loss": 0.0027,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0008506424492225051,
"step": 980,
"valid_targets_mean": 4875.0,
"valid_targets_min": 1925
},
{
"epoch": 0.9456,
"grad_norm": 0.10980723053180172,
"learning_rate": 3.90454122450772e-05,
"loss": 0.0027,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0008993170922622085,
"step": 985,
"valid_targets_mean": 3326.2,
"valid_targets_min": 1920
},
{
"epoch": 0.9504,
"grad_norm": 0.08983452553358251,
"learning_rate": 3.9024853568282615e-05,
"loss": 0.0031,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0009225120302289724,
"step": 990,
"valid_targets_mean": 4108.7,
"valid_targets_min": 1975
},
{
"epoch": 0.9552,
"grad_norm": 0.09169525441917338,
"learning_rate": 3.900408139034464e-05,
"loss": 0.0028,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0007527648704126477,
"step": 995,
"valid_targets_mean": 3358.1,
"valid_targets_min": 1908
},
{
"epoch": 0.96,
"grad_norm": 0.08231724789721716,
"learning_rate": 3.89830959443733e-05,
"loss": 0.0028,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0007301989244297147,
"step": 1000,
"valid_targets_mean": 3902.4,
"valid_targets_min": 1719
},
{
"epoch": 0.9648,
"grad_norm": 0.09136251476965629,
"learning_rate": 3.896189746587192e-05,
"loss": 0.0026,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0006765191210433841,
"step": 1005,
"valid_targets_mean": 3040.7,
"valid_targets_min": 1992
},
{
"epoch": 0.9696,
"grad_norm": 0.0973881927043345,
"learning_rate": 3.894048619273457e-05,
"loss": 0.0027,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0008304090006276965,
"step": 1010,
"valid_targets_mean": 3484.0,
"valid_targets_min": 2008
},
{
"epoch": 0.9744,
"grad_norm": 0.10329326340033367,
"learning_rate": 3.89188623652433e-05,
"loss": 0.0027,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0010426387889310718,
"step": 1015,
"valid_targets_mean": 3487.8,
"valid_targets_min": 1933
},
{
"epoch": 0.9792,
"grad_norm": 0.08556444578908518,
"learning_rate": 3.889702622606553e-05,
"loss": 0.0028,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0011887401342391968,
"step": 1020,
"valid_targets_mean": 4090.1,
"valid_targets_min": 1951
},
{
"epoch": 0.984,
"grad_norm": 0.08515059162016657,
"learning_rate": 3.887497802025129e-05,
"loss": 0.0024,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0007636288064531982,
"step": 1025,
"valid_targets_mean": 4201.1,
"valid_targets_min": 1920
},
{
"epoch": 0.9888,
"grad_norm": 0.09535626849370749,
"learning_rate": 3.885271799523043e-05,
"loss": 0.0026,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0009697978966869414,
"step": 1030,
"valid_targets_mean": 3636.8,
"valid_targets_min": 1614
},
{
"epoch": 0.9936,
"grad_norm": 0.0980669848781187,
"learning_rate": 3.8830246400809925e-05,
"loss": 0.0029,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0009542859625071287,
"step": 1035,
"valid_targets_mean": 3659.2,
"valid_targets_min": 1870
},
{
"epoch": 0.9984,
"grad_norm": 0.08778230952309017,
"learning_rate": 3.880756348917101e-05,
"loss": 0.003,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0012875967659056187,
"step": 1040,
"valid_targets_mean": 4062.1,
"valid_targets_min": 2081
},
{
"epoch": 1.00288,
"grad_norm": 0.086197700086096,
"learning_rate": 3.8784669514866365e-05,
"loss": 0.0025,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0009929087245836854,
"step": 1045,
"valid_targets_mean": 3231.5,
"valid_targets_min": 1719
},
{
"epoch": 1.00768,
"grad_norm": 0.08547866320552522,
"learning_rate": 3.876156473481727e-05,
"loss": 0.0027,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.000846736365929246,
"step": 1050,
"valid_targets_mean": 4431.3,
"valid_targets_min": 1993
},
{
"epoch": 1.01248,
"grad_norm": 0.08391253769447353,
"learning_rate": 3.8738249408310716e-05,
"loss": 0.0024,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0007149117300286889,
"step": 1055,
"valid_targets_mean": 3551.1,
"valid_targets_min": 1771
},
{
"epoch": 1.01728,
"grad_norm": 0.07389756284878693,
"learning_rate": 3.871472379699648e-05,
"loss": 0.0023,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0007226199377328157,
"step": 1060,
"valid_targets_mean": 3603.4,
"valid_targets_min": 2074
},
{
"epoch": 1.02208,
"grad_norm": 0.08190003923821697,
"learning_rate": 3.869098816488422e-05,
"loss": 0.0025,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0008007280994206667,
"step": 1065,
"valid_targets_mean": 3631.3,
"valid_targets_min": 1970
},
{
"epoch": 1.02688,
"grad_norm": 0.0953727091278497,
"learning_rate": 3.866704277834049e-05,
"loss": 0.0025,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0009208035771735013,
"step": 1070,
"valid_targets_mean": 3726.2,
"valid_targets_min": 1906
},
{
"epoch": 1.03168,
"grad_norm": 0.0782930286061942,
"learning_rate": 3.864288790608573e-05,
"loss": 0.0029,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0010479418560862541,
"step": 1075,
"valid_targets_mean": 4111.3,
"valid_targets_min": 2026
},
{
"epoch": 1.03648,
"grad_norm": 0.08763252794635999,
"learning_rate": 3.861852381919132e-05,
"loss": 0.0023,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0008621154120191932,
"step": 1080,
"valid_targets_mean": 3631.4,
"valid_targets_min": 2011
},
{
"epoch": 1.04128,
"grad_norm": 0.07975207664420085,
"learning_rate": 3.8593950791076446e-05,
"loss": 0.0023,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0007578890072181821,
"step": 1085,
"valid_targets_mean": 4506.1,
"valid_targets_min": 1838
},
{
"epoch": 1.04608,
"grad_norm": 0.08519082868687813,
"learning_rate": 3.856916909750512e-05,
"loss": 0.0024,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0008825008408166468,
"step": 1090,
"valid_targets_mean": 3900.7,
"valid_targets_min": 1889
},
{
"epoch": 1.05088,
"grad_norm": 0.08661350730724589,
"learning_rate": 3.854417901658301e-05,
"loss": 0.0027,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0010637170635163784,
"step": 1095,
"valid_targets_mean": 3464.5,
"valid_targets_min": 1839
},
{
"epoch": 1.05568,
"grad_norm": 0.0779672388921201,
"learning_rate": 3.851898082875438e-05,
"loss": 0.0023,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0006217740592546761,
"step": 1100,
"valid_targets_mean": 3628.1,
"valid_targets_min": 1802
},
{
"epoch": 1.06048,
"grad_norm": 0.07394866276608925,
"learning_rate": 3.849357481679891e-05,
"loss": 0.0023,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.000598479644395411,
"step": 1105,
"valid_targets_mean": 3672.1,
"valid_targets_min": 1562
},
{
"epoch": 1.06528,
"grad_norm": 0.08662140030567693,
"learning_rate": 3.846796126582851e-05,
"loss": 0.0023,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0008953436627052724,
"step": 1110,
"valid_targets_mean": 4051.2,
"valid_targets_min": 1740
},
{
"epoch": 1.07008,
"grad_norm": 0.0823370220101719,
"learning_rate": 3.844214046328416e-05,
"loss": 0.0023,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0006970255635678768,
"step": 1115,
"valid_targets_mean": 3599.7,
"valid_targets_min": 1928
},
{
"epoch": 1.07488,
"grad_norm": 0.0901193916034131,
"learning_rate": 3.841611269893266e-05,
"loss": 0.0022,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0006074707489460707,
"step": 1120,
"valid_targets_mean": 3385.9,
"valid_targets_min": 1980
},
{
"epoch": 1.07968,
"grad_norm": 0.0761744661497128,
"learning_rate": 3.8389878264863364e-05,
"loss": 0.0026,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0008789674611762166,
"step": 1125,
"valid_targets_mean": 3657.1,
"valid_targets_min": 1934
},
{
"epoch": 1.08448,
"grad_norm": 0.08437359007221527,
"learning_rate": 3.836343745548495e-05,
"loss": 0.0022,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0008096237434074283,
"step": 1130,
"valid_targets_mean": 3535.8,
"valid_targets_min": 1906
},
{
"epoch": 1.08928,
"grad_norm": 0.0919856624688295,
"learning_rate": 3.833679056752205e-05,
"loss": 0.0023,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0010354400146752596,
"step": 1135,
"valid_targets_mean": 4240.6,
"valid_targets_min": 1662
},
{
"epoch": 1.09408,
"grad_norm": 0.0672698854888288,
"learning_rate": 3.8309937900012e-05,
"loss": 0.0024,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0006182040087878704,
"step": 1140,
"valid_targets_mean": 5282.5,
"valid_targets_min": 1847
},
{
"epoch": 1.09888,
"grad_norm": 0.09154431881180543,
"learning_rate": 3.8282879754301395e-05,
"loss": 0.0023,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0008248881786130369,
"step": 1145,
"valid_targets_mean": 3183.1,
"valid_targets_min": 1868
},
{
"epoch": 1.10368,
"grad_norm": 0.08087150149583128,
"learning_rate": 3.825561643404277e-05,
"loss": 0.0024,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0006553860730491579,
"step": 1150,
"valid_targets_mean": 4181.3,
"valid_targets_min": 1838
},
{
"epoch": 1.10848,
"grad_norm": 0.07350347984015675,
"learning_rate": 3.8228148245191195e-05,
"loss": 0.0024,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0006827219622209668,
"step": 1155,
"valid_targets_mean": 4734.0,
"valid_targets_min": 2008
},
{
"epoch": 1.11328,
"grad_norm": 0.07091572829462224,
"learning_rate": 3.820047549600078e-05,
"loss": 0.0027,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0006135037983767688,
"step": 1160,
"valid_targets_mean": 3254.9,
"valid_targets_min": 1525
},
{
"epoch": 1.11808,
"grad_norm": 0.0777569727802482,
"learning_rate": 3.8172598497021304e-05,
"loss": 0.0022,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0010421124752610922,
"step": 1165,
"valid_targets_mean": 4660.4,
"valid_targets_min": 1705
},
{
"epoch": 1.12288,
"grad_norm": 0.08688863620334608,
"learning_rate": 3.8144517561094635e-05,
"loss": 0.0022,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0008928946917876601,
"step": 1170,
"valid_targets_mean": 3918.8,
"valid_targets_min": 1907
},
{
"epoch": 1.12768,
"grad_norm": 0.07873600105581716,
"learning_rate": 3.811623300335129e-05,
"loss": 0.0021,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0007803626358509064,
"step": 1175,
"valid_targets_mean": 3826.0,
"valid_targets_min": 1933
},
{
"epoch": 1.13248,
"grad_norm": 0.07726798965675107,
"learning_rate": 3.808774514120689e-05,
"loss": 0.0023,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0007038116455078125,
"step": 1180,
"valid_targets_mean": 2743.8,
"valid_targets_min": 2007
},
{
"epoch": 1.13728,
"grad_norm": 0.07403528700578575,
"learning_rate": 3.805905429435856e-05,
"loss": 0.0021,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0009153485298156738,
"step": 1185,
"valid_targets_mean": 4641.1,
"valid_targets_min": 1904
},
{
"epoch": 1.14208,
"grad_norm": 0.0872290553941291,
"learning_rate": 3.803016078478137e-05,
"loss": 0.0021,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0007584341801702976,
"step": 1190,
"valid_targets_mean": 3616.6,
"valid_targets_min": 1925
},
{
"epoch": 1.14688,
"grad_norm": 0.0709258238934523,
"learning_rate": 3.800106493672472e-05,
"loss": 0.0023,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0006345144938677549,
"step": 1195,
"valid_targets_mean": 3609.2,
"valid_targets_min": 1786
},
{
"epoch": 1.15168,
"grad_norm": 0.07801772343781505,
"learning_rate": 3.7971767076708704e-05,
"loss": 0.0022,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0009863885352388024,
"step": 1200,
"valid_targets_mean": 3440.6,
"valid_targets_min": 1614
},
{
"epoch": 1.15648,
"grad_norm": 0.07389611823346304,
"learning_rate": 3.794226753352042e-05,
"loss": 0.002,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0007948827114887536,
"step": 1205,
"valid_targets_mean": 3287.3,
"valid_targets_min": 1361
},
{
"epoch": 1.16128,
"grad_norm": 0.06497642766755227,
"learning_rate": 3.791256663821032e-05,
"loss": 0.0022,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0005222467589192092,
"step": 1210,
"valid_targets_mean": 4036.9,
"valid_targets_min": 2034
},
{
"epoch": 1.16608,
"grad_norm": 0.06299482388250971,
"learning_rate": 3.788266472408846e-05,
"loss": 0.0021,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0005134165403433144,
"step": 1215,
"valid_targets_mean": 3814.6,
"valid_targets_min": 1914
},
{
"epoch": 1.17088,
"grad_norm": 0.08171326113301111,
"learning_rate": 3.785256212672077e-05,
"loss": 0.0023,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0009849846828728914,
"step": 1220,
"valid_targets_mean": 3237.6,
"valid_targets_min": 2013
},
{
"epoch": 1.17568,
"grad_norm": 0.0804150430123658,
"learning_rate": 3.7822259183925324e-05,
"loss": 0.0022,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0006895281840115786,
"step": 1225,
"valid_targets_mean": 3147.6,
"valid_targets_min": 2073
},
{
"epoch": 1.18048,
"grad_norm": 0.07953442754835148,
"learning_rate": 3.7791756235768476e-05,
"loss": 0.0021,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0005019694799557328,
"step": 1230,
"valid_targets_mean": 4059.0,
"valid_targets_min": 1986
},
{
"epoch": 1.1852800000000001,
"grad_norm": 0.06855513232526653,
"learning_rate": 3.7761053624561104e-05,
"loss": 0.0023,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0006399221601895988,
"step": 1235,
"valid_targets_mean": 4481.3,
"valid_targets_min": 1652
},
{
"epoch": 1.19008,
"grad_norm": 0.07266331471123853,
"learning_rate": 3.7730151694854757e-05,
"loss": 0.002,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0006030212971381843,
"step": 1240,
"valid_targets_mean": 3147.8,
"valid_targets_min": 2112
},
{
"epoch": 1.19488,
"grad_norm": 0.07341874027666305,
"learning_rate": 3.769905079343777e-05,
"loss": 0.0019,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0005216033896431327,
"step": 1245,
"valid_targets_mean": 3752.4,
"valid_targets_min": 2000
},
{
"epoch": 1.19968,
"grad_norm": 0.0772295236927303,
"learning_rate": 3.766775126933138e-05,
"loss": 0.0023,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0007670236518606544,
"step": 1250,
"valid_targets_mean": 3803.3,
"valid_targets_min": 1887
},
{
"epoch": 1.20448,
"grad_norm": 0.06534912913900263,
"learning_rate": 3.7636253473785815e-05,
"loss": 0.002,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0006711517926305532,
"step": 1255,
"valid_targets_mean": 3514.3,
"valid_targets_min": 1719
},
{
"epoch": 1.20928,
"grad_norm": 0.06650634860098974,
"learning_rate": 3.760455776027636e-05,
"loss": 0.0019,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.000556517974473536,
"step": 1260,
"valid_targets_mean": 4241.4,
"valid_targets_min": 1949
},
{
"epoch": 1.21408,
"grad_norm": 0.08877250893671114,
"learning_rate": 3.7572664484499365e-05,
"loss": 0.002,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0009134068968705833,
"step": 1265,
"valid_targets_mean": 2475.9,
"valid_targets_min": 1900
},
{
"epoch": 1.21888,
"grad_norm": 0.07123738698666394,
"learning_rate": 3.7540574004368264e-05,
"loss": 0.0021,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0004884611698798835,
"step": 1270,
"valid_targets_mean": 4605.3,
"valid_targets_min": 1833
},
{
"epoch": 1.2236799999999999,
"grad_norm": 0.06505623796756807,
"learning_rate": 3.750828668000959e-05,
"loss": 0.002,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0005974129308015108,
"step": 1275,
"valid_targets_mean": 3525.4,
"valid_targets_min": 2047
},
{
"epoch": 1.22848,
"grad_norm": 0.061783395627733356,
"learning_rate": 3.747580287375887e-05,
"loss": 0.002,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0005115181556902826,
"step": 1280,
"valid_targets_mean": 4752.2,
"valid_targets_min": 2102
},
{
"epoch": 1.23328,
"grad_norm": 0.06631151827050302,
"learning_rate": 3.744312295015662e-05,
"loss": 0.0021,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0005237223813310266,
"step": 1285,
"valid_targets_mean": 4775.7,
"valid_targets_min": 1933
},
{
"epoch": 1.23808,
"grad_norm": 0.08273205851761135,
"learning_rate": 3.7410247275944223e-05,
"loss": 0.0021,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0007862814818508923,
"step": 1290,
"valid_targets_mean": 3475.9,
"valid_targets_min": 1771
},
{
"epoch": 1.24288,
"grad_norm": 0.05896227722198991,
"learning_rate": 3.737717622005981e-05,
"loss": 0.0019,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0005240546306595206,
"step": 1295,
"valid_targets_mean": 4562.6,
"valid_targets_min": 2026
},
{
"epoch": 1.24768,
"grad_norm": 0.0693995618369498,
"learning_rate": 3.734391015363413e-05,
"loss": 0.0018,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0005423809634521604,
"step": 1300,
"valid_targets_mean": 4364.8,
"valid_targets_min": 1863
},
{
"epoch": 1.25248,
"grad_norm": 0.07369923985839384,
"learning_rate": 3.7310449449986404e-05,
"loss": 0.0019,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0005977890104986727,
"step": 1305,
"valid_targets_mean": 3853.8,
"valid_targets_min": 1863
},
{
"epoch": 1.25728,
"grad_norm": 0.07551774484051925,
"learning_rate": 3.727679448462009e-05,
"loss": 0.0019,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0006663898238912225,
"step": 1310,
"valid_targets_mean": 3010.4,
"valid_targets_min": 1912
},
{
"epoch": 1.26208,
"grad_norm": 0.064694527946226,
"learning_rate": 3.7242945635218696e-05,
"loss": 0.0019,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0006106563378125429,
"step": 1315,
"valid_targets_mean": 4648.5,
"valid_targets_min": 1614
},
{
"epoch": 1.26688,
"grad_norm": 0.07397659737573328,
"learning_rate": 3.720890328164156e-05,
"loss": 0.002,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0007054214365780354,
"step": 1320,
"valid_targets_mean": 3650.5,
"valid_targets_min": 1525
},
{
"epoch": 1.27168,
"grad_norm": 0.06335161480174571,
"learning_rate": 3.717466780591956e-05,
"loss": 0.002,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0006929860101081431,
"step": 1325,
"valid_targets_mean": 5325.5,
"valid_targets_min": 2040
},
{
"epoch": 1.27648,
"grad_norm": 0.06804994355224919,
"learning_rate": 3.7140239592250804e-05,
"loss": 0.0019,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.000726754660718143,
"step": 1330,
"valid_targets_mean": 4236.4,
"valid_targets_min": 1877
},
{
"epoch": 1.28128,
"grad_norm": 0.06480070102782637,
"learning_rate": 3.71056190269964e-05,
"loss": 0.0018,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0006756271468475461,
"step": 1335,
"valid_targets_mean": 4148.4,
"valid_targets_min": 1562
},
{
"epoch": 1.2860800000000001,
"grad_norm": 0.07074354812550124,
"learning_rate": 3.7070806498676025e-05,
"loss": 0.0018,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0006020993459969759,
"step": 1340,
"valid_targets_mean": 3465.2,
"valid_targets_min": 2013
},
{
"epoch": 1.29088,
"grad_norm": 0.06503461305315013,
"learning_rate": 3.7035802397963625e-05,
"loss": 0.0015,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0006871588411740959,
"step": 1345,
"valid_targets_mean": 3813.0,
"valid_targets_min": 1614
},
{
"epoch": 1.29568,
"grad_norm": 0.07401450353104723,
"learning_rate": 3.700060711768302e-05,
"loss": 0.0018,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0006600288324989378,
"step": 1350,
"valid_targets_mean": 3878.8,
"valid_targets_min": 1839
},
{
"epoch": 1.30048,
"grad_norm": 0.07680667987027859,
"learning_rate": 3.696522105280348e-05,
"loss": 0.0017,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0007312206435017288,
"step": 1355,
"valid_targets_mean": 4043.9,
"valid_targets_min": 1764
},
{
"epoch": 1.30528,
"grad_norm": 0.06469896222704227,
"learning_rate": 3.6929644600435303e-05,
"loss": 0.0019,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0006350899348035455,
"step": 1360,
"valid_targets_mean": 4086.7,
"valid_targets_min": 1652
},
{
"epoch": 1.3100800000000001,
"grad_norm": 0.06477008506037779,
"learning_rate": 3.689387815982536e-05,
"loss": 0.0017,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0005677276058122516,
"step": 1365,
"valid_targets_mean": 4331.5,
"valid_targets_min": 2088
},
{
"epoch": 1.31488,
"grad_norm": 0.06258396354088679,
"learning_rate": 3.6857922132352617e-05,
"loss": 0.0018,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0006163810612633824,
"step": 1370,
"valid_targets_mean": 4495.3,
"valid_targets_min": 1705
},
{
"epoch": 1.31968,
"grad_norm": 0.07028510535202044,
"learning_rate": 3.6821776921523615e-05,
"loss": 0.0019,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0007107181008905172,
"step": 1375,
"valid_targets_mean": 3949.4,
"valid_targets_min": 2014
},
{
"epoch": 1.3244799999999999,
"grad_norm": 0.05077976162402836,
"learning_rate": 3.678544293296797e-05,
"loss": 0.0016,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0004410394176375121,
"step": 1380,
"valid_targets_mean": 4144.0,
"valid_targets_min": 1921
},
{
"epoch": 1.32928,
"grad_norm": 0.07438935849118425,
"learning_rate": 3.674892057443378e-05,
"loss": 0.0018,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0008442823309451342,
"step": 1385,
"valid_targets_mean": 4133.5,
"valid_targets_min": 2143
},
{
"epoch": 1.33408,
"grad_norm": 0.0682757279109907,
"learning_rate": 3.671221025578309e-05,
"loss": 0.0018,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0007162219844758511,
"step": 1390,
"valid_targets_mean": 4855.8,
"valid_targets_min": 1913
},
{
"epoch": 1.33888,
"grad_norm": 0.07341922338949,
"learning_rate": 3.6675312388987274e-05,
"loss": 0.0017,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0006667692796327174,
"step": 1395,
"valid_targets_mean": 3465.5,
"valid_targets_min": 2030
},
{
"epoch": 1.34368,
"grad_norm": 0.07020332214835699,
"learning_rate": 3.663822738812241e-05,
"loss": 0.0017,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0006832577055320144,
"step": 1400,
"valid_targets_mean": 4072.4,
"valid_targets_min": 2007
},
{
"epoch": 1.34848,
"grad_norm": 0.06099353552564727,
"learning_rate": 3.660095566936462e-05,
"loss": 0.0018,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00047730878577567637,
"step": 1405,
"valid_targets_mean": 5152.2,
"valid_targets_min": 1977
},
{
"epoch": 1.35328,
"grad_norm": 0.05528893930640278,
"learning_rate": 3.656349765098546e-05,
"loss": 0.0016,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0005526028689928353,
"step": 1410,
"valid_targets_mean": 4026.0,
"valid_targets_min": 2112
},
{
"epoch": 1.35808,
"grad_norm": 0.06445302958586464,
"learning_rate": 3.652585375334714e-05,
"loss": 0.0015,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0005105407908558846,
"step": 1415,
"valid_targets_mean": 4236.2,
"valid_targets_min": 1662
},
{
"epoch": 1.36288,
"grad_norm": 0.06802186778046675,
"learning_rate": 3.648802439889785e-05,
"loss": 0.0016,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0005574011011049151,
"step": 1420,
"valid_targets_mean": 3783.2,
"valid_targets_min": 1839
},
{
"epoch": 1.36768,
"grad_norm": 0.06528073484942466,
"learning_rate": 3.645001001216705e-05,
"loss": 0.0016,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0005780609208159149,
"step": 1425,
"valid_targets_mean": 2935.5,
"valid_targets_min": 1838
},
{
"epoch": 1.37248,
"grad_norm": 0.05639907531689663,
"learning_rate": 3.641181101976065e-05,
"loss": 0.0017,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0004771294188685715,
"step": 1430,
"valid_targets_mean": 3967.0,
"valid_targets_min": 1904
},
{
"epoch": 1.37728,
"grad_norm": 0.06966113126336215,
"learning_rate": 3.637342785035624e-05,
"loss": 0.0017,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0004934966564178467,
"step": 1435,
"valid_targets_mean": 4545.3,
"valid_targets_min": 1680
},
{
"epoch": 1.38208,
"grad_norm": 0.06651395252299827,
"learning_rate": 3.633486093469829e-05,
"loss": 0.0017,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.000541509420145303,
"step": 1440,
"valid_targets_mean": 3806.9,
"valid_targets_min": 1907
},
{
"epoch": 1.3868800000000001,
"grad_norm": 0.06692400353511045,
"learning_rate": 3.629611070559333e-05,
"loss": 0.0018,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.000700898002833128,
"step": 1445,
"valid_targets_mean": 2970.4,
"valid_targets_min": 1727
},
{
"epoch": 1.39168,
"grad_norm": 0.0556009908675102,
"learning_rate": 3.625717759790506e-05,
"loss": 0.0016,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0005732535501010716,
"step": 1450,
"valid_targets_mean": 3820.5,
"valid_targets_min": 1965
},
{
"epoch": 1.39648,
"grad_norm": 0.06579603095770614,
"learning_rate": 3.621806204854947e-05,
"loss": 0.0017,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0006776693044230342,
"step": 1455,
"valid_targets_mean": 3576.1,
"valid_targets_min": 1719
},
{
"epoch": 1.40128,
"grad_norm": 0.057150898506148747,
"learning_rate": 3.617876449648998e-05,
"loss": 0.0016,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0006130424444563687,
"step": 1460,
"valid_targets_mean": 4522.8,
"valid_targets_min": 1870
},
{
"epoch": 1.40608,
"grad_norm": 0.06670784102144113,
"learning_rate": 3.613928538273247e-05,
"loss": 0.0017,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00048188146320171654,
"step": 1465,
"valid_targets_mean": 3102.2,
"valid_targets_min": 1972
},
{
"epoch": 1.4108800000000001,
"grad_norm": 0.06763203016388951,
"learning_rate": 3.609962515032034e-05,
"loss": 0.0017,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0006231270963326097,
"step": 1470,
"valid_targets_mean": 2779.9,
"valid_targets_min": 1914
},
{
"epoch": 1.41568,
"grad_norm": 0.06280482861569853,
"learning_rate": 3.605978424432954e-05,
"loss": 0.0015,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0004219388938508928,
"step": 1475,
"valid_targets_mean": 3924.9,
"valid_targets_min": 1984
},
{
"epoch": 1.42048,
"grad_norm": 0.07020653984883694,
"learning_rate": 3.601976311186361e-05,
"loss": 0.0016,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00041140051325783134,
"step": 1480,
"valid_targets_mean": 2816.9,
"valid_targets_min": 1820
},
{
"epoch": 1.4252799999999999,
"grad_norm": 0.05898237565692731,
"learning_rate": 3.597956220204861e-05,
"loss": 0.0019,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0005558461998589337,
"step": 1485,
"valid_targets_mean": 4578.8,
"valid_targets_min": 1763
},
{
"epoch": 1.43008,
"grad_norm": 0.057373824481315346,
"learning_rate": 3.5939181966028084e-05,
"loss": 0.0016,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.000512075494043529,
"step": 1490,
"valid_targets_mean": 3754.1,
"valid_targets_min": 1900
},
{
"epoch": 1.43488,
"grad_norm": 0.07125513076235777,
"learning_rate": 3.589862285695804e-05,
"loss": 0.0016,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0007729599601589143,
"step": 1495,
"valid_targets_mean": 3450.2,
"valid_targets_min": 1705
},
{
"epoch": 1.43968,
"grad_norm": 0.060930732371940854,
"learning_rate": 3.585788533000184e-05,
"loss": 0.0015,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0006291154422797263,
"step": 1500,
"valid_targets_mean": 4446.1,
"valid_targets_min": 1662
},
{
"epoch": 1.44448,
"grad_norm": 0.055811659510320806,
"learning_rate": 3.581696984232508e-05,
"loss": 0.0014,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00038417422911152244,
"step": 1505,
"valid_targets_mean": 3627.4,
"valid_targets_min": 1705
},
{
"epoch": 1.44928,
"grad_norm": 0.061531493977022365,
"learning_rate": 3.5775876853090465e-05,
"loss": 0.0015,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0006389599875546992,
"step": 1510,
"valid_targets_mean": 3979.2,
"valid_targets_min": 2031
},
{
"epoch": 1.45408,
"grad_norm": 0.0628987310198828,
"learning_rate": 3.5734606823452686e-05,
"loss": 0.0013,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0006298416992649436,
"step": 1515,
"valid_targets_mean": 3707.5,
"valid_targets_min": 1839
},
{
"epoch": 1.45888,
"grad_norm": 0.06317191831321439,
"learning_rate": 3.569316021655319e-05,
"loss": 0.0016,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0004600128741003573,
"step": 1520,
"valid_targets_mean": 4283.7,
"valid_targets_min": 1833
},
{
"epoch": 1.46368,
"grad_norm": 0.0568786391414204,
"learning_rate": 3.565153749751505e-05,
"loss": 0.0014,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0005623505567200482,
"step": 1525,
"valid_targets_mean": 4382.9,
"valid_targets_min": 1727
},
{
"epoch": 1.46848,
"grad_norm": 0.06022997207628912,
"learning_rate": 3.5609739133437666e-05,
"loss": 0.0014,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0004593412159010768,
"step": 1530,
"valid_targets_mean": 4219.6,
"valid_targets_min": 1877
},
{
"epoch": 1.47328,
"grad_norm": 0.062444717675455196,
"learning_rate": 3.55677655933916e-05,
"loss": 0.0015,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0005715553415939212,
"step": 1535,
"valid_targets_mean": 3537.5,
"valid_targets_min": 1662
},
{
"epoch": 1.47808,
"grad_norm": 0.0625345202594014,
"learning_rate": 3.5525617348413265e-05,
"loss": 0.0016,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0006118146702647209,
"step": 1540,
"valid_targets_mean": 3959.2,
"valid_targets_min": 1833
},
{
"epoch": 1.48288,
"grad_norm": 0.0676310496671364,
"learning_rate": 3.5483294871499646e-05,
"loss": 0.0013,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0005530751659534872,
"step": 1545,
"valid_targets_mean": 3372.5,
"valid_targets_min": 1877
},
{
"epoch": 1.4876800000000001,
"grad_norm": 0.060396214971341365,
"learning_rate": 3.544079863760302e-05,
"loss": 0.0014,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00045702309580519795,
"step": 1550,
"valid_targets_mean": 4131.5,
"valid_targets_min": 1838
},
{
"epoch": 1.49248,
"grad_norm": 0.054164127702003184,
"learning_rate": 3.5398129123625565e-05,
"loss": 0.0015,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00044832000276073813,
"step": 1555,
"valid_targets_mean": 3460.3,
"valid_targets_min": 1938
},
{
"epoch": 1.49728,
"grad_norm": 0.04613403287715913,
"learning_rate": 3.535528680841408e-05,
"loss": 0.0014,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0003852218796964735,
"step": 1560,
"valid_targets_mean": 4295.8,
"valid_targets_min": 1662
},
{
"epoch": 1.5020799999999999,
"grad_norm": 0.0500127512382979,
"learning_rate": 3.5312272172754566e-05,
"loss": 0.0015,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0002881671243812889,
"step": 1565,
"valid_targets_mean": 4434.7,
"valid_targets_min": 2013
},
{
"epoch": 1.50688,
"grad_norm": 0.04570223243728663,
"learning_rate": 3.5269085699366844e-05,
"loss": 0.0015,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00036125804763287306,
"step": 1570,
"valid_targets_mean": 3563.8,
"valid_targets_min": 1662
},
{
"epoch": 1.5116800000000001,
"grad_norm": 0.050115443527604414,
"learning_rate": 3.5225727872899136e-05,
"loss": 0.0014,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00035666252369992435,
"step": 1575,
"valid_targets_mean": 4493.9,
"valid_targets_min": 1958
},
{
"epoch": 1.51648,
"grad_norm": 0.05814250073314437,
"learning_rate": 3.518219917992262e-05,
"loss": 0.0014,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0004859221226070076,
"step": 1580,
"valid_targets_mean": 3551.9,
"valid_targets_min": 1918
},
{
"epoch": 1.52128,
"grad_norm": 0.06290377895194338,
"learning_rate": 3.5138500108926e-05,
"loss": 0.0014,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0005594316171482205,
"step": 1585,
"valid_targets_mean": 3467.0,
"valid_targets_min": 1907
},
{
"epoch": 1.5260799999999999,
"grad_norm": 0.05486405846197014,
"learning_rate": 3.509463115030995e-05,
"loss": 0.0015,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0005741740460507572,
"step": 1590,
"valid_targets_mean": 3229.7,
"valid_targets_min": 1908
},
{
"epoch": 1.53088,
"grad_norm": 0.05481084601712841,
"learning_rate": 3.505059279638172e-05,
"loss": 0.0015,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0004915180034004152,
"step": 1595,
"valid_targets_mean": 4382.2,
"valid_targets_min": 1829
},
{
"epoch": 1.5356800000000002,
"grad_norm": 0.05643903234898962,
"learning_rate": 3.500638554134952e-05,
"loss": 0.0014,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0005215753335505724,
"step": 1600,
"valid_targets_mean": 4035.5,
"valid_targets_min": 1934
},
{
"epoch": 1.54048,
"grad_norm": 0.05254977998780307,
"learning_rate": 3.4962009881317005e-05,
"loss": 0.0014,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0003885997866746038,
"step": 1605,
"valid_targets_mean": 4436.7,
"valid_targets_min": 1839
},
{
"epoch": 1.54528,
"grad_norm": 0.04901711420583684,
"learning_rate": 3.491746631427772e-05,
"loss": 0.0014,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00030224508373066783,
"step": 1610,
"valid_targets_mean": 4003.0,
"valid_targets_min": 1836
},
{
"epoch": 1.55008,
"grad_norm": 0.06623036966544768,
"learning_rate": 3.487275534010948e-05,
"loss": 0.0014,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00043395202374085784,
"step": 1615,
"valid_targets_mean": 3309.2,
"valid_targets_min": 1964
},
{
"epoch": 1.55488,
"grad_norm": 0.048836873073373185,
"learning_rate": 3.482787746056881e-05,
"loss": 0.0012,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0002878532977774739,
"step": 1620,
"valid_targets_mean": 3198.2,
"valid_targets_min": 1920
},
{
"epoch": 1.55968,
"grad_norm": 0.056913745823748994,
"learning_rate": 3.4782833179285256e-05,
"loss": 0.0014,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0003762117703445256,
"step": 1625,
"valid_targets_mean": 4056.7,
"valid_targets_min": 2048
},
{
"epoch": 1.56448,
"grad_norm": 0.0639777721623604,
"learning_rate": 3.473762300175578e-05,
"loss": 0.0015,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0006554973078891635,
"step": 1630,
"valid_targets_mean": 4729.8,
"valid_targets_min": 1913
},
{
"epoch": 1.56928,
"grad_norm": 0.051373274326048456,
"learning_rate": 3.469224743533906e-05,
"loss": 0.0014,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0003751883050426841,
"step": 1635,
"valid_targets_mean": 3390.2,
"valid_targets_min": 1719
},
{
"epoch": 1.57408,
"grad_norm": 0.05691966457897771,
"learning_rate": 3.464670698924981e-05,
"loss": 0.0013,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0004305654438212514,
"step": 1640,
"valid_targets_mean": 3745.8,
"valid_targets_min": 2113
},
{
"epoch": 1.5788799999999998,
"grad_norm": 0.05813617644285067,
"learning_rate": 3.4601002174553055e-05,
"loss": 0.0013,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0003666894044727087,
"step": 1645,
"valid_targets_mean": 2813.3,
"valid_targets_min": 1716
},
{
"epoch": 1.58368,
"grad_norm": 0.05612945598126955,
"learning_rate": 3.45551335041584e-05,
"loss": 0.0014,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0006458326242864132,
"step": 1650,
"valid_targets_mean": 3816.4,
"valid_targets_min": 1614
},
{
"epoch": 1.5884800000000001,
"grad_norm": 0.06049444178287035,
"learning_rate": 3.4509101492814286e-05,
"loss": 0.0012,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0003922865726053715,
"step": 1655,
"valid_targets_mean": 3021.3,
"valid_targets_min": 1517
},
{
"epoch": 1.59328,
"grad_norm": 0.06005838628831204,
"learning_rate": 3.446290665710219e-05,
"loss": 0.0013,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.000557239050976932,
"step": 1660,
"valid_targets_mean": 3385.1,
"valid_targets_min": 1908
},
{
"epoch": 1.59808,
"grad_norm": 0.057545476191578786,
"learning_rate": 3.441654951543085e-05,
"loss": 0.0013,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0004963584360666573,
"step": 1665,
"valid_targets_mean": 3562.9,
"valid_targets_min": 1937
},
{
"epoch": 1.6028799999999999,
"grad_norm": 0.0441759887433332,
"learning_rate": 3.4370030588030425e-05,
"loss": 0.0013,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0003990795521531254,
"step": 1670,
"valid_targets_mean": 4340.4,
"valid_targets_min": 2031
},
{
"epoch": 1.60768,
"grad_norm": 0.06127534174000278,
"learning_rate": 3.432335039694669e-05,
"loss": 0.0012,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0003658411733340472,
"step": 1675,
"valid_targets_mean": 4327.9,
"valid_targets_min": 1917
},
{
"epoch": 1.6124800000000001,
"grad_norm": 0.058767126137987784,
"learning_rate": 3.427650946603513e-05,
"loss": 0.0015,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0005258081946521997,
"step": 1680,
"valid_targets_mean": 3368.2,
"valid_targets_min": 1966
},
{
"epoch": 1.61728,
"grad_norm": 0.0449556804757125,
"learning_rate": 3.422950832095511e-05,
"loss": 0.0013,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0003695829655043781,
"step": 1685,
"valid_targets_mean": 4248.2,
"valid_targets_min": 1940
},
{
"epoch": 1.62208,
"grad_norm": 0.039865055155997225,
"learning_rate": 3.418234748916395e-05,
"loss": 0.0012,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00027950757066719234,
"step": 1690,
"valid_targets_mean": 4464.6,
"valid_targets_min": 1838
},
{
"epoch": 1.6268799999999999,
"grad_norm": 0.052016803985212814,
"learning_rate": 3.4135027499911003e-05,
"loss": 0.0013,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0003943184856325388,
"step": 1695,
"valid_targets_mean": 3936.7,
"valid_targets_min": 1829
},
{
"epoch": 1.63168,
"grad_norm": 0.050299889174442704,
"learning_rate": 3.408754888423173e-05,
"loss": 0.0013,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0003132482524961233,
"step": 1700,
"valid_targets_mean": 4339.2,
"valid_targets_min": 1705
},
{
"epoch": 1.6364800000000002,
"grad_norm": 0.047308777354368184,
"learning_rate": 3.403991217494172e-05,
"loss": 0.0011,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0002561693836469203,
"step": 1705,
"valid_targets_mean": 3008.0,
"valid_targets_min": 1836
},
{
"epoch": 1.64128,
"grad_norm": 0.05413378126480606,
"learning_rate": 3.3992117906630744e-05,
"loss": 0.0012,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0004959758371114731,
"step": 1710,
"valid_targets_mean": 4311.6,
"valid_targets_min": 2001
},
{
"epoch": 1.64608,
"grad_norm": 0.04883708091963607,
"learning_rate": 3.394416661565671e-05,
"loss": 0.0012,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0003378509427420795,
"step": 1715,
"valid_targets_mean": 3893.9,
"valid_targets_min": 1517
},
{
"epoch": 1.65088,
"grad_norm": 0.04414000339277738,
"learning_rate": 3.389605884013969e-05,
"loss": 0.0011,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0003347942838445306,
"step": 1720,
"valid_targets_mean": 3723.3,
"valid_targets_min": 1933
},
{
"epoch": 1.65568,
"grad_norm": 0.055219278511505654,
"learning_rate": 3.384779511995587e-05,
"loss": 0.0013,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0002406383428024128,
"step": 1725,
"valid_targets_mean": 3163.8,
"valid_targets_min": 1981
},
{
"epoch": 1.66048,
"grad_norm": 0.05296936286452832,
"learning_rate": 3.379937599673144e-05,
"loss": 0.0013,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00038539827801287174,
"step": 1730,
"valid_targets_mean": 2922.3,
"valid_targets_min": 1525
},
{
"epoch": 1.66528,
"grad_norm": 0.06301281456735988,
"learning_rate": 3.3750802013836596e-05,
"loss": 0.0015,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0006307390285655856,
"step": 1735,
"valid_targets_mean": 3184.9,
"valid_targets_min": 2030
},
{
"epoch": 1.67008,
"grad_norm": 0.040991134654555485,
"learning_rate": 3.370207371637939e-05,
"loss": 0.0011,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00027934444369748235,
"step": 1740,
"valid_targets_mean": 4248.1,
"valid_targets_min": 1917
},
{
"epoch": 1.67488,
"grad_norm": 0.05525964959165724,
"learning_rate": 3.3653191651199635e-05,
"loss": 0.0012,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00043741060653701425,
"step": 1745,
"valid_targets_mean": 3096.0,
"valid_targets_min": 1942
},
{
"epoch": 1.6796799999999998,
"grad_norm": 0.04948169779465362,
"learning_rate": 3.360415636686274e-05,
"loss": 0.0011,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00034553324803709984,
"step": 1750,
"valid_targets_mean": 3762.4,
"valid_targets_min": 1839
},
{
"epoch": 1.68448,
"grad_norm": 0.057814928993456416,
"learning_rate": 3.355496841365359e-05,
"loss": 0.0013,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00034999416675418615,
"step": 1755,
"valid_targets_mean": 3363.3,
"valid_targets_min": 1614
},
{
"epoch": 1.6892800000000001,
"grad_norm": 0.04656009081003181,
"learning_rate": 3.350562834357034e-05,
"loss": 0.0011,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0003240430378355086,
"step": 1760,
"valid_targets_mean": 4379.7,
"valid_targets_min": 1928
},
{
"epoch": 1.69408,
"grad_norm": 0.04634663217611643,
"learning_rate": 3.345613671031827e-05,
"loss": 0.0013,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0003630942082963884,
"step": 1765,
"valid_targets_mean": 2665.6,
"valid_targets_min": 1829
},
{
"epoch": 1.69888,
"grad_norm": 0.05389450610622448,
"learning_rate": 3.340649406930349e-05,
"loss": 0.0011,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00042325188405811787,
"step": 1770,
"valid_targets_mean": 3036.8,
"valid_targets_min": 1908
},
{
"epoch": 1.7036799999999999,
"grad_norm": 0.04054004078806552,
"learning_rate": 3.335670097762677e-05,
"loss": 0.0012,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0003856320690829307,
"step": 1775,
"valid_targets_mean": 4150.5,
"valid_targets_min": 1921
},
{
"epoch": 1.70848,
"grad_norm": 0.04319122595484807,
"learning_rate": 3.330675799407728e-05,
"loss": 0.001,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0002972689107991755,
"step": 1780,
"valid_targets_mean": 4059.9,
"valid_targets_min": 2010
},
{
"epoch": 1.7132800000000001,
"grad_norm": 0.0614953115360606,
"learning_rate": 3.32566656791263e-05,
"loss": 0.0012,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00041061831871047616,
"step": 1785,
"valid_targets_mean": 3852.8,
"valid_targets_min": 1820
},
{
"epoch": 1.71808,
"grad_norm": 0.05093908281170732,
"learning_rate": 3.320642459492095e-05,
"loss": 0.0012,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00046082702465355396,
"step": 1790,
"valid_targets_mean": 4709.6,
"valid_targets_min": 1914
},
{
"epoch": 1.72288,
"grad_norm": 0.0405281692299427,
"learning_rate": 3.315603530527785e-05,
"loss": 0.0011,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0002832312893588096,
"step": 1795,
"valid_targets_mean": 4104.4,
"valid_targets_min": 1829
},
{
"epoch": 1.7276799999999999,
"grad_norm": 0.04855015633898981,
"learning_rate": 3.310549837567685e-05,
"loss": 0.0012,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00033870741026476026,
"step": 1800,
"valid_targets_mean": 2691.3,
"valid_targets_min": 2029
},
{
"epoch": 1.73248,
"grad_norm": 0.047363617105796715,
"learning_rate": 3.3054814373254615e-05,
"loss": 0.001,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0002556862309575081,
"step": 1805,
"valid_targets_mean": 3560.0,
"valid_targets_min": 1974
},
{
"epoch": 1.7372800000000002,
"grad_norm": 0.06870257527043447,
"learning_rate": 3.300398386679831e-05,
"loss": 0.0012,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0005319949705153704,
"step": 1810,
"valid_targets_mean": 3655.3,
"valid_targets_min": 1928
},
{
"epoch": 1.74208,
"grad_norm": 0.04543379139820006,
"learning_rate": 3.2953007426739204e-05,
"loss": 0.0011,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0006080212187953293,
"step": 1815,
"valid_targets_mean": 3771.9,
"valid_targets_min": 1950
},
{
"epoch": 1.74688,
"grad_norm": 0.059110598595154995,
"learning_rate": 3.290188562514624e-05,
"loss": 0.0011,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0004835808358620852,
"step": 1820,
"valid_targets_mean": 3807.7,
"valid_targets_min": 1929
},
{
"epoch": 1.75168,
"grad_norm": 0.053563524383162094,
"learning_rate": 3.285061903571968e-05,
"loss": 0.0011,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00036704057129099965,
"step": 1825,
"valid_targets_mean": 3920.9,
"valid_targets_min": 1525
},
{
"epoch": 1.75648,
"grad_norm": 0.04025291938966945,
"learning_rate": 3.27992082337846e-05,
"loss": 0.0009,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0003524449421092868,
"step": 1830,
"valid_targets_mean": 3674.2,
"valid_targets_min": 1775
},
{
"epoch": 1.76128,
"grad_norm": 0.04632488808634008,
"learning_rate": 3.274765379628447e-05,
"loss": 0.0011,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0003716344363056123,
"step": 1835,
"valid_targets_mean": 4068.3,
"valid_targets_min": 1562
},
{
"epoch": 1.76608,
"grad_norm": 0.04633480317494468,
"learning_rate": 3.2695956301774664e-05,
"loss": 0.001,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0003534138377290219,
"step": 1840,
"valid_targets_mean": 4502.1,
"valid_targets_min": 1820
},
{
"epoch": 1.77088,
"grad_norm": 0.05850594818743109,
"learning_rate": 3.264411633041598e-05,
"loss": 0.0012,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00048642410547472537,
"step": 1845,
"valid_targets_mean": 3579.4,
"valid_targets_min": 1836
},
{
"epoch": 1.77568,
"grad_norm": 0.05387262915143158,
"learning_rate": 3.259213446396812e-05,
"loss": 0.0012,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0004213897336740047,
"step": 1850,
"valid_targets_mean": 4249.3,
"valid_targets_min": 1912
},
{
"epoch": 1.7804799999999998,
"grad_norm": 0.04971774541588144,
"learning_rate": 3.254001128578317e-05,
"loss": 0.001,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0003937389701604843,
"step": 1855,
"valid_targets_mean": 4642.7,
"valid_targets_min": 2057
},
{
"epoch": 1.78528,
"grad_norm": 0.05572299073574149,
"learning_rate": 3.2487747380799036e-05,
"loss": 0.0011,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.000320199120324105,
"step": 1860,
"valid_targets_mean": 3592.1,
"valid_targets_min": 1361
},
{
"epoch": 1.7900800000000001,
"grad_norm": 0.04950662800517279,
"learning_rate": 3.243534333553291e-05,
"loss": 0.0011,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0004355285782366991,
"step": 1865,
"valid_targets_mean": 3426.8,
"valid_targets_min": 2025
},
{
"epoch": 1.79488,
"grad_norm": 0.045827956197243926,
"learning_rate": 3.2382799738074635e-05,
"loss": 0.001,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0002996047551278025,
"step": 1870,
"valid_targets_mean": 4818.6,
"valid_targets_min": 1836
},
{
"epoch": 1.79968,
"grad_norm": 0.043499031883452915,
"learning_rate": 3.2330117178080184e-05,
"loss": 0.0012,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00030622404301539063,
"step": 1875,
"valid_targets_mean": 4497.5,
"valid_targets_min": 1942
},
{
"epoch": 1.8044799999999999,
"grad_norm": 0.04161937474381663,
"learning_rate": 3.227729624676497e-05,
"loss": 0.0011,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0002968889311887324,
"step": 1880,
"valid_targets_mean": 4432.3,
"valid_targets_min": 1740
},
{
"epoch": 1.80928,
"grad_norm": 0.049436031579658306,
"learning_rate": 3.222433753689724e-05,
"loss": 0.0011,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0002810401492752135,
"step": 1885,
"valid_targets_mean": 3545.3,
"valid_targets_min": 2084
},
{
"epoch": 1.8140800000000001,
"grad_norm": 0.03577910696174026,
"learning_rate": 3.2171241642791443e-05,
"loss": 0.0011,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0002864730195142329,
"step": 1890,
"valid_targets_mean": 4110.9,
"valid_targets_min": 1914
},
{
"epoch": 1.81888,
"grad_norm": 0.04253383606701866,
"learning_rate": 3.211800916030152e-05,
"loss": 0.001,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00027189357206225395,
"step": 1895,
"valid_targets_mean": 4199.0,
"valid_targets_min": 1908
},
{
"epoch": 1.82368,
"grad_norm": 0.03981515952280382,
"learning_rate": 3.206464068681424e-05,
"loss": 0.001,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0003700641100294888,
"step": 1900,
"valid_targets_mean": 4726.0,
"valid_targets_min": 1919
},
{
"epoch": 1.8284799999999999,
"grad_norm": 0.04678756520562075,
"learning_rate": 3.20111368212425e-05,
"loss": 0.0011,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0006207724800333381,
"step": 1905,
"valid_targets_mean": 4013.5,
"valid_targets_min": 1839
},
{
"epoch": 1.83328,
"grad_norm": 0.042430851523702566,
"learning_rate": 3.19574981640186e-05,
"loss": 0.0011,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00034162524389103055,
"step": 1910,
"valid_targets_mean": 3786.6,
"valid_targets_min": 1908
},
{
"epoch": 1.8380800000000002,
"grad_norm": 0.05215277248239781,
"learning_rate": 3.1903725317087495e-05,
"loss": 0.0011,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0004819263413082808,
"step": 1915,
"valid_targets_mean": 3923.4,
"valid_targets_min": 1719
},
{
"epoch": 1.84288,
"grad_norm": 0.044629333978700496,
"learning_rate": 3.184981888390003e-05,
"loss": 0.001,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0003267807769589126,
"step": 1920,
"valid_targets_mean": 3651.1,
"valid_targets_min": 2039
},
{
"epoch": 1.84768,
"grad_norm": 0.04480507387362986,
"learning_rate": 3.1795779469406226e-05,
"loss": 0.001,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00035782408667728305,
"step": 1925,
"valid_targets_mean": 3725.5,
"valid_targets_min": 1786
},
{
"epoch": 1.85248,
"grad_norm": 0.041128453478606976,
"learning_rate": 3.174160768004842e-05,
"loss": 0.001,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00022609728330280632,
"step": 1930,
"valid_targets_mean": 5245.9,
"valid_targets_min": 1680
},
{
"epoch": 1.85728,
"grad_norm": 0.05143151866954522,
"learning_rate": 3.168730412375449e-05,
"loss": 0.0011,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00044801694457419217,
"step": 1935,
"valid_targets_mean": 3150.0,
"valid_targets_min": 1680
},
{
"epoch": 1.86208,
"grad_norm": 0.04692971584297232,
"learning_rate": 3.1632869409931036e-05,
"loss": 0.0009,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.000266010407358408,
"step": 1940,
"valid_targets_mean": 3319.3,
"valid_targets_min": 1775
},
{
"epoch": 1.86688,
"grad_norm": 0.03787908414763803,
"learning_rate": 3.1578304149456544e-05,
"loss": 0.0008,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00027268845587968826,
"step": 1945,
"valid_targets_mean": 4960.8,
"valid_targets_min": 1829
},
{
"epoch": 1.87168,
"grad_norm": 0.05436027849322881,
"learning_rate": 3.1523608954674524e-05,
"loss": 0.0011,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00037563478690572083,
"step": 1950,
"valid_targets_mean": 3414.5,
"valid_targets_min": 1958
},
{
"epoch": 1.87648,
"grad_norm": 0.042774282013460875,
"learning_rate": 3.1468784439386614e-05,
"loss": 0.0009,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0003659092471934855,
"step": 1955,
"valid_targets_mean": 3620.4,
"valid_targets_min": 1904
},
{
"epoch": 1.8812799999999998,
"grad_norm": 0.04122380272897595,
"learning_rate": 3.141383121884576e-05,
"loss": 0.0009,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00034778908593580127,
"step": 1960,
"valid_targets_mean": 4347.6,
"valid_targets_min": 2039
},
{
"epoch": 1.88608,
"grad_norm": 0.05330947792411219,
"learning_rate": 3.1358749909749214e-05,
"loss": 0.001,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00034708459861576557,
"step": 1965,
"valid_targets_mean": 4252.3,
"valid_targets_min": 1959
},
{
"epoch": 1.8908800000000001,
"grad_norm": 0.049483338699360224,
"learning_rate": 3.1303541130231703e-05,
"loss": 0.0011,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0004025818780064583,
"step": 1970,
"valid_targets_mean": 4020.6,
"valid_targets_min": 2012
},
{
"epoch": 1.89568,
"grad_norm": 0.049351126866147295,
"learning_rate": 3.1248205499858446e-05,
"loss": 0.0011,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0003342171257827431,
"step": 1975,
"valid_targets_mean": 3042.1,
"valid_targets_min": 1943
},
{
"epoch": 1.90048,
"grad_norm": 0.042954433111331666,
"learning_rate": 3.119274363961821e-05,
"loss": 0.001,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00021361312246881425,
"step": 1980,
"valid_targets_mean": 3799.3,
"valid_targets_min": 1942
},
{
"epoch": 1.9052799999999999,
"grad_norm": 0.03550201618878598,
"learning_rate": 3.113715617191634e-05,
"loss": 0.001,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0002286080562043935,
"step": 1985,
"valid_targets_mean": 4318.5,
"valid_targets_min": 2010
},
{
"epoch": 1.91008,
"grad_norm": 0.0512979708140217,
"learning_rate": 3.1081443720567785e-05,
"loss": 0.001,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00040846579940989614,
"step": 1990,
"valid_targets_mean": 4275.7,
"valid_targets_min": 1870
},
{
"epoch": 1.9148800000000001,
"grad_norm": 0.04322505692818679,
"learning_rate": 3.102560691079007e-05,
"loss": 0.001,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0003856475232169032,
"step": 1995,
"valid_targets_mean": 3959.7,
"valid_targets_min": 1517
},
{
"epoch": 1.91968,
"grad_norm": 0.037866804711089004,
"learning_rate": 3.0969646369196307e-05,
"loss": 0.001,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00020155790844000876,
"step": 2000,
"valid_targets_mean": 3651.0,
"valid_targets_min": 1906
},
{
"epoch": 1.92448,
"grad_norm": 0.03520402744171799,
"learning_rate": 3.0913562723788174e-05,
"loss": 0.0008,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00017841681255958974,
"step": 2005,
"valid_targets_mean": 3097.2,
"valid_targets_min": 1900
},
{
"epoch": 1.9292799999999999,
"grad_norm": 0.04576720772413004,
"learning_rate": 3.085735660394881e-05,
"loss": 0.0009,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0002288795803906396,
"step": 2010,
"valid_targets_mean": 3696.0,
"valid_targets_min": 1987
},
{
"epoch": 1.93408,
"grad_norm": 0.04933298500996939,
"learning_rate": 3.080102864043581e-05,
"loss": 0.001,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0004367926740087569,
"step": 2015,
"valid_targets_mean": 3204.1,
"valid_targets_min": 2026
},
{
"epoch": 1.9388800000000002,
"grad_norm": 0.05260798047248693,
"learning_rate": 3.074457946537413e-05,
"loss": 0.001,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0003071989049203694,
"step": 2020,
"valid_targets_mean": 3134.8,
"valid_targets_min": 1525
},
{
"epoch": 1.94368,
"grad_norm": 0.04380153388399339,
"learning_rate": 3.068800971224898e-05,
"loss": 0.001,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00030949185020290315,
"step": 2025,
"valid_targets_mean": 3797.7,
"valid_targets_min": 1900
},
{
"epoch": 1.94848,
"grad_norm": 0.046800305647988746,
"learning_rate": 3.0631320015898735e-05,
"loss": 0.0009,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0003367983445059508,
"step": 2030,
"valid_targets_mean": 4517.7,
"valid_targets_min": 1940
},
{
"epoch": 1.95328,
"grad_norm": 0.040178378749060155,
"learning_rate": 3.057451101250778e-05,
"loss": 0.001,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0002442404511384666,
"step": 2035,
"valid_targets_mean": 4852.8,
"valid_targets_min": 1740
},
{
"epoch": 1.95808,
"grad_norm": 0.04509788359517867,
"learning_rate": 3.051758333959941e-05,
"loss": 0.0009,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0002550902427174151,
"step": 2040,
"valid_targets_mean": 3564.3,
"valid_targets_min": 1991
},
{
"epoch": 1.96288,
"grad_norm": 0.03594320942598652,
"learning_rate": 3.046053763602865e-05,
"loss": 0.0007,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0004347126523498446,
"step": 2045,
"valid_targets_mean": 4681.1,
"valid_targets_min": 1802
},
{
"epoch": 1.96768,
"grad_norm": 0.04263972629270992,
"learning_rate": 3.0403374541975078e-05,
"loss": 0.0011,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0003159629413858056,
"step": 2050,
"valid_targets_mean": 3935.8,
"valid_targets_min": 1981
},
{
"epoch": 1.97248,
"grad_norm": 0.04122883968158281,
"learning_rate": 3.034609469893567e-05,
"loss": 0.0009,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0003064102493226528,
"step": 2055,
"valid_targets_mean": 3883.6,
"valid_targets_min": 1802
},
{
"epoch": 1.97728,
"grad_norm": 0.04338278061662454,
"learning_rate": 3.028869874971758e-05,
"loss": 0.0009,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0002915991353802383,
"step": 2060,
"valid_targets_mean": 3029.1,
"valid_targets_min": 1847
},
{
"epoch": 1.9820799999999998,
"grad_norm": 0.036355028310916124,
"learning_rate": 3.0231187338430944e-05,
"loss": 0.0008,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00035102188121527433,
"step": 2065,
"valid_targets_mean": 4931.2,
"valid_targets_min": 1939
},
{
"epoch": 1.98688,
"grad_norm": 0.048383914402931466,
"learning_rate": 3.0173561110481606e-05,
"loss": 0.0008,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00023929959570523351,
"step": 2070,
"valid_targets_mean": 5375.9,
"valid_targets_min": 1940
},
{
"epoch": 1.9916800000000001,
"grad_norm": 0.044115711212949424,
"learning_rate": 3.011582071256394e-05,
"loss": 0.0009,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00032735677086748183,
"step": 2075,
"valid_targets_mean": 3306.5,
"valid_targets_min": 1727
},
{
"epoch": 1.99648,
"grad_norm": 0.04118373461485346,
"learning_rate": 3.0057966792653547e-05,
"loss": 0.0008,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00026323198108002543,
"step": 2080,
"valid_targets_mean": 4257.6,
"valid_targets_min": 1829
},
{
"epoch": 2.00096,
"grad_norm": 0.033605720871692286,
"learning_rate": 3.0000000000000004e-05,
"loss": 0.0009,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00023035166668705642,
"step": 2085,
"valid_targets_mean": 3021.3,
"valid_targets_min": 1820
},
{
"epoch": 2.00576,
"grad_norm": 0.03941509733719802,
"learning_rate": 2.9941920985119562e-05,
"loss": 0.0008,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0002633282565511763,
"step": 2090,
"valid_targets_mean": 3287.6,
"valid_targets_min": 1906
},
{
"epoch": 2.01056,
"grad_norm": 0.04225606591711965,
"learning_rate": 2.988373039978786e-05,
"loss": 0.0009,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00025588853168301284,
"step": 2095,
"valid_targets_mean": 2852.6,
"valid_targets_min": 1857
},
{
"epoch": 2.01536,
"grad_norm": 0.03849636401283634,
"learning_rate": 2.98254288970326e-05,
"loss": 0.0008,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0003536568838171661,
"step": 2100,
"valid_targets_mean": 4180.8,
"valid_targets_min": 1802
},
{
"epoch": 2.02016,
"grad_norm": 0.04407578409722852,
"learning_rate": 2.9767017131126245e-05,
"loss": 0.0008,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00014297438610810786,
"step": 2105,
"valid_targets_mean": 3781.4,
"valid_targets_min": 1919
},
{
"epoch": 2.02496,
"grad_norm": 0.045494787360105746,
"learning_rate": 2.9708495757578633e-05,
"loss": 0.0008,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00022338703274726868,
"step": 2110,
"valid_targets_mean": 4300.6,
"valid_targets_min": 1942
},
{
"epoch": 2.02976,
"grad_norm": 0.03789723665227751,
"learning_rate": 2.964986543312964e-05,
"loss": 0.0008,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0002846395072992891,
"step": 2115,
"valid_targets_mean": 4121.6,
"valid_targets_min": 1771
},
{
"epoch": 2.03456,
"grad_norm": 0.04835105817239923,
"learning_rate": 2.9591126815741832e-05,
"loss": 0.0009,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0004806315992027521,
"step": 2120,
"valid_targets_mean": 4034.5,
"valid_targets_min": 1858
},
{
"epoch": 2.03936,
"grad_norm": 0.03915872767648746,
"learning_rate": 2.953228056459305e-05,
"loss": 0.0008,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00025110685965046287,
"step": 2125,
"valid_targets_mean": 4672.4,
"valid_targets_min": 1863
},
{
"epoch": 2.04416,
"grad_norm": 0.04912331091299425,
"learning_rate": 2.947332734006903e-05,
"loss": 0.001,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0004711863584816456,
"step": 2130,
"valid_targets_mean": 3152.0,
"valid_targets_min": 1652
},
{
"epoch": 2.04896,
"grad_norm": 0.03562616275436536,
"learning_rate": 2.9414267803755988e-05,
"loss": 0.001,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0003120258334092796,
"step": 2135,
"valid_targets_mean": 4770.2,
"valid_targets_min": 1680
},
{
"epoch": 2.05376,
"grad_norm": 0.03446236345598084,
"learning_rate": 2.9355102618433197e-05,
"loss": 0.0008,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00023818084446247667,
"step": 2140,
"valid_targets_mean": 3193.0,
"valid_targets_min": 1906
},
{
"epoch": 2.05856,
"grad_norm": 0.03753730116508484,
"learning_rate": 2.929583244806553e-05,
"loss": 0.0008,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0002192890678998083,
"step": 2145,
"valid_targets_mean": 4480.2,
"valid_targets_min": 1960
},
{
"epoch": 2.06336,
"grad_norm": 0.049491292395218045,
"learning_rate": 2.9236457957796047e-05,
"loss": 0.0007,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0003270478919148445,
"step": 2150,
"valid_targets_mean": 3365.0,
"valid_targets_min": 1877
},
{
"epoch": 2.0681599999999998,
"grad_norm": 0.04715131351475584,
"learning_rate": 2.9176979813938494e-05,
"loss": 0.0009,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0003005887265317142,
"step": 2155,
"valid_targets_mean": 3592.0,
"valid_targets_min": 1562
},
{
"epoch": 2.07296,
"grad_norm": 0.045132727411257935,
"learning_rate": 2.9117398683969857e-05,
"loss": 0.0009,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0002569695352576673,
"step": 2160,
"valid_targets_mean": 4224.3,
"valid_targets_min": 1928
},
{
"epoch": 2.07776,
"grad_norm": 0.045645196767944124,
"learning_rate": 2.9057715236522833e-05,
"loss": 0.0009,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0002819838700816035,
"step": 2165,
"valid_targets_mean": 3357.2,
"valid_targets_min": 1786
},
{
"epoch": 2.08256,
"grad_norm": 0.047911519242527144,
"learning_rate": 2.899793014137836e-05,
"loss": 0.0009,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00036411883775144815,
"step": 2170,
"valid_targets_mean": 3320.3,
"valid_targets_min": 1909
},
{
"epoch": 2.08736,
"grad_norm": 0.05180769284537206,
"learning_rate": 2.8938044069458094e-05,
"loss": 0.0009,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00034832872916013,
"step": 2175,
"valid_targets_mean": 3780.2,
"valid_targets_min": 1958
},
{
"epoch": 2.09216,
"grad_norm": 0.046025193146755725,
"learning_rate": 2.8878057692816877e-05,
"loss": 0.0009,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0005058305687271059,
"step": 2180,
"valid_targets_mean": 3388.2,
"valid_targets_min": 1907
},
{
"epoch": 2.09696,
"grad_norm": 0.03775721962047528,
"learning_rate": 2.8817971684635178e-05,
"loss": 0.0008,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0001705609611235559,
"step": 2185,
"valid_targets_mean": 3603.0,
"valid_targets_min": 1863
},
{
"epoch": 2.10176,
"grad_norm": 0.04585119871874699,
"learning_rate": 2.8757786719211555e-05,
"loss": 0.0007,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00020783724903594702,
"step": 2190,
"valid_targets_mean": 3269.0,
"valid_targets_min": 1908
},
{
"epoch": 2.10656,
"grad_norm": 0.03891090599039738,
"learning_rate": 2.8697503471955106e-05,
"loss": 0.0008,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0001934785395860672,
"step": 2195,
"valid_targets_mean": 4751.0,
"valid_targets_min": 1614
},
{
"epoch": 2.11136,
"grad_norm": 0.038984861137829015,
"learning_rate": 2.8637122619377848e-05,
"loss": 0.0008,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.000268601841526106,
"step": 2200,
"valid_targets_mean": 3949.3,
"valid_targets_min": 1992
},
{
"epoch": 2.11616,
"grad_norm": 0.04030795470548875,
"learning_rate": 2.8576644839087152e-05,
"loss": 0.0007,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00018950544472318143,
"step": 2205,
"valid_targets_mean": 3396.4,
"valid_targets_min": 1921
},
{
"epoch": 2.12096,
"grad_norm": 0.04272732693807203,
"learning_rate": 2.8516070809778145e-05,
"loss": 0.0008,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0001538700598757714,
"step": 2210,
"valid_targets_mean": 3320.9,
"valid_targets_min": 1740
},
{
"epoch": 2.12576,
"grad_norm": 0.03964188235224993,
"learning_rate": 2.845540121122607e-05,
"loss": 0.0008,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0002259221364511177,
"step": 2215,
"valid_targets_mean": 4208.6,
"valid_targets_min": 1887
},
{
"epoch": 2.13056,
"grad_norm": 0.04272357544341015,
"learning_rate": 2.839463672427867e-05,
"loss": 0.0009,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00033014221116900444,
"step": 2220,
"valid_targets_mean": 4028.6,
"valid_targets_min": 1904
},
{
"epoch": 2.13536,
"grad_norm": 0.02931611152693843,
"learning_rate": 2.833377803084855e-05,
"loss": 0.0008,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00011045490828109905,
"step": 2225,
"valid_targets_mean": 3965.6,
"valid_targets_min": 1863
},
{
"epoch": 2.14016,
"grad_norm": 0.03415035693128969,
"learning_rate": 2.8272825813905522e-05,
"loss": 0.0007,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0001376604486722499,
"step": 2230,
"valid_targets_mean": 3235.6,
"valid_targets_min": 1857
},
{
"epoch": 2.14496,
"grad_norm": 0.03382136920768197,
"learning_rate": 2.8211780757468942e-05,
"loss": 0.0007,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00015516190615016967,
"step": 2235,
"valid_targets_mean": 3887.8,
"valid_targets_min": 1919
},
{
"epoch": 2.14976,
"grad_norm": 0.044993094399656555,
"learning_rate": 2.8150643546600012e-05,
"loss": 0.0007,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0003087717341259122,
"step": 2240,
"valid_targets_mean": 3293.2,
"valid_targets_min": 1928
},
{
"epoch": 2.15456,
"grad_norm": 0.03908152875549286,
"learning_rate": 2.808941486739414e-05,
"loss": 0.0008,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0002885219582822174,
"step": 2245,
"valid_targets_mean": 4638.7,
"valid_targets_min": 1900
},
{
"epoch": 2.15936,
"grad_norm": 0.030928059487089134,
"learning_rate": 2.80280954069732e-05,
"loss": 0.0008,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00023226509802043438,
"step": 2250,
"valid_targets_mean": 3890.1,
"valid_targets_min": 1951
},
{
"epoch": 2.16416,
"grad_norm": 0.03729014178961917,
"learning_rate": 2.7966685853477828e-05,
"loss": 0.0007,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0003418756532482803,
"step": 2255,
"valid_targets_mean": 3247.4,
"valid_targets_min": 2231
},
{
"epoch": 2.16896,
"grad_norm": 0.0323102484575263,
"learning_rate": 2.790518689605971e-05,
"loss": 0.0008,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00019071548013016582,
"step": 2260,
"valid_targets_mean": 3516.8,
"valid_targets_min": 1889
},
{
"epoch": 2.17376,
"grad_norm": 0.04856897361198709,
"learning_rate": 2.7843599224873833e-05,
"loss": 0.0007,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00017041576211340725,
"step": 2265,
"valid_targets_mean": 4206.8,
"valid_targets_min": 1924
},
{
"epoch": 2.17856,
"grad_norm": 0.03576939276419744,
"learning_rate": 2.7781923531070775e-05,
"loss": 0.0008,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00038324674824252725,
"step": 2270,
"valid_targets_mean": 2961.4,
"valid_targets_min": 1680
},
{
"epoch": 2.18336,
"grad_norm": 0.030493288750038344,
"learning_rate": 2.7720160506788896e-05,
"loss": 0.0007,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0001243678416358307,
"step": 2275,
"valid_targets_mean": 3825.0,
"valid_targets_min": 1870
},
{
"epoch": 2.18816,
"grad_norm": 0.0400949924638015,
"learning_rate": 2.7658310845146598e-05,
"loss": 0.0007,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00018578841991256922,
"step": 2280,
"valid_targets_mean": 4495.0,
"valid_targets_min": 2009
},
{
"epoch": 2.19296,
"grad_norm": 0.037333026714177465,
"learning_rate": 2.7596375240234574e-05,
"loss": 0.0007,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00020659196889027953,
"step": 2285,
"valid_targets_mean": 3360.5,
"valid_targets_min": 1719
},
{
"epoch": 2.19776,
"grad_norm": 0.045283233017465424,
"learning_rate": 2.7534354387107975e-05,
"loss": 0.0007,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00029020351939834654,
"step": 2290,
"valid_targets_mean": 4335.8,
"valid_targets_min": 1525
},
{
"epoch": 2.20256,
"grad_norm": 0.0321961691598059,
"learning_rate": 2.747224898177862e-05,
"loss": 0.0008,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0001831486588343978,
"step": 2295,
"valid_targets_mean": 5505.2,
"valid_targets_min": 2074
},
{
"epoch": 2.20736,
"grad_norm": 0.04479222868751039,
"learning_rate": 2.7410059721207187e-05,
"loss": 0.0007,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00031453612609766424,
"step": 2300,
"valid_targets_mean": 3296.8,
"valid_targets_min": 2041
},
{
"epoch": 2.21216,
"grad_norm": 0.03396162372941247,
"learning_rate": 2.734778730329543e-05,
"loss": 0.0007,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00024497491540387273,
"step": 2305,
"valid_targets_mean": 3662.8,
"valid_targets_min": 1891
},
{
"epoch": 2.21696,
"grad_norm": 0.039392580173791665,
"learning_rate": 2.7285432426878275e-05,
"loss": 0.0006,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0002551403595134616,
"step": 2310,
"valid_targets_mean": 4311.8,
"valid_targets_min": 2032
},
{
"epoch": 2.22176,
"grad_norm": 0.03754119255041813,
"learning_rate": 2.7222995791716034e-05,
"loss": 0.0007,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00019644678104668856,
"step": 2315,
"valid_targets_mean": 3148.0,
"valid_targets_min": 1763
},
{
"epoch": 2.22656,
"grad_norm": 0.030334413668914074,
"learning_rate": 2.716047809848653e-05,
"loss": 0.0006,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00018585645011626184,
"step": 2320,
"valid_targets_mean": 3651.1,
"valid_targets_min": 1938
},
{
"epoch": 2.23136,
"grad_norm": 0.04045784912723658,
"learning_rate": 2.7097880048777238e-05,
"loss": 0.0007,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0001915416942210868,
"step": 2325,
"valid_targets_mean": 3014.8,
"valid_targets_min": 1863
},
{
"epoch": 2.23616,
"grad_norm": 0.04333177506122303,
"learning_rate": 2.703520234507742e-05,
"loss": 0.0007,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00045665091602131724,
"step": 2330,
"valid_targets_mean": 4318.9,
"valid_targets_min": 2056
},
{
"epoch": 2.24096,
"grad_norm": 0.03739441324826848,
"learning_rate": 2.697244569077021e-05,
"loss": 0.0006,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00020790009875781834,
"step": 2335,
"valid_targets_mean": 3993.2,
"valid_targets_min": 1991
},
{
"epoch": 2.24576,
"grad_norm": 0.035305305784520465,
"learning_rate": 2.6909610790124772e-05,
"loss": 0.0008,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0003060979361180216,
"step": 2340,
"valid_targets_mean": 4405.0,
"valid_targets_min": 1939
},
{
"epoch": 2.25056,
"grad_norm": 0.02959348243450873,
"learning_rate": 2.684669834828835e-05,
"loss": 0.0007,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0002234200801467523,
"step": 2345,
"valid_targets_mean": 4487.1,
"valid_targets_min": 1680
},
{
"epoch": 2.25536,
"grad_norm": 0.04631364254708182,
"learning_rate": 2.6783709071278372e-05,
"loss": 0.0008,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0003990861587226391,
"step": 2350,
"valid_targets_mean": 3409.9,
"valid_targets_min": 2011
},
{
"epoch": 2.26016,
"grad_norm": 0.036652540579393704,
"learning_rate": 2.6720643665974522e-05,
"loss": 0.0007,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00017286359798163176,
"step": 2355,
"valid_targets_mean": 4595.0,
"valid_targets_min": 2171
},
{
"epoch": 2.26496,
"grad_norm": 0.031267941336866396,
"learning_rate": 2.665750284011085e-05,
"loss": 0.0007,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00016654253704473376,
"step": 2360,
"valid_targets_mean": 4046.1,
"valid_targets_min": 1920
},
{
"epoch": 2.2697599999999998,
"grad_norm": 0.036409463244741175,
"learning_rate": 2.6594287302267744e-05,
"loss": 0.0007,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00025828357320278883,
"step": 2365,
"valid_targets_mean": 5251.3,
"valid_targets_min": 1705
},
{
"epoch": 2.27456,
"grad_norm": 0.03756310563624762,
"learning_rate": 2.653099776186405e-05,
"loss": 0.0007,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0001461548963561654,
"step": 2370,
"valid_targets_mean": 3591.6,
"valid_targets_min": 1662
},
{
"epoch": 2.27936,
"grad_norm": 0.03467708796327428,
"learning_rate": 2.646763492914908e-05,
"loss": 0.0008,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00026901293313130736,
"step": 2375,
"valid_targets_mean": 3220.3,
"valid_targets_min": 1863
},
{
"epoch": 2.28416,
"grad_norm": 0.029874949666269978,
"learning_rate": 2.640419951519467e-05,
"loss": 0.0006,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0002025901630986482,
"step": 2380,
"valid_targets_mean": 3226.0,
"valid_targets_min": 1998
},
{
"epoch": 2.28896,
"grad_norm": 0.03381433751089229,
"learning_rate": 2.634069223188715e-05,
"loss": 0.0006,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00021201377967372537,
"step": 2385,
"valid_targets_mean": 4461.9,
"valid_targets_min": 1917
},
{
"epoch": 2.29376,
"grad_norm": 0.037794410016097665,
"learning_rate": 2.627711379191939e-05,
"loss": 0.0007,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00022039566829334944,
"step": 2390,
"valid_targets_mean": 4068.2,
"valid_targets_min": 1760
},
{
"epoch": 2.29856,
"grad_norm": 0.03876776181109457,
"learning_rate": 2.621346490878281e-05,
"loss": 0.0007,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0002503449213691056,
"step": 2395,
"valid_targets_mean": 3787.4,
"valid_targets_min": 1884
},
{
"epoch": 2.30336,
"grad_norm": 0.04425219517126325,
"learning_rate": 2.614974629675935e-05,
"loss": 0.0007,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0002225804200861603,
"step": 2400,
"valid_targets_mean": 3016.7,
"valid_targets_min": 1877
},
{
"epoch": 2.30816,
"grad_norm": 0.0332418527626137,
"learning_rate": 2.608595867091346e-05,
"loss": 0.0007,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0001066123804775998,
"step": 2405,
"valid_targets_mean": 3969.6,
"valid_targets_min": 1839
},
{
"epoch": 2.31296,
"grad_norm": 0.03275117269790793,
"learning_rate": 2.6022102747084084e-05,
"loss": 0.0006,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00014958773681428283,
"step": 2410,
"valid_targets_mean": 3277.8,
"valid_targets_min": 1868
},
{
"epoch": 2.31776,
"grad_norm": 0.03663969443965277,
"learning_rate": 2.595817924187663e-05,
"loss": 0.0007,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00023177076946012676,
"step": 2415,
"valid_targets_mean": 4114.9,
"valid_targets_min": 1727
},
{
"epoch": 2.32256,
"grad_norm": 0.03151762456815796,
"learning_rate": 2.589418887265489e-05,
"loss": 0.0006,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0002696237061172724,
"step": 2420,
"valid_targets_mean": 4500.8,
"valid_targets_min": 1942
},
{
"epoch": 2.32736,
"grad_norm": 0.032831572609185296,
"learning_rate": 2.5830132357533044e-05,
"loss": 0.0006,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0001549628796055913,
"step": 2425,
"valid_targets_mean": 4774.0,
"valid_targets_min": 1925
},
{
"epoch": 2.33216,
"grad_norm": 0.04240344680707184,
"learning_rate": 2.5766010415367567e-05,
"loss": 0.0007,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00020264976774342358,
"step": 2430,
"valid_targets_mean": 3075.3,
"valid_targets_min": 1908
},
{
"epoch": 2.33696,
"grad_norm": 0.041500799096206215,
"learning_rate": 2.5701823765749187e-05,
"loss": 0.0008,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00030124446493573487,
"step": 2435,
"valid_targets_mean": 3322.5,
"valid_targets_min": 1614
},
{
"epoch": 2.34176,
"grad_norm": 0.024132575735248074,
"learning_rate": 2.563757312899477e-05,
"loss": 0.0006,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0001617611851543188,
"step": 2440,
"valid_targets_mean": 4256.2,
"valid_targets_min": 1908
},
{
"epoch": 2.34656,
"grad_norm": 0.03622168996073483,
"learning_rate": 2.557325922613926e-05,
"loss": 0.0006,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00010978215868817642,
"step": 2445,
"valid_targets_mean": 4010.4,
"valid_targets_min": 1751
},
{
"epoch": 2.35136,
"grad_norm": 0.035687387011170656,
"learning_rate": 2.5508882778927615e-05,
"loss": 0.0007,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00020305518410168588,
"step": 2450,
"valid_targets_mean": 5104.2,
"valid_targets_min": 2008
},
{
"epoch": 2.35616,
"grad_norm": 0.03498720529081233,
"learning_rate": 2.5444444509806654e-05,
"loss": 0.0006,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0002204036427428946,
"step": 2455,
"valid_targets_mean": 3017.6,
"valid_targets_min": 1868
},
{
"epoch": 2.36096,
"grad_norm": 0.033412627570212454,
"learning_rate": 2.5379945141916976e-05,
"loss": 0.0007,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00022408628137782216,
"step": 2460,
"valid_targets_mean": 3959.5,
"valid_targets_min": 1662
},
{
"epoch": 2.36576,
"grad_norm": 0.03359882263771964,
"learning_rate": 2.531538539908486e-05,
"loss": 0.0005,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0001831240369938314,
"step": 2465,
"valid_targets_mean": 3663.9,
"valid_targets_min": 1889
},
{
"epoch": 2.3705600000000002,
"grad_norm": 0.03526372615108675,
"learning_rate": 2.5250766005814108e-05,
"loss": 0.0006,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0002579090651124716,
"step": 2470,
"valid_targets_mean": 3923.1,
"valid_targets_min": 1970
},
{
"epoch": 2.37536,
"grad_norm": 0.033811299894664026,
"learning_rate": 2.5186087687277956e-05,
"loss": 0.0007,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00016862923803273588,
"step": 2475,
"valid_targets_mean": 3491.5,
"valid_targets_min": 1763
},
{
"epoch": 2.38016,
"grad_norm": 0.035525310974040464,
"learning_rate": 2.5121351169310887e-05,
"loss": 0.0007,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00029478981741704047,
"step": 2480,
"valid_targets_mean": 3264.8,
"valid_targets_min": 1917
},
{
"epoch": 2.38496,
"grad_norm": 0.027684694690569174,
"learning_rate": 2.505655717840052e-05,
"loss": 0.0006,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00021103810286149383,
"step": 2485,
"valid_targets_mean": 5089.8,
"valid_targets_min": 1820
},
{
"epoch": 2.38976,
"grad_norm": 0.03143907720270563,
"learning_rate": 2.499170644167946e-05,
"loss": 0.0005,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0002478085516486317,
"step": 2490,
"valid_targets_mean": 2749.9,
"valid_targets_min": 1918
},
{
"epoch": 2.3945600000000002,
"grad_norm": 0.027614380837816813,
"learning_rate": 2.49267996869171e-05,
"loss": 0.0006,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00014130433555692434,
"step": 2495,
"valid_targets_mean": 4555.9,
"valid_targets_min": 2073
},
{
"epoch": 2.39936,
"grad_norm": 0.03903812401787511,
"learning_rate": 2.486183764251151e-05,
"loss": 0.0006,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00024015213421080261,
"step": 2500,
"valid_targets_mean": 3791.2,
"valid_targets_min": 1948
},
{
"epoch": 2.40416,
"grad_norm": 0.028971229010347883,
"learning_rate": 2.4796821037481215e-05,
"loss": 0.0006,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00014903757255524397,
"step": 2505,
"valid_targets_mean": 3217.3,
"valid_targets_min": 1914
},
{
"epoch": 2.40896,
"grad_norm": 0.035086625043318054,
"learning_rate": 2.473175060145703e-05,
"loss": 0.0006,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0001503221137681976,
"step": 2510,
"valid_targets_mean": 3694.5,
"valid_targets_min": 1951
},
{
"epoch": 2.41376,
"grad_norm": 0.03784890895425839,
"learning_rate": 2.4666627064673892e-05,
"loss": 0.0007,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0002561969740781933,
"step": 2515,
"valid_targets_mean": 2764.7,
"valid_targets_min": 1930
},
{
"epoch": 2.41856,
"grad_norm": 0.03502209953746837,
"learning_rate": 2.4601451157962616e-05,
"loss": 0.0005,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00014939287211745977,
"step": 2520,
"valid_targets_mean": 3019.3,
"valid_targets_min": 1763
},
{
"epoch": 2.42336,
"grad_norm": 0.038579498889326165,
"learning_rate": 2.4536223612741754e-05,
"loss": 0.0007,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00029830800485797226,
"step": 2525,
"valid_targets_mean": 4642.4,
"valid_targets_min": 1361
},
{
"epoch": 2.42816,
"grad_norm": 0.02719304613035395,
"learning_rate": 2.447094516100934e-05,
"loss": 0.0006,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0001690950448391959,
"step": 2530,
"valid_targets_mean": 4152.7,
"valid_targets_min": 1727
},
{
"epoch": 2.43296,
"grad_norm": 0.03258199868600974,
"learning_rate": 2.4405616535334695e-05,
"loss": 0.0006,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00020575785310938954,
"step": 2535,
"valid_targets_mean": 4316.7,
"valid_targets_min": 1918
},
{
"epoch": 2.43776,
"grad_norm": 0.03801298563758932,
"learning_rate": 2.43402384688502e-05,
"loss": 0.0007,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.000360257166903466,
"step": 2540,
"valid_targets_mean": 3739.1,
"valid_targets_min": 1998
},
{
"epoch": 2.44256,
"grad_norm": 0.03621817881967739,
"learning_rate": 2.4274811695243085e-05,
"loss": 0.0006,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00023448243155144155,
"step": 2545,
"valid_targets_mean": 3347.4,
"valid_targets_min": 2119
},
{
"epoch": 2.4473599999999998,
"grad_norm": 0.02805407299186264,
"learning_rate": 2.4209336948747168e-05,
"loss": 0.0005,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00025352189550176263,
"step": 2550,
"valid_targets_mean": 3837.3,
"valid_targets_min": 1517
},
{
"epoch": 2.45216,
"grad_norm": 0.03732310069016806,
"learning_rate": 2.414381496413464e-05,
"loss": 0.0005,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00024747985298745334,
"step": 2555,
"valid_targets_mean": 4331.4,
"valid_targets_min": 2008
},
{
"epoch": 2.45696,
"grad_norm": 0.03456714787592951,
"learning_rate": 2.4078246476707793e-05,
"loss": 0.0004,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.000141127486131154,
"step": 2560,
"valid_targets_mean": 3667.2,
"valid_targets_min": 1525
},
{
"epoch": 2.46176,
"grad_norm": 0.035425591366662346,
"learning_rate": 2.4012632222290802e-05,
"loss": 0.0007,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00029167812317609787,
"step": 2565,
"valid_targets_mean": 4083.5,
"valid_targets_min": 1868
},
{
"epoch": 2.46656,
"grad_norm": 0.02874013643641384,
"learning_rate": 2.3946972937221444e-05,
"loss": 0.0005,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0001653900253586471,
"step": 2570,
"valid_targets_mean": 4142.4,
"valid_targets_min": 1760
},
{
"epoch": 2.47136,
"grad_norm": 0.02862784285161512,
"learning_rate": 2.3881269358342828e-05,
"loss": 0.0006,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00020821639918722212,
"step": 2575,
"valid_targets_mean": 4223.2,
"valid_targets_min": 1361
},
{
"epoch": 2.47616,
"grad_norm": 0.029604293591339006,
"learning_rate": 2.3815522222995158e-05,
"loss": 0.0006,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0001307126512983814,
"step": 2580,
"valid_targets_mean": 3124.3,
"valid_targets_min": 1958
},
{
"epoch": 2.48096,
"grad_norm": 0.033893385830383684,
"learning_rate": 2.3749732269007427e-05,
"loss": 0.0005,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00016485755622852594,
"step": 2585,
"valid_targets_mean": 4209.0,
"valid_targets_min": 1775
},
{
"epoch": 2.48576,
"grad_norm": 0.03419392450169646,
"learning_rate": 2.3683900234689142e-05,
"loss": 0.0006,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0002415791677776724,
"step": 2590,
"valid_targets_mean": 4240.3,
"valid_targets_min": 1906
},
{
"epoch": 2.49056,
"grad_norm": 0.029006117232870755,
"learning_rate": 2.3618026858822054e-05,
"loss": 0.0005,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00023742017219774425,
"step": 2595,
"valid_targets_mean": 3191.8,
"valid_targets_min": 1858
},
{
"epoch": 2.49536,
"grad_norm": 0.04012111729972718,
"learning_rate": 2.355211288065187e-05,
"loss": 0.0005,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00015978682495187968,
"step": 2600,
"valid_targets_mean": 3348.3,
"valid_targets_min": 2004
},
{
"epoch": 2.50016,
"grad_norm": 0.04056449581614587,
"learning_rate": 2.348615903987991e-05,
"loss": 0.0006,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00022866785002406687,
"step": 2605,
"valid_targets_mean": 3626.4,
"valid_targets_min": 1995
},
{
"epoch": 2.50496,
"grad_norm": 0.030585259676019654,
"learning_rate": 2.3420166076654873e-05,
"loss": 0.0005,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00021799776004627347,
"step": 2610,
"valid_targets_mean": 3237.5,
"valid_targets_min": 1763
},
{
"epoch": 2.50976,
"grad_norm": 0.023930444972562206,
"learning_rate": 2.335413473156449e-05,
"loss": 0.0006,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00022054321016184986,
"step": 2615,
"valid_targets_mean": 3443.3,
"valid_targets_min": 1884
},
{
"epoch": 2.51456,
"grad_norm": 0.024457278834734187,
"learning_rate": 2.328806574562722e-05,
"loss": 0.0005,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00011868066212628037,
"step": 2620,
"valid_targets_mean": 4358.3,
"valid_targets_min": 1786
},
{
"epoch": 2.51936,
"grad_norm": 0.031028426914594242,
"learning_rate": 2.322195986028393e-05,
"loss": 0.0006,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00027652987046167254,
"step": 2625,
"valid_targets_mean": 4464.6,
"valid_targets_min": 1601
},
{
"epoch": 2.52416,
"grad_norm": 0.030577977296404303,
"learning_rate": 2.315581781738959e-05,
"loss": 0.0006,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0001450799172744155,
"step": 2630,
"valid_targets_mean": 4065.1,
"valid_targets_min": 1764
},
{
"epoch": 2.52896,
"grad_norm": 0.028055994141291358,
"learning_rate": 2.3089640359204937e-05,
"loss": 0.0004,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00018580812320578843,
"step": 2635,
"valid_targets_mean": 3585.7,
"valid_targets_min": 1727
},
{
"epoch": 2.53376,
"grad_norm": 0.020316911634189153,
"learning_rate": 2.3023428228388144e-05,
"loss": 0.0005,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00015279500803444535,
"step": 2640,
"valid_targets_mean": 4268.4,
"valid_targets_min": 1361
},
{
"epoch": 2.53856,
"grad_norm": 0.029192677167564848,
"learning_rate": 2.2957182167986486e-05,
"loss": 0.0005,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00016782352759037167,
"step": 2645,
"valid_targets_mean": 3354.9,
"valid_targets_min": 1652
},
{
"epoch": 2.54336,
"grad_norm": 0.02674573810278128,
"learning_rate": 2.2890902921428004e-05,
"loss": 0.0004,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00011722477211151272,
"step": 2650,
"valid_targets_mean": 3411.8,
"valid_targets_min": 1799
},
{
"epoch": 2.54816,
"grad_norm": 0.03491667544098721,
"learning_rate": 2.2824591232513153e-05,
"loss": 0.0005,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00017565107555128634,
"step": 2655,
"valid_targets_mean": 3712.1,
"valid_targets_min": 1887
},
{
"epoch": 2.55296,
"grad_norm": 0.033105604731353114,
"learning_rate": 2.2758247845406495e-05,
"loss": 0.0005,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00023516351939179003,
"step": 2660,
"valid_targets_mean": 3988.2,
"valid_targets_min": 1931
},
{
"epoch": 2.55776,
"grad_norm": 0.024677789248399855,
"learning_rate": 2.2691873504628282e-05,
"loss": 0.0005,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00013441765622701496,
"step": 2665,
"valid_targets_mean": 3287.0,
"valid_targets_min": 1716
},
{
"epoch": 2.56256,
"grad_norm": 0.03347135910296354,
"learning_rate": 2.2625468955046143e-05,
"loss": 0.0005,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00016958295600488782,
"step": 2670,
"valid_targets_mean": 3179.7,
"valid_targets_min": 1908
},
{
"epoch": 2.56736,
"grad_norm": 0.025305271492915622,
"learning_rate": 2.2559034941866727e-05,
"loss": 0.0005,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00017021692474372685,
"step": 2675,
"valid_targets_mean": 3838.3,
"valid_targets_min": 1992
},
{
"epoch": 2.5721600000000002,
"grad_norm": 0.03054664142249039,
"learning_rate": 2.2492572210627325e-05,
"loss": 0.0006,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0002199383161496371,
"step": 2680,
"valid_targets_mean": 3718.6,
"valid_targets_min": 1771
},
{
"epoch": 2.57696,
"grad_norm": 0.0295739820670092,
"learning_rate": 2.24260815071875e-05,
"loss": 0.0005,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0002091970236506313,
"step": 2685,
"valid_targets_mean": 4135.2,
"valid_targets_min": 2033
},
{
"epoch": 2.58176,
"grad_norm": 0.027407367741136335,
"learning_rate": 2.2359563577720743e-05,
"loss": 0.0005,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00015643186634406447,
"step": 2690,
"valid_targets_mean": 3748.6,
"valid_targets_min": 1863
},
{
"epoch": 2.58656,
"grad_norm": 0.023931228842467126,
"learning_rate": 2.229301916870606e-05,
"loss": 0.0004,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0001017052709357813,
"step": 2695,
"valid_targets_mean": 4408.4,
"valid_targets_min": 1858
},
{
"epoch": 2.59136,
"grad_norm": 0.016879904184060966,
"learning_rate": 2.2226449026919637e-05,
"loss": 0.0004,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00014124697190709412,
"step": 2700,
"valid_targets_mean": 4628.8,
"valid_targets_min": 1993
},
{
"epoch": 2.5961600000000002,
"grad_norm": 0.03350887881820371,
"learning_rate": 2.2159853899426427e-05,
"loss": 0.0005,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00019711660570465028,
"step": 2705,
"valid_targets_mean": 3775.4,
"valid_targets_min": 1924
},
{
"epoch": 2.60096,
"grad_norm": 0.024997563571365917,
"learning_rate": 2.209323453357178e-05,
"loss": 0.0005,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0001128168951254338,
"step": 2710,
"valid_targets_mean": 2900.3,
"valid_targets_min": 1912
},
{
"epoch": 2.60576,
"grad_norm": 0.02473483219663956,
"learning_rate": 2.202659167697306e-05,
"loss": 0.0005,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00014166333130560815,
"step": 2715,
"valid_targets_mean": 5047.2,
"valid_targets_min": 1858
},
{
"epoch": 2.61056,
"grad_norm": 0.02695375949945734,
"learning_rate": 2.1959926077511234e-05,
"loss": 0.0005,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00015097047435119748,
"step": 2720,
"valid_targets_mean": 4527.6,
"valid_targets_min": 1925
},
{
"epoch": 2.61536,
"grad_norm": 0.029313431173201666,
"learning_rate": 2.1893238483322512e-05,
"loss": 0.0004,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00027219983167015016,
"step": 2725,
"valid_targets_mean": 3846.9,
"valid_targets_min": 1764
},
{
"epoch": 2.6201600000000003,
"grad_norm": 0.0246117813376776,
"learning_rate": 2.1826529642789923e-05,
"loss": 0.0005,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00011438388901297003,
"step": 2730,
"valid_targets_mean": 4127.7,
"valid_targets_min": 1983
},
{
"epoch": 2.6249599999999997,
"grad_norm": 0.03166261718253728,
"learning_rate": 2.1759800304534936e-05,
"loss": 0.0005,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00030604726634919643,
"step": 2735,
"valid_targets_mean": 3822.6,
"valid_targets_min": 1917
},
{
"epoch": 2.62976,
"grad_norm": 0.02399486169062025,
"learning_rate": 2.1693051217409048e-05,
"loss": 0.0005,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00017993926303461194,
"step": 2740,
"valid_targets_mean": 2943.0,
"valid_targets_min": 2022
},
{
"epoch": 2.63456,
"grad_norm": 0.022031983161228993,
"learning_rate": 2.1626283130485365e-05,
"loss": 0.0004,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00015471190272364765,
"step": 2745,
"valid_targets_mean": 4091.2,
"valid_targets_min": 1839
},
{
"epoch": 2.63936,
"grad_norm": 0.029777655573390297,
"learning_rate": 2.1559496793050235e-05,
"loss": 0.0004,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00022734438243787736,
"step": 2750,
"valid_targets_mean": 3356.0,
"valid_targets_min": 1977
},
{
"epoch": 2.64416,
"grad_norm": 0.032339263263978055,
"learning_rate": 2.1492692954594815e-05,
"loss": 0.0005,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00016537672490812838,
"step": 2755,
"valid_targets_mean": 3285.5,
"valid_targets_min": 1525
},
{
"epoch": 2.6489599999999998,
"grad_norm": 0.02041903769719548,
"learning_rate": 2.1425872364806642e-05,
"loss": 0.0004,
"loss_nan_ranks": 0,
"loss_rank_avg": 7.491001451853663e-05,
"step": 2760,
"valid_targets_mean": 3870.9,
"valid_targets_min": 1928
},
{
"epoch": 2.65376,
"grad_norm": 0.02724645730303635,
"learning_rate": 2.1359035773561275e-05,
"loss": 0.0005,
"loss_nan_ranks": 0,
"loss_rank_avg": 8.727981185074896e-05,
"step": 2765,
"valid_targets_mean": 3569.4,
"valid_targets_min": 1662
},
{
"epoch": 2.65856,
"grad_norm": 0.027173048710820033,
"learning_rate": 2.1292183930913803e-05,
"loss": 0.0005,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0002180126029998064,
"step": 2770,
"valid_targets_mean": 3932.3,
"valid_targets_min": 1986
},
{
"epoch": 2.66336,
"grad_norm": 0.037202649199021574,
"learning_rate": 2.1225317587090507e-05,
"loss": 0.0005,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00015464637544937432,
"step": 2775,
"valid_targets_mean": 4374.6,
"valid_targets_min": 1948
},
{
"epoch": 2.66816,
"grad_norm": 0.023946900535808578,
"learning_rate": 2.1158437492480384e-05,
"loss": 0.0004,
"loss_nan_ranks": 0,
"loss_rank_avg": 8.866835560183972e-05,
"step": 2780,
"valid_targets_mean": 3508.4,
"valid_targets_min": 1972
},
{
"epoch": 2.67296,
"grad_norm": 0.023323639929458045,
"learning_rate": 2.1091544397626752e-05,
"loss": 0.0004,
"loss_nan_ranks": 0,
"loss_rank_avg": 9.227942791767418e-05,
"step": 2785,
"valid_targets_mean": 3581.1,
"valid_targets_min": 1799
},
{
"epoch": 2.67776,
"grad_norm": 0.0172998031924568,
"learning_rate": 2.102463905321881e-05,
"loss": 0.0004,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00019019619503524154,
"step": 2790,
"valid_targets_mean": 5262.3,
"valid_targets_min": 1993
},
{
"epoch": 2.68256,
"grad_norm": 0.026339994207665886,
"learning_rate": 2.095772221008323e-05,
"loss": 0.0004,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00015134026762098074,
"step": 2795,
"valid_targets_mean": 3594.5,
"valid_targets_min": 1877
},
{
"epoch": 2.68736,
"grad_norm": 0.03256359763209226,
"learning_rate": 2.0890794619175745e-05,
"loss": 0.0006,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00018617985188029706,
"step": 2800,
"valid_targets_mean": 4447.6,
"valid_targets_min": 1943
},
{
"epoch": 2.69216,
"grad_norm": 0.023898664989193522,
"learning_rate": 2.0823857031572663e-05,
"loss": 0.0004,
"loss_nan_ranks": 0,
"loss_rank_avg": 7.358520815614611e-05,
"step": 2805,
"valid_targets_mean": 2726.3,
"valid_targets_min": 1771
},
{
"epoch": 2.69696,
"grad_norm": 0.029494228295745283,
"learning_rate": 2.0756910198462515e-05,
"loss": 0.0004,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0001169008610304445,
"step": 2810,
"valid_targets_mean": 4072.3,
"valid_targets_min": 1942
},
{
"epoch": 2.70176,
"grad_norm": 0.028854863277279583,
"learning_rate": 2.0689954871137558e-05,
"loss": 0.0004,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00011759097105823457,
"step": 2815,
"valid_targets_mean": 2916.8,
"valid_targets_min": 1877
},
{
"epoch": 2.70656,
"grad_norm": 0.02416453071586182,
"learning_rate": 2.0622991800985398e-05,
"loss": 0.0004,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0001018679904518649,
"step": 2820,
"valid_targets_mean": 2619.8,
"valid_targets_min": 1833
},
{
"epoch": 2.71136,
"grad_norm": 0.023490376662988942,
"learning_rate": 2.055602173948051e-05,
"loss": 0.0005,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00013606276479549706,
"step": 2825,
"valid_targets_mean": 4143.3,
"valid_targets_min": 1838
},
{
"epoch": 2.71616,
"grad_norm": 0.016960972248032263,
"learning_rate": 2.0489045438175842e-05,
"loss": 0.0004,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0001110613375203684,
"step": 2830,
"valid_targets_mean": 3656.4,
"valid_targets_min": 1943
},
{
"epoch": 2.72096,
"grad_norm": 0.022589070972111297,
"learning_rate": 2.042206364869436e-05,
"loss": 0.0004,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00016260298434644938,
"step": 2835,
"valid_targets_mean": 3551.5,
"valid_targets_min": 1763
},
{
"epoch": 2.72576,
"grad_norm": 0.02856209557457077,
"learning_rate": 2.0355077122720625e-05,
"loss": 0.0004,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00018720896332524717,
"step": 2840,
"valid_targets_mean": 3209.6,
"valid_targets_min": 1924
},
{
"epoch": 2.73056,
"grad_norm": 0.021731288713113188,
"learning_rate": 2.0288086611992344e-05,
"loss": 0.0004,
"loss_nan_ranks": 0,
"loss_rank_avg": 7.025498052826151e-05,
"step": 2845,
"valid_targets_mean": 3721.6,
"valid_targets_min": 1992
},
{
"epoch": 2.73536,
"grad_norm": 0.028612983173565747,
"learning_rate": 2.0221092868291953e-05,
"loss": 0.0004,
"loss_nan_ranks": 0,
"loss_rank_avg": 8.612230158178136e-05,
"step": 2850,
"valid_targets_mean": 2944.8,
"valid_targets_min": 1836
},
{
"epoch": 2.74016,
"grad_norm": 0.023600216503969575,
"learning_rate": 2.0154096643438153e-05,
"loss": 0.0004,
"loss_nan_ranks": 0,
"loss_rank_avg": 9.917169518303126e-05,
"step": 2855,
"valid_targets_mean": 4533.1,
"valid_targets_min": 1719
},
{
"epoch": 2.74496,
"grad_norm": 0.025094469370057243,
"learning_rate": 2.008709868927751e-05,
"loss": 0.0004,
"loss_nan_ranks": 0,
"loss_rank_avg": 6.150246917968616e-05,
"step": 2860,
"valid_targets_mean": 3046.2,
"valid_targets_min": 2086
},
{
"epoch": 2.74976,
"grad_norm": 0.019746676801553512,
"learning_rate": 2.0020099757675978e-05,
"loss": 0.0004,
"loss_nan_ranks": 0,
"loss_rank_avg": 4.597777297021821e-05,
"step": 2865,
"valid_targets_mean": 4366.8,
"valid_targets_min": 1716
},
{
"epoch": 2.75456,
"grad_norm": 0.030709152512287757,
"learning_rate": 1.9953100600510487e-05,
"loss": 0.0004,
"loss_nan_ranks": 0,
"loss_rank_avg": 9.887020860332996e-05,
"step": 2870,
"valid_targets_mean": 3165.4,
"valid_targets_min": 1970
},
{
"epoch": 2.75936,
"grad_norm": 0.019782474480980868,
"learning_rate": 1.9886101969660504e-05,
"loss": 0.0004,
"loss_nan_ranks": 0,
"loss_rank_avg": 6.534643762279302e-05,
"step": 2875,
"valid_targets_mean": 3346.6,
"valid_targets_min": 1775
},
{
"epoch": 2.76416,
"grad_norm": 0.023247966487372883,
"learning_rate": 1.9819104616999584e-05,
"loss": 0.0004,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00012664488167501986,
"step": 2880,
"valid_targets_mean": 3562.3,
"valid_targets_min": 1863
},
{
"epoch": 2.76896,
"grad_norm": 0.026697504425241023,
"learning_rate": 1.975210929438693e-05,
"loss": 0.0003,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00011335482122376561,
"step": 2885,
"valid_targets_mean": 3805.9,
"valid_targets_min": 1877
},
{
"epoch": 2.7737600000000002,
"grad_norm": 0.024236369610147433,
"learning_rate": 1.9685116753658982e-05,
"loss": 0.0004,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00015188367979135364,
"step": 2890,
"valid_targets_mean": 4950.4,
"valid_targets_min": 1863
},
{
"epoch": 2.77856,
"grad_norm": 0.024006115720744844,
"learning_rate": 1.9618127746620944e-05,
"loss": 0.0004,
"loss_nan_ranks": 0,
"loss_rank_avg": 5.3211351769277826e-05,
"step": 2895,
"valid_targets_mean": 4628.9,
"valid_targets_min": 1839
},
{
"epoch": 2.78336,
"grad_norm": 0.01828708573325881,
"learning_rate": 1.9551143025038363e-05,
"loss": 0.0004,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00015513661492150277,
"step": 2900,
"valid_targets_mean": 3301.9,
"valid_targets_min": 1361
},
{
"epoch": 2.78816,
"grad_norm": 0.02452513702064594,
"learning_rate": 1.9484163340628724e-05,
"loss": 0.0005,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0001470555434934795,
"step": 2905,
"valid_targets_mean": 3966.4,
"valid_targets_min": 1802
},
{
"epoch": 2.79296,
"grad_norm": 0.02162253904665591,
"learning_rate": 1.941718944505294e-05,
"loss": 0.0004,
"loss_nan_ranks": 0,
"loss_rank_avg": 6.633297016378492e-05,
"step": 2910,
"valid_targets_mean": 4646.6,
"valid_targets_min": 1929
},
{
"epoch": 2.7977600000000002,
"grad_norm": 0.02653344462508564,
"learning_rate": 1.9350222089906994e-05,
"loss": 0.0004,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00011425589036662132,
"step": 2915,
"valid_targets_mean": 3358.9,
"valid_targets_min": 1799
},
{
"epoch": 2.80256,
"grad_norm": 0.020408240597344585,
"learning_rate": 1.9283262026713456e-05,
"loss": 0.0004,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00014473756891675293,
"step": 2920,
"valid_targets_mean": 3279.9,
"valid_targets_min": 2031
},
{
"epoch": 2.80736,
"grad_norm": 0.021028753731547636,
"learning_rate": 1.9216310006913058e-05,
"loss": 0.0004,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0001147160364780575,
"step": 2925,
"valid_targets_mean": 4004.2,
"valid_targets_min": 1975
},
{
"epoch": 2.81216,
"grad_norm": 0.02594239060438439,
"learning_rate": 1.914936678185629e-05,
"loss": 0.0005,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00011305462248856202,
"step": 2930,
"valid_targets_mean": 3485.4,
"valid_targets_min": 1614
},
{
"epoch": 2.81696,
"grad_norm": 0.02964528000434778,
"learning_rate": 1.9082433102794918e-05,
"loss": 0.0004,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0001548744912724942,
"step": 2935,
"valid_targets_mean": 3928.7,
"valid_targets_min": 1933
},
{
"epoch": 2.8217600000000003,
"grad_norm": 0.017134150188487504,
"learning_rate": 1.9015509720873603e-05,
"loss": 0.0004,
"loss_nan_ranks": 0,
"loss_rank_avg": 8.740826888242736e-05,
"step": 2940,
"valid_targets_mean": 3706.7,
"valid_targets_min": 1917
},
{
"epoch": 2.8265599999999997,
"grad_norm": 0.02180933059470857,
"learning_rate": 1.894859738712143e-05,
"loss": 0.0003,
"loss_nan_ranks": 0,
"loss_rank_avg": 9.822335414355621e-05,
"step": 2945,
"valid_targets_mean": 4252.4,
"valid_targets_min": 1562
},
{
"epoch": 2.83136,
"grad_norm": 0.016218254788160618,
"learning_rate": 1.888169685244352e-05,
"loss": 0.0005,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00016421267355326563,
"step": 2950,
"valid_targets_mean": 3571.9,
"valid_targets_min": 1986
},
{
"epoch": 2.83616,
"grad_norm": 0.02354906480901788,
"learning_rate": 1.8814808867612568e-05,
"loss": 0.0004,
"loss_nan_ranks": 0,
"loss_rank_avg": 6.99763695592992e-05,
"step": 2955,
"valid_targets_mean": 4399.5,
"valid_targets_min": 2088
},
{
"epoch": 2.84096,
"grad_norm": 0.01971511867464185,
"learning_rate": 1.8747934183260427e-05,
"loss": 0.0004,
"loss_nan_ranks": 0,
"loss_rank_avg": 9.124760254053399e-05,
"step": 2960,
"valid_targets_mean": 3971.2,
"valid_targets_min": 1921
},
{
"epoch": 2.84576,
"grad_norm": 0.0278188576069757,
"learning_rate": 1.868107354986971e-05,
"loss": 0.0005,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0003219933423679322,
"step": 2965,
"valid_targets_mean": 3617.8,
"valid_targets_min": 1982
},
{
"epoch": 2.8505599999999998,
"grad_norm": 0.026739769872547982,
"learning_rate": 1.8614227717765327e-05,
"loss": 0.0004,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00017199182184413075,
"step": 2970,
"valid_targets_mean": 3237.1,
"valid_targets_min": 1939
},
{
"epoch": 2.85536,
"grad_norm": 0.03461644008980415,
"learning_rate": 1.8547397437106084e-05,
"loss": 0.0004,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00012064729526173323,
"step": 2975,
"valid_targets_mean": 3380.6,
"valid_targets_min": 1838
},
{
"epoch": 2.86016,
"grad_norm": 0.02209288532182616,
"learning_rate": 1.848058345787629e-05,
"loss": 0.0004,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0002483898715581745,
"step": 2980,
"valid_targets_mean": 3540.8,
"valid_targets_min": 1709
},
{
"epoch": 2.86496,
"grad_norm": 0.02714572952475498,
"learning_rate": 1.8413786529877288e-05,
"loss": 0.0004,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0001591041509527713,
"step": 2985,
"valid_targets_mean": 3801.8,
"valid_targets_min": 1833
},
{
"epoch": 2.86976,
"grad_norm": 0.022040485361692213,
"learning_rate": 1.8347007402719082e-05,
"loss": 0.0003,
"loss_nan_ranks": 0,
"loss_rank_avg": 9.611293353373185e-05,
"step": 2990,
"valid_targets_mean": 2953.5,
"valid_targets_min": 2022
},
{
"epoch": 2.87456,
"grad_norm": 0.022123709290083143,
"learning_rate": 1.828024682581191e-05,
"loss": 0.0004,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00019887229427695274,
"step": 2995,
"valid_targets_mean": 4369.2,
"valid_targets_min": 1959
},
{
"epoch": 2.87936,
"grad_norm": 0.018819840014296388,
"learning_rate": 1.8213505548357822e-05,
"loss": 0.0004,
"loss_nan_ranks": 0,
"loss_rank_avg": 7.32165208319202e-05,
"step": 3000,
"valid_targets_mean": 3614.1,
"valid_targets_min": 1939
},
{
"epoch": 2.88416,
"grad_norm": 0.017994001101041452,
"learning_rate": 1.814678431934231e-05,
"loss": 0.0004,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00013698008842766285,
"step": 3005,
"valid_targets_mean": 4487.9,
"valid_targets_min": 1972
},
{
"epoch": 2.88896,
"grad_norm": 0.021592474043977235,
"learning_rate": 1.8080083887525862e-05,
"loss": 0.0004,
"loss_nan_ranks": 0,
"loss_rank_avg": 6.77060306770727e-05,
"step": 3010,
"valid_targets_mean": 3691.1,
"valid_targets_min": 1562
},
{
"epoch": 2.89376,
"grad_norm": 0.018912366380670783,
"learning_rate": 1.801340500143557e-05,
"loss": 0.0003,
"loss_nan_ranks": 0,
"loss_rank_avg": 7.287562766578048e-05,
"step": 3015,
"valid_targets_mean": 3996.4,
"valid_targets_min": 2003
},
{
"epoch": 2.89856,
"grad_norm": 0.018013021378604936,
"learning_rate": 1.7946748409356746e-05,
"loss": 0.0003,
"loss_nan_ranks": 0,
"loss_rank_avg": 7.651852502021939e-05,
"step": 3020,
"valid_targets_mean": 5406.3,
"valid_targets_min": 1829
},
{
"epoch": 2.90336,
"grad_norm": 0.02196142205330078,
"learning_rate": 1.788011485932451e-05,
"loss": 0.0004,
"loss_nan_ranks": 0,
"loss_rank_avg": 6.057618884369731e-05,
"step": 3025,
"valid_targets_mean": 3251.1,
"valid_targets_min": 1614
},
{
"epoch": 2.90816,
"grad_norm": 0.021939180840453026,
"learning_rate": 1.78135050991154e-05,
"loss": 0.0004,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00015023195010144264,
"step": 3030,
"valid_targets_mean": 3716.9,
"valid_targets_min": 1983
},
{
"epoch": 2.91296,
"grad_norm": 0.023266947785077412,
"learning_rate": 1.774691987623898e-05,
"loss": 0.0003,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00011902107507921755,
"step": 3035,
"valid_targets_mean": 3432.4,
"valid_targets_min": 1877
},
{
"epoch": 2.91776,
"grad_norm": 0.023820830898385627,
"learning_rate": 1.768035993792944e-05,
"loss": 0.0004,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0002066703309537843,
"step": 3040,
"valid_targets_mean": 4092.0,
"valid_targets_min": 1933
},
{
"epoch": 2.92256,
"grad_norm": 0.020333880634877222,
"learning_rate": 1.7613826031137245e-05,
"loss": 0.0004,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0002175498811993748,
"step": 3045,
"valid_targets_mean": 2837.6,
"valid_targets_min": 2020
},
{
"epoch": 2.92736,
"grad_norm": 0.026465596046422065,
"learning_rate": 1.7547318902520693e-05,
"loss": 0.0004,
"loss_nan_ranks": 0,
"loss_rank_avg": 8.79285071277991e-05,
"step": 3050,
"valid_targets_mean": 3790.3,
"valid_targets_min": 1986
},
{
"epoch": 2.93216,
"grad_norm": 0.018649197132876022,
"learning_rate": 1.7480839298437612e-05,
"loss": 0.0003,
"loss_nan_ranks": 0,
"loss_rank_avg": 8.114524825941771e-05,
"step": 3055,
"valid_targets_mean": 3331.4,
"valid_targets_min": 1760
},
{
"epoch": 2.93696,
"grad_norm": 0.020148453199511775,
"learning_rate": 1.7414387964936913e-05,
"loss": 0.0003,
"loss_nan_ranks": 0,
"loss_rank_avg": 6.896800186950713e-05,
"step": 3060,
"valid_targets_mean": 4374.5,
"valid_targets_min": 1949
},
{
"epoch": 2.94176,
"grad_norm": 0.021423561052568516,
"learning_rate": 1.7347965647750264e-05,
"loss": 0.0004,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00014279386959969997,
"step": 3065,
"valid_targets_mean": 4296.7,
"valid_targets_min": 1998
},
{
"epoch": 2.94656,
"grad_norm": 0.02528519196710435,
"learning_rate": 1.7281573092283698e-05,
"loss": 0.0004,
"loss_nan_ranks": 0,
"loss_rank_avg": 8.968213660409674e-05,
"step": 3070,
"valid_targets_mean": 3194.3,
"valid_targets_min": 1727
},
{
"epoch": 2.95136,
"grad_norm": 0.07048429228721245,
"learning_rate": 1.721521104360925e-05,
"loss": 0.0003,
"loss_nan_ranks": 0,
"loss_rank_avg": 9.62947669904679e-05,
"step": 3075,
"valid_targets_mean": 3045.7,
"valid_targets_min": 1839
},
{
"epoch": 2.95616,
"grad_norm": 0.0222354184644874,
"learning_rate": 1.714888024645662e-05,
"loss": 0.0003,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0001516393676865846,
"step": 3080,
"valid_targets_mean": 2978.5,
"valid_targets_min": 1887
},
{
"epoch": 2.96096,
"grad_norm": 0.01555733846454575,
"learning_rate": 1.708258144520478e-05,
"loss": 0.0003,
"loss_nan_ranks": 0,
"loss_rank_avg": 5.9606034483294934e-05,
"step": 3085,
"valid_targets_mean": 4811.8,
"valid_targets_min": 2343
},
{
"epoch": 2.96576,
"grad_norm": 0.02232143567928934,
"learning_rate": 1.7016315383873637e-05,
"loss": 0.0003,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.000159605493536219,
"step": 3090,
"valid_targets_mean": 4230.9,
"valid_targets_min": 1786
},
{
"epoch": 2.97056,
"grad_norm": 0.026488500145509335,
"learning_rate": 1.6950082806115692e-05,
"loss": 0.0004,
"loss_nan_ranks": 0,
"loss_rank_avg": 7.544553227489814e-05,
"step": 3095,
"valid_targets_mean": 3597.1,
"valid_targets_min": 1958
},
{
"epoch": 2.9753600000000002,
"grad_norm": 0.018457072570227887,
"learning_rate": 1.6883884455207685e-05,
"loss": 0.0003,
"loss_nan_ranks": 0,
"loss_rank_avg": 5.865214916411787e-05,
"step": 3100,
"valid_targets_mean": 2762.7,
"valid_targets_min": 1727
},
{
"epoch": 2.98016,
"grad_norm": 0.023355245345469806,
"learning_rate": 1.6817721074042254e-05,
"loss": 0.0004,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0001550887682242319,
"step": 3105,
"valid_targets_mean": 2952.7,
"valid_targets_min": 2094
},
{
"epoch": 2.98496,
"grad_norm": 0.026488279295259706,
"learning_rate": 1.675159340511958e-05,
"loss": 0.0003,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00013377467985264957,
"step": 3110,
"valid_targets_mean": 5067.9,
"valid_targets_min": 1919
},
{
"epoch": 2.98976,
"grad_norm": 0.020655150651040233,
"learning_rate": 1.6685502190539106e-05,
"loss": 0.0004,
"loss_nan_ranks": 0,
"loss_rank_avg": 8.466073632007465e-05,
"step": 3115,
"valid_targets_mean": 3763.2,
"valid_targets_min": 2112
},
{
"epoch": 2.99456,
"grad_norm": 0.019096184065461538,
"learning_rate": 1.6619448171991155e-05,
"loss": 0.0003,
"loss_nan_ranks": 0,
"loss_rank_avg": 8.77012571436353e-05,
"step": 3120,
"valid_targets_mean": 5052.1,
"valid_targets_min": 1884
},
{
"epoch": 2.9993600000000002,
"grad_norm": 0.021052484889835625,
"learning_rate": 1.6553432090748624e-05,
"loss": 0.0003,
"loss_nan_ranks": 0,
"loss_rank_avg": 7.409695535898209e-05,
"step": 3125,
"valid_targets_mean": 3870.3,
"valid_targets_min": 1970
},
{
"epoch": 3.00384,
"grad_norm": 0.018453110841428155,
"learning_rate": 1.648745468765869e-05,
"loss": 0.0003,
"loss_nan_ranks": 0,
"loss_rank_avg": 7.791754615027457e-05,
"step": 3130,
"valid_targets_mean": 4342.5,
"valid_targets_min": 1775
},
{
"epoch": 3.00864,
"grad_norm": 0.02047687885648728,
"learning_rate": 1.6421516703134463e-05,
"loss": 0.0003,
"loss_nan_ranks": 0,
"loss_rank_avg": 4.985905979992822e-05,
"step": 3135,
"valid_targets_mean": 3566.9,
"valid_targets_min": 1934
},
{
"epoch": 3.01344,
"grad_norm": 0.024891596375059534,
"learning_rate": 1.6355618877146685e-05,
"loss": 0.0003,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00016949682321865112,
"step": 3140,
"valid_targets_mean": 3200.6,
"valid_targets_min": 1786
},
{
"epoch": 3.01824,
"grad_norm": 0.017850108146377348,
"learning_rate": 1.6289761949215435e-05,
"loss": 0.0003,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00014728600217495114,
"step": 3145,
"valid_targets_mean": 3193.5,
"valid_targets_min": 1930
},
{
"epoch": 3.02304,
"grad_norm": 0.018909473518080613,
"learning_rate": 1.6223946658401818e-05,
"loss": 0.0003,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00021030849893577397,
"step": 3150,
"valid_targets_mean": 4067.7,
"valid_targets_min": 1829
},
{
"epoch": 3.02784,
"grad_norm": 0.020871319993280343,
"learning_rate": 1.6158173743299692e-05,
"loss": 0.0003,
"loss_nan_ranks": 0,
"loss_rank_avg": 9.983018389903009e-05,
"step": 3155,
"valid_targets_mean": 4353.8,
"valid_targets_min": 1763
},
{
"epoch": 3.03264,
"grad_norm": 0.021660620992697086,
"learning_rate": 1.6092443942027356e-05,
"loss": 0.0003,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00011195616389159113,
"step": 3160,
"valid_targets_mean": 2911.7,
"valid_targets_min": 1839
},
{
"epoch": 3.03744,
"grad_norm": 0.020135937308117555,
"learning_rate": 1.602675799221927e-05,
"loss": 0.0003,
"loss_nan_ranks": 0,
"loss_rank_avg": 5.299851545714773e-05,
"step": 3165,
"valid_targets_mean": 3422.8,
"valid_targets_min": 1839
},
{
"epoch": 3.04224,
"grad_norm": 0.018431276886312412,
"learning_rate": 1.59611166310178e-05,
"loss": 0.0003,
"loss_nan_ranks": 0,
"loss_rank_avg": 5.2702886023325846e-05,
"step": 3170,
"valid_targets_mean": 4471.5,
"valid_targets_min": 2132
},
{
"epoch": 3.04704,
"grad_norm": 0.015155951409860745,
"learning_rate": 1.5895520595064913e-05,
"loss": 0.0003,
"loss_nan_ranks": 0,
"loss_rank_avg": 8.149896893883124e-05,
"step": 3175,
"valid_targets_mean": 3422.6,
"valid_targets_min": 1909
},
{
"epoch": 3.05184,
"grad_norm": 0.019233986447757676,
"learning_rate": 1.5829970620493932e-05,
"loss": 0.0003,
"loss_nan_ranks": 0,
"loss_rank_avg": 8.23982700239867e-05,
"step": 3180,
"valid_targets_mean": 3077.1,
"valid_targets_min": 1858
},
{
"epoch": 3.05664,
"grad_norm": 0.014451754392294036,
"learning_rate": 1.5764467442921274e-05,
"loss": 0.0003,
"loss_nan_ranks": 0,
"loss_rank_avg": 7.17826042091474e-05,
"step": 3185,
"valid_targets_mean": 3522.6,
"valid_targets_min": 1614
},
{
"epoch": 3.06144,
"grad_norm": 0.018898138961676178,
"learning_rate": 1.569901179743818e-05,
"loss": 0.0003,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00011060632095905021,
"step": 3190,
"valid_targets_mean": 3454.0,
"valid_targets_min": 1517
},
{
"epoch": 3.06624,
"grad_norm": 0.027683453283868373,
"learning_rate": 1.5633604418602483e-05,
"loss": 0.0003,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00011033978807972744,
"step": 3195,
"valid_targets_mean": 4021.5,
"valid_targets_min": 1680
},
{
"epoch": 3.07104,
"grad_norm": 0.018878947618359634,
"learning_rate": 1.5568246040430343e-05,
"loss": 0.0003,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00010039303742814809,
"step": 3200,
"valid_targets_mean": 4480.4,
"valid_targets_min": 1933
},
{
"epoch": 3.07584,
"grad_norm": 0.02031318192479438,
"learning_rate": 1.5502937396388046e-05,
"loss": 0.0004,
"loss_nan_ranks": 0,
"loss_rank_avg": 9.601862984709442e-05,
"step": 3205,
"valid_targets_mean": 3242.5,
"valid_targets_min": 1740
},
{
"epoch": 3.08064,
"grad_norm": 0.02253989554735354,
"learning_rate": 1.543767921938374e-05,
"loss": 0.0003,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00014390042633749545,
"step": 3210,
"valid_targets_mean": 3770.4,
"valid_targets_min": 1836
},
{
"epoch": 3.08544,
"grad_norm": 0.013587452354707022,
"learning_rate": 1.537247224175922e-05,
"loss": 0.0003,
"loss_nan_ranks": 0,
"loss_rank_avg": 7.746569463051856e-05,
"step": 3215,
"valid_targets_mean": 3409.2,
"valid_targets_min": 2039
},
{
"epoch": 3.09024,
"grad_norm": 0.028111652441311752,
"learning_rate": 1.53073171952817e-05,
"loss": 0.0003,
"loss_nan_ranks": 0,
"loss_rank_avg": 7.700549031142145e-05,
"step": 3220,
"valid_targets_mean": 3577.5,
"valid_targets_min": 1929
},
{
"epoch": 3.09504,
"grad_norm": 0.01708144063100646,
"learning_rate": 1.5242214811135631e-05,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 8.06500029284507e-05,
"step": 3225,
"valid_targets_mean": 4140.8,
"valid_targets_min": 1912
},
{
"epoch": 3.09984,
"grad_norm": 0.0226372066028227,
"learning_rate": 1.5177165819914461e-05,
"loss": 0.0003,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00012216181494295597,
"step": 3230,
"valid_targets_mean": 4149.2,
"valid_targets_min": 1709
},
{
"epoch": 3.10464,
"grad_norm": 0.024965359579690115,
"learning_rate": 1.5112170951612455e-05,
"loss": 0.0003,
"loss_nan_ranks": 0,
"loss_rank_avg": 5.1957376854261383e-05,
"step": 3235,
"valid_targets_mean": 3129.3,
"valid_targets_min": 1863
},
{
"epoch": 3.10944,
"grad_norm": 0.013437951112882224,
"learning_rate": 1.5047230935616497e-05,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 8.271107799373567e-05,
"step": 3240,
"valid_targets_mean": 3610.1,
"valid_targets_min": 1786
},
{
"epoch": 3.11424,
"grad_norm": 0.014237700182485939,
"learning_rate": 1.4982346500697916e-05,
"loss": 0.0003,
"loss_nan_ranks": 0,
"loss_rank_avg": 4.194388020550832e-05,
"step": 3245,
"valid_targets_mean": 3825.3,
"valid_targets_min": 1775
},
{
"epoch": 3.11904,
"grad_norm": 0.014111540907084268,
"learning_rate": 1.4917518375004281e-05,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 6.379166734404862e-05,
"step": 3250,
"valid_targets_mean": 3649.8,
"valid_targets_min": 1914
},
{
"epoch": 3.12384,
"grad_norm": 0.018824156129808443,
"learning_rate": 1.4852747286051254e-05,
"loss": 0.0003,
"loss_nan_ranks": 0,
"loss_rank_avg": 6.309389573289081e-05,
"step": 3255,
"valid_targets_mean": 4722.3,
"valid_targets_min": 1680
},
{
"epoch": 3.12864,
"grad_norm": 0.018101010313748535,
"learning_rate": 1.478803396071443e-05,
"loss": 0.0003,
"loss_nan_ranks": 0,
"loss_rank_avg": 7.809472299413756e-05,
"step": 3260,
"valid_targets_mean": 3089.8,
"valid_targets_min": 1838
},
{
"epoch": 3.1334400000000002,
"grad_norm": 0.016178134459373116,
"learning_rate": 1.472337912522115e-05,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 7.876890595071018e-05,
"step": 3265,
"valid_targets_mean": 2934.6,
"valid_targets_min": 1361
},
{
"epoch": 3.13824,
"grad_norm": 0.017702747159018806,
"learning_rate": 1.4658783505142368e-05,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00010421761544421315,
"step": 3270,
"valid_targets_mean": 3497.0,
"valid_targets_min": 1949
},
{
"epoch": 3.14304,
"grad_norm": 0.015629467170666565,
"learning_rate": 1.4594247825384529e-05,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 4.373621413833462e-05,
"step": 3275,
"valid_targets_mean": 4290.9,
"valid_targets_min": 1993
},
{
"epoch": 3.14784,
"grad_norm": 0.018221576270069557,
"learning_rate": 1.4529772810181398e-05,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 5.873098416486755e-05,
"step": 3280,
"valid_targets_mean": 3406.2,
"valid_targets_min": 1870
},
{
"epoch": 3.15264,
"grad_norm": 0.018884144359542467,
"learning_rate": 1.4465359183085958e-05,
"loss": 0.0003,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00010781181481434032,
"step": 3285,
"valid_targets_mean": 4543.2,
"valid_targets_min": 1786
},
{
"epoch": 3.15744,
"grad_norm": 0.024798991362972755,
"learning_rate": 1.4401007666962276e-05,
"loss": 0.0003,
"loss_nan_ranks": 0,
"loss_rank_avg": 8.871503814589232e-05,
"step": 3290,
"valid_targets_mean": 3411.8,
"valid_targets_min": 1906
},
{
"epoch": 3.16224,
"grad_norm": 0.026289618162018507,
"learning_rate": 1.4336718983977389e-05,
"loss": 0.0003,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00014063461276236922,
"step": 3295,
"valid_targets_mean": 2952.9,
"valid_targets_min": 2059
},
{
"epoch": 3.16704,
"grad_norm": 0.02087911055323807,
"learning_rate": 1.4272493855593222e-05,
"loss": 0.0003,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00011406857811380178,
"step": 3300,
"valid_targets_mean": 3903.2,
"valid_targets_min": 1933
},
{
"epoch": 3.17184,
"grad_norm": 0.025864926194416736,
"learning_rate": 1.4208333002558462e-05,
"loss": 0.0003,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00012150718248449266,
"step": 3305,
"valid_targets_mean": 4186.3,
"valid_targets_min": 1863
},
{
"epoch": 3.17664,
"grad_norm": 0.005925121943421106,
"learning_rate": 1.4144237144900497e-05,
"loss": 0.0003,
"loss_nan_ranks": 0,
"loss_rank_avg": 4.7987763537094e-05,
"step": 3310,
"valid_targets_mean": 3257.3,
"valid_targets_min": 1877
},
{
"epoch": 3.18144,
"grad_norm": 0.0203610177094657,
"learning_rate": 1.4080207001917302e-05,
"loss": 0.0003,
"loss_nan_ranks": 0,
"loss_rank_avg": 9.982845222111791e-05,
"step": 3315,
"valid_targets_mean": 2632.5,
"valid_targets_min": 1863
},
{
"epoch": 3.18624,
"grad_norm": 0.02013249654553658,
"learning_rate": 1.4016243292169413e-05,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0001017134272842668,
"step": 3320,
"valid_targets_mean": 3098.9,
"valid_targets_min": 1562
},
{
"epoch": 3.19104,
"grad_norm": 0.014150560479732852,
"learning_rate": 1.3952346733471822e-05,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.7287460145307705e-05,
"step": 3325,
"valid_targets_mean": 3468.7,
"valid_targets_min": 1361
},
{
"epoch": 3.19584,
"grad_norm": 0.01247748935676924,
"learning_rate": 1.3888518042885934e-05,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 6.918737199157476e-05,
"step": 3330,
"valid_targets_mean": 3426.5,
"valid_targets_min": 1992
},
{
"epoch": 3.20064,
"grad_norm": 0.009828455444539298,
"learning_rate": 1.3824757936711537e-05,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.947080404032022e-05,
"step": 3335,
"valid_targets_mean": 3553.8,
"valid_targets_min": 1933
},
{
"epoch": 3.20544,
"grad_norm": 0.012686422174234565,
"learning_rate": 1.3761067130478738e-05,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 4.460604031919502e-05,
"step": 3340,
"valid_targets_mean": 3819.8,
"valid_targets_min": 1942
},
{
"epoch": 3.21024,
"grad_norm": 0.01654103079369527,
"learning_rate": 1.3697446338939942e-05,
"loss": 0.0003,
"loss_nan_ranks": 0,
"loss_rank_avg": 6.0112899518571794e-05,
"step": 3345,
"valid_targets_mean": 3277.4,
"valid_targets_min": 1562
},
{
"epoch": 3.21504,
"grad_norm": 0.0194091521016171,
"learning_rate": 1.3633896276061847e-05,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00011460959649411961,
"step": 3350,
"valid_targets_mean": 3927.5,
"valid_targets_min": 1833
},
{
"epoch": 3.21984,
"grad_norm": 0.016517976307009564,
"learning_rate": 1.3570417655017405e-05,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 6.381390267051756e-05,
"step": 3355,
"valid_targets_mean": 4070.7,
"valid_targets_min": 1614
},
{
"epoch": 3.22464,
"grad_norm": 0.010600916211686231,
"learning_rate": 1.3507011188177846e-05,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 9.461009904043749e-05,
"step": 3360,
"valid_targets_mean": 3980.2,
"valid_targets_min": 1928
},
{
"epoch": 3.22944,
"grad_norm": 0.016976292352953615,
"learning_rate": 1.3443677587104655e-05,
"loss": 0.0003,
"loss_nan_ranks": 0,
"loss_rank_avg": 8.451566827716306e-05,
"step": 3365,
"valid_targets_mean": 3608.3,
"valid_targets_min": 1928
},
{
"epoch": 3.23424,
"grad_norm": 0.012813626401298798,
"learning_rate": 1.3380417562541604e-05,
"loss": 0.0003,
"loss_nan_ranks": 0,
"loss_rank_avg": 5.145267641637474e-05,
"step": 3370,
"valid_targets_mean": 4600.5,
"valid_targets_min": 1909
},
{
"epoch": 3.23904,
"grad_norm": 0.010829071491700365,
"learning_rate": 1.3317231824406783e-05,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 4.345774505054578e-05,
"step": 3375,
"valid_targets_mean": 4325.6,
"valid_targets_min": 1868
},
{
"epoch": 3.24384,
"grad_norm": 0.01041182604349842,
"learning_rate": 1.325412108178461e-05,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 7.307223131647334e-05,
"step": 3380,
"valid_targets_mean": 3372.8,
"valid_targets_min": 1361
},
{
"epoch": 3.24864,
"grad_norm": 0.01526890053285902,
"learning_rate": 1.3191086042917895e-05,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 6.071500320103951e-05,
"step": 3385,
"valid_targets_mean": 5381.7,
"valid_targets_min": 1863
},
{
"epoch": 3.25344,
"grad_norm": 0.015370550532819507,
"learning_rate": 1.3128127415199883e-05,
"loss": 0.0003,
"loss_nan_ranks": 0,
"loss_rank_avg": 7.260534766828641e-05,
"step": 3390,
"valid_targets_mean": 3824.7,
"valid_targets_min": 2121
},
{
"epoch": 3.25824,
"grad_norm": 0.01190987235181321,
"learning_rate": 1.3065245905166316e-05,
"loss": 0.0003,
"loss_nan_ranks": 0,
"loss_rank_avg": 5.562914157053456e-05,
"step": 3395,
"valid_targets_mean": 4362.4,
"valid_targets_min": 1998
},
{
"epoch": 3.26304,
"grad_norm": 0.0050532178122862466,
"learning_rate": 1.30024422184875e-05,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 5.3684292652178556e-05,
"step": 3400,
"valid_targets_mean": 3969.5,
"valid_targets_min": 1914
},
{
"epoch": 3.26784,
"grad_norm": 0.011786071851466207,
"learning_rate": 1.2939717059960384e-05,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 5.181220330996439e-05,
"step": 3405,
"valid_targets_mean": 3020.6,
"valid_targets_min": 1361
},
{
"epoch": 3.27264,
"grad_norm": 0.01729739851008109,
"learning_rate": 1.287707113350068e-05,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 6.659601058345288e-05,
"step": 3410,
"valid_targets_mean": 5125.4,
"valid_targets_min": 2072
},
{
"epoch": 3.27744,
"grad_norm": 0.01670211062110001,
"learning_rate": 1.2814505142134921e-05,
"loss": 0.0003,
"loss_nan_ranks": 0,
"loss_rank_avg": 6.324228161247447e-05,
"step": 3415,
"valid_targets_mean": 3899.4,
"valid_targets_min": 2013
},
{
"epoch": 3.28224,
"grad_norm": 0.01914716601442075,
"learning_rate": 1.2752019787992587e-05,
"loss": 0.0003,
"loss_nan_ranks": 0,
"loss_rank_avg": 7.421004556817934e-05,
"step": 3420,
"valid_targets_mean": 3452.8,
"valid_targets_min": 1847
},
{
"epoch": 3.28704,
"grad_norm": 0.015196263944313884,
"learning_rate": 1.268961577229824e-05,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 6.754793867003173e-05,
"step": 3425,
"valid_targets_mean": 4664.8,
"valid_targets_min": 1933
},
{
"epoch": 3.29184,
"grad_norm": 0.009801501966872886,
"learning_rate": 1.262729379536365e-05,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 8.6651009041816e-05,
"step": 3430,
"valid_targets_mean": 3303.6,
"valid_targets_min": 1931
},
{
"epoch": 3.29664,
"grad_norm": 0.018792435761741236,
"learning_rate": 1.2565054556579917e-05,
"loss": 0.0003,
"loss_nan_ranks": 0,
"loss_rank_avg": 5.3184681746643037e-05,
"step": 3435,
"valid_targets_mean": 3715.3,
"valid_targets_min": 1716
},
{
"epoch": 3.30144,
"grad_norm": 0.02123827971481195,
"learning_rate": 1.2502898754409637e-05,
"loss": 0.0003,
"loss_nan_ranks": 0,
"loss_rank_avg": 7.16395370545797e-05,
"step": 3440,
"valid_targets_mean": 4315.2,
"valid_targets_min": 1829
},
{
"epoch": 3.30624,
"grad_norm": 0.016955050967706747,
"learning_rate": 1.2440827086379055e-05,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 7.558079232694581e-05,
"step": 3445,
"valid_targets_mean": 3924.2,
"valid_targets_min": 1680
},
{
"epoch": 3.31104,
"grad_norm": 0.011393580150245596,
"learning_rate": 1.2378840249070265e-05,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 8.816037006909028e-05,
"step": 3450,
"valid_targets_mean": 4042.6,
"valid_targets_min": 1993
},
{
"epoch": 3.31584,
"grad_norm": 0.014021469513832098,
"learning_rate": 1.2316938938113356e-05,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 5.988252451061271e-05,
"step": 3455,
"valid_targets_mean": 3272.9,
"valid_targets_min": 1919
},
{
"epoch": 3.32064,
"grad_norm": 0.021608841881745316,
"learning_rate": 1.2255123848178619e-05,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 7.891654968261719e-05,
"step": 3460,
"valid_targets_mean": 2683.6,
"valid_targets_min": 1839
},
{
"epoch": 3.32544,
"grad_norm": 0.01594098999699228,
"learning_rate": 1.2193395672968765e-05,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 5.743696237914264e-05,
"step": 3465,
"valid_targets_mean": 4081.6,
"valid_targets_min": 1839
},
{
"epoch": 3.33024,
"grad_norm": 0.017982113832719027,
"learning_rate": 1.2131755105211118e-05,
"loss": 0.0003,
"loss_nan_ranks": 0,
"loss_rank_avg": 6.675477197859436e-05,
"step": 3470,
"valid_targets_mean": 3484.5,
"valid_targets_min": 1763
},
{
"epoch": 3.3350400000000002,
"grad_norm": 0.012091989839522792,
"learning_rate": 1.2070202836649855e-05,
"loss": 0.0003,
"loss_nan_ranks": 0,
"loss_rank_avg": 6.264718831516802e-05,
"step": 3475,
"valid_targets_mean": 3723.5,
"valid_targets_min": 2106
},
{
"epoch": 3.33984,
"grad_norm": 0.016693800580166875,
"learning_rate": 1.2008739558038247e-05,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 8.9205801486969e-05,
"step": 3480,
"valid_targets_mean": 4107.0,
"valid_targets_min": 1887
},
{
"epoch": 3.34464,
"grad_norm": 0.020245961840814296,
"learning_rate": 1.1947365959130895e-05,
"loss": 0.0003,
"loss_nan_ranks": 0,
"loss_rank_avg": 5.409671939560212e-05,
"step": 3485,
"valid_targets_mean": 3815.5,
"valid_targets_min": 1942
},
{
"epoch": 3.34944,
"grad_norm": 0.009696441130015688,
"learning_rate": 1.1886082728675984e-05,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 6.198530172696337e-05,
"step": 3490,
"valid_targets_mean": 3173.8,
"valid_targets_min": 1662
},
{
"epoch": 3.35424,
"grad_norm": 0.008070751492922062,
"learning_rate": 1.1824890554407574e-05,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 4.529598663793877e-05,
"step": 3495,
"valid_targets_mean": 3571.8,
"valid_targets_min": 1601
},
{
"epoch": 3.3590400000000002,
"grad_norm": 0.016893770420853417,
"learning_rate": 1.1763790123037873e-05,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 8.078791142906994e-05,
"step": 3500,
"valid_targets_mean": 3549.1,
"valid_targets_min": 1930
},
{
"epoch": 3.36384,
"grad_norm": 0.010611619676596679,
"learning_rate": 1.1702782120249539e-05,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 5.067165693617426e-05,
"step": 3505,
"valid_targets_mean": 2994.8,
"valid_targets_min": 1921
},
{
"epoch": 3.36864,
"grad_norm": 0.012227824476474919,
"learning_rate": 1.164186723068795e-05,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00010194306378252804,
"step": 3510,
"valid_targets_mean": 3324.2,
"valid_targets_min": 1952
},
{
"epoch": 3.37344,
"grad_norm": 0.018233151037207677,
"learning_rate": 1.1581046137953575e-05,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 7.322602323256433e-05,
"step": 3515,
"valid_targets_mean": 3473.9,
"valid_targets_min": 1525
},
{
"epoch": 3.37824,
"grad_norm": 0.008027450910334806,
"learning_rate": 1.1520319524594256e-05,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 5.367275662138127e-05,
"step": 3520,
"valid_targets_mean": 3441.0,
"valid_targets_min": 1820
},
{
"epoch": 3.38304,
"grad_norm": 0.016385156735597293,
"learning_rate": 1.1459688072097568e-05,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00011734359577530995,
"step": 3525,
"valid_targets_mean": 4226.1,
"valid_targets_min": 1525
},
{
"epoch": 3.38784,
"grad_norm": 0.0067915094576856535,
"learning_rate": 1.1399152460883176e-05,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 4.4733271352015436e-05,
"step": 3530,
"valid_targets_mean": 3731.2,
"valid_targets_min": 1829
},
{
"epoch": 3.39264,
"grad_norm": 0.00892211548509811,
"learning_rate": 1.1338713370295189e-05,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 4.814416024601087e-05,
"step": 3535,
"valid_targets_mean": 3858.1,
"valid_targets_min": 1983
},
{
"epoch": 3.39744,
"grad_norm": 0.008159206891878339,
"learning_rate": 1.1278371478594538e-05,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 4.263151640770957e-05,
"step": 3540,
"valid_targets_mean": 3644.7,
"valid_targets_min": 1972
},
{
"epoch": 3.40224,
"grad_norm": 0.0067195504898440485,
"learning_rate": 1.1218127462951367e-05,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.700961678987369e-05,
"step": 3545,
"valid_targets_mean": 3890.9,
"valid_targets_min": 1525
},
{
"epoch": 3.40704,
"grad_norm": 0.007884157725395604,
"learning_rate": 1.1157981999437444e-05,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 4.053674638271332e-05,
"step": 3550,
"valid_targets_mean": 4305.6,
"valid_targets_min": 1836
},
{
"epoch": 3.4118399999999998,
"grad_norm": 0.015000201204561208,
"learning_rate": 1.109793576301855e-05,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 4.019015250378288e-05,
"step": 3555,
"valid_targets_mean": 4950.6,
"valid_targets_min": 1680
},
{
"epoch": 3.41664,
"grad_norm": 0.016970726415525852,
"learning_rate": 1.1037989427546924e-05,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00012615707237273455,
"step": 3560,
"valid_targets_mean": 3820.9,
"valid_targets_min": 1662
},
{
"epoch": 3.42144,
"grad_norm": 0.008553481869326631,
"learning_rate": 1.0978143665753692e-05,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 4.730415821541101e-05,
"step": 3565,
"valid_targets_mean": 4176.1,
"valid_targets_min": 1991
},
{
"epoch": 3.42624,
"grad_norm": 0.020611764051659598,
"learning_rate": 1.0918399149241314e-05,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 5.6515218602726236e-05,
"step": 3570,
"valid_targets_mean": 3387.0,
"valid_targets_min": 1908
},
{
"epoch": 3.43104,
"grad_norm": 0.03254530583537241,
"learning_rate": 1.0858756548476058e-05,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0001125583949033171,
"step": 3575,
"valid_targets_mean": 2906.8,
"valid_targets_min": 1934
},
{
"epoch": 3.43584,
"grad_norm": 0.014829373122733618,
"learning_rate": 1.0799216532780478e-05,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 4.488798003876582e-05,
"step": 3580,
"valid_targets_mean": 3507.2,
"valid_targets_min": 1716
},
{
"epoch": 3.44064,
"grad_norm": 0.025957320437693793,
"learning_rate": 1.0739779770325885e-05,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00013226433657109737,
"step": 3585,
"valid_targets_mean": 3937.9,
"valid_targets_min": 2115
},
{
"epoch": 3.44544,
"grad_norm": 0.011198146121762398,
"learning_rate": 1.0680446928124872e-05,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 5.750825221184641e-05,
"step": 3590,
"valid_targets_mean": 5197.8,
"valid_targets_min": 1900
},
{
"epoch": 3.45024,
"grad_norm": 0.013783909187565497,
"learning_rate": 1.06212186720238e-05,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.546361404005438e-05,
"step": 3595,
"valid_targets_mean": 3067.2,
"valid_targets_min": 2012
},
{
"epoch": 3.45504,
"grad_norm": 0.008523171197014895,
"learning_rate": 1.0562095666695352e-05,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 4.496578185353428e-05,
"step": 3600,
"valid_targets_mean": 4060.1,
"valid_targets_min": 1906
},
{
"epoch": 3.45984,
"grad_norm": 0.013801175341468335,
"learning_rate": 1.0503078575631052e-05,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 6.477723945863545e-05,
"step": 3605,
"valid_targets_mean": 3305.2,
"valid_targets_min": 2000
},
{
"epoch": 3.46464,
"grad_norm": 0.014959764009151036,
"learning_rate": 1.0444168061133846e-05,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00012726544809993356,
"step": 3610,
"valid_targets_mean": 4484.9,
"valid_targets_min": 1763
},
{
"epoch": 3.46944,
"grad_norm": 0.01139425598770555,
"learning_rate": 1.0385364784310636e-05,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 4.298814383218996e-05,
"step": 3615,
"valid_targets_mean": 3759.6,
"valid_targets_min": 1361
},
{
"epoch": 3.47424,
"grad_norm": 0.015011712005345224,
"learning_rate": 1.0326669405064904e-05,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0001424011425115168,
"step": 3620,
"valid_targets_mean": 3863.2,
"valid_targets_min": 1727
},
{
"epoch": 3.47904,
"grad_norm": 0.006988112883670556,
"learning_rate": 1.0268082582089263e-05,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.663314419100061e-05,
"step": 3625,
"valid_targets_mean": 5181.8,
"valid_targets_min": 1972
},
{
"epoch": 3.48384,
"grad_norm": 0.016204945933502923,
"learning_rate": 1.0209604972858081e-05,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 5.9584206610452384e-05,
"step": 3630,
"valid_targets_mean": 4587.8,
"valid_targets_min": 1799
},
{
"epoch": 3.48864,
"grad_norm": 0.006836549926723057,
"learning_rate": 1.0151237233620115e-05,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 4.5423868868965656e-05,
"step": 3635,
"valid_targets_mean": 4556.9,
"valid_targets_min": 2020
},
{
"epoch": 3.49344,
"grad_norm": 0.01047918810880494,
"learning_rate": 1.0092980019391132e-05,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00011410897423047572,
"step": 3640,
"valid_targets_mean": 3896.4,
"valid_targets_min": 1939
},
{
"epoch": 3.49824,
"grad_norm": 0.014652018259616206,
"learning_rate": 1.0034833983946561e-05,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00010652582568582147,
"step": 3645,
"valid_targets_mean": 2887.8,
"valid_targets_min": 1829
},
{
"epoch": 3.50304,
"grad_norm": 0.010669898087313332,
"learning_rate": 9.976799779814157e-06,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 7.363785698544234e-05,
"step": 3650,
"valid_targets_mean": 3741.1,
"valid_targets_min": 1763
},
{
"epoch": 3.50784,
"grad_norm": 0.01150859791625705,
"learning_rate": 9.918878058266687e-06,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 5.623920151265338e-05,
"step": 3655,
"valid_targets_mean": 3809.2,
"valid_targets_min": 1939
},
{
"epoch": 3.51264,
"grad_norm": 0.003478644304975548,
"learning_rate": 9.86106946931462e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.717148138093762e-05,
"step": 3660,
"valid_targets_mean": 4336.8,
"valid_targets_min": 1974
},
{
"epoch": 3.51744,
"grad_norm": 0.01237512729854138,
"learning_rate": 9.803374661698802e-06,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 5.4668777011102065e-05,
"step": 3665,
"valid_targets_mean": 3139.4,
"valid_targets_min": 1938
},
{
"epoch": 3.52224,
"grad_norm": 0.009173018328596294,
"learning_rate": 9.745794282883215e-06,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.844043749268167e-05,
"step": 3670,
"valid_targets_mean": 4644.7,
"valid_targets_min": 2029
},
{
"epoch": 3.52704,
"grad_norm": 0.012126353551714644,
"learning_rate": 9.688328979047689e-06,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.3574360713828355e-05,
"step": 3675,
"valid_targets_mean": 4152.6,
"valid_targets_min": 1983
},
{
"epoch": 3.53184,
"grad_norm": 0.00974942484547369,
"learning_rate": 9.630979395080667e-06,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.9589365769643337e-05,
"step": 3680,
"valid_targets_mean": 4399.3,
"valid_targets_min": 1933
},
{
"epoch": 3.5366400000000002,
"grad_norm": 0.007448900727798668,
"learning_rate": 9.573746174571947e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 7.012276182649657e-05,
"step": 3685,
"valid_targets_mean": 3892.2,
"valid_targets_min": 1771
},
{
"epoch": 3.54144,
"grad_norm": 0.009998416704858777,
"learning_rate": 9.516629959805468e-06,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 5.176214472157881e-05,
"step": 3690,
"valid_targets_mean": 3584.5,
"valid_targets_min": 1525
},
{
"epoch": 3.54624,
"grad_norm": 0.013292503205467973,
"learning_rate": 9.459631391752126e-06,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 4.5208176743471995e-05,
"step": 3695,
"valid_targets_mean": 5094.4,
"valid_targets_min": 2136
},
{
"epoch": 3.55104,
"grad_norm": 0.008334331712158317,
"learning_rate": 9.40275111006254e-06,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 5.263483035378158e-05,
"step": 3700,
"valid_targets_mean": 4102.0,
"valid_targets_min": 1887
},
{
"epoch": 3.55584,
"grad_norm": 0.007827281873180344,
"learning_rate": 9.345989753059895e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 6.234985630726442e-05,
"step": 3705,
"valid_targets_mean": 4199.7,
"valid_targets_min": 2105
},
{
"epoch": 3.5606400000000002,
"grad_norm": 0.010974477469488148,
"learning_rate": 9.289347957732779e-06,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 6.0864338593091816e-05,
"step": 3710,
"valid_targets_mean": 3562.9,
"valid_targets_min": 2091
},
{
"epoch": 3.56544,
"grad_norm": 0.007061621309209828,
"learning_rate": 9.232826359728034e-06,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.380605630809441e-05,
"step": 3715,
"valid_targets_mean": 4573.4,
"valid_targets_min": 1820
},
{
"epoch": 3.57024,
"grad_norm": 0.006768925158879715,
"learning_rate": 9.17642559334362e-06,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 4.614176577888429e-05,
"step": 3720,
"valid_targets_mean": 3561.2,
"valid_targets_min": 1716
},
{
"epoch": 3.57504,
"grad_norm": 0.005606648088124625,
"learning_rate": 9.120146291521488e-06,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00015613154391758144,
"step": 3725,
"valid_targets_mean": 3199.8,
"valid_targets_min": 1977
},
{
"epoch": 3.57984,
"grad_norm": 0.009401345215855002,
"learning_rate": 9.063989085840506e-06,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 6.945084169274196e-05,
"step": 3730,
"valid_targets_mean": 3199.3,
"valid_targets_min": 1970
},
{
"epoch": 3.5846400000000003,
"grad_norm": 0.014559174559493274,
"learning_rate": 9.007954606509346e-06,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 7.059839845169336e-05,
"step": 3735,
"valid_targets_mean": 4898.0,
"valid_targets_min": 1833
},
{
"epoch": 3.5894399999999997,
"grad_norm": 0.01712977436721481,
"learning_rate": 8.952043482359408e-06,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 9.897394193103537e-05,
"step": 3740,
"valid_targets_mean": 4177.9,
"valid_targets_min": 1942
},
{
"epoch": 3.59424,
"grad_norm": 0.01897818953911394,
"learning_rate": 8.896256340837779e-06,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 4.639182225218974e-05,
"step": 3745,
"valid_targets_mean": 3746.3,
"valid_targets_min": 2007
},
{
"epoch": 3.59904,
"grad_norm": 0.008696730760610802,
"learning_rate": 8.840593808000182e-06,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 7.316093251574785e-05,
"step": 3750,
"valid_targets_mean": 3307.4,
"valid_targets_min": 1884
},
{
"epoch": 3.60384,
"grad_norm": 0.00752523752718718,
"learning_rate": 8.785056508503956e-06,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 7.271009963005781e-05,
"step": 3755,
"valid_targets_mean": 4282.9,
"valid_targets_min": 1943
},
{
"epoch": 3.60864,
"grad_norm": 0.017446379775524528,
"learning_rate": 8.729645065601045e-06,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 4.897156759398058e-05,
"step": 3760,
"valid_targets_mean": 3718.6,
"valid_targets_min": 1870
},
{
"epoch": 3.6134399999999998,
"grad_norm": 0.008082161778407785,
"learning_rate": 8.674360101130994e-06,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 4.3372128857299685e-05,
"step": 3765,
"valid_targets_mean": 3104.3,
"valid_targets_min": 1601
},
{
"epoch": 3.61824,
"grad_norm": 0.007773752201751082,
"learning_rate": 8.619202235514e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.664046016638167e-05,
"step": 3770,
"valid_targets_mean": 4204.1,
"valid_targets_min": 1877
},
{
"epoch": 3.62304,
"grad_norm": 0.011724108974262567,
"learning_rate": 8.564172087743903e-06,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 8.043753041420132e-05,
"step": 3775,
"valid_targets_mean": 4841.0,
"valid_targets_min": 1919
},
{
"epoch": 3.62784,
"grad_norm": 0.014603234371469162,
"learning_rate": 8.50927027538128e-06,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.7259538657963276e-05,
"step": 3780,
"valid_targets_mean": 4642.8,
"valid_targets_min": 1960
},
{
"epoch": 3.63264,
"grad_norm": 0.00800559357448803,
"learning_rate": 8.454497414546497e-06,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 4.628532406059094e-05,
"step": 3785,
"valid_targets_mean": 3900.8,
"valid_targets_min": 1906
},
{
"epoch": 3.63744,
"grad_norm": 0.009760845212688286,
"learning_rate": 8.39985411991279e-06,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 4.497586633078754e-05,
"step": 3790,
"valid_targets_mean": 3523.5,
"valid_targets_min": 1614
},
{
"epoch": 3.64224,
"grad_norm": 0.009892739360240588,
"learning_rate": 8.345341004699386e-06,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.6855250073131174e-05,
"step": 3795,
"valid_targets_mean": 4958.9,
"valid_targets_min": 1740
},
{
"epoch": 3.64704,
"grad_norm": 0.022126997467983734,
"learning_rate": 8.290958680664591e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.7001504097133875e-05,
"step": 3800,
"valid_targets_mean": 5003.7,
"valid_targets_min": 1601
},
{
"epoch": 3.65184,
"grad_norm": 0.006207067260963997,
"learning_rate": 8.236707758098965e-06,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 7.68956306274049e-05,
"step": 3805,
"valid_targets_mean": 4634.0,
"valid_targets_min": 1829
},
{
"epoch": 3.65664,
"grad_norm": 0.009933222541426298,
"learning_rate": 8.182588845818452e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 5.3912557632429525e-05,
"step": 3810,
"valid_targets_mean": 3370.8,
"valid_targets_min": 1931
},
{
"epoch": 3.66144,
"grad_norm": 0.005083907207555841,
"learning_rate": 8.128602551157523e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.829049819614738e-05,
"step": 3815,
"valid_targets_mean": 3926.0,
"valid_targets_min": 1998
},
{
"epoch": 3.66624,
"grad_norm": 0.003423366499798073,
"learning_rate": 8.074749479962407e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 4.400216857902706e-05,
"step": 3820,
"valid_targets_mean": 3917.4,
"valid_targets_min": 1904
},
{
"epoch": 3.67104,
"grad_norm": 0.00822734919109149,
"learning_rate": 8.021030236584254e-06,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 5.029735984862782e-05,
"step": 3825,
"valid_targets_mean": 4000.3,
"valid_targets_min": 1361
},
{
"epoch": 3.67584,
"grad_norm": 0.00811845623327458,
"learning_rate": 7.967445423872384e-06,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 5.5101038014981896e-05,
"step": 3830,
"valid_targets_mean": 3887.2,
"valid_targets_min": 1858
},
{
"epoch": 3.68064,
"grad_norm": 0.008909582138274898,
"learning_rate": 7.913995643167494e-06,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 6.464569742092863e-05,
"step": 3835,
"valid_targets_mean": 4139.8,
"valid_targets_min": 1799
},
{
"epoch": 3.68544,
"grad_norm": 0.005082007045025474,
"learning_rate": 7.860681494294917e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 4.289662683731876e-05,
"step": 3840,
"valid_targets_mean": 5383.5,
"valid_targets_min": 1877
},
{
"epoch": 3.69024,
"grad_norm": 0.028567503324743313,
"learning_rate": 7.80750357555792e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 6.482819298980758e-05,
"step": 3845,
"valid_targets_mean": 4351.8,
"valid_targets_min": 2010
},
{
"epoch": 3.69504,
"grad_norm": 0.008312164085289285,
"learning_rate": 7.75446248373094e-06,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.698741420521401e-05,
"step": 3850,
"valid_targets_mean": 4194.5,
"valid_targets_min": 1925
},
{
"epoch": 3.69984,
"grad_norm": 0.013534579590798691,
"learning_rate": 7.701558814052928e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 5.3835676226299256e-05,
"step": 3855,
"valid_targets_mean": 3634.8,
"valid_targets_min": 1786
},
{
"epoch": 3.70464,
"grad_norm": 0.00720602048189928,
"learning_rate": 7.648793160220637e-06,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 2.953006151074078e-05,
"step": 3860,
"valid_targets_mean": 4952.3,
"valid_targets_min": 1919
},
{
"epoch": 3.70944,
"grad_norm": 0.008449956594170478,
"learning_rate": 7.596166114381991e-06,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.4673154004849494e-05,
"step": 3865,
"valid_targets_mean": 3438.7,
"valid_targets_min": 1939
},
{
"epoch": 3.71424,
"grad_norm": 0.005375083760714377,
"learning_rate": 7.543678267129408e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.617395123001188e-05,
"step": 3870,
"valid_targets_mean": 4350.7,
"valid_targets_min": 1847
},
{
"epoch": 3.71904,
"grad_norm": 0.009037269182640846,
"learning_rate": 7.491330207493215e-06,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 4.979194272891618e-05,
"step": 3875,
"valid_targets_mean": 3996.6,
"valid_targets_min": 1909
},
{
"epoch": 3.72384,
"grad_norm": 0.008946248984604825,
"learning_rate": 7.4391225229349785e-06,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.837323311017826e-05,
"step": 3880,
"valid_targets_mean": 3842.8,
"valid_targets_min": 2083
},
{
"epoch": 3.72864,
"grad_norm": 0.006741545487650149,
"learning_rate": 7.387055799340977e-06,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.537091106409207e-05,
"step": 3885,
"valid_targets_mean": 3515.7,
"valid_targets_min": 2084
},
{
"epoch": 3.73344,
"grad_norm": 0.009958719900647239,
"learning_rate": 7.3351306210155645e-06,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 7.938116323202848e-05,
"step": 3890,
"valid_targets_mean": 4039.8,
"valid_targets_min": 1727
},
{
"epoch": 3.7382400000000002,
"grad_norm": 0.004166899002692281,
"learning_rate": 7.283347570674664e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 5.300503835314885e-05,
"step": 3895,
"valid_targets_mean": 4780.2,
"valid_targets_min": 1914
},
{
"epoch": 3.74304,
"grad_norm": 0.0055545578726656705,
"learning_rate": 7.231707229439191e-06,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 4.4573745981324464e-05,
"step": 3900,
"valid_targets_mean": 2902.8,
"valid_targets_min": 1838
},
{
"epoch": 3.74784,
"grad_norm": 0.011400834486338789,
"learning_rate": 7.180210176828557e-06,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 5.124083691043779e-05,
"step": 3905,
"valid_targets_mean": 4634.8,
"valid_targets_min": 1838
},
{
"epoch": 3.75264,
"grad_norm": 0.00841332841155176,
"learning_rate": 7.1288569907541495e-06,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00010382626351201907,
"step": 3910,
"valid_targets_mean": 3998.2,
"valid_targets_min": 1836
},
{
"epoch": 3.75744,
"grad_norm": 0.008771579099235028,
"learning_rate": 7.0776482475128674e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.999216642114334e-05,
"step": 3915,
"valid_targets_mean": 3358.6,
"valid_targets_min": 1930
},
{
"epoch": 3.7622400000000003,
"grad_norm": 0.01653968115841514,
"learning_rate": 7.026584521780628e-06,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 6.055902485968545e-05,
"step": 3920,
"valid_targets_mean": 3337.5,
"valid_targets_min": 1940
},
{
"epoch": 3.76704,
"grad_norm": 0.0020106714719736176,
"learning_rate": 6.9756663866059324e-06,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 5.6483760999981314e-05,
"step": 3925,
"valid_targets_mean": 3525.4,
"valid_targets_min": 1921
},
{
"epoch": 3.77184,
"grad_norm": 0.009353143146674505,
"learning_rate": 6.924894413403434e-06,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 4.59437542303931e-05,
"step": 3930,
"valid_targets_mean": 3793.8,
"valid_targets_min": 1986
},
{
"epoch": 3.77664,
"grad_norm": 0.0016988195482671596,
"learning_rate": 6.874269171947516e-06,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.4710130421444774e-05,
"step": 3935,
"valid_targets_mean": 4158.0,
"valid_targets_min": 1991
},
{
"epoch": 3.78144,
"grad_norm": 0.011525809325227182,
"learning_rate": 6.8237912303659195e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.272616959293373e-05,
"step": 3940,
"valid_targets_mean": 4315.2,
"valid_targets_min": 2040
},
{
"epoch": 3.7862400000000003,
"grad_norm": 0.01327437986216609,
"learning_rate": 6.773461155133334e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 4.483360316953622e-05,
"step": 3945,
"valid_targets_mean": 4166.3,
"valid_targets_min": 2041
},
{
"epoch": 3.7910399999999997,
"grad_norm": 0.01155061809019346,
"learning_rate": 6.723279511065088e-06,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.00010878659668378532,
"step": 3950,
"valid_targets_mean": 3971.8,
"valid_targets_min": 1751
},
{
"epoch": 3.79584,
"grad_norm": 0.008489470823871952,
"learning_rate": 6.673246861310751e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 4.032125070807524e-05,
"step": 3955,
"valid_targets_mean": 3081.6,
"valid_targets_min": 1993
},
{
"epoch": 3.80064,
"grad_norm": 0.004944406539400989,
"learning_rate": 6.623363767347874e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.2762374758021906e-05,
"step": 3960,
"valid_targets_mean": 3511.7,
"valid_targets_min": 2034
},
{
"epoch": 3.80544,
"grad_norm": 0.0015531554707660037,
"learning_rate": 6.5736307889756425e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.0193985367077403e-05,
"step": 3965,
"valid_targets_mean": 4271.0,
"valid_targets_min": 1771
},
{
"epoch": 3.81024,
"grad_norm": 0.002938449796497635,
"learning_rate": 6.5240484843086095e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.3413271012250334e-05,
"step": 3970,
"valid_targets_mean": 3733.8,
"valid_targets_min": 1740
},
{
"epoch": 3.8150399999999998,
"grad_norm": 0.0051302286350760245,
"learning_rate": 6.474617409770441e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.9273050788324326e-05,
"step": 3975,
"valid_targets_mean": 4800.5,
"valid_targets_min": 1833
},
{
"epoch": 3.81984,
"grad_norm": 0.00431880865043546,
"learning_rate": 6.425338120087665e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 5.9392667026259005e-05,
"step": 3980,
"valid_targets_mean": 3564.1,
"valid_targets_min": 1933
},
{
"epoch": 3.82464,
"grad_norm": 0.0135204569747035,
"learning_rate": 6.3762111682834374e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 4.671135684475303e-05,
"step": 3985,
"valid_targets_mean": 3377.8,
"valid_targets_min": 1966
},
{
"epoch": 3.82944,
"grad_norm": 0.012904633473275234,
"learning_rate": 6.327237105671362e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 5.7124419981846586e-05,
"step": 3990,
"valid_targets_mean": 3646.4,
"valid_targets_min": 1931
},
{
"epoch": 3.83424,
"grad_norm": 0.012677339947563877,
"learning_rate": 6.278416481849274e-06,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 5.282880738377571e-05,
"step": 3995,
"valid_targets_mean": 3834.4,
"valid_targets_min": 1517
},
{
"epoch": 3.83904,
"grad_norm": 0.0027541770656437647,
"learning_rate": 6.22974984469308e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 4.0949358663056046e-05,
"step": 4000,
"valid_targets_mean": 4092.8,
"valid_targets_min": 1870
},
{
"epoch": 3.84384,
"grad_norm": 0.0025121154244893383,
"learning_rate": 6.181237740350625e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.9284408558160067e-05,
"step": 4005,
"valid_targets_mean": 3402.4,
"valid_targets_min": 2072
},
{
"epoch": 3.84864,
"grad_norm": 0.007040691563797863,
"learning_rate": 6.132880713235543e-06,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 4.226173768984154e-05,
"step": 4010,
"valid_targets_mean": 3744.0,
"valid_targets_min": 1662
},
{
"epoch": 3.85344,
"grad_norm": 0.0017011433295406567,
"learning_rate": 6.084679306021162e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.698827276821248e-05,
"step": 4015,
"valid_targets_mean": 4849.4,
"valid_targets_min": 1909
},
{
"epoch": 3.85824,
"grad_norm": 0.010975701606423343,
"learning_rate": 6.036634059634403e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 4.6234490582719445e-05,
"step": 4020,
"valid_targets_mean": 3950.8,
"valid_targets_min": 1802
},
{
"epoch": 3.86304,
"grad_norm": 0.009004613849435001,
"learning_rate": 5.988745513249723e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.65586020052433e-05,
"step": 4025,
"valid_targets_mean": 4084.7,
"valid_targets_min": 1987
},
{
"epoch": 3.86784,
"grad_norm": 0.006895797007772438,
"learning_rate": 5.941014204283065e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 5.828316352562979e-05,
"step": 4030,
"valid_targets_mean": 3135.8,
"valid_targets_min": 1857
},
{
"epoch": 3.87264,
"grad_norm": 0.01178803809355006,
"learning_rate": 5.893440668385797e-06,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.943587216781452e-05,
"step": 4035,
"valid_targets_mean": 4593.9,
"valid_targets_min": 1908
},
{
"epoch": 3.87744,
"grad_norm": 0.01132365691364727,
"learning_rate": 5.8460254394387335e-06,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 7.603708218084648e-05,
"step": 4040,
"valid_targets_mean": 2908.2,
"valid_targets_min": 1763
},
{
"epoch": 3.88224,
"grad_norm": 0.0015247764789779767,
"learning_rate": 5.798769049546136e-06,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.867723353323527e-05,
"step": 4045,
"valid_targets_mean": 4326.9,
"valid_targets_min": 2052
},
{
"epoch": 3.88704,
"grad_norm": 0.007712351251859507,
"learning_rate": 5.751672029029734e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 6.214739551069215e-05,
"step": 4050,
"valid_targets_mean": 3336.8,
"valid_targets_min": 1918
},
{
"epoch": 3.89184,
"grad_norm": 0.005302270584137382,
"learning_rate": 5.704734906422775e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 4.486428952077404e-05,
"step": 4055,
"valid_targets_mean": 3890.5,
"valid_targets_min": 1614
},
{
"epoch": 3.89664,
"grad_norm": 0.008602600193917502,
"learning_rate": 5.657958208464103e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 2.3105505533749238e-05,
"step": 4060,
"valid_targets_mean": 5310.7,
"valid_targets_min": 1868
},
{
"epoch": 3.90144,
"grad_norm": 0.011762847617699367,
"learning_rate": 5.611342460092244e-06,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.642755837063305e-05,
"step": 4065,
"valid_targets_mean": 3324.7,
"valid_targets_min": 1763
},
{
"epoch": 3.90624,
"grad_norm": 0.01025277386741305,
"learning_rate": 5.564888184439505e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 8.32563528092578e-05,
"step": 4070,
"valid_targets_mean": 3358.8,
"valid_targets_min": 1987
},
{
"epoch": 3.91104,
"grad_norm": 0.00826164879811961,
"learning_rate": 5.5185959028261135e-06,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 6.293428305070847e-05,
"step": 4075,
"valid_targets_mean": 3793.2,
"valid_targets_min": 1913
},
{
"epoch": 3.91584,
"grad_norm": 0.0017179245030004447,
"learning_rate": 5.47246613475436e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.292598921689205e-05,
"step": 4080,
"valid_targets_mean": 5032.8,
"valid_targets_min": 1764
},
{
"epoch": 3.92064,
"grad_norm": 0.006387347577353118,
"learning_rate": 5.4264993979027735e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 5.276900265016593e-05,
"step": 4085,
"valid_targets_mean": 4469.8,
"valid_targets_min": 1662
},
{
"epoch": 3.92544,
"grad_norm": 0.0017208693189951672,
"learning_rate": 5.380696208120315e-06,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.718512016348541e-05,
"step": 4090,
"valid_targets_mean": 3913.8,
"valid_targets_min": 1942
},
{
"epoch": 3.93024,
"grad_norm": 0.009615232784227547,
"learning_rate": 5.335057079420571e-06,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 4.271994475857355e-05,
"step": 4095,
"valid_targets_mean": 4633.0,
"valid_targets_min": 1906
},
{
"epoch": 3.93504,
"grad_norm": 0.00315117505190966,
"learning_rate": 5.289582523976015e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 5.916188092669472e-05,
"step": 4100,
"valid_targets_mean": 3094.9,
"valid_targets_min": 1839
},
{
"epoch": 3.9398400000000002,
"grad_norm": 0.002341135347296883,
"learning_rate": 5.244273052112241e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 4.824275674764067e-05,
"step": 4105,
"valid_targets_mean": 3952.0,
"valid_targets_min": 1820
},
{
"epoch": 3.94464,
"grad_norm": 0.006120762233210705,
"learning_rate": 5.199129172302224e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 2.396788477199152e-05,
"step": 4110,
"valid_targets_mean": 4057.8,
"valid_targets_min": 1652
},
{
"epoch": 3.94944,
"grad_norm": 0.01147219264594495,
"learning_rate": 5.154151391160638e-06,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 5.357105692382902e-05,
"step": 4115,
"valid_targets_mean": 3406.0,
"valid_targets_min": 2061
},
{
"epoch": 3.95424,
"grad_norm": 0.0043650589223010496,
"learning_rate": 5.109340213438156e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 4.6478053263854235e-05,
"step": 4120,
"valid_targets_mean": 3741.1,
"valid_targets_min": 1952
},
{
"epoch": 3.95904,
"grad_norm": 0.0030919506576588917,
"learning_rate": 5.0646961420157995e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.029893741768319e-05,
"step": 4125,
"valid_targets_mean": 4083.2,
"valid_targets_min": 1877
},
{
"epoch": 3.9638400000000003,
"grad_norm": 0.0030273483345704686,
"learning_rate": 5.020219677899276e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.4400916774757206e-05,
"step": 4130,
"valid_targets_mean": 3293.4,
"valid_targets_min": 1760
},
{
"epoch": 3.9686399999999997,
"grad_norm": 0.0017464199544329963,
"learning_rate": 4.975911320213365e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 4.5975579268997535e-05,
"step": 4135,
"valid_targets_mean": 3433.2,
"valid_targets_min": 1705
},
{
"epoch": 3.97344,
"grad_norm": 0.002077433108478966,
"learning_rate": 4.931771566196332e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 4.3588610424194485e-05,
"step": 4140,
"valid_targets_mean": 3861.1,
"valid_targets_min": 1942
},
{
"epoch": 3.97824,
"grad_norm": 0.002321329052569725,
"learning_rate": 4.887800911194327e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 5.014351336285472e-05,
"step": 4145,
"valid_targets_mean": 3757.0,
"valid_targets_min": 1917
},
{
"epoch": 3.98304,
"grad_norm": 0.0033831803043769893,
"learning_rate": 4.8439998486558246e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 2.0929337551933713e-05,
"step": 4150,
"valid_targets_mean": 4829.0,
"valid_targets_min": 1933
},
{
"epoch": 3.9878400000000003,
"grad_norm": 0.0065384692462405886,
"learning_rate": 4.800368870126111e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 4.445397644303739e-05,
"step": 4155,
"valid_targets_mean": 4013.5,
"valid_targets_min": 2008
},
{
"epoch": 3.9926399999999997,
"grad_norm": 0.007960408672666047,
"learning_rate": 4.756908465241736e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 6.532538100145757e-05,
"step": 4160,
"valid_targets_mean": 2909.1,
"valid_targets_min": 1933
},
{
"epoch": 3.99744,
"grad_norm": 0.002761429608947698,
"learning_rate": 4.713619121725039e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 5.965345917502418e-05,
"step": 4165,
"valid_targets_mean": 3661.7,
"valid_targets_min": 1361
},
{
"epoch": 4.00192,
"grad_norm": 0.00564879768287149,
"learning_rate": 4.670501325378682e-06,
"loss": 0.0002,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.989029937656596e-05,
"step": 4170,
"valid_targets_mean": 4154.5,
"valid_targets_min": 1562
},
{
"epoch": 4.00672,
"grad_norm": 0.0017008982835388347,
"learning_rate": 4.627555560080173e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 4.260703281033784e-05,
"step": 4175,
"valid_targets_mean": 3558.2,
"valid_targets_min": 2030
},
{
"epoch": 4.01152,
"grad_norm": 0.0013598220119315672,
"learning_rate": 4.5847823077764565e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.567889507394284e-05,
"step": 4180,
"valid_targets_mean": 4792.2,
"valid_targets_min": 1716
},
{
"epoch": 4.01632,
"grad_norm": 0.0017277913774604524,
"learning_rate": 4.5421820484784936e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.8666614273097366e-05,
"step": 4185,
"valid_targets_mean": 3129.0,
"valid_targets_min": 1680
},
{
"epoch": 4.02112,
"grad_norm": 0.010995756807561355,
"learning_rate": 4.499755260255881e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 4.598851955961436e-05,
"step": 4190,
"valid_targets_mean": 3880.6,
"valid_targets_min": 1887
},
{
"epoch": 4.02592,
"grad_norm": 0.007874013108371752,
"learning_rate": 4.457502419231483e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 6.0256828874116763e-05,
"step": 4195,
"valid_targets_mean": 3937.4,
"valid_targets_min": 1919
},
{
"epoch": 4.03072,
"grad_norm": 0.005097701158583684,
"learning_rate": 4.415423999576091e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 4.7677243856014684e-05,
"step": 4200,
"valid_targets_mean": 4715.7,
"valid_targets_min": 1930
},
{
"epoch": 4.03552,
"grad_norm": 0.00832156517250208,
"learning_rate": 4.373520473503097e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.421106521273032e-05,
"step": 4205,
"valid_targets_mean": 4367.5,
"valid_targets_min": 2220
},
{
"epoch": 4.04032,
"grad_norm": 0.0013368495812476166,
"learning_rate": 4.33179231126321e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.380177804501727e-05,
"step": 4210,
"valid_targets_mean": 3230.2,
"valid_targets_min": 1958
},
{
"epoch": 4.04512,
"grad_norm": 0.00208369487802161,
"learning_rate": 4.2902399811391575e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.897564238286577e-05,
"step": 4215,
"valid_targets_mean": 3983.1,
"valid_targets_min": 1662
},
{
"epoch": 4.04992,
"grad_norm": 0.001584687114330045,
"learning_rate": 4.248863949440436e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.266106068622321e-05,
"step": 4220,
"valid_targets_mean": 3432.7,
"valid_targets_min": 2007
},
{
"epoch": 4.05472,
"grad_norm": 0.00787766824013007,
"learning_rate": 4.207664680498094e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.363234282005578e-05,
"step": 4225,
"valid_targets_mean": 4572.5,
"valid_targets_min": 1839
},
{
"epoch": 4.05952,
"grad_norm": 0.00205025097170975,
"learning_rate": 4.166642636659495e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 2.519926601962652e-05,
"step": 4230,
"valid_targets_mean": 5066.3,
"valid_targets_min": 1786
},
{
"epoch": 4.06432,
"grad_norm": 0.0016026371988252155,
"learning_rate": 4.125798278283155e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.269485750934109e-05,
"step": 4235,
"valid_targets_mean": 3498.3,
"valid_targets_min": 2041
},
{
"epoch": 4.06912,
"grad_norm": 0.0017439816942912997,
"learning_rate": 4.085132063733554e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.675786138046533e-05,
"step": 4240,
"valid_targets_mean": 3827.7,
"valid_targets_min": 2024
},
{
"epoch": 4.07392,
"grad_norm": 0.0059827154830725034,
"learning_rate": 4.0446444493760165e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.55681695509702e-05,
"step": 4245,
"valid_targets_mean": 4141.8,
"valid_targets_min": 1889
},
{
"epoch": 4.07872,
"grad_norm": 0.0038426262164381678,
"learning_rate": 4.004335889571556e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.607972030295059e-05,
"step": 4250,
"valid_targets_mean": 3393.1,
"valid_targets_min": 1950
},
{
"epoch": 4.08352,
"grad_norm": 0.00491056822089905,
"learning_rate": 3.96420683667182e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 5.275919829728082e-05,
"step": 4255,
"valid_targets_mean": 3971.6,
"valid_targets_min": 2020
},
{
"epoch": 4.08832,
"grad_norm": 0.0028428055872032018,
"learning_rate": 3.924257741013968e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 4.72756837552879e-05,
"step": 4260,
"valid_targets_mean": 3005.8,
"valid_targets_min": 1727
},
{
"epoch": 4.09312,
"grad_norm": 0.002148760727185149,
"learning_rate": 3.884489050915652e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 4.0193852328229696e-05,
"step": 4265,
"valid_targets_mean": 2827.3,
"valid_targets_min": 1863
},
{
"epoch": 4.09792,
"grad_norm": 0.0023335386496191987,
"learning_rate": 3.844901212669962e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 2.841453351720702e-05,
"step": 4270,
"valid_targets_mean": 3088.7,
"valid_targets_min": 1930
},
{
"epoch": 4.10272,
"grad_norm": 0.001286310131837442,
"learning_rate": 3.8054946705404415e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.464947803877294e-05,
"step": 4275,
"valid_targets_mean": 4350.3,
"valid_targets_min": 1884
},
{
"epoch": 4.10752,
"grad_norm": 0.0015531321802579076,
"learning_rate": 3.7662698667560714e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.5117111110594124e-05,
"step": 4280,
"valid_targets_mean": 3142.5,
"valid_targets_min": 1942
},
{
"epoch": 4.11232,
"grad_norm": 0.0016055863187996663,
"learning_rate": 3.7272272415063484e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.6740551877301186e-05,
"step": 4285,
"valid_targets_mean": 3298.3,
"valid_targets_min": 2013
},
{
"epoch": 4.11712,
"grad_norm": 0.0029316369728722416,
"learning_rate": 3.6883672329363007e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.9559832657687366e-05,
"step": 4290,
"valid_targets_mean": 3922.3,
"valid_targets_min": 1727
},
{
"epoch": 4.12192,
"grad_norm": 0.0015623211280171884,
"learning_rate": 3.649690277141598e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.7854842958040535e-05,
"step": 4295,
"valid_targets_mean": 3290.9,
"valid_targets_min": 1525
},
{
"epoch": 4.12672,
"grad_norm": 0.0027055639776239634,
"learning_rate": 3.6111968081636507e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 2.4809010938042775e-05,
"step": 4300,
"valid_targets_mean": 3566.5,
"valid_targets_min": 2034
},
{
"epoch": 4.13152,
"grad_norm": 0.0013377359893271355,
"learning_rate": 3.572887257984743e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 4.381590406410396e-05,
"step": 4305,
"valid_targets_mean": 3170.8,
"valid_targets_min": 1987
},
{
"epoch": 4.1363199999999996,
"grad_norm": 0.003940540400894581,
"learning_rate": 3.5347620565231733e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 7.146632560761645e-05,
"step": 4310,
"valid_targets_mean": 3132.8,
"valid_targets_min": 1909
},
{
"epoch": 4.14112,
"grad_norm": 0.0019501200493331245,
"learning_rate": 3.496821631628442e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.4340086131123826e-05,
"step": 4315,
"valid_targets_mean": 4166.7,
"valid_targets_min": 1614
},
{
"epoch": 4.14592,
"grad_norm": 0.0011369610238447416,
"learning_rate": 3.459066409076448e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.429923526709899e-05,
"step": 4320,
"valid_targets_mean": 4413.0,
"valid_targets_min": 1361
},
{
"epoch": 4.15072,
"grad_norm": 0.0014505389624406707,
"learning_rate": 3.421496812564713e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.4482301998650655e-05,
"step": 4325,
"valid_targets_mean": 5303.1,
"valid_targets_min": 2088
},
{
"epoch": 4.15552,
"grad_norm": 0.004779096813522042,
"learning_rate": 3.384113263707609e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.184087836416438e-05,
"step": 4330,
"valid_targets_mean": 4378.8,
"valid_targets_min": 1870
},
{
"epoch": 4.16032,
"grad_norm": 0.0026258332815263757,
"learning_rate": 3.34691618203165e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 6.489974475698546e-05,
"step": 4335,
"valid_targets_mean": 4047.0,
"valid_targets_min": 1920
},
{
"epoch": 4.16512,
"grad_norm": 0.001816961044617779,
"learning_rate": 3.309905984970765e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.8048809074098244e-05,
"step": 4340,
"valid_targets_mean": 2844.7,
"valid_targets_min": 1914
},
{
"epoch": 4.16992,
"grad_norm": 0.0018025365511840077,
"learning_rate": 3.2730830878616305e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.494471457088366e-05,
"step": 4345,
"valid_targets_mean": 4423.0,
"valid_targets_min": 1977
},
{
"epoch": 4.17472,
"grad_norm": 0.0015254616003019617,
"learning_rate": 3.2364479039389973e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.3799573429860175e-05,
"step": 4350,
"valid_targets_mean": 3975.1,
"valid_targets_min": 1601
},
{
"epoch": 4.17952,
"grad_norm": 0.0013297521092237158,
"learning_rate": 3.2000008443310505e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.5375484003452584e-05,
"step": 4355,
"valid_targets_mean": 3518.4,
"valid_targets_min": 1764
},
{
"epoch": 4.18432,
"grad_norm": 0.0015651851486661397,
"learning_rate": 3.1637423180548232e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 2.7060703359893523e-05,
"step": 4360,
"valid_targets_mean": 4383.7,
"valid_targets_min": 2081
},
{
"epoch": 4.18912,
"grad_norm": 0.0013429520317032584,
"learning_rate": 3.127672732011564e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 2.832937752828002e-05,
"step": 4365,
"valid_targets_mean": 3055.6,
"valid_targets_min": 1931
},
{
"epoch": 4.19392,
"grad_norm": 0.001673435127439738,
"learning_rate": 3.0917924909821993e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 4.698914199252613e-05,
"step": 4370,
"valid_targets_mean": 3913.2,
"valid_targets_min": 1925
},
{
"epoch": 4.19872,
"grad_norm": 0.0017055197505207748,
"learning_rate": 3.0561019976227867e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.7643716495949775e-05,
"step": 4375,
"valid_targets_mean": 4424.2,
"valid_targets_min": 1942
},
{
"epoch": 4.20352,
"grad_norm": 0.001524053630224983,
"learning_rate": 3.020601652459989e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 4.057669502799399e-05,
"step": 4380,
"valid_targets_mean": 3439.1,
"valid_targets_min": 2033
},
{
"epoch": 4.20832,
"grad_norm": 0.0014977455442873465,
"learning_rate": 2.9852918538865847e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.6328819987829775e-05,
"step": 4385,
"valid_targets_mean": 3529.1,
"valid_targets_min": 1950
},
{
"epoch": 4.21312,
"grad_norm": 0.002089373327408226,
"learning_rate": 2.950172998156995e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 4.692836955655366e-05,
"step": 4390,
"valid_targets_mean": 4298.4,
"valid_targets_min": 2071
},
{
"epoch": 4.21792,
"grad_norm": 0.0018448814132004277,
"learning_rate": 2.91524547938284e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.71622372767888e-05,
"step": 4395,
"valid_targets_mean": 4462.7,
"valid_targets_min": 1847
},
{
"epoch": 4.22272,
"grad_norm": 0.0012318653842671413,
"learning_rate": 2.880509689528519e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.8981317629804835e-05,
"step": 4400,
"valid_targets_mean": 4393.9,
"valid_targets_min": 1919
},
{
"epoch": 4.22752,
"grad_norm": 0.0013800529639858145,
"learning_rate": 2.845966018406796e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 2.7751670131692663e-05,
"step": 4405,
"valid_targets_mean": 4296.9,
"valid_targets_min": 1914
},
{
"epoch": 4.23232,
"grad_norm": 0.0022095704660588518,
"learning_rate": 2.8116148536744448e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.149065378238447e-05,
"step": 4410,
"valid_targets_mean": 3783.5,
"valid_targets_min": 1951
},
{
"epoch": 4.23712,
"grad_norm": 0.001829538248299371,
"learning_rate": 2.777456580827882e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.5836652386933565e-05,
"step": 4415,
"valid_targets_mean": 3286.2,
"valid_targets_min": 1972
},
{
"epoch": 4.24192,
"grad_norm": 0.0013569162605098144,
"learning_rate": 2.7434915831988517e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 4.01278848585207e-05,
"step": 4420,
"valid_targets_mean": 5327.2,
"valid_targets_min": 1786
},
{
"epoch": 4.24672,
"grad_norm": 0.0015208666777376662,
"learning_rate": 2.7097202419501246e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.3911415812326595e-05,
"step": 4425,
"valid_targets_mean": 4008.7,
"valid_targets_min": 1917
},
{
"epoch": 4.25152,
"grad_norm": 0.0013156359603355792,
"learning_rate": 2.6761429360712045e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 2.497844980098307e-05,
"step": 4430,
"valid_targets_mean": 4711.8,
"valid_targets_min": 1614
},
{
"epoch": 4.25632,
"grad_norm": 0.0054384452715636345,
"learning_rate": 2.642760042374106e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 4.011658165836707e-05,
"step": 4435,
"valid_targets_mean": 3496.8,
"valid_targets_min": 1912
},
{
"epoch": 4.26112,
"grad_norm": 0.0013737950200195751,
"learning_rate": 2.6095719354890903e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.339675458846614e-05,
"step": 4440,
"valid_targets_mean": 4009.8,
"valid_targets_min": 1877
},
{
"epoch": 4.26592,
"grad_norm": 0.0011869857062110785,
"learning_rate": 2.5765789878604852e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 4.306513801566325e-05,
"step": 4445,
"valid_targets_mean": 3195.0,
"valid_targets_min": 1833
},
{
"epoch": 4.27072,
"grad_norm": 0.002369333683258055,
"learning_rate": 2.543781569742496e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 4.995891504222527e-05,
"step": 4450,
"valid_targets_mean": 4051.5,
"valid_targets_min": 1981
},
{
"epoch": 4.27552,
"grad_norm": 0.0015064551394305126,
"learning_rate": 2.5111800491950523e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.0394799978239462e-05,
"step": 4455,
"valid_targets_mean": 3638.0,
"valid_targets_min": 1662
},
{
"epoch": 4.28032,
"grad_norm": 0.001674277187515422,
"learning_rate": 2.4787747920796723e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.41932536684908e-05,
"step": 4460,
"valid_targets_mean": 4709.2,
"valid_targets_min": 1919
},
{
"epoch": 4.28512,
"grad_norm": 0.0016113360197275133,
"learning_rate": 2.446566162055377e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.608020051615313e-05,
"step": 4465,
"valid_targets_mean": 3064.8,
"valid_targets_min": 1906
},
{
"epoch": 4.28992,
"grad_norm": 0.0017275336703297865,
"learning_rate": 2.414554520574579e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 5.0131959142163396e-05,
"step": 4470,
"valid_targets_mean": 3079.5,
"valid_targets_min": 1562
},
{
"epoch": 4.29472,
"grad_norm": 0.0013714628082071834,
"learning_rate": 2.382740226879052e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.390222627785988e-05,
"step": 4475,
"valid_targets_mean": 4828.3,
"valid_targets_min": 1763
},
{
"epoch": 4.29952,
"grad_norm": 0.0012150699900979316,
"learning_rate": 2.3511236379958824e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.9595783164259046e-05,
"step": 4480,
"valid_targets_mean": 3530.4,
"valid_targets_min": 1662
},
{
"epoch": 4.30432,
"grad_norm": 0.001616671707384578,
"learning_rate": 2.31970510873347e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 4.014815203845501e-05,
"step": 4485,
"valid_targets_mean": 4057.2,
"valid_targets_min": 1836
},
{
"epoch": 4.30912,
"grad_norm": 0.0011221295175201655,
"learning_rate": 2.2884849916775485e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.353855572640896e-05,
"step": 4490,
"valid_targets_mean": 4496.3,
"valid_targets_min": 1786
},
{
"epoch": 4.3139199999999995,
"grad_norm": 0.0017016556243612912,
"learning_rate": 2.257463637187225e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 4.1361305193277076e-05,
"step": 4495,
"valid_targets_mean": 3690.3,
"valid_targets_min": 1906
},
{
"epoch": 4.31872,
"grad_norm": 0.0015121984545869538,
"learning_rate": 2.2266413933910426e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.035143527085893e-05,
"step": 4500,
"valid_targets_mean": 3866.2,
"valid_targets_min": 1966
},
{
"epoch": 4.32352,
"grad_norm": 0.0012856343972766713,
"learning_rate": 2.196018606183088e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 2.976351424877066e-05,
"step": 4505,
"valid_targets_mean": 4928.6,
"valid_targets_min": 2030
},
{
"epoch": 4.32832,
"grad_norm": 0.0014908309871930075,
"learning_rate": 2.1655956192191007e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 4.7100074880290776e-05,
"step": 4510,
"valid_targets_mean": 4195.6,
"valid_targets_min": 1884
},
{
"epoch": 4.33312,
"grad_norm": 0.0016059641687275934,
"learning_rate": 2.135372773912614e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 4.639291000785306e-05,
"step": 4515,
"valid_targets_mean": 3228.2,
"valid_targets_min": 1933
},
{
"epoch": 4.33792,
"grad_norm": 0.002000268968529377,
"learning_rate": 2.1053504094311285e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 2.447868973831646e-05,
"step": 4520,
"valid_targets_mean": 5219.3,
"valid_targets_min": 1928
},
{
"epoch": 4.34272,
"grad_norm": 0.0017280071789846,
"learning_rate": 2.0755288626923022e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 4.983695544069633e-05,
"step": 4525,
"valid_targets_mean": 3567.2,
"valid_targets_min": 1999
},
{
"epoch": 4.34752,
"grad_norm": 0.0015796876911165173,
"learning_rate": 2.0459084683601736e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 5.003527257940732e-05,
"step": 4530,
"valid_targets_mean": 3082.1,
"valid_targets_min": 2088
},
{
"epoch": 4.35232,
"grad_norm": 0.0016431065257554265,
"learning_rate": 2.0164895588414037e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 5.4640182497678325e-05,
"step": 4535,
"valid_targets_mean": 4039.8,
"valid_targets_min": 1863
},
{
"epoch": 4.35712,
"grad_norm": 0.0011173401923015307,
"learning_rate": 1.987272464281551e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 2.7552010578801855e-05,
"step": 4540,
"valid_targets_mean": 3328.8,
"valid_targets_min": 1909
},
{
"epoch": 4.36192,
"grad_norm": 0.0014470057490486652,
"learning_rate": 1.95825751256135e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.667410055641085e-05,
"step": 4545,
"valid_targets_mean": 3116.9,
"valid_targets_min": 1740
},
{
"epoch": 4.36672,
"grad_norm": 0.0011899865608208137,
"learning_rate": 1.9294450292930576e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.059140362893231e-05,
"step": 4550,
"valid_targets_mean": 4447.5,
"valid_targets_min": 2136
},
{
"epoch": 4.37152,
"grad_norm": 0.0014338406740680588,
"learning_rate": 1.9008353378167755e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 4.4420336053008214e-05,
"step": 4555,
"valid_targets_mean": 4507.5,
"valid_targets_min": 1949
},
{
"epoch": 4.37632,
"grad_norm": 0.0016033511510176346,
"learning_rate": 1.8724287591968294e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.303139237686992e-05,
"step": 4560,
"valid_targets_mean": 4461.0,
"valid_targets_min": 1958
},
{
"epoch": 4.38112,
"grad_norm": 0.0016662233139541564,
"learning_rate": 1.8442256122181735e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.8418951589846984e-05,
"step": 4565,
"valid_targets_mean": 4491.6,
"valid_targets_min": 2044
},
{
"epoch": 4.38592,
"grad_norm": 0.00227254489455862,
"learning_rate": 1.8162262133828013e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.4018466976704076e-05,
"step": 4570,
"valid_targets_mean": 4248.5,
"valid_targets_min": 1931
},
{
"epoch": 4.39072,
"grad_norm": 0.0012256581723182494,
"learning_rate": 1.7884308769061974e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.6851910408586264e-05,
"step": 4575,
"valid_targets_mean": 3628.8,
"valid_targets_min": 1991
},
{
"epoch": 4.39552,
"grad_norm": 0.0013118549809077072,
"learning_rate": 1.7608399147138278e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 2.930739356088452e-05,
"step": 4580,
"valid_targets_mean": 4122.8,
"valid_targets_min": 1908
},
{
"epoch": 4.40032,
"grad_norm": 0.0014985345497132527,
"learning_rate": 1.7334536364376075e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 4.729587817564607e-05,
"step": 4585,
"valid_targets_mean": 3863.1,
"valid_targets_min": 1751
},
{
"epoch": 4.40512,
"grad_norm": 0.0016352089801263863,
"learning_rate": 1.7062723494124545e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.489490700303577e-05,
"step": 4590,
"valid_targets_mean": 2983.8,
"valid_targets_min": 1900
},
{
"epoch": 4.40992,
"grad_norm": 0.0012257363638319958,
"learning_rate": 1.6792963586728195e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.1652001780457795e-05,
"step": 4595,
"valid_targets_mean": 3711.4,
"valid_targets_min": 2032
},
{
"epoch": 4.41472,
"grad_norm": 0.0013212030801314416,
"learning_rate": 1.6525259669492832e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 2.7446647436590865e-05,
"step": 4600,
"valid_targets_mean": 4090.9,
"valid_targets_min": 1907
},
{
"epoch": 4.41952,
"grad_norm": 0.0014011914669706318,
"learning_rate": 1.6259614746651364e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 2.055836739600636e-05,
"step": 4605,
"valid_targets_mean": 3449.7,
"valid_targets_min": 1764
},
{
"epoch": 4.42432,
"grad_norm": 0.0014717860429847214,
"learning_rate": 1.5996031799330315e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.580058546504006e-05,
"step": 4610,
"valid_targets_mean": 3305.9,
"valid_targets_min": 1802
},
{
"epoch": 4.42912,
"grad_norm": 0.0016473531059666415,
"learning_rate": 1.5734513785516227e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.1261421099770814e-05,
"step": 4615,
"valid_targets_mean": 3253.5,
"valid_targets_min": 1361
},
{
"epoch": 4.43392,
"grad_norm": 0.001331483103913834,
"learning_rate": 1.5475063640022425e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.218392885173671e-05,
"step": 4620,
"valid_targets_mean": 4387.2,
"valid_targets_min": 1943
},
{
"epoch": 4.43872,
"grad_norm": 0.0015678072884918073,
"learning_rate": 1.5217684274456314e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 4.212444764561951e-05,
"step": 4625,
"valid_targets_mean": 4228.2,
"valid_targets_min": 1914
},
{
"epoch": 4.44352,
"grad_norm": 0.0012720162054364376,
"learning_rate": 1.496237857718641e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.2788058888399974e-05,
"step": 4630,
"valid_targets_mean": 3761.5,
"valid_targets_min": 1908
},
{
"epoch": 4.44832,
"grad_norm": 0.0014693064780329035,
"learning_rate": 1.4709149413310076e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 4.5739245251752436e-05,
"step": 4635,
"valid_targets_mean": 3045.1,
"valid_targets_min": 1914
},
{
"epoch": 4.45312,
"grad_norm": 0.0012759797820861135,
"learning_rate": 1.445799962462142e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 4.0074017306324095e-05,
"step": 4640,
"valid_targets_mean": 4218.8,
"valid_targets_min": 1939
},
{
"epoch": 4.45792,
"grad_norm": 0.0014016504839545346,
"learning_rate": 1.420893202957927e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.586061211535707e-05,
"step": 4645,
"valid_targets_mean": 5258.8,
"valid_targets_min": 1763
},
{
"epoch": 4.46272,
"grad_norm": 0.0013382238846672736,
"learning_rate": 1.3961949423275622e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.416348772589117e-05,
"step": 4650,
"valid_targets_mean": 3336.5,
"valid_targets_min": 1917
},
{
"epoch": 4.46752,
"grad_norm": 0.0010650811370673263,
"learning_rate": 1.3717054577404331e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.619651397457346e-05,
"step": 4655,
"valid_targets_mean": 4939.1,
"valid_targets_min": 1942
},
{
"epoch": 4.47232,
"grad_norm": 0.0015467868997038122,
"learning_rate": 1.347425024022988e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 4.186376099823974e-05,
"step": 4660,
"valid_targets_mean": 3193.4,
"valid_targets_min": 1719
},
{
"epoch": 4.47712,
"grad_norm": 0.001079459379272364,
"learning_rate": 1.3233539136556606e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.495600321912207e-05,
"step": 4665,
"valid_targets_mean": 4908.7,
"valid_targets_min": 1525
},
{
"epoch": 4.48192,
"grad_norm": 0.0016107049369327223,
"learning_rate": 1.2994923967698125e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 2.6766832888824865e-05,
"step": 4670,
"valid_targets_mean": 3231.1,
"valid_targets_min": 1918
},
{
"epoch": 4.48672,
"grad_norm": 0.001295276413290572,
"learning_rate": 1.2758407411446982e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 2.188467806263361e-05,
"step": 4675,
"valid_targets_mean": 3830.6,
"valid_targets_min": 1863
},
{
"epoch": 4.49152,
"grad_norm": 0.0014125030915670483,
"learning_rate": 1.252399212204467e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 4.064816312165931e-05,
"step": 4680,
"valid_targets_mean": 4017.2,
"valid_targets_min": 1906
},
{
"epoch": 4.49632,
"grad_norm": 0.0013458030400534259,
"learning_rate": 1.22916807301517e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 4.3533407733775675e-05,
"step": 4685,
"valid_targets_mean": 3477.4,
"valid_targets_min": 1820
},
{
"epoch": 4.50112,
"grad_norm": 0.0016436112336502518,
"learning_rate": 1.2061475842818337e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 5.694011997547932e-05,
"step": 4690,
"valid_targets_mean": 2803.8,
"valid_targets_min": 1771
},
{
"epoch": 4.50592,
"grad_norm": 0.0014744987333515098,
"learning_rate": 1.1833380043455e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.827699401881546e-05,
"step": 4695,
"valid_targets_mean": 3764.2,
"valid_targets_min": 2059
},
{
"epoch": 4.51072,
"grad_norm": 0.0014523313139412053,
"learning_rate": 1.1607395891803641e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 2.0521079932223074e-05,
"step": 4700,
"valid_targets_mean": 3435.2,
"valid_targets_min": 1919
},
{
"epoch": 4.51552,
"grad_norm": 0.001377506897666381,
"learning_rate": 1.1383525923908678e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 4.60075207229238e-05,
"step": 4705,
"valid_targets_mean": 3290.6,
"valid_targets_min": 1966
},
{
"epoch": 4.52032,
"grad_norm": 0.001252005700755184,
"learning_rate": 1.1161772652088775e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.753907003556378e-05,
"step": 4710,
"valid_targets_mean": 3920.6,
"valid_targets_min": 1820
},
{
"epoch": 4.52512,
"grad_norm": 0.0025620915151801284,
"learning_rate": 1.094213856490849e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 4.3474727135617286e-05,
"step": 4715,
"valid_targets_mean": 3555.8,
"valid_targets_min": 1601
},
{
"epoch": 4.52992,
"grad_norm": 0.001519151744512467,
"learning_rate": 1.0724626127150462e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 4.198120950604789e-05,
"step": 4720,
"valid_targets_mean": 2547.0,
"valid_targets_min": 1981
},
{
"epoch": 4.53472,
"grad_norm": 0.001991121718963719,
"learning_rate": 1.0509237779787717e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 4.0243176044896245e-05,
"step": 4725,
"valid_targets_mean": 3534.3,
"valid_targets_min": 2086
},
{
"epoch": 4.5395199999999996,
"grad_norm": 0.0013389944210247407,
"learning_rate": 1.029597593995626e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 4.0416300180368125e-05,
"step": 4730,
"valid_targets_mean": 3721.5,
"valid_targets_min": 1929
},
{
"epoch": 4.54432,
"grad_norm": 0.0017033067169285275,
"learning_rate": 1.008484300092798e-06,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 4.046371759613976e-05,
"step": 4735,
"valid_targets_mean": 3974.4,
"valid_targets_min": 1562
},
{
"epoch": 4.54912,
"grad_norm": 0.0013382541310036622,
"learning_rate": 9.87584133208368e-07,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 4.098331919522025e-05,
"step": 4740,
"valid_targets_mean": 4250.1,
"valid_targets_min": 1934
},
{
"epoch": 4.55392,
"grad_norm": 0.0014815237161349228,
"learning_rate": 9.66897327888665e-07,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.0904986488167197e-05,
"step": 4745,
"valid_targets_mean": 3927.1,
"valid_targets_min": 2136
},
{
"epoch": 4.55872,
"grad_norm": 0.0012628924512069915,
"learning_rate": 9.464241162856269e-07,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 2.71253284154227e-05,
"step": 4750,
"valid_targets_mean": 3516.2,
"valid_targets_min": 1820
},
{
"epoch": 4.5635200000000005,
"grad_norm": 0.0016096247714936995,
"learning_rate": 9.261647281541908e-07,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 4.163005360169336e-05,
"step": 4755,
"valid_targets_mean": 3711.3,
"valid_targets_min": 1786
},
{
"epoch": 4.56832,
"grad_norm": 0.0011359447908436454,
"learning_rate": 9.061193908497201e-07,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 2.9243678000057116e-05,
"step": 4760,
"valid_targets_mean": 3960.3,
"valid_targets_min": 1760
},
{
"epoch": 4.57312,
"grad_norm": 0.0012325208487944698,
"learning_rate": 8.862883293254598e-07,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 2.4878499971237034e-05,
"step": 4765,
"valid_targets_mean": 3877.7,
"valid_targets_min": 1760
},
{
"epoch": 4.57792,
"grad_norm": 0.0017772163052283724,
"learning_rate": 8.666717661299917e-07,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 2.6678311769501306e-05,
"step": 4770,
"valid_targets_mean": 3336.5,
"valid_targets_min": 1727
},
{
"epoch": 4.58272,
"grad_norm": 0.0012672879514388682,
"learning_rate": 8.472699214047652e-07,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.525630381773226e-05,
"step": 4775,
"valid_targets_mean": 3886.1,
"valid_targets_min": 1986
},
{
"epoch": 4.58752,
"grad_norm": 0.0014442282222083972,
"learning_rate": 8.280830128815953e-07,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 4.140436794841662e-05,
"step": 4780,
"valid_targets_mean": 2852.9,
"valid_targets_min": 1601
},
{
"epoch": 4.59232,
"grad_norm": 0.0013335062943690265,
"learning_rate": 8.09111255880246e-07,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 2.9172715585445985e-05,
"step": 4785,
"valid_targets_mean": 4712.3,
"valid_targets_min": 1933
},
{
"epoch": 4.59712,
"grad_norm": 0.0016073643552779076,
"learning_rate": 7.903548633059955e-07,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 2.3097250959835947e-05,
"step": 4790,
"valid_targets_mean": 3657.0,
"valid_targets_min": 2162
},
{
"epoch": 4.60192,
"grad_norm": 0.0014311250739149058,
"learning_rate": 7.718140456472612e-07,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.254737384850159e-05,
"step": 4795,
"valid_targets_mean": 3186.6,
"valid_targets_min": 1857
},
{
"epoch": 4.60672,
"grad_norm": 0.0014720511963264634,
"learning_rate": 7.534890109732229e-07,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.767356975004077e-05,
"step": 4800,
"valid_targets_mean": 4191.3,
"valid_targets_min": 1986
},
{
"epoch": 4.61152,
"grad_norm": 0.0011422497608168177,
"learning_rate": 7.353799649315085e-07,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 2.191369640058838e-05,
"step": 4805,
"valid_targets_mean": 5858.8,
"valid_targets_min": 2177
},
{
"epoch": 4.61632,
"grad_norm": 0.0015142999837969848,
"learning_rate": 7.174871107458603e-07,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.843754166155122e-05,
"step": 4810,
"valid_targets_mean": 4474.0,
"valid_targets_min": 1889
},
{
"epoch": 4.62112,
"grad_norm": 0.0012380465021728157,
"learning_rate": 6.998106492138724e-07,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.2066651328932494e-05,
"step": 4815,
"valid_targets_mean": 3932.0,
"valid_targets_min": 2020
},
{
"epoch": 4.62592,
"grad_norm": 0.0013493062176373246,
"learning_rate": 6.823507787047346e-07,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 2.646211942192167e-05,
"step": 4820,
"valid_targets_mean": 3945.9,
"valid_targets_min": 1525
},
{
"epoch": 4.63072,
"grad_norm": 0.0013500247168241138,
"learning_rate": 6.65107695156999e-07,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.864829341182485e-05,
"step": 4825,
"valid_targets_mean": 3249.5,
"valid_targets_min": 2026
},
{
"epoch": 4.63552,
"grad_norm": 0.0016728963895163553,
"learning_rate": 6.480815920763905e-07,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 4.096078919246793e-05,
"step": 4830,
"valid_targets_mean": 2811.6,
"valid_targets_min": 1680
},
{
"epoch": 4.64032,
"grad_norm": 0.0013007674582857596,
"learning_rate": 6.312726605336306e-07,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 4.305595939513296e-05,
"step": 4835,
"valid_targets_mean": 3727.9,
"valid_targets_min": 1763
},
{
"epoch": 4.64512,
"grad_norm": 0.001246805819895664,
"learning_rate": 6.146810891622923e-07,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.767627276829444e-05,
"step": 4840,
"valid_targets_mean": 4590.0,
"valid_targets_min": 1786
},
{
"epoch": 4.64992,
"grad_norm": 0.0015306984235042263,
"learning_rate": 5.983070641566802e-07,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 4.872297722613439e-05,
"step": 4845,
"valid_targets_mean": 3660.3,
"valid_targets_min": 1909
},
{
"epoch": 4.65472,
"grad_norm": 0.0013636211473654518,
"learning_rate": 5.821507692697537e-07,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.59952864528168e-05,
"step": 4850,
"valid_targets_mean": 4783.3,
"valid_targets_min": 1929
},
{
"epoch": 4.65952,
"grad_norm": 0.001214169634631268,
"learning_rate": 5.662123858110513e-07,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.457337152212858e-05,
"step": 4855,
"valid_targets_mean": 4948.0,
"valid_targets_min": 1981
},
{
"epoch": 4.66432,
"grad_norm": 0.0013015007668589714,
"learning_rate": 5.504920926446611e-07,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 1.846073428168893e-05,
"step": 4860,
"valid_targets_mean": 4190.8,
"valid_targets_min": 2241
},
{
"epoch": 4.66912,
"grad_norm": 0.0017585809273893223,
"learning_rate": 5.349900661872132e-07,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.999376349383965e-05,
"step": 4865,
"valid_targets_mean": 3302.1,
"valid_targets_min": 1940
},
{
"epoch": 4.67392,
"grad_norm": 0.0014018105059137838,
"learning_rate": 5.197064804058971e-07,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.753218334168196e-05,
"step": 4870,
"valid_targets_mean": 3569.1,
"valid_targets_min": 1868
},
{
"epoch": 4.67872,
"grad_norm": 0.001411049154838511,
"learning_rate": 5.046415068165234e-07,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 4.0762810385786e-05,
"step": 4875,
"valid_targets_mean": 4144.9,
"valid_targets_min": 1838
},
{
"epoch": 4.68352,
"grad_norm": 0.0012325440682396773,
"learning_rate": 4.897953144815759e-07,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 4.6161636419128627e-05,
"step": 4880,
"valid_targets_mean": 4015.3,
"valid_targets_min": 1884
},
{
"epoch": 4.68832,
"grad_norm": 0.001081422749527924,
"learning_rate": 4.7516807000833165e-07,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 2.977273652504664e-05,
"step": 4885,
"valid_targets_mean": 5051.3,
"valid_targets_min": 2148
},
{
"epoch": 4.69312,
"grad_norm": 0.0013326312566954472,
"learning_rate": 4.6075993754698623e-07,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.299923992017284e-05,
"step": 4890,
"valid_targets_mean": 3795.8,
"valid_targets_min": 1930
},
{
"epoch": 4.69792,
"grad_norm": 0.0010834549302240677,
"learning_rate": 4.4657107878881113e-07,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.9331695006694645e-05,
"step": 4895,
"valid_targets_mean": 4620.5,
"valid_targets_min": 1940
},
{
"epoch": 4.70272,
"grad_norm": 0.0009505343422854887,
"learning_rate": 4.326016529643351e-07,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 2.737485192483291e-05,
"step": 4900,
"valid_targets_mean": 5942.9,
"valid_targets_min": 1991
},
{
"epoch": 4.70752,
"grad_norm": 0.0012846898025216246,
"learning_rate": 4.1885181684157005e-07,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.654539614217356e-05,
"step": 4905,
"valid_targets_mean": 3363.9,
"valid_targets_min": 1917
},
{
"epoch": 4.71232,
"grad_norm": 0.0015367895661445351,
"learning_rate": 4.053217247242369e-07,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 4.137801442993805e-05,
"step": 4910,
"valid_targets_mean": 3513.6,
"valid_targets_min": 1727
},
{
"epoch": 4.7171199999999995,
"grad_norm": 0.0015445627771844294,
"learning_rate": 3.9201152845004476e-07,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 2.674181087058969e-05,
"step": 4915,
"valid_targets_mean": 3224.1,
"valid_targets_min": 1924
},
{
"epoch": 4.72192,
"grad_norm": 0.0015343846128040427,
"learning_rate": 3.789213773889744e-07,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.526258660713211e-05,
"step": 4920,
"valid_targets_mean": 2999.2,
"valid_targets_min": 1727
},
{
"epoch": 4.72672,
"grad_norm": 0.001325208866112591,
"learning_rate": 3.6605141844162417e-07,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.196104444214143e-05,
"step": 4925,
"valid_targets_mean": 4132.0,
"valid_targets_min": 1912
},
{
"epoch": 4.73152,
"grad_norm": 0.0018118681699326824,
"learning_rate": 3.5340179603753354e-07,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.0053150112507865e-05,
"step": 4930,
"valid_targets_mean": 3962.4,
"valid_targets_min": 1887
},
{
"epoch": 4.73632,
"grad_norm": 0.0008082094400929223,
"learning_rate": 3.4097265213358435e-07,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 1.9822517060674727e-05,
"step": 4935,
"valid_targets_mean": 4209.6,
"valid_targets_min": 1951
},
{
"epoch": 4.7411200000000004,
"grad_norm": 0.0013943033363122907,
"learning_rate": 3.287641262123975e-07,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.594924055505544e-05,
"step": 4940,
"valid_targets_mean": 3413.5,
"valid_targets_min": 1614
},
{
"epoch": 4.74592,
"grad_norm": 0.0012017603675163208,
"learning_rate": 3.1677635528076566e-07,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 2.850576493074186e-05,
"step": 4945,
"valid_targets_mean": 4258.0,
"valid_targets_min": 1917
},
{
"epoch": 4.75072,
"grad_norm": 0.0014305722242892265,
"learning_rate": 3.0500947386812973e-07,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.7447800423251465e-05,
"step": 4950,
"valid_targets_mean": 4027.3,
"valid_targets_min": 1925
},
{
"epoch": 4.75552,
"grad_norm": 0.0010461845264905828,
"learning_rate": 2.934636140250513e-07,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.5297613067086786e-05,
"step": 4955,
"valid_targets_mean": 4322.1,
"valid_targets_min": 1836
},
{
"epoch": 4.76032,
"grad_norm": 0.001185201140045603,
"learning_rate": 2.821389053217383e-07,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 2.970770583488047e-05,
"step": 4960,
"valid_targets_mean": 4760.2,
"valid_targets_min": 1917
},
{
"epoch": 4.76512,
"grad_norm": 0.0011274151535639705,
"learning_rate": 2.710354748465949e-07,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 2.792166924336925e-05,
"step": 4965,
"valid_targets_mean": 3010.6,
"valid_targets_min": 1802
},
{
"epoch": 4.76992,
"grad_norm": 0.0015942705739524197,
"learning_rate": 2.6015344720479395e-07,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 4.446161619853228e-05,
"step": 4970,
"valid_targets_mean": 3951.6,
"valid_targets_min": 1908
},
{
"epoch": 4.77472,
"grad_norm": 0.0011431533238156495,
"learning_rate": 2.49492944516867e-07,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.62203354598023e-05,
"step": 4975,
"valid_targets_mean": 4022.9,
"valid_targets_min": 1991
},
{
"epoch": 4.77952,
"grad_norm": 0.0013344896167050537,
"learning_rate": 2.3905408641735183e-07,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 4.3846070184372365e-05,
"step": 4980,
"valid_targets_mean": 2981.7,
"valid_targets_min": 1764
},
{
"epoch": 4.78432,
"grad_norm": 0.0011469415623424919,
"learning_rate": 2.288369900534404e-07,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.583916986826807e-05,
"step": 4985,
"valid_targets_mean": 4020.9,
"valid_targets_min": 1614
},
{
"epoch": 4.7891200000000005,
"grad_norm": 0.0015332867881165636,
"learning_rate": 2.1884177008366203e-07,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 4.023212022730149e-05,
"step": 4990,
"valid_targets_mean": 3641.2,
"valid_targets_min": 1992
},
{
"epoch": 4.79392,
"grad_norm": 0.0015958107058125627,
"learning_rate": 2.0906853867660004e-07,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 4.5333177695283666e-05,
"step": 4995,
"valid_targets_mean": 3073.5,
"valid_targets_min": 1833
},
{
"epoch": 4.79872,
"grad_norm": 0.0014088920318571542,
"learning_rate": 1.9951740550963493e-07,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.387499236850999e-05,
"step": 5000,
"valid_targets_mean": 3618.2,
"valid_targets_min": 1863
},
{
"epoch": 4.80352,
"grad_norm": 0.001382017022764611,
"learning_rate": 1.9018847776770987e-07,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 2.965832391055301e-05,
"step": 5005,
"valid_targets_mean": 3913.4,
"valid_targets_min": 1680
},
{
"epoch": 4.80832,
"grad_norm": 0.0009667895381881995,
"learning_rate": 1.8108186014212935e-07,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.5687706258613616e-05,
"step": 5010,
"valid_targets_mean": 3918.7,
"valid_targets_min": 1984
},
{
"epoch": 4.81312,
"grad_norm": 0.001125905574920971,
"learning_rate": 1.7219765482938465e-07,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.900204683304764e-05,
"step": 5015,
"valid_targets_mean": 3905.2,
"valid_targets_min": 1614
},
{
"epoch": 4.81792,
"grad_norm": 0.001735614405714739,
"learning_rate": 1.635359615300036e-07,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.774373180931434e-05,
"step": 5020,
"valid_targets_mean": 3537.9,
"valid_targets_min": 2020
},
{
"epoch": 4.82272,
"grad_norm": 0.00135684272286996,
"learning_rate": 1.5509687744744262e-07,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.51240742020309e-05,
"step": 5025,
"valid_targets_mean": 3842.5,
"valid_targets_min": 2001
},
{
"epoch": 4.82752,
"grad_norm": 0.0014588129404354,
"learning_rate": 1.468804972869786e-07,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.749809548025951e-05,
"step": 5030,
"valid_targets_mean": 4380.7,
"valid_targets_min": 1829
},
{
"epoch": 4.83232,
"grad_norm": 0.0011513349659320153,
"learning_rate": 1.3888691325465886e-07,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 2.5042725610546768e-05,
"step": 5035,
"valid_targets_mean": 4936.8,
"valid_targets_min": 1838
},
{
"epoch": 4.83712,
"grad_norm": 0.0014964758267286004,
"learning_rate": 1.3111621505626616e-07,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.30040929839015e-05,
"step": 5040,
"valid_targets_mean": 3460.6,
"valid_targets_min": 1836
},
{
"epoch": 4.84192,
"grad_norm": 0.0017164816439846106,
"learning_rate": 1.235684898963041e-07,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 4.070202703587711e-05,
"step": 5045,
"valid_targets_mean": 3200.8,
"valid_targets_min": 1680
},
{
"epoch": 4.84672,
"grad_norm": 0.0015533880396124476,
"learning_rate": 1.1624382247702681e-07,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.0546980269718915e-05,
"step": 5050,
"valid_targets_mean": 3411.6,
"valid_targets_min": 1719
},
{
"epoch": 4.85152,
"grad_norm": 0.0010019739894339837,
"learning_rate": 1.0914229499748186e-07,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 2.7109126676805317e-05,
"step": 5055,
"valid_targets_mean": 4662.9,
"valid_targets_min": 1918
},
{
"epoch": 4.85632,
"grad_norm": 0.0012845399103813841,
"learning_rate": 1.0226398715259322e-07,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 4.92291510454379e-05,
"step": 5060,
"valid_targets_mean": 3564.8,
"valid_targets_min": 1829
},
{
"epoch": 4.86112,
"grad_norm": 0.0011385205570641132,
"learning_rate": 9.560897613226205e-08,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.4021744795609266e-05,
"step": 5065,
"valid_targets_mean": 4878.3,
"valid_targets_min": 2041
},
{
"epoch": 4.86592,
"grad_norm": 0.0012616009743158724,
"learning_rate": 8.917733662050287e-08,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.472245953162201e-05,
"step": 5070,
"valid_targets_mean": 5015.9,
"valid_targets_min": 1921
},
{
"epoch": 4.87072,
"grad_norm": 0.001155635403330904,
"learning_rate": 8.296914079461094e-08,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 2.9761726182186976e-05,
"step": 5075,
"valid_targets_mean": 5231.2,
"valid_targets_min": 1839
},
{
"epoch": 4.87552,
"grad_norm": 0.0013659832914605808,
"learning_rate": 7.698445832433843e-08,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.441186709096655e-05,
"step": 5080,
"valid_targets_mean": 4165.3,
"valid_targets_min": 1877
},
{
"epoch": 4.88032,
"grad_norm": 0.0012340347205992707,
"learning_rate": 7.122335637112621e-08,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 4.069916030857712e-05,
"step": 5085,
"valid_targets_mean": 4010.7,
"valid_targets_min": 1751
},
{
"epoch": 4.88512,
"grad_norm": 0.001273691882930067,
"learning_rate": 6.568589958734218e-08,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.6386449210112914e-05,
"step": 5090,
"valid_targets_mean": 3385.9,
"valid_targets_min": 1857
},
{
"epoch": 4.88992,
"grad_norm": 0.001393496913272501,
"learning_rate": 6.037215011556185e-08,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 4.061328218085691e-05,
"step": 5095,
"valid_targets_mean": 4302.8,
"valid_targets_min": 1938
},
{
"epoch": 4.8947199999999995,
"grad_norm": 0.0013498594145078644,
"learning_rate": 5.5282167587862314e-08,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.7743702705483884e-05,
"step": 5100,
"valid_targets_mean": 4179.5,
"valid_targets_min": 2008
},
{
"epoch": 4.89952,
"grad_norm": 0.0014143037065501012,
"learning_rate": 5.041600912516264e-08,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 4.063945380039513e-05,
"step": 5105,
"valid_targets_mean": 3860.1,
"valid_targets_min": 1836
},
{
"epoch": 4.90432,
"grad_norm": 0.0014140500655952196,
"learning_rate": 4.5773729336577865e-08,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.08784656226635e-05,
"step": 5110,
"valid_targets_mean": 3286.4,
"valid_targets_min": 2030
},
{
"epoch": 4.90912,
"grad_norm": 0.0017234645985855681,
"learning_rate": 4.1355380318803816e-08,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 4.182319753454067e-05,
"step": 5115,
"valid_targets_mean": 3396.9,
"valid_targets_min": 1601
},
{
"epoch": 4.91392,
"grad_norm": 0.0011229129262111707,
"learning_rate": 3.7161011655535425e-08,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.045425000891555e-05,
"step": 5120,
"valid_targets_mean": 3276.5,
"valid_targets_min": 1914
},
{
"epoch": 4.91872,
"grad_norm": 0.001192187863420458,
"learning_rate": 3.319067041691604e-08,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 2.9014812753302976e-05,
"step": 5125,
"valid_targets_mean": 3593.7,
"valid_targets_min": 1763
},
{
"epoch": 4.92352,
"grad_norm": 0.0015182017551724832,
"learning_rate": 2.9444401158995606e-08,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.1434181437361985e-05,
"step": 5130,
"valid_targets_mean": 2530.2,
"valid_targets_min": 1993
},
{
"epoch": 4.92832,
"grad_norm": 0.0011932741963916822,
"learning_rate": 2.5922245923244436e-08,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 4.078323399880901e-05,
"step": 5135,
"valid_targets_mean": 3796.1,
"valid_targets_min": 1976
},
{
"epoch": 4.93312,
"grad_norm": 0.001550202425571585,
"learning_rate": 2.2624244236071348e-08,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 5.0727601774269715e-05,
"step": 5140,
"valid_targets_mean": 3348.7,
"valid_targets_min": 1829
},
{
"epoch": 4.93792,
"grad_norm": 0.0013292556967572553,
"learning_rate": 1.9550433108384005e-08,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.335079236421734e-05,
"step": 5145,
"valid_targets_mean": 3704.0,
"valid_targets_min": 1877
},
{
"epoch": 4.94272,
"grad_norm": 0.0014035126325946453,
"learning_rate": 1.6700847035180378e-08,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 2.1342160835047252e-05,
"step": 5150,
"valid_targets_mean": 4230.9,
"valid_targets_min": 1786
},
{
"epoch": 4.94752,
"grad_norm": 0.0014310478819625216,
"learning_rate": 1.4075517995146837e-08,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.299306990811601e-05,
"step": 5155,
"valid_targets_mean": 4439.9,
"valid_targets_min": 1949
},
{
"epoch": 4.95232,
"grad_norm": 0.0015978203559360326,
"learning_rate": 1.167447545031175e-08,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.916247806046158e-05,
"step": 5160,
"valid_targets_mean": 3008.0,
"valid_targets_min": 2091
},
{
"epoch": 4.95712,
"grad_norm": 0.0011164404550244923,
"learning_rate": 9.497746345705772e-09,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.2907188142417e-05,
"step": 5165,
"valid_targets_mean": 4431.3,
"valid_targets_min": 1705
},
{
"epoch": 4.96192,
"grad_norm": 0.0012503279471786264,
"learning_rate": 7.545355109073172e-09,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 2.4081882656901143e-05,
"step": 5170,
"valid_targets_mean": 3681.2,
"valid_targets_min": 1727
},
{
"epoch": 4.9667200000000005,
"grad_norm": 0.001375435267226282,
"learning_rate": 5.817323650578743e-09,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 4.076618643011898e-05,
"step": 5175,
"valid_targets_mean": 3616.1,
"valid_targets_min": 2113
},
{
"epoch": 4.97152,
"grad_norm": 0.0016537587168405621,
"learning_rate": 4.313671362576877e-09,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 4.502938827499747e-05,
"step": 5180,
"valid_targets_mean": 2839.1,
"valid_targets_min": 1705
},
{
"epoch": 4.97632,
"grad_norm": 0.0016762299883309327,
"learning_rate": 3.0344151193917316e-09,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 4.7856032324489206e-05,
"step": 5185,
"valid_targets_mean": 3107.3,
"valid_targets_min": 1919
},
{
"epoch": 4.98112,
"grad_norm": 0.0021278546575005703,
"learning_rate": 1.979569277117399e-09,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.744456626009196e-05,
"step": 5190,
"valid_targets_mean": 3881.2,
"valid_targets_min": 2103
},
{
"epoch": 4.98592,
"grad_norm": 0.00150027232141985,
"learning_rate": 1.1491456734713524e-09,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 3.7057245208416134e-05,
"step": 5195,
"valid_targets_mean": 3717.0,
"valid_targets_min": 1838
},
{
"epoch": 4.99072,
"grad_norm": 0.0010896481788440953,
"learning_rate": 5.431536276523375e-10,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 2.905803376052063e-05,
"step": 5200,
"valid_targets_mean": 4881.5,
"valid_targets_min": 1900
},
{
"epoch": 4.99552,
"grad_norm": 0.001501183108511998,
"learning_rate": 1.6159994023601245e-10,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 4.9408565246267244e-05,
"step": 5205,
"valid_targets_mean": 3176.6,
"valid_targets_min": 1952
},
{
"epoch": 5.0,
"grad_norm": 0.0016249555548919574,
"learning_rate": 4.488893106113779e-12,
"loss": 0.0001,
"loss_nan_ranks": 0,
"loss_rank_avg": 5.124273229739629e-05,
"step": 5210,
"valid_targets_mean": 3937.9,
"valid_targets_min": 1868
},
{
"epoch": 5.0,
"step": 5210,
"total_flos": 6.749812417674346e+18,
"train_loss": 0.0,
"train_runtime": 1.2275,
"train_samples_per_second": 407324.551,
"train_steps_per_second": 4244.322
}
],
"logging_steps": 5,
"max_steps": 5210,
"num_input_tokens_seen": 0,
"num_train_epochs": 5,
"save_steps": 300,
"stateful_callbacks": {
"TrainerControl": {
"args": {
"should_epoch_stop": false,
"should_evaluate": false,
"should_log": false,
"should_save": true,
"should_training_stop": true
},
"attributes": {}
}
},
"total_flos": 6.749812417674346e+18,
"train_batch_size": 1,
"trial_name": null,
"trial_params": null
}