Files
g1_diverse_tezos_100k_8b/trainer_state.json
ModelHub XC 9efbcb8fae 初始化项目,由ModelHub XC社区提供模型
Model: DCAgent/g1_diverse_tezos_100k_8b
Source: Original Platform
2026-05-03 03:14:19 +08:00

13959 lines
389 KiB
JSON

{
"best_global_step": null,
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 7.0,
"eval_steps": 500,
"global_step": 6328,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.005534034311012728,
"grad_norm": 22.573869688184732,
"learning_rate": 2.527646129541864e-07,
"loss": 0.8221,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3871062695980072,
"step": 5,
"valid_targets_mean": 6579.2,
"valid_targets_min": 1651
},
{
"epoch": 0.011068068622025456,
"grad_norm": 19.583965059989275,
"learning_rate": 5.687203791469194e-07,
"loss": 0.818,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38075920939445496,
"step": 10,
"valid_targets_mean": 6844.8,
"valid_targets_min": 2928
},
{
"epoch": 0.016602102933038185,
"grad_norm": 10.39723815630763,
"learning_rate": 8.846761453396525e-07,
"loss": 0.7289,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36340269446372986,
"step": 15,
"valid_targets_mean": 6970.2,
"valid_targets_min": 1816
},
{
"epoch": 0.02213613724405091,
"grad_norm": 3.0485900232610743,
"learning_rate": 1.2006319115323856e-06,
"loss": 0.6323,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3266253173351288,
"step": 20,
"valid_targets_mean": 7589.0,
"valid_targets_min": 2058
},
{
"epoch": 0.02767017155506364,
"grad_norm": 1.535701101825782,
"learning_rate": 1.5165876777251187e-06,
"loss": 0.5703,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2894801199436188,
"step": 25,
"valid_targets_mean": 7366.7,
"valid_targets_min": 3293
},
{
"epoch": 0.03320420586607637,
"grad_norm": 1.0808344775071332,
"learning_rate": 1.8325434439178516e-06,
"loss": 0.5208,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2558213472366333,
"step": 30,
"valid_targets_mean": 6763.6,
"valid_targets_min": 2844
},
{
"epoch": 0.0387382401770891,
"grad_norm": 0.7808300398981991,
"learning_rate": 2.148499210110585e-06,
"loss": 0.508,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2513916790485382,
"step": 35,
"valid_targets_mean": 6678.9,
"valid_targets_min": 2465
},
{
"epoch": 0.04427227448810182,
"grad_norm": 0.4538559560104941,
"learning_rate": 2.4644549763033174e-06,
"loss": 0.4735,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22647960484027863,
"step": 40,
"valid_targets_mean": 7128.3,
"valid_targets_min": 2482
},
{
"epoch": 0.04980630879911455,
"grad_norm": 0.44569451067957555,
"learning_rate": 2.7804107424960508e-06,
"loss": 0.4509,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21913795173168182,
"step": 45,
"valid_targets_mean": 6365.0,
"valid_targets_min": 1594
},
{
"epoch": 0.05534034311012728,
"grad_norm": 0.37638104680350243,
"learning_rate": 3.096366508688784e-06,
"loss": 0.4326,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21242153644561768,
"step": 50,
"valid_targets_mean": 6929.4,
"valid_targets_min": 2099
},
{
"epoch": 0.06087437742114001,
"grad_norm": 0.340887327503334,
"learning_rate": 3.412322274881517e-06,
"loss": 0.4184,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17877615988254547,
"step": 55,
"valid_targets_mean": 6168.6,
"valid_targets_min": 1277
},
{
"epoch": 0.06640841173215274,
"grad_norm": 0.23882053545013524,
"learning_rate": 3.72827804107425e-06,
"loss": 0.4048,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17955751717090607,
"step": 60,
"valid_targets_mean": 6729.7,
"valid_targets_min": 2910
},
{
"epoch": 0.07194244604316546,
"grad_norm": 0.24725932657940633,
"learning_rate": 4.044233807266983e-06,
"loss": 0.3949,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18898995220661163,
"step": 65,
"valid_targets_mean": 6594.8,
"valid_targets_min": 1941
},
{
"epoch": 0.0774764803541782,
"grad_norm": 0.22636276011564896,
"learning_rate": 4.360189573459716e-06,
"loss": 0.3861,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18377459049224854,
"step": 70,
"valid_targets_mean": 6777.4,
"valid_targets_min": 2598
},
{
"epoch": 0.08301051466519092,
"grad_norm": 0.21545729413371376,
"learning_rate": 4.676145339652449e-06,
"loss": 0.3705,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18341968953609467,
"step": 75,
"valid_targets_mean": 6707.7,
"valid_targets_min": 2313
},
{
"epoch": 0.08854454897620365,
"grad_norm": 0.20558446498893868,
"learning_rate": 4.9921011058451815e-06,
"loss": 0.3739,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1936556100845337,
"step": 80,
"valid_targets_mean": 7161.9,
"valid_targets_min": 1638
},
{
"epoch": 0.09407858328721638,
"grad_norm": 0.19767479431879417,
"learning_rate": 5.308056872037915e-06,
"loss": 0.3719,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18940621614456177,
"step": 85,
"valid_targets_mean": 7025.5,
"valid_targets_min": 3109
},
{
"epoch": 0.0996126175982291,
"grad_norm": 0.19295545512857692,
"learning_rate": 5.624012638230648e-06,
"loss": 0.3668,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1677761822938919,
"step": 90,
"valid_targets_mean": 6895.4,
"valid_targets_min": 2040
},
{
"epoch": 0.10514665190924184,
"grad_norm": 0.2020435352377361,
"learning_rate": 5.939968404423381e-06,
"loss": 0.352,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1823124885559082,
"step": 95,
"valid_targets_mean": 6505.2,
"valid_targets_min": 2623
},
{
"epoch": 0.11068068622025456,
"grad_norm": 0.19088643214652315,
"learning_rate": 6.255924170616115e-06,
"loss": 0.3369,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17667806148529053,
"step": 100,
"valid_targets_mean": 6831.8,
"valid_targets_min": 2450
},
{
"epoch": 0.11621472053126729,
"grad_norm": 0.1990091606136358,
"learning_rate": 6.571879936808847e-06,
"loss": 0.3472,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1750369668006897,
"step": 105,
"valid_targets_mean": 6923.1,
"valid_targets_min": 3116
},
{
"epoch": 0.12174875484228002,
"grad_norm": 0.218232857308847,
"learning_rate": 6.8878357030015805e-06,
"loss": 0.3481,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15672846138477325,
"step": 110,
"valid_targets_mean": 6147.5,
"valid_targets_min": 2014
},
{
"epoch": 0.12728278915329275,
"grad_norm": 0.19960252131354672,
"learning_rate": 7.203791469194313e-06,
"loss": 0.3354,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17363061010837555,
"step": 115,
"valid_targets_mean": 6990.4,
"valid_targets_min": 2412
},
{
"epoch": 0.13281682346430548,
"grad_norm": 0.22454500068576372,
"learning_rate": 7.519747235387046e-06,
"loss": 0.3275,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1685630828142166,
"step": 120,
"valid_targets_mean": 6798.5,
"valid_targets_min": 2824
},
{
"epoch": 0.13835085777531822,
"grad_norm": 0.21833094391730726,
"learning_rate": 7.83570300157978e-06,
"loss": 0.3303,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15475989878177643,
"step": 125,
"valid_targets_mean": 7045.3,
"valid_targets_min": 2530
},
{
"epoch": 0.14388489208633093,
"grad_norm": 0.20638162571713792,
"learning_rate": 8.151658767772512e-06,
"loss": 0.3263,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1473006308078766,
"step": 130,
"valid_targets_mean": 6538.4,
"valid_targets_min": 1802
},
{
"epoch": 0.14941892639734367,
"grad_norm": 0.22358362084070507,
"learning_rate": 8.467614533965247e-06,
"loss": 0.3217,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15598450601100922,
"step": 135,
"valid_targets_mean": 6699.4,
"valid_targets_min": 2155
},
{
"epoch": 0.1549529607083564,
"grad_norm": 0.21017837829312694,
"learning_rate": 8.783570300157978e-06,
"loss": 0.3084,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14871534705162048,
"step": 140,
"valid_targets_mean": 6332.6,
"valid_targets_min": 2295
},
{
"epoch": 0.1604869950193691,
"grad_norm": 0.21622396498243057,
"learning_rate": 9.09952606635071e-06,
"loss": 0.326,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16364316642284393,
"step": 145,
"valid_targets_mean": 6915.4,
"valid_targets_min": 1863
},
{
"epoch": 0.16602102933038185,
"grad_norm": 0.21695105023925934,
"learning_rate": 9.415481832543445e-06,
"loss": 0.32,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1467968374490738,
"step": 150,
"valid_targets_mean": 6859.3,
"valid_targets_min": 1842
},
{
"epoch": 0.17155506364139458,
"grad_norm": 0.28985331992579194,
"learning_rate": 9.731437598736178e-06,
"loss": 0.3119,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15782998502254486,
"step": 155,
"valid_targets_mean": 6832.0,
"valid_targets_min": 2689
},
{
"epoch": 0.1770890979524073,
"grad_norm": 0.22934552913714118,
"learning_rate": 1.004739336492891e-05,
"loss": 0.317,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16041989624500275,
"step": 160,
"valid_targets_mean": 6902.6,
"valid_targets_min": 2882
},
{
"epoch": 0.18262313226342003,
"grad_norm": 0.23762401673014116,
"learning_rate": 1.0363349131121642e-05,
"loss": 0.3127,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13668395578861237,
"step": 165,
"valid_targets_mean": 6325.6,
"valid_targets_min": 1950
},
{
"epoch": 0.18815716657443277,
"grad_norm": 0.23400047830438106,
"learning_rate": 1.0679304897314377e-05,
"loss": 0.3214,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1621910184621811,
"step": 170,
"valid_targets_mean": 7014.8,
"valid_targets_min": 2827
},
{
"epoch": 0.1936912008854455,
"grad_norm": 0.24418156895720325,
"learning_rate": 1.099526066350711e-05,
"loss": 0.3139,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15957500040531158,
"step": 175,
"valid_targets_mean": 6979.4,
"valid_targets_min": 2777
},
{
"epoch": 0.1992252351964582,
"grad_norm": 0.21969595390343435,
"learning_rate": 1.1311216429699843e-05,
"loss": 0.3048,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14138895273208618,
"step": 180,
"valid_targets_mean": 6767.5,
"valid_targets_min": 2923
},
{
"epoch": 0.20475926950747095,
"grad_norm": 0.23779818602920866,
"learning_rate": 1.1627172195892576e-05,
"loss": 0.3127,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15995411574840546,
"step": 185,
"valid_targets_mean": 6852.5,
"valid_targets_min": 2299
},
{
"epoch": 0.21029330381848368,
"grad_norm": 0.2299655072817694,
"learning_rate": 1.1943127962085309e-05,
"loss": 0.3104,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14684586226940155,
"step": 190,
"valid_targets_mean": 6578.0,
"valid_targets_min": 1726
},
{
"epoch": 0.2158273381294964,
"grad_norm": 0.2242595706921999,
"learning_rate": 1.2259083728278043e-05,
"loss": 0.3091,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14662371575832367,
"step": 195,
"valid_targets_mean": 6188.8,
"valid_targets_min": 2385
},
{
"epoch": 0.22136137244050913,
"grad_norm": 0.22118820017723173,
"learning_rate": 1.2575039494470776e-05,
"loss": 0.2985,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13862204551696777,
"step": 200,
"valid_targets_mean": 6247.0,
"valid_targets_min": 1759
},
{
"epoch": 0.22689540675152187,
"grad_norm": 0.586152646493132,
"learning_rate": 1.2890995260663507e-05,
"loss": 0.4144,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24356555938720703,
"step": 205,
"valid_targets_mean": 3846.9,
"valid_targets_min": 1635
},
{
"epoch": 0.23242944106253458,
"grad_norm": 0.40113982026614686,
"learning_rate": 1.320695102685624e-05,
"loss": 0.4594,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24281583726406097,
"step": 210,
"valid_targets_mean": 4104.0,
"valid_targets_min": 1728
},
{
"epoch": 0.2379634753735473,
"grad_norm": 0.3587578081191217,
"learning_rate": 1.3522906793048973e-05,
"loss": 0.4383,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2290240079164505,
"step": 215,
"valid_targets_mean": 5437.0,
"valid_targets_min": 2245
},
{
"epoch": 0.24349750968456005,
"grad_norm": 0.3001740341699114,
"learning_rate": 1.3838862559241708e-05,
"loss": 0.4277,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19526934623718262,
"step": 220,
"valid_targets_mean": 4097.2,
"valid_targets_min": 1379
},
{
"epoch": 0.24903154399557278,
"grad_norm": 0.31824892620034584,
"learning_rate": 1.415481832543444e-05,
"loss": 0.4195,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2064758539199829,
"step": 225,
"valid_targets_mean": 4265.5,
"valid_targets_min": 1788
},
{
"epoch": 0.2545655783065855,
"grad_norm": 0.3003772739169376,
"learning_rate": 1.4470774091627173e-05,
"loss": 0.4264,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18863408267498016,
"step": 230,
"valid_targets_mean": 4447.0,
"valid_targets_min": 1177
},
{
"epoch": 0.26009961261759823,
"grad_norm": 0.2664070522457513,
"learning_rate": 1.4786729857819906e-05,
"loss": 0.434,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19851483404636383,
"step": 235,
"valid_targets_mean": 4379.6,
"valid_targets_min": 1555
},
{
"epoch": 0.26563364692861097,
"grad_norm": 0.2896341807388695,
"learning_rate": 1.510268562401264e-05,
"loss": 0.4292,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23082368075847626,
"step": 240,
"valid_targets_mean": 5404.9,
"valid_targets_min": 1590
},
{
"epoch": 0.2711676812396237,
"grad_norm": 0.27047837917898676,
"learning_rate": 1.5418641390205372e-05,
"loss": 0.4292,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18603259325027466,
"step": 245,
"valid_targets_mean": 4231.8,
"valid_targets_min": 1726
},
{
"epoch": 0.27670171555063644,
"grad_norm": 0.27449329042796916,
"learning_rate": 1.5734597156398107e-05,
"loss": 0.4018,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1991693377494812,
"step": 250,
"valid_targets_mean": 4803.9,
"valid_targets_min": 1700
},
{
"epoch": 0.2822357498616491,
"grad_norm": 3.0042063043416634,
"learning_rate": 1.6050552922590838e-05,
"loss": 0.4093,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18418695032596588,
"step": 255,
"valid_targets_mean": 3728.0,
"valid_targets_min": 1113
},
{
"epoch": 0.28776978417266186,
"grad_norm": 0.31439617437478307,
"learning_rate": 1.6366508688783572e-05,
"loss": 0.4058,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23006130754947662,
"step": 260,
"valid_targets_mean": 5108.4,
"valid_targets_min": 1637
},
{
"epoch": 0.2933038184836746,
"grad_norm": 0.31360285945290356,
"learning_rate": 1.6682464454976304e-05,
"loss": 0.3914,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17801325023174286,
"step": 265,
"valid_targets_mean": 4185.0,
"valid_targets_min": 2178
},
{
"epoch": 0.29883785279468733,
"grad_norm": 0.30802890709568975,
"learning_rate": 1.6998420221169038e-05,
"loss": 0.3936,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19540362060070038,
"step": 270,
"valid_targets_mean": 4341.5,
"valid_targets_min": 1581
},
{
"epoch": 0.30437188710570007,
"grad_norm": 0.30033819428446645,
"learning_rate": 1.731437598736177e-05,
"loss": 0.3955,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21151547133922577,
"step": 275,
"valid_targets_mean": 4570.1,
"valid_targets_min": 1677
},
{
"epoch": 0.3099059214167128,
"grad_norm": 0.29709854755432863,
"learning_rate": 1.7630331753554504e-05,
"loss": 0.395,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19487600028514862,
"step": 280,
"valid_targets_mean": 4621.4,
"valid_targets_min": 1831
},
{
"epoch": 0.3154399557277255,
"grad_norm": 0.31577946727287876,
"learning_rate": 1.7946287519747235e-05,
"loss": 0.4025,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2140292376279831,
"step": 285,
"valid_targets_mean": 4701.1,
"valid_targets_min": 1892
},
{
"epoch": 0.3209739900387382,
"grad_norm": 0.2771669398573801,
"learning_rate": 1.826224328593997e-05,
"loss": 0.3875,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17965345084667206,
"step": 290,
"valid_targets_mean": 4210.5,
"valid_targets_min": 1282
},
{
"epoch": 0.32650802434975096,
"grad_norm": 0.28721368651483475,
"learning_rate": 1.8578199052132704e-05,
"loss": 0.3898,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18116088211536407,
"step": 295,
"valid_targets_mean": 4092.7,
"valid_targets_min": 1552
},
{
"epoch": 0.3320420586607637,
"grad_norm": 0.2831149564492413,
"learning_rate": 1.8894154818325436e-05,
"loss": 0.3946,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16176189482212067,
"step": 300,
"valid_targets_mean": 3938.2,
"valid_targets_min": 1518
},
{
"epoch": 0.33757609297177643,
"grad_norm": 0.32797058470167983,
"learning_rate": 1.921011058451817e-05,
"loss": 0.3958,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17827928066253662,
"step": 305,
"valid_targets_mean": 3866.6,
"valid_targets_min": 1939
},
{
"epoch": 0.34311012728278917,
"grad_norm": 0.2925512265275017,
"learning_rate": 1.95260663507109e-05,
"loss": 0.3922,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20264865458011627,
"step": 310,
"valid_targets_mean": 4178.5,
"valid_targets_min": 1919
},
{
"epoch": 0.3486441615938019,
"grad_norm": 0.28525946139415165,
"learning_rate": 1.9842022116903633e-05,
"loss": 0.3916,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18759731948375702,
"step": 315,
"valid_targets_mean": 4422.5,
"valid_targets_min": 1519
},
{
"epoch": 0.3541781959048146,
"grad_norm": 0.3336622602016608,
"learning_rate": 2.015797788309637e-05,
"loss": 0.3934,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20357847213745117,
"step": 320,
"valid_targets_mean": 4715.8,
"valid_targets_min": 1890
},
{
"epoch": 0.3597122302158273,
"grad_norm": 0.27871603743410805,
"learning_rate": 2.04739336492891e-05,
"loss": 0.3897,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18295319378376007,
"step": 325,
"valid_targets_mean": 4308.6,
"valid_targets_min": 1797
},
{
"epoch": 0.36524626452684006,
"grad_norm": 0.26962841694038514,
"learning_rate": 2.0789889415481833e-05,
"loss": 0.3812,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1815447360277176,
"step": 330,
"valid_targets_mean": 4429.0,
"valid_targets_min": 1563
},
{
"epoch": 0.3707802988378528,
"grad_norm": 0.3088487589522481,
"learning_rate": 2.1105845181674568e-05,
"loss": 0.3883,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22907239198684692,
"step": 335,
"valid_targets_mean": 4832.3,
"valid_targets_min": 1789
},
{
"epoch": 0.37631433314886553,
"grad_norm": 0.30545972833166846,
"learning_rate": 2.14218009478673e-05,
"loss": 0.3813,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19862891733646393,
"step": 340,
"valid_targets_mean": 4335.4,
"valid_targets_min": 1729
},
{
"epoch": 0.38184836745987827,
"grad_norm": 0.28528331140566465,
"learning_rate": 2.1737756714060033e-05,
"loss": 0.3819,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17305584251880646,
"step": 345,
"valid_targets_mean": 3609.3,
"valid_targets_min": 1651
},
{
"epoch": 0.387382401770891,
"grad_norm": 0.2698228535419003,
"learning_rate": 2.2053712480252765e-05,
"loss": 0.3856,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19168169796466827,
"step": 350,
"valid_targets_mean": 4319.0,
"valid_targets_min": 1420
},
{
"epoch": 0.3929164360819037,
"grad_norm": 0.30836810816091687,
"learning_rate": 2.23696682464455e-05,
"loss": 0.3936,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20140843093395233,
"step": 355,
"valid_targets_mean": 4539.0,
"valid_targets_min": 1855
},
{
"epoch": 0.3984504703929164,
"grad_norm": 0.29938242402686027,
"learning_rate": 2.2685624012638234e-05,
"loss": 0.3847,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20533442497253418,
"step": 360,
"valid_targets_mean": 4650.9,
"valid_targets_min": 1295
},
{
"epoch": 0.40398450470392916,
"grad_norm": 0.29159514782037715,
"learning_rate": 2.3001579778830965e-05,
"loss": 0.3772,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17482727766036987,
"step": 365,
"valid_targets_mean": 3957.8,
"valid_targets_min": 1401
},
{
"epoch": 0.4095185390149419,
"grad_norm": 0.2960042857765756,
"learning_rate": 2.33175355450237e-05,
"loss": 0.3792,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18393875658512115,
"step": 370,
"valid_targets_mean": 4258.2,
"valid_targets_min": 1375
},
{
"epoch": 0.41505257332595463,
"grad_norm": 0.258271336122156,
"learning_rate": 2.363349131121643e-05,
"loss": 0.382,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18117231130599976,
"step": 375,
"valid_targets_mean": 4293.1,
"valid_targets_min": 1932
},
{
"epoch": 0.42058660763696737,
"grad_norm": 0.2857141427353967,
"learning_rate": 2.3949447077409165e-05,
"loss": 0.3762,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17623044550418854,
"step": 380,
"valid_targets_mean": 4114.5,
"valid_targets_min": 1761
},
{
"epoch": 0.42612064194798005,
"grad_norm": 0.28334088488972164,
"learning_rate": 2.42654028436019e-05,
"loss": 0.3655,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18481989204883575,
"step": 385,
"valid_targets_mean": 4430.8,
"valid_targets_min": 2314
},
{
"epoch": 0.4316546762589928,
"grad_norm": 0.31103800283731187,
"learning_rate": 2.458135860979463e-05,
"loss": 0.3823,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20391111075878143,
"step": 390,
"valid_targets_mean": 4497.4,
"valid_targets_min": 1599
},
{
"epoch": 0.4371887105700055,
"grad_norm": 0.3007656212158998,
"learning_rate": 2.4897314375987366e-05,
"loss": 0.3667,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20604145526885986,
"step": 395,
"valid_targets_mean": 4274.5,
"valid_targets_min": 1618
},
{
"epoch": 0.44272274488101826,
"grad_norm": 0.26889513414602545,
"learning_rate": 2.5213270142180094e-05,
"loss": 0.3719,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16915635764598846,
"step": 400,
"valid_targets_mean": 4277.4,
"valid_targets_min": 1851
},
{
"epoch": 0.448256779192031,
"grad_norm": 0.284968480654406,
"learning_rate": 2.552922590837283e-05,
"loss": 0.3769,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1831769496202469,
"step": 405,
"valid_targets_mean": 4469.7,
"valid_targets_min": 1871
},
{
"epoch": 0.45379081350304373,
"grad_norm": 0.26901256292445136,
"learning_rate": 2.5845181674565566e-05,
"loss": 0.3782,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19426560401916504,
"step": 410,
"valid_targets_mean": 4527.5,
"valid_targets_min": 1453
},
{
"epoch": 0.45932484781405647,
"grad_norm": 0.27323699028442777,
"learning_rate": 2.6161137440758294e-05,
"loss": 0.3815,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17527484893798828,
"step": 415,
"valid_targets_mean": 4689.2,
"valid_targets_min": 1243
},
{
"epoch": 0.46485888212506915,
"grad_norm": 0.26749382303257646,
"learning_rate": 2.647709320695103e-05,
"loss": 0.3783,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17316754162311554,
"step": 420,
"valid_targets_mean": 4317.8,
"valid_targets_min": 1812
},
{
"epoch": 0.4703929164360819,
"grad_norm": 0.26836824185876,
"learning_rate": 2.679304897314376e-05,
"loss": 0.3257,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12835562229156494,
"step": 425,
"valid_targets_mean": 5641.1,
"valid_targets_min": 2296
},
{
"epoch": 0.4759269507470946,
"grad_norm": 0.24793671818721102,
"learning_rate": 2.7109004739336494e-05,
"loss": 0.2676,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12962763011455536,
"step": 430,
"valid_targets_mean": 5349.0,
"valid_targets_min": 2050
},
{
"epoch": 0.48146098505810736,
"grad_norm": 0.21415649307966725,
"learning_rate": 2.742496050552923e-05,
"loss": 0.2651,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1357322484254837,
"step": 435,
"valid_targets_mean": 5783.2,
"valid_targets_min": 1845
},
{
"epoch": 0.4869950193691201,
"grad_norm": 0.2449205704557651,
"learning_rate": 2.774091627172196e-05,
"loss": 0.2486,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14369916915893555,
"step": 440,
"valid_targets_mean": 5767.9,
"valid_targets_min": 2653
},
{
"epoch": 0.49252905368013283,
"grad_norm": 0.2059316309784506,
"learning_rate": 2.8056872037914695e-05,
"loss": 0.2604,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13689398765563965,
"step": 445,
"valid_targets_mean": 5619.5,
"valid_targets_min": 2023
},
{
"epoch": 0.49806308799114557,
"grad_norm": 0.21338401994743855,
"learning_rate": 2.8372827804107426e-05,
"loss": 0.252,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.127161905169487,
"step": 450,
"valid_targets_mean": 5253.8,
"valid_targets_min": 1239
},
{
"epoch": 0.5035971223021583,
"grad_norm": 0.21754017832580447,
"learning_rate": 2.868878357030016e-05,
"loss": 0.2445,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1304529309272766,
"step": 455,
"valid_targets_mean": 5506.8,
"valid_targets_min": 2598
},
{
"epoch": 0.509131156613171,
"grad_norm": 0.2294942844909931,
"learning_rate": 2.9004739336492895e-05,
"loss": 0.2451,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11473497003316879,
"step": 460,
"valid_targets_mean": 5309.8,
"valid_targets_min": 2443
},
{
"epoch": 0.5146651909241837,
"grad_norm": 0.2196751904342027,
"learning_rate": 2.9320695102685626e-05,
"loss": 0.2371,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15007314085960388,
"step": 465,
"valid_targets_mean": 5868.3,
"valid_targets_min": 2497
},
{
"epoch": 0.5201992252351965,
"grad_norm": 0.18738709883609975,
"learning_rate": 2.963665086887836e-05,
"loss": 0.241,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10643309354782104,
"step": 470,
"valid_targets_mean": 5761.6,
"valid_targets_min": 2096
},
{
"epoch": 0.5257332595462092,
"grad_norm": 0.2175539021849619,
"learning_rate": 2.9952606635071092e-05,
"loss": 0.2425,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12912330031394958,
"step": 475,
"valid_targets_mean": 5816.0,
"valid_targets_min": 2258
},
{
"epoch": 0.5312672938572219,
"grad_norm": 0.1970812604349457,
"learning_rate": 3.0268562401263827e-05,
"loss": 0.2374,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13159504532814026,
"step": 480,
"valid_targets_mean": 5984.8,
"valid_targets_min": 2264
},
{
"epoch": 0.5368013281682347,
"grad_norm": 0.1798179806094743,
"learning_rate": 3.058451816745656e-05,
"loss": 0.2343,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13087119162082672,
"step": 485,
"valid_targets_mean": 5711.8,
"valid_targets_min": 2394
},
{
"epoch": 0.5423353624792474,
"grad_norm": 0.25288413800579274,
"learning_rate": 3.090047393364929e-05,
"loss": 0.2339,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1277281939983368,
"step": 490,
"valid_targets_mean": 5680.3,
"valid_targets_min": 2487
},
{
"epoch": 0.5478693967902601,
"grad_norm": 0.22610447769390982,
"learning_rate": 3.121642969984203e-05,
"loss": 0.2296,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11709853261709213,
"step": 495,
"valid_targets_mean": 5869.9,
"valid_targets_min": 2655
},
{
"epoch": 0.5534034311012729,
"grad_norm": 0.47954836253427174,
"learning_rate": 3.153238546603476e-05,
"loss": 0.231,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11786717921495438,
"step": 500,
"valid_targets_mean": 5479.9,
"valid_targets_min": 2153
},
{
"epoch": 0.5589374654122855,
"grad_norm": 0.23140780959919824,
"learning_rate": 3.184834123222749e-05,
"loss": 0.2406,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12131712585687637,
"step": 505,
"valid_targets_mean": 5297.5,
"valid_targets_min": 1932
},
{
"epoch": 0.5644714997232982,
"grad_norm": 0.20491642615826702,
"learning_rate": 3.216429699842023e-05,
"loss": 0.2332,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11049050092697144,
"step": 510,
"valid_targets_mean": 5783.3,
"valid_targets_min": 944
},
{
"epoch": 0.570005534034311,
"grad_norm": 0.20016014346656516,
"learning_rate": 3.248025276461296e-05,
"loss": 0.2288,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10679373145103455,
"step": 515,
"valid_targets_mean": 5570.2,
"valid_targets_min": 2844
},
{
"epoch": 0.5755395683453237,
"grad_norm": 0.23789726284137908,
"learning_rate": 3.279620853080569e-05,
"loss": 0.2294,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11191616207361221,
"step": 520,
"valid_targets_mean": 5753.7,
"valid_targets_min": 2045
},
{
"epoch": 0.5810736026563365,
"grad_norm": 0.22722793613585027,
"learning_rate": 3.311216429699842e-05,
"loss": 0.2373,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1198091134428978,
"step": 525,
"valid_targets_mean": 5353.3,
"valid_targets_min": 2316
},
{
"epoch": 0.5866076369673492,
"grad_norm": 0.21981373105431526,
"learning_rate": 3.342812006319116e-05,
"loss": 0.2335,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11608002334833145,
"step": 530,
"valid_targets_mean": 5618.7,
"valid_targets_min": 2144
},
{
"epoch": 0.5921416712783619,
"grad_norm": 0.21244635954118507,
"learning_rate": 3.374407582938389e-05,
"loss": 0.2327,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11392959952354431,
"step": 535,
"valid_targets_mean": 5338.1,
"valid_targets_min": 1731
},
{
"epoch": 0.5976757055893747,
"grad_norm": 0.19933294250504463,
"learning_rate": 3.406003159557662e-05,
"loss": 0.2255,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12038113921880722,
"step": 540,
"valid_targets_mean": 5883.8,
"valid_targets_min": 2583
},
{
"epoch": 0.6032097399003874,
"grad_norm": 0.22758141250939715,
"learning_rate": 3.437598736176936e-05,
"loss": 0.2324,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11625228077173233,
"step": 545,
"valid_targets_mean": 5300.8,
"valid_targets_min": 1973
},
{
"epoch": 0.6087437742114001,
"grad_norm": 0.21233039772834064,
"learning_rate": 3.4691943127962084e-05,
"loss": 0.2295,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12226393818855286,
"step": 550,
"valid_targets_mean": 5928.1,
"valid_targets_min": 3227
},
{
"epoch": 0.6142778085224129,
"grad_norm": 0.21065540622054063,
"learning_rate": 3.500789889415482e-05,
"loss": 0.2366,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11683835834264755,
"step": 555,
"valid_targets_mean": 5923.1,
"valid_targets_min": 2392
},
{
"epoch": 0.6198118428334256,
"grad_norm": 0.21163909369812556,
"learning_rate": 3.532385466034755e-05,
"loss": 0.2228,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10224387794733047,
"step": 560,
"valid_targets_mean": 5607.5,
"valid_targets_min": 1927
},
{
"epoch": 0.6253458771444383,
"grad_norm": 0.18564813482011772,
"learning_rate": 3.5639810426540284e-05,
"loss": 0.2207,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13485325872898102,
"step": 565,
"valid_targets_mean": 5891.4,
"valid_targets_min": 1659
},
{
"epoch": 0.630879911455451,
"grad_norm": 0.18394726290312965,
"learning_rate": 3.595576619273302e-05,
"loss": 0.2258,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11927980184555054,
"step": 570,
"valid_targets_mean": 5810.3,
"valid_targets_min": 2797
},
{
"epoch": 0.6364139457664637,
"grad_norm": 0.2233018855151671,
"learning_rate": 3.6271721958925753e-05,
"loss": 0.2224,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1191728413105011,
"step": 575,
"valid_targets_mean": 5845.2,
"valid_targets_min": 2085
},
{
"epoch": 0.6419479800774764,
"grad_norm": 0.18891122067095578,
"learning_rate": 3.6587677725118485e-05,
"loss": 0.2232,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10877739638090134,
"step": 580,
"valid_targets_mean": 5777.4,
"valid_targets_min": 2375
},
{
"epoch": 0.6474820143884892,
"grad_norm": 0.22782608500286497,
"learning_rate": 3.690363349131122e-05,
"loss": 0.2279,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11073682457208633,
"step": 585,
"valid_targets_mean": 5355.5,
"valid_targets_min": 1462
},
{
"epoch": 0.6530160486995019,
"grad_norm": 0.18715533043352361,
"learning_rate": 3.7219589257503954e-05,
"loss": 0.223,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10883685946464539,
"step": 590,
"valid_targets_mean": 5619.6,
"valid_targets_min": 2248
},
{
"epoch": 0.6585500830105147,
"grad_norm": 0.1807423599008659,
"learning_rate": 3.7535545023696685e-05,
"loss": 0.2263,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11599501967430115,
"step": 595,
"valid_targets_mean": 5980.5,
"valid_targets_min": 2300
},
{
"epoch": 0.6640841173215274,
"grad_norm": 0.18248038573986183,
"learning_rate": 3.7851500789889416e-05,
"loss": 0.2236,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11335260421037674,
"step": 600,
"valid_targets_mean": 5847.6,
"valid_targets_min": 3518
},
{
"epoch": 0.6696181516325401,
"grad_norm": 0.2003961315282654,
"learning_rate": 3.8167456556082154e-05,
"loss": 0.2192,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11822617799043655,
"step": 605,
"valid_targets_mean": 5279.1,
"valid_targets_min": 2145
},
{
"epoch": 0.6751521859435529,
"grad_norm": 0.18542784290777958,
"learning_rate": 3.8483412322274885e-05,
"loss": 0.2229,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11544450372457504,
"step": 610,
"valid_targets_mean": 5963.4,
"valid_targets_min": 1785
},
{
"epoch": 0.6806862202545656,
"grad_norm": 0.19641417454190124,
"learning_rate": 3.8799368088467617e-05,
"loss": 0.2271,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12316196411848068,
"step": 615,
"valid_targets_mean": 5615.0,
"valid_targets_min": 1880
},
{
"epoch": 0.6862202545655783,
"grad_norm": 0.1874576999126586,
"learning_rate": 3.9115323854660355e-05,
"loss": 0.2255,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10751807689666748,
"step": 620,
"valid_targets_mean": 5902.0,
"valid_targets_min": 2804
},
{
"epoch": 0.6917542888765911,
"grad_norm": 0.24128158732751992,
"learning_rate": 3.943127962085308e-05,
"loss": 0.215,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10644346475601196,
"step": 625,
"valid_targets_mean": 5319.6,
"valid_targets_min": 2528
},
{
"epoch": 0.6972883231876038,
"grad_norm": 0.18947226772815468,
"learning_rate": 3.974723538704582e-05,
"loss": 0.2219,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10888642817735672,
"step": 630,
"valid_targets_mean": 5529.9,
"valid_targets_min": 2824
},
{
"epoch": 0.7028223574986165,
"grad_norm": 0.19843731199616285,
"learning_rate": 3.999999695692766e-05,
"loss": 0.2117,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10342171043157578,
"step": 635,
"valid_targets_mean": 5210.4,
"valid_targets_min": 2273
},
{
"epoch": 0.7083563918096292,
"grad_norm": 0.18980116649020176,
"learning_rate": 3.999989044949274e-05,
"loss": 0.2181,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1191055178642273,
"step": 640,
"valid_targets_mean": 5708.2,
"valid_targets_min": 2025
},
{
"epoch": 0.7138904261206419,
"grad_norm": 0.20411494778223988,
"learning_rate": 3.999963178936651e-05,
"loss": 0.2203,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10782010108232498,
"step": 645,
"valid_targets_mean": 5535.9,
"valid_targets_min": 2354
},
{
"epoch": 0.7194244604316546,
"grad_norm": 0.17255710493878107,
"learning_rate": 3.999922097851675e-05,
"loss": 0.2248,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11195490509271622,
"step": 650,
"valid_targets_mean": 5587.0,
"valid_targets_min": 2655
},
{
"epoch": 0.7249584947426674,
"grad_norm": 0.18555854481909534,
"learning_rate": 3.9998658020068784e-05,
"loss": 0.2167,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10752513259649277,
"step": 655,
"valid_targets_mean": 5726.0,
"valid_targets_min": 1536
},
{
"epoch": 0.7304925290536801,
"grad_norm": 0.18167748433444353,
"learning_rate": 3.999794291830542e-05,
"loss": 0.2149,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11595481634140015,
"step": 660,
"valid_targets_mean": 5276.6,
"valid_targets_min": 1725
},
{
"epoch": 0.7360265633646929,
"grad_norm": 0.18817894948873296,
"learning_rate": 3.9997075678666916e-05,
"loss": 0.2201,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10897151380777359,
"step": 665,
"valid_targets_mean": 4917.2,
"valid_targets_min": 1306
},
{
"epoch": 0.7415605976757056,
"grad_norm": 0.18637142332630313,
"learning_rate": 3.999605630775096e-05,
"loss": 0.2144,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10294731706380844,
"step": 670,
"valid_targets_mean": 5920.3,
"valid_targets_min": 2692
},
{
"epoch": 0.7470946319867183,
"grad_norm": 0.1785392311851408,
"learning_rate": 3.999488481331258e-05,
"loss": 0.2144,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09978693723678589,
"step": 675,
"valid_targets_mean": 5935.9,
"valid_targets_min": 2414
},
{
"epoch": 0.7526286662977311,
"grad_norm": 0.20179880948163537,
"learning_rate": 3.9993561204264146e-05,
"loss": 0.227,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10697966814041138,
"step": 680,
"valid_targets_mean": 5286.9,
"valid_targets_min": 1052
},
{
"epoch": 0.7581627006087438,
"grad_norm": 0.36865020584556263,
"learning_rate": 3.9992085490675234e-05,
"loss": 0.3649,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20275266468524933,
"step": 685,
"valid_targets_mean": 4064.5,
"valid_targets_min": 2223
},
{
"epoch": 0.7636967349197565,
"grad_norm": 0.3368021068093887,
"learning_rate": 3.99904576837726e-05,
"loss": 0.3874,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19558501243591309,
"step": 690,
"valid_targets_mean": 4034.0,
"valid_targets_min": 1203
},
{
"epoch": 0.7692307692307693,
"grad_norm": 0.30594385458337714,
"learning_rate": 3.998867779594006e-05,
"loss": 0.3743,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19384127855300903,
"step": 695,
"valid_targets_mean": 4315.0,
"valid_targets_min": 1773
},
{
"epoch": 0.774764803541782,
"grad_norm": 0.2690179495002744,
"learning_rate": 3.9986745840718436e-05,
"loss": 0.3582,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1699591875076294,
"step": 700,
"valid_targets_mean": 4799.0,
"valid_targets_min": 1603
},
{
"epoch": 0.7802988378527946,
"grad_norm": 0.23845997029468932,
"learning_rate": 3.998466183280542e-05,
"loss": 0.3494,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17642243206501007,
"step": 705,
"valid_targets_mean": 4921.9,
"valid_targets_min": 1695
},
{
"epoch": 0.7858328721638074,
"grad_norm": 0.23728225244280673,
"learning_rate": 3.9982425788055466e-05,
"loss": 0.3414,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17517788708209991,
"step": 710,
"valid_targets_mean": 4232.0,
"valid_targets_min": 1416
},
{
"epoch": 0.7913669064748201,
"grad_norm": 0.2404569963674739,
"learning_rate": 3.998003772347968e-05,
"loss": 0.3365,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17175722122192383,
"step": 715,
"valid_targets_mean": 7718.0,
"valid_targets_min": 1254
},
{
"epoch": 0.7969009407858328,
"grad_norm": 0.23498357970697878,
"learning_rate": 3.9977497657245674e-05,
"loss": 0.3235,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17249642312526703,
"step": 720,
"valid_targets_mean": 7411.9,
"valid_targets_min": 1367
},
{
"epoch": 0.8024349750968456,
"grad_norm": 0.21293551752089374,
"learning_rate": 3.9974805608677465e-05,
"loss": 0.3035,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14262016117572784,
"step": 725,
"valid_targets_mean": 6794.7,
"valid_targets_min": 1002
},
{
"epoch": 0.8079690094078583,
"grad_norm": 0.35505785754047214,
"learning_rate": 3.9971961598255274e-05,
"loss": 0.3056,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1443863958120346,
"step": 730,
"valid_targets_mean": 7931.0,
"valid_targets_min": 2635
},
{
"epoch": 0.813503043718871,
"grad_norm": 0.18843536910159747,
"learning_rate": 3.9968965647615425e-05,
"loss": 0.2952,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1430182307958603,
"step": 735,
"valid_targets_mean": 7836.5,
"valid_targets_min": 1113
},
{
"epoch": 0.8190370780298838,
"grad_norm": 0.20338764208992186,
"learning_rate": 3.9965817779550126e-05,
"loss": 0.2866,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13604462146759033,
"step": 740,
"valid_targets_mean": 8004.7,
"valid_targets_min": 2354
},
{
"epoch": 0.8245711123408965,
"grad_norm": 0.1532663067966529,
"learning_rate": 3.996251801800734e-05,
"loss": 0.2615,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12938176095485687,
"step": 745,
"valid_targets_mean": 14621.4,
"valid_targets_min": 1121
},
{
"epoch": 0.8301051466519093,
"grad_norm": 0.14561220287672735,
"learning_rate": 3.9959066388090597e-05,
"loss": 0.2438,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12480156868696213,
"step": 750,
"valid_targets_mean": 13730.6,
"valid_targets_min": 5627
},
{
"epoch": 0.835639180962922,
"grad_norm": 0.1407702815224483,
"learning_rate": 3.995546291605877e-05,
"loss": 0.2393,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12473263591527939,
"step": 755,
"valid_targets_mean": 13851.5,
"valid_targets_min": 2420
},
{
"epoch": 0.8411732152739347,
"grad_norm": 0.14372957684020582,
"learning_rate": 3.995170762932591e-05,
"loss": 0.2389,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11691296845674515,
"step": 760,
"valid_targets_mean": 10187.0,
"valid_targets_min": 4526
},
{
"epoch": 0.8467072495849475,
"grad_norm": 0.2323270872047143,
"learning_rate": 3.994780055646102e-05,
"loss": 0.2814,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13866698741912842,
"step": 765,
"valid_targets_mean": 7247.6,
"valid_targets_min": 1894
},
{
"epoch": 0.8522412838959601,
"grad_norm": 0.22739619288922386,
"learning_rate": 3.994374172718785e-05,
"loss": 0.2786,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12408073991537094,
"step": 770,
"valid_targets_mean": 7225.9,
"valid_targets_min": 1279
},
{
"epoch": 0.8577753182069728,
"grad_norm": 0.39006362577079406,
"learning_rate": 3.993953117238466e-05,
"loss": 0.2878,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16530466079711914,
"step": 775,
"valid_targets_mean": 4795.3,
"valid_targets_min": 1685
},
{
"epoch": 0.8633093525179856,
"grad_norm": 0.3242688535462117,
"learning_rate": 3.993516892408398e-05,
"loss": 0.311,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1452576369047165,
"step": 780,
"valid_targets_mean": 4640.0,
"valid_targets_min": 1767
},
{
"epoch": 0.8688433868289983,
"grad_norm": 0.25941774708005494,
"learning_rate": 3.993065501547238e-05,
"loss": 0.3072,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14877530932426453,
"step": 785,
"valid_targets_mean": 4969.9,
"valid_targets_min": 1543
},
{
"epoch": 0.874377421140011,
"grad_norm": 0.2304050970573324,
"learning_rate": 3.992598948089024e-05,
"loss": 0.3115,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1475018709897995,
"step": 790,
"valid_targets_mean": 4724.9,
"valid_targets_min": 1634
},
{
"epoch": 0.8799114554510238,
"grad_norm": 0.260910096283691,
"learning_rate": 3.99211723558314e-05,
"loss": 0.3167,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1795371174812317,
"step": 795,
"valid_targets_mean": 3955.6,
"valid_targets_min": 1829
},
{
"epoch": 0.8854454897620365,
"grad_norm": 0.22463559577059178,
"learning_rate": 3.9916203676943016e-05,
"loss": 0.348,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1876264065504074,
"step": 800,
"valid_targets_mean": 5335.9,
"valid_targets_min": 2041
},
{
"epoch": 0.8909795240730493,
"grad_norm": 0.21762357743673363,
"learning_rate": 3.991108348202518e-05,
"loss": 0.3516,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19074296951293945,
"step": 805,
"valid_targets_mean": 5668.2,
"valid_targets_min": 1895
},
{
"epoch": 0.896513558384062,
"grad_norm": 0.22305146954992916,
"learning_rate": 3.9905811810030676e-05,
"loss": 0.3351,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15585224330425262,
"step": 810,
"valid_targets_mean": 5241.9,
"valid_targets_min": 2052
},
{
"epoch": 0.9020475926950747,
"grad_norm": 0.25423401454979944,
"learning_rate": 3.9900388701064676e-05,
"loss": 0.3442,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1668250560760498,
"step": 815,
"valid_targets_mean": 4501.1,
"valid_targets_min": 1859
},
{
"epoch": 0.9075816270060875,
"grad_norm": 0.22576903339912976,
"learning_rate": 3.989481419638444e-05,
"loss": 0.3375,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16919755935668945,
"step": 820,
"valid_targets_mean": 5344.1,
"valid_targets_min": 2200
},
{
"epoch": 0.9131156613171002,
"grad_norm": 0.25973565946214083,
"learning_rate": 3.988908833839899e-05,
"loss": 0.3401,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16168487071990967,
"step": 825,
"valid_targets_mean": 4667.0,
"valid_targets_min": 2131
},
{
"epoch": 0.9186496956281129,
"grad_norm": 0.24009224852265348,
"learning_rate": 3.988321117066881e-05,
"loss": 0.3335,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17461256682872772,
"step": 830,
"valid_targets_mean": 4774.7,
"valid_targets_min": 1735
},
{
"epoch": 0.9241837299391257,
"grad_norm": 0.24743671307697393,
"learning_rate": 3.987718273790548e-05,
"loss": 0.3347,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16680864989757538,
"step": 835,
"valid_targets_mean": 5840.8,
"valid_targets_min": 2338
},
{
"epoch": 0.9297177642501383,
"grad_norm": 0.26168458507079656,
"learning_rate": 3.9871003085971364e-05,
"loss": 0.3395,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17075331509113312,
"step": 840,
"valid_targets_mean": 4816.4,
"valid_targets_min": 1674
},
{
"epoch": 0.935251798561151,
"grad_norm": 0.23232107381013864,
"learning_rate": 3.986467226187926e-05,
"loss": 0.3258,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1656631976366043,
"step": 845,
"valid_targets_mean": 5732.7,
"valid_targets_min": 1854
},
{
"epoch": 0.9407858328721638,
"grad_norm": 0.27341206012899355,
"learning_rate": 3.985819031379203e-05,
"loss": 0.3265,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14391395449638367,
"step": 850,
"valid_targets_mean": 4115.7,
"valid_targets_min": 1512
},
{
"epoch": 0.9463198671831765,
"grad_norm": 0.22767348437154553,
"learning_rate": 3.9851557291022224e-05,
"loss": 0.3333,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15771305561065674,
"step": 855,
"valid_targets_mean": 5378.9,
"valid_targets_min": 2469
},
{
"epoch": 0.9518539014941892,
"grad_norm": 0.228541958830484,
"learning_rate": 3.984477324403174e-05,
"loss": 0.3227,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1492053121328354,
"step": 860,
"valid_targets_mean": 4137.5,
"valid_targets_min": 1891
},
{
"epoch": 0.957387935805202,
"grad_norm": 0.20561509877155584,
"learning_rate": 3.983783822443141e-05,
"loss": 0.3212,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15702982246875763,
"step": 865,
"valid_targets_mean": 4230.2,
"valid_targets_min": 1879
},
{
"epoch": 0.9629219701162147,
"grad_norm": 0.22705250814177763,
"learning_rate": 3.9830752284980624e-05,
"loss": 0.3203,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16598166525363922,
"step": 870,
"valid_targets_mean": 4060.4,
"valid_targets_min": 1929
},
{
"epoch": 0.9684560044272275,
"grad_norm": 0.213751893760191,
"learning_rate": 3.982351547958691e-05,
"loss": 0.3204,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1574791520833969,
"step": 875,
"valid_targets_mean": 4318.9,
"valid_targets_min": 1421
},
{
"epoch": 0.9739900387382402,
"grad_norm": 0.2299802209897319,
"learning_rate": 3.9816127863305535e-05,
"loss": 0.3127,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15395411849021912,
"step": 880,
"valid_targets_mean": 4196.6,
"valid_targets_min": 2018
},
{
"epoch": 0.9795240730492529,
"grad_norm": 0.22056896946644247,
"learning_rate": 3.9808589492339093e-05,
"loss": 0.3195,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15959514677524567,
"step": 885,
"valid_targets_mean": 4083.7,
"valid_targets_min": 1696
},
{
"epoch": 0.9850581073602657,
"grad_norm": 0.212685778198781,
"learning_rate": 3.9800900424037074e-05,
"loss": 0.3183,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1645464152097702,
"step": 890,
"valid_targets_mean": 4253.7,
"valid_targets_min": 2036
},
{
"epoch": 0.9905921416712784,
"grad_norm": 0.1917607058601535,
"learning_rate": 3.979306071689542e-05,
"loss": 0.3148,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14884722232818604,
"step": 895,
"valid_targets_mean": 4333.8,
"valid_targets_min": 1885
},
{
"epoch": 0.9961261759822911,
"grad_norm": 0.2288504359536138,
"learning_rate": 3.978507043055609e-05,
"loss": 0.3151,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15858103334903717,
"step": 900,
"valid_targets_mean": 4365.4,
"valid_targets_min": 1943
},
{
"epoch": 1.0011068068622024,
"grad_norm": 0.28075043239026515,
"learning_rate": 3.977692962580658e-05,
"loss": 0.311,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15253998339176178,
"step": 905,
"valid_targets_mean": 7176.8,
"valid_targets_min": 2475
},
{
"epoch": 1.0066408411732153,
"grad_norm": 0.25456043767832615,
"learning_rate": 3.976863836457951e-05,
"loss": 0.3125,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15757876634597778,
"step": 910,
"valid_targets_mean": 7152.2,
"valid_targets_min": 1817
},
{
"epoch": 1.012174875484228,
"grad_norm": 0.23203080605619728,
"learning_rate": 3.9760196709952105e-05,
"loss": 0.3031,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1390572041273117,
"step": 915,
"valid_targets_mean": 6413.1,
"valid_targets_min": 2694
},
{
"epoch": 1.0177089097952408,
"grad_norm": 0.19501821276663242,
"learning_rate": 3.975160472614575e-05,
"loss": 0.2928,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14973397552967072,
"step": 920,
"valid_targets_mean": 6742.4,
"valid_targets_min": 2529
},
{
"epoch": 1.0232429441062534,
"grad_norm": 0.19217358370469367,
"learning_rate": 3.974286247852547e-05,
"loss": 0.296,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13378290832042694,
"step": 925,
"valid_targets_mean": 6891.3,
"valid_targets_min": 2165
},
{
"epoch": 1.0287769784172662,
"grad_norm": 0.1958278238627834,
"learning_rate": 3.973397003359944e-05,
"loss": 0.2904,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1444612592458725,
"step": 930,
"valid_targets_mean": 6714.7,
"valid_targets_min": 1734
},
{
"epoch": 1.0343110127282789,
"grad_norm": 0.17503375002909113,
"learning_rate": 3.972492745901853e-05,
"loss": 0.2772,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14504456520080566,
"step": 935,
"valid_targets_mean": 7105.4,
"valid_targets_min": 1845
},
{
"epoch": 1.0398450470392917,
"grad_norm": 0.19689281067552836,
"learning_rate": 3.9715734823575694e-05,
"loss": 0.2844,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1314559280872345,
"step": 940,
"valid_targets_mean": 6475.6,
"valid_targets_min": 2297
},
{
"epoch": 1.0453790813503043,
"grad_norm": 0.17574426136805996,
"learning_rate": 3.970639219720554e-05,
"loss": 0.2814,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14803387224674225,
"step": 945,
"valid_targets_mean": 6744.1,
"valid_targets_min": 2793
},
{
"epoch": 1.0509131156613172,
"grad_norm": 0.1785812212021472,
"learning_rate": 3.969689965098375e-05,
"loss": 0.277,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12867371737957,
"step": 950,
"valid_targets_mean": 6725.4,
"valid_targets_min": 2520
},
{
"epoch": 1.0564471499723298,
"grad_norm": 0.2020877145542382,
"learning_rate": 3.968725725712652e-05,
"loss": 0.2812,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1310427039861679,
"step": 955,
"valid_targets_mean": 6286.6,
"valid_targets_min": 2643
},
{
"epoch": 1.0619811842833426,
"grad_norm": 0.17480637632142337,
"learning_rate": 3.9677465088990086e-05,
"loss": 0.2827,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14058233797550201,
"step": 960,
"valid_targets_mean": 6647.1,
"valid_targets_min": 2218
},
{
"epoch": 1.0675152185943553,
"grad_norm": 0.18176363686246289,
"learning_rate": 3.966752322107008e-05,
"loss": 0.2821,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14324791729450226,
"step": 965,
"valid_targets_mean": 6991.6,
"valid_targets_min": 3271
},
{
"epoch": 1.073049252905368,
"grad_norm": 0.18316339501001513,
"learning_rate": 3.965743172900101e-05,
"loss": 0.2791,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1419498324394226,
"step": 970,
"valid_targets_mean": 7175.3,
"valid_targets_min": 1805
},
{
"epoch": 1.0785832872163807,
"grad_norm": 0.17368634878804703,
"learning_rate": 3.964719068955569e-05,
"loss": 0.2774,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12790296971797943,
"step": 975,
"valid_targets_mean": 6327.0,
"valid_targets_min": 1224
},
{
"epoch": 1.0841173215273934,
"grad_norm": 0.18090420263161394,
"learning_rate": 3.963680018064462e-05,
"loss": 0.2763,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16885483264923096,
"step": 980,
"valid_targets_mean": 7451.6,
"valid_targets_min": 1864
},
{
"epoch": 1.0896513558384062,
"grad_norm": 0.1697452461712111,
"learning_rate": 3.962626028131545e-05,
"loss": 0.2809,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15592683851718903,
"step": 985,
"valid_targets_mean": 7721.9,
"valid_targets_min": 3662
},
{
"epoch": 1.0951853901494188,
"grad_norm": 0.17748411877088877,
"learning_rate": 3.9615571071752305e-05,
"loss": 0.2793,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14733010530471802,
"step": 990,
"valid_targets_mean": 7039.7,
"valid_targets_min": 1698
},
{
"epoch": 1.1007194244604317,
"grad_norm": 0.17111740120076824,
"learning_rate": 3.960473263327523e-05,
"loss": 0.288,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15300166606903076,
"step": 995,
"valid_targets_mean": 7115.9,
"valid_targets_min": 1492
},
{
"epoch": 1.1062534587714443,
"grad_norm": 0.16650248420319466,
"learning_rate": 3.9593745048339564e-05,
"loss": 0.2724,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12374699115753174,
"step": 1000,
"valid_targets_mean": 6713.1,
"valid_targets_min": 2543
},
{
"epoch": 1.1117874930824572,
"grad_norm": 0.1678513032654032,
"learning_rate": 3.958260840053528e-05,
"loss": 0.268,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1383708268404007,
"step": 1005,
"valid_targets_mean": 6488.6,
"valid_targets_min": 2556
},
{
"epoch": 1.1173215273934698,
"grad_norm": 0.18025520979543855,
"learning_rate": 3.957132277458642e-05,
"loss": 0.2777,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14708085358142853,
"step": 1010,
"valid_targets_mean": 7216.3,
"valid_targets_min": 1992
},
{
"epoch": 1.1228555617044826,
"grad_norm": 0.19456611664282664,
"learning_rate": 3.9559888256350335e-05,
"loss": 0.2791,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1300152689218521,
"step": 1015,
"valid_targets_mean": 6421.9,
"valid_targets_min": 2444
},
{
"epoch": 1.1283895960154953,
"grad_norm": 0.16137239816538576,
"learning_rate": 3.9548304932817164e-05,
"loss": 0.2715,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1205127164721489,
"step": 1020,
"valid_targets_mean": 6405.9,
"valid_targets_min": 2545
},
{
"epoch": 1.1339236303265081,
"grad_norm": 0.17348272652206792,
"learning_rate": 3.9536572892109066e-05,
"loss": 0.2678,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12615039944648743,
"step": 1025,
"valid_targets_mean": 6837.7,
"valid_targets_min": 2151
},
{
"epoch": 1.1394576646375207,
"grad_norm": 0.18148333043463813,
"learning_rate": 3.9524692223479624e-05,
"loss": 0.2677,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15118034183979034,
"step": 1030,
"valid_targets_mean": 7361.1,
"valid_targets_min": 2378
},
{
"epoch": 1.1449916989485334,
"grad_norm": 0.18131447382404747,
"learning_rate": 3.951266301731311e-05,
"loss": 0.2737,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1340409368276596,
"step": 1035,
"valid_targets_mean": 6319.2,
"valid_targets_min": 2356
},
{
"epoch": 1.1505257332595462,
"grad_norm": 0.163951472238804,
"learning_rate": 3.950048536512383e-05,
"loss": 0.2654,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11924827098846436,
"step": 1040,
"valid_targets_mean": 6630.8,
"valid_targets_min": 1972
},
{
"epoch": 1.156059767570559,
"grad_norm": 0.17678653243995013,
"learning_rate": 3.948815935955542e-05,
"loss": 0.2594,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.141445592045784,
"step": 1045,
"valid_targets_mean": 6972.9,
"valid_targets_min": 2135
},
{
"epoch": 1.1615938018815717,
"grad_norm": 0.16588165744271002,
"learning_rate": 3.947568509438013e-05,
"loss": 0.2737,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13333432376384735,
"step": 1050,
"valid_targets_mean": 6707.8,
"valid_targets_min": 1871
},
{
"epoch": 1.1671278361925843,
"grad_norm": 0.17341045683221493,
"learning_rate": 3.946306266449814e-05,
"loss": 0.2648,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12358522415161133,
"step": 1055,
"valid_targets_mean": 6739.1,
"valid_targets_min": 2150
},
{
"epoch": 1.1726618705035972,
"grad_norm": 0.17207704447771158,
"learning_rate": 3.945029216593682e-05,
"loss": 0.2671,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13025973737239838,
"step": 1060,
"valid_targets_mean": 6861.2,
"valid_targets_min": 2514
},
{
"epoch": 1.1781959048146098,
"grad_norm": 0.16244557894426362,
"learning_rate": 3.943737369584997e-05,
"loss": 0.2725,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1395055502653122,
"step": 1065,
"valid_targets_mean": 7224.6,
"valid_targets_min": 2698
},
{
"epoch": 1.1837299391256226,
"grad_norm": 0.16903966101182416,
"learning_rate": 3.942430735251714e-05,
"loss": 0.2661,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13284917175769806,
"step": 1070,
"valid_targets_mean": 6807.6,
"valid_targets_min": 2279
},
{
"epoch": 1.1892639734366353,
"grad_norm": 0.5838918039734643,
"learning_rate": 3.941109323534284e-05,
"loss": 0.2748,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13204120099544525,
"step": 1075,
"valid_targets_mean": 6986.2,
"valid_targets_min": 2280
},
{
"epoch": 1.194798007747648,
"grad_norm": 0.1619581813660958,
"learning_rate": 3.9397731444855784e-05,
"loss": 0.2691,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1205381453037262,
"step": 1080,
"valid_targets_mean": 6668.9,
"valid_targets_min": 3573
},
{
"epoch": 1.2003320420586607,
"grad_norm": 0.17972197349829508,
"learning_rate": 3.9384222082708154e-05,
"loss": 0.2646,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14235249161720276,
"step": 1085,
"valid_targets_mean": 7348.7,
"valid_targets_min": 2266
},
{
"epoch": 1.2058660763696736,
"grad_norm": 0.17975739708819172,
"learning_rate": 3.93705652516748e-05,
"loss": 0.2709,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13401982188224792,
"step": 1090,
"valid_targets_mean": 6718.5,
"valid_targets_min": 1852
},
{
"epoch": 1.2114001106806862,
"grad_norm": 0.16450821294263088,
"learning_rate": 3.935676105565249e-05,
"loss": 0.2661,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11176055669784546,
"step": 1095,
"valid_targets_mean": 6317.0,
"valid_targets_min": 1890
},
{
"epoch": 1.2169341449916988,
"grad_norm": 0.18586118472743715,
"learning_rate": 3.934280959965905e-05,
"loss": 0.2717,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12307751178741455,
"step": 1100,
"valid_targets_mean": 6423.0,
"valid_targets_min": 1961
},
{
"epoch": 1.2224681793027117,
"grad_norm": 0.16354727134618027,
"learning_rate": 3.932871098983266e-05,
"loss": 0.2596,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13544310629367828,
"step": 1105,
"valid_targets_mean": 6961.5,
"valid_targets_min": 2011
},
{
"epoch": 1.2280022136137245,
"grad_norm": 0.26445155244963164,
"learning_rate": 3.931446533343097e-05,
"loss": 0.3569,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16654008626937866,
"step": 1110,
"valid_targets_mean": 4264.4,
"valid_targets_min": 1664
},
{
"epoch": 1.2335362479247372,
"grad_norm": 0.259149059080008,
"learning_rate": 3.9300072738830326e-05,
"loss": 0.3616,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17894653975963593,
"step": 1115,
"valid_targets_mean": 4403.8,
"valid_targets_min": 1896
},
{
"epoch": 1.2390702822357498,
"grad_norm": 0.2532394954077379,
"learning_rate": 3.928553331552493e-05,
"loss": 0.3613,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17868827283382416,
"step": 1120,
"valid_targets_mean": 4392.9,
"valid_targets_min": 1282
},
{
"epoch": 1.2446043165467626,
"grad_norm": 0.2355989102476764,
"learning_rate": 3.9270847174126e-05,
"loss": 0.3472,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16397854685783386,
"step": 1125,
"valid_targets_mean": 4179.3,
"valid_targets_min": 1998
},
{
"epoch": 1.2501383508577752,
"grad_norm": 0.23545544996639933,
"learning_rate": 3.925601442636095e-05,
"loss": 0.3505,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17215688526630402,
"step": 1130,
"valid_targets_mean": 4410.1,
"valid_targets_min": 1629
},
{
"epoch": 1.255672385168788,
"grad_norm": 0.23534951612683017,
"learning_rate": 3.924103518507251e-05,
"loss": 0.3587,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1638919711112976,
"step": 1135,
"valid_targets_mean": 4081.9,
"valid_targets_min": 1820
},
{
"epoch": 1.2612064194798007,
"grad_norm": 0.23489838611021904,
"learning_rate": 3.922590956421792e-05,
"loss": 0.3711,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18799881637096405,
"step": 1140,
"valid_targets_mean": 4430.3,
"valid_targets_min": 1591
},
{
"epoch": 1.2667404537908136,
"grad_norm": 0.231684281912992,
"learning_rate": 3.921063767886799e-05,
"loss": 0.3596,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15110845863819122,
"step": 1145,
"valid_targets_mean": 3639.0,
"valid_targets_min": 1609
},
{
"epoch": 1.2722744881018262,
"grad_norm": 0.22883238121740831,
"learning_rate": 3.9195219645206286e-05,
"loss": 0.3636,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17991988360881805,
"step": 1150,
"valid_targets_mean": 4169.2,
"valid_targets_min": 2003
},
{
"epoch": 1.277808522412839,
"grad_norm": 0.23839713321871983,
"learning_rate": 3.917965558052822e-05,
"loss": 0.3403,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18226949870586395,
"step": 1155,
"valid_targets_mean": 4387.5,
"valid_targets_min": 1802
},
{
"epoch": 1.2833425567238517,
"grad_norm": 0.22438517731822086,
"learning_rate": 3.9163945603240144e-05,
"loss": 0.3532,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18129350244998932,
"step": 1160,
"valid_targets_mean": 4586.4,
"valid_targets_min": 1431
},
{
"epoch": 1.2888765910348643,
"grad_norm": 0.2470833669018919,
"learning_rate": 3.914808983285848e-05,
"loss": 0.3448,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15314365923404694,
"step": 1165,
"valid_targets_mean": 4150.2,
"valid_targets_min": 1451
},
{
"epoch": 1.2944106253458771,
"grad_norm": 0.22268292074124693,
"learning_rate": 3.913208839000882e-05,
"loss": 0.3358,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1547563523054123,
"step": 1170,
"valid_targets_mean": 4058.3,
"valid_targets_min": 1500
},
{
"epoch": 1.29994465965689,
"grad_norm": 0.23898654391290106,
"learning_rate": 3.911594139642493e-05,
"loss": 0.3392,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17526842653751373,
"step": 1175,
"valid_targets_mean": 4309.4,
"valid_targets_min": 1370
},
{
"epoch": 1.3054786939679026,
"grad_norm": 0.21380823907483926,
"learning_rate": 3.909964897494793e-05,
"loss": 0.3351,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16898113489151,
"step": 1180,
"valid_targets_mean": 4254.8,
"valid_targets_min": 1915
},
{
"epoch": 1.3110127282789152,
"grad_norm": 0.26882185157487465,
"learning_rate": 3.9083211249525277e-05,
"loss": 0.3429,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16856753826141357,
"step": 1185,
"valid_targets_mean": 3897.5,
"valid_targets_min": 1699
},
{
"epoch": 1.316546762589928,
"grad_norm": 0.2309951770435585,
"learning_rate": 3.906662834520987e-05,
"loss": 0.345,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1852109432220459,
"step": 1190,
"valid_targets_mean": 4873.8,
"valid_targets_min": 1374
},
{
"epoch": 1.3220807969009407,
"grad_norm": 0.21792217488268217,
"learning_rate": 3.904990038815907e-05,
"loss": 0.3336,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1790103316307068,
"step": 1195,
"valid_targets_mean": 4314.8,
"valid_targets_min": 1526
},
{
"epoch": 1.3276148312119536,
"grad_norm": 0.23123270794811962,
"learning_rate": 3.903302750563376e-05,
"loss": 0.333,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14537380635738373,
"step": 1200,
"valid_targets_mean": 3668.5,
"valid_targets_min": 1735
},
{
"epoch": 1.3331488655229662,
"grad_norm": 0.2693499746386558,
"learning_rate": 3.901600982599737e-05,
"loss": 0.3463,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15684859454631805,
"step": 1205,
"valid_targets_mean": 4198.7,
"valid_targets_min": 1587
},
{
"epoch": 1.338682899833979,
"grad_norm": 0.21173376275796202,
"learning_rate": 3.89988474787149e-05,
"loss": 0.3347,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16322259604930878,
"step": 1210,
"valid_targets_mean": 4426.8,
"valid_targets_min": 1624
},
{
"epoch": 1.3442169341449917,
"grad_norm": 0.24726409366171126,
"learning_rate": 3.898154059435192e-05,
"loss": 0.3403,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15184156596660614,
"step": 1215,
"valid_targets_mean": 3844.5,
"valid_targets_min": 1660
},
{
"epoch": 1.3497509684560045,
"grad_norm": 0.21934453532998735,
"learning_rate": 3.896408930457361e-05,
"loss": 0.3386,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16550517082214355,
"step": 1220,
"valid_targets_mean": 4607.4,
"valid_targets_min": 1446
},
{
"epoch": 1.3552850027670171,
"grad_norm": 0.22442116015233177,
"learning_rate": 3.8946493742143744e-05,
"loss": 0.3346,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17187415063381195,
"step": 1225,
"valid_targets_mean": 4620.0,
"valid_targets_min": 1843
},
{
"epoch": 1.3608190370780298,
"grad_norm": 0.20627885478063304,
"learning_rate": 3.8928754040923645e-05,
"loss": 0.329,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1436220407485962,
"step": 1230,
"valid_targets_mean": 4062.0,
"valid_targets_min": 1629
},
{
"epoch": 1.3663530713890426,
"grad_norm": 0.2185699711014017,
"learning_rate": 3.891087033587122e-05,
"loss": 0.3308,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1684235781431198,
"step": 1235,
"valid_targets_mean": 4552.9,
"valid_targets_min": 1687
},
{
"epoch": 1.3718871057000555,
"grad_norm": 0.21370744728285102,
"learning_rate": 3.889284276303992e-05,
"loss": 0.3326,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14738354086875916,
"step": 1240,
"valid_targets_mean": 4288.0,
"valid_targets_min": 1735
},
{
"epoch": 1.377421140011068,
"grad_norm": 0.22076208540817957,
"learning_rate": 3.887467145957768e-05,
"loss": 0.3288,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16767971217632294,
"step": 1245,
"valid_targets_mean": 4494.9,
"valid_targets_min": 1742
},
{
"epoch": 1.3829551743220807,
"grad_norm": 0.2258390472368909,
"learning_rate": 3.8856356563725874e-05,
"loss": 0.3273,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17086593806743622,
"step": 1250,
"valid_targets_mean": 4560.7,
"valid_targets_min": 1850
},
{
"epoch": 1.3884892086330936,
"grad_norm": 0.23613538896669242,
"learning_rate": 3.883789821481832e-05,
"loss": 0.3303,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17400549352169037,
"step": 1255,
"valid_targets_mean": 4525.4,
"valid_targets_min": 1488
},
{
"epoch": 1.3940232429441062,
"grad_norm": 0.23064138194881575,
"learning_rate": 3.881929655328016e-05,
"loss": 0.3311,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1510716825723648,
"step": 1260,
"valid_targets_mean": 4337.6,
"valid_targets_min": 1551
},
{
"epoch": 1.399557277255119,
"grad_norm": 0.2400505261171503,
"learning_rate": 3.8800551720626794e-05,
"loss": 0.331,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14990423619747162,
"step": 1265,
"valid_targets_mean": 4064.8,
"valid_targets_min": 1260
},
{
"epoch": 1.4050913115661317,
"grad_norm": 0.24599218182439966,
"learning_rate": 3.878166385946286e-05,
"loss": 0.3232,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16412757337093353,
"step": 1270,
"valid_targets_mean": 4271.5,
"valid_targets_min": 1965
},
{
"epoch": 1.4106253458771445,
"grad_norm": 0.21566388081545748,
"learning_rate": 3.876263311348108e-05,
"loss": 0.3238,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1625698059797287,
"step": 1275,
"valid_targets_mean": 4530.3,
"valid_targets_min": 1812
},
{
"epoch": 1.4161593801881571,
"grad_norm": 0.20195854254771664,
"learning_rate": 3.874345962746121e-05,
"loss": 0.3225,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16930294036865234,
"step": 1280,
"valid_targets_mean": 5182.0,
"valid_targets_min": 2171
},
{
"epoch": 1.42169341449917,
"grad_norm": 0.21607264069691856,
"learning_rate": 3.8724143547268924e-05,
"loss": 0.3215,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.145011767745018,
"step": 1285,
"valid_targets_mean": 4341.3,
"valid_targets_min": 1861
},
{
"epoch": 1.4272274488101826,
"grad_norm": 0.2237693296652014,
"learning_rate": 3.870468501985471e-05,
"loss": 0.3078,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15807199478149414,
"step": 1290,
"valid_targets_mean": 4484.4,
"valid_targets_min": 1651
},
{
"epoch": 1.4327614831211952,
"grad_norm": 0.22529943616165538,
"learning_rate": 3.8685084193252745e-05,
"loss": 0.3225,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15684156119823456,
"step": 1295,
"valid_targets_mean": 4192.0,
"valid_targets_min": 1684
},
{
"epoch": 1.438295517432208,
"grad_norm": 0.24576986248520252,
"learning_rate": 3.866534121657977e-05,
"loss": 0.3152,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1745026856660843,
"step": 1300,
"valid_targets_mean": 4869.7,
"valid_targets_min": 1745
},
{
"epoch": 1.443829551743221,
"grad_norm": 0.21766701909656544,
"learning_rate": 3.8645456240033946e-05,
"loss": 0.3122,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14245377480983734,
"step": 1305,
"valid_targets_mean": 3970.9,
"valid_targets_min": 1643
},
{
"epoch": 1.4493635860542335,
"grad_norm": 0.21818942722818285,
"learning_rate": 3.8625429414893763e-05,
"loss": 0.3247,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14716601371765137,
"step": 1310,
"valid_targets_mean": 4239.2,
"valid_targets_min": 1695
},
{
"epoch": 1.4548976203652462,
"grad_norm": 0.21251289322826,
"learning_rate": 3.860526089351679e-05,
"loss": 0.3214,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16402918100357056,
"step": 1315,
"valid_targets_mean": 4571.5,
"valid_targets_min": 1696
},
{
"epoch": 1.460431654676259,
"grad_norm": 0.2336086082990606,
"learning_rate": 3.858495082933864e-05,
"loss": 0.3239,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.163013756275177,
"step": 1320,
"valid_targets_mean": 4433.2,
"valid_targets_min": 2003
},
{
"epoch": 1.4659656889872716,
"grad_norm": 0.2396576832714152,
"learning_rate": 3.8564499376871694e-05,
"loss": 0.3212,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15132392942905426,
"step": 1325,
"valid_targets_mean": 4008.7,
"valid_targets_min": 1371
},
{
"epoch": 1.4714997232982845,
"grad_norm": 0.18098797137211153,
"learning_rate": 3.854390669170397e-05,
"loss": 0.2381,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10818668454885483,
"step": 1330,
"valid_targets_mean": 5755.9,
"valid_targets_min": 1607
},
{
"epoch": 1.4770337576092971,
"grad_norm": 0.1787066797313889,
"learning_rate": 3.852317293049796e-05,
"loss": 0.2039,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0983661413192749,
"step": 1335,
"valid_targets_mean": 5835.6,
"valid_targets_min": 2306
},
{
"epoch": 1.48256779192031,
"grad_norm": 0.17085975919111254,
"learning_rate": 3.8502298250989415e-05,
"loss": 0.2012,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09475555270910263,
"step": 1340,
"valid_targets_mean": 5367.4,
"valid_targets_min": 2272
},
{
"epoch": 1.4881018262313226,
"grad_norm": 0.1681837566049417,
"learning_rate": 3.8481282811986117e-05,
"loss": 0.1916,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08345619589090347,
"step": 1345,
"valid_targets_mean": 5459.6,
"valid_targets_min": 1924
},
{
"epoch": 1.4936358605423354,
"grad_norm": 0.15219321287099127,
"learning_rate": 3.8460126773366735e-05,
"loss": 0.2065,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09989086538553238,
"step": 1350,
"valid_targets_mean": 5662.9,
"valid_targets_min": 2081
},
{
"epoch": 1.499169894853348,
"grad_norm": 0.15555993992068823,
"learning_rate": 3.843883029607956e-05,
"loss": 0.2003,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09627845138311386,
"step": 1355,
"valid_targets_mean": 5408.0,
"valid_targets_min": 1663
},
{
"epoch": 1.5047039291643607,
"grad_norm": 0.1575554029684579,
"learning_rate": 3.841739354214129e-05,
"loss": 0.19,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10124339908361435,
"step": 1360,
"valid_targets_mean": 6090.0,
"valid_targets_min": 3233
},
{
"epoch": 1.5102379634753735,
"grad_norm": 0.17073776730783605,
"learning_rate": 3.839581667463582e-05,
"loss": 0.1938,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08516725152730942,
"step": 1365,
"valid_targets_mean": 5283.3,
"valid_targets_min": 2542
},
{
"epoch": 1.5157719977863864,
"grad_norm": 0.1610335812807677,
"learning_rate": 3.837409985771297e-05,
"loss": 0.1925,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10468452423810959,
"step": 1370,
"valid_targets_mean": 5841.9,
"valid_targets_min": 3074
},
{
"epoch": 1.521306032097399,
"grad_norm": 0.15022862826788239,
"learning_rate": 3.835224325658724e-05,
"loss": 0.1872,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09101595729589462,
"step": 1375,
"valid_targets_mean": 5844.2,
"valid_targets_min": 1791
},
{
"epoch": 1.5268400664084116,
"grad_norm": 0.15473274276046864,
"learning_rate": 3.8330247037536587e-05,
"loss": 0.1953,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09456873685121536,
"step": 1380,
"valid_targets_mean": 5735.6,
"valid_targets_min": 2746
},
{
"epoch": 1.5323741007194245,
"grad_norm": 0.16114760241509796,
"learning_rate": 3.830811136790112e-05,
"loss": 0.1898,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09572803229093552,
"step": 1385,
"valid_targets_mean": 5778.7,
"valid_targets_min": 2829
},
{
"epoch": 1.5379081350304373,
"grad_norm": 0.16418451727918168,
"learning_rate": 3.8285836416081846e-05,
"loss": 0.1861,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08751516789197922,
"step": 1390,
"valid_targets_mean": 5638.1,
"valid_targets_min": 1955
},
{
"epoch": 1.54344216934145,
"grad_norm": 0.15617353071730314,
"learning_rate": 3.826342235153939e-05,
"loss": 0.1859,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0809503123164177,
"step": 1395,
"valid_targets_mean": 5649.6,
"valid_targets_min": 1657
},
{
"epoch": 1.5489762036524626,
"grad_norm": 0.1687895202850322,
"learning_rate": 3.82408693447927e-05,
"loss": 0.1849,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09529554843902588,
"step": 1400,
"valid_targets_mean": 5870.3,
"valid_targets_min": 3122
},
{
"epoch": 1.5545102379634754,
"grad_norm": 0.15097236666408503,
"learning_rate": 3.821817756741774e-05,
"loss": 0.1852,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08635803312063217,
"step": 1405,
"valid_targets_mean": 5898.3,
"valid_targets_min": 2722
},
{
"epoch": 1.560044272274488,
"grad_norm": 0.17377232093918724,
"learning_rate": 3.819534719204621e-05,
"loss": 0.1959,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0999286100268364,
"step": 1410,
"valid_targets_mean": 5430.9,
"valid_targets_min": 1832
},
{
"epoch": 1.565578306585501,
"grad_norm": 0.15515421991156828,
"learning_rate": 3.8172378392364215e-05,
"loss": 0.1846,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09400574117898941,
"step": 1415,
"valid_targets_mean": 5711.7,
"valid_targets_min": 1876
},
{
"epoch": 1.5711123408965135,
"grad_norm": 0.18249126639634058,
"learning_rate": 3.814927134311095e-05,
"loss": 0.1823,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08851730823516846,
"step": 1420,
"valid_targets_mean": 5817.8,
"valid_targets_min": 3349
},
{
"epoch": 1.5766463752075262,
"grad_norm": 0.17463154504582576,
"learning_rate": 3.812602622007736e-05,
"loss": 0.1873,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10670870542526245,
"step": 1425,
"valid_targets_mean": 6213.9,
"valid_targets_min": 2486
},
{
"epoch": 1.582180409518539,
"grad_norm": 0.15520876012616955,
"learning_rate": 3.810264320010482e-05,
"loss": 0.1907,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10215985029935837,
"step": 1430,
"valid_targets_mean": 5960.8,
"valid_targets_min": 1760
},
{
"epoch": 1.5877144438295518,
"grad_norm": 0.15302405983671816,
"learning_rate": 3.807912246108377e-05,
"loss": 0.1867,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08349398523569107,
"step": 1435,
"valid_targets_mean": 5431.6,
"valid_targets_min": 1939
},
{
"epoch": 1.5932484781405645,
"grad_norm": 0.1638805599904952,
"learning_rate": 3.805546418195237e-05,
"loss": 0.1879,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09607791155576706,
"step": 1440,
"valid_targets_mean": 5619.5,
"valid_targets_min": 1402
},
{
"epoch": 1.598782512451577,
"grad_norm": 0.16184784396834395,
"learning_rate": 3.8031668542695164e-05,
"loss": 0.1821,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09894770383834839,
"step": 1445,
"valid_targets_mean": 5685.0,
"valid_targets_min": 1115
},
{
"epoch": 1.60431654676259,
"grad_norm": 0.14470877256991516,
"learning_rate": 3.800773572434166e-05,
"loss": 0.1828,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08206525444984436,
"step": 1450,
"valid_targets_mean": 5896.3,
"valid_targets_min": 2249
},
{
"epoch": 1.6098505810736028,
"grad_norm": 0.1616847234283941,
"learning_rate": 3.7983665908965006e-05,
"loss": 0.1882,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08751017600297928,
"step": 1455,
"valid_targets_mean": 5286.9,
"valid_targets_min": 2419
},
{
"epoch": 1.6153846153846154,
"grad_norm": 0.16780432753063682,
"learning_rate": 3.795945927968055e-05,
"loss": 0.1891,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09756562858819962,
"step": 1460,
"valid_targets_mean": 5907.0,
"valid_targets_min": 2764
},
{
"epoch": 1.620918649695628,
"grad_norm": 0.15430952235574313,
"learning_rate": 3.7935116020644496e-05,
"loss": 0.1736,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0840432420372963,
"step": 1465,
"valid_targets_mean": 5677.7,
"valid_targets_min": 2561
},
{
"epoch": 1.626452684006641,
"grad_norm": 0.17774260453796328,
"learning_rate": 3.791063631705247e-05,
"loss": 0.1789,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08377804607152939,
"step": 1470,
"valid_targets_mean": 5690.5,
"valid_targets_min": 2153
},
{
"epoch": 1.6319867183176535,
"grad_norm": 0.15507806329693358,
"learning_rate": 3.7886020355138144e-05,
"loss": 0.1822,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09811588376760483,
"step": 1475,
"valid_targets_mean": 5799.1,
"valid_targets_min": 2167
},
{
"epoch": 1.6375207526286664,
"grad_norm": 0.16053247401611923,
"learning_rate": 3.7861268322171775e-05,
"loss": 0.1791,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1035495176911354,
"step": 1480,
"valid_targets_mean": 5970.1,
"valid_targets_min": 3079
},
{
"epoch": 1.643054786939679,
"grad_norm": 0.14849765401498888,
"learning_rate": 3.7836380406458824e-05,
"loss": 0.1756,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08759353309869766,
"step": 1485,
"valid_targets_mean": 5799.0,
"valid_targets_min": 2123
},
{
"epoch": 1.6485888212506916,
"grad_norm": 0.1605302752895466,
"learning_rate": 3.781135679733849e-05,
"loss": 0.1816,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07913342863321304,
"step": 1490,
"valid_targets_mean": 5474.9,
"valid_targets_min": 1505
},
{
"epoch": 1.6541228555617045,
"grad_norm": 0.15361664307520298,
"learning_rate": 3.77861976851823e-05,
"loss": 0.176,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07888994365930557,
"step": 1495,
"valid_targets_mean": 5696.5,
"valid_targets_min": 2150
},
{
"epoch": 1.6596568898727173,
"grad_norm": 0.16091667110596974,
"learning_rate": 3.7760903261392614e-05,
"loss": 0.1841,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08942961692810059,
"step": 1500,
"valid_targets_mean": 5482.0,
"valid_targets_min": 1925
},
{
"epoch": 1.66519092418373,
"grad_norm": 0.15842859658005418,
"learning_rate": 3.773547371840124e-05,
"loss": 0.1779,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08590523153543472,
"step": 1505,
"valid_targets_mean": 5700.8,
"valid_targets_min": 2524
},
{
"epoch": 1.6707249584947426,
"grad_norm": 0.15930986743197398,
"learning_rate": 3.77099092496679e-05,
"loss": 0.1772,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09003861993551254,
"step": 1510,
"valid_targets_mean": 5443.2,
"valid_targets_min": 1992
},
{
"epoch": 1.6762589928057554,
"grad_norm": 0.15717236223857892,
"learning_rate": 3.768421004967879e-05,
"loss": 0.1744,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08390811085700989,
"step": 1515,
"valid_targets_mean": 5506.9,
"valid_targets_min": 2062
},
{
"epoch": 1.6817930271167683,
"grad_norm": 0.16274698844769872,
"learning_rate": 3.7658376313945104e-05,
"loss": 0.181,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08415307849645615,
"step": 1520,
"valid_targets_mean": 5554.7,
"valid_targets_min": 2289
},
{
"epoch": 1.6873270614277809,
"grad_norm": 0.15826237180855693,
"learning_rate": 3.763240823900155e-05,
"loss": 0.1771,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08058290928602219,
"step": 1525,
"valid_targets_mean": 5283.6,
"valid_targets_min": 2511
},
{
"epoch": 1.6928610957387935,
"grad_norm": 0.15034453834066436,
"learning_rate": 3.7606306022404824e-05,
"loss": 0.172,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08194555342197418,
"step": 1530,
"valid_targets_mean": 5367.8,
"valid_targets_min": 1636
},
{
"epoch": 1.6983951300498064,
"grad_norm": 0.1583222022360076,
"learning_rate": 3.7580069862732145e-05,
"loss": 0.1757,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08407051116228104,
"step": 1535,
"valid_targets_mean": 5643.5,
"valid_targets_min": 1822
},
{
"epoch": 1.703929164360819,
"grad_norm": 0.1714358773650662,
"learning_rate": 3.7553699959579716e-05,
"loss": 0.1692,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08538398146629333,
"step": 1540,
"valid_targets_mean": 5522.8,
"valid_targets_min": 2271
},
{
"epoch": 1.7094631986718318,
"grad_norm": 0.17664480726337453,
"learning_rate": 3.7527196513561224e-05,
"loss": 0.1747,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08488353341817856,
"step": 1545,
"valid_targets_mean": 5634.4,
"valid_targets_min": 3397
},
{
"epoch": 1.7149972329828445,
"grad_norm": 0.16551892245239816,
"learning_rate": 3.750055972630631e-05,
"loss": 0.1761,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09638077020645142,
"step": 1550,
"valid_targets_mean": 5882.0,
"valid_targets_min": 1620
},
{
"epoch": 1.720531267293857,
"grad_norm": 0.17200205226469634,
"learning_rate": 3.747378980045902e-05,
"loss": 0.1785,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08725154399871826,
"step": 1555,
"valid_targets_mean": 5484.1,
"valid_targets_min": 1983
},
{
"epoch": 1.72606530160487,
"grad_norm": 0.1542667371346797,
"learning_rate": 3.744688693967629e-05,
"loss": 0.1752,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09500366449356079,
"step": 1560,
"valid_targets_mean": 6050.4,
"valid_targets_min": 2705
},
{
"epoch": 1.7315993359158828,
"grad_norm": 0.14814420685720778,
"learning_rate": 3.741985134862638e-05,
"loss": 0.1663,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08133411407470703,
"step": 1565,
"valid_targets_mean": 5951.2,
"valid_targets_min": 1263
},
{
"epoch": 1.7371333702268954,
"grad_norm": 0.15781816560926434,
"learning_rate": 3.7392683232987294e-05,
"loss": 0.1804,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08072637766599655,
"step": 1570,
"valid_targets_mean": 5333.5,
"valid_targets_min": 2761
},
{
"epoch": 1.742667404537908,
"grad_norm": 0.1635678128038785,
"learning_rate": 3.736538279944527e-05,
"loss": 0.1722,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10370779037475586,
"step": 1575,
"valid_targets_mean": 5898.5,
"valid_targets_min": 1918
},
{
"epoch": 1.7482014388489209,
"grad_norm": 0.14261265693671554,
"learning_rate": 3.7337950255693176e-05,
"loss": 0.1704,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08859887719154358,
"step": 1580,
"valid_targets_mean": 5690.7,
"valid_targets_min": 2491
},
{
"epoch": 1.7537354731599337,
"grad_norm": 0.152831569549247,
"learning_rate": 3.731038581042891e-05,
"loss": 0.1852,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10772746801376343,
"step": 1585,
"valid_targets_mean": 5855.6,
"valid_targets_min": 1834
},
{
"epoch": 1.7592695074709463,
"grad_norm": 0.2647356527516756,
"learning_rate": 3.728268967335386e-05,
"loss": 0.2809,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1324308067560196,
"step": 1590,
"valid_targets_mean": 4478.1,
"valid_targets_min": 1152
},
{
"epoch": 1.764803541781959,
"grad_norm": 0.2424881601505193,
"learning_rate": 3.7254862055171265e-05,
"loss": 0.2778,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12917517125606537,
"step": 1595,
"valid_targets_mean": 4434.4,
"valid_targets_min": 1363
},
{
"epoch": 1.7703375760929718,
"grad_norm": 0.26389469655832054,
"learning_rate": 3.7226903167584624e-05,
"loss": 0.2776,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14717340469360352,
"step": 1600,
"valid_targets_mean": 4586.5,
"valid_targets_min": 1203
},
{
"epoch": 1.7758716104039847,
"grad_norm": 0.29187032871634677,
"learning_rate": 3.7198813223296116e-05,
"loss": 0.2727,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13220685720443726,
"step": 1605,
"valid_targets_mean": 4198.7,
"valid_targets_min": 1898
},
{
"epoch": 1.7814056447149973,
"grad_norm": 0.22776258261432347,
"learning_rate": 3.7170592436004935e-05,
"loss": 0.2662,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1366225928068161,
"step": 1610,
"valid_targets_mean": 4499.3,
"valid_targets_min": 2282
},
{
"epoch": 1.78693967902601,
"grad_norm": 0.22817137768793902,
"learning_rate": 3.714224102040569e-05,
"loss": 0.261,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12853863835334778,
"step": 1615,
"valid_targets_mean": 4354.3,
"valid_targets_min": 2243
},
{
"epoch": 1.7924737133370225,
"grad_norm": 0.2229030717728699,
"learning_rate": 3.7113759192186787e-05,
"loss": 0.2478,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1050797700881958,
"step": 1620,
"valid_targets_mean": 5987.4,
"valid_targets_min": 1045
},
{
"epoch": 1.7980077476480354,
"grad_norm": 0.21115591425185332,
"learning_rate": 3.708514716802874e-05,
"loss": 0.2393,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11311844736337662,
"step": 1625,
"valid_targets_mean": 7339.2,
"valid_targets_min": 1398
},
{
"epoch": 1.8035417819590482,
"grad_norm": 0.2174003005062392,
"learning_rate": 3.705640516560257e-05,
"loss": 0.2348,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12683409452438354,
"step": 1630,
"valid_targets_mean": 7609.3,
"valid_targets_min": 2489
},
{
"epoch": 1.8090758162700609,
"grad_norm": 0.177464000416812,
"learning_rate": 3.702753340356813e-05,
"loss": 0.2397,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11056222766637802,
"step": 1635,
"valid_targets_mean": 8182.5,
"valid_targets_min": 2323
},
{
"epoch": 1.8146098505810735,
"grad_norm": 0.1870460713862642,
"learning_rate": 3.699853210157243e-05,
"loss": 0.2356,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11322402209043503,
"step": 1640,
"valid_targets_mean": 7945.0,
"valid_targets_min": 2386
},
{
"epoch": 1.8201438848920863,
"grad_norm": 0.18526910832781884,
"learning_rate": 3.6969401480247984e-05,
"loss": 0.2271,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10831591486930847,
"step": 1645,
"valid_targets_mean": 7628.4,
"valid_targets_min": 2019
},
{
"epoch": 1.8256779192030992,
"grad_norm": 0.13803254078026828,
"learning_rate": 3.694014176121114e-05,
"loss": 0.2142,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.096345454454422,
"step": 1650,
"valid_targets_mean": 13487.5,
"valid_targets_min": 1304
},
{
"epoch": 1.8312119535141118,
"grad_norm": 0.1323739468997748,
"learning_rate": 3.6910753167060366e-05,
"loss": 0.2102,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10764390230178833,
"step": 1655,
"valid_targets_mean": 14044.6,
"valid_targets_min": 2837
},
{
"epoch": 1.8367459878251244,
"grad_norm": 0.12739906419458874,
"learning_rate": 3.688123592137455e-05,
"loss": 0.2043,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09776881337165833,
"step": 1660,
"valid_targets_mean": 12808.5,
"valid_targets_min": 1264
},
{
"epoch": 1.8422800221361373,
"grad_norm": 0.18472517875224204,
"learning_rate": 3.685159024871137e-05,
"loss": 0.2074,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10981454700231552,
"step": 1665,
"valid_targets_mean": 7773.3,
"valid_targets_min": 1300
},
{
"epoch": 1.8478140564471501,
"grad_norm": 0.18058654658948134,
"learning_rate": 3.682181637460549e-05,
"loss": 0.2227,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1116521880030632,
"step": 1670,
"valid_targets_mean": 8022.5,
"valid_targets_min": 1221
},
{
"epoch": 1.8533480907581628,
"grad_norm": 0.18724230912218406,
"learning_rate": 3.67919145255669e-05,
"loss": 0.2162,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10184332728385925,
"step": 1675,
"valid_targets_mean": 7332.0,
"valid_targets_min": 935
},
{
"epoch": 1.8588821250691754,
"grad_norm": 0.284846970975493,
"learning_rate": 3.67618849290792e-05,
"loss": 0.2349,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1234837993979454,
"step": 1680,
"valid_targets_mean": 4677.9,
"valid_targets_min": 1413
},
{
"epoch": 1.864416159380188,
"grad_norm": 0.23265322355069754,
"learning_rate": 3.6731727813597826e-05,
"loss": 0.2485,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12468057125806808,
"step": 1685,
"valid_targets_mean": 5047.0,
"valid_targets_min": 1422
},
{
"epoch": 1.8699501936912009,
"grad_norm": 0.24901026147462169,
"learning_rate": 3.6701443408548356e-05,
"loss": 0.2477,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1232062578201294,
"step": 1690,
"valid_targets_mean": 4560.3,
"valid_targets_min": 2177
},
{
"epoch": 1.8754842280022137,
"grad_norm": 0.24845493572710523,
"learning_rate": 3.667103194432473e-05,
"loss": 0.2487,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12273026257753372,
"step": 1695,
"valid_targets_mean": 4750.5,
"valid_targets_min": 2094
},
{
"epoch": 1.8810182623132263,
"grad_norm": 0.21352332489113723,
"learning_rate": 3.664049365228753e-05,
"loss": 0.2592,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13580043613910675,
"step": 1700,
"valid_targets_mean": 4360.2,
"valid_targets_min": 1571
},
{
"epoch": 1.886552296624239,
"grad_norm": 0.24187118495071433,
"learning_rate": 3.66098287647622e-05,
"loss": 0.2759,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1355639547109604,
"step": 1705,
"valid_targets_mean": 4350.1,
"valid_targets_min": 1350
},
{
"epoch": 1.8920863309352518,
"grad_norm": 0.2221319087254357,
"learning_rate": 3.657903751503726e-05,
"loss": 0.2774,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1442292481660843,
"step": 1710,
"valid_targets_mean": 5759.9,
"valid_targets_min": 2496
},
{
"epoch": 1.8976203652462647,
"grad_norm": 0.22014101686720144,
"learning_rate": 3.6548120137362586e-05,
"loss": 0.2757,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13664335012435913,
"step": 1715,
"valid_targets_mean": 4665.8,
"valid_targets_min": 1862
},
{
"epoch": 1.9031543995572773,
"grad_norm": 0.19549340134656434,
"learning_rate": 3.6517076866947557e-05,
"loss": 0.2755,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1436709612607956,
"step": 1720,
"valid_targets_mean": 5136.1,
"valid_targets_min": 2075
},
{
"epoch": 1.90868843386829,
"grad_norm": 0.18788086589483333,
"learning_rate": 3.648590793995935e-05,
"loss": 0.2723,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1428404301404953,
"step": 1725,
"valid_targets_mean": 5201.3,
"valid_targets_min": 2016
},
{
"epoch": 1.9142224681793027,
"grad_norm": 0.19335780199762595,
"learning_rate": 3.645461359352104e-05,
"loss": 0.2781,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1349288523197174,
"step": 1730,
"valid_targets_mean": 5300.8,
"valid_targets_min": 1145
},
{
"epoch": 1.9197565024903156,
"grad_norm": 0.21764207689379206,
"learning_rate": 3.6423194065709906e-05,
"loss": 0.2725,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11965199559926987,
"step": 1735,
"valid_targets_mean": 4597.2,
"valid_targets_min": 1963
},
{
"epoch": 1.9252905368013282,
"grad_norm": 0.20259374288682375,
"learning_rate": 3.639164959555553e-05,
"loss": 0.2735,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12947358191013336,
"step": 1740,
"valid_targets_mean": 4532.3,
"valid_targets_min": 1109
},
{
"epoch": 1.9308245711123408,
"grad_norm": 0.2011284156115527,
"learning_rate": 3.635998042303804e-05,
"loss": 0.2784,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12850068509578705,
"step": 1745,
"valid_targets_mean": 5127.4,
"valid_targets_min": 2148
},
{
"epoch": 1.9363586054233535,
"grad_norm": 0.23379586205063374,
"learning_rate": 3.632818678908624e-05,
"loss": 0.2718,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14635328948497772,
"step": 1750,
"valid_targets_mean": 5093.4,
"valid_targets_min": 2249
},
{
"epoch": 1.9418926397343663,
"grad_norm": 0.24506410198251863,
"learning_rate": 3.629626893557581e-05,
"loss": 0.2704,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13486354053020477,
"step": 1755,
"valid_targets_mean": 4493.6,
"valid_targets_min": 1745
},
{
"epoch": 1.9474266740453792,
"grad_norm": 0.20344712413332988,
"learning_rate": 3.626422710532743e-05,
"loss": 0.272,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13823886215686798,
"step": 1760,
"valid_targets_mean": 5985.7,
"valid_targets_min": 1785
},
{
"epoch": 1.9529607083563918,
"grad_norm": 0.23951804276675492,
"learning_rate": 3.6232061542104984e-05,
"loss": 0.2608,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12460750341415405,
"step": 1765,
"valid_targets_mean": 4282.6,
"valid_targets_min": 1345
},
{
"epoch": 1.9584947426674044,
"grad_norm": 0.21081778587343794,
"learning_rate": 3.619977249061366e-05,
"loss": 0.2596,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12043123692274094,
"step": 1770,
"valid_targets_mean": 4043.1,
"valid_targets_min": 1453
},
{
"epoch": 1.9640287769784173,
"grad_norm": 0.2000956213548545,
"learning_rate": 3.6167360196498104e-05,
"loss": 0.2574,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12249448150396347,
"step": 1775,
"valid_targets_mean": 3962.6,
"valid_targets_min": 1950
},
{
"epoch": 1.9695628112894301,
"grad_norm": 0.2063885651633084,
"learning_rate": 3.6134824906340565e-05,
"loss": 0.2609,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12181480973958969,
"step": 1780,
"valid_targets_mean": 4089.9,
"valid_targets_min": 2225
},
{
"epoch": 1.9750968456004427,
"grad_norm": 0.1963326019016443,
"learning_rate": 3.610216686765899e-05,
"loss": 0.2562,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13744494318962097,
"step": 1785,
"valid_targets_mean": 4647.0,
"valid_targets_min": 1720
},
{
"epoch": 1.9806308799114554,
"grad_norm": 0.20396733516424023,
"learning_rate": 3.6069386328905156e-05,
"loss": 0.2604,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12744426727294922,
"step": 1790,
"valid_targets_mean": 4220.0,
"valid_targets_min": 1637
},
{
"epoch": 1.9861649142224682,
"grad_norm": 0.21173248608648465,
"learning_rate": 3.603648353946281e-05,
"loss": 0.2585,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12109271436929703,
"step": 1795,
"valid_targets_mean": 4065.2,
"valid_targets_min": 2020
},
{
"epoch": 1.991698948533481,
"grad_norm": 0.19300670821745727,
"learning_rate": 3.60034587496457e-05,
"loss": 0.2562,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12375432252883911,
"step": 1800,
"valid_targets_mean": 4378.8,
"valid_targets_min": 2197
},
{
"epoch": 1.9972329828444937,
"grad_norm": 0.20611442328641857,
"learning_rate": 3.597031221069575e-05,
"loss": 0.2602,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1273588091135025,
"step": 1805,
"valid_targets_mean": 4250.2,
"valid_targets_min": 2029
},
{
"epoch": 2.002213613724405,
"grad_norm": 0.25460945090750153,
"learning_rate": 3.593704417478108e-05,
"loss": 0.2396,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12178600579500198,
"step": 1810,
"valid_targets_mean": 6556.2,
"valid_targets_min": 1732
},
{
"epoch": 2.007747648035418,
"grad_norm": 0.196181622903712,
"learning_rate": 3.5903654894994156e-05,
"loss": 0.261,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12736719846725464,
"step": 1815,
"valid_targets_mean": 6745.2,
"valid_targets_min": 2595
},
{
"epoch": 2.0132816823464306,
"grad_norm": 0.18163396282759997,
"learning_rate": 3.5870144625349796e-05,
"loss": 0.2453,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12206553667783737,
"step": 1820,
"valid_targets_mean": 6414.2,
"valid_targets_min": 1804
},
{
"epoch": 2.018815716657443,
"grad_norm": 0.17498500763921046,
"learning_rate": 3.583651362078329e-05,
"loss": 0.2454,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1313360035419464,
"step": 1825,
"valid_targets_mean": 7147.8,
"valid_targets_min": 2654
},
{
"epoch": 2.024349750968456,
"grad_norm": 0.15874180378712185,
"learning_rate": 3.580276213714842e-05,
"loss": 0.2506,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12748394906520844,
"step": 1830,
"valid_targets_mean": 7391.1,
"valid_targets_min": 2506
},
{
"epoch": 2.029883785279469,
"grad_norm": 0.16967369735811572,
"learning_rate": 3.576889043121556e-05,
"loss": 0.2395,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09263142198324203,
"step": 1835,
"valid_targets_mean": 5653.9,
"valid_targets_min": 2050
},
{
"epoch": 2.0354178195904815,
"grad_norm": 0.15502565084525127,
"learning_rate": 3.573489876066967e-05,
"loss": 0.2353,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11003027111291885,
"step": 1840,
"valid_targets_mean": 6577.6,
"valid_targets_min": 2180
},
{
"epoch": 2.040951853901494,
"grad_norm": 0.17240419472611698,
"learning_rate": 3.570078738410838e-05,
"loss": 0.2407,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1300700157880783,
"step": 1845,
"valid_targets_mean": 7243.6,
"valid_targets_min": 1462
},
{
"epoch": 2.0464858882125068,
"grad_norm": 0.15041215438948005,
"learning_rate": 3.566655656104e-05,
"loss": 0.2332,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09950295835733414,
"step": 1850,
"valid_targets_mean": 5979.6,
"valid_targets_min": 2261
},
{
"epoch": 2.05201992252352,
"grad_norm": 0.16398165353835098,
"learning_rate": 3.563220655188155e-05,
"loss": 0.2321,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11267545819282532,
"step": 1855,
"valid_targets_mean": 6526.0,
"valid_targets_min": 2889
},
{
"epoch": 2.0575539568345325,
"grad_norm": 0.1644283942720737,
"learning_rate": 3.559773761795677e-05,
"loss": 0.2407,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11775601655244827,
"step": 1860,
"valid_targets_mean": 6637.4,
"valid_targets_min": 2198
},
{
"epoch": 2.063087991145545,
"grad_norm": 0.18894361057192038,
"learning_rate": 3.556315002149417e-05,
"loss": 0.2377,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11832115054130554,
"step": 1865,
"valid_targets_mean": 6630.0,
"valid_targets_min": 2447
},
{
"epoch": 2.0686220254565577,
"grad_norm": 0.15871754158886173,
"learning_rate": 3.552844402562496e-05,
"loss": 0.2404,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11108693480491638,
"step": 1870,
"valid_targets_mean": 6784.3,
"valid_targets_min": 2018
},
{
"epoch": 2.074156059767571,
"grad_norm": 0.1666703709693314,
"learning_rate": 3.5493619894381134e-05,
"loss": 0.2354,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10879040509462357,
"step": 1875,
"valid_targets_mean": 6594.1,
"valid_targets_min": 1738
},
{
"epoch": 2.0796900940785834,
"grad_norm": 0.16471460484089057,
"learning_rate": 3.5458677892693414e-05,
"loss": 0.2353,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10758719593286514,
"step": 1880,
"valid_targets_mean": 6608.3,
"valid_targets_min": 2294
},
{
"epoch": 2.085224128389596,
"grad_norm": 0.15983077692158537,
"learning_rate": 3.542361828638922e-05,
"loss": 0.2344,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11144182831048965,
"step": 1885,
"valid_targets_mean": 6807.7,
"valid_targets_min": 2459
},
{
"epoch": 2.0907581627006087,
"grad_norm": 0.16073131019754824,
"learning_rate": 3.538844134219069e-05,
"loss": 0.2404,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13222560286521912,
"step": 1890,
"valid_targets_mean": 7171.7,
"valid_targets_min": 2663
},
{
"epoch": 2.0962921970116213,
"grad_norm": 0.16666788192831658,
"learning_rate": 3.5353147327712637e-05,
"loss": 0.2378,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1460612565279007,
"step": 1895,
"valid_targets_mean": 7488.9,
"valid_targets_min": 1737
},
{
"epoch": 2.1018262313226344,
"grad_norm": 0.16460431294876285,
"learning_rate": 3.531773651146049e-05,
"loss": 0.2369,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10749489814043045,
"step": 1900,
"valid_targets_mean": 6740.6,
"valid_targets_min": 3073
},
{
"epoch": 2.107360265633647,
"grad_norm": 0.17328310563867794,
"learning_rate": 3.5282209162828264e-05,
"loss": 0.2282,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11726633459329605,
"step": 1905,
"valid_targets_mean": 7155.1,
"valid_targets_min": 2303
},
{
"epoch": 2.1128942999446596,
"grad_norm": 0.1708861905255187,
"learning_rate": 3.5246565552096536e-05,
"loss": 0.2291,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11879414319992065,
"step": 1910,
"valid_targets_mean": 6865.1,
"valid_targets_min": 3211
},
{
"epoch": 2.1184283342556722,
"grad_norm": 0.1628843755311141,
"learning_rate": 3.5210805950430366e-05,
"loss": 0.2345,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10074803978204727,
"step": 1915,
"valid_targets_mean": 6133.8,
"valid_targets_min": 3408
},
{
"epoch": 2.1239623685666853,
"grad_norm": 0.1712030155859964,
"learning_rate": 3.51749306298772e-05,
"loss": 0.2332,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11956235021352768,
"step": 1920,
"valid_targets_mean": 7243.4,
"valid_targets_min": 2661
},
{
"epoch": 2.129496402877698,
"grad_norm": 0.15855319282312255,
"learning_rate": 3.5138939863364884e-05,
"loss": 0.2309,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10077456384897232,
"step": 1925,
"valid_targets_mean": 6463.6,
"valid_targets_min": 2198
},
{
"epoch": 2.1350304371887106,
"grad_norm": 0.1731689581044804,
"learning_rate": 3.5102833924699515e-05,
"loss": 0.2294,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12133423238992691,
"step": 1930,
"valid_targets_mean": 7358.3,
"valid_targets_min": 2450
},
{
"epoch": 2.140564471499723,
"grad_norm": 0.16938213670980715,
"learning_rate": 3.5066613088563376e-05,
"loss": 0.2284,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12302404642105103,
"step": 1935,
"valid_targets_mean": 7186.7,
"valid_targets_min": 3067
},
{
"epoch": 2.146098505810736,
"grad_norm": 0.1602878817587104,
"learning_rate": 3.503027763051286e-05,
"loss": 0.225,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09725018590688705,
"step": 1940,
"valid_targets_mean": 6213.1,
"valid_targets_min": 2512
},
{
"epoch": 2.151632540121749,
"grad_norm": 0.17073852982024915,
"learning_rate": 3.499382782697638e-05,
"loss": 0.2254,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10988564044237137,
"step": 1945,
"valid_targets_mean": 6629.0,
"valid_targets_min": 2721
},
{
"epoch": 2.1571665744327615,
"grad_norm": 0.16508704276971933,
"learning_rate": 3.495726395525222e-05,
"loss": 0.2221,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11532676219940186,
"step": 1950,
"valid_targets_mean": 6951.3,
"valid_targets_min": 1410
},
{
"epoch": 2.162700608743774,
"grad_norm": 0.16850115690665773,
"learning_rate": 3.4920586293506505e-05,
"loss": 0.2326,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11975447088479996,
"step": 1955,
"valid_targets_mean": 6716.0,
"valid_targets_min": 2015
},
{
"epoch": 2.1682346430547867,
"grad_norm": 0.18027122835951337,
"learning_rate": 3.488379512077099e-05,
"loss": 0.2222,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1077960804104805,
"step": 1960,
"valid_targets_mean": 6754.2,
"valid_targets_min": 1285
},
{
"epoch": 2.1737686773658,
"grad_norm": 0.1694207004089083,
"learning_rate": 3.4846890716941005e-05,
"loss": 0.2271,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12165435403585434,
"step": 1965,
"valid_targets_mean": 7055.3,
"valid_targets_min": 1824
},
{
"epoch": 2.1793027116768124,
"grad_norm": 0.16984422107945202,
"learning_rate": 3.480987336277332e-05,
"loss": 0.2302,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1043839231133461,
"step": 1970,
"valid_targets_mean": 6240.7,
"valid_targets_min": 2520
},
{
"epoch": 2.184836745987825,
"grad_norm": 0.15928989504119623,
"learning_rate": 3.4772743339883975e-05,
"loss": 0.2276,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11364192515611649,
"step": 1975,
"valid_targets_mean": 7048.4,
"valid_targets_min": 2534
},
{
"epoch": 2.1903707802988377,
"grad_norm": 0.17238125314734223,
"learning_rate": 3.4735500930746155e-05,
"loss": 0.236,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11842123419046402,
"step": 1980,
"valid_targets_mean": 7279.1,
"valid_targets_min": 2874
},
{
"epoch": 2.1959048146098508,
"grad_norm": 0.16521197109465582,
"learning_rate": 3.469814641868806e-05,
"loss": 0.2268,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10197652131319046,
"step": 1985,
"valid_targets_mean": 6879.3,
"valid_targets_min": 2655
},
{
"epoch": 2.2014388489208634,
"grad_norm": 0.19198517275447463,
"learning_rate": 3.4660680087890724e-05,
"loss": 0.2301,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12141253799200058,
"step": 1990,
"valid_targets_mean": 7067.9,
"valid_targets_min": 2044
},
{
"epoch": 2.206972883231876,
"grad_norm": 0.16151705568785352,
"learning_rate": 3.4623102223385854e-05,
"loss": 0.2291,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12976032495498657,
"step": 1995,
"valid_targets_mean": 7770.0,
"valid_targets_min": 1537
},
{
"epoch": 2.2125069175428886,
"grad_norm": 0.18893779239098643,
"learning_rate": 3.458541311105369e-05,
"loss": 0.2279,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1286742091178894,
"step": 2000,
"valid_targets_mean": 6690.8,
"valid_targets_min": 2068
},
{
"epoch": 2.2180409518539017,
"grad_norm": 0.16505910458823952,
"learning_rate": 3.454761303762078e-05,
"loss": 0.2251,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10115599632263184,
"step": 2005,
"valid_targets_mean": 6521.1,
"valid_targets_min": 1758
},
{
"epoch": 2.2235749861649143,
"grad_norm": 0.16847553045939181,
"learning_rate": 3.4509702290657856e-05,
"loss": 0.2313,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13247986137866974,
"step": 2010,
"valid_targets_mean": 7180.3,
"valid_targets_min": 2546
},
{
"epoch": 2.229109020475927,
"grad_norm": 0.32498045972365375,
"learning_rate": 3.4471681158577604e-05,
"loss": 0.2702,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15396571159362793,
"step": 2015,
"valid_targets_mean": 4645.0,
"valid_targets_min": 1835
},
{
"epoch": 2.2346430547869396,
"grad_norm": 0.3199891571560827,
"learning_rate": 3.443354993063248e-05,
"loss": 0.2606,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1466095894575119,
"step": 2020,
"valid_targets_mean": 5546.4,
"valid_targets_min": 2098
},
{
"epoch": 2.240177089097952,
"grad_norm": 0.26512644951778497,
"learning_rate": 3.439530889691254e-05,
"loss": 0.2729,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1405329555273056,
"step": 2025,
"valid_targets_mean": 4328.5,
"valid_targets_min": 1980
},
{
"epoch": 2.2457111234089653,
"grad_norm": 0.2869325070126373,
"learning_rate": 3.4356958348343155e-05,
"loss": 0.2648,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12140665203332901,
"step": 2030,
"valid_targets_mean": 3992.0,
"valid_targets_min": 2005
},
{
"epoch": 2.251245157719978,
"grad_norm": 0.2589383495052475,
"learning_rate": 3.431849857668292e-05,
"loss": 0.268,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13259261846542358,
"step": 2035,
"valid_targets_mean": 4146.0,
"valid_targets_min": 1570
},
{
"epoch": 2.2567791920309905,
"grad_norm": 0.24535043204958112,
"learning_rate": 3.42799298745213e-05,
"loss": 0.2804,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14231093227863312,
"step": 2040,
"valid_targets_mean": 4619.1,
"valid_targets_min": 1887
},
{
"epoch": 2.262313226342003,
"grad_norm": 0.256468789178841,
"learning_rate": 3.42412525352765e-05,
"loss": 0.2788,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13515257835388184,
"step": 2045,
"valid_targets_mean": 4458.5,
"valid_targets_min": 1561
},
{
"epoch": 2.2678472606530162,
"grad_norm": 0.2524559056796063,
"learning_rate": 3.42024668531932e-05,
"loss": 0.2773,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1405826061964035,
"step": 2050,
"valid_targets_mean": 4055.2,
"valid_targets_min": 1504
},
{
"epoch": 2.273381294964029,
"grad_norm": 0.2273920463882431,
"learning_rate": 3.41635731233403e-05,
"loss": 0.2705,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11907500773668289,
"step": 2055,
"valid_targets_mean": 4350.9,
"valid_targets_min": 1772
},
{
"epoch": 2.2789153292750415,
"grad_norm": 0.2449799495311102,
"learning_rate": 3.412457164160872e-05,
"loss": 0.2638,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11413963884115219,
"step": 2060,
"valid_targets_mean": 3810.2,
"valid_targets_min": 1857
},
{
"epoch": 2.284449363586054,
"grad_norm": 0.24708374303357555,
"learning_rate": 3.408546270470909e-05,
"loss": 0.2821,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14712080359458923,
"step": 2065,
"valid_targets_mean": 4675.1,
"valid_targets_min": 1726
},
{
"epoch": 2.2899833978970667,
"grad_norm": 0.2367581615241945,
"learning_rate": 3.404624661016956e-05,
"loss": 0.2665,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13800793886184692,
"step": 2070,
"valid_targets_mean": 4311.9,
"valid_targets_min": 1715
},
{
"epoch": 2.29551743220808,
"grad_norm": 0.2417319220816092,
"learning_rate": 3.400692365633346e-05,
"loss": 0.2641,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14577551186084747,
"step": 2075,
"valid_targets_mean": 4801.3,
"valid_targets_min": 1735
},
{
"epoch": 2.3010514665190924,
"grad_norm": 0.25106235822407685,
"learning_rate": 3.39674941423571e-05,
"loss": 0.2624,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1416432410478592,
"step": 2080,
"valid_targets_mean": 4260.2,
"valid_targets_min": 2003
},
{
"epoch": 2.306585500830105,
"grad_norm": 0.22436144371235098,
"learning_rate": 3.392795836820746e-05,
"loss": 0.2565,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11476701498031616,
"step": 2085,
"valid_targets_mean": 4150.7,
"valid_targets_min": 1400
},
{
"epoch": 2.312119535141118,
"grad_norm": 0.2535443617210647,
"learning_rate": 3.38883166346599e-05,
"loss": 0.272,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14522124826908112,
"step": 2090,
"valid_targets_mean": 4290.6,
"valid_targets_min": 1471
},
{
"epoch": 2.3176535694521307,
"grad_norm": 0.21858072979627968,
"learning_rate": 3.384856924329592e-05,
"loss": 0.2661,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11835676431655884,
"step": 2095,
"valid_targets_mean": 4075.0,
"valid_targets_min": 1330
},
{
"epoch": 2.3231876037631434,
"grad_norm": 0.21954086058104552,
"learning_rate": 3.380871649650077e-05,
"loss": 0.2577,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12017607688903809,
"step": 2100,
"valid_targets_mean": 4359.4,
"valid_targets_min": 1655
},
{
"epoch": 2.328721638074156,
"grad_norm": 0.2542703005591101,
"learning_rate": 3.376875869746126e-05,
"loss": 0.2575,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12094666808843613,
"step": 2105,
"valid_targets_mean": 3815.9,
"valid_targets_min": 1415
},
{
"epoch": 2.3342556723851686,
"grad_norm": 0.251126910414918,
"learning_rate": 3.372869615016339e-05,
"loss": 0.2776,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12940432131290436,
"step": 2110,
"valid_targets_mean": 4242.0,
"valid_targets_min": 1487
},
{
"epoch": 2.3397897066961817,
"grad_norm": 0.2643944650713139,
"learning_rate": 3.3688529159390046e-05,
"loss": 0.2615,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12784574925899506,
"step": 2115,
"valid_targets_mean": 4385.7,
"valid_targets_min": 1708
},
{
"epoch": 2.3453237410071943,
"grad_norm": 0.2461152263037893,
"learning_rate": 3.364825803071869e-05,
"loss": 0.2659,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11380674690008163,
"step": 2120,
"valid_targets_mean": 3871.0,
"valid_targets_min": 1449
},
{
"epoch": 2.350857775318207,
"grad_norm": 0.2621383638045265,
"learning_rate": 3.360788307051904e-05,
"loss": 0.2696,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12078753858804703,
"step": 2125,
"valid_targets_mean": 3865.1,
"valid_targets_min": 1769
},
{
"epoch": 2.3563918096292196,
"grad_norm": 0.24641782553806202,
"learning_rate": 3.35674045859507e-05,
"loss": 0.2605,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13783816993236542,
"step": 2130,
"valid_targets_mean": 4496.6,
"valid_targets_min": 2112
},
{
"epoch": 2.3619258439402326,
"grad_norm": 0.24085148737669346,
"learning_rate": 3.35268228849609e-05,
"loss": 0.2556,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14685018360614777,
"step": 2135,
"valid_targets_mean": 4774.4,
"valid_targets_min": 1607
},
{
"epoch": 2.3674598782512453,
"grad_norm": 0.2220386797959251,
"learning_rate": 3.348613827628206e-05,
"loss": 0.2586,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1352035254240036,
"step": 2140,
"valid_targets_mean": 4803.5,
"valid_targets_min": 1845
},
{
"epoch": 2.372993912562258,
"grad_norm": 0.240284130200847,
"learning_rate": 3.3445351069429525e-05,
"loss": 0.2628,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14021100103855133,
"step": 2145,
"valid_targets_mean": 4359.3,
"valid_targets_min": 1571
},
{
"epoch": 2.3785279468732705,
"grad_norm": 0.2428089987954204,
"learning_rate": 3.340446157469916e-05,
"loss": 0.2528,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12046308070421219,
"step": 2150,
"valid_targets_mean": 4695.8,
"valid_targets_min": 1357
},
{
"epoch": 2.384061981184283,
"grad_norm": 0.26202820127755705,
"learning_rate": 3.3363470103164986e-05,
"loss": 0.2532,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11755248159170151,
"step": 2155,
"valid_targets_mean": 3991.0,
"valid_targets_min": 1560
},
{
"epoch": 2.389596015495296,
"grad_norm": 0.25794323418326875,
"learning_rate": 3.3322376966676865e-05,
"loss": 0.2621,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14617593586444855,
"step": 2160,
"valid_targets_mean": 4203.9,
"valid_targets_min": 1391
},
{
"epoch": 2.395130049806309,
"grad_norm": 0.24069832733527413,
"learning_rate": 3.328118247785807e-05,
"loss": 0.2557,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13045255839824677,
"step": 2165,
"valid_targets_mean": 4457.6,
"valid_targets_min": 1571
},
{
"epoch": 2.4006640841173215,
"grad_norm": 0.24464630121892514,
"learning_rate": 3.3239886950102933e-05,
"loss": 0.2627,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13744525611400604,
"step": 2170,
"valid_targets_mean": 4402.4,
"valid_targets_min": 2100
},
{
"epoch": 2.406198118428334,
"grad_norm": 0.245525174323216,
"learning_rate": 3.319849069757446e-05,
"loss": 0.2479,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11348900943994522,
"step": 2175,
"valid_targets_mean": 4009.4,
"valid_targets_min": 1787
},
{
"epoch": 2.411732152739347,
"grad_norm": 0.25531675363724365,
"learning_rate": 3.315699403520193e-05,
"loss": 0.2528,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12031114846467972,
"step": 2180,
"valid_targets_mean": 4591.5,
"valid_targets_min": 1915
},
{
"epoch": 2.41726618705036,
"grad_norm": 0.2723623550882369,
"learning_rate": 3.3115397278678525e-05,
"loss": 0.2507,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12081772089004517,
"step": 2185,
"valid_targets_mean": 3853.5,
"valid_targets_min": 1692
},
{
"epoch": 2.4228002213613724,
"grad_norm": 0.2759578981507214,
"learning_rate": 3.3073700744458905e-05,
"loss": 0.2425,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10981065779924393,
"step": 2190,
"valid_targets_mean": 3809.5,
"valid_targets_min": 1771
},
{
"epoch": 2.428334255672385,
"grad_norm": 0.2708688860694367,
"learning_rate": 3.303190474975679e-05,
"loss": 0.2401,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11741551011800766,
"step": 2195,
"valid_targets_mean": 4231.2,
"valid_targets_min": 1649
},
{
"epoch": 2.4338682899833977,
"grad_norm": 0.26191735840776026,
"learning_rate": 3.299000961254259e-05,
"loss": 0.2577,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15129616856575012,
"step": 2200,
"valid_targets_mean": 4823.4,
"valid_targets_min": 1879
},
{
"epoch": 2.4394023242944107,
"grad_norm": 0.24684680082578841,
"learning_rate": 3.2948015651540926e-05,
"loss": 0.2392,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11781984567642212,
"step": 2205,
"valid_targets_mean": 4126.4,
"valid_targets_min": 1435
},
{
"epoch": 2.4449363586054234,
"grad_norm": 0.2571977772945324,
"learning_rate": 3.290592318622827e-05,
"loss": 0.2492,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11264637857675552,
"step": 2210,
"valid_targets_mean": 3882.1,
"valid_targets_min": 1659
},
{
"epoch": 2.450470392916436,
"grad_norm": 0.25102524109760466,
"learning_rate": 3.286373253683048e-05,
"loss": 0.2517,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11968725174665451,
"step": 2215,
"valid_targets_mean": 4487.3,
"valid_targets_min": 1825
},
{
"epoch": 2.456004427227449,
"grad_norm": 0.2743124438502291,
"learning_rate": 3.2821444024320326e-05,
"loss": 0.2541,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13843697309494019,
"step": 2220,
"valid_targets_mean": 4427.6,
"valid_targets_min": 1596
},
{
"epoch": 2.4615384615384617,
"grad_norm": 0.25338666208737304,
"learning_rate": 3.277905797041514e-05,
"loss": 0.2539,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14188285171985626,
"step": 2225,
"valid_targets_mean": 4976.6,
"valid_targets_min": 1470
},
{
"epoch": 2.4670724958494743,
"grad_norm": 0.25251346662449287,
"learning_rate": 3.273657469757431e-05,
"loss": 0.2494,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13103936612606049,
"step": 2230,
"valid_targets_mean": 5125.1,
"valid_targets_min": 1955
},
{
"epoch": 2.472606530160487,
"grad_norm": 0.18675770996860236,
"learning_rate": 3.26939945289968e-05,
"loss": 0.1731,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08323365449905396,
"step": 2235,
"valid_targets_mean": 5392.4,
"valid_targets_min": 1736
},
{
"epoch": 2.4781405644714996,
"grad_norm": 0.18709599083859213,
"learning_rate": 3.265131778861876e-05,
"loss": 0.1679,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08022157102823257,
"step": 2240,
"valid_targets_mean": 5752.5,
"valid_targets_min": 2418
},
{
"epoch": 2.4836745987825126,
"grad_norm": 0.1581221414370123,
"learning_rate": 3.2608544801111e-05,
"loss": 0.1616,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07407370954751968,
"step": 2245,
"valid_targets_mean": 5096.6,
"valid_targets_min": 1180
},
{
"epoch": 2.4892086330935252,
"grad_norm": 0.15996766971390297,
"learning_rate": 3.256567589187657e-05,
"loss": 0.1599,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08508744835853577,
"step": 2250,
"valid_targets_mean": 5641.0,
"valid_targets_min": 2134
},
{
"epoch": 2.494742667404538,
"grad_norm": 0.1503407078520133,
"learning_rate": 3.2522711387048246e-05,
"loss": 0.1657,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0826578214764595,
"step": 2255,
"valid_targets_mean": 5802.1,
"valid_targets_min": 3269
},
{
"epoch": 2.5002767017155505,
"grad_norm": 0.15113352160318952,
"learning_rate": 3.2479651613486075e-05,
"loss": 0.1599,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08101323246955872,
"step": 2260,
"valid_targets_mean": 5432.3,
"valid_targets_min": 1602
},
{
"epoch": 2.5058107360265636,
"grad_norm": 0.15169501414305464,
"learning_rate": 3.243649689877487e-05,
"loss": 0.1537,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07829853147268295,
"step": 2265,
"valid_targets_mean": 5743.6,
"valid_targets_min": 2175
},
{
"epoch": 2.511344770337576,
"grad_norm": 0.1471582265896324,
"learning_rate": 3.239324757122174e-05,
"loss": 0.1507,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07005364447832108,
"step": 2270,
"valid_targets_mean": 5761.5,
"valid_targets_min": 3064
},
{
"epoch": 2.516878804648589,
"grad_norm": 0.15319141052788057,
"learning_rate": 3.2349903959853557e-05,
"loss": 0.1586,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0837135836482048,
"step": 2275,
"valid_targets_mean": 5588.5,
"valid_targets_min": 2372
},
{
"epoch": 2.5224128389596014,
"grad_norm": 0.15171378597396376,
"learning_rate": 3.230646639441449e-05,
"loss": 0.1492,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07668746262788773,
"step": 2280,
"valid_targets_mean": 5415.7,
"valid_targets_min": 2271
},
{
"epoch": 2.527946873270614,
"grad_norm": 0.15186774768441974,
"learning_rate": 3.226293520536345e-05,
"loss": 0.1582,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0768275186419487,
"step": 2285,
"valid_targets_mean": 5562.1,
"valid_targets_min": 2281
},
{
"epoch": 2.533480907581627,
"grad_norm": 0.17699707125016628,
"learning_rate": 3.221931072387165e-05,
"loss": 0.1497,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06258273124694824,
"step": 2290,
"valid_targets_mean": 5284.1,
"valid_targets_min": 973
},
{
"epoch": 2.5390149418926398,
"grad_norm": 0.16796400444970988,
"learning_rate": 3.217559328182003e-05,
"loss": 0.1485,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07881813496351242,
"step": 2295,
"valid_targets_mean": 5722.6,
"valid_targets_min": 2512
},
{
"epoch": 2.5445489762036524,
"grad_norm": 0.16922323148374335,
"learning_rate": 3.2131783211796716e-05,
"loss": 0.1478,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0652880072593689,
"step": 2300,
"valid_targets_mean": 4999.8,
"valid_targets_min": 1687
},
{
"epoch": 2.5500830105146655,
"grad_norm": 0.16119863560776443,
"learning_rate": 3.208788084709455e-05,
"loss": 0.1487,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07294315099716187,
"step": 2305,
"valid_targets_mean": 5641.6,
"valid_targets_min": 2140
},
{
"epoch": 2.555617044825678,
"grad_norm": 0.16848133595850323,
"learning_rate": 3.20438865217085e-05,
"loss": 0.1469,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07951802015304565,
"step": 2310,
"valid_targets_mean": 5478.7,
"valid_targets_min": 1603
},
{
"epoch": 2.5611510791366907,
"grad_norm": 0.15915104081782677,
"learning_rate": 3.1999800570333146e-05,
"loss": 0.1541,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07250721007585526,
"step": 2315,
"valid_targets_mean": 5777.6,
"valid_targets_min": 2255
},
{
"epoch": 2.5666851134477033,
"grad_norm": 0.16108384255341257,
"learning_rate": 3.195562332836015e-05,
"loss": 0.1471,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07589638233184814,
"step": 2320,
"valid_targets_mean": 5722.6,
"valid_targets_min": 1753
},
{
"epoch": 2.572219147758716,
"grad_norm": 0.1755066395817842,
"learning_rate": 3.191135513187564e-05,
"loss": 0.1449,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07764853537082672,
"step": 2325,
"valid_targets_mean": 5676.9,
"valid_targets_min": 1668
},
{
"epoch": 2.5777531820697286,
"grad_norm": 0.17430824924843394,
"learning_rate": 3.186699631765775e-05,
"loss": 0.1515,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07290103286504745,
"step": 2330,
"valid_targets_mean": 5766.0,
"valid_targets_min": 2729
},
{
"epoch": 2.5832872163807417,
"grad_norm": 0.17057163905522507,
"learning_rate": 3.182254722317396e-05,
"loss": 0.1473,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07022867351770401,
"step": 2335,
"valid_targets_mean": 5821.4,
"valid_targets_min": 2004
},
{
"epoch": 2.5888212506917543,
"grad_norm": 0.15791232305329486,
"learning_rate": 3.177800818657859e-05,
"loss": 0.1505,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0739402249455452,
"step": 2340,
"valid_targets_mean": 5754.9,
"valid_targets_min": 3355
},
{
"epoch": 2.594355285002767,
"grad_norm": 0.17193888788181674,
"learning_rate": 3.1733379546710226e-05,
"loss": 0.144,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06612033396959305,
"step": 2345,
"valid_targets_mean": 5748.6,
"valid_targets_min": 2067
},
{
"epoch": 2.59988931931378,
"grad_norm": 0.15255677334789028,
"learning_rate": 3.168866164308909e-05,
"loss": 0.1474,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07562779635190964,
"step": 2350,
"valid_targets_mean": 5688.9,
"valid_targets_min": 1637
},
{
"epoch": 2.6054233536247926,
"grad_norm": 0.16904413269578494,
"learning_rate": 3.164385481591453e-05,
"loss": 0.1427,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07645299285650253,
"step": 2355,
"valid_targets_mean": 5857.9,
"valid_targets_min": 2260
},
{
"epoch": 2.6109573879358052,
"grad_norm": 0.16744205276671484,
"learning_rate": 3.159895940606237e-05,
"loss": 0.1515,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08270134031772614,
"step": 2360,
"valid_targets_mean": 5516.6,
"valid_targets_min": 1184
},
{
"epoch": 2.616491422246818,
"grad_norm": 0.16642339253554195,
"learning_rate": 3.1553975755082366e-05,
"loss": 0.1477,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07753140479326248,
"step": 2365,
"valid_targets_mean": 5969.0,
"valid_targets_min": 2448
},
{
"epoch": 2.6220254565578305,
"grad_norm": 0.16838695928479055,
"learning_rate": 3.150890420519555e-05,
"loss": 0.1337,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06355169415473938,
"step": 2370,
"valid_targets_mean": 5274.3,
"valid_targets_min": 1542
},
{
"epoch": 2.6275594908688436,
"grad_norm": 0.17243268355338107,
"learning_rate": 3.14637450992917e-05,
"loss": 0.1442,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07621452957391739,
"step": 2375,
"valid_targets_mean": 5350.8,
"valid_targets_min": 2456
},
{
"epoch": 2.633093525179856,
"grad_norm": 0.17277521809452379,
"learning_rate": 3.1418498780926666e-05,
"loss": 0.1409,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.061686377972364426,
"step": 2380,
"valid_targets_mean": 5759.4,
"valid_targets_min": 3046
},
{
"epoch": 2.638627559490869,
"grad_norm": 0.16747105085539926,
"learning_rate": 3.1373165594319784e-05,
"loss": 0.1416,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06588593870401382,
"step": 2385,
"valid_targets_mean": 5577.3,
"valid_targets_min": 2091
},
{
"epoch": 2.6441615938018814,
"grad_norm": 0.17286141433563584,
"learning_rate": 3.132774588435128e-05,
"loss": 0.1416,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07492373883724213,
"step": 2390,
"valid_targets_mean": 5280.2,
"valid_targets_min": 2551
},
{
"epoch": 2.6496956281128945,
"grad_norm": 0.17616906402572663,
"learning_rate": 3.1282239996559575e-05,
"loss": 0.1407,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07154124230146408,
"step": 2395,
"valid_targets_mean": 5727.3,
"valid_targets_min": 2530
},
{
"epoch": 2.655229662423907,
"grad_norm": 0.17794751292359126,
"learning_rate": 3.123664827713875e-05,
"loss": 0.1363,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06947065144777298,
"step": 2400,
"valid_targets_mean": 5774.6,
"valid_targets_min": 1202
},
{
"epoch": 2.6607636967349197,
"grad_norm": 0.17260761975203412,
"learning_rate": 3.119097107293583e-05,
"loss": 0.1439,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06682231277227402,
"step": 2405,
"valid_targets_mean": 5240.7,
"valid_targets_min": 1928
},
{
"epoch": 2.6662977310459324,
"grad_norm": 0.165118957251718,
"learning_rate": 3.114520873144821e-05,
"loss": 0.1393,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06677956134080887,
"step": 2410,
"valid_targets_mean": 5512.1,
"valid_targets_min": 2321
},
{
"epoch": 2.671831765356945,
"grad_norm": 0.15925324907477573,
"learning_rate": 3.109936160082096e-05,
"loss": 0.1395,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06604073196649551,
"step": 2415,
"valid_targets_mean": 5468.1,
"valid_targets_min": 2393
},
{
"epoch": 2.677365799667958,
"grad_norm": 0.1740316680183045,
"learning_rate": 3.1053430029844215e-05,
"loss": 0.1412,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0712900385260582,
"step": 2420,
"valid_targets_mean": 5260.7,
"valid_targets_min": 2063
},
{
"epoch": 2.6828998339789707,
"grad_norm": 0.19632240056281522,
"learning_rate": 3.1007414367950484e-05,
"loss": 0.14,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0738878846168518,
"step": 2425,
"valid_targets_mean": 5720.1,
"valid_targets_min": 2402
},
{
"epoch": 2.6884338682899833,
"grad_norm": 0.18012558106553866,
"learning_rate": 3.096131496521203e-05,
"loss": 0.1375,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07787241786718369,
"step": 2430,
"valid_targets_mean": 5954.4,
"valid_targets_min": 2397
},
{
"epoch": 2.6939679026009964,
"grad_norm": 0.17581719862803866,
"learning_rate": 3.091513217233819e-05,
"loss": 0.1367,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07507916539907455,
"step": 2435,
"valid_targets_mean": 5727.8,
"valid_targets_min": 1876
},
{
"epoch": 2.699501936912009,
"grad_norm": 0.17347837639945535,
"learning_rate": 3.086886634067269e-05,
"loss": 0.1354,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06442199647426605,
"step": 2440,
"valid_targets_mean": 5569.0,
"valid_targets_min": 1965
},
{
"epoch": 2.7050359712230216,
"grad_norm": 0.16489782674925513,
"learning_rate": 3.0822517822191e-05,
"loss": 0.1306,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06415524333715439,
"step": 2445,
"valid_targets_mean": 5661.8,
"valid_targets_min": 2471
},
{
"epoch": 2.7105700055340343,
"grad_norm": 0.16368842284606797,
"learning_rate": 3.077608696949765e-05,
"loss": 0.1356,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06764273345470428,
"step": 2450,
"valid_targets_mean": 5622.1,
"valid_targets_min": 2291
},
{
"epoch": 2.716104039845047,
"grad_norm": 0.18330837065767697,
"learning_rate": 3.072957413582353e-05,
"loss": 0.1394,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07820945233106613,
"step": 2455,
"valid_targets_mean": 5615.0,
"valid_targets_min": 1872
},
{
"epoch": 2.7216380741560595,
"grad_norm": 0.18111367512510274,
"learning_rate": 3.068297967502321e-05,
"loss": 0.1397,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06971076875925064,
"step": 2460,
"valid_targets_mean": 5620.1,
"valid_targets_min": 2509
},
{
"epoch": 2.7271721084670726,
"grad_norm": 0.181017231669242,
"learning_rate": 3.063630394157228e-05,
"loss": 0.1377,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06892272084951401,
"step": 2465,
"valid_targets_mean": 5791.0,
"valid_targets_min": 2652
},
{
"epoch": 2.732706142778085,
"grad_norm": 0.16873712291586646,
"learning_rate": 3.05895472905646e-05,
"loss": 0.1307,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06001288816332817,
"step": 2470,
"valid_targets_mean": 5198.1,
"valid_targets_min": 2440
},
{
"epoch": 2.738240177089098,
"grad_norm": 0.1868490278778886,
"learning_rate": 3.054271007770963e-05,
"loss": 0.1425,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06651145964860916,
"step": 2475,
"valid_targets_mean": 5649.1,
"valid_targets_min": 2077
},
{
"epoch": 2.743774211400111,
"grad_norm": 0.17000751161197922,
"learning_rate": 3.0495792659329723e-05,
"loss": 0.1369,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.071280837059021,
"step": 2480,
"valid_targets_mean": 5574.3,
"valid_targets_min": 2057
},
{
"epoch": 2.7493082457111235,
"grad_norm": 0.1771028695622922,
"learning_rate": 3.0448795392357406e-05,
"loss": 0.1368,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07716403156518936,
"step": 2485,
"valid_targets_mean": 5628.9,
"valid_targets_min": 2814
},
{
"epoch": 2.754842280022136,
"grad_norm": 0.28237982686418645,
"learning_rate": 3.0401718634332674e-05,
"loss": 0.1574,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10520079731941223,
"step": 2490,
"valid_targets_mean": 4304.0,
"valid_targets_min": 1999
},
{
"epoch": 2.760376314333149,
"grad_norm": 0.3327083760173073,
"learning_rate": 3.0354562743400264e-05,
"loss": 0.2156,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10733775049448013,
"step": 2495,
"valid_targets_mean": 4515.2,
"valid_targets_min": 2164
},
{
"epoch": 2.7659103486441614,
"grad_norm": 0.31049768057667776,
"learning_rate": 3.0307328078306916e-05,
"loss": 0.2067,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11256422847509384,
"step": 2500,
"valid_targets_mean": 4470.0,
"valid_targets_min": 1842
},
{
"epoch": 2.7714443829551745,
"grad_norm": 0.2809847389542365,
"learning_rate": 3.026001499839868e-05,
"loss": 0.2084,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10991676896810532,
"step": 2505,
"valid_targets_mean": 4624.8,
"valid_targets_min": 2330
},
{
"epoch": 2.776978417266187,
"grad_norm": 0.2670407115330399,
"learning_rate": 3.021262386361814e-05,
"loss": 0.2106,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10309511423110962,
"step": 2510,
"valid_targets_mean": 4104.8,
"valid_targets_min": 1757
},
{
"epoch": 2.7825124515771997,
"grad_norm": 0.2487675603371622,
"learning_rate": 3.0165155034501716e-05,
"loss": 0.2045,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10134413838386536,
"step": 2515,
"valid_targets_mean": 4168.2,
"valid_targets_min": 2144
},
{
"epoch": 2.7880464858882124,
"grad_norm": 0.385750753122307,
"learning_rate": 3.0117608872176886e-05,
"loss": 0.1966,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08835925906896591,
"step": 2520,
"valid_targets_mean": 7307.1,
"valid_targets_min": 1241
},
{
"epoch": 2.7935805201992254,
"grad_norm": 0.2972093207639648,
"learning_rate": 3.0069985738359454e-05,
"loss": 0.187,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09143689274787903,
"step": 2525,
"valid_targets_mean": 6482.4,
"valid_targets_min": 1234
},
{
"epoch": 2.799114554510238,
"grad_norm": 0.29782874213402083,
"learning_rate": 3.002228599535081e-05,
"loss": 0.1802,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08202945441007614,
"step": 2530,
"valid_targets_mean": 6422.1,
"valid_targets_min": 2269
},
{
"epoch": 2.8046485888212507,
"grad_norm": 0.25631859635668064,
"learning_rate": 2.997451000603516e-05,
"loss": 0.1854,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09196306020021439,
"step": 2535,
"valid_targets_mean": 8032.0,
"valid_targets_min": 1561
},
{
"epoch": 2.8101826231322633,
"grad_norm": 0.22517445589923313,
"learning_rate": 2.9926658133876753e-05,
"loss": 0.1924,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09404587745666504,
"step": 2540,
"valid_targets_mean": 7753.7,
"valid_targets_min": 997
},
{
"epoch": 2.815716657443276,
"grad_norm": 0.21994484776162698,
"learning_rate": 2.987873074291715e-05,
"loss": 0.1823,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08639196306467056,
"step": 2545,
"valid_targets_mean": 7592.0,
"valid_targets_min": 1134
},
{
"epoch": 2.821250691754289,
"grad_norm": 0.24575217873515323,
"learning_rate": 2.983072819777241e-05,
"loss": 0.1819,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09172558784484863,
"step": 2550,
"valid_targets_mean": 12918.2,
"valid_targets_min": 1948
},
{
"epoch": 2.8267847260653016,
"grad_norm": 0.15527163383639894,
"learning_rate": 2.9782650863630363e-05,
"loss": 0.1871,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09034281969070435,
"step": 2555,
"valid_targets_mean": 13792.4,
"valid_targets_min": 1105
},
{
"epoch": 2.8323187603763142,
"grad_norm": 0.13533382276779396,
"learning_rate": 2.9734499106247807e-05,
"loss": 0.185,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08931824564933777,
"step": 2560,
"valid_targets_mean": 13438.8,
"valid_targets_min": 1167
},
{
"epoch": 2.8378527946873273,
"grad_norm": 0.13404710125492317,
"learning_rate": 2.968627329194771e-05,
"loss": 0.1805,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09555711597204208,
"step": 2565,
"valid_targets_mean": 13485.9,
"valid_targets_min": 3165
},
{
"epoch": 2.84338682899834,
"grad_norm": 0.20197899539890302,
"learning_rate": 2.963797378761647e-05,
"loss": 0.1751,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08223999291658401,
"step": 2570,
"valid_targets_mean": 6748.4,
"valid_targets_min": 1326
},
{
"epoch": 2.8489208633093526,
"grad_norm": 0.22908324980878794,
"learning_rate": 2.958960096070106e-05,
"loss": 0.1663,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08211114257574081,
"step": 2575,
"valid_targets_mean": 7122.6,
"valid_targets_min": 802
},
{
"epoch": 2.854454897620365,
"grad_norm": 0.21069092400808864,
"learning_rate": 2.95411551792063e-05,
"loss": 0.1618,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08094976097345352,
"step": 2580,
"valid_targets_mean": 7025.2,
"valid_targets_min": 974
},
{
"epoch": 2.859988931931378,
"grad_norm": 0.24247812593799903,
"learning_rate": 2.9492636811692007e-05,
"loss": 0.1873,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09617865830659866,
"step": 2585,
"valid_targets_mean": 4722.1,
"valid_targets_min": 1833
},
{
"epoch": 2.8655229662423904,
"grad_norm": 0.3284985892901276,
"learning_rate": 2.944404622727021e-05,
"loss": 0.1949,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1026540994644165,
"step": 2590,
"valid_targets_mean": 4635.6,
"valid_targets_min": 2233
},
{
"epoch": 2.8710570005534035,
"grad_norm": 0.26228909838556336,
"learning_rate": 2.9395383795602343e-05,
"loss": 0.1941,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08885417133569717,
"step": 2595,
"valid_targets_mean": 4973.8,
"valid_targets_min": 1415
},
{
"epoch": 2.876591034864416,
"grad_norm": 0.26117458416833533,
"learning_rate": 2.934664988689643e-05,
"loss": 0.1994,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10508755594491959,
"step": 2600,
"valid_targets_mean": 5083.4,
"valid_targets_min": 1921
},
{
"epoch": 2.8821250691754288,
"grad_norm": 0.24051633479555667,
"learning_rate": 2.9297844871904274e-05,
"loss": 0.2028,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09834790229797363,
"step": 2605,
"valid_targets_mean": 4291.8,
"valid_targets_min": 1566
},
{
"epoch": 2.887659103486442,
"grad_norm": 0.22965236694884916,
"learning_rate": 2.9248969121918632e-05,
"loss": 0.2155,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10472244024276733,
"step": 2610,
"valid_targets_mean": 4530.1,
"valid_targets_min": 1886
},
{
"epoch": 2.8931931377974545,
"grad_norm": 0.21364671524876022,
"learning_rate": 2.9200023008770373e-05,
"loss": 0.2227,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1135094165802002,
"step": 2615,
"valid_targets_mean": 5348.9,
"valid_targets_min": 1919
},
{
"epoch": 2.898727172108467,
"grad_norm": 0.2209531134133939,
"learning_rate": 2.915100690482569e-05,
"loss": 0.222,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12207873910665512,
"step": 2620,
"valid_targets_mean": 5068.9,
"valid_targets_min": 1828
},
{
"epoch": 2.9042612064194797,
"grad_norm": 0.2211608236960134,
"learning_rate": 2.9101921182983227e-05,
"loss": 0.2239,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09815773367881775,
"step": 2625,
"valid_targets_mean": 4750.7,
"valid_targets_min": 1799
},
{
"epoch": 2.9097952407304923,
"grad_norm": 0.2499134010821729,
"learning_rate": 2.905276621667127e-05,
"loss": 0.2211,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10744103044271469,
"step": 2630,
"valid_targets_mean": 4307.7,
"valid_targets_min": 1767
},
{
"epoch": 2.9153292750415054,
"grad_norm": 0.23090348616357698,
"learning_rate": 2.9003542379844884e-05,
"loss": 0.2199,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11299965530633926,
"step": 2635,
"valid_targets_mean": 5096.7,
"valid_targets_min": 1742
},
{
"epoch": 2.920863309352518,
"grad_norm": 0.2320420684470363,
"learning_rate": 2.8954250046983073e-05,
"loss": 0.2207,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10773200541734695,
"step": 2640,
"valid_targets_mean": 4752.5,
"valid_targets_min": 1336
},
{
"epoch": 2.9263973436635307,
"grad_norm": 0.22083962294312315,
"learning_rate": 2.890488959308596e-05,
"loss": 0.2166,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1107417568564415,
"step": 2645,
"valid_targets_mean": 4916.1,
"valid_targets_min": 1577
},
{
"epoch": 2.9319313779745433,
"grad_norm": 0.22091590603380928,
"learning_rate": 2.8855461393671896e-05,
"loss": 0.2218,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10437620431184769,
"step": 2650,
"valid_targets_mean": 5456.0,
"valid_targets_min": 1907
},
{
"epoch": 2.9374654122855564,
"grad_norm": 0.24532483951310813,
"learning_rate": 2.8805965824774615e-05,
"loss": 0.2206,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10593270510435104,
"step": 2655,
"valid_targets_mean": 5207.6,
"valid_targets_min": 1726
},
{
"epoch": 2.942999446596569,
"grad_norm": 0.27364048448227346,
"learning_rate": 2.8756403262940375e-05,
"loss": 0.2194,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10775301605463028,
"step": 2660,
"valid_targets_mean": 5106.3,
"valid_targets_min": 2259
},
{
"epoch": 2.9485334809075816,
"grad_norm": 0.2920537004724869,
"learning_rate": 2.8706774085225114e-05,
"loss": 0.2152,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09780740737915039,
"step": 2665,
"valid_targets_mean": 4084.7,
"valid_targets_min": 1191
},
{
"epoch": 2.9540675152185942,
"grad_norm": 0.27117239277014693,
"learning_rate": 2.865707866919154e-05,
"loss": 0.1994,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09460770338773727,
"step": 2670,
"valid_targets_mean": 4309.1,
"valid_targets_min": 1672
},
{
"epoch": 2.959601549529607,
"grad_norm": 0.2533093955054154,
"learning_rate": 2.8607317392906285e-05,
"loss": 0.1983,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09425908327102661,
"step": 2675,
"valid_targets_mean": 4199.7,
"valid_targets_min": 1743
},
{
"epoch": 2.96513558384062,
"grad_norm": 0.2544597366637726,
"learning_rate": 2.8557490634937027e-05,
"loss": 0.1976,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09826552867889404,
"step": 2680,
"valid_targets_mean": 3982.9,
"valid_targets_min": 1242
},
{
"epoch": 2.9706696181516326,
"grad_norm": 0.2270008550810053,
"learning_rate": 2.850759877434962e-05,
"loss": 0.2004,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08753231912851334,
"step": 2685,
"valid_targets_mean": 4210.3,
"valid_targets_min": 2144
},
{
"epoch": 2.976203652462645,
"grad_norm": 0.23023731050285826,
"learning_rate": 2.845764219070518e-05,
"loss": 0.1992,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09693797677755356,
"step": 2690,
"valid_targets_mean": 4198.8,
"valid_targets_min": 1335
},
{
"epoch": 2.9817376867736582,
"grad_norm": 0.24052515348826364,
"learning_rate": 2.8407621264057222e-05,
"loss": 0.2032,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09210985898971558,
"step": 2695,
"valid_targets_mean": 4010.5,
"valid_targets_min": 1501
},
{
"epoch": 2.987271721084671,
"grad_norm": 0.22041660826317713,
"learning_rate": 2.8357536374948752e-05,
"loss": 0.2023,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10018914192914963,
"step": 2700,
"valid_targets_mean": 4123.1,
"valid_targets_min": 2004
},
{
"epoch": 2.9928057553956835,
"grad_norm": 0.22308832266909892,
"learning_rate": 2.8307387904409408e-05,
"loss": 0.1996,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1004939153790474,
"step": 2705,
"valid_targets_mean": 4315.6,
"valid_targets_min": 2203
},
{
"epoch": 2.998339789706696,
"grad_norm": 0.2267894178719489,
"learning_rate": 2.8257176233952508e-05,
"loss": 0.1991,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09376098960638046,
"step": 2710,
"valid_targets_mean": 4404.2,
"valid_targets_min": 1768
},
{
"epoch": 3.0033204205866078,
"grad_norm": 0.3260552849333209,
"learning_rate": 2.8206901745572182e-05,
"loss": 0.1877,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12010964751243591,
"step": 2715,
"valid_targets_mean": 7708.5,
"valid_targets_min": 2114
},
{
"epoch": 3.0088544548976204,
"grad_norm": 0.2488611435270132,
"learning_rate": 2.8156564821740464e-05,
"loss": 0.2279,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11786027997732162,
"step": 2720,
"valid_targets_mean": 7049.1,
"valid_targets_min": 1582
},
{
"epoch": 3.014388489208633,
"grad_norm": 0.1921083844286432,
"learning_rate": 2.8106165845404367e-05,
"loss": 0.2085,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10925697535276413,
"step": 2725,
"valid_targets_mean": 6744.9,
"valid_targets_min": 2415
},
{
"epoch": 3.0199225235196456,
"grad_norm": 0.1821419754608182,
"learning_rate": 2.8055705199982995e-05,
"loss": 0.2082,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11892497539520264,
"step": 2730,
"valid_targets_mean": 7223.4,
"valid_targets_min": 1917
},
{
"epoch": 3.0254565578306587,
"grad_norm": 0.15693484811819064,
"learning_rate": 2.8005183269364603e-05,
"loss": 0.2119,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10714951902627945,
"step": 2735,
"valid_targets_mean": 6793.6,
"valid_targets_min": 2699
},
{
"epoch": 3.0309905921416713,
"grad_norm": 0.16709176637637066,
"learning_rate": 2.795460043790367e-05,
"loss": 0.1978,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08674667030572891,
"step": 2740,
"valid_targets_mean": 6319.4,
"valid_targets_min": 2331
},
{
"epoch": 3.036524626452684,
"grad_norm": 0.16398990842948868,
"learning_rate": 2.7903957090418007e-05,
"loss": 0.2032,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09815031290054321,
"step": 2745,
"valid_targets_mean": 6464.3,
"valid_targets_min": 2301
},
{
"epoch": 3.0420586607636966,
"grad_norm": 0.1738792299814764,
"learning_rate": 2.785325361218581e-05,
"loss": 0.2031,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08038411289453506,
"step": 2750,
"valid_targets_mean": 5905.9,
"valid_targets_min": 1789
},
{
"epoch": 3.0475926950747096,
"grad_norm": 0.1804894694966061,
"learning_rate": 2.780249038894272e-05,
"loss": 0.1976,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0968136116862297,
"step": 2755,
"valid_targets_mean": 6846.8,
"valid_targets_min": 2291
},
{
"epoch": 3.0531267293857223,
"grad_norm": 0.16073218176284065,
"learning_rate": 2.77516678068789e-05,
"loss": 0.1931,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10354902595281601,
"step": 2760,
"valid_targets_mean": 6919.4,
"valid_targets_min": 1723
},
{
"epoch": 3.058660763696735,
"grad_norm": 0.18868948921708006,
"learning_rate": 2.7700786252636107e-05,
"loss": 0.2028,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10971930623054504,
"step": 2765,
"valid_targets_mean": 7691.2,
"valid_targets_min": 2510
},
{
"epoch": 3.0641947980077475,
"grad_norm": 0.21268751522461696,
"learning_rate": 2.7649846113304738e-05,
"loss": 0.1981,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1004100814461708,
"step": 2770,
"valid_targets_mean": 6916.7,
"valid_targets_min": 2234
},
{
"epoch": 3.06972883231876,
"grad_norm": 0.18504147125623674,
"learning_rate": 2.7598847776420865e-05,
"loss": 0.2018,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10682997852563858,
"step": 2775,
"valid_targets_mean": 6807.6,
"valid_targets_min": 2726
},
{
"epoch": 3.075262866629773,
"grad_norm": 0.17716671792405636,
"learning_rate": 2.7547791629963332e-05,
"loss": 0.1962,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09369424730539322,
"step": 2780,
"valid_targets_mean": 7006.3,
"valid_targets_min": 2770
},
{
"epoch": 3.080796900940786,
"grad_norm": 0.17303029321105318,
"learning_rate": 2.7496678062350773e-05,
"loss": 0.1955,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10050015896558762,
"step": 2785,
"valid_targets_mean": 6757.8,
"valid_targets_min": 2587
},
{
"epoch": 3.0863309352517985,
"grad_norm": 0.21149449511005555,
"learning_rate": 2.744550746243866e-05,
"loss": 0.1944,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09726202487945557,
"step": 2790,
"valid_targets_mean": 6627.8,
"valid_targets_min": 2615
},
{
"epoch": 3.091864969562811,
"grad_norm": 0.1734481214507415,
"learning_rate": 2.7394280219516342e-05,
"loss": 0.2018,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08735307306051254,
"step": 2795,
"valid_targets_mean": 6780.6,
"valid_targets_min": 1765
},
{
"epoch": 3.097399003873824,
"grad_norm": 0.1689887983129223,
"learning_rate": 2.7342996723304112e-05,
"loss": 0.1974,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1004621684551239,
"step": 2800,
"valid_targets_mean": 6800.9,
"valid_targets_min": 2579
},
{
"epoch": 3.102933038184837,
"grad_norm": 0.17087147304863046,
"learning_rate": 2.72916573639502e-05,
"loss": 0.1958,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10274376720190048,
"step": 2805,
"valid_targets_mean": 7386.6,
"valid_targets_min": 2617
},
{
"epoch": 3.1084670724958494,
"grad_norm": 0.18170372433423485,
"learning_rate": 2.7240262532027825e-05,
"loss": 0.1887,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09600893408060074,
"step": 2810,
"valid_targets_mean": 7072.9,
"valid_targets_min": 1681
},
{
"epoch": 3.114001106806862,
"grad_norm": 0.1902362690377946,
"learning_rate": 2.7188812618532236e-05,
"loss": 0.1918,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09322325140237808,
"step": 2815,
"valid_targets_mean": 6639.1,
"valid_targets_min": 3065
},
{
"epoch": 3.119535141117875,
"grad_norm": 0.20059988733734505,
"learning_rate": 2.713730801487771e-05,
"loss": 0.1936,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09941449016332626,
"step": 2820,
"valid_targets_mean": 6858.6,
"valid_targets_min": 1617
},
{
"epoch": 3.1250691754288877,
"grad_norm": 0.1851527145531092,
"learning_rate": 2.7085749112894596e-05,
"loss": 0.1867,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09204109758138657,
"step": 2825,
"valid_targets_mean": 7061.5,
"valid_targets_min": 1644
},
{
"epoch": 3.1306032097399004,
"grad_norm": 0.19876799779267673,
"learning_rate": 2.7034136304826342e-05,
"loss": 0.1919,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08583220094442368,
"step": 2830,
"valid_targets_mean": 6095.5,
"valid_targets_min": 1940
},
{
"epoch": 3.136137244050913,
"grad_norm": 0.21456728555996507,
"learning_rate": 2.6982469983326464e-05,
"loss": 0.1892,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08667775988578796,
"step": 2835,
"valid_targets_mean": 6642.1,
"valid_targets_min": 3179
},
{
"epoch": 3.141671278361926,
"grad_norm": 0.1852695398214736,
"learning_rate": 2.6930750541455616e-05,
"loss": 0.1915,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09901637583971024,
"step": 2840,
"valid_targets_mean": 6965.1,
"valid_targets_min": 2543
},
{
"epoch": 3.1472053126729387,
"grad_norm": 0.17489563656293733,
"learning_rate": 2.6878978372678567e-05,
"loss": 0.1807,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08868839591741562,
"step": 2845,
"valid_targets_mean": 7017.0,
"valid_targets_min": 2142
},
{
"epoch": 3.1527393469839513,
"grad_norm": 0.20139088817043452,
"learning_rate": 2.682715387086121e-05,
"loss": 0.1862,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0875069797039032,
"step": 2850,
"valid_targets_mean": 6845.5,
"valid_targets_min": 1710
},
{
"epoch": 3.158273381294964,
"grad_norm": 0.19119018997986806,
"learning_rate": 2.677527743026759e-05,
"loss": 0.1834,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09193676710128784,
"step": 2855,
"valid_targets_mean": 6665.5,
"valid_targets_min": 2561
},
{
"epoch": 3.1638074156059766,
"grad_norm": 0.20580010529432702,
"learning_rate": 2.6723349445556857e-05,
"loss": 0.1938,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10696002840995789,
"step": 2860,
"valid_targets_mean": 7223.8,
"valid_targets_min": 2785
},
{
"epoch": 3.1693414499169896,
"grad_norm": 0.1946678998474377,
"learning_rate": 2.6671370311780303e-05,
"loss": 0.1801,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09646815061569214,
"step": 2865,
"valid_targets_mean": 7461.0,
"valid_targets_min": 2445
},
{
"epoch": 3.1748754842280023,
"grad_norm": 0.19551830245272903,
"learning_rate": 2.6619340424378367e-05,
"loss": 0.1887,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09138414263725281,
"step": 2870,
"valid_targets_mean": 6816.0,
"valid_targets_min": 2527
},
{
"epoch": 3.180409518539015,
"grad_norm": 0.23049576923409093,
"learning_rate": 2.656726017917757e-05,
"loss": 0.1862,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09756263345479965,
"step": 2875,
"valid_targets_mean": 7153.1,
"valid_targets_min": 2039
},
{
"epoch": 3.1859435528500275,
"grad_norm": 0.20343859617581705,
"learning_rate": 2.651512997238757e-05,
"loss": 0.1911,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10609716176986694,
"step": 2880,
"valid_targets_mean": 7173.5,
"valid_targets_min": 3054
},
{
"epoch": 3.1914775871610406,
"grad_norm": 0.20071464261230162,
"learning_rate": 2.6462950200598094e-05,
"loss": 0.195,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09010434150695801,
"step": 2885,
"valid_targets_mean": 6941.1,
"valid_targets_min": 2433
},
{
"epoch": 3.197011621472053,
"grad_norm": 0.20500500621992115,
"learning_rate": 2.641072126077595e-05,
"loss": 0.1826,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08181817829608917,
"step": 2890,
"valid_targets_mean": 6240.0,
"valid_targets_min": 2230
},
{
"epoch": 3.202545655783066,
"grad_norm": 0.19535535133451618,
"learning_rate": 2.635844355026201e-05,
"loss": 0.1898,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08865565806627274,
"step": 2895,
"valid_targets_mean": 7364.3,
"valid_targets_min": 2192
},
{
"epoch": 3.2080796900940785,
"grad_norm": 0.1897151141024659,
"learning_rate": 2.6306117466768167e-05,
"loss": 0.1891,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08853700757026672,
"step": 2900,
"valid_targets_mean": 6757.6,
"valid_targets_min": 1881
},
{
"epoch": 3.213613724405091,
"grad_norm": 0.20943692032905442,
"learning_rate": 2.6253743408374313e-05,
"loss": 0.1924,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10196039825677872,
"step": 2905,
"valid_targets_mean": 7209.8,
"valid_targets_min": 1944
},
{
"epoch": 3.219147758716104,
"grad_norm": 0.1935204265289269,
"learning_rate": 2.6201321773525338e-05,
"loss": 0.1827,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08931133151054382,
"step": 2910,
"valid_targets_mean": 6967.8,
"valid_targets_min": 2450
},
{
"epoch": 3.2246817930271168,
"grad_norm": 0.286822677674402,
"learning_rate": 2.6148852961028066e-05,
"loss": 0.1902,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08451773971319199,
"step": 2915,
"valid_targets_mean": 3892.3,
"valid_targets_min": 1207
},
{
"epoch": 3.2302158273381294,
"grad_norm": 0.3861579584361899,
"learning_rate": 2.609633737004824e-05,
"loss": 0.1913,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09060275554656982,
"step": 2920,
"valid_targets_mean": 4990.3,
"valid_targets_min": 1823
},
{
"epoch": 3.235749861649142,
"grad_norm": 0.3831401215740749,
"learning_rate": 2.604377540010746e-05,
"loss": 0.1809,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09715189784765244,
"step": 2925,
"valid_targets_mean": 4408.2,
"valid_targets_min": 1915
},
{
"epoch": 3.241283895960155,
"grad_norm": 0.3632796786868025,
"learning_rate": 2.5991167451080195e-05,
"loss": 0.2046,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08995544910430908,
"step": 2930,
"valid_targets_mean": 4236.2,
"valid_targets_min": 1432
},
{
"epoch": 3.2468179302711677,
"grad_norm": 0.3654482389278134,
"learning_rate": 2.593851392319067e-05,
"loss": 0.1918,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09162074327468872,
"step": 2935,
"valid_targets_mean": 3938.6,
"valid_targets_min": 1433
},
{
"epoch": 3.2523519645821803,
"grad_norm": 0.331181711978515,
"learning_rate": 2.588581521700989e-05,
"loss": 0.201,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1132919192314148,
"step": 2940,
"valid_targets_mean": 5005.6,
"valid_targets_min": 2114
},
{
"epoch": 3.257885998893193,
"grad_norm": 0.2984211657827162,
"learning_rate": 2.5833071733452543e-05,
"loss": 0.2079,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08910011500120163,
"step": 2945,
"valid_targets_mean": 3783.9,
"valid_targets_min": 1636
},
{
"epoch": 3.263420033204206,
"grad_norm": 0.3057568807284397,
"learning_rate": 2.5780283873773975e-05,
"loss": 0.2074,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11115298420190811,
"step": 2950,
"valid_targets_mean": 4429.8,
"valid_targets_min": 1385
},
{
"epoch": 3.2689540675152187,
"grad_norm": 0.3334752774018342,
"learning_rate": 2.5727452039567148e-05,
"loss": 0.21,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09694870561361313,
"step": 2955,
"valid_targets_mean": 4083.3,
"valid_targets_min": 1931
},
{
"epoch": 3.2744881018262313,
"grad_norm": 0.2987416030856599,
"learning_rate": 2.5674576632759528e-05,
"loss": 0.1952,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10165077447891235,
"step": 2960,
"valid_targets_mean": 4112.9,
"valid_targets_min": 1850
},
{
"epoch": 3.280022136137244,
"grad_norm": 0.2820928535868255,
"learning_rate": 2.5621658055610102e-05,
"loss": 0.1988,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10538693517446518,
"step": 2965,
"valid_targets_mean": 4394.1,
"valid_targets_min": 1563
},
{
"epoch": 3.285556170448257,
"grad_norm": 0.2928257056247332,
"learning_rate": 2.5568696710706275e-05,
"loss": 0.2099,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10181987285614014,
"step": 2970,
"valid_targets_mean": 4841.0,
"valid_targets_min": 1692
},
{
"epoch": 3.2910902047592696,
"grad_norm": 0.2702920625567065,
"learning_rate": 2.5515693000960804e-05,
"loss": 0.2032,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.088201604783535,
"step": 2975,
"valid_targets_mean": 3999.7,
"valid_targets_min": 1273
},
{
"epoch": 3.2966242390702822,
"grad_norm": 0.2787562271224257,
"learning_rate": 2.546264732960876e-05,
"loss": 0.1997,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10615724325180054,
"step": 2980,
"valid_targets_mean": 4681.2,
"valid_targets_min": 1604
},
{
"epoch": 3.302158273381295,
"grad_norm": 0.2910523675114332,
"learning_rate": 2.540956010020443e-05,
"loss": 0.1935,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10740578174591064,
"step": 2985,
"valid_targets_mean": 4388.4,
"valid_targets_min": 1227
},
{
"epoch": 3.3076923076923075,
"grad_norm": 0.2842663902466955,
"learning_rate": 2.535643171661827e-05,
"loss": 0.1881,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08907082676887512,
"step": 2990,
"valid_targets_mean": 3892.8,
"valid_targets_min": 1207
},
{
"epoch": 3.3132263420033206,
"grad_norm": 0.2617368302587257,
"learning_rate": 2.530326258303383e-05,
"loss": 0.2038,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1079702377319336,
"step": 2995,
"valid_targets_mean": 4398.5,
"valid_targets_min": 2229
},
{
"epoch": 3.318760376314333,
"grad_norm": 0.2786891448668176,
"learning_rate": 2.5250053103944653e-05,
"loss": 0.1956,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09582444280385971,
"step": 3000,
"valid_targets_mean": 4250.3,
"valid_targets_min": 1806
},
{
"epoch": 3.324294410625346,
"grad_norm": 0.2941018152542811,
"learning_rate": 2.5196803684151223e-05,
"loss": 0.1906,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08968652039766312,
"step": 3005,
"valid_targets_mean": 4232.0,
"valid_targets_min": 1263
},
{
"epoch": 3.3298284449363584,
"grad_norm": 0.28117186217774265,
"learning_rate": 2.5143514728757904e-05,
"loss": 0.1954,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11329822987318039,
"step": 3010,
"valid_targets_mean": 5043.6,
"valid_targets_min": 1841
},
{
"epoch": 3.3353624792473715,
"grad_norm": 0.2802942381724536,
"learning_rate": 2.5090186643169804e-05,
"loss": 0.207,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09427406638860703,
"step": 3015,
"valid_targets_mean": 3982.5,
"valid_targets_min": 1785
},
{
"epoch": 3.340896513558384,
"grad_norm": 0.32475933644846067,
"learning_rate": 2.5036819833089734e-05,
"loss": 0.203,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1276949793100357,
"step": 3020,
"valid_targets_mean": 4740.7,
"valid_targets_min": 1552
},
{
"epoch": 3.3464305478693968,
"grad_norm": 0.32006737602777374,
"learning_rate": 2.4983414704515104e-05,
"loss": 0.1898,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09326666593551636,
"step": 3025,
"valid_targets_mean": 4246.9,
"valid_targets_min": 1659
},
{
"epoch": 3.3519645821804094,
"grad_norm": 0.27630109677520476,
"learning_rate": 2.492997166373485e-05,
"loss": 0.2018,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09285572916269302,
"step": 3030,
"valid_targets_mean": 4407.0,
"valid_targets_min": 1384
},
{
"epoch": 3.357498616491422,
"grad_norm": 0.28240313121848504,
"learning_rate": 2.4876491117326315e-05,
"loss": 0.1941,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09093517065048218,
"step": 3035,
"valid_targets_mean": 3929.4,
"valid_targets_min": 1212
},
{
"epoch": 3.363032650802435,
"grad_norm": 0.31520104902216356,
"learning_rate": 2.482297347215219e-05,
"loss": 0.1938,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10813164710998535,
"step": 3040,
"valid_targets_mean": 4758.0,
"valid_targets_min": 1634
},
{
"epoch": 3.3685666851134477,
"grad_norm": 0.290618673534816,
"learning_rate": 2.476941913535738e-05,
"loss": 0.1921,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08990909904241562,
"step": 3045,
"valid_targets_mean": 4235.8,
"valid_targets_min": 1303
},
{
"epoch": 3.3741007194244603,
"grad_norm": 0.275550505368689,
"learning_rate": 2.4715828514365953e-05,
"loss": 0.1961,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09693226963281631,
"step": 3050,
"valid_targets_mean": 4851.0,
"valid_targets_min": 1845
},
{
"epoch": 3.3796347537354734,
"grad_norm": 0.2963432180668484,
"learning_rate": 2.4662202016878e-05,
"loss": 0.1879,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08788219839334488,
"step": 3055,
"valid_targets_mean": 3943.5,
"valid_targets_min": 1444
},
{
"epoch": 3.385168788046486,
"grad_norm": 0.29499952415638026,
"learning_rate": 2.4608540050866544e-05,
"loss": 0.1839,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09814119338989258,
"step": 3060,
"valid_targets_mean": 4412.8,
"valid_targets_min": 1966
},
{
"epoch": 3.3907028223574986,
"grad_norm": 0.3042118001971243,
"learning_rate": 2.4554843024574454e-05,
"loss": 0.195,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09488651901483536,
"step": 3065,
"valid_targets_mean": 4550.5,
"valid_targets_min": 1194
},
{
"epoch": 3.3962368566685113,
"grad_norm": 0.2939692802430235,
"learning_rate": 2.450111134651132e-05,
"loss": 0.1925,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10834595561027527,
"step": 3070,
"valid_targets_mean": 4816.4,
"valid_targets_min": 1586
},
{
"epoch": 3.401770890979524,
"grad_norm": 0.2857820932330975,
"learning_rate": 2.4447345425450353e-05,
"loss": 0.1908,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09045431762933731,
"step": 3075,
"valid_targets_mean": 4299.6,
"valid_targets_min": 1866
},
{
"epoch": 3.407304925290537,
"grad_norm": 0.3019933684662385,
"learning_rate": 2.4393545670425276e-05,
"loss": 0.1822,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0811840146780014,
"step": 3080,
"valid_targets_mean": 3712.6,
"valid_targets_min": 1675
},
{
"epoch": 3.4128389596015496,
"grad_norm": 0.30329649427969957,
"learning_rate": 2.43397124907272e-05,
"loss": 0.1901,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0953529104590416,
"step": 3085,
"valid_targets_mean": 4404.2,
"valid_targets_min": 1801
},
{
"epoch": 3.418372993912562,
"grad_norm": 0.3100850324511087,
"learning_rate": 2.4285846295901537e-05,
"loss": 0.1841,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09615548700094223,
"step": 3090,
"valid_targets_mean": 4216.7,
"valid_targets_min": 1385
},
{
"epoch": 3.423907028223575,
"grad_norm": 0.306563388540784,
"learning_rate": 2.423194749574485e-05,
"loss": 0.1763,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08508458733558655,
"step": 3095,
"valid_targets_mean": 4448.0,
"valid_targets_min": 1434
},
{
"epoch": 3.429441062534588,
"grad_norm": 0.3297129530561979,
"learning_rate": 2.4178016500301757e-05,
"loss": 0.1761,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09123352915048599,
"step": 3100,
"valid_targets_mean": 4399.5,
"valid_targets_min": 1633
},
{
"epoch": 3.4349750968456005,
"grad_norm": 0.2956509424732023,
"learning_rate": 2.412405371986182e-05,
"loss": 0.1905,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09261216968297958,
"step": 3105,
"valid_targets_mean": 5115.6,
"valid_targets_min": 1868
},
{
"epoch": 3.440509131156613,
"grad_norm": 0.32424268893973734,
"learning_rate": 2.4070059564956393e-05,
"loss": 0.1786,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09287405014038086,
"step": 3110,
"valid_targets_mean": 4610.4,
"valid_targets_min": 1423
},
{
"epoch": 3.446043165467626,
"grad_norm": 0.3177883403955838,
"learning_rate": 2.4016034446355533e-05,
"loss": 0.1833,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08633139729499817,
"step": 3115,
"valid_targets_mean": 4042.8,
"valid_targets_min": 1613
},
{
"epoch": 3.4515771997786384,
"grad_norm": 0.2943065081811316,
"learning_rate": 2.396197877506484e-05,
"loss": 0.189,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09375669807195663,
"step": 3120,
"valid_targets_mean": 4377.2,
"valid_targets_min": 1484
},
{
"epoch": 3.4571112340896515,
"grad_norm": 0.2642397180732357,
"learning_rate": 2.390789296232237e-05,
"loss": 0.1909,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11398092657327652,
"step": 3125,
"valid_targets_mean": 5438.3,
"valid_targets_min": 1560
},
{
"epoch": 3.462645268400664,
"grad_norm": 0.30534761153482814,
"learning_rate": 2.3853777419595476e-05,
"loss": 0.188,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09357643872499466,
"step": 3130,
"valid_targets_mean": 4372.1,
"valid_targets_min": 2038
},
{
"epoch": 3.4681793027116767,
"grad_norm": 0.27270808124872176,
"learning_rate": 2.3799632558577675e-05,
"loss": 0.1772,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07442276924848557,
"step": 3135,
"valid_targets_mean": 5855.8,
"valid_targets_min": 1883
},
{
"epoch": 3.4737133370226894,
"grad_norm": 0.24153688662366368,
"learning_rate": 2.3745458791185554e-05,
"loss": 0.1375,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07261274009943008,
"step": 3140,
"valid_targets_mean": 5574.1,
"valid_targets_min": 2410
},
{
"epoch": 3.4792473713337024,
"grad_norm": 0.17721777678165035,
"learning_rate": 2.3691256529555587e-05,
"loss": 0.1399,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06744299083948135,
"step": 3145,
"valid_targets_mean": 5714.9,
"valid_targets_min": 1867
},
{
"epoch": 3.484781405644715,
"grad_norm": 0.17939390430450763,
"learning_rate": 2.3637026186041028e-05,
"loss": 0.1339,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06565037369728088,
"step": 3150,
"valid_targets_mean": 5655.9,
"valid_targets_min": 2408
},
{
"epoch": 3.4903154399557277,
"grad_norm": 0.16869028724210566,
"learning_rate": 2.3582768173208788e-05,
"loss": 0.1318,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05937578156590462,
"step": 3155,
"valid_targets_mean": 5437.7,
"valid_targets_min": 2380
},
{
"epoch": 3.4958494742667403,
"grad_norm": 0.17528165871270113,
"learning_rate": 2.3528482903836248e-05,
"loss": 0.134,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06441015750169754,
"step": 3160,
"valid_targets_mean": 5273.7,
"valid_targets_min": 2383
},
{
"epoch": 3.501383508577753,
"grad_norm": 0.16460285910916572,
"learning_rate": 2.3474170790908166e-05,
"loss": 0.1277,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06017139554023743,
"step": 3165,
"valid_targets_mean": 5861.0,
"valid_targets_min": 2743
},
{
"epoch": 3.506917542888766,
"grad_norm": 0.17600501488293324,
"learning_rate": 2.3419832247613514e-05,
"loss": 0.1231,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06484571099281311,
"step": 3170,
"valid_targets_mean": 5160.7,
"valid_targets_min": 1693
},
{
"epoch": 3.5124515771997786,
"grad_norm": 0.17434239041445998,
"learning_rate": 2.3365467687342336e-05,
"loss": 0.1175,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05803552269935608,
"step": 3175,
"valid_targets_mean": 5590.1,
"valid_targets_min": 1422
},
{
"epoch": 3.5179856115107913,
"grad_norm": 0.17499098929635343,
"learning_rate": 2.33110775236826e-05,
"loss": 0.1273,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06218947470188141,
"step": 3180,
"valid_targets_mean": 6409.6,
"valid_targets_min": 2530
},
{
"epoch": 3.5235196458218043,
"grad_norm": 0.16318966508533975,
"learning_rate": 2.3256662170417076e-05,
"loss": 0.1196,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05842486396431923,
"step": 3185,
"valid_targets_mean": 5695.5,
"valid_targets_min": 1750
},
{
"epoch": 3.529053680132817,
"grad_norm": 0.1708102667677403,
"learning_rate": 2.3202222041520135e-05,
"loss": 0.125,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05957861244678497,
"step": 3190,
"valid_targets_mean": 5893.7,
"valid_targets_min": 1777
},
{
"epoch": 3.5345877144438296,
"grad_norm": 0.1948736754459281,
"learning_rate": 2.3147757551154667e-05,
"loss": 0.1167,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0627470389008522,
"step": 3195,
"valid_targets_mean": 5945.1,
"valid_targets_min": 2180
},
{
"epoch": 3.540121748754842,
"grad_norm": 0.17992534289584564,
"learning_rate": 2.309326911366888e-05,
"loss": 0.115,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05356718227267265,
"step": 3200,
"valid_targets_mean": 5163.2,
"valid_targets_min": 2070
},
{
"epoch": 3.545655783065855,
"grad_norm": 0.1896234788874136,
"learning_rate": 2.3038757143593155e-05,
"loss": 0.1144,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05686204507946968,
"step": 3205,
"valid_targets_mean": 5939.5,
"valid_targets_min": 2847
},
{
"epoch": 3.551189817376868,
"grad_norm": 0.1934068787610231,
"learning_rate": 2.298422205563692e-05,
"loss": 0.1158,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05834668502211571,
"step": 3210,
"valid_targets_mean": 5371.9,
"valid_targets_min": 1377
},
{
"epoch": 3.5567238516878805,
"grad_norm": 0.20265828021309631,
"learning_rate": 2.2929664264685463e-05,
"loss": 0.1135,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.055999208241701126,
"step": 3215,
"valid_targets_mean": 5458.5,
"valid_targets_min": 1522
},
{
"epoch": 3.562257885998893,
"grad_norm": 0.18832600204742164,
"learning_rate": 2.2875084185796796e-05,
"loss": 0.1174,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05172300711274147,
"step": 3220,
"valid_targets_mean": 5541.6,
"valid_targets_min": 2876
},
{
"epoch": 3.5677919203099058,
"grad_norm": 0.19124983926618677,
"learning_rate": 2.282048223419849e-05,
"loss": 0.1149,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05770617723464966,
"step": 3225,
"valid_targets_mean": 5546.1,
"valid_targets_min": 1917
},
{
"epoch": 3.573325954620919,
"grad_norm": 0.1815657905894023,
"learning_rate": 2.2765858825284512e-05,
"loss": 0.1104,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05621454119682312,
"step": 3230,
"valid_targets_mean": 5396.4,
"valid_targets_min": 1801
},
{
"epoch": 3.5788599889319315,
"grad_norm": 0.18039022969585103,
"learning_rate": 2.2711214374612073e-05,
"loss": 0.1164,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05948448181152344,
"step": 3235,
"valid_targets_mean": 5903.2,
"valid_targets_min": 2781
},
{
"epoch": 3.584394023242944,
"grad_norm": 0.18527243267165797,
"learning_rate": 2.265654929789846e-05,
"loss": 0.1121,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05525258556008339,
"step": 3240,
"valid_targets_mean": 5584.1,
"valid_targets_min": 2118
},
{
"epoch": 3.5899280575539567,
"grad_norm": 0.18795759761112604,
"learning_rate": 2.260186401101788e-05,
"loss": 0.1166,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05691872909665108,
"step": 3245,
"valid_targets_mean": 5704.3,
"valid_targets_min": 2934
},
{
"epoch": 3.5954620918649693,
"grad_norm": 0.18431748353924032,
"learning_rate": 2.2547158929998295e-05,
"loss": 0.1103,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.050647616386413574,
"step": 3250,
"valid_targets_mean": 5652.3,
"valid_targets_min": 2882
},
{
"epoch": 3.6009961261759824,
"grad_norm": 0.1836061155823106,
"learning_rate": 2.2492434471018242e-05,
"loss": 0.1118,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.046802204102277756,
"step": 3255,
"valid_targets_mean": 5334.6,
"valid_targets_min": 2788
},
{
"epoch": 3.606530160486995,
"grad_norm": 0.17861875194505744,
"learning_rate": 2.243769105040369e-05,
"loss": 0.1082,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05294260382652283,
"step": 3260,
"valid_targets_mean": 5215.5,
"valid_targets_min": 1972
},
{
"epoch": 3.6120641947980077,
"grad_norm": 0.18093941310905542,
"learning_rate": 2.2382929084624858e-05,
"loss": 0.1158,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05248071625828743,
"step": 3265,
"valid_targets_mean": 5419.0,
"valid_targets_min": 2222
},
{
"epoch": 3.6175982291090207,
"grad_norm": 0.18748518763677194,
"learning_rate": 2.232814899029305e-05,
"loss": 0.1137,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.047866091132164,
"step": 3270,
"valid_targets_mean": 6090.2,
"valid_targets_min": 2674
},
{
"epoch": 3.6231322634200334,
"grad_norm": 0.19665222290693413,
"learning_rate": 2.2273351184157504e-05,
"loss": 0.1016,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.055568646639585495,
"step": 3275,
"valid_targets_mean": 5320.1,
"valid_targets_min": 1569
},
{
"epoch": 3.628666297731046,
"grad_norm": 0.22082547667814492,
"learning_rate": 2.2218536083102168e-05,
"loss": 0.1109,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05981751158833504,
"step": 3280,
"valid_targets_mean": 5572.3,
"valid_targets_min": 1129
},
{
"epoch": 3.6342003320420586,
"grad_norm": 0.19055385755567586,
"learning_rate": 2.2163704104142586e-05,
"loss": 0.1062,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04928545281291008,
"step": 3285,
"valid_targets_mean": 5389.2,
"valid_targets_min": 1754
},
{
"epoch": 3.6397343663530712,
"grad_norm": 0.19954978228249304,
"learning_rate": 2.210885566442271e-05,
"loss": 0.1102,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05369424819946289,
"step": 3290,
"valid_targets_mean": 5636.7,
"valid_targets_min": 2583
},
{
"epoch": 3.645268400664084,
"grad_norm": 0.19931274918591688,
"learning_rate": 2.2053991181211706e-05,
"loss": 0.1103,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04861845448613167,
"step": 3295,
"valid_targets_mean": 5504.9,
"valid_targets_min": 1563
},
{
"epoch": 3.650802434975097,
"grad_norm": 0.20336889771034933,
"learning_rate": 2.1999111071900806e-05,
"loss": 0.1035,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05100370571017265,
"step": 3300,
"valid_targets_mean": 5358.7,
"valid_targets_min": 2485
},
{
"epoch": 3.6563364692861096,
"grad_norm": 0.20145951306806356,
"learning_rate": 2.1944215754000107e-05,
"loss": 0.1042,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.061765749007463455,
"step": 3305,
"valid_targets_mean": 5603.7,
"valid_targets_min": 2272
},
{
"epoch": 3.661870503597122,
"grad_norm": 0.4966725091201629,
"learning_rate": 2.188930564513541e-05,
"loss": 0.1069,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05129636451601982,
"step": 3310,
"valid_targets_mean": 5764.9,
"valid_targets_min": 2253
},
{
"epoch": 3.6674045379081353,
"grad_norm": 0.1958144887330287,
"learning_rate": 2.183438116304506e-05,
"loss": 0.1066,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05419323965907097,
"step": 3315,
"valid_targets_mean": 5999.5,
"valid_targets_min": 1804
},
{
"epoch": 3.672938572219148,
"grad_norm": 0.20186968025351232,
"learning_rate": 2.1779442725576722e-05,
"loss": 0.1068,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04640122130513191,
"step": 3320,
"valid_targets_mean": 5618.7,
"valid_targets_min": 2151
},
{
"epoch": 3.6784726065301605,
"grad_norm": 0.19428287401499916,
"learning_rate": 2.1724490750684238e-05,
"loss": 0.1072,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.049658600240945816,
"step": 3325,
"valid_targets_mean": 5737.9,
"valid_targets_min": 1134
},
{
"epoch": 3.684006640841173,
"grad_norm": 0.20853568450404253,
"learning_rate": 2.1669525656424454e-05,
"loss": 0.1083,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05687330290675163,
"step": 3330,
"valid_targets_mean": 5562.4,
"valid_targets_min": 2524
},
{
"epoch": 3.6895406751521858,
"grad_norm": 0.20138033879262535,
"learning_rate": 2.1614547860954005e-05,
"loss": 0.1033,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04973490163683891,
"step": 3335,
"valid_targets_mean": 5549.1,
"valid_targets_min": 2082
},
{
"epoch": 3.695074709463199,
"grad_norm": 0.20307972370942748,
"learning_rate": 2.1559557782526162e-05,
"loss": 0.1046,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06023570895195007,
"step": 3340,
"valid_targets_mean": 6159.9,
"valid_targets_min": 2331
},
{
"epoch": 3.7006087437742115,
"grad_norm": 0.1925172789049576,
"learning_rate": 2.1504555839487636e-05,
"loss": 0.1005,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05248604714870453,
"step": 3345,
"valid_targets_mean": 5593.5,
"valid_targets_min": 2366
},
{
"epoch": 3.706142778085224,
"grad_norm": 0.20737964844426446,
"learning_rate": 2.14495424502754e-05,
"loss": 0.0991,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05406155064702034,
"step": 3350,
"valid_targets_mean": 5608.8,
"valid_targets_min": 2612
},
{
"epoch": 3.7116768123962367,
"grad_norm": 0.21321632992915002,
"learning_rate": 2.139451803341351e-05,
"loss": 0.1006,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05330200493335724,
"step": 3355,
"valid_targets_mean": 5524.9,
"valid_targets_min": 2217
},
{
"epoch": 3.7172108467072498,
"grad_norm": 0.20866461352352217,
"learning_rate": 2.133948300750992e-05,
"loss": 0.1056,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05255679413676262,
"step": 3360,
"valid_targets_mean": 5398.8,
"valid_targets_min": 1864
},
{
"epoch": 3.7227448810182624,
"grad_norm": 0.21615500098606666,
"learning_rate": 2.1284437791253273e-05,
"loss": 0.1062,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05293337628245354,
"step": 3365,
"valid_targets_mean": 5673.8,
"valid_targets_min": 2189
},
{
"epoch": 3.728278915329275,
"grad_norm": 0.18285632131411686,
"learning_rate": 2.122938280340977e-05,
"loss": 0.1027,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.052879661321640015,
"step": 3370,
"valid_targets_mean": 5651.7,
"valid_targets_min": 3032
},
{
"epoch": 3.7338129496402876,
"grad_norm": 0.20603578255440028,
"learning_rate": 2.1174318462819925e-05,
"loss": 0.1027,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05127779021859169,
"step": 3375,
"valid_targets_mean": 5350.3,
"valid_targets_min": 1305
},
{
"epoch": 3.7393469839513003,
"grad_norm": 0.19738589050719968,
"learning_rate": 2.1119245188395414e-05,
"loss": 0.1041,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.052101802080869675,
"step": 3380,
"valid_targets_mean": 6064.2,
"valid_targets_min": 2801
},
{
"epoch": 3.7448810182623133,
"grad_norm": 0.17640985034996595,
"learning_rate": 2.1064163399115883e-05,
"loss": 0.1033,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.051063280552625656,
"step": 3385,
"valid_targets_mean": 5364.2,
"valid_targets_min": 2088
},
{
"epoch": 3.750415052573326,
"grad_norm": 0.20762261921662648,
"learning_rate": 2.1009073514025743e-05,
"loss": 0.1065,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.049620259553194046,
"step": 3390,
"valid_targets_mean": 5511.1,
"valid_targets_min": 2194
},
{
"epoch": 3.7559490868843386,
"grad_norm": 0.2818458833816632,
"learning_rate": 2.0953975952231015e-05,
"loss": 0.1264,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07185864448547363,
"step": 3395,
"valid_targets_mean": 4122.2,
"valid_targets_min": 1988
},
{
"epoch": 3.7614831211953517,
"grad_norm": 0.3703796923782842,
"learning_rate": 2.08988711328961e-05,
"loss": 0.1556,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08274849504232407,
"step": 3400,
"valid_targets_mean": 4674.5,
"valid_targets_min": 1999
},
{
"epoch": 3.7670171555063643,
"grad_norm": 0.35697897890053726,
"learning_rate": 2.0843759475240625e-05,
"loss": 0.1468,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07798462361097336,
"step": 3405,
"valid_targets_mean": 4400.6,
"valid_targets_min": 1173
},
{
"epoch": 3.772551189817377,
"grad_norm": 0.34355115258038904,
"learning_rate": 2.0788641398536237e-05,
"loss": 0.1534,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08108644932508469,
"step": 3410,
"valid_targets_mean": 4527.1,
"valid_targets_min": 1917
},
{
"epoch": 3.7780852241283895,
"grad_norm": 0.2802880828112715,
"learning_rate": 2.073351732210343e-05,
"loss": 0.1558,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07276499271392822,
"step": 3415,
"valid_targets_mean": 4372.0,
"valid_targets_min": 1283
},
{
"epoch": 3.783619258439402,
"grad_norm": 0.2873614036864067,
"learning_rate": 2.067838766530832e-05,
"loss": 0.1518,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07237691432237625,
"step": 3420,
"valid_targets_mean": 4184.1,
"valid_targets_min": 1752
},
{
"epoch": 3.789153292750415,
"grad_norm": 0.3112753635064296,
"learning_rate": 2.062325284755949e-05,
"loss": 0.142,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07607384026050568,
"step": 3425,
"valid_targets_mean": 7490.5,
"valid_targets_min": 1699
},
{
"epoch": 3.794687327061428,
"grad_norm": 0.2938322497063729,
"learning_rate": 2.0568113288304773e-05,
"loss": 0.142,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07387111335992813,
"step": 3430,
"valid_targets_mean": 7260.8,
"valid_targets_min": 1426
},
{
"epoch": 3.8002213613724405,
"grad_norm": 0.2916769580095921,
"learning_rate": 2.0512969407028103e-05,
"loss": 0.1387,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06837702542543411,
"step": 3435,
"valid_targets_mean": 7299.8,
"valid_targets_min": 996
},
{
"epoch": 3.805755395683453,
"grad_norm": 0.31919923173242226,
"learning_rate": 2.0457821623246263e-05,
"loss": 0.1439,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07120344787836075,
"step": 3440,
"valid_targets_mean": 7641.9,
"valid_targets_min": 1230
},
{
"epoch": 3.811289429994466,
"grad_norm": 0.24702206519128803,
"learning_rate": 2.0402670356505734e-05,
"loss": 0.1468,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.060001153498888016,
"step": 3445,
"valid_targets_mean": 6535.7,
"valid_targets_min": 1027
},
{
"epoch": 3.816823464305479,
"grad_norm": 0.25088171572413825,
"learning_rate": 2.0347516026379498e-05,
"loss": 0.1439,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06905766576528549,
"step": 3450,
"valid_targets_mean": 8137.3,
"valid_targets_min": 2136
},
{
"epoch": 3.8223574986164914,
"grad_norm": 0.26797108470524955,
"learning_rate": 2.0292359052463856e-05,
"loss": 0.1491,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08341628313064575,
"step": 3455,
"valid_targets_mean": 14691.3,
"valid_targets_min": 4833
},
{
"epoch": 3.827891532927504,
"grad_norm": 0.18658299888065677,
"learning_rate": 2.0237199854375195e-05,
"loss": 0.1661,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08647984266281128,
"step": 3460,
"valid_targets_mean": 13659.3,
"valid_targets_min": 4559
},
{
"epoch": 3.8334255672385167,
"grad_norm": 0.15668057439242344,
"learning_rate": 2.0182038851746836e-05,
"loss": 0.1622,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06748253852128983,
"step": 3465,
"valid_targets_mean": 11821.1,
"valid_targets_min": 1028
},
{
"epoch": 3.8389596015495298,
"grad_norm": 0.1441504264141319,
"learning_rate": 2.0126876464225832e-05,
"loss": 0.1585,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07420114427804947,
"step": 3470,
"valid_targets_mean": 13088.8,
"valid_targets_min": 1103
},
{
"epoch": 3.8444936358605424,
"grad_norm": 0.19666886204621933,
"learning_rate": 2.0071713111469768e-05,
"loss": 0.1437,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.064952552318573,
"step": 3475,
"valid_targets_mean": 7919.6,
"valid_targets_min": 2223
},
{
"epoch": 3.850027670171555,
"grad_norm": 0.26433296077389334,
"learning_rate": 2.0016549213143567e-05,
"loss": 0.1187,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05874726548790932,
"step": 3480,
"valid_targets_mean": 7816.1,
"valid_targets_min": 1665
},
{
"epoch": 3.8555617044825676,
"grad_norm": 0.30906600677339086,
"learning_rate": 1.996138518891631e-05,
"loss": 0.1125,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.053055714815855026,
"step": 3485,
"valid_targets_mean": 6050.3,
"valid_targets_min": 1080
},
{
"epoch": 3.8610957387935807,
"grad_norm": 0.27246669254577127,
"learning_rate": 1.9906221458458036e-05,
"loss": 0.1542,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08226754516363144,
"step": 3490,
"valid_targets_mean": 5350.3,
"valid_targets_min": 2411
},
{
"epoch": 3.8666297731045933,
"grad_norm": 0.3377397171769842,
"learning_rate": 1.985105844143654e-05,
"loss": 0.1458,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06281077116727829,
"step": 3495,
"valid_targets_mean": 4708.8,
"valid_targets_min": 1501
},
{
"epoch": 3.872163807415606,
"grad_norm": 0.2929815010490038,
"learning_rate": 1.979589655751421e-05,
"loss": 0.1482,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06699756532907486,
"step": 3500,
"valid_targets_mean": 4942.9,
"valid_targets_min": 1766
},
{
"epoch": 3.8776978417266186,
"grad_norm": 0.2567591919624809,
"learning_rate": 1.9740736226344775e-05,
"loss": 0.1521,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07040539383888245,
"step": 3505,
"valid_targets_mean": 5004.8,
"valid_targets_min": 1840
},
{
"epoch": 3.883231876037631,
"grad_norm": 0.26801555266148386,
"learning_rate": 1.9685577867570197e-05,
"loss": 0.1503,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0682801902294159,
"step": 3510,
"valid_targets_mean": 4034.9,
"valid_targets_min": 2025
},
{
"epoch": 3.8887659103486443,
"grad_norm": 0.3086796660354632,
"learning_rate": 1.9630421900817407e-05,
"loss": 0.1641,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07974547892808914,
"step": 3515,
"valid_targets_mean": 4940.1,
"valid_targets_min": 2012
},
{
"epoch": 3.894299944659657,
"grad_norm": 0.2811177468129799,
"learning_rate": 1.9575268745695133e-05,
"loss": 0.1709,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0761692151427269,
"step": 3520,
"valid_targets_mean": 4119.7,
"valid_targets_min": 1305
},
{
"epoch": 3.8998339789706695,
"grad_norm": 0.23447014214849063,
"learning_rate": 1.952011882179074e-05,
"loss": 0.174,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08349272608757019,
"step": 3525,
"valid_targets_mean": 5118.2,
"valid_targets_min": 2161
},
{
"epoch": 3.9053680132816826,
"grad_norm": 0.2765881507094179,
"learning_rate": 1.946497254866697e-05,
"loss": 0.1773,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09142681211233139,
"step": 3530,
"valid_targets_mean": 5002.8,
"valid_targets_min": 1723
},
{
"epoch": 3.910902047592695,
"grad_norm": 0.23418257070583998,
"learning_rate": 1.9409830345858843e-05,
"loss": 0.1695,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08624914288520813,
"step": 3535,
"valid_targets_mean": 5169.8,
"valid_targets_min": 1906
},
{
"epoch": 3.916436081903708,
"grad_norm": 0.2413458604168126,
"learning_rate": 1.9354692632870358e-05,
"loss": 0.1681,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08076553791761398,
"step": 3540,
"valid_targets_mean": 5038.4,
"valid_targets_min": 1650
},
{
"epoch": 3.9219701162147205,
"grad_norm": 0.24352589831960533,
"learning_rate": 1.9299559829171396e-05,
"loss": 0.1698,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07839047908782959,
"step": 3545,
"valid_targets_mean": 4684.4,
"valid_targets_min": 1996
},
{
"epoch": 3.927504150525733,
"grad_norm": 0.2638840372227269,
"learning_rate": 1.9244432354194483e-05,
"loss": 0.1687,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08922380208969116,
"step": 3550,
"valid_targets_mean": 4838.9,
"valid_targets_min": 1977
},
{
"epoch": 3.9330381848367457,
"grad_norm": 0.24960441994375437,
"learning_rate": 1.918931062733159e-05,
"loss": 0.17,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08381988853216171,
"step": 3555,
"valid_targets_mean": 5133.2,
"valid_targets_min": 1506
},
{
"epoch": 3.938572219147759,
"grad_norm": 0.2442163896469321,
"learning_rate": 1.9134195067930985e-05,
"loss": 0.1685,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08304736018180847,
"step": 3560,
"valid_targets_mean": 5072.2,
"valid_targets_min": 2124
},
{
"epoch": 3.9441062534587714,
"grad_norm": 0.28311527205978554,
"learning_rate": 1.9079086095293978e-05,
"loss": 0.1684,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09676555544137955,
"step": 3565,
"valid_targets_mean": 5254.5,
"valid_targets_min": 1760
},
{
"epoch": 3.949640287769784,
"grad_norm": 0.2775742290309911,
"learning_rate": 1.90239841286718e-05,
"loss": 0.1579,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06859570741653442,
"step": 3570,
"valid_targets_mean": 4087.4,
"valid_targets_min": 1891
},
{
"epoch": 3.955174322080797,
"grad_norm": 0.30165383534771095,
"learning_rate": 1.8968889587262373e-05,
"loss": 0.1435,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0765879675745964,
"step": 3575,
"valid_targets_mean": 4363.6,
"valid_targets_min": 1955
},
{
"epoch": 3.9607083563918097,
"grad_norm": 0.3177687011272404,
"learning_rate": 1.8913802890207132e-05,
"loss": 0.1409,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07781877368688583,
"step": 3580,
"valid_targets_mean": 4320.0,
"valid_targets_min": 2526
},
{
"epoch": 3.9662423907028224,
"grad_norm": 0.2626966192151495,
"learning_rate": 1.885872445658784e-05,
"loss": 0.1426,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07548317313194275,
"step": 3585,
"valid_targets_mean": 4363.6,
"valid_targets_min": 1674
},
{
"epoch": 3.971776425013835,
"grad_norm": 0.2800247562347386,
"learning_rate": 1.8803654705423372e-05,
"loss": 0.1462,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06895517557859421,
"step": 3590,
"valid_targets_mean": 4099.5,
"valid_targets_min": 2050
},
{
"epoch": 3.9773104593248476,
"grad_norm": 0.27891467086583555,
"learning_rate": 1.8748594055666577e-05,
"loss": 0.1458,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07581552118062973,
"step": 3595,
"valid_targets_mean": 4430.0,
"valid_targets_min": 1829
},
{
"epoch": 3.9828444936358607,
"grad_norm": 0.24997155449664565,
"learning_rate": 1.8693542926201042e-05,
"loss": 0.148,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07906609028577805,
"step": 3600,
"valid_targets_mean": 4739.8,
"valid_targets_min": 2082
},
{
"epoch": 3.9883785279468733,
"grad_norm": 0.2609218020015554,
"learning_rate": 1.8638501735837956e-05,
"loss": 0.1483,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0702708438038826,
"step": 3605,
"valid_targets_mean": 4067.0,
"valid_targets_min": 1637
},
{
"epoch": 3.993912562257886,
"grad_norm": 0.24947274856100093,
"learning_rate": 1.8583470903312842e-05,
"loss": 0.1454,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07230882346630096,
"step": 3610,
"valid_targets_mean": 4236.1,
"valid_targets_min": 2259
},
{
"epoch": 3.999446596568899,
"grad_norm": 0.2604568289333355,
"learning_rate": 1.8528450847282494e-05,
"loss": 0.1437,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06669026613235474,
"step": 3615,
"valid_targets_mean": 3957.5,
"valid_targets_min": 1518
},
{
"epoch": 4.00442722744881,
"grad_norm": 0.3615296486902075,
"learning_rate": 1.8473441986321658e-05,
"loss": 0.1546,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1087537333369255,
"step": 3620,
"valid_targets_mean": 7661.5,
"valid_targets_min": 2439
},
{
"epoch": 4.009961261759823,
"grad_norm": 0.24874350087256913,
"learning_rate": 1.841844473891995e-05,
"loss": 0.1908,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09617044776678085,
"step": 3625,
"valid_targets_mean": 6907.5,
"valid_targets_min": 2738
},
{
"epoch": 4.015495296070836,
"grad_norm": 0.21774237548987765,
"learning_rate": 1.836345952347862e-05,
"loss": 0.18,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08362749963998795,
"step": 3630,
"valid_targets_mean": 6410.7,
"valid_targets_min": 2445
},
{
"epoch": 4.0210293303818485,
"grad_norm": 0.21921994848890536,
"learning_rate": 1.8308486758307382e-05,
"loss": 0.1803,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08051495999097824,
"step": 3635,
"valid_targets_mean": 6399.4,
"valid_targets_min": 1929
},
{
"epoch": 4.026563364692861,
"grad_norm": 0.20926541818543987,
"learning_rate": 1.825352686162125e-05,
"loss": 0.1809,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07576586306095123,
"step": 3640,
"valid_targets_mean": 6164.7,
"valid_targets_min": 1823
},
{
"epoch": 4.032097399003874,
"grad_norm": 0.18768126266546767,
"learning_rate": 1.81985802515373e-05,
"loss": 0.1629,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07731462270021439,
"step": 3645,
"valid_targets_mean": 6921.8,
"valid_targets_min": 2809
},
{
"epoch": 4.037631433314886,
"grad_norm": 0.18836188233033177,
"learning_rate": 1.8143647346071566e-05,
"loss": 0.1711,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0950491726398468,
"step": 3650,
"valid_targets_mean": 6955.7,
"valid_targets_min": 2131
},
{
"epoch": 4.043165467625899,
"grad_norm": 0.19727093822121985,
"learning_rate": 1.8088728563135806e-05,
"loss": 0.17,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08911281824111938,
"step": 3655,
"valid_targets_mean": 7009.1,
"valid_targets_min": 1790
},
{
"epoch": 4.048699501936912,
"grad_norm": 0.20294571729859454,
"learning_rate": 1.8033824320534336e-05,
"loss": 0.1614,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07729238271713257,
"step": 3660,
"valid_targets_mean": 6647.1,
"valid_targets_min": 1889
},
{
"epoch": 4.054233536247925,
"grad_norm": 0.21478276080125386,
"learning_rate": 1.7978935035960873e-05,
"loss": 0.1601,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09047490358352661,
"step": 3665,
"valid_targets_mean": 7243.6,
"valid_targets_min": 2074
},
{
"epoch": 4.059767570558938,
"grad_norm": 0.22279499864290855,
"learning_rate": 1.79240611269953e-05,
"loss": 0.166,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09274063259363174,
"step": 3670,
"valid_targets_mean": 7255.7,
"valid_targets_min": 1549
},
{
"epoch": 4.06530160486995,
"grad_norm": 0.24519964467416966,
"learning_rate": 1.7869203011100566e-05,
"loss": 0.1643,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0784914568066597,
"step": 3675,
"valid_targets_mean": 7046.5,
"valid_targets_min": 1799
},
{
"epoch": 4.070835639180963,
"grad_norm": 0.20156601817139844,
"learning_rate": 1.781436110561945e-05,
"loss": 0.1628,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0783810019493103,
"step": 3680,
"valid_targets_mean": 6997.1,
"valid_targets_min": 1617
},
{
"epoch": 4.076369673491976,
"grad_norm": 0.21464079402718325,
"learning_rate": 1.7759535827771422e-05,
"loss": 0.1628,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07057405263185501,
"step": 3685,
"valid_targets_mean": 6658.6,
"valid_targets_min": 1317
},
{
"epoch": 4.081903707802988,
"grad_norm": 0.21650675445364018,
"learning_rate": 1.7704727594649422e-05,
"loss": 0.1576,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07326150685548782,
"step": 3690,
"valid_targets_mean": 6380.2,
"valid_targets_min": 1852
},
{
"epoch": 4.087437742114001,
"grad_norm": 0.21109180543842868,
"learning_rate": 1.7649936823216763e-05,
"loss": 0.1565,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08527389913797379,
"step": 3695,
"valid_targets_mean": 7227.7,
"valid_targets_min": 2572
},
{
"epoch": 4.0929717764250135,
"grad_norm": 0.21597274911137776,
"learning_rate": 1.7595163930303902e-05,
"loss": 0.1663,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0764990746974945,
"step": 3700,
"valid_targets_mean": 6691.6,
"valid_targets_min": 2260
},
{
"epoch": 4.098505810736026,
"grad_norm": 0.21074152697566187,
"learning_rate": 1.7540409332605254e-05,
"loss": 0.1601,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07818029820919037,
"step": 3705,
"valid_targets_mean": 6555.6,
"valid_targets_min": 2516
},
{
"epoch": 4.10403984504704,
"grad_norm": 0.2096894213490095,
"learning_rate": 1.7485673446676083e-05,
"loss": 0.1577,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07488299906253815,
"step": 3710,
"valid_targets_mean": 6841.9,
"valid_targets_min": 2355
},
{
"epoch": 4.109573879358052,
"grad_norm": 0.22354028109558502,
"learning_rate": 1.7430956688929283e-05,
"loss": 0.152,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0797095000743866,
"step": 3715,
"valid_targets_mean": 7266.3,
"valid_targets_min": 2994
},
{
"epoch": 4.115107913669065,
"grad_norm": 0.23105711899293185,
"learning_rate": 1.737625947563224e-05,
"loss": 0.1547,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07823490351438522,
"step": 3720,
"valid_targets_mean": 6713.0,
"valid_targets_min": 1810
},
{
"epoch": 4.1206419479800775,
"grad_norm": 0.2376544784068995,
"learning_rate": 1.7321582222903633e-05,
"loss": 0.1538,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06807952374219894,
"step": 3725,
"valid_targets_mean": 5598.9,
"valid_targets_min": 1999
},
{
"epoch": 4.12617598229109,
"grad_norm": 0.24742699875160848,
"learning_rate": 1.7266925346710298e-05,
"loss": 0.1521,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0800933688879013,
"step": 3730,
"valid_targets_mean": 7036.1,
"valid_targets_min": 2562
},
{
"epoch": 4.131710016602103,
"grad_norm": 0.22579775043356334,
"learning_rate": 1.7212289262864062e-05,
"loss": 0.151,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06760784983634949,
"step": 3735,
"valid_targets_mean": 6320.9,
"valid_targets_min": 2368
},
{
"epoch": 4.137244050913115,
"grad_norm": 0.23946866129603425,
"learning_rate": 1.7157674387018558e-05,
"loss": 0.1481,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05896640196442604,
"step": 3740,
"valid_targets_mean": 6202.8,
"valid_targets_min": 2211
},
{
"epoch": 4.142778085224128,
"grad_norm": 0.24631315838170026,
"learning_rate": 1.7103081134666082e-05,
"loss": 0.1589,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07588019222021103,
"step": 3745,
"valid_targets_mean": 6766.1,
"valid_targets_min": 2573
},
{
"epoch": 4.148312119535142,
"grad_norm": 0.239737773218279,
"learning_rate": 1.7048509921134414e-05,
"loss": 0.1462,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07164987921714783,
"step": 3750,
"valid_targets_mean": 6909.6,
"valid_targets_min": 1794
},
{
"epoch": 4.153846153846154,
"grad_norm": 0.23206720441459175,
"learning_rate": 1.6993961161583688e-05,
"loss": 0.1462,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07039956748485565,
"step": 3755,
"valid_targets_mean": 6667.0,
"valid_targets_min": 2490
},
{
"epoch": 4.159380188157167,
"grad_norm": 0.28050518211988124,
"learning_rate": 1.69394352710032e-05,
"loss": 0.1476,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07837789505720139,
"step": 3760,
"valid_targets_mean": 7530.7,
"valid_targets_min": 2368
},
{
"epoch": 4.164914222468179,
"grad_norm": 0.2430050074307155,
"learning_rate": 1.6884932664208278e-05,
"loss": 0.1522,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07588884234428406,
"step": 3765,
"valid_targets_mean": 7045.4,
"valid_targets_min": 2157
},
{
"epoch": 4.170448256779192,
"grad_norm": 0.2712507508374963,
"learning_rate": 1.6830453755837097e-05,
"loss": 0.1461,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08221418410539627,
"step": 3770,
"valid_targets_mean": 7343.0,
"valid_targets_min": 2030
},
{
"epoch": 4.175982291090205,
"grad_norm": 0.23336410380253853,
"learning_rate": 1.677599896034756e-05,
"loss": 0.1512,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08233041316270828,
"step": 3775,
"valid_targets_mean": 7534.6,
"valid_targets_min": 2929
},
{
"epoch": 4.181516325401217,
"grad_norm": 0.2407133203249527,
"learning_rate": 1.6721568692014132e-05,
"loss": 0.1501,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08575388789176941,
"step": 3780,
"valid_targets_mean": 7523.0,
"valid_targets_min": 2726
},
{
"epoch": 4.18705035971223,
"grad_norm": 0.27008357658440313,
"learning_rate": 1.666716336492465e-05,
"loss": 0.1529,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08472446352243423,
"step": 3785,
"valid_targets_mean": 7667.5,
"valid_targets_min": 2094
},
{
"epoch": 4.192584394023243,
"grad_norm": 0.25094042506394354,
"learning_rate": 1.661278339297725e-05,
"loss": 0.1524,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06790081411600113,
"step": 3790,
"valid_targets_mean": 6404.8,
"valid_targets_min": 1726
},
{
"epoch": 4.198118428334256,
"grad_norm": 0.24960985494169227,
"learning_rate": 1.6558429189877136e-05,
"loss": 0.1477,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08814112097024918,
"step": 3795,
"valid_targets_mean": 7508.5,
"valid_targets_min": 1982
},
{
"epoch": 4.203652462645269,
"grad_norm": 0.23685380443519255,
"learning_rate": 1.6504101169133502e-05,
"loss": 0.1511,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07432366907596588,
"step": 3800,
"valid_targets_mean": 6691.5,
"valid_targets_min": 2313
},
{
"epoch": 4.209186496956281,
"grad_norm": 0.2233873764002913,
"learning_rate": 1.6449799744056326e-05,
"loss": 0.1494,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07543178647756577,
"step": 3805,
"valid_targets_mean": 7022.8,
"valid_targets_min": 2791
},
{
"epoch": 4.214720531267294,
"grad_norm": 0.25189444245731557,
"learning_rate": 1.639552532775327e-05,
"loss": 0.1528,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07702386379241943,
"step": 3810,
"valid_targets_mean": 6730.0,
"valid_targets_min": 2100
},
{
"epoch": 4.220254565578307,
"grad_norm": 0.25534754639468726,
"learning_rate": 1.6341278333126537e-05,
"loss": 0.147,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06664300709962845,
"step": 3815,
"valid_targets_mean": 6620.6,
"valid_targets_min": 2477
},
{
"epoch": 4.225788599889319,
"grad_norm": 0.2974132005135256,
"learning_rate": 1.628705917286968e-05,
"loss": 0.1462,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06445831805467606,
"step": 3820,
"valid_targets_mean": 4577.6,
"valid_targets_min": 1817
},
{
"epoch": 4.231322634200332,
"grad_norm": 0.44015971722572467,
"learning_rate": 1.6232868259464533e-05,
"loss": 0.1241,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.051866840571165085,
"step": 3825,
"valid_targets_mean": 3941.8,
"valid_targets_min": 1708
},
{
"epoch": 4.2368566685113445,
"grad_norm": 0.42445133585718986,
"learning_rate": 1.6178706005178005e-05,
"loss": 0.1306,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06825078278779984,
"step": 3830,
"valid_targets_mean": 4732.0,
"valid_targets_min": 2113
},
{
"epoch": 4.242390702822357,
"grad_norm": 0.3906783833792015,
"learning_rate": 1.6124572822059002e-05,
"loss": 0.1472,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0659128725528717,
"step": 3835,
"valid_targets_mean": 4162.7,
"valid_targets_min": 1439
},
{
"epoch": 4.247924737133371,
"grad_norm": 0.34059660618028414,
"learning_rate": 1.6070469121935244e-05,
"loss": 0.1364,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05694308876991272,
"step": 3840,
"valid_targets_mean": 4168.2,
"valid_targets_min": 1580
},
{
"epoch": 4.253458771444383,
"grad_norm": 0.3878126160306128,
"learning_rate": 1.601639531641017e-05,
"loss": 0.1454,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07526243478059769,
"step": 3845,
"valid_targets_mean": 4418.8,
"valid_targets_min": 1172
},
{
"epoch": 4.258992805755396,
"grad_norm": 0.3222207333090876,
"learning_rate": 1.59623518168598e-05,
"loss": 0.1561,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07659698277711868,
"step": 3850,
"valid_targets_mean": 4298.7,
"valid_targets_min": 1729
},
{
"epoch": 4.2645268400664085,
"grad_norm": 0.3405375114224534,
"learning_rate": 1.5908339034429553e-05,
"loss": 0.1463,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06387145072221756,
"step": 3855,
"valid_targets_mean": 4263.8,
"valid_targets_min": 1526
},
{
"epoch": 4.270060874377421,
"grad_norm": 0.35138119803410545,
"learning_rate": 1.585435738003122e-05,
"loss": 0.1506,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07715055346488953,
"step": 3860,
"valid_targets_mean": 4593.6,
"valid_targets_min": 1793
},
{
"epoch": 4.275594908688434,
"grad_norm": 0.33785285840583545,
"learning_rate": 1.5800407264339723e-05,
"loss": 0.14,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06908231228590012,
"step": 3865,
"valid_targets_mean": 4257.0,
"valid_targets_min": 2012
},
{
"epoch": 4.281128942999446,
"grad_norm": 0.3310320736650623,
"learning_rate": 1.5746489097790095e-05,
"loss": 0.1433,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06672009080648422,
"step": 3870,
"valid_targets_mean": 3774.0,
"valid_targets_min": 1808
},
{
"epoch": 4.286662977310459,
"grad_norm": 0.311463607839016,
"learning_rate": 1.569260329057428e-05,
"loss": 0.149,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07763797044754028,
"step": 3875,
"valid_targets_mean": 4852.8,
"valid_targets_min": 1619
},
{
"epoch": 4.292197011621472,
"grad_norm": 0.3118208083512682,
"learning_rate": 1.5638750252638063e-05,
"loss": 0.15,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07648203521966934,
"step": 3880,
"valid_targets_mean": 4255.5,
"valid_targets_min": 1551
},
{
"epoch": 4.297731045932485,
"grad_norm": 0.3243321560248647,
"learning_rate": 1.5584930393677908e-05,
"loss": 0.1434,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07285168766975403,
"step": 3885,
"valid_targets_mean": 3931.0,
"valid_targets_min": 1430
},
{
"epoch": 4.303265080243498,
"grad_norm": 0.31813386126179766,
"learning_rate": 1.5531144123137884e-05,
"loss": 0.1358,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06385066360235214,
"step": 3890,
"valid_targets_mean": 4537.8,
"valid_targets_min": 1511
},
{
"epoch": 4.30879911455451,
"grad_norm": 0.33780246281634424,
"learning_rate": 1.5477391850206526e-05,
"loss": 0.1366,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08562406152486801,
"step": 3895,
"valid_targets_mean": 4946.9,
"valid_targets_min": 1389
},
{
"epoch": 4.314333148865523,
"grad_norm": 0.3090801042995307,
"learning_rate": 1.5423673983813714e-05,
"loss": 0.1462,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06944170594215393,
"step": 3900,
"valid_targets_mean": 4475.8,
"valid_targets_min": 1986
},
{
"epoch": 4.319867183176536,
"grad_norm": 0.2998739282759218,
"learning_rate": 1.53699909326276e-05,
"loss": 0.1361,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0686049684882164,
"step": 3905,
"valid_targets_mean": 4404.4,
"valid_targets_min": 1591
},
{
"epoch": 4.325401217487548,
"grad_norm": 0.31359183343090213,
"learning_rate": 1.531634310505144e-05,
"loss": 0.1395,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07918906956911087,
"step": 3910,
"valid_targets_mean": 4628.4,
"valid_targets_min": 1929
},
{
"epoch": 4.330935251798561,
"grad_norm": 0.3021828405506255,
"learning_rate": 1.5262730909220545e-05,
"loss": 0.1336,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06379434466362,
"step": 3915,
"valid_targets_mean": 4265.2,
"valid_targets_min": 1686
},
{
"epoch": 4.3364692861095735,
"grad_norm": 0.31493550037750695,
"learning_rate": 1.5209154752999142e-05,
"loss": 0.1508,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.060155678540468216,
"step": 3920,
"valid_targets_mean": 3913.0,
"valid_targets_min": 1477
},
{
"epoch": 4.342003320420587,
"grad_norm": 0.2979376162118054,
"learning_rate": 1.515561504397728e-05,
"loss": 0.1446,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06678381562232971,
"step": 3925,
"valid_targets_mean": 4541.2,
"valid_targets_min": 2006
},
{
"epoch": 4.3475373547316,
"grad_norm": 0.34626094261505586,
"learning_rate": 1.5102112189467742e-05,
"loss": 0.1392,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08782351016998291,
"step": 3930,
"valid_targets_mean": 4729.2,
"valid_targets_min": 1459
},
{
"epoch": 4.353071389042612,
"grad_norm": 0.350296048861095,
"learning_rate": 1.50486465965029e-05,
"loss": 0.1421,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07288840413093567,
"step": 3935,
"valid_targets_mean": 4464.4,
"valid_targets_min": 1616
},
{
"epoch": 4.358605423353625,
"grad_norm": 0.31987640666361744,
"learning_rate": 1.4995218671831705e-05,
"loss": 0.1394,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06294938921928406,
"step": 3940,
"valid_targets_mean": 3874.0,
"valid_targets_min": 1494
},
{
"epoch": 4.3641394576646375,
"grad_norm": 0.30819667327862005,
"learning_rate": 1.494182882191648e-05,
"loss": 0.1386,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06814851611852646,
"step": 3945,
"valid_targets_mean": 4333.2,
"valid_targets_min": 1769
},
{
"epoch": 4.36967349197565,
"grad_norm": 0.2924284374500159,
"learning_rate": 1.4888477452929939e-05,
"loss": 0.1387,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0692083016037941,
"step": 3950,
"valid_targets_mean": 4336.7,
"valid_targets_min": 1614
},
{
"epoch": 4.375207526286663,
"grad_norm": 0.2980347648638733,
"learning_rate": 1.4835164970752009e-05,
"loss": 0.14,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06465265899896622,
"step": 3955,
"valid_targets_mean": 4379.2,
"valid_targets_min": 1480
},
{
"epoch": 4.380741560597675,
"grad_norm": 0.33585729515337576,
"learning_rate": 1.4781891780966807e-05,
"loss": 0.1326,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07466866075992584,
"step": 3960,
"valid_targets_mean": 4534.8,
"valid_targets_min": 1647
},
{
"epoch": 4.386275594908689,
"grad_norm": 0.33954531909020547,
"learning_rate": 1.4728658288859513e-05,
"loss": 0.1288,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06735555827617645,
"step": 3965,
"valid_targets_mean": 4447.5,
"valid_targets_min": 1564
},
{
"epoch": 4.3918096292197015,
"grad_norm": 0.3253826621039958,
"learning_rate": 1.4675464899413284e-05,
"loss": 0.1349,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.062315523624420166,
"step": 3970,
"valid_targets_mean": 3862.5,
"valid_targets_min": 1318
},
{
"epoch": 4.397343663530714,
"grad_norm": 0.3159085492524021,
"learning_rate": 1.462231201730622e-05,
"loss": 0.1373,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06629395484924316,
"step": 3975,
"valid_targets_mean": 3827.4,
"valid_targets_min": 1371
},
{
"epoch": 4.402877697841727,
"grad_norm": 0.32534308965146447,
"learning_rate": 1.456920004690823e-05,
"loss": 0.1389,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07012656331062317,
"step": 3980,
"valid_targets_mean": 4606.9,
"valid_targets_min": 1870
},
{
"epoch": 4.408411732152739,
"grad_norm": 0.3216555715303935,
"learning_rate": 1.4516129392278003e-05,
"loss": 0.1268,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05857391655445099,
"step": 3985,
"valid_targets_mean": 3911.3,
"valid_targets_min": 1488
},
{
"epoch": 4.413945766463752,
"grad_norm": 0.3282521488414122,
"learning_rate": 1.4463100457159877e-05,
"loss": 0.1377,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06805693358182907,
"step": 3990,
"valid_targets_mean": 4191.2,
"valid_targets_min": 1884
},
{
"epoch": 4.419479800774765,
"grad_norm": 0.32474929052230217,
"learning_rate": 1.4410113644980839e-05,
"loss": 0.1315,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06785105913877487,
"step": 3995,
"valid_targets_mean": 4723.3,
"valid_targets_min": 1628
},
{
"epoch": 4.425013835085777,
"grad_norm": 0.3284907213593056,
"learning_rate": 1.4357169358847389e-05,
"loss": 0.1231,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05492676421999931,
"step": 4000,
"valid_targets_mean": 4008.1,
"valid_targets_min": 1914
},
{
"epoch": 4.43054786939679,
"grad_norm": 0.35574101579330153,
"learning_rate": 1.4304268001542519e-05,
"loss": 0.1284,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06498607993125916,
"step": 4005,
"valid_targets_mean": 4685.6,
"valid_targets_min": 2247
},
{
"epoch": 4.436081903707803,
"grad_norm": 0.33321809273036523,
"learning_rate": 1.4251409975522636e-05,
"loss": 0.1326,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.061576616019010544,
"step": 4010,
"valid_targets_mean": 4355.3,
"valid_targets_min": 1633
},
{
"epoch": 4.441615938018816,
"grad_norm": 0.33404638633231243,
"learning_rate": 1.419859568291447e-05,
"loss": 0.1283,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07737898081541061,
"step": 4015,
"valid_targets_mean": 4712.5,
"valid_targets_min": 1714
},
{
"epoch": 4.447149972329829,
"grad_norm": 0.3497397035228793,
"learning_rate": 1.4145825525512083e-05,
"loss": 0.1263,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06712006777524948,
"step": 4020,
"valid_targets_mean": 4363.5,
"valid_targets_min": 1473
},
{
"epoch": 4.452684006640841,
"grad_norm": 0.36013635115483095,
"learning_rate": 1.4093099904773726e-05,
"loss": 0.1353,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06490481644868851,
"step": 4025,
"valid_targets_mean": 4250.2,
"valid_targets_min": 1551
},
{
"epoch": 4.458218040951854,
"grad_norm": 0.32488215075011995,
"learning_rate": 1.4040419221818868e-05,
"loss": 0.1347,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06323728710412979,
"step": 4030,
"valid_targets_mean": 4371.3,
"valid_targets_min": 2003
},
{
"epoch": 4.4637520752628665,
"grad_norm": 0.3249210032879383,
"learning_rate": 1.3987783877425072e-05,
"loss": 0.1329,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06592188030481339,
"step": 4035,
"valid_targets_mean": 4365.3,
"valid_targets_min": 1446
},
{
"epoch": 4.469286109573879,
"grad_norm": 0.28724233199462046,
"learning_rate": 1.393519427202501e-05,
"loss": 0.1212,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05613340064883232,
"step": 4040,
"valid_targets_mean": 5889.4,
"valid_targets_min": 1633
},
{
"epoch": 4.474820143884892,
"grad_norm": 0.23711156534213082,
"learning_rate": 1.3882650805703377e-05,
"loss": 0.1122,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.051731567829847336,
"step": 4045,
"valid_targets_mean": 5894.5,
"valid_targets_min": 2159
},
{
"epoch": 4.480354178195904,
"grad_norm": 0.19306426908842927,
"learning_rate": 1.3830153878193834e-05,
"loss": 0.1189,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0583718977868557,
"step": 4050,
"valid_targets_mean": 5530.8,
"valid_targets_min": 2066
},
{
"epoch": 4.485888212506918,
"grad_norm": 0.18149358463243234,
"learning_rate": 1.3777703888876028e-05,
"loss": 0.1091,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04824841022491455,
"step": 4055,
"valid_targets_mean": 5229.4,
"valid_targets_min": 1790
},
{
"epoch": 4.491422246817931,
"grad_norm": 0.17464115907385364,
"learning_rate": 1.3725301236772483e-05,
"loss": 0.1109,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05410352349281311,
"step": 4060,
"valid_targets_mean": 5318.1,
"valid_targets_min": 2531
},
{
"epoch": 4.496956281128943,
"grad_norm": 0.17874490281802502,
"learning_rate": 1.3672946320545628e-05,
"loss": 0.107,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05268557742238045,
"step": 4065,
"valid_targets_mean": 5814.4,
"valid_targets_min": 1901
},
{
"epoch": 4.502490315439956,
"grad_norm": 0.16795797581062424,
"learning_rate": 1.362063953849469e-05,
"loss": 0.0997,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04696022346615791,
"step": 4070,
"valid_targets_mean": 5287.9,
"valid_targets_min": 1855
},
{
"epoch": 4.508024349750968,
"grad_norm": 0.17567280237182417,
"learning_rate": 1.3568381288552748e-05,
"loss": 0.0993,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.053378403186798096,
"step": 4075,
"valid_targets_mean": 5617.3,
"valid_targets_min": 1984
},
{
"epoch": 4.513558384061981,
"grad_norm": 0.17977586868192777,
"learning_rate": 1.3516171968283649e-05,
"loss": 0.0908,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.049263015389442444,
"step": 4080,
"valid_targets_mean": 5884.0,
"valid_targets_min": 2647
},
{
"epoch": 4.519092418372994,
"grad_norm": 0.19740781183830758,
"learning_rate": 1.3464011974878988e-05,
"loss": 0.0987,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04521234333515167,
"step": 4085,
"valid_targets_mean": 5214.2,
"valid_targets_min": 2632
},
{
"epoch": 4.524626452684006,
"grad_norm": 0.20383505960047912,
"learning_rate": 1.3411901705155126e-05,
"loss": 0.0966,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04395684972405434,
"step": 4090,
"valid_targets_mean": 5505.8,
"valid_targets_min": 2755
},
{
"epoch": 4.530160486995019,
"grad_norm": 0.19576017975585366,
"learning_rate": 1.3359841555550102e-05,
"loss": 0.0959,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.047161608934402466,
"step": 4095,
"valid_targets_mean": 5478.0,
"valid_targets_min": 1291
},
{
"epoch": 4.5356945213060325,
"grad_norm": 0.20223095318809983,
"learning_rate": 1.3307831922120691e-05,
"loss": 0.091,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04582715034484863,
"step": 4100,
"valid_targets_mean": 5744.8,
"valid_targets_min": 1269
},
{
"epoch": 4.541228555617045,
"grad_norm": 0.20193723656409343,
"learning_rate": 1.325587320053934e-05,
"loss": 0.0894,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04994739219546318,
"step": 4105,
"valid_targets_mean": 5808.3,
"valid_targets_min": 1922
},
{
"epoch": 4.546762589928058,
"grad_norm": 0.21038735128119,
"learning_rate": 1.3203965786091187e-05,
"loss": 0.0857,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04188760742545128,
"step": 4110,
"valid_targets_mean": 5499.9,
"valid_targets_min": 1968
},
{
"epoch": 4.55229662423907,
"grad_norm": 0.21118246301948174,
"learning_rate": 1.3152110073671027e-05,
"loss": 0.0881,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.040510065853595734,
"step": 4115,
"valid_targets_mean": 5453.8,
"valid_targets_min": 1899
},
{
"epoch": 4.557830658550083,
"grad_norm": 0.20307802961381277,
"learning_rate": 1.3100306457780339e-05,
"loss": 0.0887,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.048915524035692215,
"step": 4120,
"valid_targets_mean": 5544.6,
"valid_targets_min": 2127
},
{
"epoch": 4.563364692861096,
"grad_norm": 0.2178967026283615,
"learning_rate": 1.3048555332524263e-05,
"loss": 0.0874,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04666067659854889,
"step": 4125,
"valid_targets_mean": 5964.0,
"valid_targets_min": 2088
},
{
"epoch": 4.568898727172108,
"grad_norm": 0.20195987432932186,
"learning_rate": 1.2996857091608595e-05,
"loss": 0.0853,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.037834491580724716,
"step": 4130,
"valid_targets_mean": 5607.6,
"valid_targets_min": 3237
},
{
"epoch": 4.574432761483121,
"grad_norm": 0.19860253079715776,
"learning_rate": 1.2945212128336819e-05,
"loss": 0.0849,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04107757285237312,
"step": 4135,
"valid_targets_mean": 5680.2,
"valid_targets_min": 2183
},
{
"epoch": 4.5799667957941335,
"grad_norm": 0.2018354713018964,
"learning_rate": 1.2893620835607092e-05,
"loss": 0.0885,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.046085942536592484,
"step": 4140,
"valid_targets_mean": 5323.5,
"valid_targets_min": 2257
},
{
"epoch": 4.585500830105147,
"grad_norm": 0.21606523713545506,
"learning_rate": 1.2842083605909276e-05,
"loss": 0.0867,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04127819463610649,
"step": 4145,
"valid_targets_mean": 5460.1,
"valid_targets_min": 3076
},
{
"epoch": 4.59103486441616,
"grad_norm": 0.2101210681414386,
"learning_rate": 1.2790600831321913e-05,
"loss": 0.0864,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04266387224197388,
"step": 4150,
"valid_targets_mean": 5721.5,
"valid_targets_min": 1692
},
{
"epoch": 4.596568898727172,
"grad_norm": 0.19303279577936738,
"learning_rate": 1.273917290350929e-05,
"loss": 0.0825,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04391302540898323,
"step": 4155,
"valid_targets_mean": 5423.7,
"valid_targets_min": 2850
},
{
"epoch": 4.602102933038185,
"grad_norm": 0.2196543955803934,
"learning_rate": 1.268780021371844e-05,
"loss": 0.0846,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04037768021225929,
"step": 4160,
"valid_targets_mean": 5830.5,
"valid_targets_min": 2413
},
{
"epoch": 4.6076369673491975,
"grad_norm": 0.1984560903462667,
"learning_rate": 1.2636483152776143e-05,
"loss": 0.0825,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04546644166111946,
"step": 4165,
"valid_targets_mean": 5912.3,
"valid_targets_min": 2614
},
{
"epoch": 4.61317100166021,
"grad_norm": 0.22930911625183262,
"learning_rate": 1.2585222111085996e-05,
"loss": 0.0875,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.046509597450494766,
"step": 4170,
"valid_targets_mean": 5704.6,
"valid_targets_min": 1416
},
{
"epoch": 4.618705035971223,
"grad_norm": 0.21168966624145297,
"learning_rate": 1.2534017478625391e-05,
"loss": 0.0856,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04334982857108116,
"step": 4175,
"valid_targets_mean": 5734.4,
"valid_targets_min": 2234
},
{
"epoch": 4.624239070282236,
"grad_norm": 0.2125073621973969,
"learning_rate": 1.2482869644942608e-05,
"loss": 0.0751,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04163689911365509,
"step": 4180,
"valid_targets_mean": 5532.1,
"valid_targets_min": 2237
},
{
"epoch": 4.629773104593248,
"grad_norm": 0.21539042139380618,
"learning_rate": 1.2431778999153796e-05,
"loss": 0.0836,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03761904314160347,
"step": 4185,
"valid_targets_mean": 4842.2,
"valid_targets_min": 1875
},
{
"epoch": 4.6353071389042615,
"grad_norm": 0.205450846924651,
"learning_rate": 1.2380745929940052e-05,
"loss": 0.0775,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0382852703332901,
"step": 4190,
"valid_targets_mean": 5742.5,
"valid_targets_min": 2469
},
{
"epoch": 4.640841173215274,
"grad_norm": 0.19439066732416754,
"learning_rate": 1.232977082554445e-05,
"loss": 0.0846,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03928928077220917,
"step": 4195,
"valid_targets_mean": 5476.2,
"valid_targets_min": 1835
},
{
"epoch": 4.646375207526287,
"grad_norm": 0.1853857456809193,
"learning_rate": 1.2278854073769066e-05,
"loss": 0.0804,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.037013471126556396,
"step": 4200,
"valid_targets_mean": 5632.0,
"valid_targets_min": 1288
},
{
"epoch": 4.651909241837299,
"grad_norm": 0.20631684561188882,
"learning_rate": 1.2227996061972083e-05,
"loss": 0.075,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03684552013874054,
"step": 4205,
"valid_targets_mean": 5595.0,
"valid_targets_min": 2228
},
{
"epoch": 4.657443276148312,
"grad_norm": 0.2192507106190281,
"learning_rate": 1.2177197177064768e-05,
"loss": 0.0781,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04795651137828827,
"step": 4210,
"valid_targets_mean": 6140.2,
"valid_targets_min": 2896
},
{
"epoch": 4.662977310459325,
"grad_norm": 0.2121775921922545,
"learning_rate": 1.2126457805508603e-05,
"loss": 0.0782,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03650488331913948,
"step": 4215,
"valid_targets_mean": 5670.7,
"valid_targets_min": 2615
},
{
"epoch": 4.668511344770337,
"grad_norm": 0.20449506169734838,
"learning_rate": 1.207577833331229e-05,
"loss": 0.08,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04212837293744087,
"step": 4220,
"valid_targets_mean": 6108.9,
"valid_targets_min": 3283
},
{
"epoch": 4.674045379081351,
"grad_norm": 0.19508106582699883,
"learning_rate": 1.202515914602886e-05,
"loss": 0.0777,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03631249815225601,
"step": 4225,
"valid_targets_mean": 5478.3,
"valid_targets_min": 2154
},
{
"epoch": 4.679579413392363,
"grad_norm": 0.20810963639880978,
"learning_rate": 1.1974600628752681e-05,
"loss": 0.0784,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03693137690424919,
"step": 4230,
"valid_targets_mean": 5802.5,
"valid_targets_min": 1887
},
{
"epoch": 4.685113447703376,
"grad_norm": 0.21279762134599406,
"learning_rate": 1.1924103166116598e-05,
"loss": 0.0805,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.038755886256694794,
"step": 4235,
"valid_targets_mean": 5761.5,
"valid_targets_min": 1754
},
{
"epoch": 4.690647482014389,
"grad_norm": 0.20795635056360526,
"learning_rate": 1.1873667142288956e-05,
"loss": 0.0723,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03495751693844795,
"step": 4240,
"valid_targets_mean": 5489.2,
"valid_targets_min": 2284
},
{
"epoch": 4.696181516325401,
"grad_norm": 0.20836060464310172,
"learning_rate": 1.1823292940970692e-05,
"loss": 0.0781,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03726666420698166,
"step": 4245,
"valid_targets_mean": 5341.3,
"valid_targets_min": 2340
},
{
"epoch": 4.701715550636414,
"grad_norm": 0.20843861440410902,
"learning_rate": 1.1772980945392427e-05,
"loss": 0.0728,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03751606121659279,
"step": 4250,
"valid_targets_mean": 5431.4,
"valid_targets_min": 1828
},
{
"epoch": 4.7072495849474265,
"grad_norm": 0.19972530412032494,
"learning_rate": 1.172273153831152e-05,
"loss": 0.072,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03226105496287346,
"step": 4255,
"valid_targets_mean": 5290.1,
"valid_targets_min": 2681
},
{
"epoch": 4.712783619258439,
"grad_norm": 0.20865318170034022,
"learning_rate": 1.167254510200921e-05,
"loss": 0.074,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04075950011610985,
"step": 4260,
"valid_targets_mean": 5485.9,
"valid_targets_min": 2475
},
{
"epoch": 4.718317653569452,
"grad_norm": 0.23813125977819116,
"learning_rate": 1.1622422018287635e-05,
"loss": 0.0759,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03836166486144066,
"step": 4265,
"valid_targets_mean": 5596.4,
"valid_targets_min": 2069
},
{
"epoch": 4.723851687880465,
"grad_norm": 0.21498738596125336,
"learning_rate": 1.1572362668466995e-05,
"loss": 0.0769,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04106292873620987,
"step": 4270,
"valid_targets_mean": 5956.1,
"valid_targets_min": 2766
},
{
"epoch": 4.729385722191478,
"grad_norm": 0.21114082725651798,
"learning_rate": 1.1522367433382633e-05,
"loss": 0.0752,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.039354342967271805,
"step": 4275,
"valid_targets_mean": 5119.2,
"valid_targets_min": 2043
},
{
"epoch": 4.7349197565024905,
"grad_norm": 0.2151908373056844,
"learning_rate": 1.147243669338209e-05,
"loss": 0.0753,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.037762101739645004,
"step": 4280,
"valid_targets_mean": 5718.6,
"valid_targets_min": 2696
},
{
"epoch": 4.740453790813503,
"grad_norm": 0.2099551489654757,
"learning_rate": 1.1422570828322285e-05,
"loss": 0.0762,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.039806973189115524,
"step": 4285,
"valid_targets_mean": 5818.4,
"valid_targets_min": 2425
},
{
"epoch": 4.745987825124516,
"grad_norm": 0.20429021711714365,
"learning_rate": 1.1372770217566562e-05,
"loss": 0.0744,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03849330544471741,
"step": 4290,
"valid_targets_mean": 5530.9,
"valid_targets_min": 1540
},
{
"epoch": 4.751521859435528,
"grad_norm": 0.2026865420434942,
"learning_rate": 1.1323035239981856e-05,
"loss": 0.0789,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03567812219262123,
"step": 4295,
"valid_targets_mean": 5335.0,
"valid_targets_min": 2544
},
{
"epoch": 4.757055893746541,
"grad_norm": 0.29789586977612714,
"learning_rate": 1.1273366273935759e-05,
"loss": 0.0959,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05724092945456505,
"step": 4300,
"valid_targets_mean": 4571.2,
"valid_targets_min": 2219
},
{
"epoch": 4.762589928057554,
"grad_norm": 0.3316362801818146,
"learning_rate": 1.1223763697293695e-05,
"loss": 0.1046,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04876897856593132,
"step": 4305,
"valid_targets_mean": 3826.4,
"valid_targets_min": 1483
},
{
"epoch": 4.768123962368566,
"grad_norm": 0.33551860487043705,
"learning_rate": 1.1174227887416005e-05,
"loss": 0.103,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05014974996447563,
"step": 4310,
"valid_targets_mean": 4318.0,
"valid_targets_min": 1571
},
{
"epoch": 4.77365799667958,
"grad_norm": 0.327002436914812,
"learning_rate": 1.1124759221155092e-05,
"loss": 0.108,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0552230030298233,
"step": 4315,
"valid_targets_mean": 4533.9,
"valid_targets_min": 1401
},
{
"epoch": 4.779192030990592,
"grad_norm": 0.28803494848222577,
"learning_rate": 1.107535807485256e-05,
"loss": 0.1116,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05753651261329651,
"step": 4320,
"valid_targets_mean": 4452.8,
"valid_targets_min": 2102
},
{
"epoch": 4.784726065301605,
"grad_norm": 0.2686551481691491,
"learning_rate": 1.1026024824336323e-05,
"loss": 0.1076,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.051282186061143875,
"step": 4325,
"valid_targets_mean": 3980.8,
"valid_targets_min": 1100
},
{
"epoch": 4.790260099612618,
"grad_norm": 0.3433498093901168,
"learning_rate": 1.0976759844917795e-05,
"loss": 0.1003,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04425298050045967,
"step": 4330,
"valid_targets_mean": 6227.9,
"valid_targets_min": 952
},
{
"epoch": 4.79579413392363,
"grad_norm": 0.33910744534375425,
"learning_rate": 1.092756351138897e-05,
"loss": 0.1055,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05586230754852295,
"step": 4335,
"valid_targets_mean": 7692.2,
"valid_targets_min": 974
},
{
"epoch": 4.801328168234643,
"grad_norm": 0.3059364705184329,
"learning_rate": 1.0878436198019645e-05,
"loss": 0.1062,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05682585760951042,
"step": 4340,
"valid_targets_mean": 8154.4,
"valid_targets_min": 2085
},
{
"epoch": 4.8068622025456555,
"grad_norm": 0.27601921800383866,
"learning_rate": 1.0829378278554493e-05,
"loss": 0.1056,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04944746568799019,
"step": 4345,
"valid_targets_mean": 7351.3,
"valid_targets_min": 917
},
{
"epoch": 4.812396236856668,
"grad_norm": 0.2769996942215238,
"learning_rate": 1.0780390126210288e-05,
"loss": 0.1115,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.054811980575323105,
"step": 4350,
"valid_targets_mean": 7964.9,
"valid_targets_min": 2908
},
{
"epoch": 4.817930271167681,
"grad_norm": 0.22968483653271038,
"learning_rate": 1.0731472113673052e-05,
"loss": 0.1057,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04972505569458008,
"step": 4355,
"valid_targets_mean": 7937.8,
"valid_targets_min": 1400
},
{
"epoch": 4.823464305478694,
"grad_norm": 0.2853677264211911,
"learning_rate": 1.0682624613095167e-05,
"loss": 0.125,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06412405520677567,
"step": 4360,
"valid_targets_mean": 12586.8,
"valid_targets_min": 5456
},
{
"epoch": 4.828998339789707,
"grad_norm": 0.1943599246918971,
"learning_rate": 1.0633847996092614e-05,
"loss": 0.1438,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0753672644495964,
"step": 4365,
"valid_targets_mean": 13651.0,
"valid_targets_min": 1115
},
{
"epoch": 4.83453237410072,
"grad_norm": 0.1775365824202433,
"learning_rate": 1.0585142633742092e-05,
"loss": 0.1417,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07086262851953506,
"step": 4370,
"valid_targets_mean": 14026.5,
"valid_targets_min": 1038
},
{
"epoch": 4.840066408411732,
"grad_norm": 0.1549695067204721,
"learning_rate": 1.0536508896578242e-05,
"loss": 0.1412,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06735699623823166,
"step": 4375,
"valid_targets_mean": 12705.8,
"valid_targets_min": 1006
},
{
"epoch": 4.845600442722745,
"grad_norm": 0.22373494573606925,
"learning_rate": 1.0487947154590772e-05,
"loss": 0.111,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04747587442398071,
"step": 4380,
"valid_targets_mean": 7084.4,
"valid_targets_min": 1340
},
{
"epoch": 4.851134477033757,
"grad_norm": 0.24007175445827605,
"learning_rate": 1.0439457777221706e-05,
"loss": 0.0864,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04307395592331886,
"step": 4385,
"valid_targets_mean": 7130.2,
"valid_targets_min": 915
},
{
"epoch": 4.85666851134477,
"grad_norm": 0.29404821959647026,
"learning_rate": 1.0391041133362523e-05,
"loss": 0.0851,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06584474444389343,
"step": 4390,
"valid_targets_mean": 5321.2,
"valid_targets_min": 2197
},
{
"epoch": 4.862202545655783,
"grad_norm": 0.26180868997040285,
"learning_rate": 1.0342697591351377e-05,
"loss": 0.1175,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.049729812890291214,
"step": 4395,
"valid_targets_mean": 4732.5,
"valid_targets_min": 1967
},
{
"epoch": 4.867736579966795,
"grad_norm": 0.29007400477711953,
"learning_rate": 1.0294427518970292e-05,
"loss": 0.1094,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05817165970802307,
"step": 4400,
"valid_targets_mean": 5243.5,
"valid_targets_min": 1678
},
{
"epoch": 4.873270614277809,
"grad_norm": 0.3072483070061111,
"learning_rate": 1.0246231283442332e-05,
"loss": 0.1089,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05918870493769646,
"step": 4405,
"valid_targets_mean": 5038.7,
"valid_targets_min": 1770
},
{
"epoch": 4.8788046485888215,
"grad_norm": 0.28996219297193787,
"learning_rate": 1.0198109251428872e-05,
"loss": 0.1108,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05295060947537422,
"step": 4410,
"valid_targets_mean": 4237.3,
"valid_targets_min": 1640
},
{
"epoch": 4.884338682899834,
"grad_norm": 0.27499077703198677,
"learning_rate": 1.0150061789026733e-05,
"loss": 0.1106,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06034369766712189,
"step": 4415,
"valid_targets_mean": 4563.9,
"valid_targets_min": 1755
},
{
"epoch": 4.889872717210847,
"grad_norm": 0.31840419017600025,
"learning_rate": 1.0102089261765462e-05,
"loss": 0.1214,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06176462769508362,
"step": 4420,
"valid_targets_mean": 5055.2,
"valid_targets_min": 1858
},
{
"epoch": 4.895406751521859,
"grad_norm": 0.2689260733055054,
"learning_rate": 1.0054192034604522e-05,
"loss": 0.1289,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06580108404159546,
"step": 4425,
"valid_targets_mean": 4773.1,
"valid_targets_min": 1714
},
{
"epoch": 4.900940785832872,
"grad_norm": 0.2647577766370914,
"learning_rate": 1.000637047193049e-05,
"loss": 0.1346,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0675923228263855,
"step": 4430,
"valid_targets_mean": 5269.0,
"valid_targets_min": 1316
},
{
"epoch": 4.906474820143885,
"grad_norm": 0.25175825106931504,
"learning_rate": 9.958624937554356e-06,
"loss": 0.1339,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0740848183631897,
"step": 4435,
"valid_targets_mean": 5723.2,
"valid_targets_min": 1929
},
{
"epoch": 4.912008854454898,
"grad_norm": 0.2541669896283131,
"learning_rate": 9.910955794708668e-06,
"loss": 0.1276,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06130128726363182,
"step": 4440,
"valid_targets_mean": 4649.5,
"valid_targets_min": 1923
},
{
"epoch": 4.917542888765911,
"grad_norm": 0.24388814289257738,
"learning_rate": 9.863363406044849e-06,
"loss": 0.127,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06754420697689056,
"step": 4445,
"valid_targets_mean": 4893.2,
"valid_targets_min": 1673
},
{
"epoch": 4.923076923076923,
"grad_norm": 0.253006989245634,
"learning_rate": 9.815848133630364e-06,
"loss": 0.1231,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0545407272875309,
"step": 4450,
"valid_targets_mean": 4655.0,
"valid_targets_min": 1883
},
{
"epoch": 4.928610957387936,
"grad_norm": 0.26114474356839684,
"learning_rate": 9.768410338946038e-06,
"loss": 0.1261,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0732916072010994,
"step": 4455,
"valid_targets_mean": 5300.7,
"valid_targets_min": 2051
},
{
"epoch": 4.934144991698949,
"grad_norm": 0.2541083629983541,
"learning_rate": 9.721050382883242e-06,
"loss": 0.1239,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0583202950656414,
"step": 4460,
"valid_targets_mean": 4678.7,
"valid_targets_min": 1933
},
{
"epoch": 4.939679026009961,
"grad_norm": 0.2414388793326451,
"learning_rate": 9.673768625741193e-06,
"loss": 0.1278,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.061433177441358566,
"step": 4465,
"valid_targets_mean": 5780.5,
"valid_targets_min": 1422
},
{
"epoch": 4.945213060320974,
"grad_norm": 0.26581185336094676,
"learning_rate": 9.626565427224192e-06,
"loss": 0.1241,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0596851110458374,
"step": 4470,
"valid_targets_mean": 4821.9,
"valid_targets_min": 2022
},
{
"epoch": 4.9507470946319865,
"grad_norm": 0.2735582196598092,
"learning_rate": 9.57944114643889e-06,
"loss": 0.1114,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05883411690592766,
"step": 4475,
"valid_targets_mean": 4274.3,
"valid_targets_min": 1649
},
{
"epoch": 4.956281128942999,
"grad_norm": 0.27818780258660997,
"learning_rate": 9.532396141891569e-06,
"loss": 0.0993,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0458868183195591,
"step": 4480,
"valid_targets_mean": 4046.1,
"valid_targets_min": 1637
},
{
"epoch": 4.961815163254013,
"grad_norm": 0.3003596198137884,
"learning_rate": 9.485430771485373e-06,
"loss": 0.0953,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04684314504265785,
"step": 4485,
"valid_targets_mean": 4062.4,
"valid_targets_min": 1853
},
{
"epoch": 4.967349197565025,
"grad_norm": 0.2868799722839849,
"learning_rate": 9.438545392517652e-06,
"loss": 0.0991,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04980555176734924,
"step": 4490,
"valid_targets_mean": 4217.3,
"valid_targets_min": 1262
},
{
"epoch": 4.972883231876038,
"grad_norm": 0.26196698800655627,
"learning_rate": 9.391740361677173e-06,
"loss": 0.1015,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04342920705676079,
"step": 4495,
"valid_targets_mean": 4143.7,
"valid_targets_min": 1761
},
{
"epoch": 4.9784172661870505,
"grad_norm": 0.26604115606438405,
"learning_rate": 9.345016035041465e-06,
"loss": 0.1009,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05186079069972038,
"step": 4500,
"valid_targets_mean": 4363.9,
"valid_targets_min": 1864
},
{
"epoch": 4.983951300498063,
"grad_norm": 0.278259737373658,
"learning_rate": 9.298372768074087e-06,
"loss": 0.1056,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05233500525355339,
"step": 4505,
"valid_targets_mean": 4360.2,
"valid_targets_min": 1789
},
{
"epoch": 4.989485334809076,
"grad_norm": 0.25668363958803886,
"learning_rate": 9.251810915621886e-06,
"loss": 0.1026,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05602368712425232,
"step": 4510,
"valid_targets_mean": 4662.1,
"valid_targets_min": 1550
},
{
"epoch": 4.995019369120088,
"grad_norm": 0.2768152114205245,
"learning_rate": 9.205330831912391e-06,
"loss": 0.1021,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.048191387206315994,
"step": 4515,
"valid_targets_mean": 4001.0,
"valid_targets_min": 1185
},
{
"epoch": 5.0,
"grad_norm": 0.26913245830976207,
"learning_rate": 9.158932870551012e-06,
"loss": 0.0912,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.051119934767484665,
"step": 4520,
"valid_targets_mean": 6656.8,
"valid_targets_min": 2566
},
{
"epoch": 5.005534034311013,
"grad_norm": 0.3818780932790394,
"learning_rate": 9.11261738451843e-06,
"loss": 0.1399,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06865507364273071,
"step": 4525,
"valid_targets_mean": 6579.2,
"valid_targets_min": 1651
},
{
"epoch": 5.011068068622025,
"grad_norm": 0.26736649847077115,
"learning_rate": 9.066384726167852e-06,
"loss": 0.1634,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07701835036277771,
"step": 4530,
"valid_targets_mean": 6844.8,
"valid_targets_min": 2928
},
{
"epoch": 5.016602102933038,
"grad_norm": 0.24921269016703676,
"learning_rate": 9.02023524722238e-06,
"loss": 0.1548,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0844825804233551,
"step": 4535,
"valid_targets_mean": 6970.2,
"valid_targets_min": 1816
},
{
"epoch": 5.0221361372440505,
"grad_norm": 0.23123025216852947,
"learning_rate": 8.97416929877232e-06,
"loss": 0.1569,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08778110146522522,
"step": 4540,
"valid_targets_mean": 7589.0,
"valid_targets_min": 2058
},
{
"epoch": 5.027670171555064,
"grad_norm": 0.2183352157949055,
"learning_rate": 8.928187231272473e-06,
"loss": 0.1521,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08101414889097214,
"step": 4545,
"valid_targets_mean": 7366.7,
"valid_targets_min": 3293
},
{
"epoch": 5.033204205866077,
"grad_norm": 0.22039800103534601,
"learning_rate": 8.882289394539535e-06,
"loss": 0.1346,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06690150499343872,
"step": 4550,
"valid_targets_mean": 6763.6,
"valid_targets_min": 2844
},
{
"epoch": 5.038738240177089,
"grad_norm": 0.21931906805649626,
"learning_rate": 8.836476137749385e-06,
"loss": 0.1432,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07438153773546219,
"step": 4555,
"valid_targets_mean": 6678.9,
"valid_targets_min": 2465
},
{
"epoch": 5.044272274488102,
"grad_norm": 0.20586807991514844,
"learning_rate": 8.790747809434455e-06,
"loss": 0.138,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06708905845880508,
"step": 4560,
"valid_targets_mean": 7128.3,
"valid_targets_min": 2482
},
{
"epoch": 5.0498063087991145,
"grad_norm": 0.2325373502097837,
"learning_rate": 8.745104757481046e-06,
"loss": 0.1315,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06491201370954514,
"step": 4565,
"valid_targets_mean": 6365.0,
"valid_targets_min": 1594
},
{
"epoch": 5.055340343110127,
"grad_norm": 0.28916764748195456,
"learning_rate": 8.699547329126736e-06,
"loss": 0.1331,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06788638234138489,
"step": 4570,
"valid_targets_mean": 6929.4,
"valid_targets_min": 2099
},
{
"epoch": 5.06087437742114,
"grad_norm": 0.25615559212069233,
"learning_rate": 8.654075870957676e-06,
"loss": 0.1341,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05642274022102356,
"step": 4575,
"valid_targets_mean": 6168.6,
"valid_targets_min": 1277
},
{
"epoch": 5.066408411732152,
"grad_norm": 0.2691284143249438,
"learning_rate": 8.608690728906004e-06,
"loss": 0.1324,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06038684770464897,
"step": 4580,
"valid_targets_mean": 6729.7,
"valid_targets_min": 2910
},
{
"epoch": 5.071942446043165,
"grad_norm": 0.2751600219231519,
"learning_rate": 8.563392248247193e-06,
"loss": 0.1336,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06257107108831406,
"step": 4585,
"valid_targets_mean": 6594.8,
"valid_targets_min": 1941
},
{
"epoch": 5.0774764803541785,
"grad_norm": 0.250400668036176,
"learning_rate": 8.518180773597406e-06,
"loss": 0.1345,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.062037717550992966,
"step": 4590,
"valid_targets_mean": 6777.4,
"valid_targets_min": 2598
},
{
"epoch": 5.083010514665191,
"grad_norm": 0.23213367037483715,
"learning_rate": 8.473056648910909e-06,
"loss": 0.1263,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.061457958072423935,
"step": 4595,
"valid_targets_mean": 6707.7,
"valid_targets_min": 2313
},
{
"epoch": 5.088544548976204,
"grad_norm": 0.24681629870719266,
"learning_rate": 8.428020217477435e-06,
"loss": 0.1269,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06621939688920975,
"step": 4600,
"valid_targets_mean": 7161.9,
"valid_targets_min": 1638
},
{
"epoch": 5.094078583287216,
"grad_norm": 0.22011790924248184,
"learning_rate": 8.383071821919581e-06,
"loss": 0.1316,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06517525762319565,
"step": 4605,
"valid_targets_mean": 7025.5,
"valid_targets_min": 3109
},
{
"epoch": 5.099612617598229,
"grad_norm": 0.2308272738760395,
"learning_rate": 8.338211804190171e-06,
"loss": 0.1307,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06220779940485954,
"step": 4610,
"valid_targets_mean": 6895.4,
"valid_targets_min": 2040
},
{
"epoch": 5.105146651909242,
"grad_norm": 0.2519594431488911,
"learning_rate": 8.293440505569702e-06,
"loss": 0.1234,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06370244175195694,
"step": 4615,
"valid_targets_mean": 6505.2,
"valid_targets_min": 2623
},
{
"epoch": 5.110680686220254,
"grad_norm": 0.23678060362713865,
"learning_rate": 8.248758266663732e-06,
"loss": 0.1198,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06401697546243668,
"step": 4620,
"valid_targets_mean": 6831.8,
"valid_targets_min": 2450
},
{
"epoch": 5.116214720531267,
"grad_norm": 0.2512630049931684,
"learning_rate": 8.204165427400248e-06,
"loss": 0.1222,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05943406745791435,
"step": 4625,
"valid_targets_mean": 6923.1,
"valid_targets_min": 3116
},
{
"epoch": 5.12174875484228,
"grad_norm": 0.262980975137919,
"learning_rate": 8.159662327027143e-06,
"loss": 0.1207,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.051256000995635986,
"step": 4630,
"valid_targets_mean": 6147.5,
"valid_targets_min": 2014
},
{
"epoch": 5.127282789153293,
"grad_norm": 0.25330742312270843,
"learning_rate": 8.115249304109596e-06,
"loss": 0.1201,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.062148112803697586,
"step": 4635,
"valid_targets_mean": 6990.4,
"valid_targets_min": 2412
},
{
"epoch": 5.132816823464306,
"grad_norm": 0.23882554511618578,
"learning_rate": 8.070926696527512e-06,
"loss": 0.1168,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.058880433440208435,
"step": 4640,
"valid_targets_mean": 6798.5,
"valid_targets_min": 2824
},
{
"epoch": 5.138350857775318,
"grad_norm": 0.31616935487527625,
"learning_rate": 8.026694841472929e-06,
"loss": 0.119,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05718575045466423,
"step": 4645,
"valid_targets_mean": 7045.3,
"valid_targets_min": 2530
},
{
"epoch": 5.143884892086331,
"grad_norm": 0.2323324300764862,
"learning_rate": 7.982554075447482e-06,
"loss": 0.1217,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05392269790172577,
"step": 4650,
"valid_targets_mean": 6538.4,
"valid_targets_min": 1802
},
{
"epoch": 5.1494189263973436,
"grad_norm": 0.26192731565345284,
"learning_rate": 7.938504734259836e-06,
"loss": 0.1183,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0585092194378376,
"step": 4655,
"valid_targets_mean": 6699.4,
"valid_targets_min": 2155
},
{
"epoch": 5.154952960708356,
"grad_norm": 0.27065708663094357,
"learning_rate": 7.894547153023104e-06,
"loss": 0.1099,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.052169669419527054,
"step": 4660,
"valid_targets_mean": 6332.6,
"valid_targets_min": 2295
},
{
"epoch": 5.160486995019369,
"grad_norm": 0.2792905073585824,
"learning_rate": 7.850681666152348e-06,
"loss": 0.1185,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06055386736989021,
"step": 4665,
"valid_targets_mean": 6915.4,
"valid_targets_min": 1863
},
{
"epoch": 5.166021029330381,
"grad_norm": 0.26818560060554336,
"learning_rate": 7.806908607361975e-06,
"loss": 0.117,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05585666000843048,
"step": 4670,
"valid_targets_mean": 6859.3,
"valid_targets_min": 1842
},
{
"epoch": 5.171555063641395,
"grad_norm": 0.24361678510373205,
"learning_rate": 7.763228309663249e-06,
"loss": 0.1161,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05813150480389595,
"step": 4675,
"valid_targets_mean": 6832.0,
"valid_targets_min": 2689
},
{
"epoch": 5.177089097952408,
"grad_norm": 0.25066633263052085,
"learning_rate": 7.719641105361734e-06,
"loss": 0.1186,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05950310826301575,
"step": 4680,
"valid_targets_mean": 6902.6,
"valid_targets_min": 2882
},
{
"epoch": 5.18262313226342,
"grad_norm": 0.2379735265243224,
"learning_rate": 7.676147326054777e-06,
"loss": 0.1167,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04992043972015381,
"step": 4685,
"valid_targets_mean": 6325.6,
"valid_targets_min": 1950
},
{
"epoch": 5.188157166574433,
"grad_norm": 0.23783821622074944,
"learning_rate": 7.632747302628955e-06,
"loss": 0.1181,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05535200610756874,
"step": 4690,
"valid_targets_mean": 7014.8,
"valid_targets_min": 2827
},
{
"epoch": 5.1936912008854454,
"grad_norm": 0.2536124353503241,
"learning_rate": 7.589441365257602e-06,
"loss": 0.1175,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.059621792286634445,
"step": 4695,
"valid_targets_mean": 6979.4,
"valid_targets_min": 2777
},
{
"epoch": 5.199225235196458,
"grad_norm": 0.2624400473065704,
"learning_rate": 7.546229843398271e-06,
"loss": 0.114,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05143032595515251,
"step": 4700,
"valid_targets_mean": 6767.5,
"valid_targets_min": 2923
},
{
"epoch": 5.204759269507471,
"grad_norm": 0.23777881827254418,
"learning_rate": 7.503113065790222e-06,
"loss": 0.1187,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05865449085831642,
"step": 4705,
"valid_targets_mean": 6852.5,
"valid_targets_min": 2299
},
{
"epoch": 5.210293303818483,
"grad_norm": 0.2662602707599381,
"learning_rate": 7.4600913604519445e-06,
"loss": 0.1174,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.056671250611543655,
"step": 4710,
"valid_targets_mean": 6578.0,
"valid_targets_min": 1726
},
{
"epoch": 5.215827338129497,
"grad_norm": 0.25881459566492687,
"learning_rate": 7.417165054678643e-06,
"loss": 0.1156,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05237901210784912,
"step": 4715,
"valid_targets_mean": 6188.8,
"valid_targets_min": 2385
},
{
"epoch": 5.2213613724405095,
"grad_norm": 0.2578321461673644,
"learning_rate": 7.374334475039762e-06,
"loss": 0.1161,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05409706011414528,
"step": 4720,
"valid_targets_mean": 6247.0,
"valid_targets_min": 1759
},
{
"epoch": 5.226895406751522,
"grad_norm": 0.3264457151684806,
"learning_rate": 7.331599947376471e-06,
"loss": 0.1032,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04035346210002899,
"step": 4725,
"valid_targets_mean": 3846.9,
"valid_targets_min": 1635
},
{
"epoch": 5.232429441062535,
"grad_norm": 0.40942657277044675,
"learning_rate": 7.2889617967992255e-06,
"loss": 0.084,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04189052805304527,
"step": 4730,
"valid_targets_mean": 4104.0,
"valid_targets_min": 1728
},
{
"epoch": 5.237963475373547,
"grad_norm": 0.41042956707091544,
"learning_rate": 7.246420347685279e-06,
"loss": 0.0951,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06203579530119896,
"step": 4735,
"valid_targets_mean": 5437.0,
"valid_targets_min": 2245
},
{
"epoch": 5.24349750968456,
"grad_norm": 0.3061378279333753,
"learning_rate": 7.203975923676187e-06,
"loss": 0.0966,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.044795963913202286,
"step": 4740,
"valid_targets_mean": 4097.2,
"valid_targets_min": 1379
},
{
"epoch": 5.249031543995573,
"grad_norm": 0.2914998837573403,
"learning_rate": 7.161628847675404e-06,
"loss": 0.0912,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04384605959057808,
"step": 4745,
"valid_targets_mean": 4265.5,
"valid_targets_min": 1788
},
{
"epoch": 5.254565578306585,
"grad_norm": 0.30376807330939326,
"learning_rate": 7.119379441845755e-06,
"loss": 0.0981,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04657572880387306,
"step": 4750,
"valid_targets_mean": 4447.0,
"valid_targets_min": 1177
},
{
"epoch": 5.260099612617598,
"grad_norm": 0.3306816287024313,
"learning_rate": 7.077228027607051e-06,
"loss": 0.1066,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.047103408724069595,
"step": 4755,
"valid_targets_mean": 4379.6,
"valid_targets_min": 1555
},
{
"epoch": 5.265633646928611,
"grad_norm": 0.3191925419611457,
"learning_rate": 7.035174925633601e-06,
"loss": 0.1048,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06188632547855377,
"step": 4760,
"valid_targets_mean": 5404.9,
"valid_targets_min": 1590
},
{
"epoch": 5.271167681239624,
"grad_norm": 0.27568048786242777,
"learning_rate": 6.993220455851793e-06,
"loss": 0.0967,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.044619277119636536,
"step": 4765,
"valid_targets_mean": 4231.8,
"valid_targets_min": 1726
},
{
"epoch": 5.276701715550637,
"grad_norm": 0.2681799337705664,
"learning_rate": 6.9513649374376545e-06,
"loss": 0.094,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05106706544756889,
"step": 4770,
"valid_targets_mean": 4803.9,
"valid_targets_min": 1700
},
{
"epoch": 5.282235749861649,
"grad_norm": 0.298973414328357,
"learning_rate": 6.909608688814406e-06,
"loss": 0.098,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.044636014848947525,
"step": 4775,
"valid_targets_mean": 3728.0,
"valid_targets_min": 1113
},
{
"epoch": 5.287769784172662,
"grad_norm": 0.28881994899588387,
"learning_rate": 6.867952027650082e-06,
"loss": 0.1071,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06730066984891891,
"step": 4780,
"valid_targets_mean": 5108.4,
"valid_targets_min": 1637
},
{
"epoch": 5.2933038184836745,
"grad_norm": 0.30289762439677825,
"learning_rate": 6.82639527085506e-06,
"loss": 0.099,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04290211200714111,
"step": 4785,
"valid_targets_mean": 4185.0,
"valid_targets_min": 2178
},
{
"epoch": 5.298837852794687,
"grad_norm": 0.25043690090210174,
"learning_rate": 6.784938734579696e-06,
"loss": 0.0989,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.045655298978090286,
"step": 4790,
"valid_targets_mean": 4341.5,
"valid_targets_min": 1581
},
{
"epoch": 5.3043718871057,
"grad_norm": 0.305794362107919,
"learning_rate": 6.7435827342118975e-06,
"loss": 0.094,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.051216140389442444,
"step": 4795,
"valid_targets_mean": 4570.1,
"valid_targets_min": 1677
},
{
"epoch": 5.309905921416712,
"grad_norm": 0.3031531972220382,
"learning_rate": 6.702327584374733e-06,
"loss": 0.097,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05147046968340874,
"step": 4800,
"valid_targets_mean": 4621.4,
"valid_targets_min": 1831
},
{
"epoch": 5.315439955727726,
"grad_norm": 0.3162091598967438,
"learning_rate": 6.661173598924009e-06,
"loss": 0.0995,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05728279426693916,
"step": 4805,
"valid_targets_mean": 4701.1,
"valid_targets_min": 1892
},
{
"epoch": 5.3209739900387385,
"grad_norm": 0.27126503376359495,
"learning_rate": 6.620121090945932e-06,
"loss": 0.0926,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04581926390528679,
"step": 4810,
"valid_targets_mean": 4210.5,
"valid_targets_min": 1282
},
{
"epoch": 5.326508024349751,
"grad_norm": 0.2692516343928811,
"learning_rate": 6.5791703727547e-06,
"loss": 0.0936,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0382157638669014,
"step": 4815,
"valid_targets_mean": 4092.7,
"valid_targets_min": 1552
},
{
"epoch": 5.332042058660764,
"grad_norm": 0.3396002792680986,
"learning_rate": 6.538321755890103e-06,
"loss": 0.0975,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04399949684739113,
"step": 4820,
"valid_targets_mean": 3938.2,
"valid_targets_min": 1518
},
{
"epoch": 5.337576092971776,
"grad_norm": 0.29307725564948145,
"learning_rate": 6.497575551115205e-06,
"loss": 0.0998,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04623451828956604,
"step": 4825,
"valid_targets_mean": 3866.6,
"valid_targets_min": 1939
},
{
"epoch": 5.343110127282789,
"grad_norm": 0.28264014387665437,
"learning_rate": 6.456932068413928e-06,
"loss": 0.0987,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04547819495201111,
"step": 4830,
"valid_targets_mean": 4178.5,
"valid_targets_min": 1919
},
{
"epoch": 5.348644161593802,
"grad_norm": 0.3035715825727704,
"learning_rate": 6.416391616988735e-06,
"loss": 0.098,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05045393109321594,
"step": 4835,
"valid_targets_mean": 4422.5,
"valid_targets_min": 1519
},
{
"epoch": 5.354178195904814,
"grad_norm": 0.2996643875725543,
"learning_rate": 6.3759545052582596e-06,
"loss": 0.0972,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05186879634857178,
"step": 4840,
"valid_targets_mean": 4715.8,
"valid_targets_min": 1890
},
{
"epoch": 5.359712230215827,
"grad_norm": 0.27842839335332986,
"learning_rate": 6.335621040854949e-06,
"loss": 0.0953,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04677329584956169,
"step": 4845,
"valid_targets_mean": 4308.6,
"valid_targets_min": 1797
},
{
"epoch": 5.36524626452684,
"grad_norm": 0.2728960533899608,
"learning_rate": 6.295391530622754e-06,
"loss": 0.0961,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04513225331902504,
"step": 4850,
"valid_targets_mean": 4429.0,
"valid_targets_min": 1563
},
{
"epoch": 5.370780298837853,
"grad_norm": 0.2930308558837003,
"learning_rate": 6.255266280614747e-06,
"loss": 0.0987,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0623805969953537,
"step": 4855,
"valid_targets_mean": 4832.3,
"valid_targets_min": 1789
},
{
"epoch": 5.376314333148866,
"grad_norm": 0.2809054803196358,
"learning_rate": 6.215245596090853e-06,
"loss": 0.0929,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04654247686266899,
"step": 4860,
"valid_targets_mean": 4335.4,
"valid_targets_min": 1729
},
{
"epoch": 5.381848367459878,
"grad_norm": 0.26481027178759486,
"learning_rate": 6.1753297815154716e-06,
"loss": 0.0886,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03547029569745064,
"step": 4865,
"valid_targets_mean": 3609.3,
"valid_targets_min": 1651
},
{
"epoch": 5.387382401770891,
"grad_norm": 0.27745340499226884,
"learning_rate": 6.135519140555199e-06,
"loss": 0.0875,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04294551536440849,
"step": 4870,
"valid_targets_mean": 4319.0,
"valid_targets_min": 1420
},
{
"epoch": 5.3929164360819035,
"grad_norm": 0.30288204365953497,
"learning_rate": 6.0958139760765074e-06,
"loss": 0.0921,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04404045268893242,
"step": 4875,
"valid_targets_mean": 4539.0,
"valid_targets_min": 1855
},
{
"epoch": 5.398450470392916,
"grad_norm": 0.3005477264174116,
"learning_rate": 6.05621459014343e-06,
"loss": 0.0975,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.052519965916872025,
"step": 4880,
"valid_targets_mean": 4650.9,
"valid_targets_min": 1295
},
{
"epoch": 5.403984504703929,
"grad_norm": 0.2588205344702586,
"learning_rate": 6.016721284015281e-06,
"loss": 0.0935,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.041075099259614944,
"step": 4885,
"valid_targets_mean": 3957.8,
"valid_targets_min": 1401
},
{
"epoch": 5.409518539014942,
"grad_norm": 0.26904245923876685,
"learning_rate": 5.977334358144335e-06,
"loss": 0.0902,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04499991610646248,
"step": 4890,
"valid_targets_mean": 4258.2,
"valid_targets_min": 1375
},
{
"epoch": 5.415052573325955,
"grad_norm": 0.27780104929993793,
"learning_rate": 5.938054112173585e-06,
"loss": 0.0937,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04547039791941643,
"step": 4895,
"valid_targets_mean": 4293.1,
"valid_targets_min": 1932
},
{
"epoch": 5.4205866076369675,
"grad_norm": 0.2835969799258284,
"learning_rate": 5.898880844934411e-06,
"loss": 0.0854,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.042660683393478394,
"step": 4900,
"valid_targets_mean": 4114.5,
"valid_targets_min": 1761
},
{
"epoch": 5.42612064194798,
"grad_norm": 0.26809629928124185,
"learning_rate": 5.859814854444361e-06,
"loss": 0.0825,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04189951717853546,
"step": 4905,
"valid_targets_mean": 4430.8,
"valid_targets_min": 2314
},
{
"epoch": 5.431654676258993,
"grad_norm": 0.3033668506817014,
"learning_rate": 5.820856437904829e-06,
"loss": 0.0893,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04731345176696777,
"step": 4910,
"valid_targets_mean": 4497.4,
"valid_targets_min": 1599
},
{
"epoch": 5.437188710570005,
"grad_norm": 0.27894467946557433,
"learning_rate": 5.782005891698843e-06,
"loss": 0.0889,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04985889792442322,
"step": 4915,
"valid_targets_mean": 4274.5,
"valid_targets_min": 1618
},
{
"epoch": 5.442722744881018,
"grad_norm": 0.2610829057581517,
"learning_rate": 5.743263511388777e-06,
"loss": 0.0866,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.043534595519304276,
"step": 4920,
"valid_targets_mean": 4277.4,
"valid_targets_min": 1851
},
{
"epoch": 5.448256779192031,
"grad_norm": 0.2814480946363349,
"learning_rate": 5.704629591714119e-06,
"loss": 0.0845,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04236781597137451,
"step": 4925,
"valid_targets_mean": 4469.7,
"valid_targets_min": 1871
},
{
"epoch": 5.453790813503044,
"grad_norm": 0.28196491095765974,
"learning_rate": 5.666104426589227e-06,
"loss": 0.0902,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.045051101595163345,
"step": 4930,
"valid_targets_mean": 4527.5,
"valid_targets_min": 1453
},
{
"epoch": 5.459324847814057,
"grad_norm": 0.2793798119184077,
"learning_rate": 5.627688309101074e-06,
"loss": 0.0941,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04612480476498604,
"step": 4935,
"valid_targets_mean": 4689.2,
"valid_targets_min": 1243
},
{
"epoch": 5.464858882125069,
"grad_norm": 0.2527466996252714,
"learning_rate": 5.5893815315070545e-06,
"loss": 0.088,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03624003753066063,
"step": 4940,
"valid_targets_mean": 4317.8,
"valid_targets_min": 1812
},
{
"epoch": 5.470392916436082,
"grad_norm": 0.2548369389008775,
"learning_rate": 5.551184385232717e-06,
"loss": 0.0842,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03714959695935249,
"step": 4945,
"valid_targets_mean": 5641.1,
"valid_targets_min": 2296
},
{
"epoch": 5.475926950747095,
"grad_norm": 0.26918984483077724,
"learning_rate": 5.513097160869594e-06,
"loss": 0.0926,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04826346039772034,
"step": 4950,
"valid_targets_mean": 5349.0,
"valid_targets_min": 2050
},
{
"epoch": 5.481460985058107,
"grad_norm": 0.22898992837192203,
"learning_rate": 5.475120148172952e-06,
"loss": 0.1016,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0547969788312912,
"step": 4955,
"valid_targets_mean": 5783.2,
"valid_targets_min": 1845
},
{
"epoch": 5.48699501936912,
"grad_norm": 0.20835361008156356,
"learning_rate": 5.4372536360596095e-06,
"loss": 0.0899,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05061693117022514,
"step": 4960,
"valid_targets_mean": 5767.9,
"valid_targets_min": 2653
},
{
"epoch": 5.4925290536801326,
"grad_norm": 0.3263923310676471,
"learning_rate": 5.39949791260574e-06,
"loss": 0.0929,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04884323105216026,
"step": 4965,
"valid_targets_mean": 5619.5,
"valid_targets_min": 2023
},
{
"epoch": 5.498063087991145,
"grad_norm": 0.18223012730725743,
"learning_rate": 5.36185326504465e-06,
"loss": 0.0859,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.043797388672828674,
"step": 4970,
"valid_targets_mean": 5253.8,
"valid_targets_min": 1239
},
{
"epoch": 5.503597122302159,
"grad_norm": 0.17208167859721404,
"learning_rate": 5.324319979764638e-06,
"loss": 0.079,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.041199374943971634,
"step": 4975,
"valid_targets_mean": 5506.8,
"valid_targets_min": 2598
},
{
"epoch": 5.509131156613171,
"grad_norm": 0.1742427957489206,
"learning_rate": 5.286898342306781e-06,
"loss": 0.0785,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03271806240081787,
"step": 4980,
"valid_targets_mean": 5309.8,
"valid_targets_min": 2443
},
{
"epoch": 5.514665190924184,
"grad_norm": 0.19408572897818147,
"learning_rate": 5.24958863736279e-06,
"loss": 0.0746,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05028039216995239,
"step": 4985,
"valid_targets_mean": 5868.3,
"valid_targets_min": 2497
},
{
"epoch": 5.520199225235197,
"grad_norm": 0.1883711835145652,
"learning_rate": 5.212391148772808e-06,
"loss": 0.0752,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.035246167331933975,
"step": 4990,
"valid_targets_mean": 5761.6,
"valid_targets_min": 2096
},
{
"epoch": 5.525733259546209,
"grad_norm": 0.20122322848305024,
"learning_rate": 5.175306159523292e-06,
"loss": 0.0788,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04153045266866684,
"step": 4995,
"valid_targets_mean": 5816.0,
"valid_targets_min": 2258
},
{
"epoch": 5.531267293857222,
"grad_norm": 0.1877338847041848,
"learning_rate": 5.138333951744834e-06,
"loss": 0.0738,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.040626995265483856,
"step": 5000,
"valid_targets_mean": 5984.8,
"valid_targets_min": 2264
},
{
"epoch": 5.5368013281682344,
"grad_norm": 0.18575057786697535,
"learning_rate": 5.101474806710018e-06,
"loss": 0.0701,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03857755288481712,
"step": 5005,
"valid_targets_mean": 5711.8,
"valid_targets_min": 2394
},
{
"epoch": 5.542335362479247,
"grad_norm": 0.1937292314638601,
"learning_rate": 5.064729004831297e-06,
"loss": 0.0701,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0389263816177845,
"step": 5010,
"valid_targets_mean": 5680.3,
"valid_targets_min": 2487
},
{
"epoch": 5.54786939679026,
"grad_norm": 0.19161248239894565,
"learning_rate": 5.028096825658817e-06,
"loss": 0.0656,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03286981210112572,
"step": 5015,
"valid_targets_mean": 5869.9,
"valid_targets_min": 2655
},
{
"epoch": 5.553403431101273,
"grad_norm": 0.1803407447825603,
"learning_rate": 4.991578547878353e-06,
"loss": 0.0662,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03436180204153061,
"step": 5020,
"valid_targets_mean": 5479.9,
"valid_targets_min": 2153
},
{
"epoch": 5.558937465412286,
"grad_norm": 0.1926916620778669,
"learning_rate": 4.955174449309126e-06,
"loss": 0.068,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03226090595126152,
"step": 5025,
"valid_targets_mean": 5297.5,
"valid_targets_min": 1932
},
{
"epoch": 5.5644714997232985,
"grad_norm": 0.17699772829970112,
"learning_rate": 4.918884806901736e-06,
"loss": 0.0661,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02836117148399353,
"step": 5030,
"valid_targets_mean": 5783.3,
"valid_targets_min": 944
},
{
"epoch": 5.570005534034311,
"grad_norm": 0.18361638296491878,
"learning_rate": 4.882709896736035e-06,
"loss": 0.064,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.029991939663887024,
"step": 5035,
"valid_targets_mean": 5570.2,
"valid_targets_min": 2844
},
{
"epoch": 5.575539568345324,
"grad_norm": 0.19332970772301838,
"learning_rate": 4.846649994019028e-06,
"loss": 0.0646,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.030482301488518715,
"step": 5040,
"valid_targets_mean": 5753.7,
"valid_targets_min": 2045
},
{
"epoch": 5.581073602656336,
"grad_norm": 0.1802565765077648,
"learning_rate": 4.810705373082785e-06,
"loss": 0.0672,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03281958028674126,
"step": 5045,
"valid_targets_mean": 5353.3,
"valid_targets_min": 2316
},
{
"epoch": 5.586607636967349,
"grad_norm": 0.18209674554957742,
"learning_rate": 4.77487630738233e-06,
"loss": 0.0659,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03288013115525246,
"step": 5050,
"valid_targets_mean": 5618.7,
"valid_targets_min": 2144
},
{
"epoch": 5.592141671278362,
"grad_norm": 0.19378510164029844,
"learning_rate": 4.739163069493611e-06,
"loss": 0.064,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03251936659216881,
"step": 5055,
"valid_targets_mean": 5338.1,
"valid_targets_min": 1731
},
{
"epoch": 5.597675705589374,
"grad_norm": 0.1904853135186227,
"learning_rate": 4.7035659311113665e-06,
"loss": 0.0621,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.035014282912015915,
"step": 5060,
"valid_targets_mean": 5883.8,
"valid_targets_min": 2583
},
{
"epoch": 5.603209739900388,
"grad_norm": 0.17577557424938922,
"learning_rate": 4.668085163047109e-06,
"loss": 0.0605,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.029335923492908478,
"step": 5065,
"valid_targets_mean": 5300.8,
"valid_targets_min": 1973
},
{
"epoch": 5.6087437742114,
"grad_norm": 0.1927824160022825,
"learning_rate": 4.632721035227028e-06,
"loss": 0.0633,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03788955882191658,
"step": 5070,
"valid_targets_mean": 5928.1,
"valid_targets_min": 3227
},
{
"epoch": 5.614277808522413,
"grad_norm": 0.19769655833056504,
"learning_rate": 4.597473816689959e-06,
"loss": 0.0641,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.032567158341407776,
"step": 5075,
"valid_targets_mean": 5923.1,
"valid_targets_min": 2392
},
{
"epoch": 5.619811842833426,
"grad_norm": 0.17335162190475464,
"learning_rate": 4.562343775585334e-06,
"loss": 0.0609,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.026050040498375893,
"step": 5080,
"valid_targets_mean": 5607.5,
"valid_targets_min": 1927
},
{
"epoch": 5.625345877144438,
"grad_norm": 0.1927394890214593,
"learning_rate": 4.5273311791711265e-06,
"loss": 0.0576,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.033131640404462814,
"step": 5085,
"valid_targets_mean": 5891.4,
"valid_targets_min": 1659
},
{
"epoch": 5.630879911455451,
"grad_norm": 0.17771864942156337,
"learning_rate": 4.492436293811844e-06,
"loss": 0.0599,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.032288823276758194,
"step": 5090,
"valid_targets_mean": 5810.3,
"valid_targets_min": 2797
},
{
"epoch": 5.6364139457664635,
"grad_norm": 0.19154573618071724,
"learning_rate": 4.457659384976463e-06,
"loss": 0.0576,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03311631456017494,
"step": 5095,
"valid_targets_mean": 5845.2,
"valid_targets_min": 2085
},
{
"epoch": 5.641947980077476,
"grad_norm": 0.17290736570454462,
"learning_rate": 4.423000717236458e-06,
"loss": 0.0602,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.026159053668379784,
"step": 5100,
"valid_targets_mean": 5777.4,
"valid_targets_min": 2375
},
{
"epoch": 5.647482014388489,
"grad_norm": 0.1682909452754771,
"learning_rate": 4.388460554263743e-06,
"loss": 0.0601,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.028254443779587746,
"step": 5105,
"valid_targets_mean": 5355.5,
"valid_targets_min": 1462
},
{
"epoch": 5.653016048699502,
"grad_norm": 0.16940272629745565,
"learning_rate": 4.354039158828698e-06,
"loss": 0.0536,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0268237367272377,
"step": 5110,
"valid_targets_mean": 5619.6,
"valid_targets_min": 2248
},
{
"epoch": 5.658550083010515,
"grad_norm": 0.20684182065746543,
"learning_rate": 4.319736792798157e-06,
"loss": 0.0571,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03059101104736328,
"step": 5115,
"valid_targets_mean": 5980.5,
"valid_targets_min": 2300
},
{
"epoch": 5.6640841173215275,
"grad_norm": 0.20355768534181248,
"learning_rate": 4.285553717133413e-06,
"loss": 0.0573,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0313802994787693,
"step": 5120,
"valid_targets_mean": 5847.6,
"valid_targets_min": 3518
},
{
"epoch": 5.66961815163254,
"grad_norm": 0.17795362801982467,
"learning_rate": 4.251490191888246e-06,
"loss": 0.0554,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.025926783680915833,
"step": 5125,
"valid_targets_mean": 5279.1,
"valid_targets_min": 2145
},
{
"epoch": 5.675152185943553,
"grad_norm": 0.19984037968820786,
"learning_rate": 4.217546476206915e-06,
"loss": 0.0583,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03138670697808266,
"step": 5130,
"valid_targets_mean": 5963.4,
"valid_targets_min": 1785
},
{
"epoch": 5.680686220254565,
"grad_norm": 0.2050104885169466,
"learning_rate": 4.183722828322232e-06,
"loss": 0.0575,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03241662308573723,
"step": 5135,
"valid_targets_mean": 5615.0,
"valid_targets_min": 1880
},
{
"epoch": 5.686220254565578,
"grad_norm": 0.1790320457867811,
"learning_rate": 4.150019505553546e-06,
"loss": 0.0551,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.024099178612232208,
"step": 5140,
"valid_targets_mean": 5902.0,
"valid_targets_min": 2804
},
{
"epoch": 5.6917542888765915,
"grad_norm": 0.1748063463819483,
"learning_rate": 4.116436764304832e-06,
"loss": 0.0526,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.027424706146121025,
"step": 5145,
"valid_targets_mean": 5319.6,
"valid_targets_min": 2528
},
{
"epoch": 5.697288323187604,
"grad_norm": 0.1782024377321046,
"learning_rate": 4.082974860062718e-06,
"loss": 0.0556,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.026081182062625885,
"step": 5150,
"valid_targets_mean": 5529.9,
"valid_targets_min": 2824
},
{
"epoch": 5.702822357498617,
"grad_norm": 0.177274788200606,
"learning_rate": 4.0496340473945264e-06,
"loss": 0.0509,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.024925321340560913,
"step": 5155,
"valid_targets_mean": 5210.4,
"valid_targets_min": 2273
},
{
"epoch": 5.708356391809629,
"grad_norm": 0.19751307017113642,
"learning_rate": 4.0164145799463686e-06,
"loss": 0.0518,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.027725854888558388,
"step": 5160,
"valid_targets_mean": 5708.2,
"valid_targets_min": 2025
},
{
"epoch": 5.713890426120642,
"grad_norm": 0.1837401122379636,
"learning_rate": 3.983316710441203e-06,
"loss": 0.0518,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.024004802107810974,
"step": 5165,
"valid_targets_mean": 5535.9,
"valid_targets_min": 2354
},
{
"epoch": 5.719424460431655,
"grad_norm": 0.190406571209415,
"learning_rate": 3.950340690676904e-06,
"loss": 0.0547,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.028329044580459595,
"step": 5170,
"valid_targets_mean": 5587.0,
"valid_targets_min": 2655
},
{
"epoch": 5.724958494742667,
"grad_norm": 0.1949683903785584,
"learning_rate": 3.917486771524348e-06,
"loss": 0.0538,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02764093317091465,
"step": 5175,
"valid_targets_mean": 5726.0,
"valid_targets_min": 1536
},
{
"epoch": 5.73049252905368,
"grad_norm": 0.18363803990275362,
"learning_rate": 3.884755202925523e-06,
"loss": 0.0535,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.026779597625136375,
"step": 5180,
"valid_targets_mean": 5276.6,
"valid_targets_min": 1725
},
{
"epoch": 5.7360265633646925,
"grad_norm": 0.1923047283339151,
"learning_rate": 3.852146233891598e-06,
"loss": 0.0539,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.025118621066212654,
"step": 5185,
"valid_targets_mean": 4917.2,
"valid_targets_min": 1306
},
{
"epoch": 5.741560597675706,
"grad_norm": 0.18362331997004988,
"learning_rate": 3.819660112501053e-06,
"loss": 0.0523,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.025888383388519287,
"step": 5190,
"valid_targets_mean": 5920.3,
"valid_targets_min": 2692
},
{
"epoch": 5.747094631986719,
"grad_norm": 0.19299061576096796,
"learning_rate": 3.787297085897783e-06,
"loss": 0.0536,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.026169372722506523,
"step": 5195,
"valid_targets_mean": 5935.9,
"valid_targets_min": 2414
},
{
"epoch": 5.752628666297731,
"grad_norm": 0.1934208644361245,
"learning_rate": 3.7550574002892193e-06,
"loss": 0.057,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02640332095324993,
"step": 5200,
"valid_targets_mean": 5286.9,
"valid_targets_min": 1052
},
{
"epoch": 5.758162700608744,
"grad_norm": 0.28244689860994376,
"learning_rate": 3.722941300944454e-06,
"loss": 0.0706,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03444273769855499,
"step": 5205,
"valid_targets_mean": 4064.5,
"valid_targets_min": 2223
},
{
"epoch": 5.7636967349197565,
"grad_norm": 0.296330254238661,
"learning_rate": 3.6909490321923634e-06,
"loss": 0.073,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03813193738460541,
"step": 5210,
"valid_targets_mean": 4034.0,
"valid_targets_min": 1203
},
{
"epoch": 5.769230769230769,
"grad_norm": 0.3122974913435053,
"learning_rate": 3.6590808374197816e-06,
"loss": 0.0721,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.036831844598054886,
"step": 5215,
"valid_targets_mean": 4315.0,
"valid_targets_min": 1773
},
{
"epoch": 5.774764803541782,
"grad_norm": 0.2718515044346279,
"learning_rate": 3.627336959069605e-06,
"loss": 0.0772,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04120616614818573,
"step": 5220,
"valid_targets_mean": 4799.0,
"valid_targets_min": 1603
},
{
"epoch": 5.780298837852794,
"grad_norm": 0.24395973721925102,
"learning_rate": 3.5957176386389893e-06,
"loss": 0.0775,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04204801842570305,
"step": 5225,
"valid_targets_mean": 4921.9,
"valid_targets_min": 1695
},
{
"epoch": 5.785832872163807,
"grad_norm": 0.24764045579431937,
"learning_rate": 3.5642231166774897e-06,
"loss": 0.0749,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.039783138781785965,
"step": 5230,
"valid_targets_mean": 4232.0,
"valid_targets_min": 1416
},
{
"epoch": 5.7913669064748206,
"grad_norm": 0.3306174867366802,
"learning_rate": 3.532853632785227e-06,
"loss": 0.0721,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0378490649163723,
"step": 5235,
"valid_targets_mean": 7718.0,
"valid_targets_min": 1254
},
{
"epoch": 5.796900940785833,
"grad_norm": 0.32124352248548405,
"learning_rate": 3.501609425611079e-06,
"loss": 0.0788,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.040089331567287445,
"step": 5240,
"valid_targets_mean": 7411.9,
"valid_targets_min": 1367
},
{
"epoch": 5.802434975096846,
"grad_norm": 0.2691272435692972,
"learning_rate": 3.4704907328508576e-06,
"loss": 0.0803,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.036173637956380844,
"step": 5245,
"valid_targets_mean": 6794.7,
"valid_targets_min": 1002
},
{
"epoch": 5.807969009407858,
"grad_norm": 0.2620356647940023,
"learning_rate": 3.439497791245512e-06,
"loss": 0.086,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0450415201485157,
"step": 5250,
"valid_targets_mean": 7931.0,
"valid_targets_min": 2635
},
{
"epoch": 5.813503043718871,
"grad_norm": 0.22557524289207584,
"learning_rate": 3.408630836579294e-06,
"loss": 0.0842,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03923304006457329,
"step": 5255,
"valid_targets_mean": 7836.5,
"valid_targets_min": 1113
},
{
"epoch": 5.819037078029884,
"grad_norm": 0.2045914134636371,
"learning_rate": 3.3778901036780076e-06,
"loss": 0.0807,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03792804852128029,
"step": 5260,
"valid_targets_mean": 8004.7,
"valid_targets_min": 2354
},
{
"epoch": 5.824571112340896,
"grad_norm": 0.3427586199909158,
"learning_rate": 3.347275826407199e-06,
"loss": 0.1138,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06689509004354477,
"step": 5265,
"valid_targets_mean": 14621.4,
"valid_targets_min": 1121
},
{
"epoch": 5.830105146651909,
"grad_norm": 0.29603497949784,
"learning_rate": 3.3167882376703696e-06,
"loss": 0.1306,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06736762076616287,
"step": 5270,
"valid_targets_mean": 13730.6,
"valid_targets_min": 5627
},
{
"epoch": 5.835639180962922,
"grad_norm": 0.20784944949332113,
"learning_rate": 3.286427569407229e-06,
"loss": 0.1285,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06973903626203537,
"step": 5275,
"valid_targets_mean": 13851.5,
"valid_targets_min": 2420
},
{
"epoch": 5.841173215273935,
"grad_norm": 0.18870880205922533,
"learning_rate": 3.2561940525919124e-06,
"loss": 0.1244,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05548988655209541,
"step": 5280,
"valid_targets_mean": 10187.0,
"valid_targets_min": 4526
},
{
"epoch": 5.846707249584948,
"grad_norm": 0.27156730295517534,
"learning_rate": 3.226087917231231e-06,
"loss": 0.0866,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03967982530593872,
"step": 5285,
"valid_targets_mean": 7247.6,
"valid_targets_min": 1894
},
{
"epoch": 5.85224128389596,
"grad_norm": 0.234889121335806,
"learning_rate": 3.1961093923629028e-06,
"loss": 0.0716,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03272298723459244,
"step": 5290,
"valid_targets_mean": 7225.9,
"valid_targets_min": 1279
},
{
"epoch": 5.857775318206973,
"grad_norm": 0.2709109126040272,
"learning_rate": 3.166258706053855e-06,
"loss": 0.0777,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05472330376505852,
"step": 5295,
"valid_targets_mean": 4795.3,
"valid_targets_min": 1685
},
{
"epoch": 5.863309352517986,
"grad_norm": 0.2507789435309829,
"learning_rate": 3.1365360853984294e-06,
"loss": 0.0965,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04301333427429199,
"step": 5300,
"valid_targets_mean": 4640.0,
"valid_targets_min": 1767
},
{
"epoch": 5.868843386828998,
"grad_norm": 0.24171054349923565,
"learning_rate": 3.106941756516708e-06,
"loss": 0.0853,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03779042512178421,
"step": 5305,
"valid_targets_mean": 4969.9,
"valid_targets_min": 1543
},
{
"epoch": 5.874377421140011,
"grad_norm": 0.23818204523791442,
"learning_rate": 3.077475944552768e-06,
"loss": 0.086,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03676900640130043,
"step": 5310,
"valid_targets_mean": 4724.9,
"valid_targets_min": 1634
},
{
"epoch": 5.8799114554510234,
"grad_norm": 0.2745452909907268,
"learning_rate": 3.0481388736729566e-06,
"loss": 0.0832,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.040772464126348495,
"step": 5315,
"valid_targets_mean": 3955.6,
"valid_targets_min": 1829
},
{
"epoch": 5.885445489762036,
"grad_norm": 0.2716601097234908,
"learning_rate": 3.0189307670642186e-06,
"loss": 0.0844,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05109298229217529,
"step": 5320,
"valid_targets_mean": 5335.9,
"valid_targets_min": 2041
},
{
"epoch": 5.89097952407305,
"grad_norm": 0.28363532790959217,
"learning_rate": 2.9898518469323677e-06,
"loss": 0.0947,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.059856902807950974,
"step": 5325,
"valid_targets_mean": 5668.2,
"valid_targets_min": 1895
},
{
"epoch": 5.896513558384062,
"grad_norm": 0.2885730075923772,
"learning_rate": 2.9609023345004217e-06,
"loss": 0.1012,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.055200595408678055,
"step": 5330,
"valid_targets_mean": 5241.9,
"valid_targets_min": 2052
},
{
"epoch": 5.902047592695075,
"grad_norm": 0.2418413992225755,
"learning_rate": 2.93208245000689e-06,
"loss": 0.1018,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04855811595916748,
"step": 5335,
"valid_targets_mean": 4501.1,
"valid_targets_min": 1859
},
{
"epoch": 5.9075816270060875,
"grad_norm": 0.21570529848712508,
"learning_rate": 2.9033924127041224e-06,
"loss": 0.1041,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04917898774147034,
"step": 5340,
"valid_targets_mean": 5344.1,
"valid_targets_min": 2200
},
{
"epoch": 5.9131156613171,
"grad_norm": 0.23318304045499405,
"learning_rate": 2.8748324408566454e-06,
"loss": 0.1001,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.047095414251089096,
"step": 5345,
"valid_targets_mean": 4667.0,
"valid_targets_min": 2131
},
{
"epoch": 5.918649695628113,
"grad_norm": 0.2213096477089317,
"learning_rate": 2.846402751739463e-06,
"loss": 0.0943,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04613789916038513,
"step": 5350,
"valid_targets_mean": 4774.7,
"valid_targets_min": 1735
},
{
"epoch": 5.924183729939125,
"grad_norm": 0.2155036772624133,
"learning_rate": 2.8181035616364536e-06,
"loss": 0.0958,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.047325681895017624,
"step": 5355,
"valid_targets_mean": 5840.8,
"valid_targets_min": 2338
},
{
"epoch": 5.929717764250138,
"grad_norm": 0.23045482683818375,
"learning_rate": 2.789935085838693e-06,
"loss": 0.0981,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04686537757515907,
"step": 5360,
"valid_targets_mean": 4816.4,
"valid_targets_min": 1674
},
{
"epoch": 5.935251798561151,
"grad_norm": 0.23606907939433505,
"learning_rate": 2.761897538642828e-06,
"loss": 0.0956,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05562064051628113,
"step": 5365,
"valid_targets_mean": 5732.7,
"valid_targets_min": 1854
},
{
"epoch": 5.940785832872164,
"grad_norm": 0.21496323680378623,
"learning_rate": 2.733991133349434e-06,
"loss": 0.095,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.038572560995817184,
"step": 5370,
"valid_targets_mean": 4115.7,
"valid_targets_min": 1512
},
{
"epoch": 5.946319867183177,
"grad_norm": 0.22849226855351992,
"learning_rate": 2.706216082261408e-06,
"loss": 0.0954,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04715319350361824,
"step": 5375,
"valid_targets_mean": 5378.9,
"valid_targets_min": 2469
},
{
"epoch": 5.951853901494189,
"grad_norm": 0.22534943956068945,
"learning_rate": 2.678572596682354e-06,
"loss": 0.0789,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03633340075612068,
"step": 5380,
"valid_targets_mean": 4137.5,
"valid_targets_min": 1891
},
{
"epoch": 5.957387935805202,
"grad_norm": 0.22497875005678122,
"learning_rate": 2.651060886914949e-06,
"loss": 0.0714,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.036558959633111954,
"step": 5385,
"valid_targets_mean": 4230.2,
"valid_targets_min": 1879
},
{
"epoch": 5.962921970116215,
"grad_norm": 0.22473026813893437,
"learning_rate": 2.623681162259386e-06,
"loss": 0.0672,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03210429102182388,
"step": 5390,
"valid_targets_mean": 4060.4,
"valid_targets_min": 1929
},
{
"epoch": 5.968456004427227,
"grad_norm": 0.2688832422929091,
"learning_rate": 2.596433631011732e-06,
"loss": 0.0694,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03812266141176224,
"step": 5395,
"valid_targets_mean": 4318.9,
"valid_targets_min": 1421
},
{
"epoch": 5.97399003873824,
"grad_norm": 0.25749309111006674,
"learning_rate": 2.569318500462392e-06,
"loss": 0.0714,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03529876843094826,
"step": 5400,
"valid_targets_mean": 4196.6,
"valid_targets_min": 2018
},
{
"epoch": 5.979524073049253,
"grad_norm": 0.23337191064636828,
"learning_rate": 2.5423359768944967e-06,
"loss": 0.072,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0353553332388401,
"step": 5405,
"valid_targets_mean": 4083.7,
"valid_targets_min": 1696
},
{
"epoch": 5.985058107360266,
"grad_norm": 0.22862376038231164,
"learning_rate": 2.5154862655823563e-06,
"loss": 0.0735,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.036466386169195175,
"step": 5410,
"valid_targets_mean": 4253.7,
"valid_targets_min": 2036
},
{
"epoch": 5.990592141671279,
"grad_norm": 0.22955140120017462,
"learning_rate": 2.4887695707898728e-06,
"loss": 0.0713,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03640773519873619,
"step": 5415,
"valid_targets_mean": 4333.8,
"valid_targets_min": 1885
},
{
"epoch": 5.996126175982291,
"grad_norm": 0.2125943251045193,
"learning_rate": 2.4621860957690123e-06,
"loss": 0.0714,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03555760160088539,
"step": 5420,
"valid_targets_mean": 4365.4,
"valid_targets_min": 1943
},
{
"epoch": 6.001106806862203,
"grad_norm": 0.26368627735327654,
"learning_rate": 2.435736042758252e-06,
"loss": 0.0677,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.059096869081258774,
"step": 5425,
"valid_targets_mean": 7176.8,
"valid_targets_min": 2475
},
{
"epoch": 6.0066408411732155,
"grad_norm": 0.47193555298918144,
"learning_rate": 2.409419612981023e-06,
"loss": 0.1281,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07251014560461044,
"step": 5430,
"valid_targets_mean": 7152.2,
"valid_targets_min": 1817
},
{
"epoch": 6.012174875484228,
"grad_norm": 0.3653661869376702,
"learning_rate": 2.383237006644208e-06,
"loss": 0.1413,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06588508933782578,
"step": 5435,
"valid_targets_mean": 6413.1,
"valid_targets_min": 2694
},
{
"epoch": 6.017708909795241,
"grad_norm": 0.2862731006886899,
"learning_rate": 2.3571884229365984e-06,
"loss": 0.1374,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06910615414381027,
"step": 5440,
"valid_targets_mean": 6742.4,
"valid_targets_min": 2529
},
{
"epoch": 6.023242944106253,
"grad_norm": 0.23404931027479792,
"learning_rate": 2.3312740600273888e-06,
"loss": 0.1378,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06342857331037521,
"step": 5445,
"valid_targets_mean": 6891.3,
"valid_targets_min": 2165
},
{
"epoch": 6.028776978417266,
"grad_norm": 0.21433044642997082,
"learning_rate": 2.3054941150646525e-06,
"loss": 0.1313,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06521899253129959,
"step": 5450,
"valid_targets_mean": 6714.7,
"valid_targets_min": 1734
},
{
"epoch": 6.034311012728279,
"grad_norm": 0.20433087046826062,
"learning_rate": 2.2798487841738727e-06,
"loss": 0.1189,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0649661123752594,
"step": 5455,
"valid_targets_mean": 7105.4,
"valid_targets_min": 1845
},
{
"epoch": 6.039845047039291,
"grad_norm": 0.19088713467699442,
"learning_rate": 2.2543382624564235e-06,
"loss": 0.1212,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05487219616770744,
"step": 5460,
"valid_targets_mean": 6475.6,
"valid_targets_min": 2297
},
{
"epoch": 6.045379081350305,
"grad_norm": 0.19942065796995198,
"learning_rate": 2.22896274398809e-06,
"loss": 0.119,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05961311236023903,
"step": 5465,
"valid_targets_mean": 6744.1,
"valid_targets_min": 2793
},
{
"epoch": 6.050913115661317,
"grad_norm": 0.19120702109483861,
"learning_rate": 2.2037224218176067e-06,
"loss": 0.1113,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05088047310709953,
"step": 5470,
"valid_targets_mean": 6725.4,
"valid_targets_min": 2520
},
{
"epoch": 6.05644714997233,
"grad_norm": 0.20696475872471462,
"learning_rate": 2.1786174879651646e-06,
"loss": 0.1119,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.050160735845565796,
"step": 5475,
"valid_targets_mean": 6286.6,
"valid_targets_min": 2643
},
{
"epoch": 6.061981184283343,
"grad_norm": 0.2838515581035275,
"learning_rate": 2.15364813342098e-06,
"loss": 0.115,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.055874865502119064,
"step": 5480,
"valid_targets_mean": 6647.1,
"valid_targets_min": 2218
},
{
"epoch": 6.067515218594355,
"grad_norm": 0.24429025940738258,
"learning_rate": 2.128814548143814e-06,
"loss": 0.1127,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05764148011803627,
"step": 5485,
"valid_targets_mean": 6991.6,
"valid_targets_min": 3271
},
{
"epoch": 6.073049252905368,
"grad_norm": 0.22561127923089053,
"learning_rate": 2.1041169210595445e-06,
"loss": 0.1132,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05936726927757263,
"step": 5490,
"valid_targets_mean": 7175.3,
"valid_targets_min": 1805
},
{
"epoch": 6.0785832872163805,
"grad_norm": 0.22212852022644294,
"learning_rate": 2.0795554400597286e-06,
"loss": 0.11,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04884013533592224,
"step": 5495,
"valid_targets_mean": 6327.0,
"valid_targets_min": 1224
},
{
"epoch": 6.084117321527393,
"grad_norm": 0.21393129624832247,
"learning_rate": 2.0551302920001493e-06,
"loss": 0.107,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06428065896034241,
"step": 5500,
"valid_targets_mean": 7451.6,
"valid_targets_min": 1864
},
{
"epoch": 6.089651355838406,
"grad_norm": 0.2087036431848382,
"learning_rate": 2.0308416626994364e-06,
"loss": 0.1065,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06320202350616455,
"step": 5505,
"valid_targets_mean": 7721.9,
"valid_targets_min": 3662
},
{
"epoch": 6.095185390149419,
"grad_norm": 0.18708347512612522,
"learning_rate": 2.0066897369376102e-06,
"loss": 0.1055,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.052226606756448746,
"step": 5510,
"valid_targets_mean": 7039.7,
"valid_targets_min": 1698
},
{
"epoch": 6.100719424460432,
"grad_norm": 0.20885772048522724,
"learning_rate": 1.982674698454703e-06,
"loss": 0.1101,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.055415648967027664,
"step": 5515,
"valid_targets_mean": 7115.9,
"valid_targets_min": 1492
},
{
"epoch": 6.1062534587714445,
"grad_norm": 0.2033519261853173,
"learning_rate": 1.958796729949355e-06,
"loss": 0.101,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04657214879989624,
"step": 5520,
"valid_targets_mean": 6713.1,
"valid_targets_min": 2543
},
{
"epoch": 6.111787493082457,
"grad_norm": 0.21636598733741638,
"learning_rate": 1.9350560130774234e-06,
"loss": 0.0997,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.053439270704984665,
"step": 5525,
"valid_targets_mean": 6488.6,
"valid_targets_min": 2556
},
{
"epoch": 6.11732152739347,
"grad_norm": 0.212204397525806,
"learning_rate": 1.911452728450589e-06,
"loss": 0.0999,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05276120826601982,
"step": 5530,
"valid_targets_mean": 7216.3,
"valid_targets_min": 1992
},
{
"epoch": 6.122855561704482,
"grad_norm": 0.20517538957361184,
"learning_rate": 1.887987055635001e-06,
"loss": 0.097,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.046480581164360046,
"step": 5535,
"valid_targets_mean": 6421.9,
"valid_targets_min": 2444
},
{
"epoch": 6.128389596015495,
"grad_norm": 0.21771474389513235,
"learning_rate": 1.8646591731499053e-06,
"loss": 0.0982,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04300164803862572,
"step": 5540,
"valid_targets_mean": 6405.9,
"valid_targets_min": 2545
},
{
"epoch": 6.133923630326508,
"grad_norm": 0.20624266728265683,
"learning_rate": 1.841469258466273e-06,
"loss": 0.0956,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.047111015766859055,
"step": 5545,
"valid_targets_mean": 6837.7,
"valid_targets_min": 2151
},
{
"epoch": 6.13945766463752,
"grad_norm": 0.1983984538297293,
"learning_rate": 1.8184174880054728e-06,
"loss": 0.0949,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0536317341029644,
"step": 5550,
"valid_targets_mean": 7361.1,
"valid_targets_min": 2378
},
{
"epoch": 6.144991698948534,
"grad_norm": 0.21196934655380573,
"learning_rate": 1.7955040371379052e-06,
"loss": 0.0993,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.045640040189027786,
"step": 5555,
"valid_targets_mean": 6319.2,
"valid_targets_min": 2356
},
{
"epoch": 6.150525733259546,
"grad_norm": 0.21184599881715346,
"learning_rate": 1.7727290801816877e-06,
"loss": 0.0964,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.041314657777547836,
"step": 5560,
"valid_targets_mean": 6630.8,
"valid_targets_min": 1972
},
{
"epoch": 6.156059767570559,
"grad_norm": 0.21228986821072401,
"learning_rate": 1.750092790401321e-06,
"loss": 0.0883,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04752728343009949,
"step": 5565,
"valid_targets_mean": 6972.9,
"valid_targets_min": 2135
},
{
"epoch": 6.161593801881572,
"grad_norm": 0.2160322976500172,
"learning_rate": 1.7275953400063672e-06,
"loss": 0.096,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.046096403151750565,
"step": 5570,
"valid_targets_mean": 6707.8,
"valid_targets_min": 1871
},
{
"epoch": 6.167127836192584,
"grad_norm": 0.2008173954902481,
"learning_rate": 1.7052369001501489e-06,
"loss": 0.0919,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.043318573385477066,
"step": 5575,
"valid_targets_mean": 6739.1,
"valid_targets_min": 2150
},
{
"epoch": 6.172661870503597,
"grad_norm": 0.2002716284364717,
"learning_rate": 1.6830176409284327e-06,
"loss": 0.0934,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.045532722026109695,
"step": 5580,
"valid_targets_mean": 6861.2,
"valid_targets_min": 2514
},
{
"epoch": 6.17819590481461,
"grad_norm": 0.19935046559834757,
"learning_rate": 1.6609377313781539e-06,
"loss": 0.0976,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05056362226605415,
"step": 5585,
"valid_targets_mean": 7224.6,
"valid_targets_min": 2698
},
{
"epoch": 6.183729939125622,
"grad_norm": 0.20653748117791743,
"learning_rate": 1.6389973394761116e-06,
"loss": 0.094,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04757365211844444,
"step": 5590,
"valid_targets_mean": 6807.6,
"valid_targets_min": 2279
},
{
"epoch": 6.189263973436636,
"grad_norm": 0.19818533807915628,
"learning_rate": 1.617196632137703e-06,
"loss": 0.0951,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04539031162858009,
"step": 5595,
"valid_targets_mean": 6986.2,
"valid_targets_min": 2280
},
{
"epoch": 6.194798007747648,
"grad_norm": 0.20166258302871556,
"learning_rate": 1.595535775215653e-06,
"loss": 0.0941,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04186883568763733,
"step": 5600,
"valid_targets_mean": 6668.9,
"valid_targets_min": 3573
},
{
"epoch": 6.200332042058661,
"grad_norm": 0.2403254196566056,
"learning_rate": 1.574014933498751e-06,
"loss": 0.093,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05118389055132866,
"step": 5605,
"valid_targets_mean": 7348.7,
"valid_targets_min": 2266
},
{
"epoch": 6.205866076369674,
"grad_norm": 0.2343022776577193,
"learning_rate": 1.5526342707105912e-06,
"loss": 0.0951,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0463598258793354,
"step": 5610,
"valid_targets_mean": 6718.5,
"valid_targets_min": 1852
},
{
"epoch": 6.211400110680686,
"grad_norm": 0.20474245395725305,
"learning_rate": 1.5313939495083329e-06,
"loss": 0.0936,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03855031356215477,
"step": 5615,
"valid_targets_mean": 6317.0,
"valid_targets_min": 1890
},
{
"epoch": 6.216934144991699,
"grad_norm": 0.20389018507643655,
"learning_rate": 1.5102941314814645e-06,
"loss": 0.0941,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04324701055884361,
"step": 5620,
"valid_targets_mean": 6423.0,
"valid_targets_min": 1961
},
{
"epoch": 6.2224681793027115,
"grad_norm": 0.22347203143863656,
"learning_rate": 1.489334977150567e-06,
"loss": 0.0943,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.049007613211870193,
"step": 5625,
"valid_targets_mean": 6961.5,
"valid_targets_min": 2011
},
{
"epoch": 6.228002213613724,
"grad_norm": 0.29422745024398256,
"learning_rate": 1.468516645966107e-06,
"loss": 0.0749,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.033227451145648956,
"step": 5630,
"valid_targets_mean": 4264.4,
"valid_targets_min": 1664
},
{
"epoch": 6.233536247924737,
"grad_norm": 0.2453358322792234,
"learning_rate": 1.4478392963071985e-06,
"loss": 0.0601,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02738841436803341,
"step": 5635,
"valid_targets_mean": 4403.8,
"valid_targets_min": 1896
},
{
"epoch": 6.23907028223575,
"grad_norm": 0.30540480705047374,
"learning_rate": 1.4273030854804292e-06,
"loss": 0.0738,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03664984181523323,
"step": 5640,
"valid_targets_mean": 4392.9,
"valid_targets_min": 1282
},
{
"epoch": 6.244604316546763,
"grad_norm": 0.2717082701357272,
"learning_rate": 1.4069081697186415e-06,
"loss": 0.0709,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03534964099526405,
"step": 5645,
"valid_targets_mean": 4179.3,
"valid_targets_min": 1998
},
{
"epoch": 6.2501383508577755,
"grad_norm": 0.2475574410090893,
"learning_rate": 1.386654704179753e-06,
"loss": 0.0675,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.036007124930620193,
"step": 5650,
"valid_targets_mean": 4410.1,
"valid_targets_min": 1629
},
{
"epoch": 6.255672385168788,
"grad_norm": 0.22433925042604627,
"learning_rate": 1.3665428429455729e-06,
"loss": 0.0709,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03184202313423157,
"step": 5655,
"valid_targets_mean": 4081.9,
"valid_targets_min": 1820
},
{
"epoch": 6.261206419479801,
"grad_norm": 0.24733371250383948,
"learning_rate": 1.346572739020624e-06,
"loss": 0.0803,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.040468450635671616,
"step": 5660,
"valid_targets_mean": 4430.3,
"valid_targets_min": 1591
},
{
"epoch": 6.266740453790813,
"grad_norm": 0.2194558634851793,
"learning_rate": 1.326744544331e-06,
"loss": 0.0735,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02739051915705204,
"step": 5665,
"valid_targets_mean": 3639.0,
"valid_targets_min": 1609
},
{
"epoch": 6.272274488101826,
"grad_norm": 0.22573361756053215,
"learning_rate": 1.3070584097231764e-06,
"loss": 0.0719,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03558327630162239,
"step": 5670,
"valid_targets_mean": 4169.2,
"valid_targets_min": 2003
},
{
"epoch": 6.277808522412839,
"grad_norm": 0.23202403327961435,
"learning_rate": 1.2875144849628973e-06,
"loss": 0.0709,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.039374466985464096,
"step": 5675,
"valid_targets_mean": 4387.5,
"valid_targets_min": 1802
},
{
"epoch": 6.283342556723852,
"grad_norm": 0.23588444742883982,
"learning_rate": 1.2681129187340147e-06,
"loss": 0.0728,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.041341233998537064,
"step": 5680,
"valid_targets_mean": 4586.4,
"valid_targets_min": 1431
},
{
"epoch": 6.288876591034865,
"grad_norm": 0.24261143005195893,
"learning_rate": 1.2488538586373645e-06,
"loss": 0.0808,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.035322047770023346,
"step": 5685,
"valid_targets_mean": 4150.2,
"valid_targets_min": 1451
},
{
"epoch": 6.294410625345877,
"grad_norm": 0.23626406873269493,
"learning_rate": 1.2297374511896387e-06,
"loss": 0.0741,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03342689946293831,
"step": 5690,
"valid_targets_mean": 4058.3,
"valid_targets_min": 1500
},
{
"epoch": 6.29994465965689,
"grad_norm": 0.22893138639014132,
"learning_rate": 1.2107638418222733e-06,
"loss": 0.0739,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03557369112968445,
"step": 5695,
"valid_targets_mean": 4309.4,
"valid_targets_min": 1370
},
{
"epoch": 6.305478693967903,
"grad_norm": 0.20742676858737275,
"learning_rate": 1.1919331748803531e-06,
"loss": 0.07,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.032634858042001724,
"step": 5700,
"valid_targets_mean": 4254.8,
"valid_targets_min": 1915
},
{
"epoch": 6.311012728278915,
"grad_norm": 0.21245971613137082,
"learning_rate": 1.173245593621486e-06,
"loss": 0.0727,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.033117055892944336,
"step": 5705,
"valid_targets_mean": 3897.5,
"valid_targets_min": 1699
},
{
"epoch": 6.316546762589928,
"grad_norm": 0.2211524280699169,
"learning_rate": 1.1547012402147461e-06,
"loss": 0.0735,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03834658861160278,
"step": 5710,
"valid_targets_mean": 4873.8,
"valid_targets_min": 1374
},
{
"epoch": 6.3220807969009405,
"grad_norm": 0.22494584076410562,
"learning_rate": 1.1363002557395663e-06,
"loss": 0.0696,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03914666920900345,
"step": 5715,
"valid_targets_mean": 4314.8,
"valid_targets_min": 1526
},
{
"epoch": 6.327614831211953,
"grad_norm": 0.21502150042346616,
"learning_rate": 1.1180427801846827e-06,
"loss": 0.0691,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.028126897290349007,
"step": 5720,
"valid_targets_mean": 3668.5,
"valid_targets_min": 1735
},
{
"epoch": 6.333148865522967,
"grad_norm": 0.2415860232914858,
"learning_rate": 1.0999289524470537e-06,
"loss": 0.0792,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0350409634411335,
"step": 5725,
"valid_targets_mean": 4198.7,
"valid_targets_min": 1587
},
{
"epoch": 6.338682899833979,
"grad_norm": 0.22985989637869847,
"learning_rate": 1.0819589103308204e-06,
"loss": 0.0697,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.030462943017482758,
"step": 5730,
"valid_targets_mean": 4426.8,
"valid_targets_min": 1624
},
{
"epoch": 6.344216934144992,
"grad_norm": 0.23139369403799398,
"learning_rate": 1.064132790546246e-06,
"loss": 0.076,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03156794235110283,
"step": 5735,
"valid_targets_mean": 3844.5,
"valid_targets_min": 1660
},
{
"epoch": 6.3497509684560045,
"grad_norm": 0.240471213429906,
"learning_rate": 1.0464507287086744e-06,
"loss": 0.0753,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03767099231481552,
"step": 5740,
"valid_targets_mean": 4607.4,
"valid_targets_min": 1446
},
{
"epoch": 6.355285002767017,
"grad_norm": 0.22192997179412693,
"learning_rate": 1.0289128593375119e-06,
"loss": 0.073,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04201770946383476,
"step": 5745,
"valid_targets_mean": 4620.0,
"valid_targets_min": 1843
},
{
"epoch": 6.36081903707803,
"grad_norm": 0.2047492893678803,
"learning_rate": 1.011519315855185e-06,
"loss": 0.0688,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.030818996950984,
"step": 5750,
"valid_targets_mean": 4062.0,
"valid_targets_min": 1629
},
{
"epoch": 6.366353071389042,
"grad_norm": 0.21823041506261645,
"learning_rate": 9.94270230586145e-07,
"loss": 0.0755,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03921927139163017,
"step": 5755,
"valid_targets_mean": 4552.9,
"valid_targets_min": 1687
},
{
"epoch": 6.371887105700055,
"grad_norm": 0.2220340611729739,
"learning_rate": 9.771657347558428e-07,
"loss": 0.0738,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.031742434948682785,
"step": 5760,
"valid_targets_mean": 4288.0,
"valid_targets_min": 1735
},
{
"epoch": 6.377421140011068,
"grad_norm": 0.21745186872682112,
"learning_rate": 9.602059584897506e-07,
"loss": 0.0708,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03511330857872963,
"step": 5765,
"valid_targets_mean": 4494.9,
"valid_targets_min": 1742
},
{
"epoch": 6.382955174322081,
"grad_norm": 0.21894433232405924,
"learning_rate": 9.433910308123572e-07,
"loss": 0.0676,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03947247937321663,
"step": 5770,
"valid_targets_mean": 4560.7,
"valid_targets_min": 1850
},
{
"epoch": 6.388489208633094,
"grad_norm": 0.22995324546061463,
"learning_rate": 9.267210796461823e-07,
"loss": 0.0655,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03699576109647751,
"step": 5775,
"valid_targets_mean": 4525.4,
"valid_targets_min": 1488
},
{
"epoch": 6.394023242944106,
"grad_norm": 0.22563307465188687,
"learning_rate": 9.101962318108226e-07,
"loss": 0.0678,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03179671987891197,
"step": 5780,
"valid_targets_mean": 4337.6,
"valid_targets_min": 1551
},
{
"epoch": 6.399557277255119,
"grad_norm": 0.22470922312893973,
"learning_rate": 8.93816613021965e-07,
"loss": 0.0741,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.033924076706171036,
"step": 5785,
"valid_targets_mean": 4064.8,
"valid_targets_min": 1260
},
{
"epoch": 6.405091311566132,
"grad_norm": 0.2322852894397586,
"learning_rate": 8.775823478904488e-07,
"loss": 0.0698,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03452476114034653,
"step": 5790,
"valid_targets_mean": 4271.5,
"valid_targets_min": 1965
},
{
"epoch": 6.410625345877144,
"grad_norm": 0.24177928417312386,
"learning_rate": 8.61493559921307e-07,
"loss": 0.07,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.037243809551000595,
"step": 5795,
"valid_targets_mean": 4530.3,
"valid_targets_min": 1812
},
{
"epoch": 6.416159380188157,
"grad_norm": 0.2216906788415978,
"learning_rate": 8.455503715128266e-07,
"loss": 0.0707,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.038190603256225586,
"step": 5800,
"valid_targets_mean": 5182.0,
"valid_targets_min": 2171
},
{
"epoch": 6.4216934144991695,
"grad_norm": 0.2120593332647113,
"learning_rate": 8.297529039556274e-07,
"loss": 0.0636,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.032920487225055695,
"step": 5805,
"valid_targets_mean": 4341.3,
"valid_targets_min": 1861
},
{
"epoch": 6.427227448810182,
"grad_norm": 0.21228521891675042,
"learning_rate": 8.141012774317269e-07,
"loss": 0.061,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0351475290954113,
"step": 5810,
"valid_targets_mean": 4484.4,
"valid_targets_min": 1651
},
{
"epoch": 6.432761483121196,
"grad_norm": 0.19448488726474453,
"learning_rate": 7.98595611013635e-07,
"loss": 0.0635,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02942313253879547,
"step": 5815,
"valid_targets_mean": 4192.0,
"valid_targets_min": 1684
},
{
"epoch": 6.438295517432208,
"grad_norm": 0.20833364189105583,
"learning_rate": 7.832360226634361e-07,
"loss": 0.0669,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03339335694909096,
"step": 5820,
"valid_targets_mean": 4869.7,
"valid_targets_min": 1745
},
{
"epoch": 6.443829551743221,
"grad_norm": 0.19617265316913424,
"learning_rate": 7.680226292319082e-07,
"loss": 0.0642,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02662007510662079,
"step": 5825,
"valid_targets_mean": 3970.9,
"valid_targets_min": 1643
},
{
"epoch": 6.4493635860542335,
"grad_norm": 0.2179831646410156,
"learning_rate": 7.52955546457621e-07,
"loss": 0.0669,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.034840185195207596,
"step": 5830,
"valid_targets_mean": 4239.2,
"valid_targets_min": 1695
},
{
"epoch": 6.454897620365246,
"grad_norm": 0.21340091815248927,
"learning_rate": 7.380348889660661e-07,
"loss": 0.0637,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.033205918967723846,
"step": 5835,
"valid_targets_mean": 4571.5,
"valid_targets_min": 1696
},
{
"epoch": 6.460431654676259,
"grad_norm": 0.21409959567631628,
"learning_rate": 7.232607702687699e-07,
"loss": 0.0711,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03569451719522476,
"step": 5840,
"valid_targets_mean": 4433.2,
"valid_targets_min": 2003
},
{
"epoch": 6.465965688987271,
"grad_norm": 0.20028490308433225,
"learning_rate": 7.086333027624493e-07,
"loss": 0.0625,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.028834521770477295,
"step": 5845,
"valid_targets_mean": 4008.7,
"valid_targets_min": 1371
},
{
"epoch": 6.471499723298284,
"grad_norm": 0.28020985868169035,
"learning_rate": 6.941525977281393e-07,
"loss": 0.0706,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03831277787685394,
"step": 5850,
"valid_targets_mean": 5755.9,
"valid_targets_min": 1607
},
{
"epoch": 6.477033757609298,
"grad_norm": 0.32129073672421576,
"learning_rate": 6.798187653303534e-07,
"loss": 0.0826,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.042238298803567886,
"step": 5855,
"valid_targets_mean": 5835.6,
"valid_targets_min": 2306
},
{
"epoch": 6.48256779192031,
"grad_norm": 0.2736503696001417,
"learning_rate": 6.656319146162516e-07,
"loss": 0.0875,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03857993707060814,
"step": 5860,
"valid_targets_mean": 5367.4,
"valid_targets_min": 2272
},
{
"epoch": 6.488101826231323,
"grad_norm": 0.23936583896726388,
"learning_rate": 6.515921535147974e-07,
"loss": 0.0797,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03267192468047142,
"step": 5865,
"valid_targets_mean": 5459.6,
"valid_targets_min": 1924
},
{
"epoch": 6.493635860542335,
"grad_norm": 0.21675915459435122,
"learning_rate": 6.376995888359516e-07,
"loss": 0.0842,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.040545906871557236,
"step": 5870,
"valid_targets_mean": 5662.9,
"valid_targets_min": 2081
},
{
"epoch": 6.499169894853348,
"grad_norm": 0.19691958549470645,
"learning_rate": 6.239543262698422e-07,
"loss": 0.0763,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.035456351935863495,
"step": 5875,
"valid_targets_mean": 5408.0,
"valid_targets_min": 1663
},
{
"epoch": 6.504703929164361,
"grad_norm": 0.18219063079375922,
"learning_rate": 6.103564703859799e-07,
"loss": 0.0697,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.037758808583021164,
"step": 5880,
"valid_targets_mean": 6090.0,
"valid_targets_min": 3233
},
{
"epoch": 6.510237963475373,
"grad_norm": 0.1787082903748495,
"learning_rate": 5.969061246324525e-07,
"loss": 0.0682,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.030553584918379784,
"step": 5885,
"valid_targets_mean": 5283.3,
"valid_targets_min": 2542
},
{
"epoch": 6.515771997786386,
"grad_norm": 0.18264859649970874,
"learning_rate": 5.836033913351302e-07,
"loss": 0.0674,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03753102943301201,
"step": 5890,
"valid_targets_mean": 5841.9,
"valid_targets_min": 3074
},
{
"epoch": 6.5213060320973995,
"grad_norm": 0.16662900561871258,
"learning_rate": 5.7044837169691e-07,
"loss": 0.0636,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03211820498108864,
"step": 5895,
"valid_targets_mean": 5844.2,
"valid_targets_min": 1791
},
{
"epoch": 6.526840066408412,
"grad_norm": 0.16649539115731712,
"learning_rate": 5.574411657969125e-07,
"loss": 0.069,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03245365247130394,
"step": 5900,
"valid_targets_mean": 5735.6,
"valid_targets_min": 2746
},
{
"epoch": 6.532374100719425,
"grad_norm": 0.16434361967617983,
"learning_rate": 5.445818725897534e-07,
"loss": 0.0645,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.031247785314917564,
"step": 5905,
"valid_targets_mean": 5778.7,
"valid_targets_min": 2829
},
{
"epoch": 6.537908135030437,
"grad_norm": 0.16181782660191443,
"learning_rate": 5.318705899047727e-07,
"loss": 0.0602,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.030019355937838554,
"step": 5910,
"valid_targets_mean": 5638.1,
"valid_targets_min": 1955
},
{
"epoch": 6.54344216934145,
"grad_norm": 0.15453935494744914,
"learning_rate": 5.193074144452892e-07,
"loss": 0.0606,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02768268622457981,
"step": 5915,
"valid_targets_mean": 5649.6,
"valid_targets_min": 1657
},
{
"epoch": 6.548976203652463,
"grad_norm": 0.16303444707259854,
"learning_rate": 5.068924417878807e-07,
"loss": 0.0571,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.030390538275241852,
"step": 5920,
"valid_targets_mean": 5870.3,
"valid_targets_min": 3122
},
{
"epoch": 6.554510237963475,
"grad_norm": 0.162724661938449,
"learning_rate": 4.946257663816334e-07,
"loss": 0.057,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02618623711168766,
"step": 5925,
"valid_targets_mean": 5898.3,
"valid_targets_min": 2722
},
{
"epoch": 6.560044272274488,
"grad_norm": 0.16815058862489182,
"learning_rate": 4.825074815474495e-07,
"loss": 0.0599,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.030746882781386375,
"step": 5930,
"valid_targets_mean": 5430.9,
"valid_targets_min": 1832
},
{
"epoch": 6.5655783065855005,
"grad_norm": 0.16268319766530676,
"learning_rate": 4.7053767947730976e-07,
"loss": 0.0562,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02740519307553768,
"step": 5935,
"valid_targets_mean": 5711.7,
"valid_targets_min": 1876
},
{
"epoch": 6.571112340896514,
"grad_norm": 0.16185701199142863,
"learning_rate": 4.587164512335984e-07,
"loss": 0.0553,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.028320694342255592,
"step": 5940,
"valid_targets_mean": 5817.8,
"valid_targets_min": 3349
},
{
"epoch": 6.576646375207527,
"grad_norm": 0.17315465874497984,
"learning_rate": 4.4704388674838836e-07,
"loss": 0.0568,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0337056927382946,
"step": 5945,
"valid_targets_mean": 6213.9,
"valid_targets_min": 2486
},
{
"epoch": 6.582180409518539,
"grad_norm": 0.16874657796605771,
"learning_rate": 4.355200748227728e-07,
"loss": 0.0566,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.027117937803268433,
"step": 5950,
"valid_targets_mean": 5960.8,
"valid_targets_min": 1760
},
{
"epoch": 6.587714443829552,
"grad_norm": 0.16953088257827853,
"learning_rate": 4.241451031261812e-07,
"loss": 0.0571,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02523176372051239,
"step": 5955,
"valid_targets_mean": 5431.6,
"valid_targets_min": 1939
},
{
"epoch": 6.5932484781405645,
"grad_norm": 0.17046845562368365,
"learning_rate": 4.129190581957154e-07,
"loss": 0.0556,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.028271449729800224,
"step": 5960,
"valid_targets_mean": 5619.5,
"valid_targets_min": 1402
},
{
"epoch": 6.598782512451577,
"grad_norm": 0.1658430114537753,
"learning_rate": 4.0184202543549266e-07,
"loss": 0.0535,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.029601609334349632,
"step": 5965,
"valid_targets_mean": 5685.0,
"valid_targets_min": 1115
},
{
"epoch": 6.60431654676259,
"grad_norm": 0.16261583595041115,
"learning_rate": 3.9091408911599016e-07,
"loss": 0.0512,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02375098504126072,
"step": 5970,
"valid_targets_mean": 5896.3,
"valid_targets_min": 2249
},
{
"epoch": 6.609850581073602,
"grad_norm": 0.17113988788796894,
"learning_rate": 3.8013533237341026e-07,
"loss": 0.0551,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.024803929030895233,
"step": 5975,
"valid_targets_mean": 5286.9,
"valid_targets_min": 2419
},
{
"epoch": 6.615384615384615,
"grad_norm": 0.16227669472509565,
"learning_rate": 3.695058372090432e-07,
"loss": 0.055,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.031464751809835434,
"step": 5980,
"valid_targets_mean": 5907.0,
"valid_targets_min": 2764
},
{
"epoch": 6.6209186496956285,
"grad_norm": 0.15230008226364655,
"learning_rate": 3.590256844886475e-07,
"loss": 0.0491,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02285112999379635,
"step": 5985,
"valid_targets_mean": 5677.7,
"valid_targets_min": 2561
},
{
"epoch": 6.626452684006641,
"grad_norm": 0.15507053735181311,
"learning_rate": 3.486949539418327e-07,
"loss": 0.0496,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.022178545594215393,
"step": 5990,
"valid_targets_mean": 5690.5,
"valid_targets_min": 2153
},
{
"epoch": 6.631986718317654,
"grad_norm": 0.15406847130900264,
"learning_rate": 3.385137241614489e-07,
"loss": 0.0507,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.025633057579398155,
"step": 5995,
"valid_targets_mean": 5799.1,
"valid_targets_min": 2167
},
{
"epoch": 6.637520752628666,
"grad_norm": 0.16701465983686922,
"learning_rate": 3.284820726030025e-07,
"loss": 0.0502,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02921949326992035,
"step": 6000,
"valid_targets_mean": 5970.1,
"valid_targets_min": 3079
},
{
"epoch": 6.643054786939679,
"grad_norm": 0.1491935829405977,
"learning_rate": 3.1860007558404125e-07,
"loss": 0.0489,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.023413682356476784,
"step": 6005,
"valid_targets_mean": 5799.0,
"valid_targets_min": 2123
},
{
"epoch": 6.648588821250692,
"grad_norm": 0.150245854586345,
"learning_rate": 3.088678082836083e-07,
"loss": 0.0499,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.019299032166600227,
"step": 6010,
"valid_targets_mean": 5474.9,
"valid_targets_min": 1505
},
{
"epoch": 6.654122855561704,
"grad_norm": 0.14307532650864027,
"learning_rate": 2.992853447416377e-07,
"loss": 0.0452,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.019033873453736305,
"step": 6015,
"valid_targets_mean": 5696.5,
"valid_targets_min": 2150
},
{
"epoch": 6.659656889872717,
"grad_norm": 0.15702109651212837,
"learning_rate": 2.8985275785841094e-07,
"loss": 0.0494,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02460307441651821,
"step": 6020,
"valid_targets_mean": 5482.0,
"valid_targets_min": 1925
},
{
"epoch": 6.6651909241837295,
"grad_norm": 0.16295466209332987,
"learning_rate": 2.805701193939947e-07,
"loss": 0.0479,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.023025652393698692,
"step": 6025,
"valid_targets_mean": 5700.8,
"valid_targets_min": 2524
},
{
"epoch": 6.670724958494743,
"grad_norm": 0.17077714740007088,
"learning_rate": 2.71437499967695e-07,
"loss": 0.0475,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02456340752542019,
"step": 6030,
"valid_targets_mean": 5443.2,
"valid_targets_min": 1992
},
{
"epoch": 6.676258992805756,
"grad_norm": 0.15583333265496774,
"learning_rate": 2.624549690575284e-07,
"loss": 0.0471,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0222936999052763,
"step": 6035,
"valid_targets_mean": 5506.9,
"valid_targets_min": 2062
},
{
"epoch": 6.681793027116768,
"grad_norm": 0.14726673158584985,
"learning_rate": 2.5362259499967623e-07,
"loss": 0.0471,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.021626999601721764,
"step": 6040,
"valid_targets_mean": 5554.7,
"valid_targets_min": 2289
},
{
"epoch": 6.687327061427781,
"grad_norm": 0.1432897815929805,
"learning_rate": 2.449404449879844e-07,
"loss": 0.0456,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.021053863689303398,
"step": 6045,
"valid_targets_mean": 5283.6,
"valid_targets_min": 2511
},
{
"epoch": 6.6928610957387935,
"grad_norm": 0.1497531374262155,
"learning_rate": 2.3640858507343766e-07,
"loss": 0.0438,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02070341445505619,
"step": 6050,
"valid_targets_mean": 5367.8,
"valid_targets_min": 1636
},
{
"epoch": 6.698395130049806,
"grad_norm": 0.1481851861278496,
"learning_rate": 2.2802708016366636e-07,
"loss": 0.0458,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.022724062204360962,
"step": 6055,
"valid_targets_mean": 5643.5,
"valid_targets_min": 1822
},
{
"epoch": 6.703929164360819,
"grad_norm": 0.14848419552320255,
"learning_rate": 2.1979599402244256e-07,
"loss": 0.042,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.021349245682358742,
"step": 6060,
"valid_targets_mean": 5522.8,
"valid_targets_min": 2271
},
{
"epoch": 6.709463198671831,
"grad_norm": 0.1593119673142632,
"learning_rate": 2.1171538926920697e-07,
"loss": 0.0435,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0206944290548563,
"step": 6065,
"valid_targets_mean": 5634.4,
"valid_targets_min": 3397
},
{
"epoch": 6.714997232982844,
"grad_norm": 0.16781758974714178,
"learning_rate": 2.0378532737858724e-07,
"loss": 0.0429,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.024538887664675713,
"step": 6070,
"valid_targets_mean": 5882.0,
"valid_targets_min": 1620
},
{
"epoch": 6.7205312672938575,
"grad_norm": 0.15427347780497472,
"learning_rate": 1.9600586867992045e-07,
"loss": 0.0445,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02108161151409149,
"step": 6075,
"valid_targets_mean": 5484.1,
"valid_targets_min": 1983
},
{
"epoch": 6.72606530160487,
"grad_norm": 0.1590775756796442,
"learning_rate": 1.8837707235681347e-07,
"loss": 0.0448,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.025591416284441948,
"step": 6080,
"valid_targets_mean": 6050.4,
"valid_targets_min": 2705
},
{
"epoch": 6.731599335915883,
"grad_norm": 0.14284190422291548,
"learning_rate": 1.8089899644667673e-07,
"loss": 0.0414,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.019970562309026718,
"step": 6085,
"valid_targets_mean": 5951.2,
"valid_targets_min": 1263
},
{
"epoch": 6.737133370226895,
"grad_norm": 0.15288214426850036,
"learning_rate": 1.7357169784029348e-07,
"loss": 0.0448,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.021346738561987877,
"step": 6090,
"valid_targets_mean": 5333.5,
"valid_targets_min": 2761
},
{
"epoch": 6.742667404537908,
"grad_norm": 0.15933272800140702,
"learning_rate": 1.6639523228137778e-07,
"loss": 0.0435,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.026872599497437477,
"step": 6095,
"valid_targets_mean": 5898.5,
"valid_targets_min": 1918
},
{
"epoch": 6.748201438848921,
"grad_norm": 0.15210885857654943,
"learning_rate": 1.5936965436615492e-07,
"loss": 0.0424,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.019810838624835014,
"step": 6100,
"valid_targets_mean": 5690.7,
"valid_targets_min": 2491
},
{
"epoch": 6.753735473159933,
"grad_norm": 0.16212466670735068,
"learning_rate": 1.524950175429507e-07,
"loss": 0.0473,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.026772432029247284,
"step": 6105,
"valid_targets_mean": 5855.6,
"valid_targets_min": 1834
},
{
"epoch": 6.759269507470947,
"grad_norm": 0.2781957807032019,
"learning_rate": 1.4577137411177166e-07,
"loss": 0.0601,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.028757303953170776,
"step": 6110,
"valid_targets_mean": 4478.1,
"valid_targets_min": 1152
},
{
"epoch": 6.764803541781959,
"grad_norm": 0.285966123432216,
"learning_rate": 1.3919877522392322e-07,
"loss": 0.0616,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.027906084433197975,
"step": 6115,
"valid_targets_mean": 4434.4,
"valid_targets_min": 1363
},
{
"epoch": 6.770337576092972,
"grad_norm": 0.2660206536747435,
"learning_rate": 1.3277727088160775e-07,
"loss": 0.0606,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.033058829605579376,
"step": 6120,
"valid_targets_mean": 4586.5,
"valid_targets_min": 1203
},
{
"epoch": 6.775871610403985,
"grad_norm": 0.2815578821576788,
"learning_rate": 1.2650690993755377e-07,
"loss": 0.0656,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03213704749941826,
"step": 6125,
"valid_targets_mean": 4198.7,
"valid_targets_min": 1898
},
{
"epoch": 6.781405644714997,
"grad_norm": 0.27812158818342514,
"learning_rate": 1.2038774009463406e-07,
"loss": 0.0675,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03444572538137436,
"step": 6130,
"valid_targets_mean": 4499.3,
"valid_targets_min": 2282
},
{
"epoch": 6.78693967902601,
"grad_norm": 0.2538775243898183,
"learning_rate": 1.1441980790551699e-07,
"loss": 0.0644,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0322687067091465,
"step": 6135,
"valid_targets_mean": 4354.3,
"valid_targets_min": 2243
},
{
"epoch": 6.7924737133370225,
"grad_norm": 0.4139407017723169,
"learning_rate": 1.0860315877229133e-07,
"loss": 0.0656,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0316312201321125,
"step": 6140,
"valid_targets_mean": 5987.4,
"valid_targets_min": 1045
},
{
"epoch": 6.798007747648035,
"grad_norm": 0.4219852983365904,
"learning_rate": 1.0293783694614645e-07,
"loss": 0.0741,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.037688422948122025,
"step": 6145,
"valid_targets_mean": 7339.2,
"valid_targets_min": 1398
},
{
"epoch": 6.803541781959048,
"grad_norm": 0.4271759301135669,
"learning_rate": 9.742388552701266e-08,
"loss": 0.0759,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0405937097966671,
"step": 6150,
"valid_targets_mean": 7609.3,
"valid_targets_min": 2489
},
{
"epoch": 6.809075816270061,
"grad_norm": 0.47550541018352915,
"learning_rate": 9.206134646325026e-08,
"loss": 0.0858,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.042033206671476364,
"step": 6155,
"valid_targets_mean": 8182.5,
"valid_targets_min": 2323
},
{
"epoch": 6.814609850581074,
"grad_norm": 0.4541435636889632,
"learning_rate": 8.685026055131662e-08,
"loss": 0.0852,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04260958358645439,
"step": 6160,
"valid_targets_mean": 7945.0,
"valid_targets_min": 2386
},
{
"epoch": 6.820143884892087,
"grad_norm": 0.4187211676260777,
"learning_rate": 8.179066743546848e-08,
"loss": 0.0808,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04068029299378395,
"step": 6165,
"valid_targets_mean": 7628.4,
"valid_targets_min": 2019
},
{
"epoch": 6.825677919203099,
"grad_norm": 0.7188901584149283,
"learning_rate": 7.688260560745342e-08,
"loss": 0.1341,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0671887993812561,
"step": 6170,
"valid_targets_mean": 13487.5,
"valid_targets_min": 1304
},
{
"epoch": 6.831211953514112,
"grad_norm": 0.8134072666671982,
"learning_rate": 7.212611240621448e-08,
"loss": 0.1536,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08201751857995987,
"step": 6175,
"valid_targets_mean": 14044.6,
"valid_targets_min": 2837
},
{
"epoch": 6.836745987825124,
"grad_norm": 0.7728347504284517,
"learning_rate": 6.752122401761263e-08,
"loss": 0.1538,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07637709379196167,
"step": 6180,
"valid_targets_mean": 12808.5,
"valid_targets_min": 1264
},
{
"epoch": 6.842280022136137,
"grad_norm": 0.4866135651542434,
"learning_rate": 6.306797547414923e-08,
"loss": 0.1383,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04519471526145935,
"step": 6185,
"valid_targets_mean": 7773.3,
"valid_targets_min": 1300
},
{
"epoch": 6.84781405644715,
"grad_norm": 0.34132735867861963,
"learning_rate": 5.876640065469508e-08,
"loss": 0.0796,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03255182504653931,
"step": 6190,
"valid_targets_mean": 8022.5,
"valid_targets_min": 1221
},
{
"epoch": 6.853348090758162,
"grad_norm": 0.24281825590975215,
"learning_rate": 5.4616532284239576e-08,
"loss": 0.0597,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.026530781760811806,
"step": 6195,
"valid_targets_mean": 7332.0,
"valid_targets_min": 935
},
{
"epoch": 6.858882125069176,
"grad_norm": 0.3378643276186545,
"learning_rate": 5.061840193363754e-08,
"loss": 0.0734,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.043400898575782776,
"step": 6200,
"valid_targets_mean": 4677.9,
"valid_targets_min": 1413
},
{
"epoch": 6.8644161593801885,
"grad_norm": 0.2939484612048038,
"learning_rate": 4.677204001937163e-08,
"loss": 0.0809,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04071999713778496,
"step": 6205,
"valid_targets_mean": 5047.0,
"valid_targets_min": 1422
},
{
"epoch": 6.869950193691201,
"grad_norm": 0.26447990416566697,
"learning_rate": 4.3077475803317006e-08,
"loss": 0.0709,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03539319708943367,
"step": 6210,
"valid_targets_mean": 4560.3,
"valid_targets_min": 2177
},
{
"epoch": 6.875484228002214,
"grad_norm": 0.24448712356713942,
"learning_rate": 3.953473739252145e-08,
"loss": 0.0728,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03483784198760986,
"step": 6215,
"valid_targets_mean": 4750.5,
"valid_targets_min": 2094
},
{
"epoch": 6.881018262313226,
"grad_norm": 0.24136576815497512,
"learning_rate": 3.6143851738992265e-08,
"loss": 0.0714,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03553052619099617,
"step": 6220,
"valid_targets_mean": 4360.2,
"valid_targets_min": 1571
},
{
"epoch": 6.886552296624239,
"grad_norm": 0.2540992167336122,
"learning_rate": 3.290484463948973e-08,
"loss": 0.0737,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03783242031931877,
"step": 6225,
"valid_targets_mean": 4350.1,
"valid_targets_min": 1350
},
{
"epoch": 6.892086330935252,
"grad_norm": 0.26436404059943236,
"learning_rate": 2.981774073533172e-08,
"loss": 0.0847,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.046336591243743896,
"step": 6230,
"valid_targets_mean": 5759.9,
"valid_targets_min": 2496
},
{
"epoch": 6.897620365246264,
"grad_norm": 0.28374694012095986,
"learning_rate": 2.6882563512204972e-08,
"loss": 0.0886,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04141201451420784,
"step": 6235,
"valid_targets_mean": 4665.8,
"valid_targets_min": 1862
},
{
"epoch": 6.903154399557277,
"grad_norm": 0.27667918620344506,
"learning_rate": 2.4099335299987426e-08,
"loss": 0.0909,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.047536592930555344,
"step": 6240,
"valid_targets_mean": 5136.1,
"valid_targets_min": 2075
},
{
"epoch": 6.90868843386829,
"grad_norm": 0.2801499093244407,
"learning_rate": 2.146807727257727e-08,
"loss": 0.0935,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04789487645030022,
"step": 6245,
"valid_targets_mean": 5201.3,
"valid_targets_min": 2016
},
{
"epoch": 6.914222468179303,
"grad_norm": 0.25953453335013227,
"learning_rate": 1.898880944773307e-08,
"loss": 0.0908,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04826788604259491,
"step": 6250,
"valid_targets_mean": 5300.8,
"valid_targets_min": 1145
},
{
"epoch": 6.919756502490316,
"grad_norm": 0.2529759224910664,
"learning_rate": 1.666155068692499e-08,
"loss": 0.0849,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04037823900580406,
"step": 6255,
"valid_targets_mean": 4597.2,
"valid_targets_min": 1963
},
{
"epoch": 6.925290536801328,
"grad_norm": 0.23381027910263688,
"learning_rate": 1.4486318695181577e-08,
"loss": 0.0846,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03696097061038017,
"step": 6260,
"valid_targets_mean": 4532.3,
"valid_targets_min": 1109
},
{
"epoch": 6.930824571112341,
"grad_norm": 0.2437542812149771,
"learning_rate": 1.246313002096544e-08,
"loss": 0.0904,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.042215894907712936,
"step": 6265,
"valid_targets_mean": 5127.4,
"valid_targets_min": 2148
},
{
"epoch": 6.9363586054233535,
"grad_norm": 0.25411674940759044,
"learning_rate": 1.0592000056039997e-08,
"loss": 0.0867,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.048433512449264526,
"step": 6270,
"valid_targets_mean": 5093.4,
"valid_targets_min": 2249
},
{
"epoch": 6.941892639734366,
"grad_norm": 0.2424493912852331,
"learning_rate": 8.87294303535402e-09,
"loss": 0.0845,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04118829965591431,
"step": 6275,
"valid_targets_mean": 4493.6,
"valid_targets_min": 1745
},
{
"epoch": 6.947426674045379,
"grad_norm": 0.2320256567615275,
"learning_rate": 7.305972036941722e-09,
"loss": 0.0856,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04444737359881401,
"step": 6280,
"valid_targets_mean": 5985.7,
"valid_targets_min": 1785
},
{
"epoch": 6.952960708356391,
"grad_norm": 0.22506455612538573,
"learning_rate": 5.891098981805065e-09,
"loss": 0.0676,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.033273909240961075,
"step": 6285,
"valid_targets_mean": 4282.6,
"valid_targets_min": 1345
},
{
"epoch": 6.958494742667405,
"grad_norm": 0.22991189057710432,
"learning_rate": 4.628334633844933e-09,
"loss": 0.0625,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.030094504356384277,
"step": 6290,
"valid_targets_mean": 4043.1,
"valid_targets_min": 1453
},
{
"epoch": 6.9640287769784175,
"grad_norm": 0.23313445838803135,
"learning_rate": 3.5176885997634247e-09,
"loss": 0.0607,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.030323075130581856,
"step": 6295,
"valid_targets_mean": 3962.6,
"valid_targets_min": 1950
},
{
"epoch": 6.96956281128943,
"grad_norm": 0.23322994906696576,
"learning_rate": 2.5591693289928055e-09,
"loss": 0.0626,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03191163390874863,
"step": 6300,
"valid_targets_mean": 4089.9,
"valid_targets_min": 2225
},
{
"epoch": 6.975096845600443,
"grad_norm": 0.21610306998231182,
"learning_rate": 1.7527841136399937e-09,
"loss": 0.0618,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.031901244074106216,
"step": 6305,
"valid_targets_mean": 4647.0,
"valid_targets_min": 1720
},
{
"epoch": 6.980630879911455,
"grad_norm": 0.22791524852331468,
"learning_rate": 1.098539088422168e-09,
"loss": 0.0635,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03343750908970833,
"step": 6310,
"valid_targets_mean": 4220.0,
"valid_targets_min": 1637
},
{
"epoch": 6.986164914222468,
"grad_norm": 0.20503543897763343,
"learning_rate": 5.964392306223587e-10,
"loss": 0.063,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.029046183452010155,
"step": 6315,
"valid_targets_mean": 4065.2,
"valid_targets_min": 2020
},
{
"epoch": 6.991698948533481,
"grad_norm": 0.21235691685325675,
"learning_rate": 2.464883600539203e-10,
"loss": 0.0626,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.032713327556848526,
"step": 6320,
"valid_targets_mean": 4378.8,
"valid_targets_min": 2197
},
{
"epoch": 6.997232982844494,
"grad_norm": 0.21559969865151898,
"learning_rate": 4.8689139031665724e-11,
"loss": 0.0622,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03392450883984566,
"step": 6325,
"valid_targets_mean": 4250.2,
"valid_targets_min": 2029
},
{
"epoch": 7.0,
"step": 6328,
"total_flos": 1.7062153069854196e+19,
"train_loss": 0.0,
"train_runtime": 1.2427,
"train_samples_per_second": 488356.021,
"train_steps_per_second": 5092.029
}
],
"logging_steps": 5,
"max_steps": 6328,
"num_input_tokens_seen": 0,
"num_train_epochs": 7,
"save_steps": 750,
"stateful_callbacks": {
"TrainerControl": {
"args": {
"should_epoch_stop": false,
"should_evaluate": false,
"should_log": false,
"should_save": true,
"should_training_stop": true
},
"attributes": {}
}
},
"total_flos": 1.7062153069854196e+19,
"train_batch_size": 1,
"trial_name": null,
"trial_params": null
}