Files
nemotron-terminal-adapters_…/trainer_state.json
ModelHub XC ca39820f19 初始化项目,由ModelHub XC社区提供模型
Model: laion/nemotron-terminal-adapters_math__Qwen3-8B
Source: Original Platform
2026-05-09 22:28:36 +08:00

18693 lines
522 KiB
JSON

{
"best_global_step": null,
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 5.0,
"eval_steps": 500,
"global_step": 8475,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.0029498525073746312,
"grad_norm": 8.773958827225787,
"learning_rate": 1.886792452830189e-07,
"loss": 0.9616,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2874046862125397,
"step": 5,
"valid_targets_mean": 9206.2,
"valid_targets_min": 1498
},
{
"epoch": 0.0058997050147492625,
"grad_norm": 8.43130406707678,
"learning_rate": 4.2452830188679244e-07,
"loss": 0.9704,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2660023272037506,
"step": 10,
"valid_targets_mean": 8719.1,
"valid_targets_min": 1566
},
{
"epoch": 0.008849557522123894,
"grad_norm": 7.980973049789234,
"learning_rate": 6.603773584905661e-07,
"loss": 0.9721,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31450343132019043,
"step": 15,
"valid_targets_mean": 10767.6,
"valid_targets_min": 1915
},
{
"epoch": 0.011799410029498525,
"grad_norm": 6.592074179405163,
"learning_rate": 8.962264150943397e-07,
"loss": 0.939,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2821187973022461,
"step": 20,
"valid_targets_mean": 9179.4,
"valid_targets_min": 2072
},
{
"epoch": 0.014749262536873156,
"grad_norm": 5.341472842760085,
"learning_rate": 1.1320754716981133e-06,
"loss": 0.9091,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2598068118095398,
"step": 25,
"valid_targets_mean": 7131.3,
"valid_targets_min": 1543
},
{
"epoch": 0.017699115044247787,
"grad_norm": 3.625836875106732,
"learning_rate": 1.3679245283018869e-06,
"loss": 0.8698,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28657275438308716,
"step": 30,
"valid_targets_mean": 10059.4,
"valid_targets_min": 1912
},
{
"epoch": 0.02064896755162242,
"grad_norm": 2.4455995461055537,
"learning_rate": 1.6037735849056604e-06,
"loss": 0.8339,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25056618452072144,
"step": 35,
"valid_targets_mean": 8692.7,
"valid_targets_min": 2885
},
{
"epoch": 0.02359882005899705,
"grad_norm": 1.671129853566953,
"learning_rate": 1.839622641509434e-06,
"loss": 0.8019,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2268742173910141,
"step": 40,
"valid_targets_mean": 9311.7,
"valid_targets_min": 1693
},
{
"epoch": 0.02654867256637168,
"grad_norm": 1.4983532466868172,
"learning_rate": 2.075471698113208e-06,
"loss": 0.7848,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24425435066223145,
"step": 45,
"valid_targets_mean": 10148.1,
"valid_targets_min": 2792
},
{
"epoch": 0.029498525073746312,
"grad_norm": 1.1050377261180897,
"learning_rate": 2.3113207547169815e-06,
"loss": 0.7493,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2659146189689636,
"step": 50,
"valid_targets_mean": 10758.8,
"valid_targets_min": 2016
},
{
"epoch": 0.032448377581120944,
"grad_norm": 0.84276225776089,
"learning_rate": 2.547169811320755e-06,
"loss": 0.7382,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2542104721069336,
"step": 55,
"valid_targets_mean": 9880.1,
"valid_targets_min": 1422
},
{
"epoch": 0.035398230088495575,
"grad_norm": 0.7161442776999163,
"learning_rate": 2.7830188679245286e-06,
"loss": 0.7227,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2537986636161804,
"step": 60,
"valid_targets_mean": 10118.1,
"valid_targets_min": 1520
},
{
"epoch": 0.038348082595870206,
"grad_norm": 0.5278769329869252,
"learning_rate": 3.018867924528302e-06,
"loss": 0.698,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22161734104156494,
"step": 65,
"valid_targets_mean": 10715.5,
"valid_targets_min": 1277
},
{
"epoch": 0.04129793510324484,
"grad_norm": 0.48264794318692644,
"learning_rate": 3.2547169811320758e-06,
"loss": 0.6842,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23746953904628754,
"step": 70,
"valid_targets_mean": 10908.8,
"valid_targets_min": 689
},
{
"epoch": 0.04424778761061947,
"grad_norm": 0.3981010617617588,
"learning_rate": 3.4905660377358493e-06,
"loss": 0.6673,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26581302285194397,
"step": 75,
"valid_targets_mean": 11115.4,
"valid_targets_min": 2402
},
{
"epoch": 0.0471976401179941,
"grad_norm": 0.39704919780613845,
"learning_rate": 3.726415094339623e-06,
"loss": 0.6438,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24585619568824768,
"step": 80,
"valid_targets_mean": 11587.3,
"valid_targets_min": 3348
},
{
"epoch": 0.05014749262536873,
"grad_norm": 0.3005424445383612,
"learning_rate": 3.962264150943396e-06,
"loss": 0.629,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2160702645778656,
"step": 85,
"valid_targets_mean": 10653.8,
"valid_targets_min": 2047
},
{
"epoch": 0.05309734513274336,
"grad_norm": 0.2623859001613278,
"learning_rate": 4.19811320754717e-06,
"loss": 0.6211,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22089292109012604,
"step": 90,
"valid_targets_mean": 11910.6,
"valid_targets_min": 2312
},
{
"epoch": 0.05604719764011799,
"grad_norm": 0.27019333924019306,
"learning_rate": 4.4339622641509435e-06,
"loss": 0.6044,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1921449899673462,
"step": 95,
"valid_targets_mean": 9248.5,
"valid_targets_min": 1411
},
{
"epoch": 0.058997050147492625,
"grad_norm": 0.24358668760990093,
"learning_rate": 4.6698113207547175e-06,
"loss": 0.5878,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19868874549865723,
"step": 100,
"valid_targets_mean": 8963.3,
"valid_targets_min": 1519
},
{
"epoch": 0.061946902654867256,
"grad_norm": 0.2317817621237028,
"learning_rate": 4.905660377358491e-06,
"loss": 0.5809,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15674249827861786,
"step": 105,
"valid_targets_mean": 9282.0,
"valid_targets_min": 1902
},
{
"epoch": 0.06489675516224189,
"grad_norm": 0.21518580064198847,
"learning_rate": 5.1415094339622655e-06,
"loss": 0.5668,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15662211179733276,
"step": 110,
"valid_targets_mean": 8392.4,
"valid_targets_min": 2588
},
{
"epoch": 0.06784660766961652,
"grad_norm": 0.22321760855402145,
"learning_rate": 5.377358490566038e-06,
"loss": 0.5676,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20928239822387695,
"step": 115,
"valid_targets_mean": 11378.3,
"valid_targets_min": 2407
},
{
"epoch": 0.07079646017699115,
"grad_norm": 0.2365011327381435,
"learning_rate": 5.613207547169813e-06,
"loss": 0.5627,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18675848841667175,
"step": 120,
"valid_targets_mean": 9986.8,
"valid_targets_min": 2330
},
{
"epoch": 0.07374631268436578,
"grad_norm": 0.21095555367092353,
"learning_rate": 5.849056603773585e-06,
"loss": 0.5494,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20561310648918152,
"step": 125,
"valid_targets_mean": 13140.6,
"valid_targets_min": 2373
},
{
"epoch": 0.07669616519174041,
"grad_norm": 0.2254076492475572,
"learning_rate": 6.08490566037736e-06,
"loss": 0.5456,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16216091811656952,
"step": 130,
"valid_targets_mean": 9226.3,
"valid_targets_min": 1613
},
{
"epoch": 0.07964601769911504,
"grad_norm": 0.22864199872760177,
"learning_rate": 6.320754716981132e-06,
"loss": 0.5343,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15893808007240295,
"step": 135,
"valid_targets_mean": 8972.0,
"valid_targets_min": 2220
},
{
"epoch": 0.08259587020648967,
"grad_norm": 0.22340821685443538,
"learning_rate": 6.556603773584907e-06,
"loss": 0.5382,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15970075130462646,
"step": 140,
"valid_targets_mean": 9749.8,
"valid_targets_min": 1853
},
{
"epoch": 0.0855457227138643,
"grad_norm": 0.2105247063608589,
"learning_rate": 6.792452830188679e-06,
"loss": 0.5374,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2028973549604416,
"step": 145,
"valid_targets_mean": 12082.2,
"valid_targets_min": 1279
},
{
"epoch": 0.08849557522123894,
"grad_norm": 0.22580596780293535,
"learning_rate": 7.028301886792454e-06,
"loss": 0.5317,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16002820432186127,
"step": 150,
"valid_targets_mean": 10171.3,
"valid_targets_min": 2108
},
{
"epoch": 0.09144542772861357,
"grad_norm": 0.2797740687314117,
"learning_rate": 7.264150943396226e-06,
"loss": 0.5311,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16304832696914673,
"step": 155,
"valid_targets_mean": 8414.3,
"valid_targets_min": 2331
},
{
"epoch": 0.0943952802359882,
"grad_norm": 0.24060452477660244,
"learning_rate": 7.500000000000001e-06,
"loss": 0.525,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.168437197804451,
"step": 160,
"valid_targets_mean": 9946.0,
"valid_targets_min": 2071
},
{
"epoch": 0.09734513274336283,
"grad_norm": 0.26990784653362826,
"learning_rate": 7.735849056603775e-06,
"loss": 0.5303,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23207911849021912,
"step": 165,
"valid_targets_mean": 11584.8,
"valid_targets_min": 2526
},
{
"epoch": 0.10029498525073746,
"grad_norm": 0.21813379853235298,
"learning_rate": 7.971698113207547e-06,
"loss": 0.5219,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17449553310871124,
"step": 170,
"valid_targets_mean": 11271.9,
"valid_targets_min": 2150
},
{
"epoch": 0.10324483775811209,
"grad_norm": 0.2177784266608873,
"learning_rate": 8.207547169811321e-06,
"loss": 0.5211,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1942562758922577,
"step": 175,
"valid_targets_mean": 11034.4,
"valid_targets_min": 1379
},
{
"epoch": 0.10619469026548672,
"grad_norm": 0.2365221311955703,
"learning_rate": 8.443396226415095e-06,
"loss": 0.5156,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.173548623919487,
"step": 180,
"valid_targets_mean": 11233.3,
"valid_targets_min": 1872
},
{
"epoch": 0.10914454277286136,
"grad_norm": 0.22263607666515303,
"learning_rate": 8.67924528301887e-06,
"loss": 0.5137,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.176674023270607,
"step": 185,
"valid_targets_mean": 10453.3,
"valid_targets_min": 1094
},
{
"epoch": 0.11209439528023599,
"grad_norm": 0.22259600474883798,
"learning_rate": 8.915094339622642e-06,
"loss": 0.5103,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21244749426841736,
"step": 190,
"valid_targets_mean": 13592.8,
"valid_targets_min": 2893
},
{
"epoch": 0.11504424778761062,
"grad_norm": 0.23853918792073867,
"learning_rate": 9.150943396226416e-06,
"loss": 0.5119,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15338359773159027,
"step": 195,
"valid_targets_mean": 9848.4,
"valid_targets_min": 2305
},
{
"epoch": 0.11799410029498525,
"grad_norm": 0.24544705784022192,
"learning_rate": 9.38679245283019e-06,
"loss": 0.5113,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15049920976161957,
"step": 200,
"valid_targets_mean": 8824.9,
"valid_targets_min": 1762
},
{
"epoch": 0.12094395280235988,
"grad_norm": 0.23996923684824645,
"learning_rate": 9.622641509433963e-06,
"loss": 0.5036,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17622515559196472,
"step": 205,
"valid_targets_mean": 10279.9,
"valid_targets_min": 993
},
{
"epoch": 0.12389380530973451,
"grad_norm": 0.2356178723103165,
"learning_rate": 9.858490566037736e-06,
"loss": 0.5047,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16885659098625183,
"step": 210,
"valid_targets_mean": 9878.6,
"valid_targets_min": 1434
},
{
"epoch": 0.12684365781710916,
"grad_norm": 0.2593343578467735,
"learning_rate": 1.0094339622641511e-05,
"loss": 0.5052,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15777814388275146,
"step": 215,
"valid_targets_mean": 9382.0,
"valid_targets_min": 1289
},
{
"epoch": 0.12979351032448377,
"grad_norm": 0.23853635794945394,
"learning_rate": 1.0330188679245284e-05,
"loss": 0.5059,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1759573519229889,
"step": 220,
"valid_targets_mean": 9724.2,
"valid_targets_min": 2358
},
{
"epoch": 0.13274336283185842,
"grad_norm": 0.25629620309918427,
"learning_rate": 1.0566037735849058e-05,
"loss": 0.5033,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17160122096538544,
"step": 225,
"valid_targets_mean": 11027.6,
"valid_targets_min": 1069
},
{
"epoch": 0.13569321533923304,
"grad_norm": 0.28852388125039813,
"learning_rate": 1.0801886792452832e-05,
"loss": 0.499,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1474302113056183,
"step": 230,
"valid_targets_mean": 9196.5,
"valid_targets_min": 536
},
{
"epoch": 0.13864306784660768,
"grad_norm": 0.24690849305589715,
"learning_rate": 1.1037735849056606e-05,
"loss": 0.5006,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15746231377124786,
"step": 235,
"valid_targets_mean": 9754.9,
"valid_targets_min": 1806
},
{
"epoch": 0.1415929203539823,
"grad_norm": 0.28233830897850076,
"learning_rate": 1.1273584905660378e-05,
"loss": 0.5022,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1537265032529831,
"step": 240,
"valid_targets_mean": 9171.2,
"valid_targets_min": 1140
},
{
"epoch": 0.14454277286135694,
"grad_norm": 0.25448817250054345,
"learning_rate": 1.1509433962264152e-05,
"loss": 0.4989,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16555047035217285,
"step": 245,
"valid_targets_mean": 9798.3,
"valid_targets_min": 1344
},
{
"epoch": 0.14749262536873156,
"grad_norm": 0.27603293860374156,
"learning_rate": 1.1745283018867926e-05,
"loss": 0.5022,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15127146244049072,
"step": 250,
"valid_targets_mean": 8997.8,
"valid_targets_min": 2398
},
{
"epoch": 0.1504424778761062,
"grad_norm": 0.28094160412298935,
"learning_rate": 1.19811320754717e-05,
"loss": 0.5008,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18154668807983398,
"step": 255,
"valid_targets_mean": 10034.7,
"valid_targets_min": 1739
},
{
"epoch": 0.15339233038348082,
"grad_norm": 0.272720858377614,
"learning_rate": 1.2216981132075472e-05,
"loss": 0.4942,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14723987877368927,
"step": 260,
"valid_targets_mean": 9813.8,
"valid_targets_min": 1050
},
{
"epoch": 0.15634218289085547,
"grad_norm": 0.24896110011232206,
"learning_rate": 1.2452830188679246e-05,
"loss": 0.4967,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15721940994262695,
"step": 265,
"valid_targets_mean": 10142.0,
"valid_targets_min": 2362
},
{
"epoch": 0.1592920353982301,
"grad_norm": 0.2384263642596385,
"learning_rate": 1.268867924528302e-05,
"loss": 0.4927,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16213515400886536,
"step": 270,
"valid_targets_mean": 10334.2,
"valid_targets_min": 1215
},
{
"epoch": 0.16224188790560473,
"grad_norm": 0.26632949187377725,
"learning_rate": 1.2924528301886794e-05,
"loss": 0.4914,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13655009865760803,
"step": 275,
"valid_targets_mean": 7946.3,
"valid_targets_min": 1646
},
{
"epoch": 0.16519174041297935,
"grad_norm": 0.2848379528640083,
"learning_rate": 1.3160377358490568e-05,
"loss": 0.4907,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16915015876293182,
"step": 280,
"valid_targets_mean": 10197.9,
"valid_targets_min": 2517
},
{
"epoch": 0.168141592920354,
"grad_norm": 0.2503018600734144,
"learning_rate": 1.339622641509434e-05,
"loss": 0.5004,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1548536717891693,
"step": 285,
"valid_targets_mean": 9506.9,
"valid_targets_min": 2134
},
{
"epoch": 0.1710914454277286,
"grad_norm": 0.24628942797179826,
"learning_rate": 1.3632075471698114e-05,
"loss": 0.4874,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15937039256095886,
"step": 290,
"valid_targets_mean": 10417.7,
"valid_targets_min": 1786
},
{
"epoch": 0.17404129793510326,
"grad_norm": 0.27090595503730375,
"learning_rate": 1.3867924528301888e-05,
"loss": 0.4737,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16793963313102722,
"step": 295,
"valid_targets_mean": 10820.2,
"valid_targets_min": 2213
},
{
"epoch": 0.17699115044247787,
"grad_norm": 0.26417038077590604,
"learning_rate": 1.4103773584905662e-05,
"loss": 0.4866,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18323713541030884,
"step": 300,
"valid_targets_mean": 12955.4,
"valid_targets_min": 1467
},
{
"epoch": 0.17994100294985252,
"grad_norm": 0.23601605137120854,
"learning_rate": 1.4339622641509435e-05,
"loss": 0.4893,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1528908610343933,
"step": 305,
"valid_targets_mean": 10078.7,
"valid_targets_min": 1501
},
{
"epoch": 0.18289085545722714,
"grad_norm": 0.2531068673705301,
"learning_rate": 1.4575471698113209e-05,
"loss": 0.4851,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13879773020744324,
"step": 310,
"valid_targets_mean": 8772.9,
"valid_targets_min": 1174
},
{
"epoch": 0.18584070796460178,
"grad_norm": 0.27397534098938575,
"learning_rate": 1.4811320754716983e-05,
"loss": 0.4808,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16207556426525116,
"step": 315,
"valid_targets_mean": 10604.9,
"valid_targets_min": 1801
},
{
"epoch": 0.1887905604719764,
"grad_norm": 0.2267842788550988,
"learning_rate": 1.5047169811320757e-05,
"loss": 0.4775,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14752934873104095,
"step": 320,
"valid_targets_mean": 8825.4,
"valid_targets_min": 2007
},
{
"epoch": 0.19174041297935104,
"grad_norm": 0.2499831182134859,
"learning_rate": 1.5283018867924532e-05,
"loss": 0.476,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15672816336154938,
"step": 325,
"valid_targets_mean": 10086.0,
"valid_targets_min": 2308
},
{
"epoch": 0.19469026548672566,
"grad_norm": 0.2631441971415124,
"learning_rate": 1.55188679245283e-05,
"loss": 0.479,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14103585481643677,
"step": 330,
"valid_targets_mean": 9196.3,
"valid_targets_min": 2358
},
{
"epoch": 0.1976401179941003,
"grad_norm": 0.2918399531224374,
"learning_rate": 1.5754716981132077e-05,
"loss": 0.4852,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13344430923461914,
"step": 335,
"valid_targets_mean": 8499.4,
"valid_targets_min": 1309
},
{
"epoch": 0.20058997050147492,
"grad_norm": 0.2984964884465926,
"learning_rate": 1.599056603773585e-05,
"loss": 0.4832,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16676054894924164,
"step": 340,
"valid_targets_mean": 9956.7,
"valid_targets_min": 1540
},
{
"epoch": 0.20353982300884957,
"grad_norm": 0.27016950611621293,
"learning_rate": 1.6226415094339625e-05,
"loss": 0.4772,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1715359091758728,
"step": 345,
"valid_targets_mean": 10383.4,
"valid_targets_min": 2501
},
{
"epoch": 0.20648967551622419,
"grad_norm": 0.246612135038914,
"learning_rate": 1.6462264150943397e-05,
"loss": 0.4828,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1632922887802124,
"step": 350,
"valid_targets_mean": 9967.4,
"valid_targets_min": 1821
},
{
"epoch": 0.20943952802359883,
"grad_norm": 0.26017611465367824,
"learning_rate": 1.669811320754717e-05,
"loss": 0.4765,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15242213010787964,
"step": 355,
"valid_targets_mean": 9924.0,
"valid_targets_min": 1816
},
{
"epoch": 0.21238938053097345,
"grad_norm": 0.251691625498555,
"learning_rate": 1.6933962264150945e-05,
"loss": 0.471,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16618210077285767,
"step": 360,
"valid_targets_mean": 10049.2,
"valid_targets_min": 1217
},
{
"epoch": 0.2153392330383481,
"grad_norm": 0.2608799009369842,
"learning_rate": 1.716981132075472e-05,
"loss": 0.4829,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1781197488307953,
"step": 365,
"valid_targets_mean": 12419.6,
"valid_targets_min": 2271
},
{
"epoch": 0.2182890855457227,
"grad_norm": 0.2709855931241016,
"learning_rate": 1.740566037735849e-05,
"loss": 0.4677,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18040911853313446,
"step": 370,
"valid_targets_mean": 10423.2,
"valid_targets_min": 1900
},
{
"epoch": 0.22123893805309736,
"grad_norm": 0.2922486386967908,
"learning_rate": 1.7641509433962265e-05,
"loss": 0.4685,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1437935084104538,
"step": 375,
"valid_targets_mean": 8453.0,
"valid_targets_min": 1408
},
{
"epoch": 0.22418879056047197,
"grad_norm": 0.2509932527846505,
"learning_rate": 1.7877358490566038e-05,
"loss": 0.4788,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15098921954631805,
"step": 380,
"valid_targets_mean": 9931.7,
"valid_targets_min": 2305
},
{
"epoch": 0.22713864306784662,
"grad_norm": 0.27496741475909753,
"learning_rate": 1.8113207547169813e-05,
"loss": 0.469,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17977483570575714,
"step": 385,
"valid_targets_mean": 10178.9,
"valid_targets_min": 1039
},
{
"epoch": 0.23008849557522124,
"grad_norm": 0.33037536151215885,
"learning_rate": 1.834905660377359e-05,
"loss": 0.4732,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17215262353420258,
"step": 390,
"valid_targets_mean": 10581.9,
"valid_targets_min": 1697
},
{
"epoch": 0.23303834808259588,
"grad_norm": 0.2590333044167339,
"learning_rate": 1.8584905660377358e-05,
"loss": 0.4833,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1654370129108429,
"step": 395,
"valid_targets_mean": 10485.4,
"valid_targets_min": 2081
},
{
"epoch": 0.2359882005899705,
"grad_norm": 0.25165290674930346,
"learning_rate": 1.8820754716981133e-05,
"loss": 0.4738,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16054049134254456,
"step": 400,
"valid_targets_mean": 10634.4,
"valid_targets_min": 1494
},
{
"epoch": 0.23893805309734514,
"grad_norm": 0.2558867155213945,
"learning_rate": 1.905660377358491e-05,
"loss": 0.4624,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14743725955486298,
"step": 405,
"valid_targets_mean": 9134.9,
"valid_targets_min": 1983
},
{
"epoch": 0.24188790560471976,
"grad_norm": 0.320593320482016,
"learning_rate": 1.929245283018868e-05,
"loss": 0.4771,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13047058880329132,
"step": 410,
"valid_targets_mean": 7631.4,
"valid_targets_min": 1308
},
{
"epoch": 0.2448377581120944,
"grad_norm": 0.249814248566448,
"learning_rate": 1.9528301886792454e-05,
"loss": 0.4706,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15469786524772644,
"step": 415,
"valid_targets_mean": 11488.8,
"valid_targets_min": 3111
},
{
"epoch": 0.24778761061946902,
"grad_norm": 0.2657696546498897,
"learning_rate": 1.9764150943396226e-05,
"loss": 0.4683,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13970687985420227,
"step": 420,
"valid_targets_mean": 9848.1,
"valid_targets_min": 1539
},
{
"epoch": 0.25073746312684364,
"grad_norm": 0.26882223733506905,
"learning_rate": 2e-05,
"loss": 0.4648,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17859773337841034,
"step": 425,
"valid_targets_mean": 12024.1,
"valid_targets_min": 2727
},
{
"epoch": 0.2536873156342183,
"grad_norm": 0.246210269985762,
"learning_rate": 2.0235849056603777e-05,
"loss": 0.4701,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15420570969581604,
"step": 430,
"valid_targets_mean": 9545.0,
"valid_targets_min": 1882
},
{
"epoch": 0.25663716814159293,
"grad_norm": 0.29785060543263786,
"learning_rate": 2.047169811320755e-05,
"loss": 0.4718,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1376991719007492,
"step": 435,
"valid_targets_mean": 8259.6,
"valid_targets_min": 1045
},
{
"epoch": 0.25958702064896755,
"grad_norm": 0.28985379658927735,
"learning_rate": 2.0707547169811325e-05,
"loss": 0.4684,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1606501042842865,
"step": 440,
"valid_targets_mean": 10127.1,
"valid_targets_min": 1797
},
{
"epoch": 0.26253687315634217,
"grad_norm": 0.2814165129117154,
"learning_rate": 2.0943396226415098e-05,
"loss": 0.4692,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14782124757766724,
"step": 445,
"valid_targets_mean": 8850.4,
"valid_targets_min": 1524
},
{
"epoch": 0.26548672566371684,
"grad_norm": 0.2797668741402931,
"learning_rate": 2.1179245283018866e-05,
"loss": 0.4714,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12928162515163422,
"step": 450,
"valid_targets_mean": 8547.2,
"valid_targets_min": 1657
},
{
"epoch": 0.26843657817109146,
"grad_norm": 0.2528656289681847,
"learning_rate": 2.1415094339622642e-05,
"loss": 0.4636,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13063043355941772,
"step": 455,
"valid_targets_mean": 7498.9,
"valid_targets_min": 2006
},
{
"epoch": 0.2713864306784661,
"grad_norm": 0.2581926598105123,
"learning_rate": 2.1650943396226414e-05,
"loss": 0.4667,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16427075862884521,
"step": 460,
"valid_targets_mean": 10987.5,
"valid_targets_min": 2508
},
{
"epoch": 0.2743362831858407,
"grad_norm": 0.2823206577169872,
"learning_rate": 2.188679245283019e-05,
"loss": 0.473,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14611220359802246,
"step": 465,
"valid_targets_mean": 10292.0,
"valid_targets_min": 2280
},
{
"epoch": 0.27728613569321536,
"grad_norm": 0.26695133201537186,
"learning_rate": 2.2122641509433966e-05,
"loss": 0.468,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15307700634002686,
"step": 470,
"valid_targets_mean": 10601.8,
"valid_targets_min": 1396
},
{
"epoch": 0.28023598820059,
"grad_norm": 0.28255841738322507,
"learning_rate": 2.2358490566037738e-05,
"loss": 0.4624,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1726362109184265,
"step": 475,
"valid_targets_mean": 9942.6,
"valid_targets_min": 2133
},
{
"epoch": 0.2831858407079646,
"grad_norm": 0.2694490289689112,
"learning_rate": 2.2594339622641514e-05,
"loss": 0.4713,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1771799623966217,
"step": 480,
"valid_targets_mean": 9759.4,
"valid_targets_min": 1581
},
{
"epoch": 0.2861356932153392,
"grad_norm": 0.26320630311881227,
"learning_rate": 2.2830188679245286e-05,
"loss": 0.4658,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18050238490104675,
"step": 485,
"valid_targets_mean": 10620.5,
"valid_targets_min": 1461
},
{
"epoch": 0.2890855457227139,
"grad_norm": 0.2821384330941035,
"learning_rate": 2.306603773584906e-05,
"loss": 0.4715,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13854411244392395,
"step": 490,
"valid_targets_mean": 8787.5,
"valid_targets_min": 2197
},
{
"epoch": 0.2920353982300885,
"grad_norm": 0.2589089232000087,
"learning_rate": 2.330188679245283e-05,
"loss": 0.4677,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13725772500038147,
"step": 495,
"valid_targets_mean": 9077.8,
"valid_targets_min": 2800
},
{
"epoch": 0.2949852507374631,
"grad_norm": 0.27484048405379097,
"learning_rate": 2.3537735849056603e-05,
"loss": 0.4649,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16023467481136322,
"step": 500,
"valid_targets_mean": 9941.8,
"valid_targets_min": 2260
},
{
"epoch": 0.29793510324483774,
"grad_norm": 0.27097915398189687,
"learning_rate": 2.377358490566038e-05,
"loss": 0.4688,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15327778458595276,
"step": 505,
"valid_targets_mean": 10138.6,
"valid_targets_min": 1655
},
{
"epoch": 0.3008849557522124,
"grad_norm": 0.3090554478712165,
"learning_rate": 2.4009433962264154e-05,
"loss": 0.4575,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1643308848142624,
"step": 510,
"valid_targets_mean": 9809.2,
"valid_targets_min": 1817
},
{
"epoch": 0.30383480825958703,
"grad_norm": 0.26976590724785876,
"learning_rate": 2.4245283018867926e-05,
"loss": 0.4662,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18249952793121338,
"step": 515,
"valid_targets_mean": 11053.2,
"valid_targets_min": 1891
},
{
"epoch": 0.30678466076696165,
"grad_norm": 0.30412168245675625,
"learning_rate": 2.4481132075471702e-05,
"loss": 0.4558,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17874681949615479,
"step": 520,
"valid_targets_mean": 10950.2,
"valid_targets_min": 2265
},
{
"epoch": 0.30973451327433627,
"grad_norm": 0.2436153196597148,
"learning_rate": 2.4716981132075474e-05,
"loss": 0.4625,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1472557932138443,
"step": 525,
"valid_targets_mean": 9727.5,
"valid_targets_min": 1294
},
{
"epoch": 0.31268436578171094,
"grad_norm": 0.25885412101342653,
"learning_rate": 2.495283018867925e-05,
"loss": 0.468,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16035309433937073,
"step": 530,
"valid_targets_mean": 10823.4,
"valid_targets_min": 2542
},
{
"epoch": 0.31563421828908556,
"grad_norm": 0.30705913319043077,
"learning_rate": 2.5188679245283022e-05,
"loss": 0.4593,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15604931116104126,
"step": 535,
"valid_targets_mean": 10381.6,
"valid_targets_min": 1504
},
{
"epoch": 0.3185840707964602,
"grad_norm": 0.28099029262967157,
"learning_rate": 2.542452830188679e-05,
"loss": 0.4574,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17848971486091614,
"step": 540,
"valid_targets_mean": 10812.6,
"valid_targets_min": 1055
},
{
"epoch": 0.3215339233038348,
"grad_norm": 0.28014050592117723,
"learning_rate": 2.5660377358490567e-05,
"loss": 0.4637,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14001238346099854,
"step": 545,
"valid_targets_mean": 9040.8,
"valid_targets_min": 1130
},
{
"epoch": 0.32448377581120946,
"grad_norm": 0.3027064554505464,
"learning_rate": 2.5896226415094343e-05,
"loss": 0.4597,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1356821060180664,
"step": 550,
"valid_targets_mean": 9655.9,
"valid_targets_min": 1410
},
{
"epoch": 0.3274336283185841,
"grad_norm": 0.24986437223369426,
"learning_rate": 2.6132075471698115e-05,
"loss": 0.4604,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13323450088500977,
"step": 555,
"valid_targets_mean": 8905.6,
"valid_targets_min": 1830
},
{
"epoch": 0.3303834808259587,
"grad_norm": 0.27829745186311433,
"learning_rate": 2.636792452830189e-05,
"loss": 0.4599,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13928677141666412,
"step": 560,
"valid_targets_mean": 9882.5,
"valid_targets_min": 2408
},
{
"epoch": 0.3333333333333333,
"grad_norm": 0.2716435864042277,
"learning_rate": 2.6603773584905663e-05,
"loss": 0.4602,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14196351170539856,
"step": 565,
"valid_targets_mean": 9463.4,
"valid_targets_min": 1659
},
{
"epoch": 0.336283185840708,
"grad_norm": 0.3535835553630807,
"learning_rate": 2.683962264150944e-05,
"loss": 0.4614,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14128056168556213,
"step": 570,
"valid_targets_mean": 11038.2,
"valid_targets_min": 1531
},
{
"epoch": 0.3392330383480826,
"grad_norm": 0.33471177982730127,
"learning_rate": 2.707547169811321e-05,
"loss": 0.4572,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1605977863073349,
"step": 575,
"valid_targets_mean": 10074.7,
"valid_targets_min": 2085
},
{
"epoch": 0.3421828908554572,
"grad_norm": 0.27189834395930973,
"learning_rate": 2.731132075471698e-05,
"loss": 0.4621,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13230662047863007,
"step": 580,
"valid_targets_mean": 10108.6,
"valid_targets_min": 1642
},
{
"epoch": 0.34513274336283184,
"grad_norm": 0.32866294091387294,
"learning_rate": 2.7547169811320755e-05,
"loss": 0.4626,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1503252238035202,
"step": 585,
"valid_targets_mean": 9673.6,
"valid_targets_min": 997
},
{
"epoch": 0.3480825958702065,
"grad_norm": 0.2960662895794109,
"learning_rate": 2.7783018867924528e-05,
"loss": 0.456,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13039669394493103,
"step": 590,
"valid_targets_mean": 8708.4,
"valid_targets_min": 1573
},
{
"epoch": 0.35103244837758113,
"grad_norm": 0.26573228974936325,
"learning_rate": 2.8018867924528303e-05,
"loss": 0.4605,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17490148544311523,
"step": 595,
"valid_targets_mean": 12304.2,
"valid_targets_min": 1814
},
{
"epoch": 0.35398230088495575,
"grad_norm": 0.26907409187290865,
"learning_rate": 2.825471698113208e-05,
"loss": 0.4649,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15238738059997559,
"step": 600,
"valid_targets_mean": 11132.8,
"valid_targets_min": 1200
},
{
"epoch": 0.35693215339233036,
"grad_norm": 0.2774500653590238,
"learning_rate": 2.849056603773585e-05,
"loss": 0.468,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16456542909145355,
"step": 605,
"valid_targets_mean": 10237.6,
"valid_targets_min": 950
},
{
"epoch": 0.35988200589970504,
"grad_norm": 0.25930731596289175,
"learning_rate": 2.8726415094339627e-05,
"loss": 0.46,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13452622294425964,
"step": 610,
"valid_targets_mean": 10417.7,
"valid_targets_min": 2034
},
{
"epoch": 0.36283185840707965,
"grad_norm": 0.24490820051848358,
"learning_rate": 2.89622641509434e-05,
"loss": 0.4486,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15420666337013245,
"step": 615,
"valid_targets_mean": 11726.6,
"valid_targets_min": 1312
},
{
"epoch": 0.36578171091445427,
"grad_norm": 0.2982872806748629,
"learning_rate": 2.9198113207547175e-05,
"loss": 0.4552,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1296735554933548,
"step": 620,
"valid_targets_mean": 8954.2,
"valid_targets_min": 1876
},
{
"epoch": 0.3687315634218289,
"grad_norm": 0.3250742977113956,
"learning_rate": 2.9433962264150944e-05,
"loss": 0.4613,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17718186974525452,
"step": 625,
"valid_targets_mean": 10257.4,
"valid_targets_min": 2939
},
{
"epoch": 0.37168141592920356,
"grad_norm": 0.26652767339475386,
"learning_rate": 2.9669811320754716e-05,
"loss": 0.4555,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14411255717277527,
"step": 630,
"valid_targets_mean": 9281.1,
"valid_targets_min": 2123
},
{
"epoch": 0.3746312684365782,
"grad_norm": 0.26668461534256777,
"learning_rate": 2.9905660377358492e-05,
"loss": 0.4559,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16539090871810913,
"step": 635,
"valid_targets_mean": 9339.8,
"valid_targets_min": 2558
},
{
"epoch": 0.3775811209439528,
"grad_norm": 0.29462928332592325,
"learning_rate": 3.0141509433962268e-05,
"loss": 0.4579,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15282703936100006,
"step": 640,
"valid_targets_mean": 9360.2,
"valid_targets_min": 2415
},
{
"epoch": 0.3805309734513274,
"grad_norm": 0.2516067578464611,
"learning_rate": 3.037735849056604e-05,
"loss": 0.4552,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1402677595615387,
"step": 645,
"valid_targets_mean": 8395.6,
"valid_targets_min": 1630
},
{
"epoch": 0.3834808259587021,
"grad_norm": 0.2498210260731851,
"learning_rate": 3.061320754716981e-05,
"loss": 0.4488,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17535334825515747,
"step": 650,
"valid_targets_mean": 12708.2,
"valid_targets_min": 3373
},
{
"epoch": 0.3864306784660767,
"grad_norm": 0.21973934537102108,
"learning_rate": 3.084905660377359e-05,
"loss": 0.4468,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14050549268722534,
"step": 655,
"valid_targets_mean": 11102.9,
"valid_targets_min": 2383
},
{
"epoch": 0.3893805309734513,
"grad_norm": 0.270755988116607,
"learning_rate": 3.1084905660377363e-05,
"loss": 0.4565,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1484229564666748,
"step": 660,
"valid_targets_mean": 9429.2,
"valid_targets_min": 1243
},
{
"epoch": 0.39233038348082594,
"grad_norm": 0.29290363039429895,
"learning_rate": 3.1320754716981136e-05,
"loss": 0.4508,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17251214385032654,
"step": 665,
"valid_targets_mean": 12589.8,
"valid_targets_min": 1293
},
{
"epoch": 0.3952802359882006,
"grad_norm": 0.2937360725551836,
"learning_rate": 3.155660377358491e-05,
"loss": 0.4512,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14358994364738464,
"step": 670,
"valid_targets_mean": 9731.8,
"valid_targets_min": 1129
},
{
"epoch": 0.39823008849557523,
"grad_norm": 0.3156882903522341,
"learning_rate": 3.179245283018868e-05,
"loss": 0.4506,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11705832928419113,
"step": 675,
"valid_targets_mean": 8218.8,
"valid_targets_min": 595
},
{
"epoch": 0.40117994100294985,
"grad_norm": 0.2562761263862917,
"learning_rate": 3.202830188679245e-05,
"loss": 0.4566,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14067499339580536,
"step": 680,
"valid_targets_mean": 9081.4,
"valid_targets_min": 888
},
{
"epoch": 0.40412979351032446,
"grad_norm": 0.27166104573986943,
"learning_rate": 3.226415094339623e-05,
"loss": 0.4478,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15120014548301697,
"step": 685,
"valid_targets_mean": 10127.8,
"valid_targets_min": 1547
},
{
"epoch": 0.40707964601769914,
"grad_norm": 0.25598816634560684,
"learning_rate": 3.2500000000000004e-05,
"loss": 0.4501,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14215946197509766,
"step": 690,
"valid_targets_mean": 9777.3,
"valid_targets_min": 1666
},
{
"epoch": 0.41002949852507375,
"grad_norm": 0.25719286137409414,
"learning_rate": 3.2735849056603776e-05,
"loss": 0.4504,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13619284331798553,
"step": 695,
"valid_targets_mean": 8813.1,
"valid_targets_min": 2184
},
{
"epoch": 0.41297935103244837,
"grad_norm": 0.2896922208973931,
"learning_rate": 3.297169811320755e-05,
"loss": 0.4582,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1457536220550537,
"step": 700,
"valid_targets_mean": 9679.6,
"valid_targets_min": 2445
},
{
"epoch": 0.415929203539823,
"grad_norm": 0.23727416292578302,
"learning_rate": 3.320754716981133e-05,
"loss": 0.4565,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14196723699569702,
"step": 705,
"valid_targets_mean": 10510.3,
"valid_targets_min": 1998
},
{
"epoch": 0.41887905604719766,
"grad_norm": 0.30186788865389924,
"learning_rate": 3.34433962264151e-05,
"loss": 0.454,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2078678011894226,
"step": 710,
"valid_targets_mean": 12465.5,
"valid_targets_min": 1710
},
{
"epoch": 0.4218289085545723,
"grad_norm": 0.2708370944564039,
"learning_rate": 3.367924528301887e-05,
"loss": 0.4493,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17721615731716156,
"step": 715,
"valid_targets_mean": 10231.8,
"valid_targets_min": 2259
},
{
"epoch": 0.4247787610619469,
"grad_norm": 0.2350755624225508,
"learning_rate": 3.3915094339622644e-05,
"loss": 0.4535,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1684504598379135,
"step": 720,
"valid_targets_mean": 13320.7,
"valid_targets_min": 1376
},
{
"epoch": 0.4277286135693215,
"grad_norm": 0.2522551418925396,
"learning_rate": 3.415094339622642e-05,
"loss": 0.4443,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1219257265329361,
"step": 725,
"valid_targets_mean": 8426.0,
"valid_targets_min": 1654
},
{
"epoch": 0.4306784660766962,
"grad_norm": 0.2388555987026393,
"learning_rate": 3.438679245283019e-05,
"loss": 0.4497,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13714396953582764,
"step": 730,
"valid_targets_mean": 8610.3,
"valid_targets_min": 2335
},
{
"epoch": 0.4336283185840708,
"grad_norm": 0.2582456062781972,
"learning_rate": 3.462264150943397e-05,
"loss": 0.449,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14914974570274353,
"step": 735,
"valid_targets_mean": 9733.9,
"valid_targets_min": 2604
},
{
"epoch": 0.4365781710914454,
"grad_norm": 0.2700913343244362,
"learning_rate": 3.485849056603774e-05,
"loss": 0.4458,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12170357257127762,
"step": 740,
"valid_targets_mean": 7887.3,
"valid_targets_min": 961
},
{
"epoch": 0.43952802359882004,
"grad_norm": 0.222415816081342,
"learning_rate": 3.509433962264151e-05,
"loss": 0.4508,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17051385343074799,
"step": 745,
"valid_targets_mean": 12008.4,
"valid_targets_min": 3631
},
{
"epoch": 0.4424778761061947,
"grad_norm": 0.25946960551263726,
"learning_rate": 3.5330188679245285e-05,
"loss": 0.4559,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1592746078968048,
"step": 750,
"valid_targets_mean": 11155.2,
"valid_targets_min": 2731
},
{
"epoch": 0.44542772861356933,
"grad_norm": 0.25561757233854515,
"learning_rate": 3.5566037735849064e-05,
"loss": 0.4428,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1529407799243927,
"step": 755,
"valid_targets_mean": 10674.4,
"valid_targets_min": 1317
},
{
"epoch": 0.44837758112094395,
"grad_norm": 0.24513783517340867,
"learning_rate": 3.580188679245283e-05,
"loss": 0.4481,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17502880096435547,
"step": 760,
"valid_targets_mean": 11136.4,
"valid_targets_min": 1890
},
{
"epoch": 0.45132743362831856,
"grad_norm": 0.28955720780331523,
"learning_rate": 3.603773584905661e-05,
"loss": 0.4513,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18724988400936127,
"step": 765,
"valid_targets_mean": 12538.8,
"valid_targets_min": 1856
},
{
"epoch": 0.45427728613569324,
"grad_norm": 0.27683507884518554,
"learning_rate": 3.627358490566038e-05,
"loss": 0.4577,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17236828804016113,
"step": 770,
"valid_targets_mean": 11351.3,
"valid_targets_min": 1738
},
{
"epoch": 0.45722713864306785,
"grad_norm": 0.26370920620085647,
"learning_rate": 3.650943396226415e-05,
"loss": 0.4472,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12365929037332535,
"step": 775,
"valid_targets_mean": 9638.6,
"valid_targets_min": 2769
},
{
"epoch": 0.46017699115044247,
"grad_norm": 0.2492816067379124,
"learning_rate": 3.6745283018867925e-05,
"loss": 0.4494,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15394821763038635,
"step": 780,
"valid_targets_mean": 10217.3,
"valid_targets_min": 1867
},
{
"epoch": 0.4631268436578171,
"grad_norm": 0.2662678776277218,
"learning_rate": 3.6981132075471704e-05,
"loss": 0.4454,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1481439769268036,
"step": 785,
"valid_targets_mean": 10830.1,
"valid_targets_min": 2056
},
{
"epoch": 0.46607669616519176,
"grad_norm": 0.27166721966840673,
"learning_rate": 3.721698113207548e-05,
"loss": 0.4433,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11750192940235138,
"step": 790,
"valid_targets_mean": 8065.7,
"valid_targets_min": 2250
},
{
"epoch": 0.4690265486725664,
"grad_norm": 0.2802680400873714,
"learning_rate": 3.745283018867925e-05,
"loss": 0.4492,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14400440454483032,
"step": 795,
"valid_targets_mean": 10655.2,
"valid_targets_min": 2555
},
{
"epoch": 0.471976401179941,
"grad_norm": 0.25574385214080575,
"learning_rate": 3.768867924528302e-05,
"loss": 0.4452,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1591102033853531,
"step": 800,
"valid_targets_mean": 11071.5,
"valid_targets_min": 860
},
{
"epoch": 0.4749262536873156,
"grad_norm": 0.2337795901319177,
"learning_rate": 3.7924528301886794e-05,
"loss": 0.4413,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1704762876033783,
"step": 805,
"valid_targets_mean": 11408.9,
"valid_targets_min": 2015
},
{
"epoch": 0.4778761061946903,
"grad_norm": 0.21354425291394666,
"learning_rate": 3.8160377358490566e-05,
"loss": 0.4471,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12261828780174255,
"step": 810,
"valid_targets_mean": 9568.1,
"valid_targets_min": 1913
},
{
"epoch": 0.4808259587020649,
"grad_norm": 0.27920147232288245,
"learning_rate": 3.8396226415094345e-05,
"loss": 0.4514,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1378454566001892,
"step": 815,
"valid_targets_mean": 9056.0,
"valid_targets_min": 1585
},
{
"epoch": 0.4837758112094395,
"grad_norm": 0.23954199670564313,
"learning_rate": 3.863207547169812e-05,
"loss": 0.4453,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1725279539823532,
"step": 820,
"valid_targets_mean": 13044.3,
"valid_targets_min": 2160
},
{
"epoch": 0.48672566371681414,
"grad_norm": 0.27199528594568334,
"learning_rate": 3.886792452830189e-05,
"loss": 0.449,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12170670181512833,
"step": 825,
"valid_targets_mean": 9486.9,
"valid_targets_min": 1543
},
{
"epoch": 0.4896755162241888,
"grad_norm": 0.24402116494508275,
"learning_rate": 3.910377358490566e-05,
"loss": 0.4475,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12425626814365387,
"step": 830,
"valid_targets_mean": 9637.9,
"valid_targets_min": 1453
},
{
"epoch": 0.49262536873156343,
"grad_norm": 0.2601853493885366,
"learning_rate": 3.933962264150944e-05,
"loss": 0.4498,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1890874207019806,
"step": 835,
"valid_targets_mean": 11221.1,
"valid_targets_min": 1861
},
{
"epoch": 0.49557522123893805,
"grad_norm": 0.26759359151306256,
"learning_rate": 3.957547169811321e-05,
"loss": 0.4493,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12343671172857285,
"step": 840,
"valid_targets_mean": 7896.7,
"valid_targets_min": 1601
},
{
"epoch": 0.49852507374631266,
"grad_norm": 0.27994930659509876,
"learning_rate": 3.9811320754716985e-05,
"loss": 0.4498,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1634995937347412,
"step": 845,
"valid_targets_mean": 11206.3,
"valid_targets_min": 2567
},
{
"epoch": 0.5014749262536873,
"grad_norm": 0.31281920185152984,
"learning_rate": 3.999999830335006e-05,
"loss": 0.4382,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15493710339069366,
"step": 850,
"valid_targets_mean": 9940.7,
"valid_targets_min": 1487
},
{
"epoch": 0.504424778761062,
"grad_norm": 0.27455549055935935,
"learning_rate": 3.999993892063233e-05,
"loss": 0.4466,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14785268902778625,
"step": 855,
"valid_targets_mean": 9426.9,
"valid_targets_min": 1920
},
{
"epoch": 0.5073746312684366,
"grad_norm": 0.2514821993311233,
"learning_rate": 3.999979470570539e-05,
"loss": 0.4487,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12655514478683472,
"step": 860,
"valid_targets_mean": 7889.9,
"valid_targets_min": 1997
},
{
"epoch": 0.5103244837758112,
"grad_norm": 0.2315638399925816,
"learning_rate": 3.999956565918094e-05,
"loss": 0.4399,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12273876368999481,
"step": 865,
"valid_targets_mean": 8702.3,
"valid_targets_min": 2150
},
{
"epoch": 0.5132743362831859,
"grad_norm": 0.27177307915070725,
"learning_rate": 3.9999251782030515e-05,
"loss": 0.4354,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17223188281059265,
"step": 870,
"valid_targets_mean": 11533.9,
"valid_targets_min": 1871
},
{
"epoch": 0.5162241887905604,
"grad_norm": 0.2530159978008084,
"learning_rate": 3.999885307558546e-05,
"loss": 0.4309,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14095968008041382,
"step": 875,
"valid_targets_mean": 10099.0,
"valid_targets_min": 2449
},
{
"epoch": 0.5191740412979351,
"grad_norm": 0.23419659787170694,
"learning_rate": 3.999836954153693e-05,
"loss": 0.4375,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1631159782409668,
"step": 880,
"valid_targets_mean": 10613.0,
"valid_targets_min": 1767
},
{
"epoch": 0.5221238938053098,
"grad_norm": 0.2635996187407809,
"learning_rate": 3.999780118193591e-05,
"loss": 0.4491,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14979779720306396,
"step": 885,
"valid_targets_mean": 9735.8,
"valid_targets_min": 1444
},
{
"epoch": 0.5250737463126843,
"grad_norm": 0.23138056829140724,
"learning_rate": 3.999714799919315e-05,
"loss": 0.4543,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16043859720230103,
"step": 890,
"valid_targets_mean": 12089.4,
"valid_targets_min": 1483
},
{
"epoch": 0.528023598820059,
"grad_norm": 0.2552416570547656,
"learning_rate": 3.9996409996079216e-05,
"loss": 0.4479,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1546708643436432,
"step": 895,
"valid_targets_mean": 9522.6,
"valid_targets_min": 747
},
{
"epoch": 0.5309734513274337,
"grad_norm": 0.27707949183780095,
"learning_rate": 3.999558717572444e-05,
"loss": 0.4341,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10108429193496704,
"step": 900,
"valid_targets_mean": 6589.8,
"valid_targets_min": 1001
},
{
"epoch": 0.5339233038348082,
"grad_norm": 0.30013490391556236,
"learning_rate": 3.9994679541618915e-05,
"loss": 0.4496,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.141307532787323,
"step": 905,
"valid_targets_mean": 8307.7,
"valid_targets_min": 1442
},
{
"epoch": 0.5368731563421829,
"grad_norm": 0.2380696069906505,
"learning_rate": 3.999368709761248e-05,
"loss": 0.4392,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13957419991493225,
"step": 910,
"valid_targets_mean": 9174.5,
"valid_targets_min": 2099
},
{
"epoch": 0.5398230088495575,
"grad_norm": 0.243047986423948,
"learning_rate": 3.999260984791471e-05,
"loss": 0.442,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15068325400352478,
"step": 915,
"valid_targets_mean": 9977.2,
"valid_targets_min": 1385
},
{
"epoch": 0.5427728613569321,
"grad_norm": 0.282398462410271,
"learning_rate": 3.9991447797094886e-05,
"loss": 0.4448,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12257401645183563,
"step": 920,
"valid_targets_mean": 8322.1,
"valid_targets_min": 2131
},
{
"epoch": 0.5457227138643068,
"grad_norm": 0.2803063967663372,
"learning_rate": 3.999020095008201e-05,
"loss": 0.4486,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15170587599277496,
"step": 925,
"valid_targets_mean": 10406.2,
"valid_targets_min": 1407
},
{
"epoch": 0.5486725663716814,
"grad_norm": 0.21878506602558695,
"learning_rate": 3.998886931216471e-05,
"loss": 0.4366,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.167210191488266,
"step": 930,
"valid_targets_mean": 12493.9,
"valid_targets_min": 2457
},
{
"epoch": 0.551622418879056,
"grad_norm": 0.28765408994466546,
"learning_rate": 3.998745288899132e-05,
"loss": 0.4335,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1283373236656189,
"step": 935,
"valid_targets_mean": 9960.1,
"valid_targets_min": 2052
},
{
"epoch": 0.5545722713864307,
"grad_norm": 0.2843227805103614,
"learning_rate": 3.998595168656975e-05,
"loss": 0.4495,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12957099080085754,
"step": 940,
"valid_targets_mean": 8378.8,
"valid_targets_min": 1560
},
{
"epoch": 0.5575221238938053,
"grad_norm": 0.25406467688649903,
"learning_rate": 3.998436571126755e-05,
"loss": 0.4391,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1349082589149475,
"step": 945,
"valid_targets_mean": 9472.5,
"valid_targets_min": 2484
},
{
"epoch": 0.56047197640118,
"grad_norm": 0.25433445706846386,
"learning_rate": 3.9982694969811826e-05,
"loss": 0.444,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1430283486843109,
"step": 950,
"valid_targets_mean": 10299.2,
"valid_targets_min": 878
},
{
"epoch": 0.5634218289085545,
"grad_norm": 0.23787392787588774,
"learning_rate": 3.9980939469289235e-05,
"loss": 0.4427,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1557752639055252,
"step": 955,
"valid_targets_mean": 10887.9,
"valid_targets_min": 2125
},
{
"epoch": 0.5663716814159292,
"grad_norm": 0.2308555142208238,
"learning_rate": 3.9979099217145944e-05,
"loss": 0.4394,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18596434593200684,
"step": 960,
"valid_targets_mean": 12573.0,
"valid_targets_min": 2048
},
{
"epoch": 0.5693215339233039,
"grad_norm": 0.2658698303261006,
"learning_rate": 3.997717422118762e-05,
"loss": 0.445,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13433973491191864,
"step": 965,
"valid_targets_mean": 9179.3,
"valid_targets_min": 1147
},
{
"epoch": 0.5722713864306784,
"grad_norm": 0.23518502065874103,
"learning_rate": 3.997516448957936e-05,
"loss": 0.4322,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15136614441871643,
"step": 970,
"valid_targets_mean": 10706.8,
"valid_targets_min": 1593
},
{
"epoch": 0.5752212389380531,
"grad_norm": 0.26959385406200537,
"learning_rate": 3.99730700308457e-05,
"loss": 0.4388,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14212557673454285,
"step": 975,
"valid_targets_mean": 9218.1,
"valid_targets_min": 2137
},
{
"epoch": 0.5781710914454278,
"grad_norm": 0.29520369839795346,
"learning_rate": 3.997089085387053e-05,
"loss": 0.4406,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1661655157804489,
"step": 980,
"valid_targets_mean": 11224.7,
"valid_targets_min": 1822
},
{
"epoch": 0.5811209439528023,
"grad_norm": 0.24272878958124294,
"learning_rate": 3.996862696789711e-05,
"loss": 0.4386,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15572072565555573,
"step": 985,
"valid_targets_mean": 11156.6,
"valid_targets_min": 1606
},
{
"epoch": 0.584070796460177,
"grad_norm": 0.22014999106432825,
"learning_rate": 3.9966278382527984e-05,
"loss": 0.4371,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16465000808238983,
"step": 990,
"valid_targets_mean": 10960.1,
"valid_targets_min": 1556
},
{
"epoch": 0.5870206489675516,
"grad_norm": 0.22932156241002566,
"learning_rate": 3.9963845107724974e-05,
"loss": 0.4417,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1330799162387848,
"step": 995,
"valid_targets_mean": 9461.7,
"valid_targets_min": 1929
},
{
"epoch": 0.5899705014749262,
"grad_norm": 0.25358406476549183,
"learning_rate": 3.9961327153809115e-05,
"loss": 0.4457,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.153403177857399,
"step": 1000,
"valid_targets_mean": 9745.5,
"valid_targets_min": 1581
},
{
"epoch": 0.5929203539823009,
"grad_norm": 0.23111027669299938,
"learning_rate": 3.995872453146061e-05,
"loss": 0.4334,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1502678245306015,
"step": 1005,
"valid_targets_mean": 10080.6,
"valid_targets_min": 2923
},
{
"epoch": 0.5958702064896755,
"grad_norm": 0.24859400144388313,
"learning_rate": 3.9956037251718815e-05,
"loss": 0.4316,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14000633358955383,
"step": 1010,
"valid_targets_mean": 8127.2,
"valid_targets_min": 1571
},
{
"epoch": 0.5988200589970502,
"grad_norm": 0.22734263938219632,
"learning_rate": 3.9953265325982154e-05,
"loss": 0.4433,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14217329025268555,
"step": 1015,
"valid_targets_mean": 10449.8,
"valid_targets_min": 1912
},
{
"epoch": 0.6017699115044248,
"grad_norm": 0.2617934457733421,
"learning_rate": 3.9950408766008084e-05,
"loss": 0.4408,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1299726665019989,
"step": 1020,
"valid_targets_mean": 8532.2,
"valid_targets_min": 1791
},
{
"epoch": 0.6047197640117994,
"grad_norm": 0.25200466318788883,
"learning_rate": 3.994746758391308e-05,
"loss": 0.4415,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15745247900485992,
"step": 1025,
"valid_targets_mean": 11387.8,
"valid_targets_min": 2003
},
{
"epoch": 0.6076696165191741,
"grad_norm": 0.2522310486948059,
"learning_rate": 3.9944441792172496e-05,
"loss": 0.4409,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1417302042245865,
"step": 1030,
"valid_targets_mean": 9229.9,
"valid_targets_min": 2522
},
{
"epoch": 0.6106194690265486,
"grad_norm": 0.24087788923556788,
"learning_rate": 3.9941331403620627e-05,
"loss": 0.4382,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16813431680202484,
"step": 1035,
"valid_targets_mean": 12198.8,
"valid_targets_min": 1675
},
{
"epoch": 0.6135693215339233,
"grad_norm": 0.26238210737003126,
"learning_rate": 3.993813643145055e-05,
"loss": 0.4408,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14091551303863525,
"step": 1040,
"valid_targets_mean": 10017.0,
"valid_targets_min": 1776
},
{
"epoch": 0.616519174041298,
"grad_norm": 0.2317100253921235,
"learning_rate": 3.9934856889214154e-05,
"loss": 0.4373,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13581900298595428,
"step": 1045,
"valid_targets_mean": 10342.0,
"valid_targets_min": 1961
},
{
"epoch": 0.6194690265486725,
"grad_norm": 0.21932495712560107,
"learning_rate": 3.993149279082201e-05,
"loss": 0.4399,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14504750072956085,
"step": 1050,
"valid_targets_mean": 9962.6,
"valid_targets_min": 2405
},
{
"epoch": 0.6224188790560472,
"grad_norm": 0.23356570302226454,
"learning_rate": 3.9928044150543364e-05,
"loss": 0.4387,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12058188766241074,
"step": 1055,
"valid_targets_mean": 8304.7,
"valid_targets_min": 1978
},
{
"epoch": 0.6253687315634219,
"grad_norm": 0.24065917712232185,
"learning_rate": 3.992451098300604e-05,
"loss": 0.436,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15964940190315247,
"step": 1060,
"valid_targets_mean": 12342.4,
"valid_targets_min": 2187
},
{
"epoch": 0.6283185840707964,
"grad_norm": 0.21529728843415769,
"learning_rate": 3.9920893303196406e-05,
"loss": 0.4381,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1437956839799881,
"step": 1065,
"valid_targets_mean": 9165.0,
"valid_targets_min": 832
},
{
"epoch": 0.6312684365781711,
"grad_norm": 0.22294702084259344,
"learning_rate": 3.99171911264593e-05,
"loss": 0.4389,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1432226449251175,
"step": 1070,
"valid_targets_mean": 10573.9,
"valid_targets_min": 2386
},
{
"epoch": 0.6342182890855457,
"grad_norm": 0.2488004867962405,
"learning_rate": 3.991340446849797e-05,
"loss": 0.4451,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11577347666025162,
"step": 1075,
"valid_targets_mean": 8261.4,
"valid_targets_min": 1439
},
{
"epoch": 0.6371681415929203,
"grad_norm": 0.31671954979395994,
"learning_rate": 3.990953334537398e-05,
"loss": 0.448,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15443119406700134,
"step": 1080,
"valid_targets_mean": 9847.7,
"valid_targets_min": 1767
},
{
"epoch": 0.640117994100295,
"grad_norm": 0.25680278491945663,
"learning_rate": 3.9905577773507184e-05,
"loss": 0.4368,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16935217380523682,
"step": 1085,
"valid_targets_mean": 13030.2,
"valid_targets_min": 2483
},
{
"epoch": 0.6430678466076696,
"grad_norm": 0.239359194829167,
"learning_rate": 3.990153776967562e-05,
"loss": 0.4355,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13085396587848663,
"step": 1090,
"valid_targets_mean": 9731.1,
"valid_targets_min": 1703
},
{
"epoch": 0.6460176991150443,
"grad_norm": 0.22373425243288575,
"learning_rate": 3.989741335101547e-05,
"loss": 0.4346,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14850249886512756,
"step": 1095,
"valid_targets_mean": 10780.1,
"valid_targets_min": 1649
},
{
"epoch": 0.6489675516224189,
"grad_norm": 0.2433722186409111,
"learning_rate": 3.989320453502096e-05,
"loss": 0.4436,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15189602971076965,
"step": 1100,
"valid_targets_mean": 10743.4,
"valid_targets_min": 1801
},
{
"epoch": 0.6519174041297935,
"grad_norm": 0.3323864666353114,
"learning_rate": 3.988891133954431e-05,
"loss": 0.4436,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11629551649093628,
"step": 1105,
"valid_targets_mean": 9102.6,
"valid_targets_min": 1830
},
{
"epoch": 0.6548672566371682,
"grad_norm": 0.22889042461049347,
"learning_rate": 3.988453378279563e-05,
"loss": 0.4333,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12611937522888184,
"step": 1110,
"valid_targets_mean": 9400.9,
"valid_targets_min": 1853
},
{
"epoch": 0.6578171091445427,
"grad_norm": 0.2543271499306638,
"learning_rate": 3.9880071883342877e-05,
"loss": 0.4267,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1420837789773941,
"step": 1115,
"valid_targets_mean": 10114.0,
"valid_targets_min": 2144
},
{
"epoch": 0.6607669616519174,
"grad_norm": 0.22975752551359416,
"learning_rate": 3.9875525660111746e-05,
"loss": 0.425,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14416566491127014,
"step": 1120,
"valid_targets_mean": 9553.2,
"valid_targets_min": 2181
},
{
"epoch": 0.6637168141592921,
"grad_norm": 0.25343521443481465,
"learning_rate": 3.987089513238559e-05,
"loss": 0.4391,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15074048936367035,
"step": 1125,
"valid_targets_mean": 9748.7,
"valid_targets_min": 856
},
{
"epoch": 0.6666666666666666,
"grad_norm": 0.22582108402324896,
"learning_rate": 3.986618031980537e-05,
"loss": 0.4384,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1590452492237091,
"step": 1130,
"valid_targets_mean": 12207.3,
"valid_targets_min": 2941
},
{
"epoch": 0.6696165191740413,
"grad_norm": 0.25138835363280104,
"learning_rate": 3.9861381242369566e-05,
"loss": 0.4352,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1295248568058014,
"step": 1135,
"valid_targets_mean": 9607.7,
"valid_targets_min": 1480
},
{
"epoch": 0.672566371681416,
"grad_norm": 0.21744109580566193,
"learning_rate": 3.985649792043403e-05,
"loss": 0.4445,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13683268427848816,
"step": 1140,
"valid_targets_mean": 10516.6,
"valid_targets_min": 1750
},
{
"epoch": 0.6755162241887905,
"grad_norm": 0.24750482724598766,
"learning_rate": 3.9851530374711985e-05,
"loss": 0.4365,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12796282768249512,
"step": 1145,
"valid_targets_mean": 9166.2,
"valid_targets_min": 2342
},
{
"epoch": 0.6784660766961652,
"grad_norm": 0.27006974732922817,
"learning_rate": 3.984647862627389e-05,
"loss": 0.4368,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16928240656852722,
"step": 1150,
"valid_targets_mean": 10198.2,
"valid_targets_min": 1888
},
{
"epoch": 0.6814159292035398,
"grad_norm": 0.22988670089720328,
"learning_rate": 3.984134269654736e-05,
"loss": 0.4373,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14798274636268616,
"step": 1155,
"valid_targets_mean": 9976.0,
"valid_targets_min": 1591
},
{
"epoch": 0.6843657817109144,
"grad_norm": 0.23566250791004936,
"learning_rate": 3.9836122607317083e-05,
"loss": 0.4349,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13107168674468994,
"step": 1160,
"valid_targets_mean": 8667.3,
"valid_targets_min": 1636
},
{
"epoch": 0.6873156342182891,
"grad_norm": 0.22239697943516684,
"learning_rate": 3.983081838072469e-05,
"loss": 0.4378,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1745031625032425,
"step": 1165,
"valid_targets_mean": 11671.9,
"valid_targets_min": 1372
},
{
"epoch": 0.6902654867256637,
"grad_norm": 0.22586990007122548,
"learning_rate": 3.9825430039268734e-05,
"loss": 0.4379,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12756019830703735,
"step": 1170,
"valid_targets_mean": 8705.5,
"valid_targets_min": 788
},
{
"epoch": 0.6932153392330384,
"grad_norm": 0.22261089505162365,
"learning_rate": 3.9819957605804514e-05,
"loss": 0.4395,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14750631153583527,
"step": 1175,
"valid_targets_mean": 10789.9,
"valid_targets_min": 1629
},
{
"epoch": 0.696165191740413,
"grad_norm": 0.22306615194696608,
"learning_rate": 3.9814401103544044e-05,
"loss": 0.4432,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13897669315338135,
"step": 1180,
"valid_targets_mean": 9820.9,
"valid_targets_min": 2079
},
{
"epoch": 0.6991150442477876,
"grad_norm": 0.22317738628263822,
"learning_rate": 3.980876055605591e-05,
"loss": 0.4338,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1291494220495224,
"step": 1185,
"valid_targets_mean": 9519.0,
"valid_targets_min": 1443
},
{
"epoch": 0.7020648967551623,
"grad_norm": 0.2256263144128267,
"learning_rate": 3.980303598726519e-05,
"loss": 0.4334,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14101535081863403,
"step": 1190,
"valid_targets_mean": 11148.6,
"valid_targets_min": 2844
},
{
"epoch": 0.7050147492625368,
"grad_norm": 0.21397313621788763,
"learning_rate": 3.9797227421453345e-05,
"loss": 0.4385,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17973126471042633,
"step": 1195,
"valid_targets_mean": 11772.3,
"valid_targets_min": 2041
},
{
"epoch": 0.7079646017699115,
"grad_norm": 0.19691259367572003,
"learning_rate": 3.9791334883258133e-05,
"loss": 0.4338,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13496637344360352,
"step": 1200,
"valid_targets_mean": 9464.2,
"valid_targets_min": 2006
},
{
"epoch": 0.7109144542772862,
"grad_norm": 0.21329831639659594,
"learning_rate": 3.978535839767346e-05,
"loss": 0.4389,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12946803867816925,
"step": 1205,
"valid_targets_mean": 10115.8,
"valid_targets_min": 2033
},
{
"epoch": 0.7138643067846607,
"grad_norm": 0.2154057849716186,
"learning_rate": 3.977929799004937e-05,
"loss": 0.4281,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11410190910100937,
"step": 1210,
"valid_targets_mean": 8914.2,
"valid_targets_min": 1829
},
{
"epoch": 0.7168141592920354,
"grad_norm": 0.2271674738481832,
"learning_rate": 3.977315368609179e-05,
"loss": 0.4307,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16380158066749573,
"step": 1215,
"valid_targets_mean": 11594.1,
"valid_targets_min": 1466
},
{
"epoch": 0.7197640117994101,
"grad_norm": 0.2386454065940037,
"learning_rate": 3.9766925511862554e-05,
"loss": 0.4295,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14458134770393372,
"step": 1220,
"valid_targets_mean": 10735.3,
"valid_targets_min": 1786
},
{
"epoch": 0.7227138643067846,
"grad_norm": 0.2255030881058441,
"learning_rate": 3.976061349377924e-05,
"loss": 0.4309,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14954999089241028,
"step": 1225,
"valid_targets_mean": 11454.9,
"valid_targets_min": 2305
},
{
"epoch": 0.7256637168141593,
"grad_norm": 0.2481445013421651,
"learning_rate": 3.975421765861505e-05,
"loss": 0.4384,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12814843654632568,
"step": 1230,
"valid_targets_mean": 9119.2,
"valid_targets_min": 933
},
{
"epoch": 0.7286135693215339,
"grad_norm": 0.21781116099994088,
"learning_rate": 3.974773803349869e-05,
"loss": 0.4383,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1225578561425209,
"step": 1235,
"valid_targets_mean": 9410.8,
"valid_targets_min": 1837
},
{
"epoch": 0.7315634218289085,
"grad_norm": 0.21342911241238924,
"learning_rate": 3.974117464591432e-05,
"loss": 0.4315,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12645339965820312,
"step": 1240,
"valid_targets_mean": 9461.3,
"valid_targets_min": 1841
},
{
"epoch": 0.7345132743362832,
"grad_norm": 0.20513947169642738,
"learning_rate": 3.973452752370134e-05,
"loss": 0.4364,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1715991497039795,
"step": 1245,
"valid_targets_mean": 12400.2,
"valid_targets_min": 2042
},
{
"epoch": 0.7374631268436578,
"grad_norm": 0.21563879416279083,
"learning_rate": 3.972779669505434e-05,
"loss": 0.4352,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1682026982307434,
"step": 1250,
"valid_targets_mean": 12530.3,
"valid_targets_min": 2926
},
{
"epoch": 0.7404129793510325,
"grad_norm": 0.23091666313240913,
"learning_rate": 3.972098218852296e-05,
"loss": 0.4352,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1543908715248108,
"step": 1255,
"valid_targets_mean": 10509.6,
"valid_targets_min": 649
},
{
"epoch": 0.7433628318584071,
"grad_norm": 0.22856855769072065,
"learning_rate": 3.971408403301178e-05,
"loss": 0.4309,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14025411009788513,
"step": 1260,
"valid_targets_mean": 9454.0,
"valid_targets_min": 2003
},
{
"epoch": 0.7463126843657817,
"grad_norm": 0.2335912261958896,
"learning_rate": 3.970710225778016e-05,
"loss": 0.4349,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1344713419675827,
"step": 1265,
"valid_targets_mean": 9103.6,
"valid_targets_min": 1608
},
{
"epoch": 0.7492625368731564,
"grad_norm": 0.22079369010684347,
"learning_rate": 3.9700036892442175e-05,
"loss": 0.4317,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13677185773849487,
"step": 1270,
"valid_targets_mean": 9436.6,
"valid_targets_min": 2137
},
{
"epoch": 0.7522123893805309,
"grad_norm": 0.1971068177734515,
"learning_rate": 3.969288796696645e-05,
"loss": 0.4289,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13685756921768188,
"step": 1275,
"valid_targets_mean": 9747.0,
"valid_targets_min": 1135
},
{
"epoch": 0.7551622418879056,
"grad_norm": 0.2347117554337764,
"learning_rate": 3.968565551167602e-05,
"loss": 0.4354,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15099859237670898,
"step": 1280,
"valid_targets_mean": 10079.6,
"valid_targets_min": 2286
},
{
"epoch": 0.7581120943952803,
"grad_norm": 0.2272814602284412,
"learning_rate": 3.967833955724824e-05,
"loss": 0.4424,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15157118439674377,
"step": 1285,
"valid_targets_mean": 10582.6,
"valid_targets_min": 1657
},
{
"epoch": 0.7610619469026548,
"grad_norm": 0.24637729164796876,
"learning_rate": 3.967094013471464e-05,
"loss": 0.4391,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1336841583251953,
"step": 1290,
"valid_targets_mean": 8869.7,
"valid_targets_min": 1883
},
{
"epoch": 0.7640117994100295,
"grad_norm": 0.22473990553847215,
"learning_rate": 3.966345727546078e-05,
"loss": 0.4251,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1474177986383438,
"step": 1295,
"valid_targets_mean": 10999.8,
"valid_targets_min": 1608
},
{
"epoch": 0.7669616519174042,
"grad_norm": 0.2266397688976117,
"learning_rate": 3.965589101122613e-05,
"loss": 0.4335,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14274467527866364,
"step": 1300,
"valid_targets_mean": 10845.2,
"valid_targets_min": 1769
},
{
"epoch": 0.7699115044247787,
"grad_norm": 0.23903918230849802,
"learning_rate": 3.9648241374103936e-05,
"loss": 0.4318,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15274375677108765,
"step": 1305,
"valid_targets_mean": 11583.4,
"valid_targets_min": 2726
},
{
"epoch": 0.7728613569321534,
"grad_norm": 0.22667591691034675,
"learning_rate": 3.964050839654107e-05,
"loss": 0.4276,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12878428399562836,
"step": 1310,
"valid_targets_mean": 9023.2,
"valid_targets_min": 1719
},
{
"epoch": 0.775811209439528,
"grad_norm": 0.20118498187763423,
"learning_rate": 3.963269211133792e-05,
"loss": 0.4314,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16713985800743103,
"step": 1315,
"valid_targets_mean": 11621.1,
"valid_targets_min": 1627
},
{
"epoch": 0.7787610619469026,
"grad_norm": 0.23317769615200384,
"learning_rate": 3.962479255164823e-05,
"loss": 0.4285,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17432451248168945,
"step": 1320,
"valid_targets_mean": 10227.8,
"valid_targets_min": 2542
},
{
"epoch": 0.7817109144542773,
"grad_norm": 0.20839049675195365,
"learning_rate": 3.961680975097894e-05,
"loss": 0.424,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13311053812503815,
"step": 1325,
"valid_targets_mean": 8847.1,
"valid_targets_min": 2962
},
{
"epoch": 0.7846607669616519,
"grad_norm": 0.22533441508609903,
"learning_rate": 3.960874374319009e-05,
"loss": 0.4339,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1515326201915741,
"step": 1330,
"valid_targets_mean": 11824.5,
"valid_targets_min": 2336
},
{
"epoch": 0.7876106194690266,
"grad_norm": 0.21681982017955925,
"learning_rate": 3.960059456249466e-05,
"loss": 0.4365,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17768153548240662,
"step": 1335,
"valid_targets_mean": 13422.8,
"valid_targets_min": 2469
},
{
"epoch": 0.7905604719764012,
"grad_norm": 0.21506616827856356,
"learning_rate": 3.95923622434584e-05,
"loss": 0.4332,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1056060940027237,
"step": 1340,
"valid_targets_mean": 8039.5,
"valid_targets_min": 1011
},
{
"epoch": 0.7935103244837758,
"grad_norm": 0.2092664738221549,
"learning_rate": 3.958404682099969e-05,
"loss": 0.431,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11958029121160507,
"step": 1345,
"valid_targets_mean": 8162.9,
"valid_targets_min": 1768
},
{
"epoch": 0.7964601769911505,
"grad_norm": 0.21447497725002448,
"learning_rate": 3.957564833038944e-05,
"loss": 0.431,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15218974649906158,
"step": 1350,
"valid_targets_mean": 9680.6,
"valid_targets_min": 1517
},
{
"epoch": 0.799410029498525,
"grad_norm": 0.22430754653919985,
"learning_rate": 3.9567166807250876e-05,
"loss": 0.4311,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14632052183151245,
"step": 1355,
"valid_targets_mean": 10204.0,
"valid_targets_min": 1856
},
{
"epoch": 0.8023598820058997,
"grad_norm": 0.20821866979698975,
"learning_rate": 3.9558602287559435e-05,
"loss": 0.4291,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16714532673358917,
"step": 1360,
"valid_targets_mean": 11088.9,
"valid_targets_min": 3033
},
{
"epoch": 0.8053097345132744,
"grad_norm": 0.21842361789585152,
"learning_rate": 3.954995480764257e-05,
"loss": 0.4364,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12598569691181183,
"step": 1365,
"valid_targets_mean": 8808.9,
"valid_targets_min": 1628
},
{
"epoch": 0.8082595870206489,
"grad_norm": 0.2452191859994776,
"learning_rate": 3.9541224404179646e-05,
"loss": 0.4296,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15447130799293518,
"step": 1370,
"valid_targets_mean": 10004.9,
"valid_targets_min": 2090
},
{
"epoch": 0.8112094395280236,
"grad_norm": 0.21351961088739702,
"learning_rate": 3.953241111420174e-05,
"loss": 0.4325,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15034262835979462,
"step": 1375,
"valid_targets_mean": 11585.9,
"valid_targets_min": 1578
},
{
"epoch": 0.8141592920353983,
"grad_norm": 0.2438372245243314,
"learning_rate": 3.952351497509151e-05,
"loss": 0.4281,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1585340052843094,
"step": 1380,
"valid_targets_mean": 10658.7,
"valid_targets_min": 1712
},
{
"epoch": 0.8171091445427728,
"grad_norm": 0.2286487537231045,
"learning_rate": 3.9514536024583025e-05,
"loss": 0.4286,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16236230731010437,
"step": 1385,
"valid_targets_mean": 11714.4,
"valid_targets_min": 2874
},
{
"epoch": 0.8200589970501475,
"grad_norm": 0.22767053921731062,
"learning_rate": 3.950547430076162e-05,
"loss": 0.4258,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12050891667604446,
"step": 1390,
"valid_targets_mean": 9205.3,
"valid_targets_min": 2733
},
{
"epoch": 0.8230088495575221,
"grad_norm": 0.21243248388698746,
"learning_rate": 3.949632984206371e-05,
"loss": 0.4213,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11950334906578064,
"step": 1395,
"valid_targets_mean": 8837.8,
"valid_targets_min": 2032
},
{
"epoch": 0.8259587020648967,
"grad_norm": 0.19404822707082142,
"learning_rate": 3.948710268727665e-05,
"loss": 0.4254,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13935215771198273,
"step": 1400,
"valid_targets_mean": 10313.7,
"valid_targets_min": 2037
},
{
"epoch": 0.8289085545722714,
"grad_norm": 0.20795543066174288,
"learning_rate": 3.947779287553855e-05,
"loss": 0.4326,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11591978371143341,
"step": 1405,
"valid_targets_mean": 8079.2,
"valid_targets_min": 1799
},
{
"epoch": 0.831858407079646,
"grad_norm": 0.22220292602112293,
"learning_rate": 3.946840044633812e-05,
"loss": 0.422,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17623038589954376,
"step": 1410,
"valid_targets_mean": 11687.4,
"valid_targets_min": 1660
},
{
"epoch": 0.8348082595870207,
"grad_norm": 0.22466394230939674,
"learning_rate": 3.945892543951452e-05,
"loss": 0.4348,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13592171669006348,
"step": 1415,
"valid_targets_mean": 9689.1,
"valid_targets_min": 1213
},
{
"epoch": 0.8377581120943953,
"grad_norm": 0.2254962724331218,
"learning_rate": 3.9449367895257154e-05,
"loss": 0.4298,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1883118897676468,
"step": 1420,
"valid_targets_mean": 13727.9,
"valid_targets_min": 2019
},
{
"epoch": 0.8407079646017699,
"grad_norm": 0.21194725404217385,
"learning_rate": 3.9439727854105525e-05,
"loss": 0.4296,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12037979066371918,
"step": 1425,
"valid_targets_mean": 8408.8,
"valid_targets_min": 1770
},
{
"epoch": 0.8436578171091446,
"grad_norm": 0.2340701396614431,
"learning_rate": 3.943000535694906e-05,
"loss": 0.434,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15494517982006073,
"step": 1430,
"valid_targets_mean": 10496.0,
"valid_targets_min": 1924
},
{
"epoch": 0.8466076696165191,
"grad_norm": 0.19806546741399747,
"learning_rate": 3.9420200445026935e-05,
"loss": 0.4274,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13141945004463196,
"step": 1435,
"valid_targets_mean": 9131.2,
"valid_targets_min": 2712
},
{
"epoch": 0.8495575221238938,
"grad_norm": 0.21286070590728243,
"learning_rate": 3.9410313159927884e-05,
"loss": 0.4291,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14135153591632843,
"step": 1440,
"valid_targets_mean": 8391.5,
"valid_targets_min": 1896
},
{
"epoch": 0.8525073746312685,
"grad_norm": 0.21373668014960542,
"learning_rate": 3.9400343543590055e-05,
"loss": 0.4216,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1340659260749817,
"step": 1445,
"valid_targets_mean": 9973.9,
"valid_targets_min": 1874
},
{
"epoch": 0.855457227138643,
"grad_norm": 0.19867038831411135,
"learning_rate": 3.9390291638300803e-05,
"loss": 0.4268,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15295977890491486,
"step": 1450,
"valid_targets_mean": 11387.2,
"valid_targets_min": 2079
},
{
"epoch": 0.8584070796460177,
"grad_norm": 0.2071025265272414,
"learning_rate": 3.938015748669652e-05,
"loss": 0.4267,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1454063355922699,
"step": 1455,
"valid_targets_mean": 9381.8,
"valid_targets_min": 1708
},
{
"epoch": 0.8613569321533924,
"grad_norm": 0.21597614110893262,
"learning_rate": 3.936994113176247e-05,
"loss": 0.4331,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13651731610298157,
"step": 1460,
"valid_targets_mean": 8509.3,
"valid_targets_min": 1118
},
{
"epoch": 0.8643067846607669,
"grad_norm": 0.2168658534884769,
"learning_rate": 3.935964261683258e-05,
"loss": 0.4328,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14359349012374878,
"step": 1465,
"valid_targets_mean": 10374.7,
"valid_targets_min": 2011
},
{
"epoch": 0.8672566371681416,
"grad_norm": 0.20858730892961191,
"learning_rate": 3.934926198558926e-05,
"loss": 0.4302,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17608967423439026,
"step": 1470,
"valid_targets_mean": 12519.0,
"valid_targets_min": 1887
},
{
"epoch": 0.8702064896755162,
"grad_norm": 0.2006306585200802,
"learning_rate": 3.933879928206325e-05,
"loss": 0.4244,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1375437080860138,
"step": 1475,
"valid_targets_mean": 9916.1,
"valid_targets_min": 1793
},
{
"epoch": 0.8731563421828908,
"grad_norm": 0.2205586415746746,
"learning_rate": 3.9328254550633413e-05,
"loss": 0.4354,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15739303827285767,
"step": 1480,
"valid_targets_mean": 10340.9,
"valid_targets_min": 1125
},
{
"epoch": 0.8761061946902655,
"grad_norm": 0.19812340046811802,
"learning_rate": 3.9317627836026505e-05,
"loss": 0.427,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1516011655330658,
"step": 1485,
"valid_targets_mean": 9584.5,
"valid_targets_min": 2028
},
{
"epoch": 0.8790560471976401,
"grad_norm": 0.21139493708043888,
"learning_rate": 3.930691918331706e-05,
"loss": 0.4345,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16548380255699158,
"step": 1490,
"valid_targets_mean": 11590.9,
"valid_targets_min": 2261
},
{
"epoch": 0.8820058997050148,
"grad_norm": 0.21329975804889742,
"learning_rate": 3.929612863792713e-05,
"loss": 0.4285,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15393435955047607,
"step": 1495,
"valid_targets_mean": 11354.4,
"valid_targets_min": 1773
},
{
"epoch": 0.8849557522123894,
"grad_norm": 0.2541979721275341,
"learning_rate": 3.928525624562617e-05,
"loss": 0.4301,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13612164556980133,
"step": 1500,
"valid_targets_mean": 9635.8,
"valid_targets_min": 2187
},
{
"epoch": 0.887905604719764,
"grad_norm": 0.22539564954558305,
"learning_rate": 3.927430205253077e-05,
"loss": 0.4229,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14678379893302917,
"step": 1505,
"valid_targets_mean": 10532.5,
"valid_targets_min": 1940
},
{
"epoch": 0.8908554572271387,
"grad_norm": 0.20356625113991283,
"learning_rate": 3.9263266105104484e-05,
"loss": 0.4278,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15266424417495728,
"step": 1510,
"valid_targets_mean": 11384.6,
"valid_targets_min": 2096
},
{
"epoch": 0.8938053097345132,
"grad_norm": 0.21042754257939417,
"learning_rate": 3.9252148450157646e-05,
"loss": 0.4244,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14113900065422058,
"step": 1515,
"valid_targets_mean": 10272.5,
"valid_targets_min": 2815
},
{
"epoch": 0.8967551622418879,
"grad_norm": 0.19598960033237253,
"learning_rate": 3.9240949134847164e-05,
"loss": 0.4312,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16119873523712158,
"step": 1520,
"valid_targets_mean": 11145.4,
"valid_targets_min": 818
},
{
"epoch": 0.8997050147492626,
"grad_norm": 0.19245802334587098,
"learning_rate": 3.922966820667632e-05,
"loss": 0.4242,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1274881511926651,
"step": 1525,
"valid_targets_mean": 9275.6,
"valid_targets_min": 1757
},
{
"epoch": 0.9026548672566371,
"grad_norm": 0.20722152151745302,
"learning_rate": 3.921830571349455e-05,
"loss": 0.4275,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15170887112617493,
"step": 1530,
"valid_targets_mean": 10562.0,
"valid_targets_min": 1778
},
{
"epoch": 0.9056047197640118,
"grad_norm": 0.2211212721089106,
"learning_rate": 3.920686170349728e-05,
"loss": 0.425,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14120131731033325,
"step": 1535,
"valid_targets_mean": 9969.5,
"valid_targets_min": 1957
},
{
"epoch": 0.9085545722713865,
"grad_norm": 0.22615337216600126,
"learning_rate": 3.9195336225225694e-05,
"loss": 0.427,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15712234377861023,
"step": 1540,
"valid_targets_mean": 10153.2,
"valid_targets_min": 2191
},
{
"epoch": 0.911504424778761,
"grad_norm": 0.20841743928677547,
"learning_rate": 3.918372932756652e-05,
"loss": 0.4335,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11234050989151001,
"step": 1545,
"valid_targets_mean": 8849.2,
"valid_targets_min": 324
},
{
"epoch": 0.9144542772861357,
"grad_norm": 0.24202127593053716,
"learning_rate": 3.917204105975186e-05,
"loss": 0.4258,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15047121047973633,
"step": 1550,
"valid_targets_mean": 10924.6,
"valid_targets_min": 2710
},
{
"epoch": 0.9174041297935103,
"grad_norm": 0.19857249098394833,
"learning_rate": 3.916027147135894e-05,
"loss": 0.4289,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15521690249443054,
"step": 1555,
"valid_targets_mean": 11752.3,
"valid_targets_min": 1969
},
{
"epoch": 0.9203539823008849,
"grad_norm": 0.21436174937187652,
"learning_rate": 3.9148420612309907e-05,
"loss": 0.429,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16796237230300903,
"step": 1560,
"valid_targets_mean": 12698.6,
"valid_targets_min": 2768
},
{
"epoch": 0.9233038348082596,
"grad_norm": 0.21760621553388323,
"learning_rate": 3.913648853287167e-05,
"loss": 0.4293,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13657817244529724,
"step": 1565,
"valid_targets_mean": 10104.6,
"valid_targets_min": 1652
},
{
"epoch": 0.9262536873156342,
"grad_norm": 0.19337765257103107,
"learning_rate": 3.912447528365559e-05,
"loss": 0.431,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14748969674110413,
"step": 1570,
"valid_targets_mean": 11014.7,
"valid_targets_min": 1872
},
{
"epoch": 0.9292035398230089,
"grad_norm": 0.22146689942592468,
"learning_rate": 3.911238091561736e-05,
"loss": 0.4246,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1421777307987213,
"step": 1575,
"valid_targets_mean": 10039.7,
"valid_targets_min": 2777
},
{
"epoch": 0.9321533923303835,
"grad_norm": 0.20189886878274899,
"learning_rate": 3.910020548005673e-05,
"loss": 0.4319,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1599784791469574,
"step": 1580,
"valid_targets_mean": 11453.5,
"valid_targets_min": 1275
},
{
"epoch": 0.9351032448377581,
"grad_norm": 0.2045400723388353,
"learning_rate": 3.908794902861733e-05,
"loss": 0.4336,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12890928983688354,
"step": 1585,
"valid_targets_mean": 8932.7,
"valid_targets_min": 1791
},
{
"epoch": 0.9380530973451328,
"grad_norm": 0.1989335490497034,
"learning_rate": 3.9075611613286385e-05,
"loss": 0.4193,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14698082208633423,
"step": 1590,
"valid_targets_mean": 11101.6,
"valid_targets_min": 2707
},
{
"epoch": 0.9410029498525073,
"grad_norm": 0.22960216786420032,
"learning_rate": 3.906319328639457e-05,
"loss": 0.4275,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17267057299613953,
"step": 1595,
"valid_targets_mean": 10862.0,
"valid_targets_min": 1591
},
{
"epoch": 0.943952802359882,
"grad_norm": 0.22563473609963453,
"learning_rate": 3.905069410061576e-05,
"loss": 0.4264,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15903520584106445,
"step": 1600,
"valid_targets_mean": 10801.4,
"valid_targets_min": 1421
},
{
"epoch": 0.9469026548672567,
"grad_norm": 0.21538014638851252,
"learning_rate": 3.90381141089668e-05,
"loss": 0.4277,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1417563259601593,
"step": 1605,
"valid_targets_mean": 8929.9,
"valid_targets_min": 1203
},
{
"epoch": 0.9498525073746312,
"grad_norm": 0.20130244582393142,
"learning_rate": 3.902545336480726e-05,
"loss": 0.4329,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1481684297323227,
"step": 1610,
"valid_targets_mean": 10474.6,
"valid_targets_min": 1041
},
{
"epoch": 0.9528023598820059,
"grad_norm": 0.2296462679204711,
"learning_rate": 3.9012711921839255e-05,
"loss": 0.4289,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12770214676856995,
"step": 1615,
"valid_targets_mean": 8967.3,
"valid_targets_min": 2401
},
{
"epoch": 0.9557522123893806,
"grad_norm": 0.21190599582292202,
"learning_rate": 3.899988983410719e-05,
"loss": 0.4245,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15029430389404297,
"step": 1620,
"valid_targets_mean": 10507.0,
"valid_targets_min": 1811
},
{
"epoch": 0.9587020648967551,
"grad_norm": 0.2076012555064984,
"learning_rate": 3.898698715599754e-05,
"loss": 0.4287,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12323871999979019,
"step": 1625,
"valid_targets_mean": 9101.4,
"valid_targets_min": 1896
},
{
"epoch": 0.9616519174041298,
"grad_norm": 0.23218538306869804,
"learning_rate": 3.8974003942238595e-05,
"loss": 0.4243,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1530805230140686,
"step": 1630,
"valid_targets_mean": 11740.2,
"valid_targets_min": 1329
},
{
"epoch": 0.9646017699115044,
"grad_norm": 0.24503360985761793,
"learning_rate": 3.896094024790026e-05,
"loss": 0.4252,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1282130479812622,
"step": 1635,
"valid_targets_mean": 8273.8,
"valid_targets_min": 1581
},
{
"epoch": 0.967551622418879,
"grad_norm": 0.2539213856936481,
"learning_rate": 3.894779612839381e-05,
"loss": 0.427,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1584298014640808,
"step": 1640,
"valid_targets_mean": 10531.7,
"valid_targets_min": 2030
},
{
"epoch": 0.9705014749262537,
"grad_norm": 0.21788762425717897,
"learning_rate": 3.893457163947165e-05,
"loss": 0.4203,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12848243117332458,
"step": 1645,
"valid_targets_mean": 8572.2,
"valid_targets_min": 1302
},
{
"epoch": 0.9734513274336283,
"grad_norm": 0.2259553001628983,
"learning_rate": 3.892126683722709e-05,
"loss": 0.4304,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15158626437187195,
"step": 1650,
"valid_targets_mean": 10365.0,
"valid_targets_min": 1880
},
{
"epoch": 0.976401179941003,
"grad_norm": 0.19968783409752863,
"learning_rate": 3.890788177809407e-05,
"loss": 0.4333,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16649773716926575,
"step": 1655,
"valid_targets_mean": 11930.6,
"valid_targets_min": 1431
},
{
"epoch": 0.9793510324483776,
"grad_norm": 0.19109065781129364,
"learning_rate": 3.8894416518846984e-05,
"loss": 0.4244,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14009195566177368,
"step": 1660,
"valid_targets_mean": 10015.8,
"valid_targets_min": 1439
},
{
"epoch": 0.9823008849557522,
"grad_norm": 0.20147950450173913,
"learning_rate": 3.88808711166004e-05,
"loss": 0.4264,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15372982621192932,
"step": 1665,
"valid_targets_mean": 10110.8,
"valid_targets_min": 2130
},
{
"epoch": 0.9852507374631269,
"grad_norm": 0.20274757156010115,
"learning_rate": 3.886724562880878e-05,
"loss": 0.4287,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1347220540046692,
"step": 1670,
"valid_targets_mean": 9938.6,
"valid_targets_min": 1395
},
{
"epoch": 0.9882005899705014,
"grad_norm": 0.20933626991726081,
"learning_rate": 3.8853540113266356e-05,
"loss": 0.434,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.170450359582901,
"step": 1675,
"valid_targets_mean": 11508.6,
"valid_targets_min": 1832
},
{
"epoch": 0.9911504424778761,
"grad_norm": 0.1998299607341395,
"learning_rate": 3.883975462810673e-05,
"loss": 0.4221,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12960436940193176,
"step": 1680,
"valid_targets_mean": 9993.5,
"valid_targets_min": 2294
},
{
"epoch": 0.9941002949852508,
"grad_norm": 0.2747789084378386,
"learning_rate": 3.882588923180276e-05,
"loss": 0.427,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16216714680194855,
"step": 1685,
"valid_targets_mean": 11300.2,
"valid_targets_min": 1578
},
{
"epoch": 0.9970501474926253,
"grad_norm": 0.2060289370907001,
"learning_rate": 3.881194398316622e-05,
"loss": 0.4189,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13950684666633606,
"step": 1690,
"valid_targets_mean": 10239.3,
"valid_targets_min": 1636
},
{
"epoch": 1.0,
"grad_norm": 0.2060665846116573,
"learning_rate": 3.8797918941347605e-05,
"loss": 0.424,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1244438886642456,
"step": 1695,
"valid_targets_mean": 9906.2,
"valid_targets_min": 1715
},
{
"epoch": 1.0029498525073746,
"grad_norm": 0.2214317321286988,
"learning_rate": 3.878381416583587e-05,
"loss": 0.4111,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12244114279747009,
"step": 1700,
"valid_targets_mean": 8369.7,
"valid_targets_min": 1768
},
{
"epoch": 1.0058997050147493,
"grad_norm": 0.2436305117216246,
"learning_rate": 3.876962971645816e-05,
"loss": 0.4145,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12919296324253082,
"step": 1705,
"valid_targets_mean": 8753.0,
"valid_targets_min": 2256
},
{
"epoch": 1.008849557522124,
"grad_norm": 0.2541456145942789,
"learning_rate": 3.8755365653379554e-05,
"loss": 0.4147,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15090519189834595,
"step": 1710,
"valid_targets_mean": 10982.1,
"valid_targets_min": 1108
},
{
"epoch": 1.0117994100294985,
"grad_norm": 0.23014848454095105,
"learning_rate": 3.874102203710285e-05,
"loss": 0.4178,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13246405124664307,
"step": 1715,
"valid_targets_mean": 11002.4,
"valid_targets_min": 2056
},
{
"epoch": 1.0147492625368733,
"grad_norm": 0.22453946076727968,
"learning_rate": 3.8726598928468264e-05,
"loss": 0.4152,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1798960417509079,
"step": 1720,
"valid_targets_mean": 12538.0,
"valid_targets_min": 3339
},
{
"epoch": 1.0176991150442478,
"grad_norm": 0.2135015538264713,
"learning_rate": 3.871209638865319e-05,
"loss": 0.4176,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15504910051822662,
"step": 1725,
"valid_targets_mean": 11040.2,
"valid_targets_min": 993
},
{
"epoch": 1.0206489675516224,
"grad_norm": 0.2035972797318352,
"learning_rate": 3.8697514479171944e-05,
"loss": 0.4069,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15845829248428345,
"step": 1730,
"valid_targets_mean": 11769.6,
"valid_targets_min": 993
},
{
"epoch": 1.023598820058997,
"grad_norm": 0.21102734058214348,
"learning_rate": 3.868285326187549e-05,
"loss": 0.4087,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15515300631523132,
"step": 1735,
"valid_targets_mean": 12242.0,
"valid_targets_min": 1933
},
{
"epoch": 1.0265486725663717,
"grad_norm": 0.21414046560162203,
"learning_rate": 3.8668112798951186e-05,
"loss": 0.4084,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11055143177509308,
"step": 1740,
"valid_targets_mean": 8613.3,
"valid_targets_min": 1326
},
{
"epoch": 1.0294985250737463,
"grad_norm": 0.3490042762055538,
"learning_rate": 3.865329315292253e-05,
"loss": 0.4143,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15151363611221313,
"step": 1745,
"valid_targets_mean": 10904.8,
"valid_targets_min": 2374
},
{
"epoch": 1.0324483775811208,
"grad_norm": 0.19879886174283662,
"learning_rate": 3.863839438664888e-05,
"loss": 0.4077,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11457093805074692,
"step": 1750,
"valid_targets_mean": 9075.7,
"valid_targets_min": 1929
},
{
"epoch": 1.0353982300884956,
"grad_norm": 0.22408334317438344,
"learning_rate": 3.862341656332519e-05,
"loss": 0.4094,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12300422042608261,
"step": 1755,
"valid_targets_mean": 9564.1,
"valid_targets_min": 1758
},
{
"epoch": 1.0383480825958702,
"grad_norm": 0.20190523650308992,
"learning_rate": 3.8608359746481757e-05,
"loss": 0.4062,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12284660339355469,
"step": 1760,
"valid_targets_mean": 9423.4,
"valid_targets_min": 1229
},
{
"epoch": 1.0412979351032448,
"grad_norm": 0.1889811146160302,
"learning_rate": 3.859322399998391e-05,
"loss": 0.411,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11543569713830948,
"step": 1765,
"valid_targets_mean": 8829.8,
"valid_targets_min": 1326
},
{
"epoch": 1.0442477876106195,
"grad_norm": 0.20750598590889113,
"learning_rate": 3.85780093880318e-05,
"loss": 0.4168,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12260887026786804,
"step": 1770,
"valid_targets_mean": 9662.1,
"valid_targets_min": 1275
},
{
"epoch": 1.047197640117994,
"grad_norm": 0.22141314053223685,
"learning_rate": 3.856271597516007e-05,
"loss": 0.4148,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14068543910980225,
"step": 1775,
"valid_targets_mean": 10959.3,
"valid_targets_min": 638
},
{
"epoch": 1.0501474926253687,
"grad_norm": 0.21606621123216593,
"learning_rate": 3.8547343826237625e-05,
"loss": 0.4082,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1010463610291481,
"step": 1780,
"valid_targets_mean": 7978.1,
"valid_targets_min": 766
},
{
"epoch": 1.0530973451327434,
"grad_norm": 0.21156952456065437,
"learning_rate": 3.853189300646733e-05,
"loss": 0.4096,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12438692152500153,
"step": 1785,
"valid_targets_mean": 10245.8,
"valid_targets_min": 1763
},
{
"epoch": 1.056047197640118,
"grad_norm": 0.19194806585850302,
"learning_rate": 3.8516363581385744e-05,
"loss": 0.4219,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15674549341201782,
"step": 1790,
"valid_targets_mean": 11258.5,
"valid_targets_min": 1816
},
{
"epoch": 1.0589970501474926,
"grad_norm": 0.2107193241639981,
"learning_rate": 3.850075561686284e-05,
"loss": 0.4077,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1198762059211731,
"step": 1795,
"valid_targets_mean": 8000.7,
"valid_targets_min": 2223
},
{
"epoch": 1.0619469026548674,
"grad_norm": 0.2148666662551988,
"learning_rate": 3.848506917910173e-05,
"loss": 0.4149,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13810782134532928,
"step": 1800,
"valid_targets_mean": 10893.6,
"valid_targets_min": 1409
},
{
"epoch": 1.064896755162242,
"grad_norm": 0.19406443957944047,
"learning_rate": 3.846930433463837e-05,
"loss": 0.4143,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13573281466960907,
"step": 1805,
"valid_targets_mean": 10108.5,
"valid_targets_min": 1004
},
{
"epoch": 1.0678466076696165,
"grad_norm": 0.23058912274050483,
"learning_rate": 3.84534611503413e-05,
"loss": 0.4135,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1543012261390686,
"step": 1810,
"valid_targets_mean": 12145.3,
"valid_targets_min": 1885
},
{
"epoch": 1.0707964601769913,
"grad_norm": 0.21404882128297154,
"learning_rate": 3.843753969341133e-05,
"loss": 0.409,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17230772972106934,
"step": 1815,
"valid_targets_mean": 11707.7,
"valid_targets_min": 2484
},
{
"epoch": 1.0737463126843658,
"grad_norm": 0.21766349751933262,
"learning_rate": 3.84215400313813e-05,
"loss": 0.4123,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16566194593906403,
"step": 1820,
"valid_targets_mean": 10948.0,
"valid_targets_min": 1919
},
{
"epoch": 1.0766961651917404,
"grad_norm": 0.21941802778104524,
"learning_rate": 3.840546223211573e-05,
"loss": 0.413,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13953745365142822,
"step": 1825,
"valid_targets_mean": 10782.3,
"valid_targets_min": 1761
},
{
"epoch": 1.079646017699115,
"grad_norm": 0.21274994098907102,
"learning_rate": 3.8389306363810603e-05,
"loss": 0.4094,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12339918315410614,
"step": 1830,
"valid_targets_mean": 9099.6,
"valid_targets_min": 1580
},
{
"epoch": 1.0825958702064897,
"grad_norm": 0.22377623817685083,
"learning_rate": 3.837307249499304e-05,
"loss": 0.4092,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11521419882774353,
"step": 1835,
"valid_targets_mean": 9367.8,
"valid_targets_min": 1997
},
{
"epoch": 1.0855457227138643,
"grad_norm": 0.19797643732478384,
"learning_rate": 3.835676069452098e-05,
"loss": 0.4059,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17100510001182556,
"step": 1840,
"valid_targets_mean": 12947.3,
"valid_targets_min": 2121
},
{
"epoch": 1.0884955752212389,
"grad_norm": 0.21865904068357092,
"learning_rate": 3.834037103158294e-05,
"loss": 0.4127,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11623190343379974,
"step": 1845,
"valid_targets_mean": 9119.2,
"valid_targets_min": 581
},
{
"epoch": 1.0914454277286136,
"grad_norm": 0.19819166759077297,
"learning_rate": 3.832390357569771e-05,
"loss": 0.4113,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13250255584716797,
"step": 1850,
"valid_targets_mean": 10413.7,
"valid_targets_min": 1747
},
{
"epoch": 1.0943952802359882,
"grad_norm": 0.2137794724256389,
"learning_rate": 3.830735839671402e-05,
"loss": 0.414,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1471385657787323,
"step": 1855,
"valid_targets_mean": 10754.2,
"valid_targets_min": 2854
},
{
"epoch": 1.0973451327433628,
"grad_norm": 0.20180269762632919,
"learning_rate": 3.829073556481031e-05,
"loss": 0.4046,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11916483938694,
"step": 1860,
"valid_targets_mean": 9007.5,
"valid_targets_min": 1396
},
{
"epoch": 1.1002949852507375,
"grad_norm": 0.1967635045770067,
"learning_rate": 3.827403515049435e-05,
"loss": 0.4079,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09877189993858337,
"step": 1865,
"valid_targets_mean": 8820.8,
"valid_targets_min": 1666
},
{
"epoch": 1.103244837758112,
"grad_norm": 0.21494925676253426,
"learning_rate": 3.8257257224603017e-05,
"loss": 0.41,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13791577517986298,
"step": 1870,
"valid_targets_mean": 10300.9,
"valid_targets_min": 1870
},
{
"epoch": 1.1061946902654867,
"grad_norm": 0.20240256675457352,
"learning_rate": 3.824040185830196e-05,
"loss": 0.4183,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15127933025360107,
"step": 1875,
"valid_targets_mean": 10301.0,
"valid_targets_min": 1872
},
{
"epoch": 1.1091445427728615,
"grad_norm": 0.19891739705938485,
"learning_rate": 3.82234691230853e-05,
"loss": 0.4178,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11647451668977737,
"step": 1880,
"valid_targets_mean": 8726.2,
"valid_targets_min": 1376
},
{
"epoch": 1.112094395280236,
"grad_norm": 0.22683438639070486,
"learning_rate": 3.82064590907753e-05,
"loss": 0.4165,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13766145706176758,
"step": 1885,
"valid_targets_mean": 9197.0,
"valid_targets_min": 1423
},
{
"epoch": 1.1150442477876106,
"grad_norm": 0.21204497029633457,
"learning_rate": 3.818937183352214e-05,
"loss": 0.4118,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13173851370811462,
"step": 1890,
"valid_targets_mean": 10090.6,
"valid_targets_min": 1763
},
{
"epoch": 1.1179941002949851,
"grad_norm": 0.2040720064717632,
"learning_rate": 3.81722074238035e-05,
"loss": 0.4054,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14814019203186035,
"step": 1895,
"valid_targets_mean": 12130.7,
"valid_targets_min": 2016
},
{
"epoch": 1.12094395280236,
"grad_norm": 0.20133866889947288,
"learning_rate": 3.815496593442437e-05,
"loss": 0.4061,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15776057541370392,
"step": 1900,
"valid_targets_mean": 12728.4,
"valid_targets_min": 2160
},
{
"epoch": 1.1238938053097345,
"grad_norm": 0.20242503749135837,
"learning_rate": 3.813764743851665e-05,
"loss": 0.4141,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15720617771148682,
"step": 1905,
"valid_targets_mean": 10916.8,
"valid_targets_min": 1351
},
{
"epoch": 1.1268436578171093,
"grad_norm": 0.208072373800863,
"learning_rate": 3.812025200953886e-05,
"loss": 0.4127,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1405029296875,
"step": 1910,
"valid_targets_mean": 9711.5,
"valid_targets_min": 1453
},
{
"epoch": 1.1297935103244838,
"grad_norm": 0.21335388533193136,
"learning_rate": 3.8102779721275876e-05,
"loss": 0.4187,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11071514338254929,
"step": 1915,
"valid_targets_mean": 7793.0,
"valid_targets_min": 2061
},
{
"epoch": 1.1327433628318584,
"grad_norm": 0.20639777456737793,
"learning_rate": 3.808523064783855e-05,
"loss": 0.4093,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15259069204330444,
"step": 1920,
"valid_targets_mean": 10522.3,
"valid_targets_min": 2051
},
{
"epoch": 1.135693215339233,
"grad_norm": 0.20238312463667626,
"learning_rate": 3.806760486366346e-05,
"loss": 0.4094,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12089171260595322,
"step": 1925,
"valid_targets_mean": 9354.5,
"valid_targets_min": 1660
},
{
"epoch": 1.1386430678466077,
"grad_norm": 0.20356162120879506,
"learning_rate": 3.8049902443512545e-05,
"loss": 0.4075,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11329087615013123,
"step": 1930,
"valid_targets_mean": 8649.6,
"valid_targets_min": 1301
},
{
"epoch": 1.1415929203539823,
"grad_norm": 0.1804088599383834,
"learning_rate": 3.803212346247279e-05,
"loss": 0.4055,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1426897943019867,
"step": 1935,
"valid_targets_mean": 10430.0,
"valid_targets_min": 880
},
{
"epoch": 1.1445427728613569,
"grad_norm": 0.2271543333220535,
"learning_rate": 3.801426799595594e-05,
"loss": 0.4107,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14367930591106415,
"step": 1940,
"valid_targets_mean": 10661.6,
"valid_targets_min": 1734
},
{
"epoch": 1.1474926253687316,
"grad_norm": 0.1928149869518129,
"learning_rate": 3.799633611969816e-05,
"loss": 0.403,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12169966101646423,
"step": 1945,
"valid_targets_mean": 10279.0,
"valid_targets_min": 1395
},
{
"epoch": 1.1504424778761062,
"grad_norm": 0.21134894803857232,
"learning_rate": 3.7978327909759724e-05,
"loss": 0.4067,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12604662775993347,
"step": 1950,
"valid_targets_mean": 8528.5,
"valid_targets_min": 2313
},
{
"epoch": 1.1533923303834808,
"grad_norm": 0.20396072826134254,
"learning_rate": 3.796024344252468e-05,
"loss": 0.4106,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1569386124610901,
"step": 1955,
"valid_targets_mean": 11313.9,
"valid_targets_min": 1467
},
{
"epoch": 1.1563421828908556,
"grad_norm": 0.22194681338512706,
"learning_rate": 3.7942082794700515e-05,
"loss": 0.4094,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1357463002204895,
"step": 1960,
"valid_targets_mean": 10597.4,
"valid_targets_min": 2147
},
{
"epoch": 1.1592920353982301,
"grad_norm": 0.20539906350360473,
"learning_rate": 3.7923846043317865e-05,
"loss": 0.4109,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1538807451725006,
"step": 1965,
"valid_targets_mean": 12742.9,
"valid_targets_min": 1402
},
{
"epoch": 1.1622418879056047,
"grad_norm": 0.20120409032277925,
"learning_rate": 3.790553326573016e-05,
"loss": 0.4127,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13526630401611328,
"step": 1970,
"valid_targets_mean": 10137.4,
"valid_targets_min": 1357
},
{
"epoch": 1.1651917404129795,
"grad_norm": 0.21338986564297552,
"learning_rate": 3.788714453961331e-05,
"loss": 0.4113,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13483178615570068,
"step": 1975,
"valid_targets_mean": 10012.6,
"valid_targets_min": 2316
},
{
"epoch": 1.168141592920354,
"grad_norm": 0.21188408754979535,
"learning_rate": 3.786867994296535e-05,
"loss": 0.411,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1392839252948761,
"step": 1980,
"valid_targets_mean": 9308.8,
"valid_targets_min": 1282
},
{
"epoch": 1.1710914454277286,
"grad_norm": 0.2039564451558122,
"learning_rate": 3.785013955410617e-05,
"loss": 0.4065,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09764277935028076,
"step": 1985,
"valid_targets_mean": 8041.7,
"valid_targets_min": 1623
},
{
"epoch": 1.1740412979351031,
"grad_norm": 0.19136114966992632,
"learning_rate": 3.783152345167711e-05,
"loss": 0.4097,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12284572422504425,
"step": 1990,
"valid_targets_mean": 9104.2,
"valid_targets_min": 2701
},
{
"epoch": 1.176991150442478,
"grad_norm": 0.1916739509383337,
"learning_rate": 3.781283171464065e-05,
"loss": 0.4158,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13541018962860107,
"step": 1995,
"valid_targets_mean": 9892.2,
"valid_targets_min": 1543
},
{
"epoch": 1.1799410029498525,
"grad_norm": 0.21980881264220392,
"learning_rate": 3.779406442228012e-05,
"loss": 0.4089,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13939528167247772,
"step": 2000,
"valid_targets_mean": 8413.7,
"valid_targets_min": 1348
},
{
"epoch": 1.182890855457227,
"grad_norm": 0.25391048063546057,
"learning_rate": 3.777522165419929e-05,
"loss": 0.4147,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12453456223011017,
"step": 2005,
"valid_targets_mean": 9011.9,
"valid_targets_min": 1258
},
{
"epoch": 1.1858407079646018,
"grad_norm": 0.1946857583209541,
"learning_rate": 3.77563034903221e-05,
"loss": 0.4094,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13194556534290314,
"step": 2010,
"valid_targets_mean": 10724.9,
"valid_targets_min": 1737
},
{
"epoch": 1.1887905604719764,
"grad_norm": 0.19693826294861733,
"learning_rate": 3.773731001089227e-05,
"loss": 0.4166,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14914648234844208,
"step": 2015,
"valid_targets_mean": 11330.2,
"valid_targets_min": 2645
},
{
"epoch": 1.191740412979351,
"grad_norm": 0.2073049850541922,
"learning_rate": 3.771824129647299e-05,
"loss": 0.4112,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12241712957620621,
"step": 2020,
"valid_targets_mean": 8752.2,
"valid_targets_min": 1943
},
{
"epoch": 1.1946902654867257,
"grad_norm": 0.2085637489120309,
"learning_rate": 3.7699097427946556e-05,
"loss": 0.4122,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13761894404888153,
"step": 2025,
"valid_targets_mean": 10287.4,
"valid_targets_min": 1357
},
{
"epoch": 1.1976401179941003,
"grad_norm": 0.222453588302852,
"learning_rate": 3.7679878486514066e-05,
"loss": 0.4078,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14405113458633423,
"step": 2030,
"valid_targets_mean": 11753.1,
"valid_targets_min": 2172
},
{
"epoch": 1.2005899705014749,
"grad_norm": 0.24169539701661746,
"learning_rate": 3.7660584553695015e-05,
"loss": 0.4062,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13349585235118866,
"step": 2035,
"valid_targets_mean": 10826.9,
"valid_targets_min": 1833
},
{
"epoch": 1.2035398230088497,
"grad_norm": 0.2108273326549157,
"learning_rate": 3.7641215711327016e-05,
"loss": 0.4074,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12320627272129059,
"step": 2040,
"valid_targets_mean": 8298.7,
"valid_targets_min": 2118
},
{
"epoch": 1.2064896755162242,
"grad_norm": 0.20442694007571818,
"learning_rate": 3.762177204156539e-05,
"loss": 0.4084,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14502795040607452,
"step": 2045,
"valid_targets_mean": 10686.5,
"valid_targets_min": 1710
},
{
"epoch": 1.2094395280235988,
"grad_norm": 0.19955409878173785,
"learning_rate": 3.760225362688287e-05,
"loss": 0.4121,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1251523792743683,
"step": 2050,
"valid_targets_mean": 10852.7,
"valid_targets_min": 1179
},
{
"epoch": 1.2123893805309733,
"grad_norm": 0.2103406530212919,
"learning_rate": 3.758266055006922e-05,
"loss": 0.4137,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1394679844379425,
"step": 2055,
"valid_targets_mean": 9916.9,
"valid_targets_min": 2572
},
{
"epoch": 1.2153392330383481,
"grad_norm": 0.23099560954553897,
"learning_rate": 3.756299289423089e-05,
"loss": 0.4115,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13078881800174713,
"step": 2060,
"valid_targets_mean": 9324.3,
"valid_targets_min": 2445
},
{
"epoch": 1.2182890855457227,
"grad_norm": 0.20192145184305313,
"learning_rate": 3.7543250742790676e-05,
"loss": 0.4105,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13179230690002441,
"step": 2065,
"valid_targets_mean": 9231.1,
"valid_targets_min": 1873
},
{
"epoch": 1.2212389380530975,
"grad_norm": 0.2248883000903419,
"learning_rate": 3.752343417948734e-05,
"loss": 0.4097,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14653357863426208,
"step": 2070,
"valid_targets_mean": 10349.4,
"valid_targets_min": 898
},
{
"epoch": 1.224188790560472,
"grad_norm": 0.19674161802721363,
"learning_rate": 3.750354328837529e-05,
"loss": 0.4045,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12419191002845764,
"step": 2075,
"valid_targets_mean": 9958.1,
"valid_targets_min": 2833
},
{
"epoch": 1.2271386430678466,
"grad_norm": 0.2040519297416266,
"learning_rate": 3.748357815382419e-05,
"loss": 0.4061,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13978463411331177,
"step": 2080,
"valid_targets_mean": 9267.8,
"valid_targets_min": 1924
},
{
"epoch": 1.2300884955752212,
"grad_norm": 0.1935700879911901,
"learning_rate": 3.746353886051862e-05,
"loss": 0.4131,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14617498219013214,
"step": 2085,
"valid_targets_mean": 11356.9,
"valid_targets_min": 1715
},
{
"epoch": 1.233038348082596,
"grad_norm": 0.20323760274797556,
"learning_rate": 3.7443425493457735e-05,
"loss": 0.4028,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15078863501548767,
"step": 2090,
"valid_targets_mean": 9942.5,
"valid_targets_min": 2202
},
{
"epoch": 1.2359882005899705,
"grad_norm": 0.19237355834888428,
"learning_rate": 3.7423238137954835e-05,
"loss": 0.4027,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12100933492183685,
"step": 2095,
"valid_targets_mean": 9043.8,
"valid_targets_min": 2039
},
{
"epoch": 1.238938053097345,
"grad_norm": 0.19405452277576316,
"learning_rate": 3.74029768796371e-05,
"loss": 0.4126,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12515579164028168,
"step": 2100,
"valid_targets_mean": 10029.0,
"valid_targets_min": 2074
},
{
"epoch": 1.2418879056047198,
"grad_norm": 0.1918975786310472,
"learning_rate": 3.7382641804445136e-05,
"loss": 0.4101,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13490715622901917,
"step": 2105,
"valid_targets_mean": 12080.2,
"valid_targets_min": 1794
},
{
"epoch": 1.2448377581120944,
"grad_norm": 0.22948564571877864,
"learning_rate": 3.73622329986327e-05,
"loss": 0.4081,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14957517385482788,
"step": 2110,
"valid_targets_mean": 10673.3,
"valid_targets_min": 1919
},
{
"epoch": 1.247787610619469,
"grad_norm": 0.1956858906108937,
"learning_rate": 3.734175054876626e-05,
"loss": 0.4018,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13325190544128418,
"step": 2115,
"valid_targets_mean": 10177.9,
"valid_targets_min": 816
},
{
"epoch": 1.2507374631268435,
"grad_norm": 0.20690628762099494,
"learning_rate": 3.7321194541724625e-05,
"loss": 0.4055,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1585572063922882,
"step": 2120,
"valid_targets_mean": 11231.2,
"valid_targets_min": 2275
},
{
"epoch": 1.2536873156342183,
"grad_norm": 0.1958247690154711,
"learning_rate": 3.7300565064698664e-05,
"loss": 0.4057,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11031612753868103,
"step": 2125,
"valid_targets_mean": 8387.8,
"valid_targets_min": 1395
},
{
"epoch": 1.2566371681415929,
"grad_norm": 0.2249780519965779,
"learning_rate": 3.727986220519085e-05,
"loss": 0.4014,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15190738439559937,
"step": 2130,
"valid_targets_mean": 10092.2,
"valid_targets_min": 1533
},
{
"epoch": 1.2595870206489677,
"grad_norm": 0.19232542968979785,
"learning_rate": 3.7259086051014896e-05,
"loss": 0.4125,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13802318274974823,
"step": 2135,
"valid_targets_mean": 11030.4,
"valid_targets_min": 1781
},
{
"epoch": 1.2625368731563422,
"grad_norm": 0.21055352053943993,
"learning_rate": 3.7238236690295433e-05,
"loss": 0.4106,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12079479545354843,
"step": 2140,
"valid_targets_mean": 8386.0,
"valid_targets_min": 1623
},
{
"epoch": 1.2654867256637168,
"grad_norm": 0.21340054364438876,
"learning_rate": 3.7217314211467615e-05,
"loss": 0.4113,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1280185729265213,
"step": 2145,
"valid_targets_mean": 9386.7,
"valid_targets_min": 2248
},
{
"epoch": 1.2684365781710913,
"grad_norm": 0.19654827232796557,
"learning_rate": 3.7196318703276695e-05,
"loss": 0.412,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12935896217823029,
"step": 2150,
"valid_targets_mean": 10851.2,
"valid_targets_min": 1999
},
{
"epoch": 1.2713864306784661,
"grad_norm": 0.18684413906547542,
"learning_rate": 3.717525025477772e-05,
"loss": 0.4107,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12971490621566772,
"step": 2155,
"valid_targets_mean": 10156.7,
"valid_targets_min": 1575
},
{
"epoch": 1.2743362831858407,
"grad_norm": 0.20131635339460882,
"learning_rate": 3.715410895533511e-05,
"loss": 0.4128,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1318942904472351,
"step": 2160,
"valid_targets_mean": 9176.0,
"valid_targets_min": 1819
},
{
"epoch": 1.2772861356932155,
"grad_norm": 0.20005532418427976,
"learning_rate": 3.713289489462231e-05,
"loss": 0.4093,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12302594631910324,
"step": 2165,
"valid_targets_mean": 9579.9,
"valid_targets_min": 1936
},
{
"epoch": 1.28023598820059,
"grad_norm": 0.1987319890122761,
"learning_rate": 3.711160816262136e-05,
"loss": 0.4038,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13187222182750702,
"step": 2170,
"valid_targets_mean": 10588.2,
"valid_targets_min": 2210
},
{
"epoch": 1.2831858407079646,
"grad_norm": 0.20569943718314818,
"learning_rate": 3.7090248849622575e-05,
"loss": 0.4108,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1288871467113495,
"step": 2175,
"valid_targets_mean": 9435.7,
"valid_targets_min": 1343
},
{
"epoch": 1.2861356932153392,
"grad_norm": 0.19481024413783074,
"learning_rate": 3.7068817046224106e-05,
"loss": 0.4121,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1117725670337677,
"step": 2180,
"valid_targets_mean": 8765.1,
"valid_targets_min": 2181
},
{
"epoch": 1.289085545722714,
"grad_norm": 0.2075955871038273,
"learning_rate": 3.7047312843331596e-05,
"loss": 0.4058,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13937462866306305,
"step": 2185,
"valid_targets_mean": 11306.6,
"valid_targets_min": 1251
},
{
"epoch": 1.2920353982300885,
"grad_norm": 0.1966624832512414,
"learning_rate": 3.702573633215778e-05,
"loss": 0.4082,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1228807345032692,
"step": 2190,
"valid_targets_mean": 8945.6,
"valid_targets_min": 2289
},
{
"epoch": 1.294985250737463,
"grad_norm": 0.17735257514071073,
"learning_rate": 3.700408760422209e-05,
"loss": 0.4114,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13248281180858612,
"step": 2195,
"valid_targets_mean": 10275.5,
"valid_targets_min": 2173
},
{
"epoch": 1.2979351032448379,
"grad_norm": 0.20566850050832683,
"learning_rate": 3.698236675135027e-05,
"loss": 0.4068,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12011992931365967,
"step": 2200,
"valid_targets_mean": 9283.0,
"valid_targets_min": 1861
},
{
"epoch": 1.3008849557522124,
"grad_norm": 0.19471925424106384,
"learning_rate": 3.696057386567401e-05,
"loss": 0.4039,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11719102412462234,
"step": 2205,
"valid_targets_mean": 8844.1,
"valid_targets_min": 1562
},
{
"epoch": 1.303834808259587,
"grad_norm": 0.20677025054702694,
"learning_rate": 3.6938709039630514e-05,
"loss": 0.4088,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11571133136749268,
"step": 2210,
"valid_targets_mean": 9628.9,
"valid_targets_min": 2723
},
{
"epoch": 1.3067846607669615,
"grad_norm": 0.19386983627829316,
"learning_rate": 3.6916772365962146e-05,
"loss": 0.4071,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14339354634284973,
"step": 2215,
"valid_targets_mean": 9824.7,
"valid_targets_min": 2124
},
{
"epoch": 1.3097345132743363,
"grad_norm": 0.20733483530915647,
"learning_rate": 3.689476393771601e-05,
"loss": 0.4087,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16114959120750427,
"step": 2220,
"valid_targets_mean": 10805.5,
"valid_targets_min": 1645
},
{
"epoch": 1.3126843657817109,
"grad_norm": 0.2074662286669484,
"learning_rate": 3.687268384824358e-05,
"loss": 0.4065,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1201554462313652,
"step": 2225,
"valid_targets_mean": 8827.6,
"valid_targets_min": 1488
},
{
"epoch": 1.3156342182890857,
"grad_norm": 0.20787590103008372,
"learning_rate": 3.685053219120027e-05,
"loss": 0.4076,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1468854397535324,
"step": 2230,
"valid_targets_mean": 9714.4,
"valid_targets_min": 1897
},
{
"epoch": 1.3185840707964602,
"grad_norm": 0.2130181150365414,
"learning_rate": 3.682830906054508e-05,
"loss": 0.4033,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13946279883384705,
"step": 2235,
"valid_targets_mean": 10670.6,
"valid_targets_min": 1889
},
{
"epoch": 1.3215339233038348,
"grad_norm": 0.19106711316771613,
"learning_rate": 3.680601455054015e-05,
"loss": 0.4112,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15019375085830688,
"step": 2240,
"valid_targets_mean": 10592.3,
"valid_targets_min": 2458
},
{
"epoch": 1.3244837758112094,
"grad_norm": 0.19726641284267823,
"learning_rate": 3.6783648755750384e-05,
"loss": 0.4007,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17111629247665405,
"step": 2245,
"valid_targets_mean": 13763.0,
"valid_targets_min": 1776
},
{
"epoch": 1.3274336283185841,
"grad_norm": 0.18422082465731265,
"learning_rate": 3.6761211771043094e-05,
"loss": 0.4085,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12834113836288452,
"step": 2250,
"valid_targets_mean": 10454.7,
"valid_targets_min": 1719
},
{
"epoch": 1.3303834808259587,
"grad_norm": 0.18180812278892167,
"learning_rate": 3.673870369158749e-05,
"loss": 0.4103,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14465734362602234,
"step": 2255,
"valid_targets_mean": 9654.4,
"valid_targets_min": 1351
},
{
"epoch": 1.3333333333333333,
"grad_norm": 0.1895037587937176,
"learning_rate": 3.671612461285439e-05,
"loss": 0.4026,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13590912520885468,
"step": 2260,
"valid_targets_mean": 10966.7,
"valid_targets_min": 1919
},
{
"epoch": 1.336283185840708,
"grad_norm": 0.18289571304655325,
"learning_rate": 3.6693474630615723e-05,
"loss": 0.4093,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14450351893901825,
"step": 2265,
"valid_targets_mean": 10623.2,
"valid_targets_min": 2312
},
{
"epoch": 1.3392330383480826,
"grad_norm": 0.19387794145565707,
"learning_rate": 3.6670753840944196e-05,
"loss": 0.4113,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14855991303920746,
"step": 2270,
"valid_targets_mean": 11599.1,
"valid_targets_min": 1690
},
{
"epoch": 1.3421828908554572,
"grad_norm": 0.2129132270060968,
"learning_rate": 3.6647962340212845e-05,
"loss": 0.4001,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12970374524593353,
"step": 2275,
"valid_targets_mean": 10497.8,
"valid_targets_min": 1494
},
{
"epoch": 1.3451327433628317,
"grad_norm": 0.20779965227080616,
"learning_rate": 3.6625100225094624e-05,
"loss": 0.4107,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1262437105178833,
"step": 2280,
"valid_targets_mean": 9126.5,
"valid_targets_min": 2499
},
{
"epoch": 1.3480825958702065,
"grad_norm": 0.2017390741108949,
"learning_rate": 3.660216759256202e-05,
"loss": 0.4135,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14283165335655212,
"step": 2285,
"valid_targets_mean": 10106.3,
"valid_targets_min": 1729
},
{
"epoch": 1.351032448377581,
"grad_norm": 0.18994227000395517,
"learning_rate": 3.657916453988663e-05,
"loss": 0.4039,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12617641687393188,
"step": 2290,
"valid_targets_mean": 10339.8,
"valid_targets_min": 1135
},
{
"epoch": 1.3539823008849559,
"grad_norm": 0.2119826690671679,
"learning_rate": 3.655609116463874e-05,
"loss": 0.3999,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15031850337982178,
"step": 2295,
"valid_targets_mean": 10505.3,
"valid_targets_min": 1982
},
{
"epoch": 1.3569321533923304,
"grad_norm": 0.21767299900598155,
"learning_rate": 3.65329475646869e-05,
"loss": 0.4034,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11701009422540665,
"step": 2300,
"valid_targets_mean": 8692.3,
"valid_targets_min": 2029
},
{
"epoch": 1.359882005899705,
"grad_norm": 0.2183834292919999,
"learning_rate": 3.6509733838197564e-05,
"loss": 0.4101,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16395114362239838,
"step": 2305,
"valid_targets_mean": 11298.5,
"valid_targets_min": 2026
},
{
"epoch": 1.3628318584070795,
"grad_norm": 0.18901010572773513,
"learning_rate": 3.648645008363462e-05,
"loss": 0.4063,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13451609015464783,
"step": 2310,
"valid_targets_mean": 11260.0,
"valid_targets_min": 1881
},
{
"epoch": 1.3657817109144543,
"grad_norm": 0.2048497137635517,
"learning_rate": 3.646309639975897e-05,
"loss": 0.4068,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13462871313095093,
"step": 2315,
"valid_targets_mean": 8625.0,
"valid_targets_min": 1667
},
{
"epoch": 1.368731563421829,
"grad_norm": 0.19236734583414303,
"learning_rate": 3.6439672885628166e-05,
"loss": 0.4088,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13107746839523315,
"step": 2320,
"valid_targets_mean": 9656.2,
"valid_targets_min": 934
},
{
"epoch": 1.3716814159292037,
"grad_norm": 0.19053766648018297,
"learning_rate": 3.6416179640595915e-05,
"loss": 0.4053,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13497191667556763,
"step": 2325,
"valid_targets_mean": 9664.0,
"valid_targets_min": 1144
},
{
"epoch": 1.3746312684365782,
"grad_norm": 0.19300409834685217,
"learning_rate": 3.639261676431173e-05,
"loss": 0.409,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1307114213705063,
"step": 2330,
"valid_targets_mean": 9555.0,
"valid_targets_min": 1431
},
{
"epoch": 1.3775811209439528,
"grad_norm": 0.1915293402622118,
"learning_rate": 3.636898435672045e-05,
"loss": 0.4086,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14565394818782806,
"step": 2335,
"valid_targets_mean": 11355.8,
"valid_targets_min": 1551
},
{
"epoch": 1.3805309734513274,
"grad_norm": 0.18757009262408111,
"learning_rate": 3.6345282518061854e-05,
"loss": 0.4081,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13044847548007965,
"step": 2340,
"valid_targets_mean": 9336.7,
"valid_targets_min": 1510
},
{
"epoch": 1.3834808259587021,
"grad_norm": 0.21574355726659275,
"learning_rate": 3.6321511348870216e-05,
"loss": 0.4108,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14156800508499146,
"step": 2345,
"valid_targets_mean": 10439.0,
"valid_targets_min": 950
},
{
"epoch": 1.3864306784660767,
"grad_norm": 0.2220379252664554,
"learning_rate": 3.629767094997387e-05,
"loss": 0.4085,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1283535361289978,
"step": 2350,
"valid_targets_mean": 9239.7,
"valid_targets_min": 1882
},
{
"epoch": 1.3893805309734513,
"grad_norm": 0.20889828514195585,
"learning_rate": 3.6273761422494835e-05,
"loss": 0.4069,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11462993174791336,
"step": 2355,
"valid_targets_mean": 8878.3,
"valid_targets_min": 1276
},
{
"epoch": 1.392330383480826,
"grad_norm": 0.1971508256806736,
"learning_rate": 3.6249782867848305e-05,
"loss": 0.414,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12239646911621094,
"step": 2360,
"valid_targets_mean": 9431.4,
"valid_targets_min": 1698
},
{
"epoch": 1.3952802359882006,
"grad_norm": 0.20606399593524655,
"learning_rate": 3.622573538774227e-05,
"loss": 0.4012,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1392350047826767,
"step": 2365,
"valid_targets_mean": 9600.9,
"valid_targets_min": 2070
},
{
"epoch": 1.3982300884955752,
"grad_norm": 0.2006887696751807,
"learning_rate": 3.620161908417711e-05,
"loss": 0.413,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13277579843997955,
"step": 2370,
"valid_targets_mean": 9258.9,
"valid_targets_min": 2322
},
{
"epoch": 1.4011799410029497,
"grad_norm": 0.2143607038766854,
"learning_rate": 3.6177434059445094e-05,
"loss": 0.4103,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14542219042778015,
"step": 2375,
"valid_targets_mean": 11005.1,
"valid_targets_min": 1545
},
{
"epoch": 1.4041297935103245,
"grad_norm": 0.19051154679740112,
"learning_rate": 3.615318041612998e-05,
"loss": 0.4,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1375996470451355,
"step": 2380,
"valid_targets_mean": 10616.3,
"valid_targets_min": 1536
},
{
"epoch": 1.407079646017699,
"grad_norm": 0.18605652703530892,
"learning_rate": 3.612885825710659e-05,
"loss": 0.4071,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16152793169021606,
"step": 2385,
"valid_targets_mean": 11486.4,
"valid_targets_min": 518
},
{
"epoch": 1.4100294985250739,
"grad_norm": 0.1952639376391805,
"learning_rate": 3.610446768554037e-05,
"loss": 0.409,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13920962810516357,
"step": 2390,
"valid_targets_mean": 9616.6,
"valid_targets_min": 1230
},
{
"epoch": 1.4129793510324484,
"grad_norm": 0.18753466403054453,
"learning_rate": 3.608000880488694e-05,
"loss": 0.403,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12460490316152573,
"step": 2395,
"valid_targets_mean": 8952.7,
"valid_targets_min": 1587
},
{
"epoch": 1.415929203539823,
"grad_norm": 0.20751763054816902,
"learning_rate": 3.6055481718891664e-05,
"loss": 0.406,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15804365277290344,
"step": 2400,
"valid_targets_mean": 11414.2,
"valid_targets_min": 3387
},
{
"epoch": 1.4188790560471976,
"grad_norm": 0.22456567480775044,
"learning_rate": 3.603088653158919e-05,
"loss": 0.4021,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18407636880874634,
"step": 2405,
"valid_targets_mean": 12465.5,
"valid_targets_min": 1710
},
{
"epoch": 1.4218289085545723,
"grad_norm": 0.1897115624902503,
"learning_rate": 3.6006223347303055e-05,
"loss": 0.3964,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15461409091949463,
"step": 2410,
"valid_targets_mean": 10231.8,
"valid_targets_min": 2259
},
{
"epoch": 1.424778761061947,
"grad_norm": 0.18663608515655314,
"learning_rate": 3.5981492270645186e-05,
"loss": 0.3995,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14762979745864868,
"step": 2415,
"valid_targets_mean": 13320.7,
"valid_targets_min": 1376
},
{
"epoch": 1.4277286135693215,
"grad_norm": 0.18670962136513533,
"learning_rate": 3.5956693406515514e-05,
"loss": 0.3911,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10723703354597092,
"step": 2420,
"valid_targets_mean": 8426.0,
"valid_targets_min": 1654
},
{
"epoch": 1.4306784660766962,
"grad_norm": 0.21110550552454987,
"learning_rate": 3.5931826860101464e-05,
"loss": 0.3964,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11997527629137039,
"step": 2425,
"valid_targets_mean": 8610.3,
"valid_targets_min": 2335
},
{
"epoch": 1.4336283185840708,
"grad_norm": 0.1927862790503147,
"learning_rate": 3.590689273687757e-05,
"loss": 0.3953,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12968887388706207,
"step": 2430,
"valid_targets_mean": 9733.9,
"valid_targets_min": 2604
},
{
"epoch": 1.4365781710914454,
"grad_norm": 0.18845839982483642,
"learning_rate": 3.588189114260499e-05,
"loss": 0.3929,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10686099529266357,
"step": 2435,
"valid_targets_mean": 7887.3,
"valid_targets_min": 961
},
{
"epoch": 1.43952802359882,
"grad_norm": 0.1913639955229515,
"learning_rate": 3.585682218333108e-05,
"loss": 0.3973,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1498546153306961,
"step": 2440,
"valid_targets_mean": 12008.4,
"valid_targets_min": 3631
},
{
"epoch": 1.4424778761061947,
"grad_norm": 0.19182583587682012,
"learning_rate": 3.583168596538891e-05,
"loss": 0.4034,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14093820750713348,
"step": 2445,
"valid_targets_mean": 11155.2,
"valid_targets_min": 2731
},
{
"epoch": 1.4454277286135693,
"grad_norm": 0.20882085785585852,
"learning_rate": 3.580648259539686e-05,
"loss": 0.3912,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13466665148735046,
"step": 2450,
"valid_targets_mean": 10674.4,
"valid_targets_min": 1317
},
{
"epoch": 1.448377581120944,
"grad_norm": 0.1999862673806767,
"learning_rate": 3.578121218025814e-05,
"loss": 0.395,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15615367889404297,
"step": 2455,
"valid_targets_mean": 11136.4,
"valid_targets_min": 1890
},
{
"epoch": 1.4513274336283186,
"grad_norm": 0.21154653827787115,
"learning_rate": 3.5755874827160324e-05,
"loss": 0.3973,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16489741206169128,
"step": 2460,
"valid_targets_mean": 12538.8,
"valid_targets_min": 1856
},
{
"epoch": 1.4542772861356932,
"grad_norm": 0.20865259658756602,
"learning_rate": 3.573047064357492e-05,
"loss": 0.4061,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15276436507701874,
"step": 2465,
"valid_targets_mean": 11351.3,
"valid_targets_min": 1738
},
{
"epoch": 1.4572271386430677,
"grad_norm": 0.21166081933048564,
"learning_rate": 3.5704999737256923e-05,
"loss": 0.3961,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10980367660522461,
"step": 2470,
"valid_targets_mean": 9638.6,
"valid_targets_min": 2769
},
{
"epoch": 1.4601769911504425,
"grad_norm": 0.20547766161198802,
"learning_rate": 3.567946221624431e-05,
"loss": 0.3965,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13496387004852295,
"step": 2475,
"valid_targets_mean": 10217.3,
"valid_targets_min": 1867
},
{
"epoch": 1.463126843657817,
"grad_norm": 0.20272356539276168,
"learning_rate": 3.5653858188857637e-05,
"loss": 0.3933,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13152998685836792,
"step": 2480,
"valid_targets_mean": 10830.1,
"valid_targets_min": 2056
},
{
"epoch": 1.4660766961651919,
"grad_norm": 0.1928236170984883,
"learning_rate": 3.5628187763699545e-05,
"loss": 0.3916,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10376954078674316,
"step": 2485,
"valid_targets_mean": 8065.7,
"valid_targets_min": 2250
},
{
"epoch": 1.4690265486725664,
"grad_norm": 0.20906690195005687,
"learning_rate": 3.560245104965431e-05,
"loss": 0.3981,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1269378960132599,
"step": 2490,
"valid_targets_mean": 10655.2,
"valid_targets_min": 2555
},
{
"epoch": 1.471976401179941,
"grad_norm": 0.2046303448144277,
"learning_rate": 3.5576648155887366e-05,
"loss": 0.395,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14142167568206787,
"step": 2495,
"valid_targets_mean": 11071.5,
"valid_targets_min": 860
},
{
"epoch": 1.4749262536873156,
"grad_norm": 0.20599363038669596,
"learning_rate": 3.555077919184489e-05,
"loss": 0.3894,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15158352255821228,
"step": 2500,
"valid_targets_mean": 11408.9,
"valid_targets_min": 2015
},
{
"epoch": 1.4778761061946903,
"grad_norm": 0.1788204164478249,
"learning_rate": 3.552484426725329e-05,
"loss": 0.3966,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10846086591482162,
"step": 2505,
"valid_targets_mean": 9568.1,
"valid_targets_min": 1913
},
{
"epoch": 1.480825958702065,
"grad_norm": 0.1923751273446749,
"learning_rate": 3.549884349211874e-05,
"loss": 0.4,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12155988812446594,
"step": 2510,
"valid_targets_mean": 9056.0,
"valid_targets_min": 1585
},
{
"epoch": 1.4837758112094395,
"grad_norm": 0.20639266762873654,
"learning_rate": 3.5472776976726734e-05,
"loss": 0.393,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15222719311714172,
"step": 2515,
"valid_targets_mean": 13044.3,
"valid_targets_min": 2160
},
{
"epoch": 1.4867256637168142,
"grad_norm": 0.22266275834029062,
"learning_rate": 3.5446644831641614e-05,
"loss": 0.3987,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10895134508609772,
"step": 2520,
"valid_targets_mean": 9486.9,
"valid_targets_min": 1543
},
{
"epoch": 1.4896755162241888,
"grad_norm": 0.21384271957343456,
"learning_rate": 3.54204471677061e-05,
"loss": 0.3968,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11045604944229126,
"step": 2525,
"valid_targets_mean": 9637.9,
"valid_targets_min": 1453
},
{
"epoch": 1.4926253687315634,
"grad_norm": 0.21759058269956286,
"learning_rate": 3.539418409604082e-05,
"loss": 0.3988,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1656768023967743,
"step": 2530,
"valid_targets_mean": 11221.1,
"valid_targets_min": 1861
},
{
"epoch": 1.495575221238938,
"grad_norm": 0.22306265795961336,
"learning_rate": 3.536785572804383e-05,
"loss": 0.3984,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11005926877260208,
"step": 2535,
"valid_targets_mean": 7896.7,
"valid_targets_min": 1601
},
{
"epoch": 1.4985250737463127,
"grad_norm": 0.18758579596156683,
"learning_rate": 3.534146217539016e-05,
"loss": 0.3996,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14364221692085266,
"step": 2540,
"valid_targets_mean": 11206.3,
"valid_targets_min": 2567
},
{
"epoch": 1.5014749262536873,
"grad_norm": 0.2141138193508478,
"learning_rate": 3.531500355003131e-05,
"loss": 0.3885,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13702622056007385,
"step": 2545,
"valid_targets_mean": 9940.7,
"valid_targets_min": 1487
},
{
"epoch": 1.504424778761062,
"grad_norm": 0.20617771305195218,
"learning_rate": 3.528847996419481e-05,
"loss": 0.3954,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1305457502603531,
"step": 2550,
"valid_targets_mean": 9426.9,
"valid_targets_min": 1920
},
{
"epoch": 1.5073746312684366,
"grad_norm": 0.22125729323813947,
"learning_rate": 3.526189153038372e-05,
"loss": 0.3979,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11197060346603394,
"step": 2555,
"valid_targets_mean": 7889.9,
"valid_targets_min": 1997
},
{
"epoch": 1.5103244837758112,
"grad_norm": 0.20228311822774708,
"learning_rate": 3.523523836137617e-05,
"loss": 0.3895,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10877414047718048,
"step": 2560,
"valid_targets_mean": 8702.3,
"valid_targets_min": 2150
},
{
"epoch": 1.5132743362831858,
"grad_norm": 0.1924749677621517,
"learning_rate": 3.5208520570224865e-05,
"loss": 0.3871,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15349164605140686,
"step": 2565,
"valid_targets_mean": 11533.9,
"valid_targets_min": 1871
},
{
"epoch": 1.5162241887905603,
"grad_norm": 0.22515634811956609,
"learning_rate": 3.5181738270256595e-05,
"loss": 0.3818,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12597164511680603,
"step": 2570,
"valid_targets_mean": 10099.0,
"valid_targets_min": 2449
},
{
"epoch": 1.519174041297935,
"grad_norm": 0.20497870920040415,
"learning_rate": 3.5154891575071816e-05,
"loss": 0.3881,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1445295214653015,
"step": 2575,
"valid_targets_mean": 10613.0,
"valid_targets_min": 1767
},
{
"epoch": 1.5221238938053099,
"grad_norm": 0.19355635363854126,
"learning_rate": 3.512798059854409e-05,
"loss": 0.3984,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.132507786154747,
"step": 2580,
"valid_targets_mean": 9735.8,
"valid_targets_min": 1444
},
{
"epoch": 1.5250737463126844,
"grad_norm": 0.19422329710559866,
"learning_rate": 3.510100545481964e-05,
"loss": 0.4035,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1423739790916443,
"step": 2585,
"valid_targets_mean": 12089.4,
"valid_targets_min": 1483
},
{
"epoch": 1.528023598820059,
"grad_norm": 0.20363806304130708,
"learning_rate": 3.507396625831687e-05,
"loss": 0.3989,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1374133825302124,
"step": 2590,
"valid_targets_mean": 9522.6,
"valid_targets_min": 747
},
{
"epoch": 1.5309734513274336,
"grad_norm": 0.20209241704309913,
"learning_rate": 3.504686312372587e-05,
"loss": 0.3859,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09004460275173187,
"step": 2595,
"valid_targets_mean": 6589.8,
"valid_targets_min": 1001
},
{
"epoch": 1.5339233038348081,
"grad_norm": 0.20549443606621662,
"learning_rate": 3.5019696166007936e-05,
"loss": 0.4004,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1255984753370285,
"step": 2600,
"valid_targets_mean": 8307.7,
"valid_targets_min": 1442
},
{
"epoch": 1.536873156342183,
"grad_norm": 0.189294083469522,
"learning_rate": 3.499246550039506e-05,
"loss": 0.3899,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12242449820041656,
"step": 2605,
"valid_targets_mean": 9174.5,
"valid_targets_min": 2099
},
{
"epoch": 1.5398230088495575,
"grad_norm": 0.223437837939735,
"learning_rate": 3.4965171242389485e-05,
"loss": 0.3918,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13413646817207336,
"step": 2610,
"valid_targets_mean": 9977.2,
"valid_targets_min": 1385
},
{
"epoch": 1.5427728613569323,
"grad_norm": 0.1946804583428626,
"learning_rate": 3.4937813507763155e-05,
"loss": 0.3947,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10855253040790558,
"step": 2615,
"valid_targets_mean": 8322.1,
"valid_targets_min": 2131
},
{
"epoch": 1.5457227138643068,
"grad_norm": 0.1996768663383723,
"learning_rate": 3.491039241255729e-05,
"loss": 0.4003,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13678157329559326,
"step": 2620,
"valid_targets_mean": 10406.2,
"valid_targets_min": 1407
},
{
"epoch": 1.5486725663716814,
"grad_norm": 0.19472478670325657,
"learning_rate": 3.488290807308186e-05,
"loss": 0.3882,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14884641766548157,
"step": 2625,
"valid_targets_mean": 12493.9,
"valid_targets_min": 2457
},
{
"epoch": 1.551622418879056,
"grad_norm": 0.19161386368368877,
"learning_rate": 3.485536060591507e-05,
"loss": 0.3876,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11435461044311523,
"step": 2630,
"valid_targets_mean": 9960.1,
"valid_targets_min": 2052
},
{
"epoch": 1.5545722713864307,
"grad_norm": 0.2149406169132456,
"learning_rate": 3.482775012790289e-05,
"loss": 0.4006,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11524064838886261,
"step": 2635,
"valid_targets_mean": 8378.8,
"valid_targets_min": 1560
},
{
"epoch": 1.5575221238938053,
"grad_norm": 0.1976686009933042,
"learning_rate": 3.48000767561586e-05,
"loss": 0.3914,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11932376027107239,
"step": 2640,
"valid_targets_mean": 9472.5,
"valid_targets_min": 2484
},
{
"epoch": 1.56047197640118,
"grad_norm": 0.1986083979866418,
"learning_rate": 3.47723406080622e-05,
"loss": 0.3959,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12804947793483734,
"step": 2645,
"valid_targets_mean": 10299.2,
"valid_targets_min": 878
},
{
"epoch": 1.5634218289085546,
"grad_norm": 0.19875678796513913,
"learning_rate": 3.474454180125998e-05,
"loss": 0.3951,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.138924703001976,
"step": 2650,
"valid_targets_mean": 10887.9,
"valid_targets_min": 2125
},
{
"epoch": 1.5663716814159292,
"grad_norm": 0.208010638626533,
"learning_rate": 3.4716680453664034e-05,
"loss": 0.3918,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16505074501037598,
"step": 2655,
"valid_targets_mean": 12573.0,
"valid_targets_min": 2048
},
{
"epoch": 1.5693215339233038,
"grad_norm": 0.2113806560061952,
"learning_rate": 3.4688756683451687e-05,
"loss": 0.3976,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1205722764134407,
"step": 2660,
"valid_targets_mean": 9179.3,
"valid_targets_min": 1147
},
{
"epoch": 1.5722713864306783,
"grad_norm": 0.19990820921293187,
"learning_rate": 3.466077060906507e-05,
"loss": 0.3867,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13424262404441833,
"step": 2665,
"valid_targets_mean": 10706.8,
"valid_targets_min": 1593
},
{
"epoch": 1.575221238938053,
"grad_norm": 0.2035721175968825,
"learning_rate": 3.4632722349210554e-05,
"loss": 0.3915,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1269957721233368,
"step": 2670,
"valid_targets_mean": 9218.1,
"valid_targets_min": 2137
},
{
"epoch": 1.5781710914454279,
"grad_norm": 0.19354321221920615,
"learning_rate": 3.4604612022858306e-05,
"loss": 0.3947,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14735949039459229,
"step": 2675,
"valid_targets_mean": 11224.7,
"valid_targets_min": 1822
},
{
"epoch": 1.5811209439528024,
"grad_norm": 0.23544262059333004,
"learning_rate": 3.457643974924174e-05,
"loss": 0.3909,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1378946602344513,
"step": 2680,
"valid_targets_mean": 11156.6,
"valid_targets_min": 1606
},
{
"epoch": 1.584070796460177,
"grad_norm": 0.20303218282604443,
"learning_rate": 3.4548205647857035e-05,
"loss": 0.3902,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1464405059814453,
"step": 2685,
"valid_targets_mean": 10960.1,
"valid_targets_min": 1556
},
{
"epoch": 1.5870206489675516,
"grad_norm": 0.19961288753135736,
"learning_rate": 3.451990983846262e-05,
"loss": 0.3945,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11880732327699661,
"step": 2690,
"valid_targets_mean": 9461.7,
"valid_targets_min": 1929
},
{
"epoch": 1.5899705014749261,
"grad_norm": 0.22630238402236566,
"learning_rate": 3.4491552441078654e-05,
"loss": 0.3995,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13695894181728363,
"step": 2695,
"valid_targets_mean": 9745.5,
"valid_targets_min": 1581
},
{
"epoch": 1.592920353982301,
"grad_norm": 0.22240211592749506,
"learning_rate": 3.446313357598655e-05,
"loss": 0.3871,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13270913064479828,
"step": 2700,
"valid_targets_mean": 10080.6,
"valid_targets_min": 2923
},
{
"epoch": 1.5958702064896755,
"grad_norm": 0.20453988006624954,
"learning_rate": 3.443465336372842e-05,
"loss": 0.3861,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12554414570331573,
"step": 2705,
"valid_targets_mean": 8127.2,
"valid_targets_min": 1571
},
{
"epoch": 1.5988200589970503,
"grad_norm": 0.19769030059580794,
"learning_rate": 3.4406111925106596e-05,
"loss": 0.3961,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12743881344795227,
"step": 2710,
"valid_targets_mean": 10449.8,
"valid_targets_min": 1912
},
{
"epoch": 1.6017699115044248,
"grad_norm": 0.21819544409639086,
"learning_rate": 3.437750938118312e-05,
"loss": 0.3941,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11632522940635681,
"step": 2715,
"valid_targets_mean": 8532.2,
"valid_targets_min": 1791
},
{
"epoch": 1.6047197640117994,
"grad_norm": 0.19796092409366658,
"learning_rate": 3.434884585327922e-05,
"loss": 0.3957,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13927127420902252,
"step": 2720,
"valid_targets_mean": 11387.8,
"valid_targets_min": 2003
},
{
"epoch": 1.607669616519174,
"grad_norm": 0.20029936745164265,
"learning_rate": 3.4320121462974766e-05,
"loss": 0.3955,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12672072649002075,
"step": 2725,
"valid_targets_mean": 9229.9,
"valid_targets_min": 2522
},
{
"epoch": 1.6106194690265485,
"grad_norm": 0.1872592104723706,
"learning_rate": 3.429133633210782e-05,
"loss": 0.392,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1504121869802475,
"step": 2730,
"valid_targets_mean": 12198.8,
"valid_targets_min": 1675
},
{
"epoch": 1.6135693215339233,
"grad_norm": 0.186467265613796,
"learning_rate": 3.426249058277407e-05,
"loss": 0.3946,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12724050879478455,
"step": 2735,
"valid_targets_mean": 10017.0,
"valid_targets_min": 1776
},
{
"epoch": 1.616519174041298,
"grad_norm": 0.17773999259250345,
"learning_rate": 3.423358433732631e-05,
"loss": 0.3929,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1229085773229599,
"step": 2740,
"valid_targets_mean": 10342.0,
"valid_targets_min": 1961
},
{
"epoch": 1.6194690265486726,
"grad_norm": 0.17658621399418326,
"learning_rate": 3.420461771837396e-05,
"loss": 0.3936,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12835684418678284,
"step": 2745,
"valid_targets_mean": 9962.6,
"valid_targets_min": 2405
},
{
"epoch": 1.6224188790560472,
"grad_norm": 0.20031625945910475,
"learning_rate": 3.4175590848782495e-05,
"loss": 0.3938,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1081707626581192,
"step": 2750,
"valid_targets_mean": 8304.7,
"valid_targets_min": 1978
},
{
"epoch": 1.6253687315634218,
"grad_norm": 0.20896474694567252,
"learning_rate": 3.414650385167298e-05,
"loss": 0.3912,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14379850029945374,
"step": 2755,
"valid_targets_mean": 12342.4,
"valid_targets_min": 2187
},
{
"epoch": 1.6283185840707963,
"grad_norm": 0.20182015995158958,
"learning_rate": 3.4117356850421485e-05,
"loss": 0.3922,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12928926944732666,
"step": 2760,
"valid_targets_mean": 9165.0,
"valid_targets_min": 832
},
{
"epoch": 1.631268436578171,
"grad_norm": 0.20103812781549815,
"learning_rate": 3.408814996865863e-05,
"loss": 0.3928,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1281728893518448,
"step": 2765,
"valid_targets_mean": 10573.9,
"valid_targets_min": 2386
},
{
"epoch": 1.6342182890855457,
"grad_norm": 0.18029541909036872,
"learning_rate": 3.4058883330268995e-05,
"loss": 0.4005,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1050175353884697,
"step": 2770,
"valid_targets_mean": 8261.4,
"valid_targets_min": 1439
},
{
"epoch": 1.6371681415929205,
"grad_norm": 0.2012413957828967,
"learning_rate": 3.402955705939065e-05,
"loss": 0.4041,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14012792706489563,
"step": 2775,
"valid_targets_mean": 9847.7,
"valid_targets_min": 1767
},
{
"epoch": 1.640117994100295,
"grad_norm": 0.19178800924013567,
"learning_rate": 3.400017128041459e-05,
"loss": 0.3934,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15238690376281738,
"step": 2780,
"valid_targets_mean": 13030.2,
"valid_targets_min": 2483
},
{
"epoch": 1.6430678466076696,
"grad_norm": 0.19419884624460312,
"learning_rate": 3.397072611798421e-05,
"loss": 0.3903,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11771540343761444,
"step": 2785,
"valid_targets_mean": 9731.1,
"valid_targets_min": 1703
},
{
"epoch": 1.6460176991150441,
"grad_norm": 0.19910500058317934,
"learning_rate": 3.394122169699482e-05,
"loss": 0.3925,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13526403903961182,
"step": 2790,
"valid_targets_mean": 10780.1,
"valid_targets_min": 1649
},
{
"epoch": 1.648967551622419,
"grad_norm": 0.18202549756014805,
"learning_rate": 3.3911658142593044e-05,
"loss": 0.3993,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13593779504299164,
"step": 2795,
"valid_targets_mean": 10743.4,
"valid_targets_min": 1801
},
{
"epoch": 1.6519174041297935,
"grad_norm": 0.19194239646892167,
"learning_rate": 3.388203558017636e-05,
"loss": 0.4012,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10597368329763412,
"step": 2800,
"valid_targets_mean": 9102.6,
"valid_targets_min": 1830
},
{
"epoch": 1.6548672566371683,
"grad_norm": 0.1852839602364545,
"learning_rate": 3.3852354135392534e-05,
"loss": 0.3906,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11317931115627289,
"step": 2805,
"valid_targets_mean": 9400.9,
"valid_targets_min": 1853
},
{
"epoch": 1.6578171091445428,
"grad_norm": 0.19090895235342278,
"learning_rate": 3.382261393413905e-05,
"loss": 0.3841,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1284770369529724,
"step": 2810,
"valid_targets_mean": 10114.0,
"valid_targets_min": 2144
},
{
"epoch": 1.6607669616519174,
"grad_norm": 0.2029009930014119,
"learning_rate": 3.3792815102562646e-05,
"loss": 0.3825,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13038460910320282,
"step": 2815,
"valid_targets_mean": 9553.2,
"valid_targets_min": 2181
},
{
"epoch": 1.663716814159292,
"grad_norm": 0.20663093892181367,
"learning_rate": 3.3762957767058764e-05,
"loss": 0.3948,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13431856036186218,
"step": 2820,
"valid_targets_mean": 9748.7,
"valid_targets_min": 856
},
{
"epoch": 1.6666666666666665,
"grad_norm": 0.18749624837860834,
"learning_rate": 3.373304205427096e-05,
"loss": 0.3959,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14476144313812256,
"step": 2825,
"valid_targets_mean": 12207.3,
"valid_targets_min": 2941
},
{
"epoch": 1.6696165191740413,
"grad_norm": 0.188979400398134,
"learning_rate": 3.370306809109043e-05,
"loss": 0.3919,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11705923080444336,
"step": 2830,
"valid_targets_mean": 9607.7,
"valid_targets_min": 1480
},
{
"epoch": 1.672566371681416,
"grad_norm": 0.1822789862555373,
"learning_rate": 3.367303600465543e-05,
"loss": 0.4009,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12379142642021179,
"step": 2835,
"valid_targets_mean": 10516.6,
"valid_targets_min": 1750
},
{
"epoch": 1.6755162241887906,
"grad_norm": 0.19514377116590026,
"learning_rate": 3.364294592235077e-05,
"loss": 0.393,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1143941879272461,
"step": 2840,
"valid_targets_mean": 9166.2,
"valid_targets_min": 2342
},
{
"epoch": 1.6784660766961652,
"grad_norm": 0.1995337838648031,
"learning_rate": 3.361279797180724e-05,
"loss": 0.3945,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15227705240249634,
"step": 2845,
"valid_targets_mean": 10198.2,
"valid_targets_min": 1888
},
{
"epoch": 1.6814159292035398,
"grad_norm": 0.19203783654469914,
"learning_rate": 3.358259228090109e-05,
"loss": 0.3936,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13235729932785034,
"step": 2850,
"valid_targets_mean": 9976.0,
"valid_targets_min": 1591
},
{
"epoch": 1.6843657817109143,
"grad_norm": 0.1976180105398448,
"learning_rate": 3.3552328977753506e-05,
"loss": 0.3903,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1187744140625,
"step": 2855,
"valid_targets_mean": 8667.3,
"valid_targets_min": 1636
},
{
"epoch": 1.6873156342182891,
"grad_norm": 0.19202804434606036,
"learning_rate": 3.3522008190730004e-05,
"loss": 0.394,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15723806619644165,
"step": 2860,
"valid_targets_mean": 11671.9,
"valid_targets_min": 1372
},
{
"epoch": 1.6902654867256637,
"grad_norm": 0.19925777636796418,
"learning_rate": 3.349163004843995e-05,
"loss": 0.3946,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11505947262048721,
"step": 2865,
"valid_targets_mean": 8705.5,
"valid_targets_min": 788
},
{
"epoch": 1.6932153392330385,
"grad_norm": 0.20575461925435287,
"learning_rate": 3.346119467973598e-05,
"loss": 0.3958,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13286572694778442,
"step": 2870,
"valid_targets_mean": 10789.9,
"valid_targets_min": 1629
},
{
"epoch": 1.696165191740413,
"grad_norm": 0.195789852899565,
"learning_rate": 3.343070221371347e-05,
"loss": 0.3993,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12431154400110245,
"step": 2875,
"valid_targets_mean": 9820.9,
"valid_targets_min": 2079
},
{
"epoch": 1.6991150442477876,
"grad_norm": 0.19085369231753674,
"learning_rate": 3.340015277970998e-05,
"loss": 0.3911,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11652038991451263,
"step": 2880,
"valid_targets_mean": 9519.0,
"valid_targets_min": 1443
},
{
"epoch": 1.7020648967551621,
"grad_norm": 0.18434544444359915,
"learning_rate": 3.33695465073047e-05,
"loss": 0.3913,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12810981273651123,
"step": 2885,
"valid_targets_mean": 11148.6,
"valid_targets_min": 2844
},
{
"epoch": 1.7050147492625367,
"grad_norm": 0.19182102586594751,
"learning_rate": 3.3338883526317915e-05,
"loss": 0.3953,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16361527144908905,
"step": 2890,
"valid_targets_mean": 11772.3,
"valid_targets_min": 2041
},
{
"epoch": 1.7079646017699115,
"grad_norm": 0.18685253615301253,
"learning_rate": 3.3308163966810446e-05,
"loss": 0.3908,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12067534029483795,
"step": 2895,
"valid_targets_mean": 9464.2,
"valid_targets_min": 2006
},
{
"epoch": 1.7109144542772863,
"grad_norm": 0.18789090242459708,
"learning_rate": 3.3277387959083086e-05,
"loss": 0.3959,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11749487370252609,
"step": 2900,
"valid_targets_mean": 10115.8,
"valid_targets_min": 2033
},
{
"epoch": 1.7138643067846608,
"grad_norm": 0.19142845485695198,
"learning_rate": 3.324655563367608e-05,
"loss": 0.3865,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10298315435647964,
"step": 2905,
"valid_targets_mean": 8914.2,
"valid_targets_min": 1829
},
{
"epoch": 1.7168141592920354,
"grad_norm": 0.19266959518709054,
"learning_rate": 3.3215667121368536e-05,
"loss": 0.3883,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14745637774467468,
"step": 2910,
"valid_targets_mean": 11594.1,
"valid_targets_min": 1466
},
{
"epoch": 1.71976401179941,
"grad_norm": 0.19916980056432732,
"learning_rate": 3.3184722553177886e-05,
"loss": 0.3887,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13046494126319885,
"step": 2915,
"valid_targets_mean": 10735.3,
"valid_targets_min": 1786
},
{
"epoch": 1.7227138643067845,
"grad_norm": 0.18897005780526288,
"learning_rate": 3.3153722060359345e-05,
"loss": 0.3903,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13529415428638458,
"step": 2920,
"valid_targets_mean": 11454.9,
"valid_targets_min": 2305
},
{
"epoch": 1.7256637168141593,
"grad_norm": 0.19134823925494687,
"learning_rate": 3.312266577440533e-05,
"loss": 0.3965,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11531375348567963,
"step": 2925,
"valid_targets_mean": 9119.2,
"valid_targets_min": 933
},
{
"epoch": 1.7286135693215339,
"grad_norm": 0.2730744331613668,
"learning_rate": 3.30915538270449e-05,
"loss": 0.3965,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11113665252923965,
"step": 2930,
"valid_targets_mean": 9410.8,
"valid_targets_min": 1837
},
{
"epoch": 1.7315634218289087,
"grad_norm": 0.1840969708035178,
"learning_rate": 3.306038635024323e-05,
"loss": 0.3881,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1135941594839096,
"step": 2935,
"valid_targets_mean": 9461.3,
"valid_targets_min": 1841
},
{
"epoch": 1.7345132743362832,
"grad_norm": 0.19348029772223146,
"learning_rate": 3.302916347620102e-05,
"loss": 0.393,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1548248678445816,
"step": 2940,
"valid_targets_mean": 12400.2,
"valid_targets_min": 2042
},
{
"epoch": 1.7374631268436578,
"grad_norm": 0.18252156946800238,
"learning_rate": 3.299788533735393e-05,
"loss": 0.3936,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15255288779735565,
"step": 2945,
"valid_targets_mean": 12530.3,
"valid_targets_min": 2926
},
{
"epoch": 1.7404129793510323,
"grad_norm": 0.18125067932284578,
"learning_rate": 3.296655206637205e-05,
"loss": 0.3924,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1404009312391281,
"step": 2950,
"valid_targets_mean": 10509.6,
"valid_targets_min": 649
},
{
"epoch": 1.7433628318584071,
"grad_norm": 0.17493040232422627,
"learning_rate": 3.293516379615933e-05,
"loss": 0.3896,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12707272171974182,
"step": 2955,
"valid_targets_mean": 9454.0,
"valid_targets_min": 2003
},
{
"epoch": 1.7463126843657817,
"grad_norm": 0.19612154842958732,
"learning_rate": 3.2903720659852973e-05,
"loss": 0.3929,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12193826586008072,
"step": 2960,
"valid_targets_mean": 9103.6,
"valid_targets_min": 1608
},
{
"epoch": 1.7492625368731565,
"grad_norm": 0.18257690930740766,
"learning_rate": 3.287222279082294e-05,
"loss": 0.3893,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12374929338693619,
"step": 2965,
"valid_targets_mean": 9436.6,
"valid_targets_min": 2137
},
{
"epoch": 1.752212389380531,
"grad_norm": 0.18167704644036603,
"learning_rate": 3.2840670322671316e-05,
"loss": 0.3882,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12390658259391785,
"step": 2970,
"valid_targets_mean": 9747.0,
"valid_targets_min": 1135
},
{
"epoch": 1.7551622418879056,
"grad_norm": 0.1965094558740685,
"learning_rate": 3.28090633892318e-05,
"loss": 0.3937,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1370033472776413,
"step": 2975,
"valid_targets_mean": 10079.6,
"valid_targets_min": 2286
},
{
"epoch": 1.7581120943952802,
"grad_norm": 0.19269690309905338,
"learning_rate": 3.277740212456909e-05,
"loss": 0.3996,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1356833130121231,
"step": 2980,
"valid_targets_mean": 10582.6,
"valid_targets_min": 1657
},
{
"epoch": 1.7610619469026547,
"grad_norm": 0.1952694338389336,
"learning_rate": 3.2745686662978355e-05,
"loss": 0.3977,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1223859190940857,
"step": 2985,
"valid_targets_mean": 8869.7,
"valid_targets_min": 1883
},
{
"epoch": 1.7640117994100295,
"grad_norm": 0.20350950152630534,
"learning_rate": 3.2713917138984634e-05,
"loss": 0.3838,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13408294320106506,
"step": 2990,
"valid_targets_mean": 10999.8,
"valid_targets_min": 1608
},
{
"epoch": 1.7669616519174043,
"grad_norm": 0.19334915963802546,
"learning_rate": 3.268209368734229e-05,
"loss": 0.392,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.129969522356987,
"step": 2995,
"valid_targets_mean": 10845.2,
"valid_targets_min": 1769
},
{
"epoch": 1.7699115044247788,
"grad_norm": 0.18099169248601887,
"learning_rate": 3.265021644303441e-05,
"loss": 0.3905,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13780558109283447,
"step": 3000,
"valid_targets_mean": 11583.4,
"valid_targets_min": 2726
},
{
"epoch": 1.7728613569321534,
"grad_norm": 0.1896969180469815,
"learning_rate": 3.261828554127227e-05,
"loss": 0.3881,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11599138379096985,
"step": 3005,
"valid_targets_mean": 9023.2,
"valid_targets_min": 1719
},
{
"epoch": 1.775811209439528,
"grad_norm": 0.19063468212727738,
"learning_rate": 3.258630111749474e-05,
"loss": 0.3905,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15030834078788757,
"step": 3010,
"valid_targets_mean": 11621.1,
"valid_targets_min": 1627
},
{
"epoch": 1.7787610619469025,
"grad_norm": 0.20924962814002224,
"learning_rate": 3.255426330736768e-05,
"loss": 0.3865,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15606912970542908,
"step": 3015,
"valid_targets_mean": 10227.8,
"valid_targets_min": 2542
},
{
"epoch": 1.7817109144542773,
"grad_norm": 0.18928326396508474,
"learning_rate": 3.252217224678342e-05,
"loss": 0.3839,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12054719030857086,
"step": 3020,
"valid_targets_mean": 8847.1,
"valid_targets_min": 2962
},
{
"epoch": 1.7846607669616519,
"grad_norm": 0.20098696420819967,
"learning_rate": 3.249002807186016e-05,
"loss": 0.3922,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.137400820851326,
"step": 3025,
"valid_targets_mean": 11824.5,
"valid_targets_min": 2336
},
{
"epoch": 1.7876106194690267,
"grad_norm": 0.19025621382762697,
"learning_rate": 3.2457830918941384e-05,
"loss": 0.3943,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1631835699081421,
"step": 3030,
"valid_targets_mean": 13422.8,
"valid_targets_min": 2469
},
{
"epoch": 1.7905604719764012,
"grad_norm": 0.1774868607110602,
"learning_rate": 3.242558092459529e-05,
"loss": 0.3915,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09473612904548645,
"step": 3035,
"valid_targets_mean": 8039.5,
"valid_targets_min": 1011
},
{
"epoch": 1.7935103244837758,
"grad_norm": 0.18665228670374476,
"learning_rate": 3.2393278225614205e-05,
"loss": 0.3901,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10702696442604065,
"step": 3040,
"valid_targets_mean": 8162.9,
"valid_targets_min": 1768
},
{
"epoch": 1.7964601769911503,
"grad_norm": 0.2199654108080235,
"learning_rate": 3.2360922959014014e-05,
"loss": 0.3902,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1379621922969818,
"step": 3045,
"valid_targets_mean": 9680.6,
"valid_targets_min": 1517
},
{
"epoch": 1.799410029498525,
"grad_norm": 0.22475118561788887,
"learning_rate": 3.232851526203359e-05,
"loss": 0.3902,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1337410807609558,
"step": 3050,
"valid_targets_mean": 10204.0,
"valid_targets_min": 1856
},
{
"epoch": 1.8023598820058997,
"grad_norm": 0.21577531073711217,
"learning_rate": 3.229605527213415e-05,
"loss": 0.3882,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1492527723312378,
"step": 3055,
"valid_targets_mean": 11088.9,
"valid_targets_min": 3033
},
{
"epoch": 1.8053097345132745,
"grad_norm": 0.1905308663972179,
"learning_rate": 3.2263543126998765e-05,
"loss": 0.3956,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11409647762775421,
"step": 3060,
"valid_targets_mean": 8808.9,
"valid_targets_min": 1628
},
{
"epoch": 1.808259587020649,
"grad_norm": 0.19650377661381702,
"learning_rate": 3.223097896453171e-05,
"loss": 0.3887,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13997744023799896,
"step": 3065,
"valid_targets_mean": 10004.9,
"valid_targets_min": 2090
},
{
"epoch": 1.8112094395280236,
"grad_norm": 0.2027973299079048,
"learning_rate": 3.2198362922857896e-05,
"loss": 0.3927,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13658654689788818,
"step": 3070,
"valid_targets_mean": 11585.9,
"valid_targets_min": 1578
},
{
"epoch": 1.8141592920353982,
"grad_norm": 0.20214465917193142,
"learning_rate": 3.216569514032229e-05,
"loss": 0.3878,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1428215205669403,
"step": 3075,
"valid_targets_mean": 10658.7,
"valid_targets_min": 1712
},
{
"epoch": 1.8171091445427727,
"grad_norm": 0.20351093437896298,
"learning_rate": 3.213297575548932e-05,
"loss": 0.3895,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14719177782535553,
"step": 3080,
"valid_targets_mean": 11714.4,
"valid_targets_min": 2874
},
{
"epoch": 1.8200589970501475,
"grad_norm": 0.2021762199445001,
"learning_rate": 3.210020490714231e-05,
"loss": 0.386,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10983000695705414,
"step": 3085,
"valid_targets_mean": 9205.3,
"valid_targets_min": 2733
},
{
"epoch": 1.823008849557522,
"grad_norm": 0.2079297438681715,
"learning_rate": 3.206738273428284e-05,
"loss": 0.3852,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10927362740039825,
"step": 3090,
"valid_targets_mean": 8837.8,
"valid_targets_min": 2032
},
{
"epoch": 1.8259587020648969,
"grad_norm": 0.2086646841099004,
"learning_rate": 3.2034509376130216e-05,
"loss": 0.3861,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1262950301170349,
"step": 3095,
"valid_targets_mean": 10313.7,
"valid_targets_min": 2037
},
{
"epoch": 1.8289085545722714,
"grad_norm": 0.1892482439759891,
"learning_rate": 3.200158497212083e-05,
"loss": 0.3928,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10493605583906174,
"step": 3100,
"valid_targets_mean": 8079.2,
"valid_targets_min": 1799
},
{
"epoch": 1.831858407079646,
"grad_norm": 0.20237233479384295,
"learning_rate": 3.1968609661907624e-05,
"loss": 0.3828,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15934070944786072,
"step": 3105,
"valid_targets_mean": 11687.4,
"valid_targets_min": 1660
},
{
"epoch": 1.8348082595870205,
"grad_norm": 0.19728440008329404,
"learning_rate": 3.193558358535944e-05,
"loss": 0.3953,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12290243059396744,
"step": 3110,
"valid_targets_mean": 9689.1,
"valid_targets_min": 1213
},
{
"epoch": 1.8377581120943953,
"grad_norm": 0.18298811670162993,
"learning_rate": 3.190250688256045e-05,
"loss": 0.391,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1717981994152069,
"step": 3115,
"valid_targets_mean": 13727.9,
"valid_targets_min": 2019
},
{
"epoch": 1.8407079646017699,
"grad_norm": 0.18698664444995303,
"learning_rate": 3.186937969380957e-05,
"loss": 0.3901,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10982745885848999,
"step": 3120,
"valid_targets_mean": 8408.8,
"valid_targets_min": 1770
},
{
"epoch": 1.8436578171091447,
"grad_norm": 0.20456556558122935,
"learning_rate": 3.183620215961987e-05,
"loss": 0.3943,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14105704426765442,
"step": 3125,
"valid_targets_mean": 10496.0,
"valid_targets_min": 1924
},
{
"epoch": 1.8466076696165192,
"grad_norm": 0.19477584095116424,
"learning_rate": 3.180297442071796e-05,
"loss": 0.3895,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.119300976395607,
"step": 3130,
"valid_targets_mean": 9131.2,
"valid_targets_min": 2712
},
{
"epoch": 1.8495575221238938,
"grad_norm": 0.20615521662254552,
"learning_rate": 3.176969661804338e-05,
"loss": 0.3902,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.128769189119339,
"step": 3135,
"valid_targets_mean": 8391.5,
"valid_targets_min": 1896
},
{
"epoch": 1.8525073746312684,
"grad_norm": 0.18706097563298538,
"learning_rate": 3.173636889274804e-05,
"loss": 0.3845,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12298412621021271,
"step": 3140,
"valid_targets_mean": 9973.9,
"valid_targets_min": 1874
},
{
"epoch": 1.855457227138643,
"grad_norm": 0.18296786256497324,
"learning_rate": 3.170299138619561e-05,
"loss": 0.3883,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13840444386005402,
"step": 3145,
"valid_targets_mean": 11387.2,
"valid_targets_min": 2079
},
{
"epoch": 1.8584070796460177,
"grad_norm": 0.18750099633802875,
"learning_rate": 3.16695642399609e-05,
"loss": 0.3885,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13286367058753967,
"step": 3150,
"valid_targets_mean": 9381.8,
"valid_targets_min": 1708
},
{
"epoch": 1.8613569321533925,
"grad_norm": 0.18499110557748116,
"learning_rate": 3.1636087595829265e-05,
"loss": 0.3942,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12365491688251495,
"step": 3155,
"valid_targets_mean": 8509.3,
"valid_targets_min": 1118
},
{
"epoch": 1.864306784660767,
"grad_norm": 0.1832860638035741,
"learning_rate": 3.160256159579604e-05,
"loss": 0.3941,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12997931241989136,
"step": 3160,
"valid_targets_mean": 10374.7,
"valid_targets_min": 2011
},
{
"epoch": 1.8672566371681416,
"grad_norm": 0.18516569508028138,
"learning_rate": 3.156898638206588e-05,
"loss": 0.3916,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15980814397335052,
"step": 3165,
"valid_targets_mean": 12519.0,
"valid_targets_min": 1887
},
{
"epoch": 1.8702064896755162,
"grad_norm": 0.19172567895750345,
"learning_rate": 3.153536209705219e-05,
"loss": 0.3863,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1256943941116333,
"step": 3170,
"valid_targets_mean": 9916.1,
"valid_targets_min": 1793
},
{
"epoch": 1.8731563421828907,
"grad_norm": 0.30905823355413986,
"learning_rate": 3.150168888337654e-05,
"loss": 0.3964,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14326061308383942,
"step": 3175,
"valid_targets_mean": 10340.9,
"valid_targets_min": 1125
},
{
"epoch": 1.8761061946902655,
"grad_norm": 0.18744713637296262,
"learning_rate": 3.1467966883868016e-05,
"loss": 0.3875,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13681210577487946,
"step": 3180,
"valid_targets_mean": 9584.5,
"valid_targets_min": 2028
},
{
"epoch": 1.87905604719764,
"grad_norm": 0.18734267628944543,
"learning_rate": 3.143419624156264e-05,
"loss": 0.3951,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14888234436511993,
"step": 3185,
"valid_targets_mean": 11590.9,
"valid_targets_min": 2261
},
{
"epoch": 1.8820058997050149,
"grad_norm": 0.19649116485647783,
"learning_rate": 3.140037709970277e-05,
"loss": 0.3897,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1408083736896515,
"step": 3190,
"valid_targets_mean": 11354.4,
"valid_targets_min": 1773
},
{
"epoch": 1.8849557522123894,
"grad_norm": 0.17818662817613437,
"learning_rate": 3.136650960173645e-05,
"loss": 0.3918,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12512937188148499,
"step": 3195,
"valid_targets_mean": 9635.8,
"valid_targets_min": 2187
},
{
"epoch": 1.887905604719764,
"grad_norm": 0.18895452708671834,
"learning_rate": 3.1332593891316866e-05,
"loss": 0.3846,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13278134167194366,
"step": 3200,
"valid_targets_mean": 10532.5,
"valid_targets_min": 1940
},
{
"epoch": 1.8908554572271385,
"grad_norm": 0.18407399327994156,
"learning_rate": 3.129863011230168e-05,
"loss": 0.3889,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13952814042568207,
"step": 3205,
"valid_targets_mean": 11384.6,
"valid_targets_min": 2096
},
{
"epoch": 1.893805309734513,
"grad_norm": 0.2037091941871826,
"learning_rate": 3.126461840875247e-05,
"loss": 0.3864,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12919670343399048,
"step": 3210,
"valid_targets_mean": 10272.5,
"valid_targets_min": 2815
},
{
"epoch": 1.896755162241888,
"grad_norm": 0.22168382970996411,
"learning_rate": 3.1230558924934056e-05,
"loss": 0.3926,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14533631503582,
"step": 3215,
"valid_targets_mean": 11145.4,
"valid_targets_min": 818
},
{
"epoch": 1.8997050147492627,
"grad_norm": 0.18055963902795616,
"learning_rate": 3.119645180531395e-05,
"loss": 0.3849,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.115432009100914,
"step": 3220,
"valid_targets_mean": 9275.6,
"valid_targets_min": 1757
},
{
"epoch": 1.9026548672566372,
"grad_norm": 0.20541231868387194,
"learning_rate": 3.11622971945617e-05,
"loss": 0.3895,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13783042132854462,
"step": 3225,
"valid_targets_mean": 10562.0,
"valid_targets_min": 1778
},
{
"epoch": 1.9056047197640118,
"grad_norm": 0.19273506769296583,
"learning_rate": 3.112809523754832e-05,
"loss": 0.3872,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12814044952392578,
"step": 3230,
"valid_targets_mean": 9969.5,
"valid_targets_min": 1957
},
{
"epoch": 1.9085545722713864,
"grad_norm": 0.18530212003507177,
"learning_rate": 3.109384607934562e-05,
"loss": 0.389,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14377827942371368,
"step": 3235,
"valid_targets_mean": 10153.2,
"valid_targets_min": 2191
},
{
"epoch": 1.911504424778761,
"grad_norm": 0.18959418284382742,
"learning_rate": 3.105954986522563e-05,
"loss": 0.3961,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10337518155574799,
"step": 3240,
"valid_targets_mean": 8849.2,
"valid_targets_min": 324
},
{
"epoch": 1.9144542772861357,
"grad_norm": 0.19079851081682211,
"learning_rate": 3.102520674065998e-05,
"loss": 0.3897,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13874873518943787,
"step": 3245,
"valid_targets_mean": 10924.6,
"valid_targets_min": 2710
},
{
"epoch": 1.9174041297935103,
"grad_norm": 0.1961476176724746,
"learning_rate": 3.099081685131927e-05,
"loss": 0.3918,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14250710606575012,
"step": 3250,
"valid_targets_mean": 11752.3,
"valid_targets_min": 1969
},
{
"epoch": 1.920353982300885,
"grad_norm": 0.1958977931346944,
"learning_rate": 3.0956380343072466e-05,
"loss": 0.3915,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15353846549987793,
"step": 3255,
"valid_targets_mean": 12698.6,
"valid_targets_min": 2768
},
{
"epoch": 1.9233038348082596,
"grad_norm": 0.1997870314794016,
"learning_rate": 3.092189736198625e-05,
"loss": 0.3929,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12486180663108826,
"step": 3260,
"valid_targets_mean": 10104.6,
"valid_targets_min": 1652
},
{
"epoch": 1.9262536873156342,
"grad_norm": 0.20616461880710768,
"learning_rate": 3.0887368054324456e-05,
"loss": 0.3939,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13557863235473633,
"step": 3265,
"valid_targets_mean": 11014.7,
"valid_targets_min": 1872
},
{
"epoch": 1.9292035398230087,
"grad_norm": 0.2131487654674189,
"learning_rate": 3.08527925665474e-05,
"loss": 0.3868,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13005343079566956,
"step": 3270,
"valid_targets_mean": 10039.7,
"valid_targets_min": 2777
},
{
"epoch": 1.9321533923303835,
"grad_norm": 0.19008851385831405,
"learning_rate": 3.081817104531129e-05,
"loss": 0.3936,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14494222402572632,
"step": 3275,
"valid_targets_mean": 11453.5,
"valid_targets_min": 1275
},
{
"epoch": 1.935103244837758,
"grad_norm": 0.19372049268738326,
"learning_rate": 3.078350363746756e-05,
"loss": 0.3956,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11742343753576279,
"step": 3280,
"valid_targets_mean": 8932.7,
"valid_targets_min": 1791
},
{
"epoch": 1.9380530973451329,
"grad_norm": 0.1779269365091446,
"learning_rate": 3.074879049006232e-05,
"loss": 0.3814,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13389301300048828,
"step": 3285,
"valid_targets_mean": 11101.6,
"valid_targets_min": 2707
},
{
"epoch": 1.9410029498525074,
"grad_norm": 0.19998320668730726,
"learning_rate": 3.0714031750335655e-05,
"loss": 0.3896,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1562095731496811,
"step": 3290,
"valid_targets_mean": 10862.0,
"valid_targets_min": 1591
},
{
"epoch": 1.943952802359882,
"grad_norm": 0.18309893130019378,
"learning_rate": 3.067922756572106e-05,
"loss": 0.3891,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14485730230808258,
"step": 3295,
"valid_targets_mean": 10801.4,
"valid_targets_min": 1421
},
{
"epoch": 1.9469026548672566,
"grad_norm": 0.19390454376598912,
"learning_rate": 3.064437808384477e-05,
"loss": 0.3907,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12800556421279907,
"step": 3300,
"valid_targets_mean": 8929.9,
"valid_targets_min": 1203
},
{
"epoch": 1.9498525073746311,
"grad_norm": 0.179528235286811,
"learning_rate": 3.0609483452525176e-05,
"loss": 0.3962,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13554666936397552,
"step": 3305,
"valid_targets_mean": 10474.6,
"valid_targets_min": 1041
},
{
"epoch": 1.952802359882006,
"grad_norm": 0.19683332955124822,
"learning_rate": 3.057454381977214e-05,
"loss": 0.3916,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11626716703176498,
"step": 3310,
"valid_targets_mean": 8967.3,
"valid_targets_min": 2401
},
{
"epoch": 1.9557522123893807,
"grad_norm": 0.18365947696319398,
"learning_rate": 3.053955933378645e-05,
"loss": 0.3869,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.137057363986969,
"step": 3315,
"valid_targets_mean": 10507.0,
"valid_targets_min": 1811
},
{
"epoch": 1.9587020648967552,
"grad_norm": 0.1869865865059805,
"learning_rate": 3.0504530142959105e-05,
"loss": 0.3932,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11256128549575806,
"step": 3320,
"valid_targets_mean": 9101.4,
"valid_targets_min": 1896
},
{
"epoch": 1.9616519174041298,
"grad_norm": 0.19801017724283992,
"learning_rate": 3.046945639587075e-05,
"loss": 0.3885,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14004410803318024,
"step": 3325,
"valid_targets_mean": 11740.2,
"valid_targets_min": 1329
},
{
"epoch": 1.9646017699115044,
"grad_norm": 0.18975756312038314,
"learning_rate": 3.0434338241291015e-05,
"loss": 0.3898,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11776711046695709,
"step": 3330,
"valid_targets_mean": 8273.8,
"valid_targets_min": 1581
},
{
"epoch": 1.967551622418879,
"grad_norm": 0.18066282594029207,
"learning_rate": 3.0399175828177872e-05,
"loss": 0.3918,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14526595175266266,
"step": 3335,
"valid_targets_mean": 10531.7,
"valid_targets_min": 2030
},
{
"epoch": 1.9705014749262537,
"grad_norm": 0.24555864656109105,
"learning_rate": 3.036396930567705e-05,
"loss": 0.3849,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11780230700969696,
"step": 3340,
"valid_targets_mean": 8572.2,
"valid_targets_min": 1302
},
{
"epoch": 1.9734513274336283,
"grad_norm": 0.1929888138428312,
"learning_rate": 3.0328718823121355e-05,
"loss": 0.3942,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13801506161689758,
"step": 3345,
"valid_targets_mean": 10365.0,
"valid_targets_min": 1880
},
{
"epoch": 1.976401179941003,
"grad_norm": 0.19478904054138915,
"learning_rate": 3.0293424530030056e-05,
"loss": 0.3963,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15185290575027466,
"step": 3350,
"valid_targets_mean": 11930.6,
"valid_targets_min": 1431
},
{
"epoch": 1.9793510324483776,
"grad_norm": 0.19519690417624672,
"learning_rate": 3.0258086576108262e-05,
"loss": 0.3882,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12830832600593567,
"step": 3355,
"valid_targets_mean": 10015.8,
"valid_targets_min": 1439
},
{
"epoch": 1.9823008849557522,
"grad_norm": 0.1883692069344865,
"learning_rate": 3.0222705111246253e-05,
"loss": 0.3895,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13900379836559296,
"step": 3360,
"valid_targets_mean": 10110.8,
"valid_targets_min": 2130
},
{
"epoch": 1.9852507374631267,
"grad_norm": 0.18813353910541836,
"learning_rate": 3.0187280285518886e-05,
"loss": 0.3918,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12365911900997162,
"step": 3365,
"valid_targets_mean": 9938.6,
"valid_targets_min": 1395
},
{
"epoch": 1.9882005899705013,
"grad_norm": 0.5636207002863355,
"learning_rate": 3.015181224918493e-05,
"loss": 0.3968,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15566903352737427,
"step": 3370,
"valid_targets_mean": 11508.6,
"valid_targets_min": 1832
},
{
"epoch": 1.991150442477876,
"grad_norm": 0.19814675061839912,
"learning_rate": 3.011630115268644e-05,
"loss": 0.3862,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11800093948841095,
"step": 3375,
"valid_targets_mean": 9993.5,
"valid_targets_min": 2294
},
{
"epoch": 1.9941002949852509,
"grad_norm": 0.19741184278201546,
"learning_rate": 3.008074714664812e-05,
"loss": 0.3918,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1500239372253418,
"step": 3380,
"valid_targets_mean": 11300.2,
"valid_targets_min": 1578
},
{
"epoch": 1.9970501474926254,
"grad_norm": 0.20703640740260867,
"learning_rate": 3.0045150381876654e-05,
"loss": 0.3829,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1278185397386551,
"step": 3385,
"valid_targets_mean": 10239.3,
"valid_targets_min": 1636
},
{
"epoch": 2.0,
"grad_norm": 0.1889992510723016,
"learning_rate": 3.0009511009360132e-05,
"loss": 0.3875,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11499617993831635,
"step": 3390,
"valid_targets_mean": 9906.2,
"valid_targets_min": 1715
},
{
"epoch": 2.0029498525073746,
"grad_norm": 0.21278107260553616,
"learning_rate": 2.9973829180267344e-05,
"loss": 0.3862,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11433631181716919,
"step": 3395,
"valid_targets_mean": 8588.9,
"valid_targets_min": 1332
},
{
"epoch": 2.005899705014749,
"grad_norm": 0.1803230580174313,
"learning_rate": 2.993810504594717e-05,
"loss": 0.3779,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1344345510005951,
"step": 3400,
"valid_targets_mean": 11002.7,
"valid_targets_min": 2057
},
{
"epoch": 2.0088495575221237,
"grad_norm": 0.19004812139972974,
"learning_rate": 2.9902338757927945e-05,
"loss": 0.3787,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1447649896144867,
"step": 3405,
"valid_targets_mean": 10779.6,
"valid_targets_min": 1624
},
{
"epoch": 2.0117994100294987,
"grad_norm": 0.1754994480283632,
"learning_rate": 2.9866530467916783e-05,
"loss": 0.3837,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11555009335279465,
"step": 3410,
"valid_targets_mean": 9960.4,
"valid_targets_min": 934
},
{
"epoch": 2.0147492625368733,
"grad_norm": 0.2008870048940001,
"learning_rate": 2.983068032779897e-05,
"loss": 0.3813,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1313355714082718,
"step": 3415,
"valid_targets_mean": 10384.6,
"valid_targets_min": 1938
},
{
"epoch": 2.017699115044248,
"grad_norm": 0.17804754922004767,
"learning_rate": 2.97947884896373e-05,
"loss": 0.3821,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1404610574245453,
"step": 3420,
"valid_targets_mean": 12087.9,
"valid_targets_min": 1363
},
{
"epoch": 2.0206489675516224,
"grad_norm": 0.2177881217184323,
"learning_rate": 2.975885510567143e-05,
"loss": 0.3887,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10633949935436249,
"step": 3425,
"valid_targets_mean": 9539.9,
"valid_targets_min": 2274
},
{
"epoch": 2.023598820058997,
"grad_norm": 0.18809039627040855,
"learning_rate": 2.9722880328317246e-05,
"loss": 0.3785,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12327896058559418,
"step": 3430,
"valid_targets_mean": 9841.0,
"valid_targets_min": 2940
},
{
"epoch": 2.0265486725663715,
"grad_norm": 0.17916281339730925,
"learning_rate": 2.9686864310166206e-05,
"loss": 0.3806,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12415190786123276,
"step": 3435,
"valid_targets_mean": 10737.5,
"valid_targets_min": 2207
},
{
"epoch": 2.0294985250737465,
"grad_norm": 0.1843528188235671,
"learning_rate": 2.965080720398469e-05,
"loss": 0.379,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10842064023017883,
"step": 3440,
"valid_targets_mean": 10486.7,
"valid_targets_min": 2517
},
{
"epoch": 2.032448377581121,
"grad_norm": 0.19308551789685657,
"learning_rate": 2.9614709162713377e-05,
"loss": 0.3886,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10595126450061798,
"step": 3445,
"valid_targets_mean": 8381.7,
"valid_targets_min": 1327
},
{
"epoch": 2.0353982300884956,
"grad_norm": 0.19204697437288043,
"learning_rate": 2.9578570339466553e-05,
"loss": 0.3831,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1404932737350464,
"step": 3450,
"valid_targets_mean": 10446.8,
"valid_targets_min": 1143
},
{
"epoch": 2.03834808259587,
"grad_norm": 0.1789574739748446,
"learning_rate": 2.95423908875315e-05,
"loss": 0.3817,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10503190755844116,
"step": 3455,
"valid_targets_mean": 8746.9,
"valid_targets_min": 1190
},
{
"epoch": 2.0412979351032448,
"grad_norm": 0.18398589452173997,
"learning_rate": 2.9506170960367826e-05,
"loss": 0.3832,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.124261774122715,
"step": 3460,
"valid_targets_mean": 10087.5,
"valid_targets_min": 1183
},
{
"epoch": 2.0442477876106193,
"grad_norm": 0.19056300671049287,
"learning_rate": 2.9469910711606827e-05,
"loss": 0.3837,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12515035271644592,
"step": 3465,
"valid_targets_mean": 10579.7,
"valid_targets_min": 1933
},
{
"epoch": 2.047197640117994,
"grad_norm": 0.19450910448739192,
"learning_rate": 2.9433610295050825e-05,
"loss": 0.3938,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12465958297252655,
"step": 3470,
"valid_targets_mean": 8302.7,
"valid_targets_min": 1372
},
{
"epoch": 2.050147492625369,
"grad_norm": 0.1845326161792297,
"learning_rate": 2.9397269864672502e-05,
"loss": 0.3901,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.133334219455719,
"step": 3475,
"valid_targets_mean": 9780.0,
"valid_targets_min": 2871
},
{
"epoch": 2.0530973451327434,
"grad_norm": 0.17669162571743713,
"learning_rate": 2.93608895746143e-05,
"loss": 0.3817,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13513781130313873,
"step": 3480,
"valid_targets_mean": 11931.6,
"valid_targets_min": 2711
},
{
"epoch": 2.056047197640118,
"grad_norm": 0.17475474879616718,
"learning_rate": 2.9324469579187687e-05,
"loss": 0.3813,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14042824506759644,
"step": 3485,
"valid_targets_mean": 11337.6,
"valid_targets_min": 2230
},
{
"epoch": 2.0589970501474926,
"grad_norm": 0.1770599580241005,
"learning_rate": 2.928801003287259e-05,
"loss": 0.3909,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1170044094324112,
"step": 3490,
"valid_targets_mean": 8988.7,
"valid_targets_min": 1903
},
{
"epoch": 2.061946902654867,
"grad_norm": 0.18907281322057007,
"learning_rate": 2.9251511090316653e-05,
"loss": 0.3863,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13288113474845886,
"step": 3495,
"valid_targets_mean": 9600.8,
"valid_targets_min": 1444
},
{
"epoch": 2.0648967551622417,
"grad_norm": 0.19113320061416877,
"learning_rate": 2.9214972906334663e-05,
"loss": 0.3836,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1208382397890091,
"step": 3500,
"valid_targets_mean": 9575.3,
"valid_targets_min": 1520
},
{
"epoch": 2.0678466076696167,
"grad_norm": 0.18227771976678786,
"learning_rate": 2.917839563590783e-05,
"loss": 0.3808,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11254595965147018,
"step": 3505,
"valid_targets_mean": 9455.3,
"valid_targets_min": 1637
},
{
"epoch": 2.0707964601769913,
"grad_norm": 0.18929906045231637,
"learning_rate": 2.914177943418316e-05,
"loss": 0.3854,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12085720151662827,
"step": 3510,
"valid_targets_mean": 10024.9,
"valid_targets_min": 1887
},
{
"epoch": 2.073746312684366,
"grad_norm": 0.17363504832025936,
"learning_rate": 2.9105124456472797e-05,
"loss": 0.3863,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11590196192264557,
"step": 3515,
"valid_targets_mean": 9300.0,
"valid_targets_min": 1605
},
{
"epoch": 2.0766961651917404,
"grad_norm": 0.17322065693898156,
"learning_rate": 2.9068430858253335e-05,
"loss": 0.3837,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10647255182266235,
"step": 3520,
"valid_targets_mean": 9143.5,
"valid_targets_min": 1876
},
{
"epoch": 2.079646017699115,
"grad_norm": 0.2131679266056025,
"learning_rate": 2.9031698795165223e-05,
"loss": 0.3847,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.144773468375206,
"step": 3525,
"valid_targets_mean": 11088.1,
"valid_targets_min": 2465
},
{
"epoch": 2.0825958702064895,
"grad_norm": 0.18575805832779857,
"learning_rate": 2.8994928423012027e-05,
"loss": 0.3858,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11051160842180252,
"step": 3530,
"valid_targets_mean": 9622.8,
"valid_targets_min": 1275
},
{
"epoch": 2.0855457227138645,
"grad_norm": 0.19586130635929078,
"learning_rate": 2.895811989775982e-05,
"loss": 0.383,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15362785756587982,
"step": 3535,
"valid_targets_mean": 11946.5,
"valid_targets_min": 1343
},
{
"epoch": 2.088495575221239,
"grad_norm": 0.20219771286262053,
"learning_rate": 2.8921273375536506e-05,
"loss": 0.3781,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15547239780426025,
"step": 3540,
"valid_targets_mean": 11678.9,
"valid_targets_min": 1990
},
{
"epoch": 2.0914454277286136,
"grad_norm": 0.1936160339229126,
"learning_rate": 2.888438901263115e-05,
"loss": 0.3811,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1208762675523758,
"step": 3545,
"valid_targets_mean": 9289.3,
"valid_targets_min": 1483
},
{
"epoch": 2.094395280235988,
"grad_norm": 0.17413806399911613,
"learning_rate": 2.884746696549334e-05,
"loss": 0.3808,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1528923362493515,
"step": 3550,
"valid_targets_mean": 12582.7,
"valid_targets_min": 2283
},
{
"epoch": 2.0973451327433628,
"grad_norm": 0.17194009034507063,
"learning_rate": 2.8810507390732487e-05,
"loss": 0.3839,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12632685899734497,
"step": 3555,
"valid_targets_mean": 10105.1,
"valid_targets_min": 1272
},
{
"epoch": 2.1002949852507373,
"grad_norm": 0.19009776249260985,
"learning_rate": 2.8773510445117195e-05,
"loss": 0.3803,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11879489570856094,
"step": 3560,
"valid_targets_mean": 7560.3,
"valid_targets_min": 1859
},
{
"epoch": 2.103244837758112,
"grad_norm": 0.17211994107816161,
"learning_rate": 2.873647628557457e-05,
"loss": 0.3782,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12576919794082642,
"step": 3565,
"valid_targets_mean": 9344.3,
"valid_targets_min": 2537
},
{
"epoch": 2.106194690265487,
"grad_norm": 0.17305575511305302,
"learning_rate": 2.8699405069189573e-05,
"loss": 0.3801,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1216350868344307,
"step": 3570,
"valid_targets_mean": 10676.6,
"valid_targets_min": 2376
},
{
"epoch": 2.1091445427728615,
"grad_norm": 0.17356172191088662,
"learning_rate": 2.866229695320434e-05,
"loss": 0.3827,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1366838812828064,
"step": 3575,
"valid_targets_mean": 10206.7,
"valid_targets_min": 1930
},
{
"epoch": 2.112094395280236,
"grad_norm": 0.2080655561460447,
"learning_rate": 2.862515209501753e-05,
"loss": 0.3778,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11368487775325775,
"step": 3580,
"valid_targets_mean": 9517.6,
"valid_targets_min": 1673
},
{
"epoch": 2.1150442477876106,
"grad_norm": 0.19332899914412788,
"learning_rate": 2.8587970652183642e-05,
"loss": 0.3803,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13519152998924255,
"step": 3585,
"valid_targets_mean": 10623.7,
"valid_targets_min": 2951
},
{
"epoch": 2.117994100294985,
"grad_norm": 0.18213962512925527,
"learning_rate": 2.8550752782412353e-05,
"loss": 0.3853,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13883964717388153,
"step": 3590,
"valid_targets_mean": 11495.6,
"valid_targets_min": 1657
},
{
"epoch": 2.1209439528023597,
"grad_norm": 0.21689471255079432,
"learning_rate": 2.8513498643567853e-05,
"loss": 0.3875,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12648020684719086,
"step": 3595,
"valid_targets_mean": 8984.3,
"valid_targets_min": 2901
},
{
"epoch": 2.1238938053097347,
"grad_norm": 0.18398713084327645,
"learning_rate": 2.847620839366816e-05,
"loss": 0.3867,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11699029058218002,
"step": 3600,
"valid_targets_mean": 9561.6,
"valid_targets_min": 1535
},
{
"epoch": 2.1268436578171093,
"grad_norm": 0.19909313835659861,
"learning_rate": 2.8438882190884483e-05,
"loss": 0.3983,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12598690390586853,
"step": 3605,
"valid_targets_mean": 9382.0,
"valid_targets_min": 1289
},
{
"epoch": 2.129793510324484,
"grad_norm": 0.19239468673634438,
"learning_rate": 2.8401520193540514e-05,
"loss": 0.4,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1419348418712616,
"step": 3610,
"valid_targets_mean": 9724.2,
"valid_targets_min": 2358
},
{
"epoch": 2.1327433628318584,
"grad_norm": 0.18329010429612305,
"learning_rate": 2.836412256011177e-05,
"loss": 0.3984,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13659611344337463,
"step": 3615,
"valid_targets_mean": 11027.6,
"valid_targets_min": 1069
},
{
"epoch": 2.135693215339233,
"grad_norm": 0.1783365761769347,
"learning_rate": 2.8326689449224938e-05,
"loss": 0.3975,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11838910728693008,
"step": 3620,
"valid_targets_mean": 9196.5,
"valid_targets_min": 536
},
{
"epoch": 2.1386430678466075,
"grad_norm": 0.18628293289232864,
"learning_rate": 2.8289221019657172e-05,
"loss": 0.3981,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12682795524597168,
"step": 3625,
"valid_targets_mean": 9754.9,
"valid_targets_min": 1806
},
{
"epoch": 2.1415929203539825,
"grad_norm": 0.1819512424595782,
"learning_rate": 2.8251717430335444e-05,
"loss": 0.4009,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12250994890928268,
"step": 3630,
"valid_targets_mean": 9171.2,
"valid_targets_min": 1140
},
{
"epoch": 2.144542772861357,
"grad_norm": 0.17284428231008353,
"learning_rate": 2.8214178840335852e-05,
"loss": 0.3997,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1340324878692627,
"step": 3635,
"valid_targets_mean": 9798.3,
"valid_targets_min": 1344
},
{
"epoch": 2.1474926253687316,
"grad_norm": 0.19470660392467842,
"learning_rate": 2.8176605408882957e-05,
"loss": 0.4013,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12144613265991211,
"step": 3640,
"valid_targets_mean": 8997.8,
"valid_targets_min": 2398
},
{
"epoch": 2.150442477876106,
"grad_norm": 0.18160998479053364,
"learning_rate": 2.813899729534911e-05,
"loss": 0.402,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1443384438753128,
"step": 3645,
"valid_targets_mean": 10034.7,
"valid_targets_min": 1739
},
{
"epoch": 2.1533923303834808,
"grad_norm": 0.17558747890590443,
"learning_rate": 2.8101354659253765e-05,
"loss": 0.3993,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11908899247646332,
"step": 3650,
"valid_targets_mean": 9813.8,
"valid_targets_min": 1050
},
{
"epoch": 2.1563421828908553,
"grad_norm": 0.16794874388601116,
"learning_rate": 2.806367766026281e-05,
"loss": 0.4,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1262470781803131,
"step": 3655,
"valid_targets_mean": 10142.0,
"valid_targets_min": 2362
},
{
"epoch": 2.15929203539823,
"grad_norm": 0.18623675332508144,
"learning_rate": 2.8025966458187886e-05,
"loss": 0.3971,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1318787783384323,
"step": 3660,
"valid_targets_mean": 10334.2,
"valid_targets_min": 1215
},
{
"epoch": 2.162241887905605,
"grad_norm": 0.17693481520897764,
"learning_rate": 2.7988221212985708e-05,
"loss": 0.3986,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11097447574138641,
"step": 3665,
"valid_targets_mean": 7946.3,
"valid_targets_min": 1646
},
{
"epoch": 2.1651917404129795,
"grad_norm": 0.18784856297361613,
"learning_rate": 2.7950442084757394e-05,
"loss": 0.3985,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13702723383903503,
"step": 3670,
"valid_targets_mean": 10197.9,
"valid_targets_min": 2517
},
{
"epoch": 2.168141592920354,
"grad_norm": 0.1827780965965856,
"learning_rate": 2.791262923374778e-05,
"loss": 0.4084,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1261982023715973,
"step": 3675,
"valid_targets_mean": 9506.9,
"valid_targets_min": 2134
},
{
"epoch": 2.1710914454277286,
"grad_norm": 0.1859839322818085,
"learning_rate": 2.787478282034473e-05,
"loss": 0.3978,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1325964778661728,
"step": 3680,
"valid_targets_mean": 10417.7,
"valid_targets_min": 1786
},
{
"epoch": 2.174041297935103,
"grad_norm": 0.1639518540971534,
"learning_rate": 2.783690300507849e-05,
"loss": 0.3852,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1373385339975357,
"step": 3685,
"valid_targets_mean": 10820.2,
"valid_targets_min": 2213
},
{
"epoch": 2.1769911504424777,
"grad_norm": 0.17159152749861892,
"learning_rate": 2.7798989948620962e-05,
"loss": 0.3962,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14926663041114807,
"step": 3690,
"valid_targets_mean": 12955.4,
"valid_targets_min": 1467
},
{
"epoch": 2.1799410029498527,
"grad_norm": 0.18047206481601527,
"learning_rate": 2.7761043811785065e-05,
"loss": 0.4003,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12459855526685715,
"step": 3695,
"valid_targets_mean": 10078.7,
"valid_targets_min": 1501
},
{
"epoch": 2.1828908554572273,
"grad_norm": 0.19306413780026327,
"learning_rate": 2.7723064755524018e-05,
"loss": 0.3979,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11301134526729584,
"step": 3700,
"valid_targets_mean": 8772.9,
"valid_targets_min": 1174
},
{
"epoch": 2.185840707964602,
"grad_norm": 0.18676754801787854,
"learning_rate": 2.768505294093067e-05,
"loss": 0.3947,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13223782181739807,
"step": 3705,
"valid_targets_mean": 10604.9,
"valid_targets_min": 1801
},
{
"epoch": 2.1887905604719764,
"grad_norm": 0.1762536216691242,
"learning_rate": 2.764700852923682e-05,
"loss": 0.3908,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12154674530029297,
"step": 3710,
"valid_targets_mean": 8825.4,
"valid_targets_min": 2007
},
{
"epoch": 2.191740412979351,
"grad_norm": 0.17120906094368002,
"learning_rate": 2.7608931681812548e-05,
"loss": 0.3907,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1289297640323639,
"step": 3715,
"valid_targets_mean": 10086.0,
"valid_targets_min": 2308
},
{
"epoch": 2.1946902654867255,
"grad_norm": 0.17585644290659275,
"learning_rate": 2.7570822560165494e-05,
"loss": 0.3934,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11464974284172058,
"step": 3720,
"valid_targets_mean": 9196.3,
"valid_targets_min": 2358
},
{
"epoch": 2.1976401179941005,
"grad_norm": 0.17193676556874152,
"learning_rate": 2.75326813259402e-05,
"loss": 0.4006,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10923153162002563,
"step": 3725,
"valid_targets_mean": 8499.4,
"valid_targets_min": 1309
},
{
"epoch": 2.200589970501475,
"grad_norm": 0.17740306662737546,
"learning_rate": 2.7494508140917423e-05,
"loss": 0.3979,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13836762309074402,
"step": 3730,
"valid_targets_mean": 9956.7,
"valid_targets_min": 1540
},
{
"epoch": 2.2035398230088497,
"grad_norm": 0.18082605228455478,
"learning_rate": 2.7456303167013435e-05,
"loss": 0.3932,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14022909104824066,
"step": 3735,
"valid_targets_mean": 10383.4,
"valid_targets_min": 2501
},
{
"epoch": 2.206489675516224,
"grad_norm": 0.1783469044956506,
"learning_rate": 2.7418066566279348e-05,
"loss": 0.398,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1336425542831421,
"step": 3740,
"valid_targets_mean": 9967.4,
"valid_targets_min": 1821
},
{
"epoch": 2.2094395280235988,
"grad_norm": 0.1691487313763563,
"learning_rate": 2.7379798500900424e-05,
"loss": 0.3939,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1256037950515747,
"step": 3745,
"valid_targets_mean": 9924.0,
"valid_targets_min": 1816
},
{
"epoch": 2.2123893805309733,
"grad_norm": 0.18101957895595286,
"learning_rate": 2.7341499133195385e-05,
"loss": 0.3891,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13777321577072144,
"step": 3750,
"valid_targets_mean": 10049.2,
"valid_targets_min": 1217
},
{
"epoch": 2.215339233038348,
"grad_norm": 0.17450735843383483,
"learning_rate": 2.7303168625615718e-05,
"loss": 0.401,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14749610424041748,
"step": 3755,
"valid_targets_mean": 12419.6,
"valid_targets_min": 2271
},
{
"epoch": 2.218289085545723,
"grad_norm": 0.1845441504660646,
"learning_rate": 2.7264807140745017e-05,
"loss": 0.3884,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14936435222625732,
"step": 3760,
"valid_targets_mean": 10423.2,
"valid_targets_min": 1900
},
{
"epoch": 2.2212389380530975,
"grad_norm": 0.18470787390804666,
"learning_rate": 2.722641484129825e-05,
"loss": 0.3896,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12111598998308182,
"step": 3765,
"valid_targets_mean": 8453.0,
"valid_targets_min": 1408
},
{
"epoch": 2.224188790560472,
"grad_norm": 0.17056997100554727,
"learning_rate": 2.7187991890121076e-05,
"loss": 0.4008,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12580421566963196,
"step": 3770,
"valid_targets_mean": 9931.7,
"valid_targets_min": 2305
},
{
"epoch": 2.2271386430678466,
"grad_norm": 0.18783881320534634,
"learning_rate": 2.7149538450189204e-05,
"loss": 0.3915,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1510670930147171,
"step": 3775,
"valid_targets_mean": 10178.9,
"valid_targets_min": 1039
},
{
"epoch": 2.230088495575221,
"grad_norm": 0.1739931085046215,
"learning_rate": 2.7111054684607644e-05,
"loss": 0.3951,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14426995813846588,
"step": 3780,
"valid_targets_mean": 10581.9,
"valid_targets_min": 1697
},
{
"epoch": 2.2330383480825957,
"grad_norm": 0.17254501855584767,
"learning_rate": 2.7072540756610027e-05,
"loss": 0.4058,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14102444052696228,
"step": 3785,
"valid_targets_mean": 10485.4,
"valid_targets_min": 2081
},
{
"epoch": 2.2359882005899703,
"grad_norm": 0.16449191575448785,
"learning_rate": 2.703399682955794e-05,
"loss": 0.3961,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13488492369651794,
"step": 3790,
"valid_targets_mean": 10634.4,
"valid_targets_min": 1494
},
{
"epoch": 2.2389380530973453,
"grad_norm": 0.1764118124541508,
"learning_rate": 2.6995423066940206e-05,
"loss": 0.3864,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12274979054927826,
"step": 3795,
"valid_targets_mean": 9134.9,
"valid_targets_min": 1983
},
{
"epoch": 2.24188790560472,
"grad_norm": 0.18680929847990685,
"learning_rate": 2.6956819632372194e-05,
"loss": 0.4,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10951778292655945,
"step": 3800,
"valid_targets_mean": 7631.4,
"valid_targets_min": 1308
},
{
"epoch": 2.2448377581120944,
"grad_norm": 0.20523570522718323,
"learning_rate": 2.6918186689595134e-05,
"loss": 0.3947,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1293448507785797,
"step": 3805,
"valid_targets_mean": 11488.8,
"valid_targets_min": 3111
},
{
"epoch": 2.247787610619469,
"grad_norm": 0.17597635789172644,
"learning_rate": 2.687952440247543e-05,
"loss": 0.3926,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1164768636226654,
"step": 3810,
"valid_targets_mean": 9848.1,
"valid_targets_min": 1539
},
{
"epoch": 2.2507374631268435,
"grad_norm": 0.18144303661230346,
"learning_rate": 2.6840832935003942e-05,
"loss": 0.3915,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15120357275009155,
"step": 3815,
"valid_targets_mean": 12024.1,
"valid_targets_min": 2727
},
{
"epoch": 2.2536873156342185,
"grad_norm": 0.1847443407254508,
"learning_rate": 2.68021124512953e-05,
"loss": 0.3937,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12879443168640137,
"step": 3820,
"valid_targets_mean": 9545.0,
"valid_targets_min": 1882
},
{
"epoch": 2.256637168141593,
"grad_norm": 0.18701048508634804,
"learning_rate": 2.6763363115587218e-05,
"loss": 0.3954,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11498545110225677,
"step": 3825,
"valid_targets_mean": 8259.6,
"valid_targets_min": 1045
},
{
"epoch": 2.2595870206489677,
"grad_norm": 0.18824323332335477,
"learning_rate": 2.6724585092239784e-05,
"loss": 0.3932,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13292992115020752,
"step": 3830,
"valid_targets_mean": 10127.1,
"valid_targets_min": 1797
},
{
"epoch": 2.262536873156342,
"grad_norm": 0.20140870554938575,
"learning_rate": 2.668577854573477e-05,
"loss": 0.3964,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12686914205551147,
"step": 3835,
"valid_targets_mean": 8850.4,
"valid_targets_min": 1524
},
{
"epoch": 2.265486725663717,
"grad_norm": 0.17288624780173162,
"learning_rate": 2.6646943640674937e-05,
"loss": 0.3963,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1073978841304779,
"step": 3840,
"valid_targets_mean": 8547.2,
"valid_targets_min": 1657
},
{
"epoch": 2.2684365781710913,
"grad_norm": 0.18135599145281248,
"learning_rate": 2.6608080541783316e-05,
"loss": 0.3905,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11137989163398743,
"step": 3845,
"valid_targets_mean": 7498.9,
"valid_targets_min": 2006
},
{
"epoch": 2.271386430678466,
"grad_norm": 0.1858489858186105,
"learning_rate": 2.6569189413902544e-05,
"loss": 0.3944,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13760294020175934,
"step": 3850,
"valid_targets_mean": 10987.5,
"valid_targets_min": 2508
},
{
"epoch": 2.274336283185841,
"grad_norm": 0.17666569108019423,
"learning_rate": 2.6530270421994146e-05,
"loss": 0.3992,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1223081648349762,
"step": 3855,
"valid_targets_mean": 10292.0,
"valid_targets_min": 2280
},
{
"epoch": 2.2772861356932155,
"grad_norm": 0.18248461786488382,
"learning_rate": 2.6491323731137818e-05,
"loss": 0.3945,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13024061918258667,
"step": 3860,
"valid_targets_mean": 10601.8,
"valid_targets_min": 1396
},
{
"epoch": 2.28023598820059,
"grad_norm": 0.18453098272423848,
"learning_rate": 2.6452349506530762e-05,
"loss": 0.3897,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1465938836336136,
"step": 3865,
"valid_targets_mean": 9942.6,
"valid_targets_min": 2133
},
{
"epoch": 2.2831858407079646,
"grad_norm": 0.1800510324678868,
"learning_rate": 2.6413347913486967e-05,
"loss": 0.3993,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15016867220401764,
"step": 3870,
"valid_targets_mean": 9759.4,
"valid_targets_min": 1581
},
{
"epoch": 2.286135693215339,
"grad_norm": 0.1840760855307141,
"learning_rate": 2.637431911743649e-05,
"loss": 0.3936,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1509101539850235,
"step": 3875,
"valid_targets_mean": 10620.5,
"valid_targets_min": 1461
},
{
"epoch": 2.2890855457227137,
"grad_norm": 0.20046019039716598,
"learning_rate": 2.63352632839248e-05,
"loss": 0.3994,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11841368675231934,
"step": 3880,
"valid_targets_mean": 8787.5,
"valid_targets_min": 2197
},
{
"epoch": 2.2920353982300883,
"grad_norm": 0.17185687883942527,
"learning_rate": 2.629618057861202e-05,
"loss": 0.3971,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11624648422002792,
"step": 3885,
"valid_targets_mean": 9077.8,
"valid_targets_min": 2800
},
{
"epoch": 2.2949852507374633,
"grad_norm": 0.1740597178196862,
"learning_rate": 2.625707116727228e-05,
"loss": 0.3939,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13334083557128906,
"step": 3890,
"valid_targets_mean": 9941.8,
"valid_targets_min": 2260
},
{
"epoch": 2.297935103244838,
"grad_norm": 0.17155366850277412,
"learning_rate": 2.6217935215792967e-05,
"loss": 0.3987,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13235624134540558,
"step": 3895,
"valid_targets_mean": 10138.6,
"valid_targets_min": 1655
},
{
"epoch": 2.3008849557522124,
"grad_norm": 0.18246331548218217,
"learning_rate": 2.6178772890174057e-05,
"loss": 0.3885,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14090922474861145,
"step": 3900,
"valid_targets_mean": 9809.2,
"valid_targets_min": 1817
},
{
"epoch": 2.303834808259587,
"grad_norm": 0.18779345629629093,
"learning_rate": 2.6139584356527385e-05,
"loss": 0.3968,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15629766881465912,
"step": 3905,
"valid_targets_mean": 11053.2,
"valid_targets_min": 1891
},
{
"epoch": 2.3067846607669615,
"grad_norm": 0.17739964048057022,
"learning_rate": 2.610036978107595e-05,
"loss": 0.3874,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15338581800460815,
"step": 3910,
"valid_targets_mean": 10950.2,
"valid_targets_min": 2265
},
{
"epoch": 2.309734513274336,
"grad_norm": 0.19609733988432582,
"learning_rate": 2.6061129330153212e-05,
"loss": 0.3941,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12699197232723236,
"step": 3915,
"valid_targets_mean": 9727.5,
"valid_targets_min": 1294
},
{
"epoch": 2.312684365781711,
"grad_norm": 0.18288278960145077,
"learning_rate": 2.602186317020239e-05,
"loss": 0.3978,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13509252667427063,
"step": 3920,
"valid_targets_mean": 10823.4,
"valid_targets_min": 2542
},
{
"epoch": 2.3156342182890857,
"grad_norm": 0.19152225870964204,
"learning_rate": 2.598257146777575e-05,
"loss": 0.3921,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1314992904663086,
"step": 3925,
"valid_targets_mean": 10381.6,
"valid_targets_min": 1504
},
{
"epoch": 2.3185840707964602,
"grad_norm": 0.17075307828765438,
"learning_rate": 2.5943254389533888e-05,
"loss": 0.3903,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1531062126159668,
"step": 3930,
"valid_targets_mean": 10812.6,
"valid_targets_min": 1055
},
{
"epoch": 2.321533923303835,
"grad_norm": 0.17132496778995138,
"learning_rate": 2.5903912102245053e-05,
"loss": 0.3961,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11895540356636047,
"step": 3935,
"valid_targets_mean": 9040.8,
"valid_targets_min": 1130
},
{
"epoch": 2.3244837758112094,
"grad_norm": 0.18685408915114127,
"learning_rate": 2.5864544772784407e-05,
"loss": 0.3918,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11604495346546173,
"step": 3940,
"valid_targets_mean": 9655.9,
"valid_targets_min": 1410
},
{
"epoch": 2.327433628318584,
"grad_norm": 0.16879584787533836,
"learning_rate": 2.5825152568133343e-05,
"loss": 0.3924,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11255620419979095,
"step": 3945,
"valid_targets_mean": 8905.6,
"valid_targets_min": 1830
},
{
"epoch": 2.330383480825959,
"grad_norm": 0.1864666442297191,
"learning_rate": 2.5785735655378745e-05,
"loss": 0.3919,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11839946359395981,
"step": 3950,
"valid_targets_mean": 9882.5,
"valid_targets_min": 2408
},
{
"epoch": 2.3333333333333335,
"grad_norm": 0.23730696535755824,
"learning_rate": 2.5746294201712326e-05,
"loss": 0.3934,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12219962477684021,
"step": 3955,
"valid_targets_mean": 9463.4,
"valid_targets_min": 1659
},
{
"epoch": 2.336283185840708,
"grad_norm": 0.16420168897254991,
"learning_rate": 2.5706828374429873e-05,
"loss": 0.3949,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11978039145469666,
"step": 3960,
"valid_targets_mean": 11038.2,
"valid_targets_min": 1531
},
{
"epoch": 2.3392330383480826,
"grad_norm": 0.18849127213452108,
"learning_rate": 2.5667338340930563e-05,
"loss": 0.3915,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1379072070121765,
"step": 3965,
"valid_targets_mean": 10074.7,
"valid_targets_min": 2085
},
{
"epoch": 2.342182890855457,
"grad_norm": 0.171765781113225,
"learning_rate": 2.5627824268716247e-05,
"loss": 0.3955,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11300992965698242,
"step": 3970,
"valid_targets_mean": 10108.6,
"valid_targets_min": 1642
},
{
"epoch": 2.3451327433628317,
"grad_norm": 0.17177249459813396,
"learning_rate": 2.5588286325390744e-05,
"loss": 0.3961,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12897521257400513,
"step": 3975,
"valid_targets_mean": 9673.6,
"valid_targets_min": 997
},
{
"epoch": 2.3480825958702063,
"grad_norm": 0.17701611497782288,
"learning_rate": 2.5548724678659115e-05,
"loss": 0.3926,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11329556256532669,
"step": 3980,
"valid_targets_mean": 8708.4,
"valid_targets_min": 1573
},
{
"epoch": 2.3510324483775813,
"grad_norm": 0.25579883316916374,
"learning_rate": 2.550913949632697e-05,
"loss": 0.3938,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14847159385681152,
"step": 3985,
"valid_targets_mean": 12304.2,
"valid_targets_min": 1814
},
{
"epoch": 2.353982300884956,
"grad_norm": 0.16613061378431035,
"learning_rate": 2.5469530946299746e-05,
"loss": 0.3985,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13126221299171448,
"step": 3990,
"valid_targets_mean": 11132.8,
"valid_targets_min": 1200
},
{
"epoch": 2.3569321533923304,
"grad_norm": 0.17686783624732347,
"learning_rate": 2.542989919658199e-05,
"loss": 0.4007,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14059323072433472,
"step": 3995,
"valid_targets_mean": 10237.6,
"valid_targets_min": 950
},
{
"epoch": 2.359882005899705,
"grad_norm": 0.20215416996696808,
"learning_rate": 2.5390244415276666e-05,
"loss": 0.3939,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1143152043223381,
"step": 4000,
"valid_targets_mean": 10417.7,
"valid_targets_min": 2034
},
{
"epoch": 2.3628318584070795,
"grad_norm": 0.17655569706363347,
"learning_rate": 2.5350566770584423e-05,
"loss": 0.3846,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13264046609401703,
"step": 4005,
"valid_targets_mean": 11726.6,
"valid_targets_min": 1312
},
{
"epoch": 2.365781710914454,
"grad_norm": 0.17920640711803199,
"learning_rate": 2.5310866430802877e-05,
"loss": 0.391,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11140947043895721,
"step": 4010,
"valid_targets_mean": 8954.2,
"valid_targets_min": 1876
},
{
"epoch": 2.3687315634218287,
"grad_norm": 0.2076440770678389,
"learning_rate": 2.527114356432593e-05,
"loss": 0.3953,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15259167551994324,
"step": 4015,
"valid_targets_mean": 10257.4,
"valid_targets_min": 2939
},
{
"epoch": 2.3716814159292037,
"grad_norm": 0.1884915676583662,
"learning_rate": 2.5231398339643022e-05,
"loss": 0.3907,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12428969889879227,
"step": 4020,
"valid_targets_mean": 9281.1,
"valid_targets_min": 2123
},
{
"epoch": 2.3746312684365782,
"grad_norm": 0.18874802459911955,
"learning_rate": 2.519163092533843e-05,
"loss": 0.3912,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14149920642375946,
"step": 4025,
"valid_targets_mean": 9339.8,
"valid_targets_min": 2558
},
{
"epoch": 2.377581120943953,
"grad_norm": 0.17723065208387231,
"learning_rate": 2.5151841490090537e-05,
"loss": 0.3936,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1307816505432129,
"step": 4030,
"valid_targets_mean": 9360.2,
"valid_targets_min": 2415
},
{
"epoch": 2.3805309734513274,
"grad_norm": 0.17421579470262544,
"learning_rate": 2.5112030202671154e-05,
"loss": 0.3906,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11921098828315735,
"step": 4035,
"valid_targets_mean": 8395.6,
"valid_targets_min": 1630
},
{
"epoch": 2.383480825958702,
"grad_norm": 0.17031332521729364,
"learning_rate": 2.507219723194477e-05,
"loss": 0.3844,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14918190240859985,
"step": 4040,
"valid_targets_mean": 12708.2,
"valid_targets_min": 3373
},
{
"epoch": 2.386430678466077,
"grad_norm": 0.17823669644393042,
"learning_rate": 2.5032342746867844e-05,
"loss": 0.3827,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1188630759716034,
"step": 4045,
"valid_targets_mean": 11102.9,
"valid_targets_min": 2383
},
{
"epoch": 2.3893805309734515,
"grad_norm": 0.17538450361576227,
"learning_rate": 2.49924669164881e-05,
"loss": 0.3935,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12793388962745667,
"step": 4050,
"valid_targets_mean": 9429.2,
"valid_targets_min": 1243
},
{
"epoch": 2.392330383480826,
"grad_norm": 0.17032901916386253,
"learning_rate": 2.495256990994378e-05,
"loss": 0.389,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15003778040409088,
"step": 4055,
"valid_targets_mean": 12589.8,
"valid_targets_min": 1293
},
{
"epoch": 2.3952802359882006,
"grad_norm": 0.17182426265268705,
"learning_rate": 2.4912651896462967e-05,
"loss": 0.3893,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12547190487384796,
"step": 4060,
"valid_targets_mean": 9731.8,
"valid_targets_min": 1129
},
{
"epoch": 2.398230088495575,
"grad_norm": 0.17298035699811434,
"learning_rate": 2.487271304536284e-05,
"loss": 0.3879,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.101053886115551,
"step": 4065,
"valid_targets_mean": 8218.8,
"valid_targets_min": 595
},
{
"epoch": 2.4011799410029497,
"grad_norm": 0.16731123092758138,
"learning_rate": 2.4832753526048977e-05,
"loss": 0.3937,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12202181667089462,
"step": 4070,
"valid_targets_mean": 9081.4,
"valid_targets_min": 888
},
{
"epoch": 2.4041297935103243,
"grad_norm": 0.17594985833188911,
"learning_rate": 2.4792773508014597e-05,
"loss": 0.3858,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13053381443023682,
"step": 4075,
"valid_targets_mean": 10127.8,
"valid_targets_min": 1547
},
{
"epoch": 2.4070796460176993,
"grad_norm": 0.1725954639777345,
"learning_rate": 2.4752773160839885e-05,
"loss": 0.388,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12309059500694275,
"step": 4080,
"valid_targets_mean": 9777.3,
"valid_targets_min": 1666
},
{
"epoch": 2.410029498525074,
"grad_norm": 0.17639722633497423,
"learning_rate": 2.4712752654191254e-05,
"loss": 0.3893,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11810016632080078,
"step": 4085,
"valid_targets_mean": 8813.1,
"valid_targets_min": 2184
},
{
"epoch": 2.4129793510324484,
"grad_norm": 0.1845806404741444,
"learning_rate": 2.467271215782061e-05,
"loss": 0.3947,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12740883231163025,
"step": 4090,
"valid_targets_mean": 9679.6,
"valid_targets_min": 2445
},
{
"epoch": 2.415929203539823,
"grad_norm": 0.18118441307550773,
"learning_rate": 2.4632651841564673e-05,
"loss": 0.3929,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12179508060216904,
"step": 4095,
"valid_targets_mean": 10510.3,
"valid_targets_min": 1998
},
{
"epoch": 2.4188790560471976,
"grad_norm": 0.18764285880053957,
"learning_rate": 2.4592571875344217e-05,
"loss": 0.3786,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1726941615343094,
"step": 4100,
"valid_targets_mean": 12465.5,
"valid_targets_min": 1710
},
{
"epoch": 2.421828908554572,
"grad_norm": 0.18199183358032803,
"learning_rate": 2.4552472429163357e-05,
"loss": 0.3711,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14343643188476562,
"step": 4105,
"valid_targets_mean": 10231.8,
"valid_targets_min": 2259
},
{
"epoch": 2.4247787610619467,
"grad_norm": 0.1725750391349139,
"learning_rate": 2.4512353673108847e-05,
"loss": 0.3753,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1398804783821106,
"step": 4110,
"valid_targets_mean": 13320.7,
"valid_targets_min": 1376
},
{
"epoch": 2.4277286135693217,
"grad_norm": 0.18305122770334165,
"learning_rate": 2.4472215777349346e-05,
"loss": 0.3667,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10101216286420822,
"step": 4115,
"valid_targets_mean": 8426.0,
"valid_targets_min": 1654
},
{
"epoch": 2.4306784660766962,
"grad_norm": 0.1926083380216005,
"learning_rate": 2.4432058912134695e-05,
"loss": 0.3714,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11317503452301025,
"step": 4120,
"valid_targets_mean": 8610.3,
"valid_targets_min": 2335
},
{
"epoch": 2.433628318584071,
"grad_norm": 0.2196195456089233,
"learning_rate": 2.439188324779518e-05,
"loss": 0.3709,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12208309769630432,
"step": 4125,
"valid_targets_mean": 9733.9,
"valid_targets_min": 2604
},
{
"epoch": 2.4365781710914454,
"grad_norm": 0.2002734068453938,
"learning_rate": 2.435168895474085e-05,
"loss": 0.3679,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09944422543048859,
"step": 4130,
"valid_targets_mean": 7887.3,
"valid_targets_min": 961
},
{
"epoch": 2.43952802359882,
"grad_norm": 0.1974919985284759,
"learning_rate": 2.4311476203460753e-05,
"loss": 0.3722,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14025208353996277,
"step": 4135,
"valid_targets_mean": 12008.4,
"valid_targets_min": 3631
},
{
"epoch": 2.442477876106195,
"grad_norm": 0.1992481010119958,
"learning_rate": 2.4271245164522244e-05,
"loss": 0.3792,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13258278369903564,
"step": 4140,
"valid_targets_mean": 11155.2,
"valid_targets_min": 2731
},
{
"epoch": 2.4454277286135695,
"grad_norm": 0.18912241428488177,
"learning_rate": 2.4230996008570237e-05,
"loss": 0.367,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1264360398054123,
"step": 4145,
"valid_targets_mean": 10674.4,
"valid_targets_min": 1317
},
{
"epoch": 2.448377581120944,
"grad_norm": 0.18223546620888548,
"learning_rate": 2.4190728906326496e-05,
"loss": 0.3698,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14574602246284485,
"step": 4150,
"valid_targets_mean": 11136.4,
"valid_targets_min": 1890
},
{
"epoch": 2.4513274336283186,
"grad_norm": 0.20209171805214524,
"learning_rate": 2.4150444028588896e-05,
"loss": 0.3723,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15436725318431854,
"step": 4155,
"valid_targets_mean": 12538.8,
"valid_targets_min": 1856
},
{
"epoch": 2.454277286135693,
"grad_norm": 0.1981802269778582,
"learning_rate": 2.411014154623073e-05,
"loss": 0.3809,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14357636868953705,
"step": 4160,
"valid_targets_mean": 11351.3,
"valid_targets_min": 1738
},
{
"epoch": 2.4572271386430677,
"grad_norm": 0.18767130154313147,
"learning_rate": 2.4069821630199938e-05,
"loss": 0.3727,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10319440811872482,
"step": 4165,
"valid_targets_mean": 9638.6,
"valid_targets_min": 2769
},
{
"epoch": 2.4601769911504423,
"grad_norm": 0.20106308424588426,
"learning_rate": 2.402948445151843e-05,
"loss": 0.3709,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12477102875709534,
"step": 4170,
"valid_targets_mean": 10217.3,
"valid_targets_min": 1867
},
{
"epoch": 2.4631268436578173,
"grad_norm": 0.1878349564170574,
"learning_rate": 2.3989130181281323e-05,
"loss": 0.3686,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12376038730144501,
"step": 4175,
"valid_targets_mean": 10830.1,
"valid_targets_min": 2056
},
{
"epoch": 2.466076696165192,
"grad_norm": 0.182326417226956,
"learning_rate": 2.3948758990656232e-05,
"loss": 0.3666,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09735498577356339,
"step": 4180,
"valid_targets_mean": 8065.7,
"valid_targets_min": 2250
},
{
"epoch": 2.4690265486725664,
"grad_norm": 0.17881624649061542,
"learning_rate": 2.3908371050882554e-05,
"loss": 0.3733,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11818811297416687,
"step": 4185,
"valid_targets_mean": 10655.2,
"valid_targets_min": 2555
},
{
"epoch": 2.471976401179941,
"grad_norm": 0.2015720023458747,
"learning_rate": 2.3867966533270716e-05,
"loss": 0.3695,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1320725679397583,
"step": 4190,
"valid_targets_mean": 11071.5,
"valid_targets_min": 860
},
{
"epoch": 2.4749262536873156,
"grad_norm": 0.19971733040726514,
"learning_rate": 2.3827545609201462e-05,
"loss": 0.3641,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14172565937042236,
"step": 4195,
"valid_targets_mean": 11408.9,
"valid_targets_min": 2015
},
{
"epoch": 2.47787610619469,
"grad_norm": 0.1895322692289199,
"learning_rate": 2.3787108450125133e-05,
"loss": 0.372,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10191375017166138,
"step": 4200,
"valid_targets_mean": 9568.1,
"valid_targets_min": 1913
},
{
"epoch": 2.4808259587020647,
"grad_norm": 0.189797790905414,
"learning_rate": 2.3746655227560932e-05,
"loss": 0.3743,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11338387429714203,
"step": 4205,
"valid_targets_mean": 9056.0,
"valid_targets_min": 1585
},
{
"epoch": 2.4837758112094397,
"grad_norm": 0.19042071073474165,
"learning_rate": 2.3706186113096187e-05,
"loss": 0.3688,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1429302990436554,
"step": 4210,
"valid_targets_mean": 13044.3,
"valid_targets_min": 2160
},
{
"epoch": 2.4867256637168142,
"grad_norm": 0.194122243175992,
"learning_rate": 2.366570127838564e-05,
"loss": 0.3738,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10320837795734406,
"step": 4215,
"valid_targets_mean": 9486.9,
"valid_targets_min": 1543
},
{
"epoch": 2.489675516224189,
"grad_norm": 0.17235334362756774,
"learning_rate": 2.362520089515073e-05,
"loss": 0.374,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10433302819728851,
"step": 4220,
"valid_targets_mean": 9637.9,
"valid_targets_min": 1453
},
{
"epoch": 2.4926253687315634,
"grad_norm": 0.17737199801949888,
"learning_rate": 2.358468513517882e-05,
"loss": 0.3744,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1555056869983673,
"step": 4225,
"valid_targets_mean": 11221.1,
"valid_targets_min": 1861
},
{
"epoch": 2.495575221238938,
"grad_norm": 0.1776538389094094,
"learning_rate": 2.35441541703225e-05,
"loss": 0.3734,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10380370914936066,
"step": 4230,
"valid_targets_mean": 7896.7,
"valid_targets_min": 1601
},
{
"epoch": 2.4985250737463125,
"grad_norm": 0.16806275136850427,
"learning_rate": 2.3503608172498878e-05,
"loss": 0.3737,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1344701498746872,
"step": 4235,
"valid_targets_mean": 11206.3,
"valid_targets_min": 2567
},
{
"epoch": 2.501474926253687,
"grad_norm": 0.1838042863563555,
"learning_rate": 2.346304731368879e-05,
"loss": 0.3638,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12868273258209229,
"step": 4240,
"valid_targets_mean": 9940.7,
"valid_targets_min": 1487
},
{
"epoch": 2.504424778761062,
"grad_norm": 0.1882399630093764,
"learning_rate": 2.3422471765936124e-05,
"loss": 0.3703,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12242631614208221,
"step": 4245,
"valid_targets_mean": 9426.9,
"valid_targets_min": 1920
},
{
"epoch": 2.5073746312684366,
"grad_norm": 0.1927731789030749,
"learning_rate": 2.338188170134709e-05,
"loss": 0.3738,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1051219254732132,
"step": 4250,
"valid_targets_mean": 7889.9,
"valid_targets_min": 1997
},
{
"epoch": 2.510324483775811,
"grad_norm": 0.19010092340967272,
"learning_rate": 2.3341277292089446e-05,
"loss": 0.3655,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10231277346611023,
"step": 4255,
"valid_targets_mean": 8702.3,
"valid_targets_min": 2150
},
{
"epoch": 2.5132743362831858,
"grad_norm": 0.18926011510358104,
"learning_rate": 2.33006587103918e-05,
"loss": 0.362,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14327773451805115,
"step": 4260,
"valid_targets_mean": 11533.9,
"valid_targets_min": 1871
},
{
"epoch": 2.5162241887905603,
"grad_norm": 0.19331180232935863,
"learning_rate": 2.3260026128542886e-05,
"loss": 0.3586,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11851916462182999,
"step": 4265,
"valid_targets_mean": 10099.0,
"valid_targets_min": 2449
},
{
"epoch": 2.5191740412979353,
"grad_norm": 0.19110202290037573,
"learning_rate": 2.3219379718890814e-05,
"loss": 0.3637,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13638907670974731,
"step": 4270,
"valid_targets_mean": 10613.0,
"valid_targets_min": 1767
},
{
"epoch": 2.52212389380531,
"grad_norm": 0.18240060005875852,
"learning_rate": 2.317871965384235e-05,
"loss": 0.3725,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12266083061695099,
"step": 4275,
"valid_targets_mean": 9735.8,
"valid_targets_min": 1444
},
{
"epoch": 2.5250737463126844,
"grad_norm": 0.19650112914503412,
"learning_rate": 2.3138046105862175e-05,
"loss": 0.3779,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13388144969940186,
"step": 4280,
"valid_targets_mean": 12089.4,
"valid_targets_min": 1483
},
{
"epoch": 2.528023598820059,
"grad_norm": 0.18887624139751505,
"learning_rate": 2.3097359247472156e-05,
"loss": 0.3742,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12826773524284363,
"step": 4285,
"valid_targets_mean": 9522.6,
"valid_targets_min": 747
},
{
"epoch": 2.5309734513274336,
"grad_norm": 0.1966567564253813,
"learning_rate": 2.3056659251250637e-05,
"loss": 0.3618,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08406929671764374,
"step": 4290,
"valid_targets_mean": 6589.8,
"valid_targets_min": 1001
},
{
"epoch": 2.533923303834808,
"grad_norm": 0.18282408339040876,
"learning_rate": 2.301594628983166e-05,
"loss": 0.3742,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11688566207885742,
"step": 4295,
"valid_targets_mean": 8307.7,
"valid_targets_min": 1442
},
{
"epoch": 2.5368731563421827,
"grad_norm": 0.1875617083131164,
"learning_rate": 2.2975220535904286e-05,
"loss": 0.3645,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11464380472898483,
"step": 4300,
"valid_targets_mean": 9174.5,
"valid_targets_min": 2099
},
{
"epoch": 2.5398230088495577,
"grad_norm": 0.1882850853875356,
"learning_rate": 2.2934482162211827e-05,
"loss": 0.3674,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.127057284116745,
"step": 4305,
"valid_targets_mean": 9977.2,
"valid_targets_min": 1385
},
{
"epoch": 2.5427728613569323,
"grad_norm": 0.1889501349131273,
"learning_rate": 2.2893731341551117e-05,
"loss": 0.3695,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10239008069038391,
"step": 4310,
"valid_targets_mean": 8322.1,
"valid_targets_min": 2131
},
{
"epoch": 2.545722713864307,
"grad_norm": 0.17697629988020622,
"learning_rate": 2.285296824677179e-05,
"loss": 0.3745,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12793973088264465,
"step": 4315,
"valid_targets_mean": 10406.2,
"valid_targets_min": 1407
},
{
"epoch": 2.5486725663716814,
"grad_norm": 0.19561789633386095,
"learning_rate": 2.2812193050775552e-05,
"loss": 0.3625,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.140027716755867,
"step": 4320,
"valid_targets_mean": 12493.9,
"valid_targets_min": 2457
},
{
"epoch": 2.551622418879056,
"grad_norm": 0.1802313241831928,
"learning_rate": 2.2771405926515423e-05,
"loss": 0.363,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10761629045009613,
"step": 4325,
"valid_targets_mean": 9960.1,
"valid_targets_min": 2052
},
{
"epoch": 2.554572271386431,
"grad_norm": 0.1751657945259594,
"learning_rate": 2.2730607046995026e-05,
"loss": 0.3738,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10588338226079941,
"step": 4330,
"valid_targets_mean": 8378.8,
"valid_targets_min": 1560
},
{
"epoch": 2.557522123893805,
"grad_norm": 0.19248830700949682,
"learning_rate": 2.2689796585267843e-05,
"loss": 0.3674,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11182724684476852,
"step": 4335,
"valid_targets_mean": 9472.5,
"valid_targets_min": 2484
},
{
"epoch": 2.56047197640118,
"grad_norm": 0.18435708690786634,
"learning_rate": 2.2648974714436473e-05,
"loss": 0.3712,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11992965638637543,
"step": 4340,
"valid_targets_mean": 10299.2,
"valid_targets_min": 878
},
{
"epoch": 2.5634218289085546,
"grad_norm": 0.17894693429898967,
"learning_rate": 2.260814160765194e-05,
"loss": 0.3693,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13005350530147552,
"step": 4345,
"valid_targets_mean": 10887.9,
"valid_targets_min": 2125
},
{
"epoch": 2.566371681415929,
"grad_norm": 0.17833561968446868,
"learning_rate": 2.2567297438112896e-05,
"loss": 0.3667,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15313655138015747,
"step": 4350,
"valid_targets_mean": 12573.0,
"valid_targets_min": 2048
},
{
"epoch": 2.5693215339233038,
"grad_norm": 0.18379146848722314,
"learning_rate": 2.2526442379064926e-05,
"loss": 0.371,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11305586993694305,
"step": 4355,
"valid_targets_mean": 9179.3,
"valid_targets_min": 1147
},
{
"epoch": 2.5722713864306783,
"grad_norm": 0.1753040455053401,
"learning_rate": 2.2485576603799804e-05,
"loss": 0.3628,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1262725293636322,
"step": 4360,
"valid_targets_mean": 10706.8,
"valid_targets_min": 1593
},
{
"epoch": 2.5752212389380533,
"grad_norm": 0.18485595887788345,
"learning_rate": 2.2444700285654765e-05,
"loss": 0.3662,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11888639628887177,
"step": 4365,
"valid_targets_mean": 9218.1,
"valid_targets_min": 2137
},
{
"epoch": 2.578171091445428,
"grad_norm": 0.19103757174545843,
"learning_rate": 2.240381359801175e-05,
"loss": 0.3709,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13815957307815552,
"step": 4370,
"valid_targets_mean": 11224.7,
"valid_targets_min": 1822
},
{
"epoch": 2.5811209439528024,
"grad_norm": 0.18190256491713522,
"learning_rate": 2.236291671429669e-05,
"loss": 0.367,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1305564045906067,
"step": 4375,
"valid_targets_mean": 11156.6,
"valid_targets_min": 1606
},
{
"epoch": 2.584070796460177,
"grad_norm": 0.1912488927143699,
"learning_rate": 2.232200980797877e-05,
"loss": 0.3663,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13565358519554138,
"step": 4380,
"valid_targets_mean": 10960.1,
"valid_targets_min": 1556
},
{
"epoch": 2.5870206489675516,
"grad_norm": 0.19092041778251356,
"learning_rate": 2.2281093052569677e-05,
"loss": 0.3701,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1110101193189621,
"step": 4385,
"valid_targets_mean": 9461.7,
"valid_targets_min": 1929
},
{
"epoch": 2.589970501474926,
"grad_norm": 0.1909995367933586,
"learning_rate": 2.224016662162289e-05,
"loss": 0.3754,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1283772736787796,
"step": 4390,
"valid_targets_mean": 9745.5,
"valid_targets_min": 1581
},
{
"epoch": 2.5929203539823007,
"grad_norm": 0.1875279301690173,
"learning_rate": 2.2199230688732906e-05,
"loss": 0.3641,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12525217235088348,
"step": 4395,
"valid_targets_mean": 10080.6,
"valid_targets_min": 2923
},
{
"epoch": 2.5958702064896757,
"grad_norm": 0.20272720547415712,
"learning_rate": 2.2158285427534537e-05,
"loss": 0.3613,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11715195327997208,
"step": 4400,
"valid_targets_mean": 8127.2,
"valid_targets_min": 1571
},
{
"epoch": 2.5988200589970503,
"grad_norm": 0.17990153107875204,
"learning_rate": 2.2117331011702164e-05,
"loss": 0.3716,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11927230656147003,
"step": 4405,
"valid_targets_mean": 10449.8,
"valid_targets_min": 1912
},
{
"epoch": 2.601769911504425,
"grad_norm": 0.18373357287582748,
"learning_rate": 2.2076367614948997e-05,
"loss": 0.3698,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10929173231124878,
"step": 4410,
"valid_targets_mean": 8532.2,
"valid_targets_min": 1791
},
{
"epoch": 2.6047197640117994,
"grad_norm": 0.18399152008258768,
"learning_rate": 2.2035395411026338e-05,
"loss": 0.3719,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1311100572347641,
"step": 4415,
"valid_targets_mean": 11387.8,
"valid_targets_min": 2003
},
{
"epoch": 2.607669616519174,
"grad_norm": 0.18439145618369485,
"learning_rate": 2.1994414573722834e-05,
"loss": 0.3709,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11850002408027649,
"step": 4420,
"valid_targets_mean": 9229.9,
"valid_targets_min": 2522
},
{
"epoch": 2.6106194690265485,
"grad_norm": 0.18488957845098064,
"learning_rate": 2.195342527686379e-05,
"loss": 0.3673,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14204034209251404,
"step": 4425,
"valid_targets_mean": 12198.8,
"valid_targets_min": 1675
},
{
"epoch": 2.613569321533923,
"grad_norm": 0.19286103565402618,
"learning_rate": 2.191242769431035e-05,
"loss": 0.369,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1183563768863678,
"step": 4430,
"valid_targets_mean": 10017.0,
"valid_targets_min": 1776
},
{
"epoch": 2.616519174041298,
"grad_norm": 0.17380589005055547,
"learning_rate": 2.1871421999958823e-05,
"loss": 0.3673,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11534374952316284,
"step": 4435,
"valid_targets_mean": 10342.0,
"valid_targets_min": 1961
},
{
"epoch": 2.6194690265486726,
"grad_norm": 0.18262589410060973,
"learning_rate": 2.1830408367739922e-05,
"loss": 0.3679,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11956163495779037,
"step": 4440,
"valid_targets_mean": 9962.6,
"valid_targets_min": 2405
},
{
"epoch": 2.622418879056047,
"grad_norm": 0.18353878588806358,
"learning_rate": 2.1789386971618033e-05,
"loss": 0.3693,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10075725615024567,
"step": 4445,
"valid_targets_mean": 8304.7,
"valid_targets_min": 1978
},
{
"epoch": 2.6253687315634218,
"grad_norm": 0.18338574101129995,
"learning_rate": 2.1748357985590464e-05,
"loss": 0.3663,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13569006323814392,
"step": 4450,
"valid_targets_mean": 12342.4,
"valid_targets_min": 2187
},
{
"epoch": 2.6283185840707963,
"grad_norm": 0.18731950611432518,
"learning_rate": 2.1707321583686723e-05,
"loss": 0.3677,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11985199898481369,
"step": 4455,
"valid_targets_mean": 9165.0,
"valid_targets_min": 832
},
{
"epoch": 2.6312684365781713,
"grad_norm": 0.18179109075455493,
"learning_rate": 2.166627793996778e-05,
"loss": 0.3687,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11996208131313324,
"step": 4460,
"valid_targets_mean": 10573.9,
"valid_targets_min": 2386
},
{
"epoch": 2.6342182890855455,
"grad_norm": 0.17639732749552067,
"learning_rate": 2.162522722852531e-05,
"loss": 0.3753,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09830086678266525,
"step": 4465,
"valid_targets_mean": 8261.4,
"valid_targets_min": 1439
},
{
"epoch": 2.6371681415929205,
"grad_norm": 0.18624863734756492,
"learning_rate": 2.1584169623480977e-05,
"loss": 0.3793,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1318359673023224,
"step": 4470,
"valid_targets_mean": 9847.7,
"valid_targets_min": 1767
},
{
"epoch": 2.640117994100295,
"grad_norm": 0.18671149749630092,
"learning_rate": 2.1543105298985677e-05,
"loss": 0.3677,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.142843559384346,
"step": 4475,
"valid_targets_mean": 13030.2,
"valid_targets_min": 2483
},
{
"epoch": 2.6430678466076696,
"grad_norm": 0.17576915778049942,
"learning_rate": 2.150203442921881e-05,
"loss": 0.3656,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11096139997243881,
"step": 4480,
"valid_targets_mean": 9731.1,
"valid_targets_min": 1703
},
{
"epoch": 2.646017699115044,
"grad_norm": 0.19021455051682687,
"learning_rate": 2.146095718838754e-05,
"loss": 0.3673,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1263219118118286,
"step": 4485,
"valid_targets_mean": 10780.1,
"valid_targets_min": 1649
},
{
"epoch": 2.6489675516224187,
"grad_norm": 0.25149441730176714,
"learning_rate": 2.1419873750726047e-05,
"loss": 0.3745,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12710106372833252,
"step": 4490,
"valid_targets_mean": 10743.4,
"valid_targets_min": 1801
},
{
"epoch": 2.6519174041297937,
"grad_norm": 0.19309226911864125,
"learning_rate": 2.137878429049481e-05,
"loss": 0.3757,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09978538751602173,
"step": 4495,
"valid_targets_mean": 9102.6,
"valid_targets_min": 1830
},
{
"epoch": 2.6548672566371683,
"grad_norm": 0.187598366499337,
"learning_rate": 2.133768898197984e-05,
"loss": 0.3647,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10561759769916534,
"step": 4500,
"valid_targets_mean": 9400.9,
"valid_targets_min": 1853
},
{
"epoch": 2.657817109144543,
"grad_norm": 0.18176956089972085,
"learning_rate": 2.129658799949197e-05,
"loss": 0.3588,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11985710263252258,
"step": 4505,
"valid_targets_mean": 10114.0,
"valid_targets_min": 2144
},
{
"epoch": 2.6607669616519174,
"grad_norm": 0.19152705920323992,
"learning_rate": 2.1255481517366076e-05,
"loss": 0.3588,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12177897989749908,
"step": 4510,
"valid_targets_mean": 9553.2,
"valid_targets_min": 2181
},
{
"epoch": 2.663716814159292,
"grad_norm": 0.20006455174532503,
"learning_rate": 2.1214369709960384e-05,
"loss": 0.3698,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12645691633224487,
"step": 4515,
"valid_targets_mean": 9748.7,
"valid_targets_min": 856
},
{
"epoch": 2.6666666666666665,
"grad_norm": 0.1951469538446342,
"learning_rate": 2.1173252751655697e-05,
"loss": 0.3723,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1358049213886261,
"step": 4520,
"valid_targets_mean": 12207.3,
"valid_targets_min": 2941
},
{
"epoch": 2.669616519174041,
"grad_norm": 0.17741183567028762,
"learning_rate": 2.113213081685466e-05,
"loss": 0.3678,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1099037230014801,
"step": 4525,
"valid_targets_mean": 9607.7,
"valid_targets_min": 1480
},
{
"epoch": 2.672566371681416,
"grad_norm": 0.17114246748827758,
"learning_rate": 2.109100407998105e-05,
"loss": 0.3756,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1161927580833435,
"step": 4530,
"valid_targets_mean": 10516.6,
"valid_targets_min": 1750
},
{
"epoch": 2.6755162241887906,
"grad_norm": 0.1736298535501412,
"learning_rate": 2.104987271547899e-05,
"loss": 0.3685,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10709735751152039,
"step": 4535,
"valid_targets_mean": 9166.2,
"valid_targets_min": 2342
},
{
"epoch": 2.678466076696165,
"grad_norm": 0.18858861763150891,
"learning_rate": 2.1008736897812233e-05,
"loss": 0.3703,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14287090301513672,
"step": 4540,
"valid_targets_mean": 10198.2,
"valid_targets_min": 1888
},
{
"epoch": 2.6814159292035398,
"grad_norm": 0.20388340088823198,
"learning_rate": 2.0967596801463433e-05,
"loss": 0.3695,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12462417036294937,
"step": 4545,
"valid_targets_mean": 9976.0,
"valid_targets_min": 1591
},
{
"epoch": 2.6843657817109143,
"grad_norm": 0.18788704479085547,
"learning_rate": 2.0926452600933388e-05,
"loss": 0.3652,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11166876554489136,
"step": 4550,
"valid_targets_mean": 8667.3,
"valid_targets_min": 1636
},
{
"epoch": 2.6873156342182893,
"grad_norm": 0.18354787267923775,
"learning_rate": 2.0885304470740294e-05,
"loss": 0.3691,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14732298254966736,
"step": 4555,
"valid_targets_mean": 11671.9,
"valid_targets_min": 1372
},
{
"epoch": 2.6902654867256635,
"grad_norm": 0.1982192113522515,
"learning_rate": 2.084415258541903e-05,
"loss": 0.3702,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10863981395959854,
"step": 4560,
"valid_targets_mean": 8705.5,
"valid_targets_min": 788
},
{
"epoch": 2.6932153392330385,
"grad_norm": 0.18149704019737828,
"learning_rate": 2.0802997119520393e-05,
"loss": 0.3706,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12404702603816986,
"step": 4565,
"valid_targets_mean": 10789.9,
"valid_targets_min": 1629
},
{
"epoch": 2.696165191740413,
"grad_norm": 0.1792480079906465,
"learning_rate": 2.0761838247610372e-05,
"loss": 0.3748,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11676395684480667,
"step": 4570,
"valid_targets_mean": 9820.9,
"valid_targets_min": 2079
},
{
"epoch": 2.6991150442477876,
"grad_norm": 0.16606762751806176,
"learning_rate": 2.0720676144269407e-05,
"loss": 0.3665,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11027930676937103,
"step": 4575,
"valid_targets_mean": 9519.0,
"valid_targets_min": 1443
},
{
"epoch": 2.702064896755162,
"grad_norm": 0.16722925771852787,
"learning_rate": 2.067951098409162e-05,
"loss": 0.3671,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1202898919582367,
"step": 4580,
"valid_targets_mean": 11148.6,
"valid_targets_min": 2844
},
{
"epoch": 2.7050147492625367,
"grad_norm": 0.18963004352089147,
"learning_rate": 2.0638342941684146e-05,
"loss": 0.3704,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15341144800186157,
"step": 4585,
"valid_targets_mean": 11772.3,
"valid_targets_min": 2041
},
{
"epoch": 2.7079646017699117,
"grad_norm": 0.1807969224641405,
"learning_rate": 2.0597172191666304e-05,
"loss": 0.3662,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1127198189496994,
"step": 4590,
"valid_targets_mean": 9464.2,
"valid_targets_min": 2006
},
{
"epoch": 2.7109144542772863,
"grad_norm": 0.1765733977482184,
"learning_rate": 2.05559989086689e-05,
"loss": 0.3723,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11121810972690582,
"step": 4595,
"valid_targets_mean": 10115.8,
"valid_targets_min": 2033
},
{
"epoch": 2.713864306784661,
"grad_norm": 0.18313305838435828,
"learning_rate": 2.0514823267333517e-05,
"loss": 0.3622,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09712762385606766,
"step": 4600,
"valid_targets_mean": 8914.2,
"valid_targets_min": 1829
},
{
"epoch": 2.7168141592920354,
"grad_norm": 0.19119710102039167,
"learning_rate": 2.0473645442311704e-05,
"loss": 0.3644,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1367199420928955,
"step": 4605,
"valid_targets_mean": 11594.1,
"valid_targets_min": 1466
},
{
"epoch": 2.71976401179941,
"grad_norm": 0.17179732392777203,
"learning_rate": 2.04324656082643e-05,
"loss": 0.3664,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12338307499885559,
"step": 4610,
"valid_targets_mean": 10735.3,
"valid_targets_min": 1786
},
{
"epoch": 2.7227138643067845,
"grad_norm": 0.19797993394417737,
"learning_rate": 2.0391283939860642e-05,
"loss": 0.3654,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12678474187850952,
"step": 4615,
"valid_targets_mean": 11454.9,
"valid_targets_min": 2305
},
{
"epoch": 2.725663716814159,
"grad_norm": 0.18470224773039076,
"learning_rate": 2.0350100611777857e-05,
"loss": 0.3727,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10877864062786102,
"step": 4620,
"valid_targets_mean": 9119.2,
"valid_targets_min": 933
},
{
"epoch": 2.728613569321534,
"grad_norm": 0.18900877777413866,
"learning_rate": 2.0308915798700125e-05,
"loss": 0.3718,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10504063218832016,
"step": 4625,
"valid_targets_mean": 9410.8,
"valid_targets_min": 1837
},
{
"epoch": 2.7315634218289087,
"grad_norm": 0.17971348147208774,
"learning_rate": 2.0267729675317907e-05,
"loss": 0.3628,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10653070360422134,
"step": 4630,
"valid_targets_mean": 9461.3,
"valid_targets_min": 1841
},
{
"epoch": 2.734513274336283,
"grad_norm": 0.17252415962273776,
"learning_rate": 2.022654241632723e-05,
"loss": 0.3677,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14466625452041626,
"step": 4635,
"valid_targets_mean": 12400.2,
"valid_targets_min": 2042
},
{
"epoch": 2.737463126843658,
"grad_norm": 0.17425963981703763,
"learning_rate": 2.018535419642894e-05,
"loss": 0.3686,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14283370971679688,
"step": 4640,
"valid_targets_mean": 12530.3,
"valid_targets_min": 2926
},
{
"epoch": 2.7404129793510323,
"grad_norm": 0.23167496325337464,
"learning_rate": 2.0144165190327944e-05,
"loss": 0.3661,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.131038635969162,
"step": 4645,
"valid_targets_mean": 10509.6,
"valid_targets_min": 649
},
{
"epoch": 2.7433628318584073,
"grad_norm": 0.17833373920160922,
"learning_rate": 2.0102975572732503e-05,
"loss": 0.3643,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11860808730125427,
"step": 4650,
"valid_targets_mean": 9454.0,
"valid_targets_min": 2003
},
{
"epoch": 2.7463126843657815,
"grad_norm": 0.17324651993806348,
"learning_rate": 2.0061785518353468e-05,
"loss": 0.3676,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11439033597707748,
"step": 4655,
"valid_targets_mean": 9103.6,
"valid_targets_min": 1608
},
{
"epoch": 2.7492625368731565,
"grad_norm": 0.19583402036382658,
"learning_rate": 2.002059520190352e-05,
"loss": 0.3644,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11621478199958801,
"step": 4660,
"valid_targets_mean": 9436.6,
"valid_targets_min": 2137
},
{
"epoch": 2.752212389380531,
"grad_norm": 0.19255695069921716,
"learning_rate": 1.9979404798096488e-05,
"loss": 0.3654,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11613614857196808,
"step": 4665,
"valid_targets_mean": 9747.0,
"valid_targets_min": 1135
},
{
"epoch": 2.7551622418879056,
"grad_norm": 0.18838882767985898,
"learning_rate": 1.9938214481646542e-05,
"loss": 0.3693,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12855328619480133,
"step": 4670,
"valid_targets_mean": 10079.6,
"valid_targets_min": 2286
},
{
"epoch": 2.75811209439528,
"grad_norm": 0.18275839926832513,
"learning_rate": 1.9897024427267503e-05,
"loss": 0.3736,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12765586376190186,
"step": 4675,
"valid_targets_mean": 10582.6,
"valid_targets_min": 1657
},
{
"epoch": 2.7610619469026547,
"grad_norm": 0.1834833774953928,
"learning_rate": 1.9855834809672062e-05,
"loss": 0.3721,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11331748217344284,
"step": 4680,
"valid_targets_mean": 8869.7,
"valid_targets_min": 1883
},
{
"epoch": 2.7640117994100297,
"grad_norm": 0.19381022380541693,
"learning_rate": 1.981464580357107e-05,
"loss": 0.3595,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12564757466316223,
"step": 4685,
"valid_targets_mean": 10999.8,
"valid_targets_min": 1608
},
{
"epoch": 2.7669616519174043,
"grad_norm": 0.18231953861993394,
"learning_rate": 1.9773457583672774e-05,
"loss": 0.3688,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12267229706048965,
"step": 4690,
"valid_targets_mean": 10845.2,
"valid_targets_min": 1769
},
{
"epoch": 2.769911504424779,
"grad_norm": 0.1755478274789862,
"learning_rate": 1.9732270324682096e-05,
"loss": 0.366,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12882521748542786,
"step": 4695,
"valid_targets_mean": 11583.4,
"valid_targets_min": 2726
},
{
"epoch": 2.7728613569321534,
"grad_norm": 0.17971417614952098,
"learning_rate": 1.9691084201299882e-05,
"loss": 0.3635,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10892309248447418,
"step": 4700,
"valid_targets_mean": 9023.2,
"valid_targets_min": 1719
},
{
"epoch": 2.775811209439528,
"grad_norm": 0.19549557753074975,
"learning_rate": 1.9649899388222146e-05,
"loss": 0.367,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14118340611457825,
"step": 4705,
"valid_targets_mean": 11621.1,
"valid_targets_min": 1627
},
{
"epoch": 2.7787610619469025,
"grad_norm": 0.19667987961284608,
"learning_rate": 1.9608716060139364e-05,
"loss": 0.3628,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14556458592414856,
"step": 4710,
"valid_targets_mean": 10227.8,
"valid_targets_min": 2542
},
{
"epoch": 2.781710914454277,
"grad_norm": 0.19029304074955575,
"learning_rate": 1.9567534391735704e-05,
"loss": 0.3596,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11205069720745087,
"step": 4715,
"valid_targets_mean": 8847.1,
"valid_targets_min": 2962
},
{
"epoch": 2.784660766961652,
"grad_norm": 0.19017228149174456,
"learning_rate": 1.95263545576883e-05,
"loss": 0.3688,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12900149822235107,
"step": 4720,
"valid_targets_mean": 11824.5,
"valid_targets_min": 2336
},
{
"epoch": 2.7876106194690267,
"grad_norm": 0.17552727463563755,
"learning_rate": 1.9485176732666483e-05,
"loss": 0.3699,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15375812351703644,
"step": 4725,
"valid_targets_mean": 13422.8,
"valid_targets_min": 2469
},
{
"epoch": 2.7905604719764012,
"grad_norm": 0.17668174384809351,
"learning_rate": 1.9444001091331106e-05,
"loss": 0.3663,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0886571928858757,
"step": 4730,
"valid_targets_mean": 8039.5,
"valid_targets_min": 1011
},
{
"epoch": 2.793510324483776,
"grad_norm": 0.18169782556029626,
"learning_rate": 1.9402827808333703e-05,
"loss": 0.365,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09978793561458588,
"step": 4735,
"valid_targets_mean": 8162.9,
"valid_targets_min": 1768
},
{
"epoch": 2.7964601769911503,
"grad_norm": 0.19792473116928858,
"learning_rate": 1.936165705831586e-05,
"loss": 0.366,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1303151547908783,
"step": 4740,
"valid_targets_mean": 9680.6,
"valid_targets_min": 1517
},
{
"epoch": 2.799410029498525,
"grad_norm": 0.19539839901298892,
"learning_rate": 1.9320489015908382e-05,
"loss": 0.3673,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12567034363746643,
"step": 4745,
"valid_targets_mean": 10204.0,
"valid_targets_min": 1856
},
{
"epoch": 2.8023598820058995,
"grad_norm": 0.18421451976344766,
"learning_rate": 1.9279323855730607e-05,
"loss": 0.3644,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1409921497106552,
"step": 4750,
"valid_targets_mean": 11088.9,
"valid_targets_min": 3033
},
{
"epoch": 2.8053097345132745,
"grad_norm": 0.1832810400326197,
"learning_rate": 1.923816175238963e-05,
"loss": 0.3712,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10676514357328415,
"step": 4755,
"valid_targets_mean": 8808.9,
"valid_targets_min": 1628
},
{
"epoch": 2.808259587020649,
"grad_norm": 0.1810538852883411,
"learning_rate": 1.9197002880479617e-05,
"loss": 0.3641,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12992864847183228,
"step": 4760,
"valid_targets_mean": 10004.9,
"valid_targets_min": 2090
},
{
"epoch": 2.8112094395280236,
"grad_norm": 0.1738368857577118,
"learning_rate": 1.9155847414580976e-05,
"loss": 0.3703,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12918700277805328,
"step": 4765,
"valid_targets_mean": 11585.9,
"valid_targets_min": 1578
},
{
"epoch": 2.814159292035398,
"grad_norm": 0.18899097255754913,
"learning_rate": 1.911469552925971e-05,
"loss": 0.3648,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13440260291099548,
"step": 4770,
"valid_targets_mean": 10658.7,
"valid_targets_min": 1712
},
{
"epoch": 2.8171091445427727,
"grad_norm": 0.1795972722764541,
"learning_rate": 1.9073547399066622e-05,
"loss": 0.3669,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1385485976934433,
"step": 4775,
"valid_targets_mean": 11714.4,
"valid_targets_min": 2874
},
{
"epoch": 2.8200589970501477,
"grad_norm": 0.18542696771062736,
"learning_rate": 1.903240319853657e-05,
"loss": 0.3627,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10369464010000229,
"step": 4780,
"valid_targets_mean": 9205.3,
"valid_targets_min": 2733
},
{
"epoch": 2.823008849557522,
"grad_norm": 0.1781187344729139,
"learning_rate": 1.899126310218777e-05,
"loss": 0.3615,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10259953886270523,
"step": 4785,
"valid_targets_mean": 8837.8,
"valid_targets_min": 2032
},
{
"epoch": 2.825958702064897,
"grad_norm": 0.17727229452137436,
"learning_rate": 1.8950127284521017e-05,
"loss": 0.363,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11819326877593994,
"step": 4790,
"valid_targets_mean": 10313.7,
"valid_targets_min": 2037
},
{
"epoch": 2.8289085545722714,
"grad_norm": 0.18090764145907315,
"learning_rate": 1.890899592001895e-05,
"loss": 0.3676,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09841946512460709,
"step": 4795,
"valid_targets_mean": 8079.2,
"valid_targets_min": 1799
},
{
"epoch": 2.831858407079646,
"grad_norm": 0.17355190974088425,
"learning_rate": 1.886786918314534e-05,
"loss": 0.3596,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14969128370285034,
"step": 4800,
"valid_targets_mean": 11687.4,
"valid_targets_min": 1660
},
{
"epoch": 2.8348082595870205,
"grad_norm": 0.17647187850701593,
"learning_rate": 1.8826747248344313e-05,
"loss": 0.372,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11566095054149628,
"step": 4805,
"valid_targets_mean": 9689.1,
"valid_targets_min": 1213
},
{
"epoch": 2.837758112094395,
"grad_norm": 0.17722114617807447,
"learning_rate": 1.8785630290039623e-05,
"loss": 0.3669,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1614227592945099,
"step": 4810,
"valid_targets_mean": 13727.9,
"valid_targets_min": 2019
},
{
"epoch": 2.84070796460177,
"grad_norm": 0.1773785236767756,
"learning_rate": 1.8744518482633934e-05,
"loss": 0.3651,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10308026522397995,
"step": 4815,
"valid_targets_mean": 8408.8,
"valid_targets_min": 1770
},
{
"epoch": 2.8436578171091447,
"grad_norm": 0.17990207506219663,
"learning_rate": 1.8703412000508038e-05,
"loss": 0.37,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13289114832878113,
"step": 4820,
"valid_targets_mean": 10496.0,
"valid_targets_min": 1924
},
{
"epoch": 2.8466076696165192,
"grad_norm": 0.1775576622667924,
"learning_rate": 1.8662311018020164e-05,
"loss": 0.3654,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1118200272321701,
"step": 4825,
"valid_targets_mean": 9131.2,
"valid_targets_min": 2712
},
{
"epoch": 2.849557522123894,
"grad_norm": 0.19810895558544087,
"learning_rate": 1.8621215709505193e-05,
"loss": 0.3661,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12048914283514023,
"step": 4830,
"valid_targets_mean": 8391.5,
"valid_targets_min": 1896
},
{
"epoch": 2.8525073746312684,
"grad_norm": 0.17216688915829712,
"learning_rate": 1.8580126249273963e-05,
"loss": 0.361,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11605193465948105,
"step": 4835,
"valid_targets_mean": 9973.9,
"valid_targets_min": 1874
},
{
"epoch": 2.855457227138643,
"grad_norm": 0.16684034444297652,
"learning_rate": 1.853904281161247e-05,
"loss": 0.3649,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12890911102294922,
"step": 4840,
"valid_targets_mean": 11387.2,
"valid_targets_min": 2079
},
{
"epoch": 2.8584070796460175,
"grad_norm": 0.1778916844191916,
"learning_rate": 1.8497965570781194e-05,
"loss": 0.3644,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12453418970108032,
"step": 4845,
"valid_targets_mean": 9381.8,
"valid_targets_min": 1708
},
{
"epoch": 2.8613569321533925,
"grad_norm": 0.180746525736262,
"learning_rate": 1.845689470101433e-05,
"loss": 0.3692,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11520042270421982,
"step": 4850,
"valid_targets_mean": 8509.3,
"valid_targets_min": 1118
},
{
"epoch": 2.864306784660767,
"grad_norm": 0.17748264133156372,
"learning_rate": 1.8415830376519023e-05,
"loss": 0.3698,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12190565466880798,
"step": 4855,
"valid_targets_mean": 10374.7,
"valid_targets_min": 2011
},
{
"epoch": 2.8672566371681416,
"grad_norm": 0.17404569841144527,
"learning_rate": 1.8374772771474697e-05,
"loss": 0.368,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1507178097963333,
"step": 4860,
"valid_targets_mean": 12519.0,
"valid_targets_min": 1887
},
{
"epoch": 2.870206489675516,
"grad_norm": 0.17223673440063744,
"learning_rate": 1.8333722060032224e-05,
"loss": 0.3614,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11666902899742126,
"step": 4865,
"valid_targets_mean": 9916.1,
"valid_targets_min": 1793
},
{
"epoch": 2.8731563421828907,
"grad_norm": 0.18930517136336042,
"learning_rate": 1.8292678416313283e-05,
"loss": 0.3735,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1369718611240387,
"step": 4870,
"valid_targets_mean": 10340.9,
"valid_targets_min": 1125
},
{
"epoch": 2.8761061946902657,
"grad_norm": 0.18700065727926024,
"learning_rate": 1.8251642014409543e-05,
"loss": 0.3634,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12782393395900726,
"step": 4875,
"valid_targets_mean": 9584.5,
"valid_targets_min": 2028
},
{
"epoch": 2.87905604719764,
"grad_norm": 0.18553220648070542,
"learning_rate": 1.821061302838198e-05,
"loss": 0.371,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13950929045677185,
"step": 4880,
"valid_targets_mean": 11590.9,
"valid_targets_min": 2261
},
{
"epoch": 2.882005899705015,
"grad_norm": 0.17299523715979212,
"learning_rate": 1.8169591632260085e-05,
"loss": 0.3667,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13274073600769043,
"step": 4885,
"valid_targets_mean": 11354.4,
"valid_targets_min": 1773
},
{
"epoch": 2.8849557522123894,
"grad_norm": 0.17027993458233717,
"learning_rate": 1.8128578000041187e-05,
"loss": 0.3674,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11688661575317383,
"step": 4890,
"valid_targets_mean": 9635.8,
"valid_targets_min": 2187
},
{
"epoch": 2.887905604719764,
"grad_norm": 0.3110297576805822,
"learning_rate": 1.8087572305689657e-05,
"loss": 0.3608,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12430237233638763,
"step": 4895,
"valid_targets_mean": 10532.5,
"valid_targets_min": 1940
},
{
"epoch": 2.8908554572271385,
"grad_norm": 0.17883439437077342,
"learning_rate": 1.8046574723136218e-05,
"loss": 0.3655,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13129037618637085,
"step": 4900,
"valid_targets_mean": 11384.6,
"valid_targets_min": 2096
},
{
"epoch": 2.893805309734513,
"grad_norm": 0.18072943139923472,
"learning_rate": 1.800558542627717e-05,
"loss": 0.3623,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12233418971300125,
"step": 4905,
"valid_targets_mean": 10272.5,
"valid_targets_min": 2815
},
{
"epoch": 2.896755162241888,
"grad_norm": 0.17850264298888707,
"learning_rate": 1.7964604588973672e-05,
"loss": 0.369,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13789036870002747,
"step": 4910,
"valid_targets_mean": 11145.4,
"valid_targets_min": 818
},
{
"epoch": 2.8997050147492627,
"grad_norm": 0.17401095636087435,
"learning_rate": 1.792363238505101e-05,
"loss": 0.3614,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10849230736494064,
"step": 4915,
"valid_targets_mean": 9275.6,
"valid_targets_min": 1757
},
{
"epoch": 2.9026548672566372,
"grad_norm": 0.16868747509879806,
"learning_rate": 1.788266898829784e-05,
"loss": 0.3658,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12984463572502136,
"step": 4920,
"valid_targets_mean": 10562.0,
"valid_targets_min": 1778
},
{
"epoch": 2.905604719764012,
"grad_norm": 0.1713118209228475,
"learning_rate": 1.784171457246547e-05,
"loss": 0.364,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11977224051952362,
"step": 4925,
"valid_targets_mean": 9969.5,
"valid_targets_min": 1957
},
{
"epoch": 2.9085545722713864,
"grad_norm": 0.2051711163286173,
"learning_rate": 1.7800769311267097e-05,
"loss": 0.3661,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13498347997665405,
"step": 4930,
"valid_targets_mean": 10153.2,
"valid_targets_min": 2191
},
{
"epoch": 2.911504424778761,
"grad_norm": 0.182851398303451,
"learning_rate": 1.7759833378377115e-05,
"loss": 0.3723,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0971779078245163,
"step": 4935,
"valid_targets_mean": 8849.2,
"valid_targets_min": 324
},
{
"epoch": 2.9144542772861355,
"grad_norm": 0.16859808466952741,
"learning_rate": 1.771890694743032e-05,
"loss": 0.3673,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13063043355941772,
"step": 4940,
"valid_targets_mean": 10924.6,
"valid_targets_min": 2710
},
{
"epoch": 2.9174041297935105,
"grad_norm": 0.17589862305516682,
"learning_rate": 1.7677990192021233e-05,
"loss": 0.3691,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13488222658634186,
"step": 4945,
"valid_targets_mean": 11752.3,
"valid_targets_min": 1969
},
{
"epoch": 2.920353982300885,
"grad_norm": 0.19190635425255817,
"learning_rate": 1.7637083285703316e-05,
"loss": 0.3684,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14491617679595947,
"step": 4950,
"valid_targets_mean": 12698.6,
"valid_targets_min": 2768
},
{
"epoch": 2.9233038348082596,
"grad_norm": 0.17127630744296202,
"learning_rate": 1.759618640198826e-05,
"loss": 0.3706,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1178339272737503,
"step": 4955,
"valid_targets_mean": 10104.6,
"valid_targets_min": 1652
},
{
"epoch": 2.926253687315634,
"grad_norm": 0.17277595293584214,
"learning_rate": 1.755529971434524e-05,
"loss": 0.3713,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12804704904556274,
"step": 4960,
"valid_targets_mean": 11014.7,
"valid_targets_min": 1872
},
{
"epoch": 2.9292035398230087,
"grad_norm": 0.186889514672382,
"learning_rate": 1.7514423396200206e-05,
"loss": 0.3642,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12300354987382889,
"step": 4965,
"valid_targets_mean": 10039.7,
"valid_targets_min": 2777
},
{
"epoch": 2.9321533923303837,
"grad_norm": 0.1736172015814307,
"learning_rate": 1.7473557620935077e-05,
"loss": 0.3705,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13639748096466064,
"step": 4970,
"valid_targets_mean": 11453.5,
"valid_targets_min": 1275
},
{
"epoch": 2.935103244837758,
"grad_norm": 0.1787502910261031,
"learning_rate": 1.7432702561887114e-05,
"loss": 0.3719,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11030873656272888,
"step": 4975,
"valid_targets_mean": 8932.7,
"valid_targets_min": 1791
},
{
"epoch": 2.938053097345133,
"grad_norm": 0.18325247424037175,
"learning_rate": 1.7391858392348064e-05,
"loss": 0.3582,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12594400346279144,
"step": 4980,
"valid_targets_mean": 11101.6,
"valid_targets_min": 2707
},
{
"epoch": 2.9410029498525074,
"grad_norm": 0.1737878744545687,
"learning_rate": 1.7351025285563526e-05,
"loss": 0.3653,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1459430754184723,
"step": 4985,
"valid_targets_mean": 10862.0,
"valid_targets_min": 1591
},
{
"epoch": 2.943952802359882,
"grad_norm": 0.17763844955193459,
"learning_rate": 1.7310203414732167e-05,
"loss": 0.3653,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1361452341079712,
"step": 4990,
"valid_targets_mean": 10801.4,
"valid_targets_min": 1421
},
{
"epoch": 2.9469026548672566,
"grad_norm": 0.19567527222659836,
"learning_rate": 1.726939295300498e-05,
"loss": 0.3661,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11888530105352402,
"step": 4995,
"valid_targets_mean": 8929.9,
"valid_targets_min": 1203
},
{
"epoch": 2.949852507374631,
"grad_norm": 0.1729651318808521,
"learning_rate": 1.7228594073484584e-05,
"loss": 0.3722,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12663039565086365,
"step": 5000,
"valid_targets_mean": 10474.6,
"valid_targets_min": 1041
},
{
"epoch": 2.952802359882006,
"grad_norm": 0.177560869754914,
"learning_rate": 1.718780694922445e-05,
"loss": 0.3678,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10894748568534851,
"step": 5005,
"valid_targets_mean": 8967.3,
"valid_targets_min": 2401
},
{
"epoch": 2.9557522123893807,
"grad_norm": 0.1874803467578325,
"learning_rate": 1.7147031753228218e-05,
"loss": 0.3637,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1277991235256195,
"step": 5010,
"valid_targets_mean": 10507.0,
"valid_targets_min": 1811
},
{
"epoch": 2.9587020648967552,
"grad_norm": 0.2360296953225136,
"learning_rate": 1.7106268658448886e-05,
"loss": 0.3695,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10516766458749771,
"step": 5015,
"valid_targets_mean": 9101.4,
"valid_targets_min": 1896
},
{
"epoch": 2.96165191740413,
"grad_norm": 0.1951433840169243,
"learning_rate": 1.7065517837788183e-05,
"loss": 0.3655,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13209852576255798,
"step": 5020,
"valid_targets_mean": 11740.2,
"valid_targets_min": 1329
},
{
"epoch": 2.9646017699115044,
"grad_norm": 0.17905616793607196,
"learning_rate": 1.7024779464095717e-05,
"loss": 0.3664,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11057194322347641,
"step": 5025,
"valid_targets_mean": 8273.8,
"valid_targets_min": 1581
},
{
"epoch": 2.967551622418879,
"grad_norm": 0.18826370887418117,
"learning_rate": 1.6984053710168348e-05,
"loss": 0.368,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13581299781799316,
"step": 5030,
"valid_targets_mean": 10531.7,
"valid_targets_min": 2030
},
{
"epoch": 2.9705014749262535,
"grad_norm": 0.20867348643719316,
"learning_rate": 1.6943340748749367e-05,
"loss": 0.3617,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11186973750591278,
"step": 5035,
"valid_targets_mean": 8572.2,
"valid_targets_min": 1302
},
{
"epoch": 2.9734513274336285,
"grad_norm": 0.17361471549307683,
"learning_rate": 1.690264075252785e-05,
"loss": 0.3712,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12840047478675842,
"step": 5040,
"valid_targets_mean": 10365.0,
"valid_targets_min": 1880
},
{
"epoch": 2.976401179941003,
"grad_norm": 0.1737568252146911,
"learning_rate": 1.6861953894137832e-05,
"loss": 0.3733,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14282283186912537,
"step": 5045,
"valid_targets_mean": 11930.6,
"valid_targets_min": 1431
},
{
"epoch": 2.9793510324483776,
"grad_norm": 0.1905453510522682,
"learning_rate": 1.682128034615765e-05,
"loss": 0.3659,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12144088000059128,
"step": 5050,
"valid_targets_mean": 10015.8,
"valid_targets_min": 1439
},
{
"epoch": 2.982300884955752,
"grad_norm": 0.18806211439617518,
"learning_rate": 1.678062028110919e-05,
"loss": 0.3661,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13041338324546814,
"step": 5055,
"valid_targets_mean": 10110.8,
"valid_targets_min": 2130
},
{
"epoch": 2.9852507374631267,
"grad_norm": 0.17057233696793214,
"learning_rate": 1.6739973871457117e-05,
"loss": 0.3694,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11651427298784256,
"step": 5060,
"valid_targets_mean": 9938.6,
"valid_targets_min": 1395
},
{
"epoch": 2.9882005899705013,
"grad_norm": 0.19975824600519373,
"learning_rate": 1.6699341289608208e-05,
"loss": 0.3757,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15038277208805084,
"step": 5065,
"valid_targets_mean": 11508.6,
"valid_targets_min": 1832
},
{
"epoch": 2.991150442477876,
"grad_norm": 0.197023590973958,
"learning_rate": 1.665872270791056e-05,
"loss": 0.3635,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11097166687250137,
"step": 5070,
"valid_targets_mean": 9993.5,
"valid_targets_min": 2294
},
{
"epoch": 2.994100294985251,
"grad_norm": 0.18671541620967982,
"learning_rate": 1.6618118298652916e-05,
"loss": 0.3687,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14129869639873505,
"step": 5075,
"valid_targets_mean": 11300.2,
"valid_targets_min": 1578
},
{
"epoch": 2.9970501474926254,
"grad_norm": 0.18303216917284046,
"learning_rate": 1.6577528234063875e-05,
"loss": 0.3605,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12070619314908981,
"step": 5080,
"valid_targets_mean": 10239.3,
"valid_targets_min": 1636
},
{
"epoch": 3.0,
"grad_norm": 0.16870803400701356,
"learning_rate": 1.6536952686311224e-05,
"loss": 0.3644,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1085338443517685,
"step": 5085,
"valid_targets_mean": 9906.2,
"valid_targets_min": 1715
},
{
"epoch": 3.0029498525073746,
"grad_norm": 0.18072419280153204,
"learning_rate": 1.649639182750113e-05,
"loss": 0.3615,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1007838100194931,
"step": 5090,
"valid_targets_mean": 8127.4,
"valid_targets_min": 1551
},
{
"epoch": 3.005899705014749,
"grad_norm": 0.15411803854002304,
"learning_rate": 1.6455845829677505e-05,
"loss": 0.3554,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10417066514492035,
"step": 5095,
"valid_targets_mean": 11154.4,
"valid_targets_min": 1853
},
{
"epoch": 3.0088495575221237,
"grad_norm": 0.16448402874286094,
"learning_rate": 1.6415314864821188e-05,
"loss": 0.3669,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11009702831506729,
"step": 5100,
"valid_targets_mean": 10077.0,
"valid_targets_min": 2839
},
{
"epoch": 3.0117994100294987,
"grad_norm": 0.1629342663277792,
"learning_rate": 1.6374799104849277e-05,
"loss": 0.3632,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1320076584815979,
"step": 5105,
"valid_targets_mean": 11536.6,
"valid_targets_min": 1416
},
{
"epoch": 3.0147492625368733,
"grad_norm": 0.17706779013507282,
"learning_rate": 1.6334298721614366e-05,
"loss": 0.3679,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11719324439764023,
"step": 5110,
"valid_targets_mean": 9054.6,
"valid_targets_min": 2757
},
{
"epoch": 3.017699115044248,
"grad_norm": 0.16250629050829413,
"learning_rate": 1.6293813886903823e-05,
"loss": 0.3653,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08248552680015564,
"step": 5115,
"valid_targets_mean": 7162.3,
"valid_targets_min": 1845
},
{
"epoch": 3.0206489675516224,
"grad_norm": 0.1673905828249734,
"learning_rate": 1.6253344772439078e-05,
"loss": 0.3559,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12373922765254974,
"step": 5120,
"valid_targets_mean": 9473.3,
"valid_targets_min": 1920
},
{
"epoch": 3.023598820058997,
"grad_norm": 0.17125857977161707,
"learning_rate": 1.6212891549874867e-05,
"loss": 0.3592,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12039509415626526,
"step": 5125,
"valid_targets_mean": 9270.4,
"valid_targets_min": 1592
},
{
"epoch": 3.0265486725663715,
"grad_norm": 0.172291439074316,
"learning_rate": 1.617245439079854e-05,
"loss": 0.3698,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13650575280189514,
"step": 5130,
"valid_targets_mean": 11259.1,
"valid_targets_min": 1297
},
{
"epoch": 3.0294985250737465,
"grad_norm": 0.16609076305046538,
"learning_rate": 1.6132033466729283e-05,
"loss": 0.3598,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13094520568847656,
"step": 5135,
"valid_targets_mean": 10381.7,
"valid_targets_min": 2567
},
{
"epoch": 3.032448377581121,
"grad_norm": 0.18662285949967705,
"learning_rate": 1.609162894911745e-05,
"loss": 0.3679,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11098338663578033,
"step": 5140,
"valid_targets_mean": 8885.5,
"valid_targets_min": 2312
},
{
"epoch": 3.0353982300884956,
"grad_norm": 0.1648803495007328,
"learning_rate": 1.6051241009343765e-05,
"loss": 0.3706,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13519926369190216,
"step": 5145,
"valid_targets_mean": 11761.5,
"valid_targets_min": 2617
},
{
"epoch": 3.03834808259587,
"grad_norm": 0.1687028365758394,
"learning_rate": 1.601086981871868e-05,
"loss": 0.3624,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12321673333644867,
"step": 5150,
"valid_targets_mean": 10408.8,
"valid_targets_min": 1710
},
{
"epoch": 3.0412979351032448,
"grad_norm": 0.17926476212590314,
"learning_rate": 1.597051554848158e-05,
"loss": 0.3652,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12310653924942017,
"step": 5155,
"valid_targets_mean": 9813.8,
"valid_targets_min": 2186
},
{
"epoch": 3.0442477876106193,
"grad_norm": 0.16155502872177424,
"learning_rate": 1.593017836980007e-05,
"loss": 0.3637,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10764841735363007,
"step": 5160,
"valid_targets_mean": 9058.5,
"valid_targets_min": 2561
},
{
"epoch": 3.047197640117994,
"grad_norm": 0.16579859522052634,
"learning_rate": 1.588985845376928e-05,
"loss": 0.3695,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14767128229141235,
"step": 5165,
"valid_targets_mean": 12223.3,
"valid_targets_min": 2051
},
{
"epoch": 3.050147492625369,
"grad_norm": 0.1855108695222736,
"learning_rate": 1.584955597141111e-05,
"loss": 0.3609,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13401386141777039,
"step": 5170,
"valid_targets_mean": 11200.6,
"valid_targets_min": 1879
},
{
"epoch": 3.0530973451327434,
"grad_norm": 0.17007622797255426,
"learning_rate": 1.580927109367351e-05,
"loss": 0.3683,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11102022230625153,
"step": 5175,
"valid_targets_mean": 10038.4,
"valid_targets_min": 2566
},
{
"epoch": 3.056047197640118,
"grad_norm": 0.19256034755210089,
"learning_rate": 1.5769003991429773e-05,
"loss": 0.3672,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1243845671415329,
"step": 5180,
"valid_targets_mean": 9665.2,
"valid_targets_min": 1763
},
{
"epoch": 3.0589970501474926,
"grad_norm": 0.18192539127795151,
"learning_rate": 1.5728754835477763e-05,
"loss": 0.3602,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12346881628036499,
"step": 5185,
"valid_targets_mean": 9427.3,
"valid_targets_min": 1939
},
{
"epoch": 3.061946902654867,
"grad_norm": 0.18276321434981857,
"learning_rate": 1.568852379653925e-05,
"loss": 0.3655,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13931599259376526,
"step": 5190,
"valid_targets_mean": 10823.2,
"valid_targets_min": 1001
},
{
"epoch": 3.0648967551622417,
"grad_norm": 0.18096595886413822,
"learning_rate": 1.5648311045259156e-05,
"loss": 0.3661,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11066380143165588,
"step": 5195,
"valid_targets_mean": 8042.4,
"valid_targets_min": 1638
},
{
"epoch": 3.0678466076696167,
"grad_norm": 0.18094107164281462,
"learning_rate": 1.5608116752204828e-05,
"loss": 0.3594,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11712948232889175,
"step": 5200,
"valid_targets_mean": 9074.4,
"valid_targets_min": 1475
},
{
"epoch": 3.0707964601769913,
"grad_norm": 0.17043468207653303,
"learning_rate": 1.5567941087865315e-05,
"loss": 0.3698,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14815612137317657,
"step": 5205,
"valid_targets_mean": 11863.6,
"valid_targets_min": 2660
},
{
"epoch": 3.073746312684366,
"grad_norm": 0.16707843868690472,
"learning_rate": 1.5527784222650654e-05,
"loss": 0.3714,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10225613415241241,
"step": 5210,
"valid_targets_mean": 8764.0,
"valid_targets_min": 1401
},
{
"epoch": 3.0766961651917404,
"grad_norm": 0.17086362845957914,
"learning_rate": 1.5487646326891156e-05,
"loss": 0.3603,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11746655404567719,
"step": 5215,
"valid_targets_mean": 8993.1,
"valid_targets_min": 1661
},
{
"epoch": 3.079646017699115,
"grad_norm": 0.17306648583138773,
"learning_rate": 1.5447527570836646e-05,
"loss": 0.3699,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16646556556224823,
"step": 5220,
"valid_targets_mean": 12450.0,
"valid_targets_min": 2341
},
{
"epoch": 3.0825958702064895,
"grad_norm": 0.2517036739097649,
"learning_rate": 1.5407428124655793e-05,
"loss": 0.3662,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11005858331918716,
"step": 5225,
"valid_targets_mean": 9356.4,
"valid_targets_min": 2251
},
{
"epoch": 3.0855457227138645,
"grad_norm": 0.17036008905978894,
"learning_rate": 1.536734815843533e-05,
"loss": 0.3562,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13720500469207764,
"step": 5230,
"valid_targets_mean": 10593.5,
"valid_targets_min": 2311
},
{
"epoch": 3.088495575221239,
"grad_norm": 0.1741623626944122,
"learning_rate": 1.5327287842179393e-05,
"loss": 0.3631,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12113802134990692,
"step": 5235,
"valid_targets_mean": 11272.2,
"valid_targets_min": 2072
},
{
"epoch": 3.0914454277286136,
"grad_norm": 0.16679691239324818,
"learning_rate": 1.5287247345808753e-05,
"loss": 0.3684,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11631931364536285,
"step": 5240,
"valid_targets_mean": 10755.2,
"valid_targets_min": 2573
},
{
"epoch": 3.094395280235988,
"grad_norm": 0.17445815348061394,
"learning_rate": 1.5247226839160123e-05,
"loss": 0.3662,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13419607281684875,
"step": 5245,
"valid_targets_mean": 11588.6,
"valid_targets_min": 1224
},
{
"epoch": 3.0973451327433628,
"grad_norm": 0.19235039716576158,
"learning_rate": 1.5207226491985408e-05,
"loss": 0.3673,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12204791605472565,
"step": 5250,
"valid_targets_mean": 10232.4,
"valid_targets_min": 1085
},
{
"epoch": 3.1002949852507373,
"grad_norm": 0.16580047720364316,
"learning_rate": 1.5167246473951033e-05,
"loss": 0.3685,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12935838103294373,
"step": 5255,
"valid_targets_mean": 11208.1,
"valid_targets_min": 1385
},
{
"epoch": 3.103244837758112,
"grad_norm": 0.16982903541829203,
"learning_rate": 1.5127286954637162e-05,
"loss": 0.369,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1330590546131134,
"step": 5260,
"valid_targets_mean": 11080.8,
"valid_targets_min": 1637
},
{
"epoch": 3.106194690265487,
"grad_norm": 0.17281557035552203,
"learning_rate": 1.5087348103537037e-05,
"loss": 0.3564,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10759001970291138,
"step": 5265,
"valid_targets_mean": 9888.8,
"valid_targets_min": 2043
},
{
"epoch": 3.1091445427728615,
"grad_norm": 0.1761369685053977,
"learning_rate": 1.504743009005623e-05,
"loss": 0.3682,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14634013175964355,
"step": 5270,
"valid_targets_mean": 11535.3,
"valid_targets_min": 2343
},
{
"epoch": 3.112094395280236,
"grad_norm": 0.16417048428949194,
"learning_rate": 1.5007533083511907e-05,
"loss": 0.3659,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1197446882724762,
"step": 5275,
"valid_targets_mean": 9942.7,
"valid_targets_min": 1725
},
{
"epoch": 3.1150442477876106,
"grad_norm": 0.15378812401178915,
"learning_rate": 1.4967657253132157e-05,
"loss": 0.3585,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10902900993824005,
"step": 5280,
"valid_targets_mean": 9485.1,
"valid_targets_min": 2381
},
{
"epoch": 3.117994100294985,
"grad_norm": 0.16069117781194026,
"learning_rate": 1.4927802768055228e-05,
"loss": 0.363,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13259164988994598,
"step": 5285,
"valid_targets_mean": 11853.2,
"valid_targets_min": 2085
},
{
"epoch": 3.1209439528023597,
"grad_norm": 0.1694320573562657,
"learning_rate": 1.488796979732885e-05,
"loss": 0.3666,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12871789932250977,
"step": 5290,
"valid_targets_mean": 11962.8,
"valid_targets_min": 2572
},
{
"epoch": 3.1238938053097347,
"grad_norm": 0.16505966881946538,
"learning_rate": 1.4848158509909465e-05,
"loss": 0.3687,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15198102593421936,
"step": 5295,
"valid_targets_mean": 13259.6,
"valid_targets_min": 1574
},
{
"epoch": 3.1268436578171093,
"grad_norm": 0.17879388520449493,
"learning_rate": 1.480836907466158e-05,
"loss": 0.3652,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10954461991786957,
"step": 5300,
"valid_targets_mean": 8538.3,
"valid_targets_min": 3063
},
{
"epoch": 3.129793510324484,
"grad_norm": 0.19905872823764165,
"learning_rate": 1.4768601660356981e-05,
"loss": 0.3666,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11861936748027802,
"step": 5305,
"valid_targets_mean": 9845.7,
"valid_targets_min": 1576
},
{
"epoch": 3.1327433628318584,
"grad_norm": 0.17338452190584372,
"learning_rate": 1.4728856435674073e-05,
"loss": 0.3606,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1204066053032875,
"step": 5310,
"valid_targets_mean": 10769.1,
"valid_targets_min": 1379
},
{
"epoch": 3.135693215339233,
"grad_norm": 0.1665094296724231,
"learning_rate": 1.468913356919713e-05,
"loss": 0.3681,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12827160954475403,
"step": 5315,
"valid_targets_mean": 11192.5,
"valid_targets_min": 2772
},
{
"epoch": 3.1386430678466075,
"grad_norm": 0.17163264744974516,
"learning_rate": 1.4649433229415588e-05,
"loss": 0.365,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12414673715829849,
"step": 5320,
"valid_targets_mean": 10055.3,
"valid_targets_min": 2891
},
{
"epoch": 3.1415929203539825,
"grad_norm": 0.16476755230856108,
"learning_rate": 1.4609755584723337e-05,
"loss": 0.3693,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12396431714296341,
"step": 5325,
"valid_targets_mean": 10126.3,
"valid_targets_min": 2399
},
{
"epoch": 3.144542772861357,
"grad_norm": 0.16898117291359036,
"learning_rate": 1.4570100803418007e-05,
"loss": 0.3643,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11845681071281433,
"step": 5330,
"valid_targets_mean": 10440.6,
"valid_targets_min": 2024
},
{
"epoch": 3.1474926253687316,
"grad_norm": 0.19387693997806396,
"learning_rate": 1.453046905370026e-05,
"loss": 0.3637,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.125502347946167,
"step": 5335,
"valid_targets_mean": 9680.2,
"valid_targets_min": 2135
},
{
"epoch": 3.150442477876106,
"grad_norm": 0.16587740191579503,
"learning_rate": 1.449086050367303e-05,
"loss": 0.3668,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11140230298042297,
"step": 5340,
"valid_targets_mean": 10028.0,
"valid_targets_min": 2571
},
{
"epoch": 3.1533923303834808,
"grad_norm": 0.17288688854657777,
"learning_rate": 1.445127532134089e-05,
"loss": 0.3575,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12293601781129837,
"step": 5345,
"valid_targets_mean": 9146.0,
"valid_targets_min": 1782
},
{
"epoch": 3.1563421828908553,
"grad_norm": 0.16196207264850515,
"learning_rate": 1.4411713674609257e-05,
"loss": 0.3626,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10983482003211975,
"step": 5350,
"valid_targets_mean": 10024.1,
"valid_targets_min": 1820
},
{
"epoch": 3.15929203539823,
"grad_norm": 0.17745654941894476,
"learning_rate": 1.4372175731283755e-05,
"loss": 0.3706,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10657268762588501,
"step": 5355,
"valid_targets_mean": 9066.4,
"valid_targets_min": 1758
},
{
"epoch": 3.162241887905605,
"grad_norm": 0.17093813404945338,
"learning_rate": 1.4332661659069444e-05,
"loss": 0.3617,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11457949876785278,
"step": 5360,
"valid_targets_mean": 11200.9,
"valid_targets_min": 1825
},
{
"epoch": 3.1651917404129795,
"grad_norm": 0.16284984460105134,
"learning_rate": 1.4293171625570135e-05,
"loss": 0.3633,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10767051577568054,
"step": 5365,
"valid_targets_mean": 9578.0,
"valid_targets_min": 969
},
{
"epoch": 3.168141592920354,
"grad_norm": 0.1672772887572211,
"learning_rate": 1.4253705798287677e-05,
"loss": 0.3673,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10364119708538055,
"step": 5370,
"valid_targets_mean": 8988.4,
"valid_targets_min": 1622
},
{
"epoch": 3.1710914454277286,
"grad_norm": 0.1716741515555153,
"learning_rate": 1.4214264344621262e-05,
"loss": 0.3659,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11365842074155807,
"step": 5375,
"valid_targets_mean": 8939.7,
"valid_targets_min": 2704
},
{
"epoch": 3.174041297935103,
"grad_norm": 0.1756823532541479,
"learning_rate": 1.4174847431866665e-05,
"loss": 0.3599,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11407135426998138,
"step": 5380,
"valid_targets_mean": 11132.0,
"valid_targets_min": 1617
},
{
"epoch": 3.1769911504424777,
"grad_norm": 0.16762380566161988,
"learning_rate": 1.4135455227215603e-05,
"loss": 0.369,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11980577558279037,
"step": 5385,
"valid_targets_mean": 10267.6,
"valid_targets_min": 2290
},
{
"epoch": 3.1799410029498527,
"grad_norm": 0.16270258722311065,
"learning_rate": 1.4096087897754954e-05,
"loss": 0.365,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10883092880249023,
"step": 5390,
"valid_targets_mean": 11235.0,
"valid_targets_min": 1714
},
{
"epoch": 3.1828908554572273,
"grad_norm": 0.19664867619345416,
"learning_rate": 1.4056745610466119e-05,
"loss": 0.3709,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1180739551782608,
"step": 5395,
"valid_targets_mean": 9939.6,
"valid_targets_min": 1119
},
{
"epoch": 3.185840707964602,
"grad_norm": 0.16986561951035176,
"learning_rate": 1.4017428532224256e-05,
"loss": 0.3702,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12023471295833588,
"step": 5400,
"valid_targets_mean": 9699.6,
"valid_targets_min": 1382
},
{
"epoch": 3.1887905604719764,
"grad_norm": 0.16401247342669617,
"learning_rate": 1.3978136829797615e-05,
"loss": 0.3654,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11187541484832764,
"step": 5405,
"valid_targets_mean": 9500.3,
"valid_targets_min": 2101
},
{
"epoch": 3.191740412979351,
"grad_norm": 0.17203129490880129,
"learning_rate": 1.3938870669846793e-05,
"loss": 0.3661,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11447340250015259,
"step": 5410,
"valid_targets_mean": 10089.6,
"valid_targets_min": 2019
},
{
"epoch": 3.1946902654867255,
"grad_norm": 0.16112318127681288,
"learning_rate": 1.3899630218924055e-05,
"loss": 0.3652,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12341278791427612,
"step": 5415,
"valid_targets_mean": 11681.5,
"valid_targets_min": 2765
},
{
"epoch": 3.1976401179941005,
"grad_norm": 0.1652986251915982,
"learning_rate": 1.3860415643472625e-05,
"loss": 0.3672,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09924346208572388,
"step": 5420,
"valid_targets_mean": 9450.3,
"valid_targets_min": 1236
},
{
"epoch": 3.200589970501475,
"grad_norm": 0.17009722063486218,
"learning_rate": 1.3821227109825946e-05,
"loss": 0.3645,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12092237919569016,
"step": 5425,
"valid_targets_mean": 10375.5,
"valid_targets_min": 1709
},
{
"epoch": 3.2035398230088497,
"grad_norm": 0.18484989650554937,
"learning_rate": 1.3782064784207041e-05,
"loss": 0.3638,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10624641180038452,
"step": 5430,
"valid_targets_mean": 7647.3,
"valid_targets_min": 1474
},
{
"epoch": 3.206489675516224,
"grad_norm": 0.15974643344864622,
"learning_rate": 1.3742928832727726e-05,
"loss": 0.3648,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09058540314435959,
"step": 5435,
"valid_targets_mean": 7829.2,
"valid_targets_min": 1407
},
{
"epoch": 3.2094395280235988,
"grad_norm": 0.18499061576038137,
"learning_rate": 1.3703819421387988e-05,
"loss": 0.3669,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10127178579568863,
"step": 5440,
"valid_targets_mean": 8146.3,
"valid_targets_min": 2212
},
{
"epoch": 3.2123893805309733,
"grad_norm": 0.17670280789378795,
"learning_rate": 1.366473671607521e-05,
"loss": 0.3657,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14998787641525269,
"step": 5445,
"valid_targets_mean": 12941.1,
"valid_targets_min": 1757
},
{
"epoch": 3.215339233038348,
"grad_norm": 0.17641480449937122,
"learning_rate": 1.3625680882563517e-05,
"loss": 0.3726,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11825121939182281,
"step": 5450,
"valid_targets_mean": 10206.6,
"valid_targets_min": 2056
},
{
"epoch": 3.218289085545723,
"grad_norm": 0.17433353100016663,
"learning_rate": 1.3586652086513038e-05,
"loss": 0.359,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12670403718948364,
"step": 5455,
"valid_targets_mean": 9321.0,
"valid_targets_min": 2443
},
{
"epoch": 3.2212389380530975,
"grad_norm": 0.17405182564049818,
"learning_rate": 1.3547650493469244e-05,
"loss": 0.3658,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14105822145938873,
"step": 5460,
"valid_targets_mean": 11845.5,
"valid_targets_min": 1503
},
{
"epoch": 3.224188790560472,
"grad_norm": 0.17630323471438666,
"learning_rate": 1.3508676268862187e-05,
"loss": 0.3679,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12641315162181854,
"step": 5465,
"valid_targets_mean": 10094.4,
"valid_targets_min": 1091
},
{
"epoch": 3.2271386430678466,
"grad_norm": 0.17724466941372247,
"learning_rate": 1.3469729578005858e-05,
"loss": 0.3672,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12962406873703003,
"step": 5470,
"valid_targets_mean": 9290.2,
"valid_targets_min": 2482
},
{
"epoch": 3.230088495575221,
"grad_norm": 0.17295330887453264,
"learning_rate": 1.3430810586097462e-05,
"loss": 0.368,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12997081875801086,
"step": 5475,
"valid_targets_mean": 10670.7,
"valid_targets_min": 1532
},
{
"epoch": 3.2330383480825957,
"grad_norm": 0.1868078668062745,
"learning_rate": 1.339191945821669e-05,
"loss": 0.3635,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13852176070213318,
"step": 5480,
"valid_targets_mean": 11688.2,
"valid_targets_min": 1261
},
{
"epoch": 3.2359882005899703,
"grad_norm": 0.15959566606879444,
"learning_rate": 1.3353056359325072e-05,
"loss": 0.3648,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12794829905033112,
"step": 5485,
"valid_targets_mean": 10035.3,
"valid_targets_min": 1364
},
{
"epoch": 3.2389380530973453,
"grad_norm": 0.1671205820811924,
"learning_rate": 1.3314221454265233e-05,
"loss": 0.3675,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10383822023868561,
"step": 5490,
"valid_targets_mean": 8238.5,
"valid_targets_min": 1363
},
{
"epoch": 3.24188790560472,
"grad_norm": 0.1768265159476027,
"learning_rate": 1.3275414907760222e-05,
"loss": 0.3706,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13004903495311737,
"step": 5495,
"valid_targets_mean": 10542.8,
"valid_targets_min": 1877
},
{
"epoch": 3.2448377581120944,
"grad_norm": 0.1695460964551601,
"learning_rate": 1.3236636884412785e-05,
"loss": 0.3613,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10654259473085403,
"step": 5500,
"valid_targets_mean": 10243.8,
"valid_targets_min": 2529
},
{
"epoch": 3.247787610619469,
"grad_norm": 0.15806011542943854,
"learning_rate": 1.3197887548704706e-05,
"loss": 0.3662,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10573803633451462,
"step": 5505,
"valid_targets_mean": 9045.6,
"valid_targets_min": 2196
},
{
"epoch": 3.2507374631268435,
"grad_norm": 0.16394676727838023,
"learning_rate": 1.3159167064996064e-05,
"loss": 0.3623,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14225220680236816,
"step": 5510,
"valid_targets_mean": 10520.3,
"valid_targets_min": 2974
},
{
"epoch": 3.2536873156342185,
"grad_norm": 0.17557994335059957,
"learning_rate": 1.3120475597524575e-05,
"loss": 0.3615,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1023373156785965,
"step": 5515,
"valid_targets_mean": 8490.1,
"valid_targets_min": 1698
},
{
"epoch": 3.256637168141593,
"grad_norm": 0.1772121802620938,
"learning_rate": 1.3081813310404872e-05,
"loss": 0.3621,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12516672909259796,
"step": 5520,
"valid_targets_mean": 10266.6,
"valid_targets_min": 2086
},
{
"epoch": 3.2595870206489677,
"grad_norm": 0.16860638201476127,
"learning_rate": 1.3043180367627816e-05,
"loss": 0.3628,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10529131442308426,
"step": 5525,
"valid_targets_mean": 8899.9,
"valid_targets_min": 1091
},
{
"epoch": 3.262536873156342,
"grad_norm": 0.16809946742678483,
"learning_rate": 1.30045769330598e-05,
"loss": 0.3631,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13498874008655548,
"step": 5530,
"valid_targets_mean": 12777.8,
"valid_targets_min": 2085
},
{
"epoch": 3.265486725663717,
"grad_norm": 0.1664783405579296,
"learning_rate": 1.2966003170442068e-05,
"loss": 0.368,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10611608624458313,
"step": 5535,
"valid_targets_mean": 8542.1,
"valid_targets_min": 1275
},
{
"epoch": 3.2684365781710913,
"grad_norm": 0.17522851488020888,
"learning_rate": 1.2927459243389976e-05,
"loss": 0.3725,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11877696961164474,
"step": 5540,
"valid_targets_mean": 9471.2,
"valid_targets_min": 1875
},
{
"epoch": 3.271386430678466,
"grad_norm": 0.1740811217541218,
"learning_rate": 1.2888945315392358e-05,
"loss": 0.3589,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12354566901922226,
"step": 5545,
"valid_targets_mean": 9979.3,
"valid_targets_min": 2317
},
{
"epoch": 3.274336283185841,
"grad_norm": 0.1855988907885218,
"learning_rate": 1.28504615498108e-05,
"loss": 0.3668,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10054697096347809,
"step": 5550,
"valid_targets_mean": 7764.0,
"valid_targets_min": 1398
},
{
"epoch": 3.2772861356932155,
"grad_norm": 0.17877226686806805,
"learning_rate": 1.2812008109878925e-05,
"loss": 0.3634,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11428143084049225,
"step": 5555,
"valid_targets_mean": 8935.4,
"valid_targets_min": 1626
},
{
"epoch": 3.28023598820059,
"grad_norm": 0.16683919827362095,
"learning_rate": 1.277358515870176e-05,
"loss": 0.3571,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1391943246126175,
"step": 5560,
"valid_targets_mean": 11983.7,
"valid_targets_min": 2161
},
{
"epoch": 3.2831858407079646,
"grad_norm": 0.18749132103457708,
"learning_rate": 1.2735192859254988e-05,
"loss": 0.3655,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12208181619644165,
"step": 5565,
"valid_targets_mean": 9960.0,
"valid_targets_min": 1896
},
{
"epoch": 3.286135693215339,
"grad_norm": 0.17707993776381883,
"learning_rate": 1.2696831374384287e-05,
"loss": 0.3644,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11540719121694565,
"step": 5570,
"valid_targets_mean": 9256.6,
"valid_targets_min": 1791
},
{
"epoch": 3.2890855457227137,
"grad_norm": 0.16692477088106328,
"learning_rate": 1.2658500866804622e-05,
"loss": 0.3675,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12894247472286224,
"step": 5575,
"valid_targets_mean": 10841.3,
"valid_targets_min": 1796
},
{
"epoch": 3.2920353982300883,
"grad_norm": 0.15885310521115004,
"learning_rate": 1.2620201499099588e-05,
"loss": 0.3636,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1357426792383194,
"step": 5580,
"valid_targets_mean": 11841.5,
"valid_targets_min": 2575
},
{
"epoch": 3.2949852507374633,
"grad_norm": 0.18151023028453872,
"learning_rate": 1.2581933433720658e-05,
"loss": 0.3636,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1206400990486145,
"step": 5585,
"valid_targets_mean": 9533.8,
"valid_targets_min": 1760
},
{
"epoch": 3.297935103244838,
"grad_norm": 0.1576662184734288,
"learning_rate": 1.2543696832986577e-05,
"loss": 0.3555,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12325617671012878,
"step": 5590,
"valid_targets_mean": 11093.8,
"valid_targets_min": 2478
},
{
"epoch": 3.3008849557522124,
"grad_norm": 0.16248650260323072,
"learning_rate": 1.2505491859082585e-05,
"loss": 0.364,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14523741602897644,
"step": 5595,
"valid_targets_mean": 12308.4,
"valid_targets_min": 2441
},
{
"epoch": 3.303834808259587,
"grad_norm": 0.1697568324931673,
"learning_rate": 1.2467318674059808e-05,
"loss": 0.3645,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13691668212413788,
"step": 5600,
"valid_targets_mean": 10976.5,
"valid_targets_min": 2610
},
{
"epoch": 3.3067846607669615,
"grad_norm": 0.1561936447555479,
"learning_rate": 1.2429177439834512e-05,
"loss": 0.3678,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1259647160768509,
"step": 5605,
"valid_targets_mean": 10802.3,
"valid_targets_min": 1914
},
{
"epoch": 3.309734513274336,
"grad_norm": 0.15423817220564448,
"learning_rate": 1.2391068318187459e-05,
"loss": 0.3627,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12037042528390884,
"step": 5610,
"valid_targets_mean": 11692.9,
"valid_targets_min": 2256
},
{
"epoch": 3.312684365781711,
"grad_norm": 0.16888848959955774,
"learning_rate": 1.2352991470763184e-05,
"loss": 0.3637,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09414775669574738,
"step": 5615,
"valid_targets_mean": 7951.5,
"valid_targets_min": 2257
},
{
"epoch": 3.3156342182890857,
"grad_norm": 0.16908333147958188,
"learning_rate": 1.2314947059069335e-05,
"loss": 0.3617,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11395449936389923,
"step": 5620,
"valid_targets_mean": 8913.4,
"valid_targets_min": 2553
},
{
"epoch": 3.3185840707964602,
"grad_norm": 0.1651710524663912,
"learning_rate": 1.227693524447599e-05,
"loss": 0.3657,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11249791085720062,
"step": 5625,
"valid_targets_mean": 10005.8,
"valid_targets_min": 1375
},
{
"epoch": 3.321533923303835,
"grad_norm": 0.17144720901775296,
"learning_rate": 1.2238956188214936e-05,
"loss": 0.3596,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14235293865203857,
"step": 5630,
"valid_targets_mean": 11095.1,
"valid_targets_min": 3126
},
{
"epoch": 3.3244837758112094,
"grad_norm": 0.16362249587364253,
"learning_rate": 1.2201010051379043e-05,
"loss": 0.3694,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12004884332418442,
"step": 5635,
"valid_targets_mean": 9365.7,
"valid_targets_min": 1396
},
{
"epoch": 3.327433628318584,
"grad_norm": 0.16857686837608443,
"learning_rate": 1.2163096994921518e-05,
"loss": 0.3696,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1059444323182106,
"step": 5640,
"valid_targets_mean": 9492.3,
"valid_targets_min": 1480
},
{
"epoch": 3.330383480825959,
"grad_norm": 0.1597626038930533,
"learning_rate": 1.2125217179655278e-05,
"loss": 0.3644,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11164246499538422,
"step": 5645,
"valid_targets_mean": 9468.8,
"valid_targets_min": 1678
},
{
"epoch": 3.3333333333333335,
"grad_norm": 0.1792298222255779,
"learning_rate": 1.2087370766252228e-05,
"loss": 0.3655,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13133028149604797,
"step": 5650,
"valid_targets_mean": 10842.1,
"valid_targets_min": 1206
},
{
"epoch": 3.336283185840708,
"grad_norm": 0.18065578316617883,
"learning_rate": 1.2049557915242616e-05,
"loss": 0.3627,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13570484519004822,
"step": 5655,
"valid_targets_mean": 10905.9,
"valid_targets_min": 1230
},
{
"epoch": 3.3392330383480826,
"grad_norm": 0.16218754902076543,
"learning_rate": 1.2011778787014297e-05,
"loss": 0.3666,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10976435244083405,
"step": 5660,
"valid_targets_mean": 9180.0,
"valid_targets_min": 1869
},
{
"epoch": 3.342182890855457,
"grad_norm": 0.16358824521292456,
"learning_rate": 1.1974033541812124e-05,
"loss": 0.3594,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13786596059799194,
"step": 5665,
"valid_targets_mean": 11668.7,
"valid_targets_min": 2090
},
{
"epoch": 3.3451327433628317,
"grad_norm": 0.17494440281924994,
"learning_rate": 1.1936322339737193e-05,
"loss": 0.3629,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13460367918014526,
"step": 5670,
"valid_targets_mean": 10886.5,
"valid_targets_min": 2834
},
{
"epoch": 3.3480825958702063,
"grad_norm": 0.18096806292604525,
"learning_rate": 1.1898645340746242e-05,
"loss": 0.3557,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1231859102845192,
"step": 5675,
"valid_targets_mean": 9843.6,
"valid_targets_min": 1609
},
{
"epoch": 3.3510324483775813,
"grad_norm": 0.1659915993499302,
"learning_rate": 1.1861002704650897e-05,
"loss": 0.3689,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11928001046180725,
"step": 5680,
"valid_targets_mean": 10241.2,
"valid_targets_min": 2562
},
{
"epoch": 3.353982300884956,
"grad_norm": 0.1735036326764437,
"learning_rate": 1.1823394591117048e-05,
"loss": 0.3613,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12572640180587769,
"step": 5685,
"valid_targets_mean": 10534.2,
"valid_targets_min": 1480
},
{
"epoch": 3.3569321533923304,
"grad_norm": 0.16324620999370973,
"learning_rate": 1.1785821159664158e-05,
"loss": 0.3595,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12011720985174179,
"step": 5690,
"valid_targets_mean": 11762.8,
"valid_targets_min": 2092
},
{
"epoch": 3.359882005899705,
"grad_norm": 0.1612218314865116,
"learning_rate": 1.174828256966456e-05,
"loss": 0.3553,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11624462157487869,
"step": 5695,
"valid_targets_mean": 11185.9,
"valid_targets_min": 1579
},
{
"epoch": 3.3628318584070795,
"grad_norm": 0.16525818633723133,
"learning_rate": 1.1710778980342834e-05,
"loss": 0.3725,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12180322408676147,
"step": 5700,
"valid_targets_mean": 9581.1,
"valid_targets_min": 2162
},
{
"epoch": 3.365781710914454,
"grad_norm": 0.17000114316124038,
"learning_rate": 1.1673310550775066e-05,
"loss": 0.3652,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11625468730926514,
"step": 5705,
"valid_targets_mean": 10227.8,
"valid_targets_min": 832
},
{
"epoch": 3.3687315634218287,
"grad_norm": 0.16674908078453304,
"learning_rate": 1.1635877439888232e-05,
"loss": 0.3649,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15849077701568604,
"step": 5710,
"valid_targets_mean": 11126.4,
"valid_targets_min": 1768
},
{
"epoch": 3.3716814159292037,
"grad_norm": 0.16244915053131123,
"learning_rate": 1.1598479806459493e-05,
"loss": 0.3708,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11129726469516754,
"step": 5715,
"valid_targets_mean": 10253.1,
"valid_targets_min": 2074
},
{
"epoch": 3.3746312684365782,
"grad_norm": 0.1720907804169401,
"learning_rate": 1.1561117809115522e-05,
"loss": 0.3603,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12222810089588165,
"step": 5720,
"valid_targets_mean": 10034.1,
"valid_targets_min": 2135
},
{
"epoch": 3.377581120943953,
"grad_norm": 0.16006227650596366,
"learning_rate": 1.1523791606331844e-05,
"loss": 0.3722,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12712764739990234,
"step": 5725,
"valid_targets_mean": 11439.1,
"valid_targets_min": 1921
},
{
"epoch": 3.3805309734513274,
"grad_norm": 0.1844916337446282,
"learning_rate": 1.1486501356432157e-05,
"loss": 0.3576,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12447535246610641,
"step": 5730,
"valid_targets_mean": 9926.1,
"valid_targets_min": 2217
},
{
"epoch": 3.383480825958702,
"grad_norm": 0.17250265514425828,
"learning_rate": 1.1449247217587654e-05,
"loss": 0.363,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12348814308643341,
"step": 5735,
"valid_targets_mean": 10439.4,
"valid_targets_min": 2181
},
{
"epoch": 3.386430678466077,
"grad_norm": 0.17414640085174973,
"learning_rate": 1.1412029347816364e-05,
"loss": 0.3656,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12620124220848083,
"step": 5740,
"valid_targets_mean": 10171.7,
"valid_targets_min": 1676
},
{
"epoch": 3.3893805309734515,
"grad_norm": 0.17188785739593934,
"learning_rate": 1.1374847904982476e-05,
"loss": 0.3629,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11639649420976639,
"step": 5745,
"valid_targets_mean": 9770.0,
"valid_targets_min": 1417
},
{
"epoch": 3.392330383480826,
"grad_norm": 0.16379536749749107,
"learning_rate": 1.1337703046795658e-05,
"loss": 0.3645,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13657310605049133,
"step": 5750,
"valid_targets_mean": 11708.1,
"valid_targets_min": 1751
},
{
"epoch": 3.3952802359882006,
"grad_norm": 0.1835047259245895,
"learning_rate": 1.1300594930810428e-05,
"loss": 0.3668,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1326453983783722,
"step": 5755,
"valid_targets_mean": 10102.0,
"valid_targets_min": 1956
},
{
"epoch": 3.398230088495575,
"grad_norm": 0.1606630887122043,
"learning_rate": 1.1263523714425433e-05,
"loss": 0.3671,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11090432107448578,
"step": 5760,
"valid_targets_mean": 10676.0,
"valid_targets_min": 805
},
{
"epoch": 3.4011799410029497,
"grad_norm": 0.17060284412602886,
"learning_rate": 1.1226489554882808e-05,
"loss": 0.3663,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12317381799221039,
"step": 5765,
"valid_targets_mean": 11039.3,
"valid_targets_min": 2536
},
{
"epoch": 3.4041297935103243,
"grad_norm": 0.18149054238359424,
"learning_rate": 1.1189492609267518e-05,
"loss": 0.3661,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12160060554742813,
"step": 5770,
"valid_targets_mean": 9479.5,
"valid_targets_min": 1980
},
{
"epoch": 3.4070796460176993,
"grad_norm": 0.15777568100406267,
"learning_rate": 1.1152533034506668e-05,
"loss": 0.3693,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12296357750892639,
"step": 5775,
"valid_targets_mean": 10496.0,
"valid_targets_min": 2590
},
{
"epoch": 3.410029498525074,
"grad_norm": 0.17773974058522804,
"learning_rate": 1.1115610987368858e-05,
"loss": 0.3677,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1567886620759964,
"step": 5780,
"valid_targets_mean": 11851.6,
"valid_targets_min": 1998
},
{
"epoch": 3.4129793510324484,
"grad_norm": 0.15238485468696308,
"learning_rate": 1.1078726624463504e-05,
"loss": 0.3595,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10325300693511963,
"step": 5785,
"valid_targets_mean": 9576.4,
"valid_targets_min": 1763
},
{
"epoch": 3.415929203539823,
"grad_norm": 0.15714087387831013,
"learning_rate": 1.1041880102240184e-05,
"loss": 0.3658,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10524867475032806,
"step": 5790,
"valid_targets_mean": 8958.1,
"valid_targets_min": 1310
},
{
"epoch": 3.4188790560471976,
"grad_norm": 0.16033185917374054,
"learning_rate": 1.1005071576987984e-05,
"loss": 0.3631,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12304713577032089,
"step": 5795,
"valid_targets_mean": 10463.5,
"valid_targets_min": 2114
},
{
"epoch": 3.421828908554572,
"grad_norm": 0.1873816855988947,
"learning_rate": 1.096830120483478e-05,
"loss": 0.3641,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11564882099628448,
"step": 5800,
"valid_targets_mean": 9729.3,
"valid_targets_min": 1082
},
{
"epoch": 3.4247787610619467,
"grad_norm": 0.1607099901079245,
"learning_rate": 1.0931569141746672e-05,
"loss": 0.363,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13356913626194,
"step": 5805,
"valid_targets_mean": 12371.8,
"valid_targets_min": 2109
},
{
"epoch": 3.4277286135693217,
"grad_norm": 0.1665172667935528,
"learning_rate": 1.089487554352721e-05,
"loss": 0.3635,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11274045705795288,
"step": 5810,
"valid_targets_mean": 9811.8,
"valid_targets_min": 2354
},
{
"epoch": 3.4306784660766962,
"grad_norm": 0.1516818925090918,
"learning_rate": 1.085822056581685e-05,
"loss": 0.3654,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11470094323158264,
"step": 5815,
"valid_targets_mean": 10083.3,
"valid_targets_min": 1855
},
{
"epoch": 3.433628318584071,
"grad_norm": 0.16050534256161125,
"learning_rate": 1.0821604364092173e-05,
"loss": 0.3598,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10790784657001495,
"step": 5820,
"valid_targets_mean": 8987.7,
"valid_targets_min": 1528
},
{
"epoch": 3.4365781710914454,
"grad_norm": 0.15780365845904865,
"learning_rate": 1.0785027093665338e-05,
"loss": 0.3686,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11171510070562363,
"step": 5825,
"valid_targets_mean": 9973.6,
"valid_targets_min": 2086
},
{
"epoch": 3.43952802359882,
"grad_norm": 0.15230714390743114,
"learning_rate": 1.074848890968335e-05,
"loss": 0.3665,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13318592309951782,
"step": 5830,
"valid_targets_mean": 11855.9,
"valid_targets_min": 1948
},
{
"epoch": 3.442477876106195,
"grad_norm": 0.16470290904412074,
"learning_rate": 1.0711989967127411e-05,
"loss": 0.3618,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11730567365884781,
"step": 5835,
"valid_targets_mean": 10060.4,
"valid_targets_min": 1194
},
{
"epoch": 3.4454277286135695,
"grad_norm": 0.18454157641952232,
"learning_rate": 1.067553042081232e-05,
"loss": 0.3655,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1288733184337616,
"step": 5840,
"valid_targets_mean": 10188.3,
"valid_targets_min": 1425
},
{
"epoch": 3.448377581120944,
"grad_norm": 0.16574266792943357,
"learning_rate": 1.0639110425385706e-05,
"loss": 0.3678,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14179229736328125,
"step": 5845,
"valid_targets_mean": 10892.8,
"valid_targets_min": 2394
},
{
"epoch": 3.4513274336283186,
"grad_norm": 0.16678421583777908,
"learning_rate": 1.0602730135327506e-05,
"loss": 0.3624,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1217309832572937,
"step": 5850,
"valid_targets_mean": 11444.2,
"valid_targets_min": 1168
},
{
"epoch": 3.454277286135693,
"grad_norm": 0.16968315847539236,
"learning_rate": 1.0566389704949182e-05,
"loss": 0.3638,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1125468909740448,
"step": 5855,
"valid_targets_mean": 8869.1,
"valid_targets_min": 1835
},
{
"epoch": 3.4572271386430677,
"grad_norm": 0.1627605634002582,
"learning_rate": 1.0530089288393186e-05,
"loss": 0.3608,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12059512734413147,
"step": 5860,
"valid_targets_mean": 10218.8,
"valid_targets_min": 1490
},
{
"epoch": 3.4601769911504423,
"grad_norm": 0.16403510964024512,
"learning_rate": 1.0493829039632177e-05,
"loss": 0.3621,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1418202966451645,
"step": 5865,
"valid_targets_mean": 12011.1,
"valid_targets_min": 1228
},
{
"epoch": 3.4631268436578173,
"grad_norm": 0.17134085314800312,
"learning_rate": 1.0457609112468505e-05,
"loss": 0.3669,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13072720170021057,
"step": 5870,
"valid_targets_mean": 9414.9,
"valid_targets_min": 2166
},
{
"epoch": 3.466076696165192,
"grad_norm": 0.17700321377311182,
"learning_rate": 1.0421429660533456e-05,
"loss": 0.3669,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10390730202198029,
"step": 5875,
"valid_targets_mean": 8437.3,
"valid_targets_min": 2591
},
{
"epoch": 3.4690265486725664,
"grad_norm": 0.16339951264714045,
"learning_rate": 1.038529083728663e-05,
"loss": 0.3691,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1167861744761467,
"step": 5880,
"valid_targets_mean": 10423.9,
"valid_targets_min": 1563
},
{
"epoch": 3.471976401179941,
"grad_norm": 0.15604649534709167,
"learning_rate": 1.0349192796015315e-05,
"loss": 0.3599,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11106991767883301,
"step": 5885,
"valid_targets_mean": 10573.0,
"valid_targets_min": 1979
},
{
"epoch": 3.4749262536873156,
"grad_norm": 0.16586097181275214,
"learning_rate": 1.0313135689833795e-05,
"loss": 0.3665,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11501479148864746,
"step": 5890,
"valid_targets_mean": 9576.9,
"valid_targets_min": 1775
},
{
"epoch": 3.47787610619469,
"grad_norm": 0.1676293724345518,
"learning_rate": 1.0277119671682762e-05,
"loss": 0.3714,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14278097450733185,
"step": 5895,
"valid_targets_mean": 12086.6,
"valid_targets_min": 2387
},
{
"epoch": 3.4808259587020647,
"grad_norm": 0.18486186420421635,
"learning_rate": 1.0241144894328571e-05,
"loss": 0.3604,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10634157061576843,
"step": 5900,
"valid_targets_mean": 9452.8,
"valid_targets_min": 1872
},
{
"epoch": 3.4837758112094397,
"grad_norm": 0.1606984225160234,
"learning_rate": 1.0205211510362711e-05,
"loss": 0.3651,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13014531135559082,
"step": 5905,
"valid_targets_mean": 10363.9,
"valid_targets_min": 2676
},
{
"epoch": 3.4867256637168142,
"grad_norm": 0.16521860033718624,
"learning_rate": 1.0169319672201032e-05,
"loss": 0.3594,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10334562510251999,
"step": 5910,
"valid_targets_mean": 8599.8,
"valid_targets_min": 1704
},
{
"epoch": 3.489675516224189,
"grad_norm": 0.17246533091080463,
"learning_rate": 1.013346953208322e-05,
"loss": 0.3706,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12668567895889282,
"step": 5915,
"valid_targets_mean": 9828.8,
"valid_targets_min": 1672
},
{
"epoch": 3.4926253687315634,
"grad_norm": 0.17718900262395443,
"learning_rate": 1.0097661242072058e-05,
"loss": 0.3621,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10251834243535995,
"step": 5920,
"valid_targets_mean": 9252.2,
"valid_targets_min": 1382
},
{
"epoch": 3.495575221238938,
"grad_norm": 0.1706768671141397,
"learning_rate": 1.006189495405283e-05,
"loss": 0.3657,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13219738006591797,
"step": 5925,
"valid_targets_mean": 9495.1,
"valid_targets_min": 872
},
{
"epoch": 3.4985250737463125,
"grad_norm": 0.16744200861029962,
"learning_rate": 1.0026170819732664e-05,
"loss": 0.3666,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12546458840370178,
"step": 5930,
"valid_targets_mean": 10810.9,
"valid_targets_min": 1698
},
{
"epoch": 3.501474926253687,
"grad_norm": 0.19280117217492482,
"learning_rate": 9.990488990639878e-06,
"loss": 0.3672,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10583603382110596,
"step": 5935,
"valid_targets_mean": 9692.6,
"valid_targets_min": 2361
},
{
"epoch": 3.504424778761062,
"grad_norm": 0.17427047444951693,
"learning_rate": 9.954849618123354e-06,
"loss": 0.3686,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12246609479188919,
"step": 5940,
"valid_targets_mean": 10629.6,
"valid_targets_min": 861
},
{
"epoch": 3.5073746312684366,
"grad_norm": 0.16144722770141756,
"learning_rate": 9.919252853351895e-06,
"loss": 0.362,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12689387798309326,
"step": 5945,
"valid_targets_mean": 11336.1,
"valid_targets_min": 1485
},
{
"epoch": 3.510324483775811,
"grad_norm": 0.17751770876828085,
"learning_rate": 9.883698847313567e-06,
"loss": 0.3606,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1402921825647354,
"step": 5950,
"valid_targets_mean": 10965.7,
"valid_targets_min": 1453
},
{
"epoch": 3.5132743362831858,
"grad_norm": 0.16111628346749318,
"learning_rate": 9.848187750815078e-06,
"loss": 0.3699,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10104361176490784,
"step": 5955,
"valid_targets_mean": 9067.2,
"valid_targets_min": 1415
},
{
"epoch": 3.5162241887905603,
"grad_norm": 0.17491887195807487,
"learning_rate": 9.812719714481116e-06,
"loss": 0.3615,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10616336017847061,
"step": 5960,
"valid_targets_mean": 8690.3,
"valid_targets_min": 1929
},
{
"epoch": 3.5191740412979353,
"grad_norm": 0.16660955612607778,
"learning_rate": 9.77729488875375e-06,
"loss": 0.3664,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11444689333438873,
"step": 5965,
"valid_targets_mean": 9147.6,
"valid_targets_min": 2141
},
{
"epoch": 3.52212389380531,
"grad_norm": 0.16246815509165646,
"learning_rate": 9.741913423891743e-06,
"loss": 0.3612,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1039552316069603,
"step": 5970,
"valid_targets_mean": 8341.9,
"valid_targets_min": 1249
},
{
"epoch": 3.5250737463126844,
"grad_norm": 0.161823649040674,
"learning_rate": 9.706575469969945e-06,
"loss": 0.3628,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11723171174526215,
"step": 5975,
"valid_targets_mean": 10117.9,
"valid_targets_min": 2552
},
{
"epoch": 3.528023598820059,
"grad_norm": 0.14801245024385287,
"learning_rate": 9.671281176878648e-06,
"loss": 0.3606,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10321583598852158,
"step": 5980,
"valid_targets_mean": 9323.1,
"valid_targets_min": 2004
},
{
"epoch": 3.5309734513274336,
"grad_norm": 0.16517006713119983,
"learning_rate": 9.636030694322954e-06,
"loss": 0.3647,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1235896423459053,
"step": 5985,
"valid_targets_mean": 9358.4,
"valid_targets_min": 2727
},
{
"epoch": 3.533923303834808,
"grad_norm": 0.15787575860756062,
"learning_rate": 9.600824171822131e-06,
"loss": 0.3698,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14009323716163635,
"step": 5990,
"valid_targets_mean": 10875.3,
"valid_targets_min": 1560
},
{
"epoch": 3.5368731563421827,
"grad_norm": 0.16337294055437676,
"learning_rate": 9.565661758708989e-06,
"loss": 0.3685,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13032642006874084,
"step": 5995,
"valid_targets_mean": 10745.1,
"valid_targets_min": 2356
},
{
"epoch": 3.5398230088495577,
"grad_norm": 0.1644220317684143,
"learning_rate": 9.530543604129257e-06,
"loss": 0.3657,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10932029783725739,
"step": 6000,
"valid_targets_mean": 9117.4,
"valid_targets_min": 2033
},
{
"epoch": 3.5427728613569323,
"grad_norm": 0.19450356644800085,
"learning_rate": 9.495469857040895e-06,
"loss": 0.347,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09607994556427002,
"step": 6005,
"valid_targets_mean": 8322.1,
"valid_targets_min": 2131
},
{
"epoch": 3.545722713864307,
"grad_norm": 0.17538929126825079,
"learning_rate": 9.460440666213564e-06,
"loss": 0.3515,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11947473138570786,
"step": 6010,
"valid_targets_mean": 10406.2,
"valid_targets_min": 1407
},
{
"epoch": 3.5486725663716814,
"grad_norm": 0.1664245322565486,
"learning_rate": 9.425456180227863e-06,
"loss": 0.3398,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1309795081615448,
"step": 6015,
"valid_targets_mean": 12493.9,
"valid_targets_min": 2457
},
{
"epoch": 3.551622418879056,
"grad_norm": 0.15993576182334512,
"learning_rate": 9.390516547474841e-06,
"loss": 0.3399,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10049040615558624,
"step": 6020,
"valid_targets_mean": 9960.1,
"valid_targets_min": 2052
},
{
"epoch": 3.554572271386431,
"grad_norm": 0.1703810082388185,
"learning_rate": 9.355621916155233e-06,
"loss": 0.3497,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09826871007680893,
"step": 6025,
"valid_targets_mean": 8378.8,
"valid_targets_min": 1560
},
{
"epoch": 3.557522123893805,
"grad_norm": 0.17052371007062495,
"learning_rate": 9.320772434278944e-06,
"loss": 0.3446,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10447744280099869,
"step": 6030,
"valid_targets_mean": 9472.5,
"valid_targets_min": 2484
},
{
"epoch": 3.56047197640118,
"grad_norm": 0.1740402728099229,
"learning_rate": 9.285968249664348e-06,
"loss": 0.3474,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11183241754770279,
"step": 6035,
"valid_targets_mean": 10299.2,
"valid_targets_min": 878
},
{
"epoch": 3.5634218289085546,
"grad_norm": 0.1727260880217204,
"learning_rate": 9.251209509937678e-06,
"loss": 0.3449,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12178777903318405,
"step": 6040,
"valid_targets_mean": 10887.9,
"valid_targets_min": 2125
},
{
"epoch": 3.566371681415929,
"grad_norm": 0.1664269769495361,
"learning_rate": 9.216496362532444e-06,
"loss": 0.3427,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14320679008960724,
"step": 6045,
"valid_targets_mean": 12573.0,
"valid_targets_min": 2048
},
{
"epoch": 3.5693215339233038,
"grad_norm": 0.20720455649601438,
"learning_rate": 9.181828954688711e-06,
"loss": 0.3466,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10612769424915314,
"step": 6050,
"valid_targets_mean": 9179.3,
"valid_targets_min": 1147
},
{
"epoch": 3.5722713864306783,
"grad_norm": 0.17616659494798745,
"learning_rate": 9.147207433452606e-06,
"loss": 0.3405,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1183801218867302,
"step": 6055,
"valid_targets_mean": 10706.8,
"valid_targets_min": 1593
},
{
"epoch": 3.5752212389380533,
"grad_norm": 0.19353117371557066,
"learning_rate": 9.112631945675543e-06,
"loss": 0.3415,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11053000390529633,
"step": 6060,
"valid_targets_mean": 9218.1,
"valid_targets_min": 2137
},
{
"epoch": 3.578171091445428,
"grad_norm": 0.1824706599342028,
"learning_rate": 9.07810263801376e-06,
"loss": 0.3482,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12948954105377197,
"step": 6065,
"valid_targets_mean": 11224.7,
"valid_targets_min": 1822
},
{
"epoch": 3.5811209439528024,
"grad_norm": 0.17690069727924032,
"learning_rate": 9.04361965692754e-06,
"loss": 0.3438,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12248221039772034,
"step": 6070,
"valid_targets_mean": 11156.6,
"valid_targets_min": 1606
},
{
"epoch": 3.584070796460177,
"grad_norm": 0.1808717891925985,
"learning_rate": 9.009183148680732e-06,
"loss": 0.3436,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12746146321296692,
"step": 6075,
"valid_targets_mean": 10960.1,
"valid_targets_min": 1556
},
{
"epoch": 3.5870206489675516,
"grad_norm": 0.17184531748341997,
"learning_rate": 8.97479325934002e-06,
"loss": 0.3471,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10450553894042969,
"step": 6080,
"valid_targets_mean": 9461.7,
"valid_targets_min": 1929
},
{
"epoch": 3.589970501474926,
"grad_norm": 0.173522586995958,
"learning_rate": 8.940450134774372e-06,
"loss": 0.3533,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11991443485021591,
"step": 6085,
"valid_targets_mean": 9745.5,
"valid_targets_min": 1581
},
{
"epoch": 3.5929203539823007,
"grad_norm": 0.17891278385912598,
"learning_rate": 8.906153920654386e-06,
"loss": 0.3418,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1171131432056427,
"step": 6090,
"valid_targets_mean": 10080.6,
"valid_targets_min": 2923
},
{
"epoch": 3.5958702064896757,
"grad_norm": 0.1727148337513361,
"learning_rate": 8.871904762451684e-06,
"loss": 0.3376,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10876183956861496,
"step": 6095,
"valid_targets_mean": 8127.2,
"valid_targets_min": 1571
},
{
"epoch": 3.5988200589970503,
"grad_norm": 0.16448376053014324,
"learning_rate": 8.837702805438302e-06,
"loss": 0.3489,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11159020662307739,
"step": 6100,
"valid_targets_mean": 10449.8,
"valid_targets_min": 1912
},
{
"epoch": 3.601769911504425,
"grad_norm": 0.17316648159091635,
"learning_rate": 8.803548194686052e-06,
"loss": 0.3465,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10270095616579056,
"step": 6105,
"valid_targets_mean": 8532.2,
"valid_targets_min": 1791
},
{
"epoch": 3.6047197640117994,
"grad_norm": 0.1648039518875971,
"learning_rate": 8.769441075065952e-06,
"loss": 0.3486,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12315913289785385,
"step": 6110,
"valid_targets_mean": 11387.8,
"valid_targets_min": 2003
},
{
"epoch": 3.607669616519174,
"grad_norm": 0.1700750326347402,
"learning_rate": 8.735381591247531e-06,
"loss": 0.3482,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11073935031890869,
"step": 6115,
"valid_targets_mean": 9229.9,
"valid_targets_min": 2522
},
{
"epoch": 3.6106194690265485,
"grad_norm": 0.1650958529279955,
"learning_rate": 8.701369887698316e-06,
"loss": 0.3442,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.132333442568779,
"step": 6120,
"valid_targets_mean": 12198.8,
"valid_targets_min": 1675
},
{
"epoch": 3.613569321533923,
"grad_norm": 0.17293858668863504,
"learning_rate": 8.667406108683139e-06,
"loss": 0.3462,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1118520200252533,
"step": 6125,
"valid_targets_mean": 10017.0,
"valid_targets_min": 1776
},
{
"epoch": 3.616519174041298,
"grad_norm": 0.16660377768247725,
"learning_rate": 8.633490398263554e-06,
"loss": 0.3444,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10835165530443192,
"step": 6130,
"valid_targets_mean": 10342.0,
"valid_targets_min": 1961
},
{
"epoch": 3.6194690265486726,
"grad_norm": 0.16884560005763607,
"learning_rate": 8.599622900297237e-06,
"loss": 0.3436,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11159470677375793,
"step": 6135,
"valid_targets_mean": 9962.6,
"valid_targets_min": 2405
},
{
"epoch": 3.622418879056047,
"grad_norm": 0.1759270006257247,
"learning_rate": 8.565803758437362e-06,
"loss": 0.3459,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09441868960857391,
"step": 6140,
"valid_targets_mean": 8304.7,
"valid_targets_min": 1978
},
{
"epoch": 3.6253687315634218,
"grad_norm": 0.18070673900085818,
"learning_rate": 8.53203311613199e-06,
"loss": 0.3427,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12781083583831787,
"step": 6145,
"valid_targets_mean": 12342.4,
"valid_targets_min": 2187
},
{
"epoch": 3.6283185840707963,
"grad_norm": 0.17753626529384683,
"learning_rate": 8.498311116623468e-06,
"loss": 0.3441,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11087179183959961,
"step": 6150,
"valid_targets_mean": 9165.0,
"valid_targets_min": 832
},
{
"epoch": 3.6312684365781713,
"grad_norm": 0.1646166036937146,
"learning_rate": 8.46463790294782e-06,
"loss": 0.3452,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11283563077449799,
"step": 6155,
"valid_targets_mean": 10573.9,
"valid_targets_min": 2386
},
{
"epoch": 3.6342182890855455,
"grad_norm": 0.16202203309587745,
"learning_rate": 8.431013617934137e-06,
"loss": 0.352,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0927003026008606,
"step": 6160,
"valid_targets_mean": 8261.4,
"valid_targets_min": 1439
},
{
"epoch": 3.6371681415929205,
"grad_norm": 0.17678122262561619,
"learning_rate": 8.397438404203967e-06,
"loss": 0.3558,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12316885590553284,
"step": 6165,
"valid_targets_mean": 9847.7,
"valid_targets_min": 1767
},
{
"epoch": 3.640117994100295,
"grad_norm": 0.1680766739382681,
"learning_rate": 8.363912404170738e-06,
"loss": 0.3456,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1343480795621872,
"step": 6170,
"valid_targets_mean": 13030.2,
"valid_targets_min": 2483
},
{
"epoch": 3.6430678466076696,
"grad_norm": 0.18380350198660017,
"learning_rate": 8.330435760039106e-06,
"loss": 0.343,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.104166179895401,
"step": 6175,
"valid_targets_mean": 9731.1,
"valid_targets_min": 1703
},
{
"epoch": 3.646017699115044,
"grad_norm": 0.16599997979774428,
"learning_rate": 8.297008613804391e-06,
"loss": 0.3452,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11891473829746246,
"step": 6180,
"valid_targets_mean": 10780.1,
"valid_targets_min": 1649
},
{
"epoch": 3.6489675516224187,
"grad_norm": 0.167945203058584,
"learning_rate": 8.263631107251959e-06,
"loss": 0.3517,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12040609866380692,
"step": 6185,
"valid_targets_mean": 10743.4,
"valid_targets_min": 1801
},
{
"epoch": 3.6519174041297937,
"grad_norm": 0.16579591867118337,
"learning_rate": 8.230303381956626e-06,
"loss": 0.3533,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09442141652107239,
"step": 6190,
"valid_targets_mean": 9102.6,
"valid_targets_min": 1830
},
{
"epoch": 3.6548672566371683,
"grad_norm": 0.16262630444579598,
"learning_rate": 8.197025579282048e-06,
"loss": 0.3421,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0995297059416771,
"step": 6195,
"valid_targets_mean": 9400.9,
"valid_targets_min": 1853
},
{
"epoch": 3.657817109144543,
"grad_norm": 0.16235716247631857,
"learning_rate": 8.163797840380123e-06,
"loss": 0.337,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11255133152008057,
"step": 6200,
"valid_targets_mean": 10114.0,
"valid_targets_min": 2144
},
{
"epoch": 3.6607669616519174,
"grad_norm": 0.1754927540173778,
"learning_rate": 8.130620306190433e-06,
"loss": 0.3372,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11358267068862915,
"step": 6205,
"valid_targets_mean": 9553.2,
"valid_targets_min": 2181
},
{
"epoch": 3.663716814159292,
"grad_norm": 0.17062171541474505,
"learning_rate": 8.097493117439554e-06,
"loss": 0.3471,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11900287866592407,
"step": 6210,
"valid_targets_mean": 9748.7,
"valid_targets_min": 856
},
{
"epoch": 3.6666666666666665,
"grad_norm": 0.16773458814080258,
"learning_rate": 8.064416414640572e-06,
"loss": 0.3501,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12731051445007324,
"step": 6215,
"valid_targets_mean": 12207.3,
"valid_targets_min": 2941
},
{
"epoch": 3.669616519174041,
"grad_norm": 0.168416961836028,
"learning_rate": 8.031390338092378e-06,
"loss": 0.3455,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10286203026771545,
"step": 6220,
"valid_targets_mean": 9607.7,
"valid_targets_min": 1480
},
{
"epoch": 3.672566371681416,
"grad_norm": 0.16945037472215474,
"learning_rate": 7.998415027879179e-06,
"loss": 0.3532,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10942085087299347,
"step": 6225,
"valid_targets_mean": 10516.6,
"valid_targets_min": 1750
},
{
"epoch": 3.6755162241887906,
"grad_norm": 0.17600897641430144,
"learning_rate": 7.965490623869794e-06,
"loss": 0.3459,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1005764976143837,
"step": 6230,
"valid_targets_mean": 9166.2,
"valid_targets_min": 2342
},
{
"epoch": 3.678466076696165,
"grad_norm": 0.17173774425396918,
"learning_rate": 7.932617265717167e-06,
"loss": 0.3479,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13368156552314758,
"step": 6235,
"valid_targets_mean": 10198.2,
"valid_targets_min": 1888
},
{
"epoch": 3.6814159292035398,
"grad_norm": 0.1745358047065503,
"learning_rate": 7.899795092857696e-06,
"loss": 0.3476,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11775140464305878,
"step": 6240,
"valid_targets_mean": 9976.0,
"valid_targets_min": 1591
},
{
"epoch": 3.6843657817109143,
"grad_norm": 0.17554957959750347,
"learning_rate": 7.867024244510673e-06,
"loss": 0.342,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10555160790681839,
"step": 6245,
"valid_targets_mean": 8667.3,
"valid_targets_min": 1636
},
{
"epoch": 3.6873156342182893,
"grad_norm": 0.17524218274714723,
"learning_rate": 7.834304859677716e-06,
"loss": 0.3472,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13906937837600708,
"step": 6250,
"valid_targets_mean": 11671.9,
"valid_targets_min": 1372
},
{
"epoch": 3.6902654867256635,
"grad_norm": 0.17554401621953275,
"learning_rate": 7.801637077142104e-06,
"loss": 0.3483,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1021658331155777,
"step": 6255,
"valid_targets_mean": 8705.5,
"valid_targets_min": 788
},
{
"epoch": 3.6932153392330385,
"grad_norm": 0.16643085352425324,
"learning_rate": 7.769021035468299e-06,
"loss": 0.3481,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11641626060009003,
"step": 6260,
"valid_targets_mean": 10789.9,
"valid_targets_min": 1629
},
{
"epoch": 3.696165191740413,
"grad_norm": 0.16909368644232686,
"learning_rate": 7.736456873001237e-06,
"loss": 0.3524,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10872875154018402,
"step": 6265,
"valid_targets_mean": 9820.9,
"valid_targets_min": 2079
},
{
"epoch": 3.6991150442477876,
"grad_norm": 0.15963667721381897,
"learning_rate": 7.703944727865862e-06,
"loss": 0.3442,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10363304615020752,
"step": 6270,
"valid_targets_mean": 9519.0,
"valid_targets_min": 1443
},
{
"epoch": 3.702064896755162,
"grad_norm": 0.16511138622677904,
"learning_rate": 7.671484737966419e-06,
"loss": 0.3454,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11367395520210266,
"step": 6275,
"valid_targets_mean": 11148.6,
"valid_targets_min": 2844
},
{
"epoch": 3.7050147492625367,
"grad_norm": 0.18024864216215955,
"learning_rate": 7.639077040985988e-06,
"loss": 0.3476,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14413657784461975,
"step": 6280,
"valid_targets_mean": 11772.3,
"valid_targets_min": 2041
},
{
"epoch": 3.7079646017699117,
"grad_norm": 0.1715775268186753,
"learning_rate": 7.606721774385799e-06,
"loss": 0.3434,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10575740039348602,
"step": 6285,
"valid_targets_mean": 9464.2,
"valid_targets_min": 2006
},
{
"epoch": 3.7109144542772863,
"grad_norm": 0.178496726739179,
"learning_rate": 7.574419075404718e-06,
"loss": 0.3503,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10551615059375763,
"step": 6290,
"valid_targets_mean": 10115.8,
"valid_targets_min": 2033
},
{
"epoch": 3.713864306784661,
"grad_norm": 0.16922995334986288,
"learning_rate": 7.5421690810586235e-06,
"loss": 0.3408,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09147170186042786,
"step": 6295,
"valid_targets_mean": 8914.2,
"valid_targets_min": 1829
},
{
"epoch": 3.7168141592920354,
"grad_norm": 0.1698282291677968,
"learning_rate": 7.509971928139848e-06,
"loss": 0.3426,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12778304517269135,
"step": 6300,
"valid_targets_mean": 11594.1,
"valid_targets_min": 1466
},
{
"epoch": 3.71976401179941,
"grad_norm": 0.16512789906024777,
"learning_rate": 7.477827753216589e-06,
"loss": 0.3437,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11623457819223404,
"step": 6305,
"valid_targets_mean": 10735.3,
"valid_targets_min": 1786
},
{
"epoch": 3.7227138643067845,
"grad_norm": 0.17231015736096786,
"learning_rate": 7.445736692632326e-06,
"loss": 0.3435,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11947697401046753,
"step": 6310,
"valid_targets_mean": 11454.9,
"valid_targets_min": 2305
},
{
"epoch": 3.725663716814159,
"grad_norm": 0.1641230791590994,
"learning_rate": 7.413698882505271e-06,
"loss": 0.3512,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10247132927179337,
"step": 6315,
"valid_targets_mean": 9119.2,
"valid_targets_min": 933
},
{
"epoch": 3.728613569321534,
"grad_norm": 0.16978357719585283,
"learning_rate": 7.381714458727726e-06,
"loss": 0.3496,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09884299337863922,
"step": 6320,
"valid_targets_mean": 9410.8,
"valid_targets_min": 1837
},
{
"epoch": 3.7315634218289087,
"grad_norm": 0.15757721589249796,
"learning_rate": 7.349783556965588e-06,
"loss": 0.34,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0996585488319397,
"step": 6325,
"valid_targets_mean": 9461.3,
"valid_targets_min": 1841
},
{
"epoch": 3.734513274336283,
"grad_norm": 0.16646465943939942,
"learning_rate": 7.317906312657714e-06,
"loss": 0.3452,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1353026032447815,
"step": 6330,
"valid_targets_mean": 12400.2,
"valid_targets_min": 2042
},
{
"epoch": 3.737463126843658,
"grad_norm": 0.1554771877383893,
"learning_rate": 7.286082861015371e-06,
"loss": 0.3467,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13425269722938538,
"step": 6335,
"valid_targets_mean": 12530.3,
"valid_targets_min": 2926
},
{
"epoch": 3.7404129793510323,
"grad_norm": 0.181300037618926,
"learning_rate": 7.25431333702165e-06,
"loss": 0.3442,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12450385838747025,
"step": 6340,
"valid_targets_mean": 10509.6,
"valid_targets_min": 649
},
{
"epoch": 3.7433628318584073,
"grad_norm": 0.1640895467509584,
"learning_rate": 7.222597875430915e-06,
"loss": 0.3422,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11129672080278397,
"step": 6345,
"valid_targets_mean": 9454.0,
"valid_targets_min": 2003
},
{
"epoch": 3.7463126843657815,
"grad_norm": 0.16861575775932142,
"learning_rate": 7.190936610768207e-06,
"loss": 0.3453,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10709446668624878,
"step": 6350,
"valid_targets_mean": 9103.6,
"valid_targets_min": 1608
},
{
"epoch": 3.7492625368731565,
"grad_norm": 0.17534385015787332,
"learning_rate": 7.159329677328688e-06,
"loss": 0.3421,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10979295521974564,
"step": 6355,
"valid_targets_mean": 9436.6,
"valid_targets_min": 2137
},
{
"epoch": 3.752212389380531,
"grad_norm": 0.1709407442953378,
"learning_rate": 7.127777209177067e-06,
"loss": 0.3442,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10932078212499619,
"step": 6360,
"valid_targets_mean": 9747.0,
"valid_targets_min": 1135
},
{
"epoch": 3.7551622418879056,
"grad_norm": 0.1692586176282364,
"learning_rate": 7.096279340147032e-06,
"loss": 0.347,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11985991895198822,
"step": 6365,
"valid_targets_mean": 10079.6,
"valid_targets_min": 2286
},
{
"epoch": 3.75811209439528,
"grad_norm": 0.16424785026958424,
"learning_rate": 7.064836203840675e-06,
"loss": 0.3516,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11962170153856277,
"step": 6370,
"valid_targets_mean": 10582.6,
"valid_targets_min": 1657
},
{
"epoch": 3.7610619469026547,
"grad_norm": 0.17826076992497336,
"learning_rate": 7.033447933627959e-06,
"loss": 0.3511,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10628711432218552,
"step": 6375,
"valid_targets_mean": 8869.7,
"valid_targets_min": 1883
},
{
"epoch": 3.7640117994100297,
"grad_norm": 0.18140433917301785,
"learning_rate": 7.002114662646078e-06,
"loss": 0.3386,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1187339499592781,
"step": 6380,
"valid_targets_mean": 10999.8,
"valid_targets_min": 1608
},
{
"epoch": 3.7669616519174043,
"grad_norm": 0.16342405697264487,
"learning_rate": 6.970836523798992e-06,
"loss": 0.3479,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11724892258644104,
"step": 6385,
"valid_targets_mean": 10845.2,
"valid_targets_min": 1769
},
{
"epoch": 3.769911504424779,
"grad_norm": 0.1769109723907381,
"learning_rate": 6.939613649756773e-06,
"loss": 0.3443,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12063444405794144,
"step": 6390,
"valid_targets_mean": 11583.4,
"valid_targets_min": 2726
},
{
"epoch": 3.7728613569321534,
"grad_norm": 0.16774493767056747,
"learning_rate": 6.908446172955103e-06,
"loss": 0.3414,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1022709459066391,
"step": 6395,
"valid_targets_mean": 9023.2,
"valid_targets_min": 1719
},
{
"epoch": 3.775811209439528,
"grad_norm": 0.16532399248445567,
"learning_rate": 6.877334225594677e-06,
"loss": 0.3455,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1327495276927948,
"step": 6400,
"valid_targets_mean": 11621.1,
"valid_targets_min": 1627
},
{
"epoch": 3.7787610619469025,
"grad_norm": 0.17263632707334922,
"learning_rate": 6.846277939640653e-06,
"loss": 0.3407,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13509851694107056,
"step": 6405,
"valid_targets_mean": 10227.8,
"valid_targets_min": 2542
},
{
"epoch": 3.781710914454277,
"grad_norm": 0.1668878067844066,
"learning_rate": 6.8152774468221195e-06,
"loss": 0.3381,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10570927709341049,
"step": 6410,
"valid_targets_mean": 8847.1,
"valid_targets_min": 2962
},
{
"epoch": 3.784660766961652,
"grad_norm": 0.17606729721917502,
"learning_rate": 6.78433287863147e-06,
"loss": 0.3471,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12169715762138367,
"step": 6415,
"valid_targets_mean": 11824.5,
"valid_targets_min": 2336
},
{
"epoch": 3.7876106194690267,
"grad_norm": 0.174587558240972,
"learning_rate": 6.7534443663239314e-06,
"loss": 0.3478,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14479205012321472,
"step": 6420,
"valid_targets_mean": 13422.8,
"valid_targets_min": 2469
},
{
"epoch": 3.7905604719764012,
"grad_norm": 0.16719235317425998,
"learning_rate": 6.7226120409169185e-06,
"loss": 0.3447,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08362986892461777,
"step": 6425,
"valid_targets_mean": 8039.5,
"valid_targets_min": 1011
},
{
"epoch": 3.793510324483776,
"grad_norm": 0.16546216405386466,
"learning_rate": 6.6918360331895674e-06,
"loss": 0.3438,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09400837868452072,
"step": 6430,
"valid_targets_mean": 8162.9,
"valid_targets_min": 1768
},
{
"epoch": 3.7964601769911503,
"grad_norm": 0.17191373561059659,
"learning_rate": 6.661116473682088e-06,
"loss": 0.3432,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.122324638068676,
"step": 6435,
"valid_targets_mean": 9680.6,
"valid_targets_min": 1517
},
{
"epoch": 3.799410029498525,
"grad_norm": 0.16322793961765103,
"learning_rate": 6.630453492695304e-06,
"loss": 0.346,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11813613772392273,
"step": 6440,
"valid_targets_mean": 10204.0,
"valid_targets_min": 1856
},
{
"epoch": 3.8023598820058995,
"grad_norm": 0.1652451657616475,
"learning_rate": 6.5998472202900254e-06,
"loss": 0.3427,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13308531045913696,
"step": 6445,
"valid_targets_mean": 11088.9,
"valid_targets_min": 3033
},
{
"epoch": 3.8053097345132745,
"grad_norm": 0.16790780251020782,
"learning_rate": 6.5692977862865285e-06,
"loss": 0.3496,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10099241137504578,
"step": 6450,
"valid_targets_mean": 8808.9,
"valid_targets_min": 1628
},
{
"epoch": 3.808259587020649,
"grad_norm": 0.17544823543649818,
"learning_rate": 6.538805320264028e-06,
"loss": 0.3418,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1215641126036644,
"step": 6455,
"valid_targets_mean": 10004.9,
"valid_targets_min": 2090
},
{
"epoch": 3.8112094395280236,
"grad_norm": 0.15764389972156023,
"learning_rate": 6.508369951560054e-06,
"loss": 0.3497,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12080827355384827,
"step": 6460,
"valid_targets_mean": 11585.9,
"valid_targets_min": 1578
},
{
"epoch": 3.814159292035398,
"grad_norm": 0.18037623858830892,
"learning_rate": 6.477991809270005e-06,
"loss": 0.3441,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12614494562149048,
"step": 6465,
"valid_targets_mean": 10658.7,
"valid_targets_min": 1712
},
{
"epoch": 3.8171091445427727,
"grad_norm": 0.16246465667800158,
"learning_rate": 6.447671022246495e-06,
"loss": 0.3465,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1316598355770111,
"step": 6470,
"valid_targets_mean": 11714.4,
"valid_targets_min": 2874
},
{
"epoch": 3.8200589970501477,
"grad_norm": 0.1671932168668726,
"learning_rate": 6.4174077190989134e-06,
"loss": 0.3416,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09807242453098297,
"step": 6475,
"valid_targets_mean": 9205.3,
"valid_targets_min": 2733
},
{
"epoch": 3.823008849557522,
"grad_norm": 0.1558550238873647,
"learning_rate": 6.387202028192765e-06,
"loss": 0.3411,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09681665897369385,
"step": 6480,
"valid_targets_mean": 8837.8,
"valid_targets_min": 2032
},
{
"epoch": 3.825958702064897,
"grad_norm": 0.1599149693693091,
"learning_rate": 6.357054077649236e-06,
"loss": 0.3426,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1108127236366272,
"step": 6485,
"valid_targets_mean": 10313.7,
"valid_targets_min": 2037
},
{
"epoch": 3.8289085545722714,
"grad_norm": 0.2814540103412294,
"learning_rate": 6.326963995344575e-06,
"loss": 0.3456,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09222610294818878,
"step": 6490,
"valid_targets_mean": 8079.2,
"valid_targets_min": 1799
},
{
"epoch": 3.831858407079646,
"grad_norm": 0.16787270480252503,
"learning_rate": 6.296931908909578e-06,
"loss": 0.3386,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14041510224342346,
"step": 6495,
"valid_targets_mean": 11687.4,
"valid_targets_min": 1660
},
{
"epoch": 3.8348082595870205,
"grad_norm": 0.16222885250068517,
"learning_rate": 6.266957945729044e-06,
"loss": 0.3508,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10812919586896896,
"step": 6500,
"valid_targets_mean": 9689.1,
"valid_targets_min": 1213
},
{
"epoch": 3.837758112094395,
"grad_norm": 0.1619680212917784,
"learning_rate": 6.237042232941241e-06,
"loss": 0.3452,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15254142880439758,
"step": 6505,
"valid_targets_mean": 13727.9,
"valid_targets_min": 2019
},
{
"epoch": 3.84070796460177,
"grad_norm": 0.16666940188615342,
"learning_rate": 6.207184897437355e-06,
"loss": 0.343,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09690691530704498,
"step": 6510,
"valid_targets_mean": 8408.8,
"valid_targets_min": 1770
},
{
"epoch": 3.8436578171091447,
"grad_norm": 0.1653920328156485,
"learning_rate": 6.17738606586096e-06,
"loss": 0.348,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12510699033737183,
"step": 6515,
"valid_targets_mean": 10496.0,
"valid_targets_min": 1924
},
{
"epoch": 3.8466076696165192,
"grad_norm": 0.17052174641185705,
"learning_rate": 6.1476458646074765e-06,
"loss": 0.3445,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10477550327777863,
"step": 6520,
"valid_targets_mean": 9131.2,
"valid_targets_min": 2712
},
{
"epoch": 3.849557522123894,
"grad_norm": 0.17419686871265677,
"learning_rate": 6.117964419823632e-06,
"loss": 0.3451,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11350217461585999,
"step": 6525,
"valid_targets_mean": 8391.5,
"valid_targets_min": 1896
},
{
"epoch": 3.8525073746312684,
"grad_norm": 0.16258801176668275,
"learning_rate": 6.088341857406952e-06,
"loss": 0.3404,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10940175503492355,
"step": 6530,
"valid_targets_mean": 9973.9,
"valid_targets_min": 1874
},
{
"epoch": 3.855457227138643,
"grad_norm": 0.15465794427933052,
"learning_rate": 6.058778303005184e-06,
"loss": 0.3439,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11987055838108063,
"step": 6535,
"valid_targets_mean": 11387.2,
"valid_targets_min": 2079
},
{
"epoch": 3.8584070796460175,
"grad_norm": 0.16673934443470403,
"learning_rate": 6.029273882015794e-06,
"loss": 0.3433,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11683391779661179,
"step": 6540,
"valid_targets_mean": 9381.8,
"valid_targets_min": 1708
},
{
"epoch": 3.8613569321533925,
"grad_norm": 0.17985237846474775,
"learning_rate": 5.999828719585419e-06,
"loss": 0.3478,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1079455316066742,
"step": 6545,
"valid_targets_mean": 8509.3,
"valid_targets_min": 1118
},
{
"epoch": 3.864306784660767,
"grad_norm": 0.16617501395918077,
"learning_rate": 5.9704429406093555e-06,
"loss": 0.3484,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11439075320959091,
"step": 6550,
"valid_targets_mean": 10374.7,
"valid_targets_min": 2011
},
{
"epoch": 3.8672566371681416,
"grad_norm": 0.1659912761912214,
"learning_rate": 5.941116669731011e-06,
"loss": 0.3478,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14208897948265076,
"step": 6555,
"valid_targets_mean": 12519.0,
"valid_targets_min": 1887
},
{
"epoch": 3.870206489675516,
"grad_norm": 0.17092514673071188,
"learning_rate": 5.9118500313413795e-06,
"loss": 0.3396,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10985920578241348,
"step": 6560,
"valid_targets_mean": 9916.1,
"valid_targets_min": 1793
},
{
"epoch": 3.8731563421828907,
"grad_norm": 0.1747700268580997,
"learning_rate": 5.882643149578522e-06,
"loss": 0.3527,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12933915853500366,
"step": 6565,
"valid_targets_mean": 10340.9,
"valid_targets_min": 1125
},
{
"epoch": 3.8761061946902657,
"grad_norm": 0.1701245952171269,
"learning_rate": 5.853496148327032e-06,
"loss": 0.3427,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12071774899959564,
"step": 6570,
"valid_targets_mean": 9584.5,
"valid_targets_min": 2028
},
{
"epoch": 3.87905604719764,
"grad_norm": 0.17367176274171137,
"learning_rate": 5.824409151217507e-06,
"loss": 0.3505,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13250917196273804,
"step": 6575,
"valid_targets_mean": 11590.9,
"valid_targets_min": 2261
},
{
"epoch": 3.882005899705015,
"grad_norm": 0.16070228970994752,
"learning_rate": 5.79538228162605e-06,
"loss": 0.3456,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12515580654144287,
"step": 6580,
"valid_targets_mean": 11354.4,
"valid_targets_min": 1773
},
{
"epoch": 3.8849557522123894,
"grad_norm": 0.16170822860983441,
"learning_rate": 5.76641566267369e-06,
"loss": 0.3461,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11002568900585175,
"step": 6585,
"valid_targets_mean": 9635.8,
"valid_targets_min": 2187
},
{
"epoch": 3.887905604719764,
"grad_norm": 0.1722451727249354,
"learning_rate": 5.737509417225933e-06,
"loss": 0.3404,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11824969947338104,
"step": 6590,
"valid_targets_mean": 10532.5,
"valid_targets_min": 1940
},
{
"epoch": 3.8908554572271385,
"grad_norm": 0.1556413370229152,
"learning_rate": 5.70866366789218e-06,
"loss": 0.3453,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12434402853250504,
"step": 6595,
"valid_targets_mean": 11384.6,
"valid_targets_min": 2096
},
{
"epoch": 3.893805309734513,
"grad_norm": 0.1656739848194637,
"learning_rate": 5.679878537025238e-06,
"loss": 0.3415,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11528940498828888,
"step": 6600,
"valid_targets_mean": 10272.5,
"valid_targets_min": 2815
},
{
"epoch": 3.896755162241888,
"grad_norm": 0.1618610591918246,
"learning_rate": 5.65115414672079e-06,
"loss": 0.3487,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13066346943378448,
"step": 6605,
"valid_targets_mean": 11145.4,
"valid_targets_min": 818
},
{
"epoch": 3.8997050147492627,
"grad_norm": 0.16099503298446652,
"learning_rate": 5.622490618816881e-06,
"loss": 0.3409,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10254774987697601,
"step": 6610,
"valid_targets_mean": 9275.6,
"valid_targets_min": 1757
},
{
"epoch": 3.9026548672566372,
"grad_norm": 0.16139572620781348,
"learning_rate": 5.5938880748934144e-06,
"loss": 0.3459,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12209212779998779,
"step": 6615,
"valid_targets_mean": 10562.0,
"valid_targets_min": 1778
},
{
"epoch": 3.905604719764012,
"grad_norm": 0.16912364039387326,
"learning_rate": 5.565346636271587e-06,
"loss": 0.3434,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11217247694730759,
"step": 6620,
"valid_targets_mean": 9969.5,
"valid_targets_min": 1957
},
{
"epoch": 3.9085545722713864,
"grad_norm": 0.16403825414110845,
"learning_rate": 5.536866424013463e-06,
"loss": 0.3457,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1278546005487442,
"step": 6625,
"valid_targets_mean": 10153.2,
"valid_targets_min": 2191
},
{
"epoch": 3.911504424778761,
"grad_norm": 0.16830399382047592,
"learning_rate": 5.508447558921346e-06,
"loss": 0.3522,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09282360225915909,
"step": 6630,
"valid_targets_mean": 8849.2,
"valid_targets_min": 324
},
{
"epoch": 3.9144542772861355,
"grad_norm": 0.15924541084825097,
"learning_rate": 5.480090161537388e-06,
"loss": 0.3464,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12358694523572922,
"step": 6635,
"valid_targets_mean": 10924.6,
"valid_targets_min": 2710
},
{
"epoch": 3.9174041297935105,
"grad_norm": 0.15560194458761062,
"learning_rate": 5.451794352142965e-06,
"loss": 0.3491,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1277778148651123,
"step": 6640,
"valid_targets_mean": 11752.3,
"valid_targets_min": 1969
},
{
"epoch": 3.920353982300885,
"grad_norm": 0.16863501499682176,
"learning_rate": 5.423560250758264e-06,
"loss": 0.3485,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13744091987609863,
"step": 6645,
"valid_targets_mean": 12698.6,
"valid_targets_min": 2768
},
{
"epoch": 3.9233038348082596,
"grad_norm": 0.16556811433623927,
"learning_rate": 5.395387977141702e-06,
"loss": 0.3506,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11003266274929047,
"step": 6650,
"valid_targets_mean": 10104.6,
"valid_targets_min": 1652
},
{
"epoch": 3.926253687315634,
"grad_norm": 0.1566548731455713,
"learning_rate": 5.367277650789455e-06,
"loss": 0.3502,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12147540599107742,
"step": 6655,
"valid_targets_mean": 11014.7,
"valid_targets_min": 1872
},
{
"epoch": 3.9292035398230087,
"grad_norm": 0.16800747281497158,
"learning_rate": 5.339229390934941e-06,
"loss": 0.3444,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11620292067527771,
"step": 6660,
"valid_targets_mean": 10039.7,
"valid_targets_min": 2777
},
{
"epoch": 3.9321533923303837,
"grad_norm": 0.16958647093311707,
"learning_rate": 5.311243316548312e-06,
"loss": 0.3503,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12884800136089325,
"step": 6665,
"valid_targets_mean": 11453.5,
"valid_targets_min": 1275
},
{
"epoch": 3.935103244837758,
"grad_norm": 0.16445607485119396,
"learning_rate": 5.2833195463359725e-06,
"loss": 0.351,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10376372933387756,
"step": 6670,
"valid_targets_mean": 8932.7,
"valid_targets_min": 1791
},
{
"epoch": 3.938053097345133,
"grad_norm": 0.17134724997512896,
"learning_rate": 5.2554581987400155e-06,
"loss": 0.3381,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11989767104387283,
"step": 6675,
"valid_targets_mean": 11101.6,
"valid_targets_min": 2707
},
{
"epoch": 3.9410029498525074,
"grad_norm": 0.1715643102378431,
"learning_rate": 5.227659391937812e-06,
"loss": 0.3446,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13737812638282776,
"step": 6680,
"valid_targets_mean": 10862.0,
"valid_targets_min": 1591
},
{
"epoch": 3.943952802359882,
"grad_norm": 0.16952566207322528,
"learning_rate": 5.199923243841402e-06,
"loss": 0.3454,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12849953770637512,
"step": 6685,
"valid_targets_mean": 10801.4,
"valid_targets_min": 1421
},
{
"epoch": 3.9469026548672566,
"grad_norm": 0.1717652002538149,
"learning_rate": 5.172249872097108e-06,
"loss": 0.3449,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11228206753730774,
"step": 6690,
"valid_targets_mean": 8929.9,
"valid_targets_min": 1203
},
{
"epoch": 3.949852507374631,
"grad_norm": 0.16253902540810058,
"learning_rate": 5.144639394084938e-06,
"loss": 0.3516,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11897753924131393,
"step": 6695,
"valid_targets_mean": 10474.6,
"valid_targets_min": 1041
},
{
"epoch": 3.952802359882006,
"grad_norm": 0.16657433949683387,
"learning_rate": 5.117091926918145e-06,
"loss": 0.3474,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10188919305801392,
"step": 6700,
"valid_targets_mean": 8967.3,
"valid_targets_min": 2401
},
{
"epoch": 3.9557522123893807,
"grad_norm": 0.1673520592720761,
"learning_rate": 5.089607587442709e-06,
"loss": 0.3444,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12093910574913025,
"step": 6705,
"valid_targets_mean": 10507.0,
"valid_targets_min": 1811
},
{
"epoch": 3.9587020648967552,
"grad_norm": 0.16051963913152287,
"learning_rate": 5.062186492236849e-06,
"loss": 0.35,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1005478948354721,
"step": 6710,
"valid_targets_mean": 9101.4,
"valid_targets_min": 1896
},
{
"epoch": 3.96165191740413,
"grad_norm": 0.1567988848736846,
"learning_rate": 5.034828757610526e-06,
"loss": 0.3461,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12492018938064575,
"step": 6715,
"valid_targets_mean": 11740.2,
"valid_targets_min": 1329
},
{
"epoch": 3.9646017699115044,
"grad_norm": 0.16986019942555441,
"learning_rate": 5.007534499604945e-06,
"loss": 0.3467,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1041763573884964,
"step": 6720,
"valid_targets_mean": 8273.8,
"valid_targets_min": 1581
},
{
"epoch": 3.967551622418879,
"grad_norm": 0.16521714927339842,
"learning_rate": 4.980303833992073e-06,
"loss": 0.3486,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1275613158941269,
"step": 6725,
"valid_targets_mean": 10531.7,
"valid_targets_min": 2030
},
{
"epoch": 3.9705014749262535,
"grad_norm": 0.16816919039174055,
"learning_rate": 4.953136876274129e-06,
"loss": 0.3414,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10549589991569519,
"step": 6730,
"valid_targets_mean": 8572.2,
"valid_targets_min": 1302
},
{
"epoch": 3.9734513274336285,
"grad_norm": 0.16156063084133174,
"learning_rate": 4.9260337416831315e-06,
"loss": 0.3505,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12027633190155029,
"step": 6735,
"valid_targets_mean": 10365.0,
"valid_targets_min": 1880
},
{
"epoch": 3.976401179941003,
"grad_norm": 0.16418086724764425,
"learning_rate": 4.898994545180362e-06,
"loss": 0.3524,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.135321706533432,
"step": 6740,
"valid_targets_mean": 11930.6,
"valid_targets_min": 1431
},
{
"epoch": 3.9793510324483776,
"grad_norm": 0.16120879940989763,
"learning_rate": 4.872019401455914e-06,
"loss": 0.3457,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11530904471874237,
"step": 6745,
"valid_targets_mean": 10015.8,
"valid_targets_min": 1439
},
{
"epoch": 3.982300884955752,
"grad_norm": 0.16461230557595902,
"learning_rate": 4.845108424928187e-06,
"loss": 0.3457,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12305441498756409,
"step": 6750,
"valid_targets_mean": 10110.8,
"valid_targets_min": 2130
},
{
"epoch": 3.9852507374631267,
"grad_norm": 0.16618178125583494,
"learning_rate": 4.8182617297434074e-06,
"loss": 0.3492,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11000995337963104,
"step": 6755,
"valid_targets_mean": 9938.6,
"valid_targets_min": 1395
},
{
"epoch": 3.9882005899705013,
"grad_norm": 0.17046042797200478,
"learning_rate": 4.791479429775147e-06,
"loss": 0.3555,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14216330647468567,
"step": 6760,
"valid_targets_mean": 11508.6,
"valid_targets_min": 1832
},
{
"epoch": 3.991150442477876,
"grad_norm": 0.1518400194788491,
"learning_rate": 4.764761638623836e-06,
"loss": 0.3439,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10530564188957214,
"step": 6765,
"valid_targets_mean": 9993.5,
"valid_targets_min": 2294
},
{
"epoch": 3.994100294985251,
"grad_norm": 0.1665719804740287,
"learning_rate": 4.738108469616285e-06,
"loss": 0.3493,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1330103576183319,
"step": 6770,
"valid_targets_mean": 11300.2,
"valid_targets_min": 1578
},
{
"epoch": 3.9970501474926254,
"grad_norm": 0.163422115739297,
"learning_rate": 4.711520035805197e-06,
"loss": 0.3414,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11337786912918091,
"step": 6775,
"valid_targets_mean": 10239.3,
"valid_targets_min": 1636
},
{
"epoch": 4.0,
"grad_norm": 0.17143272673619384,
"learning_rate": 4.6849964499686925e-06,
"loss": 0.3446,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10329215228557587,
"step": 6780,
"valid_targets_mean": 9906.2,
"valid_targets_min": 1715
},
{
"epoch": 4.002949852507375,
"grad_norm": 0.16365821049173732,
"learning_rate": 4.65853782460985e-06,
"loss": 0.348,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09373873472213745,
"step": 6785,
"valid_targets_mean": 7547.9,
"valid_targets_min": 1398
},
{
"epoch": 4.005899705014749,
"grad_norm": 0.164443088571593,
"learning_rate": 4.632144271956169e-06,
"loss": 0.3509,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1149953305721283,
"step": 6790,
"valid_targets_mean": 9679.5,
"valid_targets_min": 2137
},
{
"epoch": 4.008849557522124,
"grad_norm": 0.16651425905881423,
"learning_rate": 4.6058159039591875e-06,
"loss": 0.3539,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10481321811676025,
"step": 6795,
"valid_targets_mean": 8938.5,
"valid_targets_min": 2170
},
{
"epoch": 4.011799410029498,
"grad_norm": 0.15841736021868594,
"learning_rate": 4.579552832293903e-06,
"loss": 0.3539,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1180085763335228,
"step": 6800,
"valid_targets_mean": 10395.2,
"valid_targets_min": 2412
},
{
"epoch": 4.014749262536873,
"grad_norm": 0.16169146415784627,
"learning_rate": 4.5533551683583935e-06,
"loss": 0.3558,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12989673018455505,
"step": 6805,
"valid_targets_mean": 10598.5,
"valid_targets_min": 1780
},
{
"epoch": 4.017699115044247,
"grad_norm": 0.1611965264717543,
"learning_rate": 4.527223023273275e-06,
"loss": 0.353,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12244442850351334,
"step": 6810,
"valid_targets_mean": 10495.7,
"valid_targets_min": 1490
},
{
"epoch": 4.020648967551622,
"grad_norm": 0.15473504780481703,
"learning_rate": 4.501156507881262e-06,
"loss": 0.3526,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1352512538433075,
"step": 6815,
"valid_targets_mean": 12575.5,
"valid_targets_min": 1549
},
{
"epoch": 4.023598820058997,
"grad_norm": 0.15054625331409213,
"learning_rate": 4.4751557327467145e-06,
"loss": 0.3559,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13213303685188293,
"step": 6820,
"valid_targets_mean": 11952.8,
"valid_targets_min": 1639
},
{
"epoch": 4.0265486725663715,
"grad_norm": 0.16572229917038309,
"learning_rate": 4.449220808155103e-06,
"loss": 0.3582,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11531409621238708,
"step": 6825,
"valid_targets_mean": 10646.2,
"valid_targets_min": 1310
},
{
"epoch": 4.0294985250737465,
"grad_norm": 0.15671781348401131,
"learning_rate": 4.42335184411264e-06,
"loss": 0.3572,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11736129224300385,
"step": 6830,
"valid_targets_mean": 10609.1,
"valid_targets_min": 1471
},
{
"epoch": 4.032448377581121,
"grad_norm": 0.14812414015958358,
"learning_rate": 4.3975489503457e-06,
"loss": 0.3496,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1351662576198578,
"step": 6835,
"valid_targets_mean": 12694.0,
"valid_targets_min": 1997
},
{
"epoch": 4.035398230088496,
"grad_norm": 0.1612795719679882,
"learning_rate": 4.371812236300468e-06,
"loss": 0.3581,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12117096781730652,
"step": 6840,
"valid_targets_mean": 10021.1,
"valid_targets_min": 1342
},
{
"epoch": 4.038348082595871,
"grad_norm": 0.16538082905966264,
"learning_rate": 4.346141811142368e-06,
"loss": 0.352,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12282433360815048,
"step": 6845,
"valid_targets_mean": 10509.8,
"valid_targets_min": 2085
},
{
"epoch": 4.041297935103245,
"grad_norm": 0.16131890977155694,
"learning_rate": 4.320537783755694e-06,
"loss": 0.3602,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11613143980503082,
"step": 6850,
"valid_targets_mean": 9730.3,
"valid_targets_min": 2631
},
{
"epoch": 4.04424778761062,
"grad_norm": 0.17654596470525524,
"learning_rate": 4.295000262743083e-06,
"loss": 0.3502,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10903732478618622,
"step": 6855,
"valid_targets_mean": 9231.4,
"valid_targets_min": 2422
},
{
"epoch": 4.047197640117994,
"grad_norm": 0.17150669044213787,
"learning_rate": 4.2695293564250815e-06,
"loss": 0.3545,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12391988188028336,
"step": 6860,
"valid_targets_mean": 9515.6,
"valid_targets_min": 1609
},
{
"epoch": 4.050147492625369,
"grad_norm": 0.15235581223553574,
"learning_rate": 4.244125172839684e-06,
"loss": 0.3496,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09287584573030472,
"step": 6865,
"valid_targets_mean": 9326.3,
"valid_targets_min": 1804
},
{
"epoch": 4.053097345132743,
"grad_norm": 0.14906974124510863,
"learning_rate": 4.21878781974186e-06,
"loss": 0.3508,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09931151568889618,
"step": 6870,
"valid_targets_mean": 8140.9,
"valid_targets_min": 1842
},
{
"epoch": 4.056047197640118,
"grad_norm": 0.16023146247364678,
"learning_rate": 4.193517404603142e-06,
"loss": 0.354,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10166919231414795,
"step": 6875,
"valid_targets_mean": 8372.6,
"valid_targets_min": 2308
},
{
"epoch": 4.058997050147493,
"grad_norm": 0.15800640221773357,
"learning_rate": 4.168314034611091e-06,
"loss": 0.3502,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12523864209651947,
"step": 6880,
"valid_targets_mean": 10681.7,
"valid_targets_min": 1131
},
{
"epoch": 4.061946902654867,
"grad_norm": 0.1654824330981487,
"learning_rate": 4.143177816668931e-06,
"loss": 0.3506,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12416894733905792,
"step": 6885,
"valid_targets_mean": 9500.6,
"valid_targets_min": 2254
},
{
"epoch": 4.064896755162242,
"grad_norm": 0.1656973469362214,
"learning_rate": 4.118108857395011e-06,
"loss": 0.3547,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12975981831550598,
"step": 6890,
"valid_targets_mean": 11167.9,
"valid_targets_min": 2228
},
{
"epoch": 4.067846607669616,
"grad_norm": 0.16228434232902877,
"learning_rate": 4.093107263122433e-06,
"loss": 0.3555,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12434341013431549,
"step": 6895,
"valid_targets_mean": 10814.7,
"valid_targets_min": 2296
},
{
"epoch": 4.070796460176991,
"grad_norm": 0.14909841844413213,
"learning_rate": 4.068173139898541e-06,
"loss": 0.3511,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.109537772834301,
"step": 6900,
"valid_targets_mean": 10893.3,
"valid_targets_min": 1884
},
{
"epoch": 4.073746312684365,
"grad_norm": 0.15803593887854933,
"learning_rate": 4.043306593484493e-06,
"loss": 0.3544,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11893521994352341,
"step": 6905,
"valid_targets_mean": 11079.8,
"valid_targets_min": 3070
},
{
"epoch": 4.07669616519174,
"grad_norm": 0.1614974693410678,
"learning_rate": 4.018507729354815e-06,
"loss": 0.3537,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09593460708856583,
"step": 6910,
"valid_targets_mean": 8570.8,
"valid_targets_min": 1983
},
{
"epoch": 4.079646017699115,
"grad_norm": 0.1606360032844375,
"learning_rate": 3.99377665269695e-06,
"loss": 0.3571,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14845268428325653,
"step": 6915,
"valid_targets_mean": 12068.4,
"valid_targets_min": 3185
},
{
"epoch": 4.0825958702064895,
"grad_norm": 0.14277977783783713,
"learning_rate": 3.969113468410813e-06,
"loss": 0.3532,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10441142320632935,
"step": 6920,
"valid_targets_mean": 11027.8,
"valid_targets_min": 2368
},
{
"epoch": 4.0855457227138645,
"grad_norm": 0.16483615071706414,
"learning_rate": 3.944518281108343e-06,
"loss": 0.351,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10914063453674316,
"step": 6925,
"valid_targets_mean": 9420.6,
"valid_targets_min": 1195
},
{
"epoch": 4.088495575221239,
"grad_norm": 0.16405075701609317,
"learning_rate": 3.919991195113062e-06,
"loss": 0.3583,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13144291937351227,
"step": 6930,
"valid_targets_mean": 10658.9,
"valid_targets_min": 1980
},
{
"epoch": 4.091445427728614,
"grad_norm": 0.15517719230540983,
"learning_rate": 3.895532314459631e-06,
"loss": 0.3581,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13165420293807983,
"step": 6935,
"valid_targets_mean": 11138.8,
"valid_targets_min": 2227
},
{
"epoch": 4.094395280235988,
"grad_norm": 0.15695515651139186,
"learning_rate": 3.87114174289341e-06,
"loss": 0.3568,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11405207216739655,
"step": 6940,
"valid_targets_mean": 9765.3,
"valid_targets_min": 1932
},
{
"epoch": 4.097345132743363,
"grad_norm": 0.17367930962714068,
"learning_rate": 3.846819583870025e-06,
"loss": 0.3563,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11271396279335022,
"step": 6945,
"valid_targets_mean": 9676.6,
"valid_targets_min": 1745
},
{
"epoch": 4.100294985250738,
"grad_norm": 0.17161773141660588,
"learning_rate": 3.822565940554912e-06,
"loss": 0.3593,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11096750199794769,
"step": 6950,
"valid_targets_mean": 10371.6,
"valid_targets_min": 1888
},
{
"epoch": 4.103244837758112,
"grad_norm": 0.16258274272264253,
"learning_rate": 3.7983809158228902e-06,
"loss": 0.3592,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11564739048480988,
"step": 6955,
"valid_targets_mean": 8439.3,
"valid_targets_min": 1277
},
{
"epoch": 4.106194690265487,
"grad_norm": 0.1693204121188279,
"learning_rate": 3.7742646122577297e-06,
"loss": 0.35,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1281132996082306,
"step": 6960,
"valid_targets_mean": 11040.0,
"valid_targets_min": 2677
},
{
"epoch": 4.109144542772861,
"grad_norm": 0.151024673086712,
"learning_rate": 3.7502171321517057e-06,
"loss": 0.3518,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09777649492025375,
"step": 6965,
"valid_targets_mean": 8500.1,
"valid_targets_min": 2033
},
{
"epoch": 4.112094395280236,
"grad_norm": 0.18444964223806018,
"learning_rate": 3.7262385775051722e-06,
"loss": 0.3534,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11289547383785248,
"step": 6970,
"valid_targets_mean": 9576.9,
"valid_targets_min": 969
},
{
"epoch": 4.115044247787611,
"grad_norm": 0.1614686465505653,
"learning_rate": 3.702329050026132e-06,
"loss": 0.3508,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11157312244176865,
"step": 6975,
"valid_targets_mean": 8877.5,
"valid_targets_min": 1814
},
{
"epoch": 4.117994100294985,
"grad_norm": 0.17523462686891175,
"learning_rate": 3.6784886511297947e-06,
"loss": 0.3516,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12200837582349777,
"step": 6980,
"valid_targets_mean": 9325.3,
"valid_targets_min": 1594
},
{
"epoch": 4.12094395280236,
"grad_norm": 0.1631631704226555,
"learning_rate": 3.654717481938148e-06,
"loss": 0.3536,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10229149460792542,
"step": 6985,
"valid_targets_mean": 9552.2,
"valid_targets_min": 1684
},
{
"epoch": 4.123893805309734,
"grad_norm": 0.15629991294424075,
"learning_rate": 3.631015643279556e-06,
"loss": 0.3518,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10814925283193588,
"step": 6990,
"valid_targets_mean": 8981.8,
"valid_targets_min": 1527
},
{
"epoch": 4.126843657817109,
"grad_norm": 0.17070790018436796,
"learning_rate": 3.6073832356882734e-06,
"loss": 0.3518,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1253635287284851,
"step": 6995,
"valid_targets_mean": 10686.9,
"valid_targets_min": 2034
},
{
"epoch": 4.129793510324483,
"grad_norm": 0.16450992652358207,
"learning_rate": 3.5838203594040933e-06,
"loss": 0.3579,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1320553421974182,
"step": 7000,
"valid_targets_mean": 10600.8,
"valid_targets_min": 489
},
{
"epoch": 4.132743362831858,
"grad_norm": 0.15081212631556418,
"learning_rate": 3.560327114371842e-06,
"loss": 0.3504,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11111602932214737,
"step": 7005,
"valid_targets_mean": 9837.0,
"valid_targets_min": 2066
},
{
"epoch": 4.135693215339233,
"grad_norm": 0.14274429369209427,
"learning_rate": 3.536903600241033e-06,
"loss": 0.3528,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11591881513595581,
"step": 7010,
"valid_targets_mean": 11523.9,
"valid_targets_min": 2625
},
{
"epoch": 4.1386430678466075,
"grad_norm": 0.15333519477139126,
"learning_rate": 3.5135499163653885e-06,
"loss": 0.353,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12132668495178223,
"step": 7015,
"valid_targets_mean": 11195.9,
"valid_targets_min": 3507
},
{
"epoch": 4.1415929203539825,
"grad_norm": 0.16346855146116562,
"learning_rate": 3.4902661618024356e-06,
"loss": 0.3543,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12647776305675507,
"step": 7020,
"valid_targets_mean": 9740.0,
"valid_targets_min": 1768
},
{
"epoch": 4.144542772861357,
"grad_norm": 0.15472435020929068,
"learning_rate": 3.467052435313105e-06,
"loss": 0.3598,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0965496152639389,
"step": 7025,
"valid_targets_mean": 8208.5,
"valid_targets_min": 1597
},
{
"epoch": 4.147492625368732,
"grad_norm": 0.1565591225922802,
"learning_rate": 3.443908835361267e-06,
"loss": 0.3583,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12220700830221176,
"step": 7030,
"valid_targets_mean": 10105.2,
"valid_targets_min": 1622
},
{
"epoch": 4.150442477876107,
"grad_norm": 0.16216119191777653,
"learning_rate": 3.4208354601133764e-06,
"loss": 0.3512,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10918645560741425,
"step": 7035,
"valid_targets_mean": 8631.7,
"valid_targets_min": 1531
},
{
"epoch": 4.153392330383481,
"grad_norm": 0.15150502470187602,
"learning_rate": 3.3978324074379777e-06,
"loss": 0.3546,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1369277685880661,
"step": 7040,
"valid_targets_mean": 12891.5,
"valid_targets_min": 2405
},
{
"epoch": 4.156342182890856,
"grad_norm": 0.15950154019979157,
"learning_rate": 3.3748997749053824e-06,
"loss": 0.3532,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11721132695674896,
"step": 7045,
"valid_targets_mean": 9850.0,
"valid_targets_min": 1924
},
{
"epoch": 4.15929203539823,
"grad_norm": 0.15273820356160808,
"learning_rate": 3.3520376597871572e-06,
"loss": 0.352,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12347143888473511,
"step": 7050,
"valid_targets_mean": 11106.8,
"valid_targets_min": 1673
},
{
"epoch": 4.162241887905605,
"grad_norm": 0.15376128423998026,
"learning_rate": 3.3292461590558056e-06,
"loss": 0.3585,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1032019555568695,
"step": 7055,
"valid_targets_mean": 8959.6,
"valid_targets_min": 457
},
{
"epoch": 4.165191740412979,
"grad_norm": 0.15639978630694426,
"learning_rate": 3.3065253693842815e-06,
"loss": 0.3482,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10558753460645676,
"step": 7060,
"valid_targets_mean": 8709.6,
"valid_targets_min": 2292
},
{
"epoch": 4.168141592920354,
"grad_norm": 0.1608503151554277,
"learning_rate": 3.2838753871456187e-06,
"loss": 0.3544,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11058098077774048,
"step": 7065,
"valid_targets_mean": 9885.4,
"valid_targets_min": 1487
},
{
"epoch": 4.171091445427729,
"grad_norm": 0.16021384382226492,
"learning_rate": 3.2612963084125116e-06,
"loss": 0.3576,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12647023797035217,
"step": 7070,
"valid_targets_mean": 10233.0,
"valid_targets_min": 1671
},
{
"epoch": 4.174041297935103,
"grad_norm": 0.1591375323482639,
"learning_rate": 3.238788228956913e-06,
"loss": 0.3604,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09633976966142654,
"step": 7075,
"valid_targets_mean": 8591.2,
"valid_targets_min": 1590
},
{
"epoch": 4.176991150442478,
"grad_norm": 0.16074130498635006,
"learning_rate": 3.216351244249616e-06,
"loss": 0.3519,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11467361450195312,
"step": 7080,
"valid_targets_mean": 10684.5,
"valid_targets_min": 1611
},
{
"epoch": 4.179941002949852,
"grad_norm": 0.153650155824368,
"learning_rate": 3.193985449459858e-06,
"loss": 0.3526,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11654568463563919,
"step": 7085,
"valid_targets_mean": 10672.2,
"valid_targets_min": 1664
},
{
"epoch": 4.182890855457227,
"grad_norm": 0.15872416144427312,
"learning_rate": 3.17169093945493e-06,
"loss": 0.3532,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09964530169963837,
"step": 7090,
"valid_targets_mean": 9493.7,
"valid_targets_min": 1927
},
{
"epoch": 4.185840707964601,
"grad_norm": 0.16000582646104505,
"learning_rate": 3.149467808799729e-06,
"loss": 0.3549,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12831947207450867,
"step": 7095,
"valid_targets_mean": 10516.8,
"valid_targets_min": 1508
},
{
"epoch": 4.188790560471976,
"grad_norm": 0.14935677128155156,
"learning_rate": 3.127316151756421e-06,
"loss": 0.353,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14910808205604553,
"step": 7100,
"valid_targets_mean": 13157.5,
"valid_targets_min": 2815
},
{
"epoch": 4.191740412979351,
"grad_norm": 0.15483681811534517,
"learning_rate": 3.1052360622839895e-06,
"loss": 0.3554,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12956783175468445,
"step": 7105,
"valid_targets_mean": 11703.2,
"valid_targets_min": 1570
},
{
"epoch": 4.1946902654867255,
"grad_norm": 0.14466320946338967,
"learning_rate": 3.0832276340378573e-06,
"loss": 0.363,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13992691040039062,
"step": 7110,
"valid_targets_mean": 12907.7,
"valid_targets_min": 1243
},
{
"epoch": 4.1976401179941005,
"grad_norm": 0.157117658276334,
"learning_rate": 3.061290960369492e-06,
"loss": 0.3545,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13075107336044312,
"step": 7115,
"valid_targets_mean": 10809.4,
"valid_targets_min": 1625
},
{
"epoch": 4.200589970501475,
"grad_norm": 0.16367009287077325,
"learning_rate": 3.0394261343259978e-06,
"loss": 0.3533,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11082293093204498,
"step": 7120,
"valid_targets_mean": 9769.5,
"valid_targets_min": 2194
},
{
"epoch": 4.20353982300885,
"grad_norm": 0.161926795541957,
"learning_rate": 3.017633248649736e-06,
"loss": 0.3598,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13230161368846893,
"step": 7125,
"valid_targets_mean": 10109.1,
"valid_targets_min": 1969
},
{
"epoch": 4.206489675516224,
"grad_norm": 0.1477163900435012,
"learning_rate": 2.9959123957779203e-06,
"loss": 0.3479,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12325777858495712,
"step": 7130,
"valid_targets_mean": 11069.5,
"valid_targets_min": 2258
},
{
"epoch": 4.209439528023599,
"grad_norm": 0.15506843168361162,
"learning_rate": 2.9742636678422253e-06,
"loss": 0.3543,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11096407473087311,
"step": 7135,
"valid_targets_mean": 9698.0,
"valid_targets_min": 2368
},
{
"epoch": 4.212389380530974,
"grad_norm": 0.16109254954313149,
"learning_rate": 2.952687156668408e-06,
"loss": 0.3529,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11004975438117981,
"step": 7140,
"valid_targets_mean": 9400.0,
"valid_targets_min": 1805
},
{
"epoch": 4.215339233038348,
"grad_norm": 0.14890135216272918,
"learning_rate": 2.931182953775895e-06,
"loss": 0.3534,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10987749695777893,
"step": 7145,
"valid_targets_mean": 11538.3,
"valid_targets_min": 2481
},
{
"epoch": 4.218289085545723,
"grad_norm": 0.15280391232069168,
"learning_rate": 2.909751150377429e-06,
"loss": 0.3518,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11714964359998703,
"step": 7150,
"valid_targets_mean": 10323.9,
"valid_targets_min": 1960
},
{
"epoch": 4.221238938053097,
"grad_norm": 0.1603710398345934,
"learning_rate": 2.888391837378641e-06,
"loss": 0.353,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13210344314575195,
"step": 7155,
"valid_targets_mean": 10748.8,
"valid_targets_min": 1490
},
{
"epoch": 4.224188790560472,
"grad_norm": 0.14641270144989635,
"learning_rate": 2.8671051053776944e-06,
"loss": 0.3561,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11850255727767944,
"step": 7160,
"valid_targets_mean": 11708.2,
"valid_targets_min": 2442
},
{
"epoch": 4.227138643067847,
"grad_norm": 0.16286550427689112,
"learning_rate": 2.8458910446648923e-06,
"loss": 0.3555,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11870785057544708,
"step": 7165,
"valid_targets_mean": 8852.9,
"valid_targets_min": 216
},
{
"epoch": 4.230088495575221,
"grad_norm": 0.1556260555961893,
"learning_rate": 2.8247497452222883e-06,
"loss": 0.3578,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11046218127012253,
"step": 7170,
"valid_targets_mean": 9240.8,
"valid_targets_min": 1875
},
{
"epoch": 4.233038348082596,
"grad_norm": 0.1586469227537557,
"learning_rate": 2.803681296723313e-06,
"loss": 0.3545,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10672442615032196,
"step": 7175,
"valid_targets_mean": 8434.4,
"valid_targets_min": 1529
},
{
"epoch": 4.23598820058997,
"grad_norm": 0.15901563453616538,
"learning_rate": 2.7826857885323934e-06,
"loss": 0.3611,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10011562705039978,
"step": 7180,
"valid_targets_mean": 8519.2,
"valid_targets_min": 1630
},
{
"epoch": 4.238938053097345,
"grad_norm": 0.15867627879458304,
"learning_rate": 2.761763309704568e-06,
"loss": 0.3537,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11282973736524582,
"step": 7185,
"valid_targets_mean": 9477.0,
"valid_targets_min": 1957
},
{
"epoch": 4.241887905604719,
"grad_norm": 0.15255571081123262,
"learning_rate": 2.7409139489851066e-06,
"loss": 0.3559,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12214551120996475,
"step": 7190,
"valid_targets_mean": 10635.3,
"valid_targets_min": 2955
},
{
"epoch": 4.244837758112094,
"grad_norm": 0.15171028129243372,
"learning_rate": 2.7201377948091614e-06,
"loss": 0.3504,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11917664855718613,
"step": 7195,
"valid_targets_mean": 11111.0,
"valid_targets_min": 2898
},
{
"epoch": 4.247787610619469,
"grad_norm": 0.15175919291626522,
"learning_rate": 2.699434935301335e-06,
"loss": 0.3516,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1180785596370697,
"step": 7200,
"valid_targets_mean": 10576.7,
"valid_targets_min": 2780
},
{
"epoch": 4.2507374631268435,
"grad_norm": 0.16419494179861108,
"learning_rate": 2.67880545827538e-06,
"loss": 0.3629,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14159059524536133,
"step": 7205,
"valid_targets_mean": 12024.1,
"valid_targets_min": 2727
},
{
"epoch": 4.2536873156342185,
"grad_norm": 0.15479354424867625,
"learning_rate": 2.65824945123375e-06,
"loss": 0.3649,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11950947344303131,
"step": 7210,
"valid_targets_mean": 9545.0,
"valid_targets_min": 1882
},
{
"epoch": 4.256637168141593,
"grad_norm": 0.16371358786704585,
"learning_rate": 2.6377670013672998e-06,
"loss": 0.3678,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10644177347421646,
"step": 7215,
"valid_targets_mean": 8259.6,
"valid_targets_min": 1045
},
{
"epoch": 4.259587020648968,
"grad_norm": 0.15805330816406019,
"learning_rate": 2.6173581955548644e-06,
"loss": 0.3647,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12316429615020752,
"step": 7220,
"valid_targets_mean": 10127.1,
"valid_targets_min": 1797
},
{
"epoch": 4.262536873156342,
"grad_norm": 0.1595140145705862,
"learning_rate": 2.597023120362907e-06,
"loss": 0.368,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11776896566152573,
"step": 7225,
"valid_targets_mean": 8850.4,
"valid_targets_min": 1524
},
{
"epoch": 4.265486725663717,
"grad_norm": 0.15507688803698258,
"learning_rate": 2.576761862045174e-06,
"loss": 0.3685,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09920550137758255,
"step": 7230,
"valid_targets_mean": 8547.2,
"valid_targets_min": 1657
},
{
"epoch": 4.268436578171092,
"grad_norm": 0.1613867067717064,
"learning_rate": 2.5565745065422733e-06,
"loss": 0.362,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10289187729358673,
"step": 7235,
"valid_targets_mean": 7498.9,
"valid_targets_min": 2006
},
{
"epoch": 4.271386430678466,
"grad_norm": 0.15493360164306041,
"learning_rate": 2.536461139481383e-06,
"loss": 0.3666,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1283939778804779,
"step": 7240,
"valid_targets_mean": 10987.5,
"valid_targets_min": 2508
},
{
"epoch": 4.274336283185841,
"grad_norm": 0.14748392784313846,
"learning_rate": 2.516421846175814e-06,
"loss": 0.3698,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11385820806026459,
"step": 7245,
"valid_targets_mean": 10292.0,
"valid_targets_min": 2280
},
{
"epoch": 4.277286135693215,
"grad_norm": 0.1479679407796802,
"learning_rate": 2.4964567116247172e-06,
"loss": 0.3674,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12190468609333038,
"step": 7250,
"valid_targets_mean": 10601.8,
"valid_targets_min": 1396
},
{
"epoch": 4.28023598820059,
"grad_norm": 0.15897034975450886,
"learning_rate": 2.476565820512664e-06,
"loss": 0.3618,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13549286127090454,
"step": 7255,
"valid_targets_mean": 9942.6,
"valid_targets_min": 2133
},
{
"epoch": 4.283185840707965,
"grad_norm": 0.1540025059352752,
"learning_rate": 2.4567492572093298e-06,
"loss": 0.3704,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1373451054096222,
"step": 7260,
"valid_targets_mean": 9759.4,
"valid_targets_min": 1581
},
{
"epoch": 4.286135693215339,
"grad_norm": 0.14967079433299837,
"learning_rate": 2.4370071057691135e-06,
"loss": 0.3646,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13896623253822327,
"step": 7265,
"valid_targets_mean": 10620.5,
"valid_targets_min": 1461
},
{
"epoch": 4.289085545722714,
"grad_norm": 0.1635262716112185,
"learning_rate": 2.4173394499307846e-06,
"loss": 0.3727,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11073658615350723,
"step": 7270,
"valid_targets_mean": 8787.5,
"valid_targets_min": 2197
},
{
"epoch": 4.292035398230088,
"grad_norm": 0.15662348738576132,
"learning_rate": 2.3977463731171336e-06,
"loss": 0.3686,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10898212343454361,
"step": 7275,
"valid_targets_mean": 9077.8,
"valid_targets_min": 2800
},
{
"epoch": 4.294985250737463,
"grad_norm": 0.15856289750370217,
"learning_rate": 2.378227958434616e-06,
"loss": 0.3665,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12312222272157669,
"step": 7280,
"valid_targets_mean": 9941.8,
"valid_targets_min": 2260
},
{
"epoch": 4.297935103244837,
"grad_norm": 0.14811468463044616,
"learning_rate": 2.3587842886729905e-06,
"loss": 0.37,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12280742079019547,
"step": 7285,
"valid_targets_mean": 10138.6,
"valid_targets_min": 1655
},
{
"epoch": 4.300884955752212,
"grad_norm": 0.15642409319377618,
"learning_rate": 2.3394154463049847e-06,
"loss": 0.361,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13053852319717407,
"step": 7290,
"valid_targets_mean": 9809.2,
"valid_targets_min": 1817
},
{
"epoch": 4.303834808259587,
"grad_norm": 0.15905712907842334,
"learning_rate": 2.3201215134859424e-06,
"loss": 0.3703,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14553436636924744,
"step": 7295,
"valid_targets_mean": 11053.2,
"valid_targets_min": 1891
},
{
"epoch": 4.3067846607669615,
"grad_norm": 0.15633498376543936,
"learning_rate": 2.300902572053445e-06,
"loss": 0.3599,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1423797309398651,
"step": 7300,
"valid_targets_mean": 10950.2,
"valid_targets_min": 2265
},
{
"epoch": 4.3097345132743365,
"grad_norm": 0.15432556400228098,
"learning_rate": 2.281758703527015e-06,
"loss": 0.3669,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11870302259922028,
"step": 7305,
"valid_targets_mean": 9727.5,
"valid_targets_min": 1294
},
{
"epoch": 4.312684365781711,
"grad_norm": 0.14855891542283822,
"learning_rate": 2.2626899891077337e-06,
"loss": 0.3693,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1254224181175232,
"step": 7310,
"valid_targets_mean": 10823.4,
"valid_targets_min": 2542
},
{
"epoch": 4.315634218289086,
"grad_norm": 0.1481578289958286,
"learning_rate": 2.243696509677904e-06,
"loss": 0.365,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12209489196538925,
"step": 7315,
"valid_targets_mean": 10381.6,
"valid_targets_min": 1504
},
{
"epoch": 4.31858407079646,
"grad_norm": 0.154762941329994,
"learning_rate": 2.2247783458007133e-06,
"loss": 0.3634,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14160534739494324,
"step": 7320,
"valid_targets_mean": 10812.6,
"valid_targets_min": 1055
},
{
"epoch": 4.321533923303835,
"grad_norm": 0.15270881348781443,
"learning_rate": 2.2059355777198888e-06,
"loss": 0.3686,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11081090569496155,
"step": 7325,
"valid_targets_mean": 9040.8,
"valid_targets_min": 1130
},
{
"epoch": 4.32448377581121,
"grad_norm": 0.1548144163105394,
"learning_rate": 2.1871682853593555e-06,
"loss": 0.3647,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10774673521518707,
"step": 7330,
"valid_targets_mean": 9655.9,
"valid_targets_min": 1410
},
{
"epoch": 4.327433628318584,
"grad_norm": 0.1504121646183315,
"learning_rate": 2.1684765483228997e-06,
"loss": 0.3646,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10418853163719177,
"step": 7335,
"valid_targets_mean": 8905.6,
"valid_targets_min": 1830
},
{
"epoch": 4.330383480825959,
"grad_norm": 0.14775000972766456,
"learning_rate": 2.1498604458938344e-06,
"loss": 0.3655,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11074630171060562,
"step": 7340,
"valid_targets_mean": 9882.5,
"valid_targets_min": 2408
},
{
"epoch": 4.333333333333333,
"grad_norm": 0.15125604827288272,
"learning_rate": 2.1313200570346513e-06,
"loss": 0.3665,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1144319623708725,
"step": 7345,
"valid_targets_mean": 9463.4,
"valid_targets_min": 1659
},
{
"epoch": 4.336283185840708,
"grad_norm": 0.15304017102252931,
"learning_rate": 2.112855460386698e-06,
"loss": 0.368,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.111595019698143,
"step": 7350,
"valid_targets_mean": 11038.2,
"valid_targets_min": 1531
},
{
"epoch": 4.339233038348082,
"grad_norm": 0.15292973670461382,
"learning_rate": 2.094466734269849e-06,
"loss": 0.3639,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12869225442409515,
"step": 7355,
"valid_targets_mean": 10074.7,
"valid_targets_min": 2085
},
{
"epoch": 4.342182890855457,
"grad_norm": 0.14270513753434333,
"learning_rate": 2.076153956682139e-06,
"loss": 0.3685,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10554344952106476,
"step": 7360,
"valid_targets_mean": 10108.6,
"valid_targets_min": 1642
},
{
"epoch": 4.345132743362832,
"grad_norm": 0.15014445897583023,
"learning_rate": 2.057917205299489e-06,
"loss": 0.3686,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12004509568214417,
"step": 7365,
"valid_targets_mean": 9673.6,
"valid_targets_min": 997
},
{
"epoch": 4.348082595870206,
"grad_norm": 0.1576340334574788,
"learning_rate": 2.0397565574753255e-06,
"loss": 0.3653,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10483772307634354,
"step": 7370,
"valid_targets_mean": 8708.4,
"valid_targets_min": 1573
},
{
"epoch": 4.351032448377581,
"grad_norm": 0.148042243945791,
"learning_rate": 2.0216720902402764e-06,
"loss": 0.3681,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13991913199424744,
"step": 7375,
"valid_targets_mean": 12304.2,
"valid_targets_min": 1814
},
{
"epoch": 4.353982300884955,
"grad_norm": 0.16331630126439883,
"learning_rate": 2.0036638803018425e-06,
"loss": 0.3716,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12212497740983963,
"step": 7380,
"valid_targets_mean": 11132.8,
"valid_targets_min": 1200
},
{
"epoch": 4.35693215339233,
"grad_norm": 0.15437374905079762,
"learning_rate": 1.98573200404407e-06,
"loss": 0.3732,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13012322783470154,
"step": 7385,
"valid_targets_mean": 10237.6,
"valid_targets_min": 950
},
{
"epoch": 4.359882005899705,
"grad_norm": 0.15337072869070487,
"learning_rate": 1.9678765375272223e-06,
"loss": 0.3672,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10758992284536362,
"step": 7390,
"valid_targets_mean": 10417.7,
"valid_targets_min": 2034
},
{
"epoch": 4.3628318584070795,
"grad_norm": 0.14886015288265325,
"learning_rate": 1.9500975564874626e-06,
"loss": 0.3583,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12389254570007324,
"step": 7395,
"valid_targets_mean": 11726.6,
"valid_targets_min": 1312
},
{
"epoch": 4.3657817109144545,
"grad_norm": 0.1529975346049962,
"learning_rate": 1.9323951363365423e-06,
"loss": 0.3643,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1035454124212265,
"step": 7400,
"valid_targets_mean": 8954.2,
"valid_targets_min": 1876
},
{
"epoch": 4.368731563421829,
"grad_norm": 0.16267312185022692,
"learning_rate": 1.9147693521614475e-06,
"loss": 0.3684,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1419374942779541,
"step": 7405,
"valid_targets_mean": 10257.4,
"valid_targets_min": 2939
},
{
"epoch": 4.371681415929204,
"grad_norm": 0.15661576832988683,
"learning_rate": 1.8972202787241345e-06,
"loss": 0.3634,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11530675739049911,
"step": 7410,
"valid_targets_mean": 9281.1,
"valid_targets_min": 2123
},
{
"epoch": 4.374631268436578,
"grad_norm": 0.16089922557143402,
"learning_rate": 1.8797479904611448e-06,
"loss": 0.3638,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1313277781009674,
"step": 7415,
"valid_targets_mean": 9339.8,
"valid_targets_min": 2558
},
{
"epoch": 4.377581120943953,
"grad_norm": 0.1719192971303852,
"learning_rate": 1.8623525614833582e-06,
"loss": 0.3668,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1218654215335846,
"step": 7420,
"valid_targets_mean": 9360.2,
"valid_targets_min": 2415
},
{
"epoch": 4.380530973451328,
"grad_norm": 0.1661511961649541,
"learning_rate": 1.8450340655756304e-06,
"loss": 0.3632,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11054585874080658,
"step": 7425,
"valid_targets_mean": 8395.6,
"valid_targets_min": 1630
},
{
"epoch": 4.383480825958702,
"grad_norm": 0.15705768164396808,
"learning_rate": 1.8277925761964965e-06,
"loss": 0.3589,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14034216105937958,
"step": 7430,
"valid_targets_mean": 12708.2,
"valid_targets_min": 3373
},
{
"epoch": 4.386430678466077,
"grad_norm": 0.14410972407670963,
"learning_rate": 1.8106281664778701e-06,
"loss": 0.3565,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1108931228518486,
"step": 7435,
"valid_targets_mean": 11102.9,
"valid_targets_min": 2383
},
{
"epoch": 4.389380530973451,
"grad_norm": 0.1585707239081277,
"learning_rate": 1.7935409092247002e-06,
"loss": 0.3662,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11846847832202911,
"step": 7440,
"valid_targets_mean": 9429.2,
"valid_targets_min": 1243
},
{
"epoch": 4.392330383480826,
"grad_norm": 0.15606287790344534,
"learning_rate": 1.7765308769147105e-06,
"loss": 0.3626,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13980810344219208,
"step": 7445,
"valid_targets_mean": 12589.8,
"valid_targets_min": 1293
},
{
"epoch": 4.395280235988201,
"grad_norm": 0.14761791334704993,
"learning_rate": 1.75959814169804e-06,
"loss": 0.3622,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11588216572999954,
"step": 7450,
"valid_targets_mean": 9731.8,
"valid_targets_min": 1129
},
{
"epoch": 4.398230088495575,
"grad_norm": 0.1523426665062693,
"learning_rate": 1.7427427753969884e-06,
"loss": 0.3609,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09459323436021805,
"step": 7455,
"valid_targets_mean": 8218.8,
"valid_targets_min": 595
},
{
"epoch": 4.40117994100295,
"grad_norm": 0.15717516506454268,
"learning_rate": 1.7259648495056568e-06,
"loss": 0.3659,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1137595921754837,
"step": 7460,
"valid_targets_mean": 9081.4,
"valid_targets_min": 888
},
{
"epoch": 4.404129793510324,
"grad_norm": 0.14821901334735668,
"learning_rate": 1.709264435189699e-06,
"loss": 0.3596,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12101010233163834,
"step": 7465,
"valid_targets_mean": 10127.8,
"valid_targets_min": 1547
},
{
"epoch": 4.407079646017699,
"grad_norm": 0.14856901343181347,
"learning_rate": 1.6926416032859826e-06,
"loss": 0.362,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11522223055362701,
"step": 7470,
"valid_targets_mean": 9777.3,
"valid_targets_min": 1666
},
{
"epoch": 4.410029498525073,
"grad_norm": 0.14887002814263378,
"learning_rate": 1.676096424302298e-06,
"loss": 0.3626,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10992522537708282,
"step": 7475,
"valid_targets_mean": 8813.1,
"valid_targets_min": 2184
},
{
"epoch": 4.412979351032448,
"grad_norm": 0.15536381393469378,
"learning_rate": 1.6596289684170642e-06,
"loss": 0.3683,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11852423846721649,
"step": 7480,
"valid_targets_mean": 9679.6,
"valid_targets_min": 2445
},
{
"epoch": 4.415929203539823,
"grad_norm": 0.14499491945938592,
"learning_rate": 1.6432393054790274e-06,
"loss": 0.3668,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11371295899152756,
"step": 7485,
"valid_targets_mean": 10510.3,
"valid_targets_min": 1998
},
{
"epoch": 4.4188790560471976,
"grad_norm": 0.1610486095581393,
"learning_rate": 1.6269275050069677e-06,
"loss": 0.3527,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1595916897058487,
"step": 7490,
"valid_targets_mean": 12465.5,
"valid_targets_min": 1710
},
{
"epoch": 4.421828908554573,
"grad_norm": 0.16414754925895014,
"learning_rate": 1.6106936361893977e-06,
"loss": 0.3448,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13262584805488586,
"step": 7495,
"valid_targets_mean": 10231.8,
"valid_targets_min": 2259
},
{
"epoch": 4.424778761061947,
"grad_norm": 0.15688636504001732,
"learning_rate": 1.5945377678842766e-06,
"loss": 0.3494,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13062500953674316,
"step": 7500,
"valid_targets_mean": 13320.7,
"valid_targets_min": 1376
},
{
"epoch": 4.427728613569322,
"grad_norm": 0.150362961681588,
"learning_rate": 1.5784599686187085e-06,
"loss": 0.3412,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09411562979221344,
"step": 7505,
"valid_targets_mean": 8426.0,
"valid_targets_min": 1654
},
{
"epoch": 4.430678466076696,
"grad_norm": 0.16055863518167604,
"learning_rate": 1.5624603065886734e-06,
"loss": 0.3452,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10464043915271759,
"step": 7510,
"valid_targets_mean": 8610.3,
"valid_targets_min": 2335
},
{
"epoch": 4.433628318584071,
"grad_norm": 0.15928012971833783,
"learning_rate": 1.5465388496587053e-06,
"loss": 0.3457,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11390765011310577,
"step": 7515,
"valid_targets_mean": 9733.9,
"valid_targets_min": 2604
},
{
"epoch": 4.436578171091446,
"grad_norm": 0.15983062111463275,
"learning_rate": 1.53069566536163e-06,
"loss": 0.3426,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09258467704057693,
"step": 7520,
"valid_targets_mean": 7887.3,
"valid_targets_min": 961
},
{
"epoch": 4.43952802359882,
"grad_norm": 0.1480222383713337,
"learning_rate": 1.5149308208982726e-06,
"loss": 0.348,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1298375427722931,
"step": 7525,
"valid_targets_mean": 12008.4,
"valid_targets_min": 3631
},
{
"epoch": 4.442477876106195,
"grad_norm": 0.1528172900821816,
"learning_rate": 1.4992443831371596e-06,
"loss": 0.3543,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12460409104824066,
"step": 7530,
"valid_targets_mean": 11155.2,
"valid_targets_min": 2731
},
{
"epoch": 4.445427728613569,
"grad_norm": 0.15414750220527093,
"learning_rate": 1.4836364186142582e-06,
"loss": 0.3428,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11743897199630737,
"step": 7535,
"valid_targets_mean": 10674.4,
"valid_targets_min": 1317
},
{
"epoch": 4.448377581120944,
"grad_norm": 0.15382813152212646,
"learning_rate": 1.468106993532674e-06,
"loss": 0.3451,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13689687848091125,
"step": 7540,
"valid_targets_mean": 11136.4,
"valid_targets_min": 1890
},
{
"epoch": 4.451327433628318,
"grad_norm": 0.15966041725784386,
"learning_rate": 1.4526561737623811e-06,
"loss": 0.347,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14471429586410522,
"step": 7545,
"valid_targets_mean": 12538.8,
"valid_targets_min": 1856
},
{
"epoch": 4.454277286135693,
"grad_norm": 0.15405263130677785,
"learning_rate": 1.4372840248399378e-06,
"loss": 0.3552,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1332360804080963,
"step": 7550,
"valid_targets_mean": 11351.3,
"valid_targets_min": 1738
},
{
"epoch": 4.457227138643068,
"grad_norm": 0.1454681616170232,
"learning_rate": 1.421990611968207e-06,
"loss": 0.348,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09641964733600616,
"step": 7555,
"valid_targets_mean": 9638.6,
"valid_targets_min": 2769
},
{
"epoch": 4.460176991150442,
"grad_norm": 0.15619107717952554,
"learning_rate": 1.4067760000160968e-06,
"loss": 0.3464,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11662718653678894,
"step": 7560,
"valid_targets_mean": 10217.3,
"valid_targets_min": 1867
},
{
"epoch": 4.463126843657817,
"grad_norm": 0.1643135977247633,
"learning_rate": 1.3916402535182494e-06,
"loss": 0.3437,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1154789924621582,
"step": 7565,
"valid_targets_mean": 10830.1,
"valid_targets_min": 2056
},
{
"epoch": 4.466076696165191,
"grad_norm": 0.15658719880104097,
"learning_rate": 1.37658343667481e-06,
"loss": 0.3419,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09098144620656967,
"step": 7570,
"valid_targets_mean": 8065.7,
"valid_targets_min": 2250
},
{
"epoch": 4.469026548672566,
"grad_norm": 0.15305545076889765,
"learning_rate": 1.3616056133511245e-06,
"loss": 0.3485,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10880333185195923,
"step": 7575,
"valid_targets_mean": 10655.2,
"valid_targets_min": 2555
},
{
"epoch": 4.4719764011799406,
"grad_norm": 0.15316371686221492,
"learning_rate": 1.346706847077477e-06,
"loss": 0.3448,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12371876835823059,
"step": 7580,
"valid_targets_mean": 11071.5,
"valid_targets_min": 860
},
{
"epoch": 4.474926253687316,
"grad_norm": 0.17027456090998858,
"learning_rate": 1.3318872010488227e-06,
"loss": 0.3398,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13155479729175568,
"step": 7585,
"valid_targets_mean": 11408.9,
"valid_targets_min": 2015
},
{
"epoch": 4.477876106194691,
"grad_norm": 0.15247149515898822,
"learning_rate": 1.3171467381245217e-06,
"loss": 0.3479,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09567923843860626,
"step": 7590,
"valid_targets_mean": 9568.1,
"valid_targets_min": 1913
},
{
"epoch": 4.480825958702065,
"grad_norm": 0.1606651379781345,
"learning_rate": 1.3024855208280628e-06,
"loss": 0.3492,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10479949414730072,
"step": 7595,
"valid_targets_mean": 9056.0,
"valid_targets_min": 1585
},
{
"epoch": 4.48377581120944,
"grad_norm": 0.1511496049987001,
"learning_rate": 1.2879036113468103e-06,
"loss": 0.3445,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1336202174425125,
"step": 7600,
"valid_targets_mean": 13044.3,
"valid_targets_min": 2160
},
{
"epoch": 4.486725663716814,
"grad_norm": 0.1547336928002793,
"learning_rate": 1.273401071531739e-06,
"loss": 0.3493,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09686368703842163,
"step": 7605,
"valid_targets_mean": 9486.9,
"valid_targets_min": 1543
},
{
"epoch": 4.489675516224189,
"grad_norm": 0.1499179724291536,
"learning_rate": 1.2589779628971498e-06,
"loss": 0.3476,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09721426665782928,
"step": 7610,
"valid_targets_mean": 9637.9,
"valid_targets_min": 1453
},
{
"epoch": 4.492625368731564,
"grad_norm": 0.16171085592994147,
"learning_rate": 1.2446343466204525e-06,
"loss": 0.3493,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1449803113937378,
"step": 7615,
"valid_targets_mean": 11221.1,
"valid_targets_min": 1861
},
{
"epoch": 4.495575221238938,
"grad_norm": 0.1615174407179875,
"learning_rate": 1.2303702835418485e-06,
"loss": 0.3472,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09636390209197998,
"step": 7620,
"valid_targets_mean": 7896.7,
"valid_targets_min": 1601
},
{
"epoch": 4.498525073746313,
"grad_norm": 0.1515588014050659,
"learning_rate": 1.2161858341641342e-06,
"loss": 0.348,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12471356987953186,
"step": 7625,
"valid_targets_mean": 11206.3,
"valid_targets_min": 2567
},
{
"epoch": 4.501474926253687,
"grad_norm": 0.15162574672995982,
"learning_rate": 1.2020810586524e-06,
"loss": 0.3384,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12063919007778168,
"step": 7630,
"valid_targets_mean": 9940.7,
"valid_targets_min": 1487
},
{
"epoch": 4.504424778761062,
"grad_norm": 0.15943299985208736,
"learning_rate": 1.1880560168337896e-06,
"loss": 0.3441,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11519865691661835,
"step": 7635,
"valid_targets_mean": 9426.9,
"valid_targets_min": 1920
},
{
"epoch": 4.507374631268437,
"grad_norm": 0.1662033503787035,
"learning_rate": 1.1741107681972496e-06,
"loss": 0.348,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09789461642503738,
"step": 7640,
"valid_targets_mean": 7889.9,
"valid_targets_min": 1997
},
{
"epoch": 4.510324483775811,
"grad_norm": 0.16145641216897003,
"learning_rate": 1.1602453718932715e-06,
"loss": 0.3413,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09589747339487076,
"step": 7645,
"valid_targets_mean": 8702.3,
"valid_targets_min": 2150
},
{
"epoch": 4.513274336283186,
"grad_norm": 0.15162396305291637,
"learning_rate": 1.1464598867336528e-06,
"loss": 0.3379,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.134039506316185,
"step": 7650,
"valid_targets_mean": 11533.9,
"valid_targets_min": 1871
},
{
"epoch": 4.51622418879056,
"grad_norm": 0.15346636062924254,
"learning_rate": 1.132754371191218e-06,
"loss": 0.3345,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10973073542118073,
"step": 7655,
"valid_targets_mean": 10099.0,
"valid_targets_min": 2449
},
{
"epoch": 4.519174041297935,
"grad_norm": 0.1559081775420403,
"learning_rate": 1.119128883399614e-06,
"loss": 0.3403,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12783056497573853,
"step": 7660,
"valid_targets_mean": 10613.0,
"valid_targets_min": 1767
},
{
"epoch": 4.522123893805309,
"grad_norm": 0.20211025090903367,
"learning_rate": 1.1055834811530165e-06,
"loss": 0.3475,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11391949653625488,
"step": 7665,
"valid_targets_mean": 9735.8,
"valid_targets_min": 1444
},
{
"epoch": 4.525073746312684,
"grad_norm": 0.14976916014788086,
"learning_rate": 1.0921182219059335e-06,
"loss": 0.353,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12497693300247192,
"step": 7670,
"valid_targets_mean": 12089.4,
"valid_targets_min": 1483
},
{
"epoch": 4.5280235988200594,
"grad_norm": 0.15886160420092751,
"learning_rate": 1.0787331627729182e-06,
"loss": 0.3496,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11860600858926773,
"step": 7675,
"valid_targets_mean": 9522.6,
"valid_targets_min": 747
},
{
"epoch": 4.530973451327434,
"grad_norm": 0.16522051263967721,
"learning_rate": 1.0654283605283488e-06,
"loss": 0.3374,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07913932204246521,
"step": 7680,
"valid_targets_mean": 6589.8,
"valid_targets_min": 1001
},
{
"epoch": 4.533923303834809,
"grad_norm": 0.1709157193165234,
"learning_rate": 1.05220387160619e-06,
"loss": 0.3492,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10800658166408539,
"step": 7685,
"valid_targets_mean": 8307.7,
"valid_targets_min": 1442
},
{
"epoch": 4.536873156342183,
"grad_norm": 0.15626400784626918,
"learning_rate": 1.0390597520997426e-06,
"loss": 0.3402,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1069958508014679,
"step": 7690,
"valid_targets_mean": 9174.5,
"valid_targets_min": 2099
},
{
"epoch": 4.539823008849558,
"grad_norm": 0.1512271056093135,
"learning_rate": 1.0259960577614091e-06,
"loss": 0.3421,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11784885823726654,
"step": 7695,
"valid_targets_mean": 9977.2,
"valid_targets_min": 1385
},
{
"epoch": 4.542772861356932,
"grad_norm": 0.1507369858580233,
"learning_rate": 1.0130128440024633e-06,
"loss": 0.3377,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.093796007335186,
"step": 7700,
"valid_targets_mean": 8322.1,
"valid_targets_min": 2131
},
{
"epoch": 4.545722713864307,
"grad_norm": 0.15852677988252023,
"learning_rate": 1.0001101658928092e-06,
"loss": 0.3412,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1161518543958664,
"step": 7705,
"valid_targets_mean": 10406.2,
"valid_targets_min": 1407
},
{
"epoch": 4.548672566371682,
"grad_norm": 0.1531404932874041,
"learning_rate": 9.872880781607463e-07,
"loss": 0.3291,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12724629044532776,
"step": 7710,
"valid_targets_mean": 12493.9,
"valid_targets_min": 2457
},
{
"epoch": 4.551622418879056,
"grad_norm": 0.15451521393434178,
"learning_rate": 9.745466351927458e-07,
"loss": 0.3302,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09752607345581055,
"step": 7715,
"valid_targets_mean": 9960.1,
"valid_targets_min": 2052
},
{
"epoch": 4.554572271386431,
"grad_norm": 0.16431695986849715,
"learning_rate": 9.618858910332073e-07,
"loss": 0.339,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09468859434127808,
"step": 7720,
"valid_targets_mean": 8378.8,
"valid_targets_min": 1560
},
{
"epoch": 4.557522123893805,
"grad_norm": 0.15548881510456924,
"learning_rate": 9.493058993842408e-07,
"loss": 0.3348,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10117464512586594,
"step": 7725,
"valid_targets_mean": 9472.5,
"valid_targets_min": 2484
},
{
"epoch": 4.56047197640118,
"grad_norm": 0.15239276402032617,
"learning_rate": 9.368067136054337e-07,
"loss": 0.3374,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1087859570980072,
"step": 7730,
"valid_targets_mean": 10299.2,
"valid_targets_min": 878
},
{
"epoch": 4.563421828908554,
"grad_norm": 0.15751354324521347,
"learning_rate": 9.243883867136239e-07,
"loss": 0.335,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11837193369865417,
"step": 7735,
"valid_targets_mean": 10887.9,
"valid_targets_min": 2125
},
{
"epoch": 4.566371681415929,
"grad_norm": 0.1636132491545048,
"learning_rate": 9.120509713826786e-07,
"loss": 0.3328,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1383325159549713,
"step": 7740,
"valid_targets_mean": 12573.0,
"valid_targets_min": 2048
},
{
"epoch": 4.569321533923304,
"grad_norm": 0.1582734920218057,
"learning_rate": 8.997945199432668e-07,
"loss": 0.3366,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10354599356651306,
"step": 7745,
"valid_targets_mean": 9179.3,
"valid_targets_min": 1147
},
{
"epoch": 4.572271386430678,
"grad_norm": 0.14978615383191066,
"learning_rate": 8.876190843826426e-07,
"loss": 0.3309,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11529295146465302,
"step": 7750,
"valid_targets_mean": 10706.8,
"valid_targets_min": 1593
},
{
"epoch": 4.575221238938053,
"grad_norm": 0.163412064717712,
"learning_rate": 8.755247163444137e-07,
"loss": 0.3319,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10770249366760254,
"step": 7755,
"valid_targets_mean": 9218.1,
"valid_targets_min": 2137
},
{
"epoch": 4.578171091445427,
"grad_norm": 0.15646391023643355,
"learning_rate": 8.635114671283351e-07,
"loss": 0.3387,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1251239776611328,
"step": 7760,
"valid_targets_mean": 11224.7,
"valid_targets_min": 1822
},
{
"epoch": 4.5811209439528024,
"grad_norm": 0.1583802965925948,
"learning_rate": 8.515793876900957e-07,
"loss": 0.3343,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11912311613559723,
"step": 7765,
"valid_targets_mean": 11156.6,
"valid_targets_min": 1606
},
{
"epoch": 4.584070796460177,
"grad_norm": 0.15774668340457346,
"learning_rate": 8.397285286410683e-07,
"loss": 0.3338,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12353400886058807,
"step": 7770,
"valid_targets_mean": 10960.1,
"valid_targets_min": 1556
},
{
"epoch": 4.587020648967552,
"grad_norm": 0.15917041823937758,
"learning_rate": 8.279589402481458e-07,
"loss": 0.3376,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10141907632350922,
"step": 7775,
"valid_targets_mean": 9461.7,
"valid_targets_min": 1929
},
{
"epoch": 4.589970501474927,
"grad_norm": 0.15450283281262311,
"learning_rate": 8.162706724334812e-07,
"loss": 0.3433,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1162460520863533,
"step": 7780,
"valid_targets_mean": 9745.5,
"valid_targets_min": 1581
},
{
"epoch": 4.592920353982301,
"grad_norm": 0.1618381177008798,
"learning_rate": 8.046637747743125e-07,
"loss": 0.3324,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11386996507644653,
"step": 7785,
"valid_targets_mean": 10080.6,
"valid_targets_min": 2923
},
{
"epoch": 4.595870206489676,
"grad_norm": 0.18422670497164972,
"learning_rate": 7.931382965027245e-07,
"loss": 0.3278,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10538017004728317,
"step": 7790,
"valid_targets_mean": 8127.2,
"valid_targets_min": 1571
},
{
"epoch": 4.59882005899705,
"grad_norm": 0.16123401086696665,
"learning_rate": 7.816942865054566e-07,
"loss": 0.3385,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1084161102771759,
"step": 7795,
"valid_targets_mean": 10449.8,
"valid_targets_min": 1912
},
{
"epoch": 4.601769911504425,
"grad_norm": 0.16819343140393953,
"learning_rate": 7.703317933236886e-07,
"loss": 0.3365,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09945972263813019,
"step": 7800,
"valid_targets_mean": 8532.2,
"valid_targets_min": 1791
},
{
"epoch": 4.604719764011799,
"grad_norm": 0.15125655287965598,
"learning_rate": 7.590508651528372e-07,
"loss": 0.3386,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11926385760307312,
"step": 7805,
"valid_targets_mean": 11387.8,
"valid_targets_min": 2003
},
{
"epoch": 4.607669616519174,
"grad_norm": 0.16124756947368554,
"learning_rate": 7.478515498423577e-07,
"loss": 0.3381,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10725908726453781,
"step": 7810,
"valid_targets_mean": 9229.9,
"valid_targets_min": 2522
},
{
"epoch": 4.610619469026549,
"grad_norm": 0.1519505295088245,
"learning_rate": 7.367338948955183e-07,
"loss": 0.3346,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12884555757045746,
"step": 7815,
"valid_targets_mean": 12198.8,
"valid_targets_min": 1675
},
{
"epoch": 4.613569321533923,
"grad_norm": 0.15228717890035376,
"learning_rate": 7.256979474692327e-07,
"loss": 0.3364,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10891731083393097,
"step": 7820,
"valid_targets_mean": 10017.0,
"valid_targets_min": 1776
},
{
"epoch": 4.616519174041298,
"grad_norm": 0.15429967262842637,
"learning_rate": 7.147437543738278e-07,
"loss": 0.3352,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10560815781354904,
"step": 7825,
"valid_targets_mean": 10342.0,
"valid_targets_min": 1961
},
{
"epoch": 4.619469026548672,
"grad_norm": 0.16656461258723682,
"learning_rate": 7.038713620728699e-07,
"loss": 0.3335,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10848058760166168,
"step": 7830,
"valid_targets_mean": 9962.6,
"valid_targets_min": 2405
},
{
"epoch": 4.622418879056047,
"grad_norm": 0.16021833897800697,
"learning_rate": 6.930808166829517e-07,
"loss": 0.3359,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0915953516960144,
"step": 7835,
"valid_targets_mean": 8304.7,
"valid_targets_min": 1978
},
{
"epoch": 4.625368731563422,
"grad_norm": 0.23996441726172854,
"learning_rate": 6.823721639735015e-07,
"loss": 0.3332,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12475943565368652,
"step": 7840,
"valid_targets_mean": 12342.4,
"valid_targets_min": 2187
},
{
"epoch": 4.628318584070796,
"grad_norm": 0.16033087598275933,
"learning_rate": 6.71745449366592e-07,
"loss": 0.3347,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10748793929815292,
"step": 7845,
"valid_targets_mean": 9165.0,
"valid_targets_min": 832
},
{
"epoch": 4.631268436578171,
"grad_norm": 0.15047647806461162,
"learning_rate": 6.612007179367452e-07,
"loss": 0.3358,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10964348912239075,
"step": 7850,
"valid_targets_mean": 10573.9,
"valid_targets_min": 2386
},
{
"epoch": 4.6342182890855455,
"grad_norm": 0.15419414615308352,
"learning_rate": 6.507380144107433e-07,
"loss": 0.3424,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09014791250228882,
"step": 7855,
"valid_targets_mean": 8261.4,
"valid_targets_min": 1439
},
{
"epoch": 4.6371681415929205,
"grad_norm": 0.16020362869640542,
"learning_rate": 6.403573831674292e-07,
"loss": 0.346,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11980140209197998,
"step": 7860,
"valid_targets_mean": 9847.7,
"valid_targets_min": 1767
},
{
"epoch": 4.6401179941002955,
"grad_norm": 0.148405962516986,
"learning_rate": 6.300588682375375e-07,
"loss": 0.3356,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13102710247039795,
"step": 7865,
"valid_targets_mean": 13030.2,
"valid_targets_min": 2483
},
{
"epoch": 4.64306784660767,
"grad_norm": 0.1548714133654885,
"learning_rate": 6.198425133034836e-07,
"loss": 0.3338,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1018887311220169,
"step": 7870,
"valid_targets_mean": 9731.1,
"valid_targets_min": 1703
},
{
"epoch": 4.646017699115045,
"grad_norm": 0.1658282019537656,
"learning_rate": 6.097083616992039e-07,
"loss": 0.3356,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1153990775346756,
"step": 7875,
"valid_targets_mean": 10780.1,
"valid_targets_min": 1649
},
{
"epoch": 4.648967551622419,
"grad_norm": 0.16452590143085927,
"learning_rate": 5.996564564099494e-07,
"loss": 0.3415,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11689519882202148,
"step": 7880,
"valid_targets_mean": 10743.4,
"valid_targets_min": 1801
},
{
"epoch": 4.651917404129794,
"grad_norm": 0.15959360618773735,
"learning_rate": 5.89686840072119e-07,
"loss": 0.3437,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09219282865524292,
"step": 7885,
"valid_targets_mean": 9102.6,
"valid_targets_min": 1830
},
{
"epoch": 4.654867256637168,
"grad_norm": 0.15017011191767232,
"learning_rate": 5.797995549730684e-07,
"loss": 0.3326,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09676504135131836,
"step": 7890,
"valid_targets_mean": 9400.9,
"valid_targets_min": 1853
},
{
"epoch": 4.657817109144543,
"grad_norm": 0.14712118858804588,
"learning_rate": 5.699946430509417e-07,
"loss": 0.3275,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10959380120038986,
"step": 7895,
"valid_targets_mean": 10114.0,
"valid_targets_min": 2144
},
{
"epoch": 4.660766961651918,
"grad_norm": 0.1667434562433671,
"learning_rate": 5.602721458944783e-07,
"loss": 0.3277,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11018405854701996,
"step": 7900,
"valid_targets_mean": 9553.2,
"valid_targets_min": 2181
},
{
"epoch": 4.663716814159292,
"grad_norm": 0.15459681678025006,
"learning_rate": 5.50632104742852e-07,
"loss": 0.3376,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11551558971405029,
"step": 7905,
"valid_targets_mean": 9748.7,
"valid_targets_min": 856
},
{
"epoch": 4.666666666666667,
"grad_norm": 0.16022184516651483,
"learning_rate": 5.410745604854861e-07,
"loss": 0.3409,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12363321334123611,
"step": 7910,
"valid_targets_mean": 12207.3,
"valid_targets_min": 2941
},
{
"epoch": 4.669616519174041,
"grad_norm": 0.16639336868212634,
"learning_rate": 5.315995536618856e-07,
"loss": 0.3363,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1000465601682663,
"step": 7915,
"valid_targets_mean": 9607.7,
"valid_targets_min": 1480
},
{
"epoch": 4.672566371681416,
"grad_norm": 0.15139280931936996,
"learning_rate": 5.222071244614579e-07,
"loss": 0.3436,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10658089816570282,
"step": 7920,
"valid_targets_mean": 10516.6,
"valid_targets_min": 1750
},
{
"epoch": 4.67551622418879,
"grad_norm": 0.15377735360447695,
"learning_rate": 5.128973127233572e-07,
"loss": 0.3366,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09791351854801178,
"step": 7925,
"valid_targets_mean": 9166.2,
"valid_targets_min": 2342
},
{
"epoch": 4.678466076696165,
"grad_norm": 0.16515324786442742,
"learning_rate": 5.036701579362935e-07,
"loss": 0.3384,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12997247278690338,
"step": 7930,
"valid_targets_mean": 10198.2,
"valid_targets_min": 1888
},
{
"epoch": 4.68141592920354,
"grad_norm": 0.15525919346374295,
"learning_rate": 4.94525699238384e-07,
"loss": 0.3382,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11433418095111847,
"step": 7935,
"valid_targets_mean": 9976.0,
"valid_targets_min": 1591
},
{
"epoch": 4.684365781710914,
"grad_norm": 0.1597583329611498,
"learning_rate": 4.854639754169776e-07,
"loss": 0.3327,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10255442559719086,
"step": 7940,
"valid_targets_mean": 8667.3,
"valid_targets_min": 1636
},
{
"epoch": 4.687315634218289,
"grad_norm": 0.1574500233002011,
"learning_rate": 4.7648502490849737e-07,
"loss": 0.3375,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13483873009681702,
"step": 7945,
"valid_targets_mean": 11671.9,
"valid_targets_min": 1372
},
{
"epoch": 4.6902654867256635,
"grad_norm": 0.16094356927855527,
"learning_rate": 4.675888857982669e-07,
"loss": 0.3389,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09947562962770462,
"step": 7950,
"valid_targets_mean": 8705.5,
"valid_targets_min": 788
},
{
"epoch": 4.6932153392330385,
"grad_norm": 0.15295367535591084,
"learning_rate": 4.587755958203599e-07,
"loss": 0.3385,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11330919712781906,
"step": 7955,
"valid_targets_mean": 10789.9,
"valid_targets_min": 1629
},
{
"epoch": 4.696165191740413,
"grad_norm": 0.15713245388762861,
"learning_rate": 4.5004519235743336e-07,
"loss": 0.3433,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1057049110531807,
"step": 7960,
"valid_targets_mean": 9820.9,
"valid_targets_min": 2079
},
{
"epoch": 4.699115044247788,
"grad_norm": 0.1474422612887287,
"learning_rate": 4.4139771244056993e-07,
"loss": 0.3354,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10105115175247192,
"step": 7965,
"valid_targets_mean": 9519.0,
"valid_targets_min": 1443
},
{
"epoch": 4.702064896755163,
"grad_norm": 0.15196052029218166,
"learning_rate": 4.328331927491247e-07,
"loss": 0.336,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11080189794301987,
"step": 7970,
"valid_targets_mean": 11148.6,
"valid_targets_min": 2844
},
{
"epoch": 4.705014749262537,
"grad_norm": 0.1568521251058333,
"learning_rate": 4.243516696105632e-07,
"loss": 0.3383,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14061200618743896,
"step": 7975,
"valid_targets_mean": 11772.3,
"valid_targets_min": 2041
},
{
"epoch": 4.707964601769912,
"grad_norm": 0.1545804308119341,
"learning_rate": 4.159531790003146e-07,
"loss": 0.3344,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.103056401014328,
"step": 7980,
"valid_targets_mean": 9464.2,
"valid_targets_min": 2006
},
{
"epoch": 4.710914454277286,
"grad_norm": 0.1503169086247212,
"learning_rate": 4.076377565416079e-07,
"loss": 0.3416,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10284608602523804,
"step": 7985,
"valid_targets_mean": 10115.8,
"valid_targets_min": 2033
},
{
"epoch": 4.713864306784661,
"grad_norm": 0.1465495169158907,
"learning_rate": 3.9940543750534025e-07,
"loss": 0.3319,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08931340277194977,
"step": 7990,
"valid_targets_mean": 8914.2,
"valid_targets_min": 1829
},
{
"epoch": 4.716814159292035,
"grad_norm": 0.15023344789396648,
"learning_rate": 3.9125625680990876e-07,
"loss": 0.3337,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12425112724304199,
"step": 7995,
"valid_targets_mean": 11594.1,
"valid_targets_min": 1466
},
{
"epoch": 4.71976401179941,
"grad_norm": 0.1625604279941507,
"learning_rate": 3.8319024902106373e-07,
"loss": 0.3349,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11338561773300171,
"step": 8000,
"valid_targets_mean": 10735.3,
"valid_targets_min": 1786
},
{
"epoch": 4.722713864306785,
"grad_norm": 0.1518588563470732,
"learning_rate": 3.7520744835177537e-07,
"loss": 0.3347,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11632370948791504,
"step": 8005,
"valid_targets_mean": 11454.9,
"valid_targets_min": 2305
},
{
"epoch": 4.725663716814159,
"grad_norm": 0.15237511826928452,
"learning_rate": 3.6730788866207847e-07,
"loss": 0.3421,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09955699741840363,
"step": 8010,
"valid_targets_mean": 9119.2,
"valid_targets_min": 933
},
{
"epoch": 4.728613569321534,
"grad_norm": 0.14939438036133001,
"learning_rate": 3.594916034589324e-07,
"loss": 0.3402,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09637914597988129,
"step": 8015,
"valid_targets_mean": 9410.8,
"valid_targets_min": 1837
},
{
"epoch": 4.731563421828908,
"grad_norm": 0.16739548238864774,
"learning_rate": 3.5175862589607034e-07,
"loss": 0.3306,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09700131416320801,
"step": 8020,
"valid_targets_mean": 9461.3,
"valid_targets_min": 1841
},
{
"epoch": 4.734513274336283,
"grad_norm": 0.15421867043528203,
"learning_rate": 3.441089887738769e-07,
"loss": 0.3361,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13177192211151123,
"step": 8025,
"valid_targets_mean": 12400.2,
"valid_targets_min": 2042
},
{
"epoch": 4.737463126843657,
"grad_norm": 0.15354486453580096,
"learning_rate": 3.365427245392239e-07,
"loss": 0.3374,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1302848756313324,
"step": 8030,
"valid_targets_mean": 12530.3,
"valid_targets_min": 2926
},
{
"epoch": 4.740412979351032,
"grad_norm": 0.15922122301009237,
"learning_rate": 3.290598652853638e-07,
"loss": 0.3351,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12136721611022949,
"step": 8035,
"valid_targets_mean": 10509.6,
"valid_targets_min": 649
},
{
"epoch": 4.743362831858407,
"grad_norm": 0.15200559708461336,
"learning_rate": 3.216604427517611e-07,
"loss": 0.3332,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10849249362945557,
"step": 8040,
"valid_targets_mean": 9454.0,
"valid_targets_min": 2003
},
{
"epoch": 4.7463126843657815,
"grad_norm": 0.15844438088801377,
"learning_rate": 3.1434448832398547e-07,
"loss": 0.3361,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10437265783548355,
"step": 8045,
"valid_targets_mean": 9103.6,
"valid_targets_min": 1608
},
{
"epoch": 4.7492625368731565,
"grad_norm": 0.15440075823729557,
"learning_rate": 3.0711203303355417e-07,
"loss": 0.3329,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10706086456775665,
"step": 8050,
"valid_targets_mean": 9436.6,
"valid_targets_min": 2137
},
{
"epoch": 4.752212389380531,
"grad_norm": 0.15650013232286086,
"learning_rate": 2.9996310755782354e-07,
"loss": 0.3361,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10674930363893509,
"step": 8055,
"valid_targets_mean": 9747.0,
"valid_targets_min": 1135
},
{
"epoch": 4.755162241887906,
"grad_norm": 0.16010100514936637,
"learning_rate": 2.92897742219842e-07,
"loss": 0.3379,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11662594974040985,
"step": 8060,
"valid_targets_mean": 10079.6,
"valid_targets_min": 2286
},
{
"epoch": 4.758112094395281,
"grad_norm": 0.18313454619062772,
"learning_rate": 2.859159669882261e-07,
"loss": 0.3425,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11656038463115692,
"step": 8065,
"valid_targets_mean": 10582.6,
"valid_targets_min": 1657
},
{
"epoch": 4.761061946902655,
"grad_norm": 0.16022588278414174,
"learning_rate": 2.7901781147704257e-07,
"loss": 0.342,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10365186631679535,
"step": 8070,
"valid_targets_mean": 8869.7,
"valid_targets_min": 1883
},
{
"epoch": 4.76401179941003,
"grad_norm": 0.1541843916278012,
"learning_rate": 2.7220330494566404e-07,
"loss": 0.33,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11602887511253357,
"step": 8075,
"valid_targets_mean": 10999.8,
"valid_targets_min": 1608
},
{
"epoch": 4.766961651917404,
"grad_norm": 0.1593256933790957,
"learning_rate": 2.654724762986649e-07,
"loss": 0.3391,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1141844168305397,
"step": 8080,
"valid_targets_mean": 10845.2,
"valid_targets_min": 1769
},
{
"epoch": 4.769911504424779,
"grad_norm": 0.14692227157712975,
"learning_rate": 2.588253540856811e-07,
"loss": 0.3356,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1177644431591034,
"step": 8085,
"valid_targets_mean": 11583.4,
"valid_targets_min": 2726
},
{
"epoch": 4.772861356932154,
"grad_norm": 0.15635500681838485,
"learning_rate": 2.5226196650130596e-07,
"loss": 0.3328,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09946940094232559,
"step": 8090,
"valid_targets_mean": 9023.2,
"valid_targets_min": 1719
},
{
"epoch": 4.775811209439528,
"grad_norm": 0.15542240912952268,
"learning_rate": 2.4578234138495693e-07,
"loss": 0.3367,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12937146425247192,
"step": 8095,
"valid_targets_mean": 11621.1,
"valid_targets_min": 1627
},
{
"epoch": 4.778761061946903,
"grad_norm": 0.1989805763466194,
"learning_rate": 2.3938650622076453e-07,
"loss": 0.3315,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1308184713125229,
"step": 8100,
"valid_targets_mean": 10227.8,
"valid_targets_min": 2542
},
{
"epoch": 4.781710914454277,
"grad_norm": 0.15854722710821223,
"learning_rate": 2.3307448813744805e-07,
"loss": 0.3292,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1028071716427803,
"step": 8105,
"valid_targets_mean": 8847.1,
"valid_targets_min": 2962
},
{
"epoch": 4.784660766961652,
"grad_norm": 0.15384075094610822,
"learning_rate": 2.2684631390821775e-07,
"loss": 0.3386,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11849691718816757,
"step": 8110,
"valid_targets_mean": 11824.5,
"valid_targets_min": 2336
},
{
"epoch": 4.787610619469026,
"grad_norm": 0.15427674682254122,
"learning_rate": 2.207020099506374e-07,
"loss": 0.3389,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14145824313163757,
"step": 8115,
"valid_targets_mean": 13422.8,
"valid_targets_min": 2469
},
{
"epoch": 4.790560471976401,
"grad_norm": 0.15160113657943072,
"learning_rate": 2.1464160232653518e-07,
"loss": 0.3367,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08148768544197083,
"step": 8120,
"valid_targets_mean": 8039.5,
"valid_targets_min": 1011
},
{
"epoch": 4.793510324483776,
"grad_norm": 0.15059629364878185,
"learning_rate": 2.0866511674187518e-07,
"loss": 0.335,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09149783104658127,
"step": 8125,
"valid_targets_mean": 8162.9,
"valid_targets_min": 1768
},
{
"epoch": 4.79646017699115,
"grad_norm": 0.16384131384526676,
"learning_rate": 2.0277257854665944e-07,
"loss": 0.3343,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11894331872463226,
"step": 8130,
"valid_targets_mean": 9680.6,
"valid_targets_min": 1517
},
{
"epoch": 4.799410029498525,
"grad_norm": 0.1602386352213527,
"learning_rate": 1.9696401273481713e-07,
"loss": 0.337,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11503320187330246,
"step": 8135,
"valid_targets_mean": 10204.0,
"valid_targets_min": 1856
},
{
"epoch": 4.8023598820058995,
"grad_norm": 0.1545511562562192,
"learning_rate": 1.9123944394409567e-07,
"loss": 0.3338,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12917274236679077,
"step": 8140,
"valid_targets_mean": 11088.9,
"valid_targets_min": 3033
},
{
"epoch": 4.8053097345132745,
"grad_norm": 0.16017065168337155,
"learning_rate": 1.8559889645596073e-07,
"loss": 0.341,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09840681403875351,
"step": 8145,
"valid_targets_mean": 8808.9,
"valid_targets_min": 1628
},
{
"epoch": 4.808259587020649,
"grad_norm": 0.16153661164958696,
"learning_rate": 1.8004239419548985e-07,
"loss": 0.3331,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11837130039930344,
"step": 8150,
"valid_targets_mean": 10004.9,
"valid_targets_min": 2090
},
{
"epoch": 4.811209439528024,
"grad_norm": 0.15843824142798069,
"learning_rate": 1.745699607312723e-07,
"loss": 0.3412,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11763490736484528,
"step": 8155,
"valid_targets_mean": 11585.9,
"valid_targets_min": 1578
},
{
"epoch": 4.814159292035399,
"grad_norm": 0.15594867162929354,
"learning_rate": 1.6918161927531375e-07,
"loss": 0.3354,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12264040857553482,
"step": 8160,
"valid_targets_mean": 10658.7,
"valid_targets_min": 1712
},
{
"epoch": 4.817109144542773,
"grad_norm": 0.15355379471150807,
"learning_rate": 1.6387739268292513e-07,
"loss": 0.3381,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12840881943702698,
"step": 8165,
"valid_targets_mean": 11714.4,
"valid_targets_min": 2874
},
{
"epoch": 4.820058997050148,
"grad_norm": 0.15764893679634057,
"learning_rate": 1.5865730345263842e-07,
"loss": 0.3332,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09563873708248138,
"step": 8170,
"valid_targets_mean": 9205.3,
"valid_targets_min": 2733
},
{
"epoch": 4.823008849557522,
"grad_norm": 0.15015239794660265,
"learning_rate": 1.5352137372611097e-07,
"loss": 0.3324,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09439783543348312,
"step": 8175,
"valid_targets_mean": 8837.8,
"valid_targets_min": 2032
},
{
"epoch": 4.825958702064897,
"grad_norm": 0.15549841438969475,
"learning_rate": 1.484696252880169e-07,
"loss": 0.3342,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10786696523427963,
"step": 8180,
"valid_targets_mean": 10313.7,
"valid_targets_min": 2037
},
{
"epoch": 4.828908554572271,
"grad_norm": 0.15517700272853036,
"learning_rate": 1.4350207956597583e-07,
"loss": 0.3375,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09071081876754761,
"step": 8185,
"valid_targets_mean": 8079.2,
"valid_targets_min": 1799
},
{
"epoch": 4.831858407079646,
"grad_norm": 0.1551730940635976,
"learning_rate": 1.3861875763043987e-07,
"loss": 0.3302,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1367199718952179,
"step": 8190,
"valid_targets_mean": 11687.4,
"valid_targets_min": 1660
},
{
"epoch": 4.834808259587021,
"grad_norm": 0.1513284388442919,
"learning_rate": 1.3381968019462678e-07,
"loss": 0.3426,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10539837181568146,
"step": 8195,
"valid_targets_mean": 9689.1,
"valid_targets_min": 1213
},
{
"epoch": 4.837758112094395,
"grad_norm": 0.1579977975628611,
"learning_rate": 1.2910486761441577e-07,
"loss": 0.3366,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1488528698682785,
"step": 8200,
"valid_targets_mean": 13727.9,
"valid_targets_min": 2019
},
{
"epoch": 4.84070796460177,
"grad_norm": 0.1645343788926088,
"learning_rate": 1.2447433988826306e-07,
"loss": 0.3347,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09441319108009338,
"step": 8205,
"valid_targets_mean": 8408.8,
"valid_targets_min": 1770
},
{
"epoch": 4.843657817109144,
"grad_norm": 0.17102694080450573,
"learning_rate": 1.1992811665712423e-07,
"loss": 0.3395,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1222073882818222,
"step": 8210,
"valid_targets_mean": 10496.0,
"valid_targets_min": 1924
},
{
"epoch": 4.846607669616519,
"grad_norm": 0.15282193505100267,
"learning_rate": 1.1546621720436745e-07,
"loss": 0.3362,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10215400159358978,
"step": 8215,
"valid_targets_mean": 9131.2,
"valid_targets_min": 2712
},
{
"epoch": 4.849557522123893,
"grad_norm": 0.16566507473867742,
"learning_rate": 1.1108866045569156e-07,
"loss": 0.3366,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11062388122081757,
"step": 8220,
"valid_targets_mean": 8391.5,
"valid_targets_min": 1896
},
{
"epoch": 4.852507374631268,
"grad_norm": 0.1511859347180266,
"learning_rate": 1.0679546497903926e-07,
"loss": 0.3323,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10670909285545349,
"step": 8225,
"valid_targets_mean": 9973.9,
"valid_targets_min": 1874
},
{
"epoch": 4.855457227138643,
"grad_norm": 0.14973828526729327,
"learning_rate": 1.0258664898453507e-07,
"loss": 0.3358,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11628145724534988,
"step": 8230,
"valid_targets_mean": 11387.2,
"valid_targets_min": 2079
},
{
"epoch": 4.8584070796460175,
"grad_norm": 0.15653880756528876,
"learning_rate": 9.846223032438318e-08,
"loss": 0.3352,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11390264332294464,
"step": 8235,
"valid_targets_mean": 9381.8,
"valid_targets_min": 1708
},
{
"epoch": 4.8613569321533925,
"grad_norm": 0.16974042052187077,
"learning_rate": 9.442222649282296e-08,
"loss": 0.3395,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10504934191703796,
"step": 8240,
"valid_targets_mean": 8509.3,
"valid_targets_min": 1118
},
{
"epoch": 4.864306784660767,
"grad_norm": 0.15268761111173068,
"learning_rate": 9.046665462602244e-08,
"loss": 0.3402,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11172182857990265,
"step": 8245,
"valid_targets_mean": 10374.7,
"valid_targets_min": 2011
},
{
"epoch": 4.867256637168142,
"grad_norm": 0.16194877779100575,
"learning_rate": 8.659553150203392e-08,
"loss": 0.3397,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13858763873577118,
"step": 8250,
"valid_targets_mean": 12519.0,
"valid_targets_min": 1887
},
{
"epoch": 4.870206489675516,
"grad_norm": 0.1553367162188952,
"learning_rate": 8.280887354069844e-08,
"loss": 0.3313,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10727658867835999,
"step": 8255,
"valid_targets_mean": 9916.1,
"valid_targets_min": 1793
},
{
"epoch": 4.873156342182891,
"grad_norm": 0.17928672354183484,
"learning_rate": 7.910669680359473e-08,
"loss": 0.3446,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12614883482456207,
"step": 8260,
"valid_targets_mean": 10340.9,
"valid_targets_min": 1125
},
{
"epoch": 4.876106194690266,
"grad_norm": 0.16037472573730496,
"learning_rate": 7.548901699396372e-08,
"loss": 0.3351,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11756325513124466,
"step": 8265,
"valid_targets_mean": 9584.5,
"valid_targets_min": 2028
},
{
"epoch": 4.87905604719764,
"grad_norm": 0.15676084316110542,
"learning_rate": 7.195584945663969e-08,
"loss": 0.3423,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12959174811840057,
"step": 8270,
"valid_targets_mean": 11590.9,
"valid_targets_min": 2261
},
{
"epoch": 4.882005899705015,
"grad_norm": 0.14981931967427253,
"learning_rate": 6.850720917799036e-08,
"loss": 0.3378,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12228604406118393,
"step": 8275,
"valid_targets_mean": 11354.4,
"valid_targets_min": 1773
},
{
"epoch": 4.88495575221239,
"grad_norm": 0.1492517770434556,
"learning_rate": 6.5143110785848e-08,
"loss": 0.3384,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1076161116361618,
"step": 8280,
"valid_targets_mean": 9635.8,
"valid_targets_min": 2187
},
{
"epoch": 4.887905604719764,
"grad_norm": 0.15883459016225324,
"learning_rate": 6.186356854944953e-08,
"loss": 0.3327,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11498965322971344,
"step": 8285,
"valid_targets_mean": 10532.5,
"valid_targets_min": 1940
},
{
"epoch": 4.890855457227139,
"grad_norm": 0.1512683940726875,
"learning_rate": 5.866859637938094e-08,
"loss": 0.3371,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12131491303443909,
"step": 8290,
"valid_targets_mean": 11384.6,
"valid_targets_min": 2096
},
{
"epoch": 4.893805309734513,
"grad_norm": 0.16374210576442358,
"learning_rate": 5.555820782750854e-08,
"loss": 0.3333,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11251075565814972,
"step": 8295,
"valid_targets_mean": 10272.5,
"valid_targets_min": 2815
},
{
"epoch": 4.896755162241888,
"grad_norm": 0.15550531670351886,
"learning_rate": 5.253241608693005e-08,
"loss": 0.3408,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12761548161506653,
"step": 8300,
"valid_targets_mean": 11145.4,
"valid_targets_min": 818
},
{
"epoch": 4.899705014749262,
"grad_norm": 0.16691708037129438,
"learning_rate": 4.959123399191468e-08,
"loss": 0.3332,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10028710216283798,
"step": 8305,
"valid_targets_mean": 9275.6,
"valid_targets_min": 1757
},
{
"epoch": 4.902654867256637,
"grad_norm": 0.15042742074564838,
"learning_rate": 4.673467401784981e-08,
"loss": 0.3382,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11940623074769974,
"step": 8310,
"valid_targets_mean": 10562.0,
"valid_targets_min": 1778
},
{
"epoch": 4.905604719764012,
"grad_norm": 0.15515324897077903,
"learning_rate": 4.396274828118774e-08,
"loss": 0.3357,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10962172597646713,
"step": 8315,
"valid_targets_mean": 9969.5,
"valid_targets_min": 1957
},
{
"epoch": 4.908554572271386,
"grad_norm": 0.15830692983786696,
"learning_rate": 4.127546853939013e-08,
"loss": 0.3377,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12479501217603683,
"step": 8320,
"valid_targets_mean": 10153.2,
"valid_targets_min": 2191
},
{
"epoch": 4.911504424778761,
"grad_norm": 0.15919506975556477,
"learning_rate": 3.867284619089029e-08,
"loss": 0.3443,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0909244641661644,
"step": 8325,
"valid_targets_mean": 8849.2,
"valid_targets_min": 324
},
{
"epoch": 4.9144542772861355,
"grad_norm": 0.1531424595801704,
"learning_rate": 3.615489227502877e-08,
"loss": 0.3389,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12087876349687576,
"step": 8330,
"valid_targets_mean": 10924.6,
"valid_targets_min": 2710
},
{
"epoch": 4.9174041297935105,
"grad_norm": 0.17922580684050662,
"learning_rate": 3.372161747202007e-08,
"loss": 0.3411,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12497780472040176,
"step": 8335,
"valid_targets_mean": 11752.3,
"valid_targets_min": 1969
},
{
"epoch": 4.920353982300885,
"grad_norm": 0.15961290538181538,
"learning_rate": 3.137303210289711e-08,
"loss": 0.3408,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13402295112609863,
"step": 8340,
"valid_targets_mean": 12698.6,
"valid_targets_min": 2768
},
{
"epoch": 4.92330383480826,
"grad_norm": 0.15686414808002838,
"learning_rate": 2.9109146129475686e-08,
"loss": 0.3432,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10782062262296677,
"step": 8345,
"valid_targets_mean": 10104.6,
"valid_targets_min": 1652
},
{
"epoch": 4.926253687315635,
"grad_norm": 0.1539726659200968,
"learning_rate": 2.69299691543079e-08,
"loss": 0.3426,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11887013912200928,
"step": 8350,
"valid_targets_mean": 11014.7,
"valid_targets_min": 1872
},
{
"epoch": 4.929203539823009,
"grad_norm": 0.15614057446465482,
"learning_rate": 2.483551042064214e-08,
"loss": 0.3368,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11364469677209854,
"step": 8355,
"valid_targets_mean": 10039.7,
"valid_targets_min": 2777
},
{
"epoch": 4.932153392330384,
"grad_norm": 0.15395208293261126,
"learning_rate": 2.2825778812385347e-08,
"loss": 0.3428,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12622305750846863,
"step": 8360,
"valid_targets_mean": 11453.5,
"valid_targets_min": 1275
},
{
"epoch": 4.935103244837758,
"grad_norm": 0.15579370316332758,
"learning_rate": 2.090078285405639e-08,
"loss": 0.343,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10148319602012634,
"step": 8365,
"valid_targets_mean": 8932.7,
"valid_targets_min": 1791
},
{
"epoch": 4.938053097345133,
"grad_norm": 0.14897559185560402,
"learning_rate": 1.90605307107683e-08,
"loss": 0.3307,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11737137287855148,
"step": 8370,
"valid_targets_mean": 11101.6,
"valid_targets_min": 2707
},
{
"epoch": 4.941002949852507,
"grad_norm": 0.1593622012689512,
"learning_rate": 1.7305030188177195e-08,
"loss": 0.3366,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13405683636665344,
"step": 8375,
"valid_targets_mean": 10862.0,
"valid_targets_min": 1591
},
{
"epoch": 4.943952802359882,
"grad_norm": 0.15857040855180185,
"learning_rate": 1.563428873245343e-08,
"loss": 0.3378,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1257179081439972,
"step": 8380,
"valid_targets_mean": 10801.4,
"valid_targets_min": 1421
},
{
"epoch": 4.946902654867257,
"grad_norm": 0.16797684271769017,
"learning_rate": 1.4048313430252702e-08,
"loss": 0.3371,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10947559773921967,
"step": 8385,
"valid_targets_mean": 8929.9,
"valid_targets_min": 1203
},
{
"epoch": 4.949852507374631,
"grad_norm": 0.15234476430572783,
"learning_rate": 1.2547111008689438e-08,
"loss": 0.3441,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11667993664741516,
"step": 8390,
"valid_targets_mean": 10474.6,
"valid_targets_min": 1041
},
{
"epoch": 4.952802359882006,
"grad_norm": 0.16171341308080303,
"learning_rate": 1.1130687835292364e-08,
"loss": 0.34,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0994919091463089,
"step": 8395,
"valid_targets_mean": 8967.3,
"valid_targets_min": 2401
},
{
"epoch": 4.95575221238938,
"grad_norm": 0.15653748086188524,
"learning_rate": 9.79904991800007e-09,
"loss": 0.3371,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11829991638660431,
"step": 8400,
"valid_targets_mean": 10507.0,
"valid_targets_min": 1811
},
{
"epoch": 4.958702064896755,
"grad_norm": 0.15627283558458796,
"learning_rate": 8.552202905116603e-09,
"loss": 0.3423,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0984392911195755,
"step": 8405,
"valid_targets_mean": 9101.4,
"valid_targets_min": 1896
},
{
"epoch": 4.961651917404129,
"grad_norm": 0.15721821511741407,
"learning_rate": 7.390152085298141e-09,
"loss": 0.3389,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12197485566139221,
"step": 8410,
"valid_targets_mean": 11740.2,
"valid_targets_min": 1329
},
{
"epoch": 4.964601769911504,
"grad_norm": 0.16234745408852572,
"learning_rate": 6.312902387526354e-09,
"loss": 0.3395,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10215374082326889,
"step": 8415,
"valid_targets_mean": 8273.8,
"valid_targets_min": 1581
},
{
"epoch": 4.967551622418879,
"grad_norm": 0.15791372499868073,
"learning_rate": 5.320458381090632e-09,
"loss": 0.3412,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12479733675718307,
"step": 8420,
"valid_targets_mean": 10531.7,
"valid_targets_min": 2030
},
{
"epoch": 4.9705014749262535,
"grad_norm": 0.1578360190843846,
"learning_rate": 4.412824275563665e-09,
"loss": 0.3345,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10316172242164612,
"step": 8425,
"valid_targets_mean": 8572.2,
"valid_targets_min": 1302
},
{
"epoch": 4.9734513274336285,
"grad_norm": 0.15983241448664054,
"learning_rate": 3.5900039207859005e-09,
"loss": 0.3433,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11723663657903671,
"step": 8430,
"valid_targets_mean": 10365.0,
"valid_targets_min": 1880
},
{
"epoch": 4.976401179941003,
"grad_norm": 0.1625826476293185,
"learning_rate": 2.852000806854438e-09,
"loss": 0.3449,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13278573751449585,
"step": 8435,
"valid_targets_mean": 11930.6,
"valid_targets_min": 1431
},
{
"epoch": 4.979351032448378,
"grad_norm": 0.14992069896746002,
"learning_rate": 2.198818064098607e-09,
"loss": 0.3388,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11306165158748627,
"step": 8440,
"valid_targets_mean": 10015.8,
"valid_targets_min": 1439
},
{
"epoch": 4.982300884955752,
"grad_norm": 0.16714353240958918,
"learning_rate": 1.6304584630733033e-09,
"loss": 0.3386,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12046494334936142,
"step": 8445,
"valid_targets_mean": 10110.8,
"valid_targets_min": 2130
},
{
"epoch": 4.985250737463127,
"grad_norm": 0.15472606493144128,
"learning_rate": 1.1469244145456693e-09,
"loss": 0.3421,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10794627666473389,
"step": 8450,
"valid_targets_mean": 9938.6,
"valid_targets_min": 1395
},
{
"epoch": 4.988200589970502,
"grad_norm": 0.17796065764885294,
"learning_rate": 7.482179694884295e-10,
"loss": 0.3484,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13961243629455566,
"step": 8455,
"valid_targets_mean": 11508.6,
"valid_targets_min": 1832
},
{
"epoch": 4.991150442477876,
"grad_norm": 0.1512951487988943,
"learning_rate": 4.3434081905990857e-10,
"loss": 0.3371,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1032632440328598,
"step": 8460,
"valid_targets_mean": 9993.5,
"valid_targets_min": 2294
},
{
"epoch": 4.994100294985251,
"grad_norm": 0.16434925179454232,
"learning_rate": 2.0529429461069174e-10,
"loss": 0.3423,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13042443990707397,
"step": 8465,
"valid_targets_mean": 11300.2,
"valid_targets_min": 1578
},
{
"epoch": 4.997050147492625,
"grad_norm": 0.1540038581679221,
"learning_rate": 6.107936766808209e-11,
"loss": 0.3344,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11116141080856323,
"step": 8470,
"valid_targets_mean": 10239.3,
"valid_targets_min": 1636
},
{
"epoch": 5.0,
"grad_norm": 0.1529484565508345,
"learning_rate": 1.6966499405413062e-12,
"loss": 0.3381,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10146471858024597,
"step": 8475,
"valid_targets_mean": 9906.2,
"valid_targets_min": 1715
},
{
"epoch": 5.0,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10146471858024597,
"step": 8475,
"total_flos": 2.892950530069994e+19,
"train_loss": 0.05187808655707885,
"train_runtime": 37600.0558,
"train_samples_per_second": 21.635,
"train_steps_per_second": 0.225,
"valid_targets_mean": 9906.2,
"valid_targets_min": 1715
}
],
"logging_steps": 5,
"max_steps": 8475,
"num_input_tokens_seen": 0,
"num_train_epochs": 5,
"save_steps": 300,
"stateful_callbacks": {
"TrainerControl": {
"args": {
"should_epoch_stop": false,
"should_evaluate": false,
"should_log": false,
"should_save": true,
"should_training_stop": true
},
"attributes": {}
}
},
"total_flos": 2.892950530069994e+19,
"train_batch_size": 1,
"trial_name": null,
"trial_params": null
}