Files
g1_subagent_e1_gpt_long_tacc/trainer_state.json

9563 lines
265 KiB
JSON
Raw Normal View History

{
"best_global_step": null,
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 7.0,
"eval_steps": 500,
"global_step": 4326,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.008090614886731391,
"grad_norm": 11.186269453387633,
"learning_rate": 3.695150115473441e-07,
"loss": 0.8139,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.8276135325431824,
"step": 5,
"valid_targets_mean": 7367.1,
"valid_targets_min": 1791
},
{
"epoch": 0.016181229773462782,
"grad_norm": 11.232529644323693,
"learning_rate": 8.314087759815243e-07,
"loss": 0.7781,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.7600369453430176,
"step": 10,
"valid_targets_mean": 8089.4,
"valid_targets_min": 5145
},
{
"epoch": 0.024271844660194174,
"grad_norm": 10.15603607573941,
"learning_rate": 1.2933025404157046e-06,
"loss": 0.7791,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.7623764872550964,
"step": 15,
"valid_targets_mean": 7736.6,
"valid_targets_min": 2978
},
{
"epoch": 0.032362459546925564,
"grad_norm": 8.428519297500355,
"learning_rate": 1.7551963048498846e-06,
"loss": 0.756,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.7740650177001953,
"step": 20,
"valid_targets_mean": 7745.0,
"valid_targets_min": 2988
},
{
"epoch": 0.040453074433656956,
"grad_norm": 5.849750741120756,
"learning_rate": 2.217090069284065e-06,
"loss": 0.6945,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.7195521593093872,
"step": 25,
"valid_targets_mean": 7508.9,
"valid_targets_min": 3292
},
{
"epoch": 0.04854368932038835,
"grad_norm": 3.999112186202206,
"learning_rate": 2.678983833718245e-06,
"loss": 0.6908,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.7112835645675659,
"step": 30,
"valid_targets_mean": 7365.6,
"valid_targets_min": 3274
},
{
"epoch": 0.05663430420711974,
"grad_norm": 2.3642895753979727,
"learning_rate": 3.1408775981524254e-06,
"loss": 0.6478,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.7030115127563477,
"step": 35,
"valid_targets_mean": 7283.9,
"valid_targets_min": 2285
},
{
"epoch": 0.06472491909385113,
"grad_norm": 1.5453038086692914,
"learning_rate": 3.6027713625866056e-06,
"loss": 0.6036,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.614423394203186,
"step": 40,
"valid_targets_mean": 7289.2,
"valid_targets_min": 2822
},
{
"epoch": 0.07281553398058252,
"grad_norm": 1.2616787513943852,
"learning_rate": 4.064665127020786e-06,
"loss": 0.559,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5736663341522217,
"step": 45,
"valid_targets_mean": 7387.5,
"valid_targets_min": 3823
},
{
"epoch": 0.08090614886731391,
"grad_norm": 1.0884084428534417,
"learning_rate": 4.526558891454966e-06,
"loss": 0.5749,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.564963161945343,
"step": 50,
"valid_targets_mean": 6462.8,
"valid_targets_min": 1285
},
{
"epoch": 0.0889967637540453,
"grad_norm": 0.8836061625007553,
"learning_rate": 4.988452655889146e-06,
"loss": 0.577,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5905070900917053,
"step": 55,
"valid_targets_mean": 9115.1,
"valid_targets_min": 5927
},
{
"epoch": 0.0970873786407767,
"grad_norm": 0.8333417163648019,
"learning_rate": 5.450346420323326e-06,
"loss": 0.5768,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5808031558990479,
"step": 60,
"valid_targets_mean": 7797.2,
"valid_targets_min": 1985
},
{
"epoch": 0.10517799352750809,
"grad_norm": 0.7005772125420773,
"learning_rate": 5.912240184757506e-06,
"loss": 0.5193,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4872642159461975,
"step": 65,
"valid_targets_mean": 7330.4,
"valid_targets_min": 2779
},
{
"epoch": 0.11326860841423948,
"grad_norm": 0.7219020916672013,
"learning_rate": 6.374133949191687e-06,
"loss": 0.499,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.48490405082702637,
"step": 70,
"valid_targets_mean": 7086.4,
"valid_targets_min": 2870
},
{
"epoch": 0.12135922330097088,
"grad_norm": 0.5860056349140036,
"learning_rate": 6.836027713625867e-06,
"loss": 0.534,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.538621187210083,
"step": 75,
"valid_targets_mean": 8391.3,
"valid_targets_min": 880
},
{
"epoch": 0.12944983818770225,
"grad_norm": 0.6746262711354033,
"learning_rate": 7.297921478060047e-06,
"loss": 0.5221,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.48001986742019653,
"step": 80,
"valid_targets_mean": 6497.2,
"valid_targets_min": 3127
},
{
"epoch": 0.13754045307443366,
"grad_norm": 0.5575974584155833,
"learning_rate": 7.759815242494227e-06,
"loss": 0.4746,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4626394212245941,
"step": 85,
"valid_targets_mean": 6541.8,
"valid_targets_min": 3567
},
{
"epoch": 0.14563106796116504,
"grad_norm": 0.5396164383780504,
"learning_rate": 8.221709006928407e-06,
"loss": 0.449,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.46605369448661804,
"step": 90,
"valid_targets_mean": 7617.8,
"valid_targets_min": 3885
},
{
"epoch": 0.15372168284789645,
"grad_norm": 0.6191649901679567,
"learning_rate": 8.683602771362586e-06,
"loss": 0.4983,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5357075929641724,
"step": 95,
"valid_targets_mean": 5710.0,
"valid_targets_min": 284
},
{
"epoch": 0.16181229773462782,
"grad_norm": 0.47894871102676023,
"learning_rate": 9.145496535796767e-06,
"loss": 0.4542,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35243353247642517,
"step": 100,
"valid_targets_mean": 6085.1,
"valid_targets_min": 3073
},
{
"epoch": 0.16990291262135923,
"grad_norm": 0.4740843869327914,
"learning_rate": 9.607390300230948e-06,
"loss": 0.4785,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4505811929702759,
"step": 105,
"valid_targets_mean": 7739.5,
"valid_targets_min": 3524
},
{
"epoch": 0.1779935275080906,
"grad_norm": 0.46112304946532046,
"learning_rate": 1.0069284064665128e-05,
"loss": 0.458,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4704515337944031,
"step": 110,
"valid_targets_mean": 7832.8,
"valid_targets_min": 2404
},
{
"epoch": 0.18608414239482202,
"grad_norm": 0.5109584178686144,
"learning_rate": 1.0531177829099309e-05,
"loss": 0.4322,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.44879865646362305,
"step": 115,
"valid_targets_mean": 6810.3,
"valid_targets_min": 3979
},
{
"epoch": 0.1941747572815534,
"grad_norm": 0.46619850801703333,
"learning_rate": 1.0993071593533488e-05,
"loss": 0.4315,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4397251009941101,
"step": 120,
"valid_targets_mean": 7624.2,
"valid_targets_min": 3905
},
{
"epoch": 0.2022653721682848,
"grad_norm": 0.47702679305743545,
"learning_rate": 1.1454965357967669e-05,
"loss": 0.4447,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.43253201246261597,
"step": 125,
"valid_targets_mean": 6795.1,
"valid_targets_min": 3148
},
{
"epoch": 0.21035598705501618,
"grad_norm": 1.2109949158028912,
"learning_rate": 1.1916859122401848e-05,
"loss": 0.6233,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6370628476142883,
"step": 130,
"valid_targets_mean": 3099.5,
"valid_targets_min": 1256
},
{
"epoch": 0.21844660194174756,
"grad_norm": 0.9744370820075807,
"learning_rate": 1.237875288683603e-05,
"loss": 0.6511,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6300196051597595,
"step": 135,
"valid_targets_mean": 3709.8,
"valid_targets_min": 1344
},
{
"epoch": 0.22653721682847897,
"grad_norm": 0.902472131901638,
"learning_rate": 1.284064665127021e-05,
"loss": 0.6134,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5684735774993896,
"step": 140,
"valid_targets_mean": 2654.6,
"valid_targets_min": 1082
},
{
"epoch": 0.23462783171521034,
"grad_norm": 0.9072911363668095,
"learning_rate": 1.3302540415704388e-05,
"loss": 0.607,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6057754755020142,
"step": 145,
"valid_targets_mean": 2991.8,
"valid_targets_min": 1159
},
{
"epoch": 0.24271844660194175,
"grad_norm": 0.8517220825207069,
"learning_rate": 1.3764434180138568e-05,
"loss": 0.6192,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6334041953086853,
"step": 150,
"valid_targets_mean": 3261.2,
"valid_targets_min": 1281
},
{
"epoch": 0.25080906148867316,
"grad_norm": 0.837155020681443,
"learning_rate": 1.4226327944572749e-05,
"loss": 0.599,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5919010639190674,
"step": 155,
"valid_targets_mean": 3676.6,
"valid_targets_min": 1603
},
{
"epoch": 0.2588996763754045,
"grad_norm": 0.8162992185568456,
"learning_rate": 1.468822170900693e-05,
"loss": 0.597,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5819936990737915,
"step": 160,
"valid_targets_mean": 3011.1,
"valid_targets_min": 1422
},
{
"epoch": 0.2669902912621359,
"grad_norm": 0.7935129254194224,
"learning_rate": 1.5150115473441109e-05,
"loss": 0.567,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5208292603492737,
"step": 165,
"valid_targets_mean": 3071.8,
"valid_targets_min": 1277
},
{
"epoch": 0.2750809061488673,
"grad_norm": 0.8146619781186482,
"learning_rate": 1.561200923787529e-05,
"loss": 0.5688,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.583451509475708,
"step": 170,
"valid_targets_mean": 3090.8,
"valid_targets_min": 1079
},
{
"epoch": 0.28317152103559873,
"grad_norm": 0.7721275818850296,
"learning_rate": 1.607390300230947e-05,
"loss": 0.5882,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5752245187759399,
"step": 175,
"valid_targets_mean": 3369.2,
"valid_targets_min": 1104
},
{
"epoch": 0.2912621359223301,
"grad_norm": 0.7807944253862608,
"learning_rate": 1.653579676674365e-05,
"loss": 0.5595,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.602877676486969,
"step": 180,
"valid_targets_mean": 3657.6,
"valid_targets_min": 1556
},
{
"epoch": 0.2993527508090615,
"grad_norm": 1.237953587348846,
"learning_rate": 1.699769053117783e-05,
"loss": 0.5697,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5734540224075317,
"step": 185,
"valid_targets_mean": 2946.7,
"valid_targets_min": 860
},
{
"epoch": 0.3074433656957929,
"grad_norm": 0.7416704166205575,
"learning_rate": 1.7459584295612013e-05,
"loss": 0.5392,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5371339321136475,
"step": 190,
"valid_targets_mean": 3523.2,
"valid_targets_min": 1404
},
{
"epoch": 0.3155339805825243,
"grad_norm": 0.5535465229823986,
"learning_rate": 1.792147806004619e-05,
"loss": 0.5082,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.46257442235946655,
"step": 195,
"valid_targets_mean": 5521.4,
"valid_targets_min": 1360
},
{
"epoch": 0.32362459546925565,
"grad_norm": 0.7440676720749868,
"learning_rate": 1.838337182448037e-05,
"loss": 0.5344,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5397250652313232,
"step": 200,
"valid_targets_mean": 3396.9,
"valid_targets_min": 1336
},
{
"epoch": 0.33171521035598706,
"grad_norm": 0.7524676198416014,
"learning_rate": 1.8845265588914552e-05,
"loss": 0.5443,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.541986346244812,
"step": 205,
"valid_targets_mean": 3617.4,
"valid_targets_min": 1726
},
{
"epoch": 0.33980582524271846,
"grad_norm": 0.6640846601991444,
"learning_rate": 1.9307159353348733e-05,
"loss": 0.5342,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5500484704971313,
"step": 210,
"valid_targets_mean": 4753.2,
"valid_targets_min": 1146
},
{
"epoch": 0.3478964401294498,
"grad_norm": 0.7894552351445728,
"learning_rate": 1.976905311778291e-05,
"loss": 0.5287,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5164601802825928,
"step": 215,
"valid_targets_mean": 2988.0,
"valid_targets_min": 1665
},
{
"epoch": 0.3559870550161812,
"grad_norm": 0.7612981287051088,
"learning_rate": 2.0230946882217092e-05,
"loss": 0.5401,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6017681360244751,
"step": 220,
"valid_targets_mean": 3400.9,
"valid_targets_min": 985
},
{
"epoch": 0.3640776699029126,
"grad_norm": 0.6939836605089136,
"learning_rate": 2.0692840646651273e-05,
"loss": 0.5343,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5006556510925293,
"step": 225,
"valid_targets_mean": 3745.3,
"valid_targets_min": 1398
},
{
"epoch": 0.37216828478964403,
"grad_norm": 0.6889492438195666,
"learning_rate": 2.115473441108545e-05,
"loss": 0.528,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.48514801263809204,
"step": 230,
"valid_targets_mean": 3360.9,
"valid_targets_min": 1133
},
{
"epoch": 0.3802588996763754,
"grad_norm": 0.7623990047403026,
"learning_rate": 2.1616628175519635e-05,
"loss": 0.5487,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.57421875,
"step": 235,
"valid_targets_mean": 3318.2,
"valid_targets_min": 1383
},
{
"epoch": 0.3883495145631068,
"grad_norm": 0.8608207250476633,
"learning_rate": 2.2078521939953813e-05,
"loss": 0.5549,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5341051816940308,
"step": 240,
"valid_targets_mean": 3564.1,
"valid_targets_min": 1035
},
{
"epoch": 0.3964401294498382,
"grad_norm": 0.8949184784742432,
"learning_rate": 2.2540415704387994e-05,
"loss": 0.5426,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5230085849761963,
"step": 245,
"valid_targets_mean": 2470.4,
"valid_targets_min": 1285
},
{
"epoch": 0.4045307443365696,
"grad_norm": 0.6957663651549183,
"learning_rate": 2.3002309468822172e-05,
"loss": 0.5081,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4455685019493103,
"step": 250,
"valid_targets_mean": 3419.8,
"valid_targets_min": 1415
},
{
"epoch": 0.41262135922330095,
"grad_norm": 0.6856073914304861,
"learning_rate": 2.346420323325635e-05,
"loss": 0.5198,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5033816695213318,
"step": 255,
"valid_targets_mean": 3587.9,
"valid_targets_min": 1375
},
{
"epoch": 0.42071197411003236,
"grad_norm": 0.8179949015928839,
"learning_rate": 2.3926096997690534e-05,
"loss": 0.5441,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5254044532775879,
"step": 260,
"valid_targets_mean": 2614.4,
"valid_targets_min": 1066
},
{
"epoch": 0.42880258899676377,
"grad_norm": 0.7498900598248376,
"learning_rate": 2.438799076212471e-05,
"loss": 0.5174,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5212750434875488,
"step": 265,
"valid_targets_mean": 3381.9,
"valid_targets_min": 1125
},
{
"epoch": 0.4368932038834951,
"grad_norm": 0.7504675090521222,
"learning_rate": 2.4849884526558893e-05,
"loss": 0.5208,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.46384745836257935,
"step": 270,
"valid_targets_mean": 3233.6,
"valid_targets_min": 1199
},
{
"epoch": 0.4449838187702265,
"grad_norm": 0.7916017536563397,
"learning_rate": 2.5311778290993074e-05,
"loss": 0.5024,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4946463704109192,
"step": 275,
"valid_targets_mean": 3305.2,
"valid_targets_min": 1344
},
{
"epoch": 0.45307443365695793,
"grad_norm": 0.6782862035278908,
"learning_rate": 2.5773672055427255e-05,
"loss": 0.4904,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4988747835159302,
"step": 280,
"valid_targets_mean": 3871.6,
"valid_targets_min": 1205
},
{
"epoch": 0.46116504854368934,
"grad_norm": 0.7600807982882761,
"learning_rate": 2.6235565819861432e-05,
"loss": 0.4994,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4982724189758301,
"step": 285,
"valid_targets_mean": 3910.4,
"valid_targets_min": 1450
},
{
"epoch": 0.4692556634304207,
"grad_norm": 0.5993399825918464,
"learning_rate": 2.6697459584295617e-05,
"loss": 0.4788,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4518687129020691,
"step": 290,
"valid_targets_mean": 4702.8,
"valid_targets_min": 2246
},
{
"epoch": 0.4773462783171521,
"grad_norm": 0.7474788095150359,
"learning_rate": 2.7159353348729794e-05,
"loss": 0.51,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5318153500556946,
"step": 295,
"valid_targets_mean": 3323.4,
"valid_targets_min": 1348
},
{
"epoch": 0.4854368932038835,
"grad_norm": 0.6444802845925507,
"learning_rate": 2.7621247113163975e-05,
"loss": 0.4758,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4648396372795105,
"step": 300,
"valid_targets_mean": 3920.9,
"valid_targets_min": 1318
},
{
"epoch": 0.4935275080906149,
"grad_norm": 0.6015753165422811,
"learning_rate": 2.8083140877598153e-05,
"loss": 0.4764,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5057991743087769,
"step": 305,
"valid_targets_mean": 4233.6,
"valid_targets_min": 1361
},
{
"epoch": 0.5016181229773463,
"grad_norm": 0.8937976596128937,
"learning_rate": 2.8545034642032338e-05,
"loss": 0.5102,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5273138284683228,
"step": 310,
"valid_targets_mean": 3595.1,
"valid_targets_min": 1368
},
{
"epoch": 0.5097087378640777,
"grad_norm": 0.7060203395582099,
"learning_rate": 2.9006928406466515e-05,
"loss": 0.5119,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5150483250617981,
"step": 315,
"valid_targets_mean": 3354.8,
"valid_targets_min": 1186
},
{
"epoch": 0.517799352750809,
"grad_norm": 0.6260717983381987,
"learning_rate": 2.9468822170900696e-05,
"loss": 0.454,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.45638102293014526,
"step": 320,
"valid_targets_mean": 4103.5,
"valid_targets_min": 1405
},
{
"epoch": 0.5258899676375405,
"grad_norm": 0.6771131697225247,
"learning_rate": 2.9930715935334874e-05,
"loss": 0.4654,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.452455073595047,
"step": 325,
"valid_targets_mean": 4204.2,
"valid_targets_min": 941
},
{
"epoch": 0.5339805825242718,
"grad_norm": 0.6764922910260465,
"learning_rate": 3.0392609699769055e-05,
"loss": 0.4769,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4742300808429718,
"step": 330,
"valid_targets_mean": 4473.8,
"valid_targets_min": 1696
},
{
"epoch": 0.5420711974110033,
"grad_norm": 0.7962549126746353,
"learning_rate": 3.0854503464203236e-05,
"loss": 0.4637,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.47426992654800415,
"step": 335,
"valid_targets_mean": 2837.8,
"valid_targets_min": 1330
},
{
"epoch": 0.5501618122977346,
"grad_norm": 0.5727443646037912,
"learning_rate": 3.131639722863742e-05,
"loss": 0.4537,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4242827892303467,
"step": 340,
"valid_targets_mean": 4635.1,
"valid_targets_min": 1166
},
{
"epoch": 0.558252427184466,
"grad_norm": 0.7378350621646511,
"learning_rate": 3.17782909930716e-05,
"loss": 0.4565,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5066303014755249,
"step": 345,
"valid_targets_mean": 3667.0,
"valid_targets_min": 1395
},
{
"epoch": 0.5663430420711975,
"grad_norm": 0.6783611200487234,
"learning_rate": 3.224018475750577e-05,
"loss": 0.4616,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4323498606681824,
"step": 350,
"valid_targets_mean": 4262.1,
"valid_targets_min": 940
},
{
"epoch": 0.5744336569579288,
"grad_norm": 0.757137324177695,
"learning_rate": 3.270207852193996e-05,
"loss": 0.4876,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.48740166425704956,
"step": 355,
"valid_targets_mean": 3191.4,
"valid_targets_min": 1688
},
{
"epoch": 0.5825242718446602,
"grad_norm": 0.6858210837377695,
"learning_rate": 3.3163972286374135e-05,
"loss": 0.4397,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.43850621581077576,
"step": 360,
"valid_targets_mean": 3711.2,
"valid_targets_min": 1280
},
{
"epoch": 0.5906148867313916,
"grad_norm": 0.6287374086435015,
"learning_rate": 3.3625866050808316e-05,
"loss": 0.4219,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.40141230821609497,
"step": 365,
"valid_targets_mean": 4141.0,
"valid_targets_min": 1576
},
{
"epoch": 0.598705501618123,
"grad_norm": 0.6975941132702707,
"learning_rate": 3.40877598152425e-05,
"loss": 0.4847,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5583797097206116,
"step": 370,
"valid_targets_mean": 3920.6,
"valid_targets_min": 993
},
{
"epoch": 0.6067961165048543,
"grad_norm": 0.7279439914063431,
"learning_rate": 3.454965357967668e-05,
"loss": 0.4577,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4639485478401184,
"step": 375,
"valid_targets_mean": 2930.4,
"valid_targets_min": 1271
},
{
"epoch": 0.6148867313915858,
"grad_norm": 0.6768702572313738,
"learning_rate": 3.501154734411086e-05,
"loss": 0.4622,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.490790992975235,
"step": 380,
"valid_targets_mean": 3889.4,
"valid_targets_min": 1109
},
{
"epoch": 0.6229773462783171,
"grad_norm": 0.6487053280504474,
"learning_rate": 3.547344110854504e-05,
"loss": 0.4638,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.45948219299316406,
"step": 385,
"valid_targets_mean": 4169.0,
"valid_targets_min": 1262
},
{
"epoch": 0.6310679611650486,
"grad_norm": 0.882983035029029,
"learning_rate": 3.5935334872979214e-05,
"loss": 0.4749,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5022059082984924,
"step": 390,
"valid_targets_mean": 2340.9,
"valid_targets_min": 1380
},
{
"epoch": 0.63915857605178,
"grad_norm": 0.6320317979894593,
"learning_rate": 3.63972286374134e-05,
"loss": 0.4486,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.40444374084472656,
"step": 395,
"valid_targets_mean": 3383.8,
"valid_targets_min": 1136
},
{
"epoch": 0.6472491909385113,
"grad_norm": 0.5818960322996949,
"learning_rate": 3.6859122401847576e-05,
"loss": 0.4295,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4237382411956787,
"step": 400,
"valid_targets_mean": 4683.7,
"valid_targets_min": 1129
},
{
"epoch": 0.6553398058252428,
"grad_norm": 0.809577266579874,
"learning_rate": 3.732101616628176e-05,
"loss": 0.4313,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.45975261926651,
"step": 405,
"valid_targets_mean": 3994.8,
"valid_targets_min": 1930
},
{
"epoch": 0.6634304207119741,
"grad_norm": 0.659659549528883,
"learning_rate": 3.778290993071594e-05,
"loss": 0.4204,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.43026500940322876,
"step": 410,
"valid_targets_mean": 3837.7,
"valid_targets_min": 1419
},
{
"epoch": 0.6715210355987055,
"grad_norm": 0.7331448698616245,
"learning_rate": 3.824480369515012e-05,
"loss": 0.4221,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.44799500703811646,
"step": 415,
"valid_targets_mean": 3206.0,
"valid_targets_min": 849
},
{
"epoch": 0.6796116504854369,
"grad_norm": 0.6992820860572108,
"learning_rate": 3.87066974595843e-05,
"loss": 0.4319,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.41871821880340576,
"step": 420,
"valid_targets_mean": 3158.6,
"valid_targets_min": 1188
},
{
"epoch": 0.6877022653721683,
"grad_norm": 0.5903634393524475,
"learning_rate": 3.9168591224018475e-05,
"loss": 0.4447,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4192928969860077,
"step": 425,
"valid_targets_mean": 4985.4,
"valid_targets_min": 1162
},
{
"epoch": 0.6957928802588996,
"grad_norm": 0.6935560552905831,
"learning_rate": 3.963048498845266e-05,
"loss": 0.4453,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4519827365875244,
"step": 430,
"valid_targets_mean": 3605.8,
"valid_targets_min": 1229
},
{
"epoch": 0.7038834951456311,
"grad_norm": 0.6756947997969236,
"learning_rate": 3.999999348775225e-05,
"loss": 0.4414,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.47775375843048096,
"step": 435,
"valid_targets_mean": 3628.4,
"valid_targets_min": 1204
},
{
"epoch": 0.7119741100323624,
"grad_norm": 0.7329858551067672,
"learning_rate": 3.9999765559526296e-05,
"loss": 0.4066,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.40486299991607666,
"step": 440,
"valid_targets_mean": 4005.9,
"valid_targets_min": 1431
},
{
"epoch": 0.7200647249190939,
"grad_norm": 0.6595983242797786,
"learning_rate": 3.999921202315374e-05,
"loss": 0.4161,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3833836317062378,
"step": 445,
"valid_targets_mean": 3881.7,
"valid_targets_min": 1211
},
{
"epoch": 0.7281553398058253,
"grad_norm": 0.6727930683168484,
"learning_rate": 3.9998332887646504e-05,
"loss": 0.4495,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4389573633670807,
"step": 450,
"valid_targets_mean": 3740.8,
"valid_targets_min": 1231
},
{
"epoch": 0.7362459546925566,
"grad_norm": 0.9466550805793468,
"learning_rate": 3.999712816731743e-05,
"loss": 0.4347,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3840217590332031,
"step": 455,
"valid_targets_mean": 3616.2,
"valid_targets_min": 1364
},
{
"epoch": 0.7443365695792881,
"grad_norm": 0.6217684732379861,
"learning_rate": 3.999559788178009e-05,
"loss": 0.4305,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.41253650188446045,
"step": 460,
"valid_targets_mean": 3856.8,
"valid_targets_min": 1141
},
{
"epoch": 0.7524271844660194,
"grad_norm": 0.6248857718707198,
"learning_rate": 3.999374205594845e-05,
"loss": 0.3917,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30960381031036377,
"step": 465,
"valid_targets_mean": 6443.2,
"valid_targets_min": 2485
},
{
"epoch": 0.7605177993527508,
"grad_norm": 0.5872970629177866,
"learning_rate": 3.999156072003646e-05,
"loss": 0.3286,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28291448950767517,
"step": 470,
"valid_targets_mean": 5332.4,
"valid_targets_min": 824
},
{
"epoch": 0.7686084142394822,
"grad_norm": 0.47835828651939827,
"learning_rate": 3.9989053909557576e-05,
"loss": 0.301,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31238192319869995,
"step": 475,
"valid_targets_mean": 6187.7,
"valid_targets_min": 2207
},
{
"epoch": 0.7766990291262136,
"grad_norm": 0.4871074224017115,
"learning_rate": 3.998622166532417e-05,
"loss": 0.2968,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2571246922016144,
"step": 480,
"valid_targets_mean": 5631.6,
"valid_targets_min": 2795
},
{
"epoch": 0.7847896440129449,
"grad_norm": 0.4263025040455046,
"learning_rate": 3.998306403344688e-05,
"loss": 0.3239,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31412506103515625,
"step": 485,
"valid_targets_mean": 7407.4,
"valid_targets_min": 1902
},
{
"epoch": 0.7928802588996764,
"grad_norm": 0.47947323925930374,
"learning_rate": 3.997958106533383e-05,
"loss": 0.2648,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2837316691875458,
"step": 490,
"valid_targets_mean": 5209.8,
"valid_targets_min": 2991
},
{
"epoch": 0.8009708737864077,
"grad_norm": 0.5128232630032378,
"learning_rate": 3.997577281768982e-05,
"loss": 0.2904,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35242921113967896,
"step": 495,
"valid_targets_mean": 6012.4,
"valid_targets_min": 3782
},
{
"epoch": 0.8090614886731392,
"grad_norm": 0.5145002636153433,
"learning_rate": 3.997163935251543e-05,
"loss": 0.2717,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2537648379802704,
"step": 500,
"valid_targets_mean": 5490.8,
"valid_targets_min": 3401
},
{
"epoch": 0.8171521035598706,
"grad_norm": 0.5086616334315329,
"learning_rate": 3.996718073710591e-05,
"loss": 0.3009,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30033719539642334,
"step": 505,
"valid_targets_mean": 5865.4,
"valid_targets_min": 4021
},
{
"epoch": 0.8252427184466019,
"grad_norm": 0.47029052122275783,
"learning_rate": 3.9962397044050206e-05,
"loss": 0.2726,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24913957715034485,
"step": 510,
"valid_targets_mean": 5680.2,
"valid_targets_min": 379
},
{
"epoch": 0.8333333333333334,
"grad_norm": 0.4245474236012608,
"learning_rate": 3.99572883512297e-05,
"loss": 0.2825,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23057851195335388,
"step": 515,
"valid_targets_mean": 5873.6,
"valid_targets_min": 1280
},
{
"epoch": 0.8414239482200647,
"grad_norm": 0.5632911300790845,
"learning_rate": 3.9951854741816954e-05,
"loss": 0.2714,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33303922414779663,
"step": 520,
"valid_targets_mean": 4735.3,
"valid_targets_min": 392
},
{
"epoch": 0.8495145631067961,
"grad_norm": 0.5155264290831733,
"learning_rate": 3.99460963042744e-05,
"loss": 0.2956,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29260292649269104,
"step": 525,
"valid_targets_mean": 5192.4,
"valid_targets_min": 647
},
{
"epoch": 0.8576051779935275,
"grad_norm": 0.46935004835095295,
"learning_rate": 3.994001313235283e-05,
"loss": 0.2813,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25767964124679565,
"step": 530,
"valid_targets_mean": 5253.4,
"valid_targets_min": 253
},
{
"epoch": 0.8656957928802589,
"grad_norm": 0.49629700003966337,
"learning_rate": 3.993360532508993e-05,
"loss": 0.3169,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36085793375968933,
"step": 535,
"valid_targets_mean": 5694.6,
"valid_targets_min": 503
},
{
"epoch": 0.8737864077669902,
"grad_norm": 0.483093900599472,
"learning_rate": 3.9926872986808626e-05,
"loss": 0.2831,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2917660176753998,
"step": 540,
"valid_targets_mean": 5798.9,
"valid_targets_min": 1824
},
{
"epoch": 0.8818770226537217,
"grad_norm": 0.5566582367562767,
"learning_rate": 3.991981622711542e-05,
"loss": 0.2738,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2825314998626709,
"step": 545,
"valid_targets_mean": 6017.6,
"valid_targets_min": 2360
},
{
"epoch": 0.889967637540453,
"grad_norm": 0.46853180296707475,
"learning_rate": 3.991243516089859e-05,
"loss": 0.3011,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3398240804672241,
"step": 550,
"valid_targets_mean": 7051.8,
"valid_targets_min": 3489
},
{
"epoch": 0.8980582524271845,
"grad_norm": 0.4847865772351801,
"learning_rate": 3.9904729908326295e-05,
"loss": 0.3071,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3135841190814972,
"step": 555,
"valid_targets_mean": 6098.8,
"valid_targets_min": 1470
},
{
"epoch": 0.9061488673139159,
"grad_norm": 0.5003251836794501,
"learning_rate": 3.989670059484465e-05,
"loss": 0.2655,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2598843574523926,
"step": 560,
"valid_targets_mean": 4782.9,
"valid_targets_min": 366
},
{
"epoch": 0.9142394822006472,
"grad_norm": 0.4802100079311373,
"learning_rate": 3.98883473511757e-05,
"loss": 0.2884,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2555955648422241,
"step": 565,
"valid_targets_mean": 5752.4,
"valid_targets_min": 3100
},
{
"epoch": 0.9223300970873787,
"grad_norm": 0.3865047150890052,
"learning_rate": 3.987967031331523e-05,
"loss": 0.2452,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2043823003768921,
"step": 570,
"valid_targets_mean": 6254.7,
"valid_targets_min": 2156
},
{
"epoch": 0.93042071197411,
"grad_norm": 0.5425912868516275,
"learning_rate": 3.987066962253063e-05,
"loss": 0.266,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2928149700164795,
"step": 575,
"valid_targets_mean": 5049.7,
"valid_targets_min": 295
},
{
"epoch": 0.9385113268608414,
"grad_norm": 0.4214568082838799,
"learning_rate": 3.9861345425358506e-05,
"loss": 0.2795,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2728239893913269,
"step": 580,
"valid_targets_mean": 6636.9,
"valid_targets_min": 333
},
{
"epoch": 0.9466019417475728,
"grad_norm": 0.6495980738785143,
"learning_rate": 3.985169787360238e-05,
"loss": 0.2544,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2546083927154541,
"step": 585,
"valid_targets_mean": 5273.4,
"valid_targets_min": 2580
},
{
"epoch": 0.9546925566343042,
"grad_norm": 0.46365767656806356,
"learning_rate": 3.984172712433016e-05,
"loss": 0.2752,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27528953552246094,
"step": 590,
"valid_targets_mean": 5552.4,
"valid_targets_min": 396
},
{
"epoch": 0.9627831715210357,
"grad_norm": 0.49542433641132066,
"learning_rate": 3.983143333987161e-05,
"loss": 0.2723,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3295291066169739,
"step": 595,
"valid_targets_mean": 7252.6,
"valid_targets_min": 4266
},
{
"epoch": 0.970873786407767,
"grad_norm": 0.4815053281189472,
"learning_rate": 3.98208166878157e-05,
"loss": 0.2863,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2819350063800812,
"step": 600,
"valid_targets_mean": 5798.0,
"valid_targets_min": 2925
},
{
"epoch": 0.9789644012944984,
"grad_norm": 0.4362018609694083,
"learning_rate": 3.9809877341007865e-05,
"loss": 0.2741,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24610409140586853,
"step": 605,
"valid_targets_mean": 6265.6,
"valid_targets_min": 2353
},
{
"epoch": 0.9870550161812298,
"grad_norm": 0.5255099169324821,
"learning_rate": 3.979861547754723e-05,
"loss": 0.2757,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2738872766494751,
"step": 610,
"valid_targets_mean": 5500.2,
"valid_targets_min": 2785
},
{
"epoch": 0.9951456310679612,
"grad_norm": 0.5814595529767955,
"learning_rate": 3.9787031280783665e-05,
"loss": 0.2734,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.255471408367157,
"step": 615,
"valid_targets_mean": 6825.4,
"valid_targets_min": 2113
},
{
"epoch": 1.0032362459546926,
"grad_norm": 0.521264035103106,
"learning_rate": 3.977512493931482e-05,
"loss": 0.3291,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4585817754268646,
"step": 620,
"valid_targets_mean": 8109.9,
"valid_targets_min": 2721
},
{
"epoch": 1.0113268608414239,
"grad_norm": 0.4980974525271715,
"learning_rate": 3.976289664698305e-05,
"loss": 0.3732,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3889613449573517,
"step": 625,
"valid_targets_mean": 7440.1,
"valid_targets_min": 295
},
{
"epoch": 1.0194174757281553,
"grad_norm": 0.44838727254780897,
"learning_rate": 3.9750346602872275e-05,
"loss": 0.3719,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36031463742256165,
"step": 630,
"valid_targets_mean": 6666.0,
"valid_targets_min": 436
},
{
"epoch": 1.0275080906148868,
"grad_norm": 0.511448483931203,
"learning_rate": 3.973747501130473e-05,
"loss": 0.368,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29179736971855164,
"step": 635,
"valid_targets_mean": 6712.9,
"valid_targets_min": 2430
},
{
"epoch": 1.035598705501618,
"grad_norm": 0.48412379318776255,
"learning_rate": 3.97242820818376e-05,
"loss": 0.3673,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3734421133995056,
"step": 640,
"valid_targets_mean": 7593.6,
"valid_targets_min": 2385
},
{
"epoch": 1.0436893203883495,
"grad_norm": 0.5767574946446217,
"learning_rate": 3.9710768029259695e-05,
"loss": 0.3601,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4075170159339905,
"step": 645,
"valid_targets_mean": 8572.8,
"valid_targets_min": 3812
},
{
"epoch": 1.051779935275081,
"grad_norm": 0.47192799914503875,
"learning_rate": 3.9696933073587864e-05,
"loss": 0.3725,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3301822543144226,
"step": 650,
"valid_targets_mean": 7005.8,
"valid_targets_min": 2432
},
{
"epoch": 1.0598705501618122,
"grad_norm": 0.6861685062218944,
"learning_rate": 3.9682777440063455e-05,
"loss": 0.3764,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3679102659225464,
"step": 655,
"valid_targets_mean": 7800.5,
"valid_targets_min": 2317
},
{
"epoch": 1.0679611650485437,
"grad_norm": 0.4525527931845314,
"learning_rate": 3.9668301359148655e-05,
"loss": 0.337,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3416500389575958,
"step": 660,
"valid_targets_mean": 7407.8,
"valid_targets_min": 3408
},
{
"epoch": 1.0760517799352751,
"grad_norm": 0.49486536104768347,
"learning_rate": 3.965350506652272e-05,
"loss": 0.3433,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34230512380599976,
"step": 665,
"valid_targets_mean": 7218.2,
"valid_targets_min": 3958
},
{
"epoch": 1.0841423948220066,
"grad_norm": 0.5052558310995379,
"learning_rate": 3.963838880307815e-05,
"loss": 0.3595,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37526077032089233,
"step": 670,
"valid_targets_mean": 6286.2,
"valid_targets_min": 2470
},
{
"epoch": 1.0922330097087378,
"grad_norm": 0.4834432080334965,
"learning_rate": 3.962295281491674e-05,
"loss": 0.3608,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39830780029296875,
"step": 675,
"valid_targets_mean": 8067.4,
"valid_targets_min": 3465
},
{
"epoch": 1.1003236245954693,
"grad_norm": 0.6282704766855602,
"learning_rate": 3.960719735334562e-05,
"loss": 0.3643,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32480061054229736,
"step": 680,
"valid_targets_mean": 7811.1,
"valid_targets_min": 3446
},
{
"epoch": 1.1084142394822007,
"grad_norm": 0.490852558536864,
"learning_rate": 3.959112267487314e-05,
"loss": 0.3459,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3614788055419922,
"step": 685,
"valid_targets_mean": 7021.4,
"valid_targets_min": 3473
},
{
"epoch": 1.116504854368932,
"grad_norm": 0.47061983952914566,
"learning_rate": 3.957472904120467e-05,
"loss": 0.3433,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3086751103401184,
"step": 690,
"valid_targets_mean": 5997.2,
"valid_targets_min": 987
},
{
"epoch": 1.1245954692556634,
"grad_norm": 0.44888571078972783,
"learning_rate": 3.955801671923837e-05,
"loss": 0.389,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3621148467063904,
"step": 695,
"valid_targets_mean": 7148.6,
"valid_targets_min": 4702
},
{
"epoch": 1.132686084142395,
"grad_norm": 0.56027022071704,
"learning_rate": 3.954098598106084e-05,
"loss": 0.3514,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.325370728969574,
"step": 700,
"valid_targets_mean": 7563.4,
"valid_targets_min": 2494
},
{
"epoch": 1.1407766990291262,
"grad_norm": 0.4720884795289638,
"learning_rate": 3.952363710394269e-05,
"loss": 0.3358,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32920920848846436,
"step": 705,
"valid_targets_mean": 7400.8,
"valid_targets_min": 2898
},
{
"epoch": 1.1488673139158576,
"grad_norm": 0.45290892818769596,
"learning_rate": 3.9505970370334015e-05,
"loss": 0.3353,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32364755868911743,
"step": 710,
"valid_targets_mean": 6554.0,
"valid_targets_min": 2859
},
{
"epoch": 1.156957928802589,
"grad_norm": 0.4348077835242573,
"learning_rate": 3.94879860678598e-05,
"loss": 0.3591,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35393470525741577,
"step": 715,
"valid_targets_mean": 8087.6,
"valid_targets_min": 3121
},
{
"epoch": 1.1650485436893203,
"grad_norm": 0.4227594099516516,
"learning_rate": 3.9469684489315256e-05,
"loss": 0.3497,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35017964243888855,
"step": 720,
"valid_targets_mean": 7483.6,
"valid_targets_min": 2526
},
{
"epoch": 1.1731391585760518,
"grad_norm": 0.4500296851620212,
"learning_rate": 3.945106593266102e-05,
"loss": 0.3508,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3622860312461853,
"step": 725,
"valid_targets_mean": 7937.6,
"valid_targets_min": 2332
},
{
"epoch": 1.1812297734627832,
"grad_norm": 0.5414055066436431,
"learning_rate": 3.943213070101834e-05,
"loss": 0.3473,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29072365164756775,
"step": 730,
"valid_targets_mean": 5858.5,
"valid_targets_min": 1991
},
{
"epoch": 1.1893203883495145,
"grad_norm": 0.481425269083926,
"learning_rate": 3.941287910266411e-05,
"loss": 0.3431,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29667848348617554,
"step": 735,
"valid_targets_mean": 6832.9,
"valid_targets_min": 2464
},
{
"epoch": 1.197411003236246,
"grad_norm": 0.5068660041921702,
"learning_rate": 3.9393311451025865e-05,
"loss": 0.3288,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37615975737571716,
"step": 740,
"valid_targets_mean": 7922.1,
"valid_targets_min": 3838
},
{
"epoch": 1.2055016181229774,
"grad_norm": 0.9147445359533504,
"learning_rate": 3.937342806467668e-05,
"loss": 0.3891,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.48667970299720764,
"step": 745,
"valid_targets_mean": 3412.1,
"valid_targets_min": 1423
},
{
"epoch": 1.2135922330097086,
"grad_norm": 0.888516798970824,
"learning_rate": 3.935322926732998e-05,
"loss": 0.5244,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.49741584062576294,
"step": 750,
"valid_targets_mean": 3334.9,
"valid_targets_min": 1457
},
{
"epoch": 1.22168284789644,
"grad_norm": 0.7818920652158852,
"learning_rate": 3.933271538783427e-05,
"loss": 0.5071,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4418655037879944,
"step": 755,
"valid_targets_mean": 3261.9,
"valid_targets_min": 1130
},
{
"epoch": 1.2297734627831716,
"grad_norm": 0.7776487371115436,
"learning_rate": 3.931188676016777e-05,
"loss": 0.4713,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4955318570137024,
"step": 760,
"valid_targets_mean": 3196.9,
"valid_targets_min": 1352
},
{
"epoch": 1.237864077669903,
"grad_norm": 0.7930021342526781,
"learning_rate": 3.9290743723433e-05,
"loss": 0.5166,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5079530477523804,
"step": 765,
"valid_targets_mean": 3218.4,
"valid_targets_min": 1283
},
{
"epoch": 1.2459546925566343,
"grad_norm": 0.7909110791334379,
"learning_rate": 3.926928662185126e-05,
"loss": 0.491,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4915957450866699,
"step": 770,
"valid_targets_mean": 3128.2,
"valid_targets_min": 1174
},
{
"epoch": 1.2540453074433657,
"grad_norm": 0.765823080609702,
"learning_rate": 3.924751580475698e-05,
"loss": 0.4924,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.494957834482193,
"step": 775,
"valid_targets_mean": 3595.7,
"valid_targets_min": 1167
},
{
"epoch": 1.262135922330097,
"grad_norm": 1.045712855129931,
"learning_rate": 3.922543162659209e-05,
"loss": 0.486,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.507395327091217,
"step": 780,
"valid_targets_mean": 2384.2,
"valid_targets_min": 1050
},
{
"epoch": 1.2702265372168284,
"grad_norm": 0.8850101405229774,
"learning_rate": 3.9203034446900224e-05,
"loss": 0.4854,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.507400393486023,
"step": 785,
"valid_targets_mean": 2044.2,
"valid_targets_min": 1031
},
{
"epoch": 1.27831715210356,
"grad_norm": 0.7931562943412704,
"learning_rate": 3.918032463032086e-05,
"loss": 0.478,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.521835446357727,
"step": 790,
"valid_targets_mean": 2718.1,
"valid_targets_min": 1454
},
{
"epoch": 1.2864077669902914,
"grad_norm": 0.723093300351076,
"learning_rate": 3.9157302546583406e-05,
"loss": 0.485,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4650059938430786,
"step": 795,
"valid_targets_mean": 3258.4,
"valid_targets_min": 1497
},
{
"epoch": 1.2944983818770226,
"grad_norm": 0.7343947043384617,
"learning_rate": 3.913396857050115e-05,
"loss": 0.4742,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4760621190071106,
"step": 800,
"valid_targets_mean": 3150.2,
"valid_targets_min": 1604
},
{
"epoch": 1.302588996763754,
"grad_norm": 0.7778238888894733,
"learning_rate": 3.911032308196518e-05,
"loss": 0.4759,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4637409448623657,
"step": 805,
"valid_targets_mean": 2876.9,
"valid_targets_min": 1155
},
{
"epoch": 1.3106796116504853,
"grad_norm": 0.6288806794338688,
"learning_rate": 3.9086366465938194e-05,
"loss": 0.4464,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.42423275113105774,
"step": 810,
"valid_targets_mean": 4079.6,
"valid_targets_min": 1052
},
{
"epoch": 1.3187702265372168,
"grad_norm": 0.6926348687095119,
"learning_rate": 3.906209911244823e-05,
"loss": 0.438,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4340791702270508,
"step": 815,
"valid_targets_mean": 3415.6,
"valid_targets_min": 1602
},
{
"epoch": 1.3268608414239482,
"grad_norm": 0.726835789472572,
"learning_rate": 3.903752141658232e-05,
"loss": 0.4684,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.44731298089027405,
"step": 820,
"valid_targets_mean": 3181.6,
"valid_targets_min": 1316
},
{
"epoch": 1.3349514563106797,
"grad_norm": 0.789554550375042,
"learning_rate": 3.9012633778480054e-05,
"loss": 0.4608,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4829597473144531,
"step": 825,
"valid_targets_mean": 3121.9,
"valid_targets_min": 1419
},
{
"epoch": 1.343042071197411,
"grad_norm": 0.6713483819715406,
"learning_rate": 3.8987436603327064e-05,
"loss": 0.458,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.47119760513305664,
"step": 830,
"valid_targets_mean": 3586.2,
"valid_targets_min": 1317
},
{
"epoch": 1.3511326860841424,
"grad_norm": 0.7427556747463112,
"learning_rate": 3.896193030134844e-05,
"loss": 0.4479,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4320055842399597,
"step": 835,
"valid_targets_mean": 2831.5,
"valid_targets_min": 970
},
{
"epoch": 1.3592233009708738,
"grad_norm": 0.722101202230116,
"learning_rate": 3.893611528780204e-05,
"loss": 0.4705,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4457879662513733,
"step": 840,
"valid_targets_mean": 3350.7,
"valid_targets_min": 1482
},
{
"epoch": 1.367313915857605,
"grad_norm": 0.6930675610937002,
"learning_rate": 3.890999198297171e-05,
"loss": 0.4597,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.41945701837539673,
"step": 845,
"valid_targets_mean": 3731.3,
"valid_targets_min": 2450
},
{
"epoch": 1.3754045307443366,
"grad_norm": 0.8212062520721645,
"learning_rate": 3.888356081216049e-05,
"loss": 0.4658,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.520559549331665,
"step": 850,
"valid_targets_mean": 2778.6,
"valid_targets_min": 1161
},
{
"epoch": 1.383495145631068,
"grad_norm": 0.9671309453773359,
"learning_rate": 3.8856822205683646e-05,
"loss": 0.4742,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5014246702194214,
"step": 855,
"valid_targets_mean": 2516.2,
"valid_targets_min": 1147
},
{
"epoch": 1.3915857605177995,
"grad_norm": 0.7705302765883373,
"learning_rate": 3.882977659886169e-05,
"loss": 0.4759,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4699862003326416,
"step": 860,
"valid_targets_mean": 2672.7,
"valid_targets_min": 1160
},
{
"epoch": 1.3996763754045307,
"grad_norm": 0.7439341275062549,
"learning_rate": 3.8802424432013283e-05,
"loss": 0.4733,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.47823020815849304,
"step": 865,
"valid_targets_mean": 3144.7,
"valid_targets_min": 1229
},
{
"epoch": 1.4077669902912622,
"grad_norm": 0.8048849865194836,
"learning_rate": 3.8774766150448055e-05,
"loss": 0.4449,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4707701802253723,
"step": 870,
"valid_targets_mean": 2757.4,
"valid_targets_min": 1187
},
{
"epoch": 1.4158576051779934,
"grad_norm": 0.7629841202120125,
"learning_rate": 3.874680220445938e-05,
"loss": 0.4529,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4569883346557617,
"step": 875,
"valid_targets_mean": 3186.5,
"valid_targets_min": 1140
},
{
"epoch": 1.4239482200647249,
"grad_norm": 0.7580278084324503,
"learning_rate": 3.871853304931701e-05,
"loss": 0.4673,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4785604178905487,
"step": 880,
"valid_targets_mean": 2945.1,
"valid_targets_min": 1342
},
{
"epoch": 1.4320388349514563,
"grad_norm": 0.7573866517699648,
"learning_rate": 3.8689959145259725e-05,
"loss": 0.4502,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4420326352119446,
"step": 885,
"valid_targets_mean": 2664.8,
"valid_targets_min": 1158
},
{
"epoch": 1.4401294498381878,
"grad_norm": 0.7250738746302343,
"learning_rate": 3.866108095748776e-05,
"loss": 0.4507,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4741765856742859,
"step": 890,
"valid_targets_mean": 3277.8,
"valid_targets_min": 905
},
{
"epoch": 1.448220064724919,
"grad_norm": 0.6758182045981384,
"learning_rate": 3.863189895615529e-05,
"loss": 0.4262,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3965120017528534,
"step": 895,
"valid_targets_mean": 3435.2,
"valid_targets_min": 1523
},
{
"epoch": 1.4563106796116505,
"grad_norm": 0.7611603876330763,
"learning_rate": 3.8602413616362745e-05,
"loss": 0.4358,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39768022298812866,
"step": 900,
"valid_targets_mean": 4198.9,
"valid_targets_min": 916
},
{
"epoch": 1.4644012944983817,
"grad_norm": 0.6247879749803259,
"learning_rate": 3.85726254181491e-05,
"loss": 0.4136,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.42923057079315186,
"step": 905,
"valid_targets_mean": 4307.2,
"valid_targets_min": 1372
},
{
"epoch": 1.4724919093851132,
"grad_norm": 0.590220922731002,
"learning_rate": 3.8542534846484055e-05,
"loss": 0.4118,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38480812311172485,
"step": 910,
"valid_targets_mean": 4283.3,
"valid_targets_min": 965
},
{
"epoch": 1.4805825242718447,
"grad_norm": 0.6691179747584267,
"learning_rate": 3.8512142391260085e-05,
"loss": 0.4168,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4205031394958496,
"step": 915,
"valid_targets_mean": 4556.1,
"valid_targets_min": 1616
},
{
"epoch": 1.4886731391585761,
"grad_norm": 0.6291998089233802,
"learning_rate": 3.848144854728457e-05,
"loss": 0.3915,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3751159906387329,
"step": 920,
"valid_targets_mean": 3447.2,
"valid_targets_min": 1306
},
{
"epoch": 1.4967637540453074,
"grad_norm": 0.6968952350014663,
"learning_rate": 3.8450453814271636e-05,
"loss": 0.4098,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4444117546081543,
"step": 925,
"valid_targets_mean": 4328.6,
"valid_targets_min": 1066
},
{
"epoch": 1.5048543689320388,
"grad_norm": 0.6409550468842742,
"learning_rate": 3.8419158696834075e-05,
"loss": 0.4407,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4060596227645874,
"step": 930,
"valid_targets_mean": 3835.6,
"valid_targets_min": 265
},
{
"epoch": 1.51294498381877,
"grad_norm": 0.6424363352174571,
"learning_rate": 3.8387563704475124e-05,
"loss": 0.418,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3603544533252716,
"step": 935,
"valid_targets_mean": 3986.9,
"valid_targets_min": 1113
},
{
"epoch": 1.5210355987055015,
"grad_norm": 0.5995176367642314,
"learning_rate": 3.835566935158015e-05,
"loss": 0.3899,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3868566155433655,
"step": 940,
"valid_targets_mean": 4109.8,
"valid_targets_min": 1541
},
{
"epoch": 1.529126213592233,
"grad_norm": 0.6241850671944227,
"learning_rate": 3.8323476157408315e-05,
"loss": 0.3986,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4304489493370056,
"step": 945,
"valid_targets_mean": 4168.6,
"valid_targets_min": 2291
},
{
"epoch": 1.5372168284789645,
"grad_norm": 1.040760910988651,
"learning_rate": 3.8290984646084056e-05,
"loss": 0.4085,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3906440734863281,
"step": 950,
"valid_targets_mean": 4216.5,
"valid_targets_min": 1752
},
{
"epoch": 1.545307443365696,
"grad_norm": 0.6519945827789969,
"learning_rate": 3.825819534658862e-05,
"loss": 0.3955,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4096558094024658,
"step": 955,
"valid_targets_mean": 3781.9,
"valid_targets_min": 1305
},
{
"epoch": 1.5533980582524272,
"grad_norm": 0.6479752533944285,
"learning_rate": 3.822510879275142e-05,
"loss": 0.3855,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37997305393218994,
"step": 960,
"valid_targets_mean": 3348.1,
"valid_targets_min": 1135
},
{
"epoch": 1.5614886731391586,
"grad_norm": 0.588181029686509,
"learning_rate": 3.8191725523241346e-05,
"loss": 0.4,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4473213851451874,
"step": 965,
"valid_targets_mean": 4481.9,
"valid_targets_min": 1322
},
{
"epoch": 1.5695792880258899,
"grad_norm": 0.6714890977266147,
"learning_rate": 3.8158046081557986e-05,
"loss": 0.4068,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4482303559780121,
"step": 970,
"valid_targets_mean": 3422.4,
"valid_targets_min": 1174
},
{
"epoch": 1.5776699029126213,
"grad_norm": 0.6060732511857289,
"learning_rate": 3.812407101602281e-05,
"loss": 0.3895,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3715343773365021,
"step": 975,
"valid_targets_mean": 3936.9,
"valid_targets_min": 991
},
{
"epoch": 1.5857605177993528,
"grad_norm": 0.6001068677656148,
"learning_rate": 3.808980087977019e-05,
"loss": 0.3818,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37591198086738586,
"step": 980,
"valid_targets_mean": 3986.6,
"valid_targets_min": 1735
},
{
"epoch": 1.5938511326860842,
"grad_norm": 0.7000946822381661,
"learning_rate": 3.8055236230738456e-05,
"loss": 0.3691,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.40361475944519043,
"step": 985,
"valid_targets_mean": 3311.6,
"valid_targets_min": 1092
},
{
"epoch": 1.6019417475728155,
"grad_norm": 0.5788320307984678,
"learning_rate": 3.8020377631660756e-05,
"loss": 0.4246,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3535193204879761,
"step": 990,
"valid_targets_mean": 4680.1,
"valid_targets_min": 1798
},
{
"epoch": 1.610032362459547,
"grad_norm": 0.6639375139516203,
"learning_rate": 3.7985225650055956e-05,
"loss": 0.3949,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4067763686180115,
"step": 995,
"valid_targets_mean": 4138.6,
"valid_targets_min": 1094
},
{
"epoch": 1.6181229773462782,
"grad_norm": 0.6129257993343638,
"learning_rate": 3.794978085821933e-05,
"loss": 0.3963,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3734704852104187,
"step": 1000,
"valid_targets_mean": 3797.0,
"valid_targets_min": 1324
},
{
"epoch": 1.6262135922330097,
"grad_norm": 0.586309978554014,
"learning_rate": 3.7914043833213294e-05,
"loss": 0.4079,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4114878475666046,
"step": 1005,
"valid_targets_mean": 4714.8,
"valid_targets_min": 1255
},
{
"epoch": 1.6343042071197411,
"grad_norm": 0.7412145341429787,
"learning_rate": 3.787801515685799e-05,
"loss": 0.416,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.42866048216819763,
"step": 1010,
"valid_targets_mean": 3223.0,
"valid_targets_min": 1392
},
{
"epoch": 1.6423948220064726,
"grad_norm": 0.6298901268481449,
"learning_rate": 3.7841695415721826e-05,
"loss": 0.3723,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38183513283729553,
"step": 1015,
"valid_targets_mean": 3943.1,
"valid_targets_min": 1237
},
{
"epoch": 1.650485436893204,
"grad_norm": 0.6176784490755091,
"learning_rate": 3.78050852011119e-05,
"loss": 0.3579,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33833619952201843,
"step": 1020,
"valid_targets_mean": 4954.7,
"valid_targets_min": 706
},
{
"epoch": 1.6585760517799353,
"grad_norm": 0.6087099001099794,
"learning_rate": 3.776818510906442e-05,
"loss": 0.3708,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3340659737586975,
"step": 1025,
"valid_targets_mean": 3676.8,
"valid_targets_min": 1093
},
{
"epoch": 1.6666666666666665,
"grad_norm": 0.5668591607843806,
"learning_rate": 3.773099574033495e-05,
"loss": 0.3784,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34908145666122437,
"step": 1030,
"valid_targets_mean": 4621.4,
"valid_targets_min": 1738
},
{
"epoch": 1.674757281553398,
"grad_norm": 0.6811988218257936,
"learning_rate": 3.7693517700388655e-05,
"loss": 0.3617,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33428844809532166,
"step": 1035,
"valid_targets_mean": 3523.9,
"valid_targets_min": 1856
},
{
"epoch": 1.6828478964401294,
"grad_norm": 0.661166060785201,
"learning_rate": 3.765575159939045e-05,
"loss": 0.3828,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38519763946533203,
"step": 1040,
"valid_targets_mean": 3767.3,
"valid_targets_min": 1039
},
{
"epoch": 1.690938511326861,
"grad_norm": 0.635519786642459,
"learning_rate": 3.761769805219505e-05,
"loss": 0.3882,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3758396506309509,
"step": 1045,
"valid_targets_mean": 4240.9,
"valid_targets_min": 995
},
{
"epoch": 1.6990291262135924,
"grad_norm": 0.5795362932404822,
"learning_rate": 3.757935767833696e-05,
"loss": 0.3795,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.406206339597702,
"step": 1050,
"valid_targets_mean": 5330.5,
"valid_targets_min": 1212
},
{
"epoch": 1.7071197411003236,
"grad_norm": 0.5983057188423216,
"learning_rate": 3.7540731102020405e-05,
"loss": 0.3742,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3096472918987274,
"step": 1055,
"valid_targets_mean": 3586.9,
"valid_targets_min": 1172
},
{
"epoch": 1.715210355987055,
"grad_norm": 0.6829004913654826,
"learning_rate": 3.7501818952109156e-05,
"loss": 0.362,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3755829334259033,
"step": 1060,
"valid_targets_mean": 3200.2,
"valid_targets_min": 1561
},
{
"epoch": 1.7233009708737863,
"grad_norm": 0.6663840962866384,
"learning_rate": 3.746262186211629e-05,
"loss": 0.3735,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4185965955257416,
"step": 1065,
"valid_targets_mean": 3854.4,
"valid_targets_min": 1217
},
{
"epoch": 1.7313915857605178,
"grad_norm": 1.678927068242607,
"learning_rate": 3.742314047019386e-05,
"loss": 0.383,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4099944829940796,
"step": 1070,
"valid_targets_mean": 2972.9,
"valid_targets_min": 333
},
{
"epoch": 1.7394822006472492,
"grad_norm": 0.6533292095832952,
"learning_rate": 3.7383375419122565e-05,
"loss": 0.3794,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3951898515224457,
"step": 1075,
"valid_targets_mean": 3447.4,
"valid_targets_min": 1280
},
{
"epoch": 1.7475728155339807,
"grad_norm": 0.6963710269510751,
"learning_rate": 3.734332735630121e-05,
"loss": 0.3781,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39096444845199585,
"step": 1080,
"valid_targets_mean": 3488.9,
"valid_targets_min": 1389
},
{
"epoch": 1.755663430420712,
"grad_norm": 0.4540955335898916,
"learning_rate": 3.730299693373622e-05,
"loss": 0.2725,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24774682521820068,
"step": 1085,
"valid_targets_mean": 6022.9,
"valid_targets_min": 2384
},
{
"epoch": 1.7637540453074434,
"grad_norm": 0.42684160855409603,
"learning_rate": 3.7262384808031004e-05,
"loss": 0.2563,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24269774556159973,
"step": 1090,
"valid_targets_mean": 6773.4,
"valid_targets_min": 1712
},
{
"epoch": 1.7718446601941746,
"grad_norm": 0.49895237577685475,
"learning_rate": 3.722149164037525e-05,
"loss": 0.2542,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23894259333610535,
"step": 1095,
"valid_targets_mean": 5853.4,
"valid_targets_min": 2336
},
{
"epoch": 1.779935275080906,
"grad_norm": 0.6262888400448398,
"learning_rate": 3.718031809653419e-05,
"loss": 0.2449,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23444335162639618,
"step": 1100,
"valid_targets_mean": 5625.0,
"valid_targets_min": 341
},
{
"epoch": 1.7880258899676376,
"grad_norm": 0.5207075255554792,
"learning_rate": 3.713886484683776e-05,
"loss": 0.2566,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2157619595527649,
"step": 1105,
"valid_targets_mean": 4999.9,
"valid_targets_min": 546
},
{
"epoch": 1.796116504854369,
"grad_norm": 0.515214744226938,
"learning_rate": 3.7097132566169644e-05,
"loss": 0.2352,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22869645059108734,
"step": 1110,
"valid_targets_mean": 5886.6,
"valid_targets_min": 362
},
{
"epoch": 1.8042071197411005,
"grad_norm": 0.5213961417814614,
"learning_rate": 3.7055121933956344e-05,
"loss": 0.2405,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22981508076190948,
"step": 1115,
"valid_targets_mean": 5545.2,
"valid_targets_min": 349
},
{
"epoch": 1.8122977346278317,
"grad_norm": 0.5011582379645335,
"learning_rate": 3.7012833634156074e-05,
"loss": 0.2372,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22520172595977783,
"step": 1120,
"valid_targets_mean": 5221.4,
"valid_targets_min": 685
},
{
"epoch": 1.820388349514563,
"grad_norm": 0.433787558559027,
"learning_rate": 3.6970268355247664e-05,
"loss": 0.2531,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21840864419937134,
"step": 1125,
"valid_targets_mean": 6906.4,
"valid_targets_min": 3688
},
{
"epoch": 1.8284789644012944,
"grad_norm": 0.4461456898907489,
"learning_rate": 3.6927426790219296e-05,
"loss": 0.2396,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2790132164955139,
"step": 1130,
"valid_targets_mean": 5886.7,
"valid_targets_min": 3248
},
{
"epoch": 1.8365695792880259,
"grad_norm": 0.4450170159382012,
"learning_rate": 3.6884309636557294e-05,
"loss": 0.2286,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23092791438102722,
"step": 1135,
"valid_targets_mean": 5565.2,
"valid_targets_min": 849
},
{
"epoch": 1.8446601941747574,
"grad_norm": 0.5118163182829762,
"learning_rate": 3.6840917596234706e-05,
"loss": 0.245,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.270181804895401,
"step": 1140,
"valid_targets_mean": 4495.2,
"valid_targets_min": 1104
},
{
"epoch": 1.8527508090614888,
"grad_norm": 0.5116271433775103,
"learning_rate": 3.67972513756999e-05,
"loss": 0.2605,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24221359193325043,
"step": 1145,
"valid_targets_mean": 5532.5,
"valid_targets_min": 3084
},
{
"epoch": 1.86084142394822,
"grad_norm": 0.5179137281679843,
"learning_rate": 3.675331168586507e-05,
"loss": 0.2473,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2840508222579956,
"step": 1150,
"valid_targets_mean": 6345.2,
"valid_targets_min": 2085
},
{
"epoch": 1.8689320388349513,
"grad_norm": 0.45633158484470104,
"learning_rate": 3.670909924209464e-05,
"loss": 0.2677,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22190481424331665,
"step": 1155,
"valid_targets_mean": 6782.8,
"valid_targets_min": 4896
},
{
"epoch": 1.8770226537216828,
"grad_norm": 0.47235383732384373,
"learning_rate": 3.666461476419366e-05,
"loss": 0.234,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19451837241649628,
"step": 1160,
"valid_targets_mean": 4796.1,
"valid_targets_min": 1174
},
{
"epoch": 1.8851132686084142,
"grad_norm": 0.4626112416545145,
"learning_rate": 3.6619858976396024e-05,
"loss": 0.2539,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2689831554889679,
"step": 1165,
"valid_targets_mean": 6176.4,
"valid_targets_min": 2462
},
{
"epoch": 1.8932038834951457,
"grad_norm": 0.5391505583467975,
"learning_rate": 3.657483260735274e-05,
"loss": 0.2808,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3605060577392578,
"step": 1170,
"valid_targets_mean": 5792.8,
"valid_targets_min": 3198
},
{
"epoch": 1.9012944983818771,
"grad_norm": 0.45599119133953253,
"learning_rate": 3.652953639012001e-05,
"loss": 0.2381,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21034517884254456,
"step": 1175,
"valid_targets_mean": 6734.0,
"valid_targets_min": 3363
},
{
"epoch": 1.9093851132686084,
"grad_norm": 0.45662533458050836,
"learning_rate": 3.648397106214737e-05,
"loss": 0.2376,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21296310424804688,
"step": 1180,
"valid_targets_mean": 6156.2,
"valid_targets_min": 3554
},
{
"epoch": 1.9174757281553398,
"grad_norm": 0.4433638656237555,
"learning_rate": 3.6438137365265605e-05,
"loss": 0.2534,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25976046919822693,
"step": 1185,
"valid_targets_mean": 6275.4,
"valid_targets_min": 521
},
{
"epoch": 1.925566343042071,
"grad_norm": 0.4679879684777045,
"learning_rate": 3.639203604567471e-05,
"loss": 0.2203,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24510705471038818,
"step": 1190,
"valid_targets_mean": 6298.0,
"valid_targets_min": 437
},
{
"epoch": 1.9336569579288025,
"grad_norm": 0.4977336720705982,
"learning_rate": 3.634566785393175e-05,
"loss": 0.2461,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31283706426620483,
"step": 1195,
"valid_targets_mean": 6639.6,
"valid_targets_min": 2502
},
{
"epoch": 1.941747572815534,
"grad_norm": 0.5202866468820287,
"learning_rate": 3.629903354493863e-05,
"loss": 0.2336,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23550382256507874,
"step": 1200,
"valid_targets_mean": 5588.2,
"valid_targets_min": 3131
},
{
"epoch": 1.9498381877022655,
"grad_norm": 0.5219947278827387,
"learning_rate": 3.625213387792979e-05,
"loss": 0.2171,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2246617078781128,
"step": 1205,
"valid_targets_mean": 5546.2,
"valid_targets_min": 892
},
{
"epoch": 1.9579288025889967,
"grad_norm": 0.46448093815593106,
"learning_rate": 3.620496961645986e-05,
"loss": 0.2456,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23543399572372437,
"step": 1210,
"valid_targets_mean": 5383.6,
"valid_targets_min": 632
},
{
"epoch": 1.9660194174757282,
"grad_norm": 0.5060914468823391,
"learning_rate": 3.615754152839122e-05,
"loss": 0.2466,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29016217589378357,
"step": 1215,
"valid_targets_mean": 5866.8,
"valid_targets_min": 523
},
{
"epoch": 1.9741100323624594,
"grad_norm": 0.47924017927514234,
"learning_rate": 3.610985038588153e-05,
"loss": 0.2535,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23586151003837585,
"step": 1220,
"valid_targets_mean": 5499.6,
"valid_targets_min": 1071
},
{
"epoch": 1.9822006472491909,
"grad_norm": 0.4857460079460246,
"learning_rate": 3.606189696537112e-05,
"loss": 0.2419,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2761743664741516,
"step": 1225,
"valid_targets_mean": 6634.6,
"valid_targets_min": 910
},
{
"epoch": 1.9902912621359223,
"grad_norm": 0.4621192062943124,
"learning_rate": 3.601368204757034e-05,
"loss": 0.2446,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2509958744049072,
"step": 1230,
"valid_targets_mean": 5642.3,
"valid_targets_min": 409
},
{
"epoch": 1.9983818770226538,
"grad_norm": 0.504285712583757,
"learning_rate": 3.596520641744691e-05,
"loss": 0.2346,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23630420863628387,
"step": 1235,
"valid_targets_mean": 5486.1,
"valid_targets_min": 628
},
{
"epoch": 2.0064724919093853,
"grad_norm": 0.6014265194583701,
"learning_rate": 3.591647086421308e-05,
"loss": 0.3205,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2990904748439789,
"step": 1240,
"valid_targets_mean": 4996.2,
"valid_targets_min": 536
},
{
"epoch": 2.0145631067961167,
"grad_norm": 0.4549243639276278,
"learning_rate": 3.586747618131281e-05,
"loss": 0.3382,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3390650749206543,
"step": 1245,
"valid_targets_mean": 8058.4,
"valid_targets_min": 3475
},
{
"epoch": 2.0226537216828477,
"grad_norm": 0.4749318683485237,
"learning_rate": 3.581822316640884e-05,
"loss": 0.332,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3646315932273865,
"step": 1250,
"valid_targets_mean": 7721.6,
"valid_targets_min": 2978
},
{
"epoch": 2.030744336569579,
"grad_norm": 0.5059476480776492,
"learning_rate": 3.5768712621369724e-05,
"loss": 0.3193,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3097308576107025,
"step": 1255,
"valid_targets_mean": 6325.1,
"valid_targets_min": 2196
},
{
"epoch": 2.0388349514563107,
"grad_norm": 0.43567691552176574,
"learning_rate": 3.571894535225674e-05,
"loss": 0.311,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29119089245796204,
"step": 1260,
"valid_targets_mean": 7313.6,
"valid_targets_min": 2706
},
{
"epoch": 2.046925566343042,
"grad_norm": 0.9614339545477306,
"learning_rate": 3.566892216931081e-05,
"loss": 0.3381,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38573122024536133,
"step": 1265,
"valid_targets_mean": 8262.7,
"valid_targets_min": 2505
},
{
"epoch": 2.0550161812297736,
"grad_norm": 0.6941665522585272,
"learning_rate": 3.561864388693926e-05,
"loss": 0.3249,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28548356890678406,
"step": 1270,
"valid_targets_mean": 6143.1,
"valid_targets_min": 611
},
{
"epoch": 2.063106796116505,
"grad_norm": 0.42092885788585327,
"learning_rate": 3.556811132370261e-05,
"loss": 0.3297,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.306254506111145,
"step": 1275,
"valid_targets_mean": 6580.4,
"valid_targets_min": 3909
},
{
"epoch": 2.071197411003236,
"grad_norm": 0.48148221197231267,
"learning_rate": 3.551732530230123e-05,
"loss": 0.2953,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2623848021030426,
"step": 1280,
"valid_targets_mean": 6454.7,
"valid_targets_min": 2205
},
{
"epoch": 2.0792880258899675,
"grad_norm": 0.45157690368933484,
"learning_rate": 3.54662866495619e-05,
"loss": 0.3178,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33691227436065674,
"step": 1285,
"valid_targets_mean": 7295.4,
"valid_targets_min": 2485
},
{
"epoch": 2.087378640776699,
"grad_norm": 0.44525824358048083,
"learning_rate": 3.5414996196424435e-05,
"loss": 0.3173,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31353265047073364,
"step": 1290,
"valid_targets_mean": 7182.0,
"valid_targets_min": 1873
},
{
"epoch": 2.0954692556634305,
"grad_norm": 0.4644732991993433,
"learning_rate": 3.536345477792809e-05,
"loss": 0.3422,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3179835081100464,
"step": 1295,
"valid_targets_mean": 7481.9,
"valid_targets_min": 3065
},
{
"epoch": 2.103559870550162,
"grad_norm": 0.4519791055149053,
"learning_rate": 3.5311663233197984e-05,
"loss": 0.3272,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3246445655822754,
"step": 1300,
"valid_targets_mean": 7622.2,
"valid_targets_min": 3085
},
{
"epoch": 2.1116504854368934,
"grad_norm": 0.4786819308529633,
"learning_rate": 3.525962240543144e-05,
"loss": 0.3037,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3294726610183716,
"step": 1305,
"valid_targets_mean": 6445.4,
"valid_targets_min": 2870
},
{
"epoch": 2.1197411003236244,
"grad_norm": 0.4554086419738832,
"learning_rate": 3.520733314188429e-05,
"loss": 0.3271,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31785595417022705,
"step": 1310,
"valid_targets_mean": 6752.0,
"valid_targets_min": 2568
},
{
"epoch": 2.127831715210356,
"grad_norm": 0.45953570374734476,
"learning_rate": 3.515479629385699e-05,
"loss": 0.3514,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3112117648124695,
"step": 1315,
"valid_targets_mean": 7377.4,
"valid_targets_min": 3797
},
{
"epoch": 2.1359223300970873,
"grad_norm": 0.43107122770104195,
"learning_rate": 3.5102012716680875e-05,
"loss": 0.3059,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29922381043434143,
"step": 1320,
"valid_targets_mean": 7377.4,
"valid_targets_min": 3726
},
{
"epoch": 2.144012944983819,
"grad_norm": 0.4890528047808735,
"learning_rate": 3.504898326970414e-05,
"loss": 0.2913,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28039124608039856,
"step": 1325,
"valid_targets_mean": 6884.6,
"valid_targets_min": 695
},
{
"epoch": 2.1521035598705502,
"grad_norm": 0.4492257868444859,
"learning_rate": 3.499570881627791e-05,
"loss": 0.3286,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31394723057746887,
"step": 1330,
"valid_targets_mean": 7725.1,
"valid_targets_min": 3973
},
{
"epoch": 2.1601941747572817,
"grad_norm": 0.45196170093359594,
"learning_rate": 3.494219022374215e-05,
"loss": 0.333,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36955010890960693,
"step": 1335,
"valid_targets_mean": 7827.6,
"valid_targets_min": 3936
},
{
"epoch": 2.168284789644013,
"grad_norm": 0.42892869442565384,
"learning_rate": 3.4888428363411564e-05,
"loss": 0.3181,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33320367336273193,
"step": 1340,
"valid_targets_mean": 8419.2,
"valid_targets_min": 5385
},
{
"epoch": 2.176375404530744,
"grad_norm": 0.45744113715758045,
"learning_rate": 3.48344241105614e-05,
"loss": 0.3194,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35591331124305725,
"step": 1345,
"valid_targets_mean": 8293.9,
"valid_targets_min": 3945
},
{
"epoch": 2.1844660194174756,
"grad_norm": 0.42030711419530997,
"learning_rate": 3.478017834441319e-05,
"loss": 0.3098,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29616591334342957,
"step": 1350,
"valid_targets_mean": 7622.2,
"valid_targets_min": 3170
},
{
"epoch": 2.192556634304207,
"grad_norm": 0.42933777850934934,
"learning_rate": 3.472569194812045e-05,
"loss": 0.3075,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29085344076156616,
"step": 1355,
"valid_targets_mean": 7071.5,
"valid_targets_min": 433
},
{
"epoch": 2.2006472491909386,
"grad_norm": 0.4822656065504384,
"learning_rate": 3.467096580875432e-05,
"loss": 0.3222,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3630227744579315,
"step": 1360,
"valid_targets_mean": 7871.8,
"valid_targets_min": 4330
},
{
"epoch": 2.20873786407767,
"grad_norm": 0.7805285602686421,
"learning_rate": 3.4616000817289076e-05,
"loss": 0.4057,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.454883337020874,
"step": 1365,
"valid_targets_mean": 2993.9,
"valid_targets_min": 1430
},
{
"epoch": 2.2168284789644015,
"grad_norm": 0.7805602334689248,
"learning_rate": 3.456079786858766e-05,
"loss": 0.4537,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.45851534605026245,
"step": 1370,
"valid_targets_mean": 3060.9,
"valid_targets_min": 1119
},
{
"epoch": 2.2249190938511325,
"grad_norm": 0.8369096908438444,
"learning_rate": 3.450535786138709e-05,
"loss": 0.4329,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.42663732171058655,
"step": 1375,
"valid_targets_mean": 2852.3,
"valid_targets_min": 1528
},
{
"epoch": 2.233009708737864,
"grad_norm": 0.7602674447866041,
"learning_rate": 3.4449681698283856e-05,
"loss": 0.4264,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4672640264034271,
"step": 1380,
"valid_targets_mean": 3322.4,
"valid_targets_min": 1137
},
{
"epoch": 2.2411003236245954,
"grad_norm": 0.7653932780247311,
"learning_rate": 3.4393770285719196e-05,
"loss": 0.4421,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4281241297721863,
"step": 1385,
"valid_targets_mean": 3253.7,
"valid_targets_min": 1115
},
{
"epoch": 2.249190938511327,
"grad_norm": 0.8296647531841562,
"learning_rate": 3.433762453396434e-05,
"loss": 0.4413,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4567793905735016,
"step": 1390,
"valid_targets_mean": 2743.4,
"valid_targets_min": 995
},
{
"epoch": 2.2572815533980584,
"grad_norm": 0.6605358764748289,
"learning_rate": 3.4281245357105726e-05,
"loss": 0.4494,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4331215023994446,
"step": 1395,
"valid_targets_mean": 4347.8,
"valid_targets_min": 1044
},
{
"epoch": 2.26537216828479,
"grad_norm": 0.7525371302324368,
"learning_rate": 3.4224633673030074e-05,
"loss": 0.4242,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.46705174446105957,
"step": 1400,
"valid_targets_mean": 3000.2,
"valid_targets_min": 1293
},
{
"epoch": 2.273462783171521,
"grad_norm": 0.828408984869813,
"learning_rate": 3.416779040340945e-05,
"loss": 0.4101,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.41368424892425537,
"step": 1405,
"valid_targets_mean": 3091.8,
"valid_targets_min": 1429
},
{
"epoch": 2.2815533980582523,
"grad_norm": 0.8731185162707,
"learning_rate": 3.4110716473686305e-05,
"loss": 0.4412,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4121938943862915,
"step": 1410,
"valid_targets_mean": 2893.9,
"valid_targets_min": 1170
},
{
"epoch": 2.2896440129449838,
"grad_norm": 0.6499592039768247,
"learning_rate": 3.405341281305835e-05,
"loss": 0.4151,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4045106768608093,
"step": 1415,
"valid_targets_mean": 3624.3,
"valid_targets_min": 1115
},
{
"epoch": 2.2977346278317152,
"grad_norm": 0.8289152009164938,
"learning_rate": 3.3995880354463444e-05,
"loss": 0.4327,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4141398072242737,
"step": 1420,
"valid_targets_mean": 2964.5,
"valid_targets_min": 1248
},
{
"epoch": 2.3058252427184467,
"grad_norm": 0.9528691187210049,
"learning_rate": 3.393812003456444e-05,
"loss": 0.414,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.41642385721206665,
"step": 1425,
"valid_targets_mean": 3237.4,
"valid_targets_min": 1275
},
{
"epoch": 2.313915857605178,
"grad_norm": 0.7080266433968921,
"learning_rate": 3.3880132793733896e-05,
"loss": 0.3973,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4032875895500183,
"step": 1430,
"valid_targets_mean": 2979.6,
"valid_targets_min": 1216
},
{
"epoch": 2.3220064724919096,
"grad_norm": 0.6952529365208576,
"learning_rate": 3.382191957603878e-05,
"loss": 0.3952,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4107402563095093,
"step": 1435,
"valid_targets_mean": 3230.4,
"valid_targets_min": 1244
},
{
"epoch": 2.3300970873786406,
"grad_norm": 0.7272498923580895,
"learning_rate": 3.376348132922509e-05,
"loss": 0.4134,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4044322073459625,
"step": 1440,
"valid_targets_mean": 2864.6,
"valid_targets_min": 1147
},
{
"epoch": 2.338187702265372,
"grad_norm": 0.6959547439645711,
"learning_rate": 3.3704819004702444e-05,
"loss": 0.4068,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4201893210411072,
"step": 1445,
"valid_targets_mean": 3619.3,
"valid_targets_min": 1486
},
{
"epoch": 2.3462783171521036,
"grad_norm": 0.6715979921248629,
"learning_rate": 3.364593355752857e-05,
"loss": 0.4141,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4077046513557434,
"step": 1450,
"valid_targets_mean": 3863.5,
"valid_targets_min": 1672
},
{
"epoch": 2.354368932038835,
"grad_norm": 0.7383136028350261,
"learning_rate": 3.358682594639379e-05,
"loss": 0.4009,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.43795761466026306,
"step": 1455,
"valid_targets_mean": 3301.6,
"valid_targets_min": 1346
},
{
"epoch": 2.3624595469255665,
"grad_norm": 0.7808846773518752,
"learning_rate": 3.3527497133605345e-05,
"loss": 0.4271,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4166765511035919,
"step": 1460,
"valid_targets_mean": 2826.4,
"valid_targets_min": 1269
},
{
"epoch": 2.3705501618122975,
"grad_norm": 1.8254727752794442,
"learning_rate": 3.346794808507182e-05,
"loss": 0.4049,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3987411856651306,
"step": 1465,
"valid_targets_mean": 2513.6,
"valid_targets_min": 1334
},
{
"epoch": 2.378640776699029,
"grad_norm": 0.8176247713463801,
"learning_rate": 3.340817977028732e-05,
"loss": 0.4113,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.40195712447166443,
"step": 1470,
"valid_targets_mean": 2750.2,
"valid_targets_min": 1299
},
{
"epoch": 2.3867313915857604,
"grad_norm": 0.9062003165524765,
"learning_rate": 3.3348193162315786e-05,
"loss": 0.4376,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4356459677219391,
"step": 1475,
"valid_targets_mean": 2549.2,
"valid_targets_min": 1338
},
{
"epoch": 2.394822006472492,
"grad_norm": 0.7055341758798552,
"learning_rate": 3.3287989237775064e-05,
"loss": 0.4208,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.43329355120658875,
"step": 1480,
"valid_targets_mean": 3387.4,
"valid_targets_min": 1218
},
{
"epoch": 2.4029126213592233,
"grad_norm": 0.7345506690309963,
"learning_rate": 3.322756897682106e-05,
"loss": 0.406,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4088819921016693,
"step": 1485,
"valid_targets_mean": 3456.2,
"valid_targets_min": 1527
},
{
"epoch": 2.411003236245955,
"grad_norm": 0.8017979886236237,
"learning_rate": 3.3166933363131765e-05,
"loss": 0.395,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39552873373031616,
"step": 1490,
"valid_targets_mean": 2982.2,
"valid_targets_min": 1216
},
{
"epoch": 2.4190938511326863,
"grad_norm": 0.937459026892843,
"learning_rate": 3.310608338389124e-05,
"loss": 0.4232,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.41104790568351746,
"step": 1495,
"valid_targets_mean": 3403.0,
"valid_targets_min": 1495
},
{
"epoch": 2.4271844660194173,
"grad_norm": 0.7438617223810716,
"learning_rate": 3.304502002977355e-05,
"loss": 0.4006,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38526734709739685,
"step": 1500,
"valid_targets_mean": 3076.9,
"valid_targets_min": 1249
},
{
"epoch": 2.4352750809061487,
"grad_norm": 0.7446394304640043,
"learning_rate": 3.2983744294926614e-05,
"loss": 0.416,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39251405000686646,
"step": 1505,
"valid_targets_mean": 3397.1,
"valid_targets_min": 1195
},
{
"epoch": 2.44336569579288,
"grad_norm": 0.7362091795056039,
"learning_rate": 3.292225717695606e-05,
"loss": 0.3898,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38442325592041016,
"step": 1510,
"valid_targets_mean": 2886.0,
"valid_targets_min": 1013
},
{
"epoch": 2.4514563106796117,
"grad_norm": 0.8169327602294557,
"learning_rate": 3.286055967690894e-05,
"loss": 0.3826,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38595718145370483,
"step": 1515,
"valid_targets_mean": 2945.9,
"valid_targets_min": 1068
},
{
"epoch": 2.459546925566343,
"grad_norm": 0.7799505590543111,
"learning_rate": 3.279865279925748e-05,
"loss": 0.3822,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3753122389316559,
"step": 1520,
"valid_targets_mean": 2965.0,
"valid_targets_min": 1034
},
{
"epoch": 2.4676375404530746,
"grad_norm": 0.5674370477801554,
"learning_rate": 3.273653755188265e-05,
"loss": 0.3715,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37651532888412476,
"step": 1525,
"valid_targets_mean": 4745.3,
"valid_targets_min": 688
},
{
"epoch": 2.475728155339806,
"grad_norm": 0.6247727477015123,
"learning_rate": 3.267421494605786e-05,
"loss": 0.371,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3644024133682251,
"step": 1530,
"valid_targets_mean": 4116.0,
"valid_targets_min": 1500
},
{
"epoch": 2.483818770226537,
"grad_norm": 0.7491582122547379,
"learning_rate": 3.261168599643239e-05,
"loss": 0.37,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35451722145080566,
"step": 1535,
"valid_targets_mean": 3082.2,
"valid_targets_min": 1538
},
{
"epoch": 2.4919093851132685,
"grad_norm": 0.6429281049648273,
"learning_rate": 3.254895172101495e-05,
"loss": 0.3482,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33318030834198,
"step": 1540,
"valid_targets_mean": 3706.6,
"valid_targets_min": 1503
},
{
"epoch": 2.5,
"grad_norm": 0.6523483751167802,
"learning_rate": 3.248601314115709e-05,
"loss": 0.3875,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3792145848274231,
"step": 1545,
"valid_targets_mean": 3630.9,
"valid_targets_min": 987
},
{
"epoch": 2.5080906148867315,
"grad_norm": 0.7249836596601235,
"learning_rate": 3.2422871281536504e-05,
"loss": 0.3896,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3936595022678375,
"step": 1550,
"valid_targets_mean": 3107.8,
"valid_targets_min": 1074
},
{
"epoch": 2.516181229773463,
"grad_norm": 0.8616243014972932,
"learning_rate": 3.235952717014046e-05,
"loss": 0.3545,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3657923936843872,
"step": 1555,
"valid_targets_mean": 3956.6,
"valid_targets_min": 974
},
{
"epoch": 2.524271844660194,
"grad_norm": 0.638664828509639,
"learning_rate": 3.229598183824897e-05,
"loss": 0.358,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37439674139022827,
"step": 1560,
"valid_targets_mean": 4259.0,
"valid_targets_min": 1555
},
{
"epoch": 2.5323624595469254,
"grad_norm": 0.6056668481066265,
"learning_rate": 3.223223632041806e-05,
"loss": 0.3682,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3590593934059143,
"step": 1565,
"valid_targets_mean": 4229.0,
"valid_targets_min": 1335
},
{
"epoch": 2.540453074433657,
"grad_norm": 0.590522050754507,
"learning_rate": 3.216829165446288e-05,
"loss": 0.3579,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3400675654411316,
"step": 1570,
"valid_targets_mean": 4780.1,
"valid_targets_min": 1276
},
{
"epoch": 2.5485436893203883,
"grad_norm": 0.6607067309911566,
"learning_rate": 3.210414888144085e-05,
"loss": 0.3554,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3499111831188202,
"step": 1575,
"valid_targets_mean": 4779.9,
"valid_targets_min": 1071
},
{
"epoch": 2.55663430420712,
"grad_norm": 0.702948411258421,
"learning_rate": 3.203980904563467e-05,
"loss": 0.3398,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3248726725578308,
"step": 1580,
"valid_targets_mean": 2915.0,
"valid_targets_min": 406
},
{
"epoch": 2.5647249190938513,
"grad_norm": 0.6628115331326496,
"learning_rate": 3.1975273194535365e-05,
"loss": 0.3702,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35476428270339966,
"step": 1585,
"valid_targets_mean": 3659.4,
"valid_targets_min": 1228
},
{
"epoch": 2.5728155339805827,
"grad_norm": 0.6615270179204286,
"learning_rate": 3.191054237882519e-05,
"loss": 0.371,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35199153423309326,
"step": 1590,
"valid_targets_mean": 4081.2,
"valid_targets_min": 1116
},
{
"epoch": 2.5809061488673137,
"grad_norm": 0.6626160538531557,
"learning_rate": 3.1845617652360556e-05,
"loss": 0.3478,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38913512229919434,
"step": 1595,
"valid_targets_mean": 4127.9,
"valid_targets_min": 1468
},
{
"epoch": 2.588996763754045,
"grad_norm": 0.5686585923437388,
"learning_rate": 3.178050007215483e-05,
"loss": 0.3356,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3361608386039734,
"step": 1600,
"valid_targets_mean": 4937.8,
"valid_targets_min": 269
},
{
"epoch": 2.5970873786407767,
"grad_norm": 2.2272207542575115,
"learning_rate": 3.171519069836118e-05,
"loss": 0.3504,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3982278108596802,
"step": 1605,
"valid_targets_mean": 2787.6,
"valid_targets_min": 1029
},
{
"epoch": 2.605177993527508,
"grad_norm": 0.6695229671580348,
"learning_rate": 3.1649690594255265e-05,
"loss": 0.3729,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34326860308647156,
"step": 1610,
"valid_targets_mean": 3278.9,
"valid_targets_min": 1251
},
{
"epoch": 2.6132686084142396,
"grad_norm": 0.661728761043615,
"learning_rate": 3.1584000826217974e-05,
"loss": 0.358,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3541804850101471,
"step": 1615,
"valid_targets_mean": 4680.7,
"valid_targets_min": 1062
},
{
"epoch": 2.6213592233009706,
"grad_norm": 0.8113177984942129,
"learning_rate": 3.151812246371802e-05,
"loss": 0.3673,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3555559515953064,
"step": 1620,
"valid_targets_mean": 4892.4,
"valid_targets_min": 922
},
{
"epoch": 2.6294498381877025,
"grad_norm": 0.576765401036298,
"learning_rate": 3.145205657929454e-05,
"loss": 0.3651,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34818094968795776,
"step": 1625,
"valid_targets_mean": 4213.6,
"valid_targets_min": 1228
},
{
"epoch": 2.6375404530744335,
"grad_norm": 0.6921256308734074,
"learning_rate": 3.1385804248539665e-05,
"loss": 0.3621,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34675049781799316,
"step": 1630,
"valid_targets_mean": 3643.2,
"valid_targets_min": 774
},
{
"epoch": 2.645631067961165,
"grad_norm": 0.5734997693188809,
"learning_rate": 3.131936655008097e-05,
"loss": 0.3329,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3277677595615387,
"step": 1635,
"valid_targets_mean": 3834.2,
"valid_targets_min": 799
},
{
"epoch": 2.6537216828478964,
"grad_norm": 0.6176988613698919,
"learning_rate": 3.125274456556392e-05,
"loss": 0.334,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33639439940452576,
"step": 1640,
"valid_targets_mean": 4379.6,
"valid_targets_min": 1377
},
{
"epoch": 2.661812297734628,
"grad_norm": 0.6544172101213054,
"learning_rate": 3.1185939379634274e-05,
"loss": 0.3336,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35664668679237366,
"step": 1645,
"valid_targets_mean": 3656.1,
"valid_targets_min": 1206
},
{
"epoch": 2.6699029126213594,
"grad_norm": 0.5477059231493232,
"learning_rate": 3.111895207992042e-05,
"loss": 0.3293,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30970466136932373,
"step": 1650,
"valid_targets_mean": 4599.8,
"valid_targets_min": 1474
},
{
"epoch": 2.6779935275080904,
"grad_norm": 0.7029760332920263,
"learning_rate": 3.1051783757015686e-05,
"loss": 0.3417,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3542120158672333,
"step": 1655,
"valid_targets_mean": 3595.6,
"valid_targets_min": 1424
},
{
"epoch": 2.686084142394822,
"grad_norm": 0.6498836452249998,
"learning_rate": 3.098443550446051e-05,
"loss": 0.3479,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3418267071247101,
"step": 1660,
"valid_targets_mean": 3510.6,
"valid_targets_min": 1446
},
{
"epoch": 2.6941747572815533,
"grad_norm": 1.2211153218964443,
"learning_rate": 3.0916908418724765e-05,
"loss": 0.3491,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3544435203075409,
"step": 1665,
"valid_targets_mean": 4430.4,
"valid_targets_min": 1561
},
{
"epoch": 2.7022653721682848,
"grad_norm": 1.2099387065339355,
"learning_rate": 3.0849203599189776e-05,
"loss": 0.3453,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3719382882118225,
"step": 1670,
"valid_targets_mean": 3609.2,
"valid_targets_min": 1094
},
{
"epoch": 2.7103559870550162,
"grad_norm": 0.6608903398848406,
"learning_rate": 3.0781322148130514e-05,
"loss": 0.3331,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30829671025276184,
"step": 1675,
"valid_targets_mean": 3646.9,
"valid_targets_min": 1318
},
{
"epoch": 2.7184466019417477,
"grad_norm": 0.6424461992050344,
"learning_rate": 3.071326517069761e-05,
"loss": 0.3307,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3524508774280548,
"step": 1680,
"valid_targets_mean": 3864.7,
"valid_targets_min": 1537
},
{
"epoch": 2.726537216828479,
"grad_norm": 0.6088892936229023,
"learning_rate": 3.064503377489936e-05,
"loss": 0.3472,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35562074184417725,
"step": 1685,
"valid_targets_mean": 4292.1,
"valid_targets_min": 1626
},
{
"epoch": 2.73462783171521,
"grad_norm": 0.8310379687378989,
"learning_rate": 3.0576629071583704e-05,
"loss": 0.3516,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3787177801132202,
"step": 1690,
"valid_targets_mean": 2578.6,
"valid_targets_min": 328
},
{
"epoch": 2.7427184466019416,
"grad_norm": 0.7336795250162784,
"learning_rate": 3.0508052174420132e-05,
"loss": 0.3358,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34328681230545044,
"step": 1695,
"valid_targets_mean": 3745.4,
"valid_targets_min": 1339
},
{
"epoch": 2.750809061488673,
"grad_norm": 0.5761292250835377,
"learning_rate": 3.0439304199881543e-05,
"loss": 0.3144,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2521141767501831,
"step": 1700,
"valid_targets_mean": 6403.2,
"valid_targets_min": 1724
},
{
"epoch": 2.7588996763754046,
"grad_norm": 0.47192752380407144,
"learning_rate": 3.03703862672261e-05,
"loss": 0.24,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2625490427017212,
"step": 1705,
"valid_targets_mean": 6242.4,
"valid_targets_min": 1861
},
{
"epoch": 2.766990291262136,
"grad_norm": 0.4692838219469033,
"learning_rate": 3.030129949847895e-05,
"loss": 0.2156,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24692867696285248,
"step": 1710,
"valid_targets_mean": 5536.4,
"valid_targets_min": 3078
},
{
"epoch": 2.775080906148867,
"grad_norm": 0.4695104746189952,
"learning_rate": 3.023204501841403e-05,
"loss": 0.2292,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22257234156131744,
"step": 1715,
"valid_targets_mean": 5897.4,
"valid_targets_min": 2340
},
{
"epoch": 2.783171521035599,
"grad_norm": 0.46675952644311963,
"learning_rate": 3.01626239545357e-05,
"loss": 0.2377,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24739572405815125,
"step": 1720,
"valid_targets_mean": 6239.1,
"valid_targets_min": 2926
},
{
"epoch": 2.79126213592233,
"grad_norm": 0.46028576559446716,
"learning_rate": 3.00930374370604e-05,
"loss": 0.2022,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19058983027935028,
"step": 1725,
"valid_targets_mean": 6132.8,
"valid_targets_min": 3165
},
{
"epoch": 2.7993527508090614,
"grad_norm": 0.4338650036638946,
"learning_rate": 3.002328659889826e-05,
"loss": 0.2091,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19038927555084229,
"step": 1730,
"valid_targets_mean": 5869.2,
"valid_targets_min": 2200
},
{
"epoch": 2.807443365695793,
"grad_norm": 0.4095273507413556,
"learning_rate": 2.995337257563466e-05,
"loss": 0.2224,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19616976380348206,
"step": 1735,
"valid_targets_mean": 6250.8,
"valid_targets_min": 552
},
{
"epoch": 2.8155339805825244,
"grad_norm": 0.4397121045961578,
"learning_rate": 2.9883296505511704e-05,
"loss": 0.2235,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.254894882440567,
"step": 1740,
"valid_targets_mean": 6930.5,
"valid_targets_min": 4391
},
{
"epoch": 2.823624595469256,
"grad_norm": 0.46668357421287665,
"learning_rate": 2.981305952940973e-05,
"loss": 0.2179,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20420300960540771,
"step": 1745,
"valid_targets_mean": 5333.6,
"valid_targets_min": 477
},
{
"epoch": 2.831715210355987,
"grad_norm": 0.46764197228804283,
"learning_rate": 2.9742662790828732e-05,
"loss": 0.2216,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21579869091510773,
"step": 1750,
"valid_targets_mean": 6891.6,
"valid_targets_min": 4008
},
{
"epoch": 2.8398058252427183,
"grad_norm": 0.48354599335481646,
"learning_rate": 2.9672107435869727e-05,
"loss": 0.1911,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21376736462116241,
"step": 1755,
"valid_targets_mean": 5651.2,
"valid_targets_min": 940
},
{
"epoch": 2.8478964401294498,
"grad_norm": 0.5475714799134836,
"learning_rate": 2.9601394613216086e-05,
"loss": 0.2378,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2783951759338379,
"step": 1760,
"valid_targets_mean": 5771.6,
"valid_targets_min": 909
},
{
"epoch": 2.855987055016181,
"grad_norm": 0.48845769089035257,
"learning_rate": 2.953052547411487e-05,
"loss": 0.2261,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19538253545761108,
"step": 1765,
"valid_targets_mean": 5659.5,
"valid_targets_min": 3276
},
{
"epoch": 2.8640776699029127,
"grad_norm": 0.4351545792992896,
"learning_rate": 2.9459501172358046e-05,
"loss": 0.2332,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24069242179393768,
"step": 1770,
"valid_targets_mean": 6256.8,
"valid_targets_min": 4223
},
{
"epoch": 2.872168284789644,
"grad_norm": 0.444626387049783,
"learning_rate": 2.9388322864263747e-05,
"loss": 0.2347,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18499356508255005,
"step": 1775,
"valid_targets_mean": 5226.5,
"valid_targets_min": 900
},
{
"epoch": 2.8802588996763756,
"grad_norm": 0.49978310609608434,
"learning_rate": 2.9316991708657382e-05,
"loss": 0.2182,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24685606360435486,
"step": 1780,
"valid_targets_mean": 6908.9,
"valid_targets_min": 2907
},
{
"epoch": 2.8883495145631066,
"grad_norm": 0.45780929753555405,
"learning_rate": 2.924550886685285e-05,
"loss": 0.2298,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22891566157341003,
"step": 1785,
"valid_targets_mean": 5650.2,
"valid_targets_min": 3626
},
{
"epoch": 2.896440129449838,
"grad_norm": 0.3931202774620866,
"learning_rate": 2.917387550263357e-05,
"loss": 0.2521,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18989673256874084,
"step": 1790,
"valid_targets_mean": 6715.2,
"valid_targets_min": 2968
},
{
"epoch": 2.9045307443365695,
"grad_norm": 0.45281393221699767,
"learning_rate": 2.9102092782233563e-05,
"loss": 0.2215,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21978428959846497,
"step": 1795,
"valid_targets_mean": 5944.2,
"valid_targets_min": 3462
},
{
"epoch": 2.912621359223301,
"grad_norm": 0.45339382448201765,
"learning_rate": 2.9030161874318455e-05,
"loss": 0.2291,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2767179608345032,
"step": 1800,
"valid_targets_mean": 7132.8,
"valid_targets_min": 3017
},
{
"epoch": 2.9207119741100325,
"grad_norm": 0.5075746973420298,
"learning_rate": 2.895808394996644e-05,
"loss": 0.2012,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2105654776096344,
"step": 1805,
"valid_targets_mean": 5465.3,
"valid_targets_min": 3731
},
{
"epoch": 2.9288025889967635,
"grad_norm": 0.4074364881732189,
"learning_rate": 2.8885860182649263e-05,
"loss": 0.1959,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18284833431243896,
"step": 1810,
"valid_targets_mean": 6481.9,
"valid_targets_min": 1048
},
{
"epoch": 2.9368932038834954,
"grad_norm": 0.5177652651451281,
"learning_rate": 2.881349174821305e-05,
"loss": 0.2304,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18447479605674744,
"step": 1815,
"valid_targets_mean": 5724.3,
"valid_targets_min": 3426
},
{
"epoch": 2.9449838187702264,
"grad_norm": 0.47895059311957167,
"learning_rate": 2.8740979824859194e-05,
"loss": 0.2046,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20376095175743103,
"step": 1820,
"valid_targets_mean": 5310.1,
"valid_targets_min": 1463
},
{
"epoch": 2.953074433656958,
"grad_norm": 0.49423974656062747,
"learning_rate": 2.8668325593125192e-05,
"loss": 0.2175,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23879647254943848,
"step": 1825,
"valid_targets_mean": 5651.5,
"valid_targets_min": 464
},
{
"epoch": 2.9611650485436893,
"grad_norm": 0.44390854244120626,
"learning_rate": 2.8595530235865397e-05,
"loss": 0.2085,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21764904260635376,
"step": 1830,
"valid_targets_mean": 6370.6,
"valid_targets_min": 3513
},
{
"epoch": 2.969255663430421,
"grad_norm": 0.6114626506498663,
"learning_rate": 2.8522594938231755e-05,
"loss": 0.2412,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.261320561170578,
"step": 1835,
"valid_targets_mean": 7567.2,
"valid_targets_min": 3890
},
{
"epoch": 2.9773462783171523,
"grad_norm": 0.467812383161166,
"learning_rate": 2.8449520887654558e-05,
"loss": 0.228,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2207464873790741,
"step": 1840,
"valid_targets_mean": 6544.5,
"valid_targets_min": 3523
},
{
"epoch": 2.9854368932038833,
"grad_norm": 0.4791034057933847,
"learning_rate": 2.8376309273823047e-05,
"loss": 0.2196,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18718640506267548,
"step": 1845,
"valid_targets_mean": 5593.0,
"valid_targets_min": 1614
},
{
"epoch": 2.9935275080906147,
"grad_norm": 0.4117756326042873,
"learning_rate": 2.8302961288666094e-05,
"loss": 0.2248,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20447809994220734,
"step": 1850,
"valid_targets_mean": 6863.6,
"valid_targets_min": 3648
},
{
"epoch": 3.001618122977346,
"grad_norm": 0.47583421251030267,
"learning_rate": 2.8229478126332766e-05,
"loss": 0.2224,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24508079886436462,
"step": 1855,
"valid_targets_mean": 6507.2,
"valid_targets_min": 1969
},
{
"epoch": 3.0097087378640777,
"grad_norm": 0.45872688387507193,
"learning_rate": 2.815586098317291e-05,
"loss": 0.3125,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2711004614830017,
"step": 1860,
"valid_targets_mean": 6547.6,
"valid_targets_min": 2822
},
{
"epoch": 3.017799352750809,
"grad_norm": 0.47429826815585996,
"learning_rate": 2.8082111057717655e-05,
"loss": 0.3094,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2886805534362793,
"step": 1865,
"valid_targets_mean": 7456.8,
"valid_targets_min": 1676
},
{
"epoch": 3.0258899676375406,
"grad_norm": 0.5015651427456486,
"learning_rate": 2.8008229550659883e-05,
"loss": 0.3135,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3145654797554016,
"step": 1870,
"valid_targets_mean": 7212.2,
"valid_targets_min": 3800
},
{
"epoch": 3.033980582524272,
"grad_norm": 0.47188782403478186,
"learning_rate": 2.793421766483474e-05,
"loss": 0.2879,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24573259055614471,
"step": 1875,
"valid_targets_mean": 7030.2,
"valid_targets_min": 3738
},
{
"epoch": 3.042071197411003,
"grad_norm": 0.43763390517046236,
"learning_rate": 2.7860076605199995e-05,
"loss": 0.291,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2639431357383728,
"step": 1880,
"valid_targets_mean": 6541.8,
"valid_targets_min": 469
},
{
"epoch": 3.0501618122977345,
"grad_norm": 0.44172809849782685,
"learning_rate": 2.7785807578816448e-05,
"loss": 0.3262,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29740840196609497,
"step": 1885,
"valid_targets_mean": 7401.4,
"valid_targets_min": 2854
},
{
"epoch": 3.058252427184466,
"grad_norm": 0.429012811299429,
"learning_rate": 2.7711411794828274e-05,
"loss": 0.3087,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3050397038459778,
"step": 1890,
"valid_targets_mean": 8668.2,
"valid_targets_min": 3365
},
{
"epoch": 3.0663430420711975,
"grad_norm": 0.4488913116405302,
"learning_rate": 2.7636890464443333e-05,
"loss": 0.2833,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24772655963897705,
"step": 1895,
"valid_targets_mean": 6754.3,
"valid_targets_min": 2100
},
{
"epoch": 3.074433656957929,
"grad_norm": 0.44216597098526006,
"learning_rate": 2.756224480091347e-05,
"loss": 0.2855,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3219381868839264,
"step": 1900,
"valid_targets_mean": 8038.2,
"valid_targets_min": 3704
},
{
"epoch": 3.0825242718446604,
"grad_norm": 0.49388425110906853,
"learning_rate": 2.7487476019514726e-05,
"loss": 0.2934,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3122866749763489,
"step": 1905,
"valid_targets_mean": 6892.1,
"valid_targets_min": 1736
},
{
"epoch": 3.0906148867313914,
"grad_norm": 0.45296171291930487,
"learning_rate": 2.74125853375276e-05,
"loss": 0.3001,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2828711271286011,
"step": 1910,
"valid_targets_mean": 7149.5,
"valid_targets_min": 3606
},
{
"epoch": 3.098705501618123,
"grad_norm": 0.5691072351705835,
"learning_rate": 2.7337573974217177e-05,
"loss": 0.32,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2833087742328644,
"step": 1915,
"valid_targets_mean": 6004.5,
"valid_targets_min": 306
},
{
"epoch": 3.1067961165048543,
"grad_norm": 0.4162881780463123,
"learning_rate": 2.726244315081334e-05,
"loss": 0.2874,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25544559955596924,
"step": 1920,
"valid_targets_mean": 7372.0,
"valid_targets_min": 4593
},
{
"epoch": 3.114886731391586,
"grad_norm": 0.43692064078458287,
"learning_rate": 2.718719409049082e-05,
"loss": 0.2995,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34150227904319763,
"step": 1925,
"valid_targets_mean": 7420.4,
"valid_targets_min": 3842
},
{
"epoch": 3.1229773462783172,
"grad_norm": 0.501069700833799,
"learning_rate": 2.711182801834933e-05,
"loss": 0.3217,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35399535298347473,
"step": 1930,
"valid_targets_mean": 8089.4,
"valid_targets_min": 3071
},
{
"epoch": 3.1310679611650487,
"grad_norm": 0.5547118933791086,
"learning_rate": 2.7036346161393617e-05,
"loss": 0.3046,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2902340888977051,
"step": 1935,
"valid_targets_mean": 6877.0,
"valid_targets_min": 3654
},
{
"epoch": 3.1391585760517797,
"grad_norm": 0.44034139813676154,
"learning_rate": 2.696074974851346e-05,
"loss": 0.2844,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29094940423965454,
"step": 1940,
"valid_targets_mean": 8145.8,
"valid_targets_min": 2130
},
{
"epoch": 3.147249190938511,
"grad_norm": 0.5016943552371228,
"learning_rate": 2.688504001046367e-05,
"loss": 0.2867,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3496394157409668,
"step": 1945,
"valid_targets_mean": 7568.6,
"valid_targets_min": 3435
},
{
"epoch": 3.1553398058252426,
"grad_norm": 0.48325348045886846,
"learning_rate": 2.6809218179844085e-05,
"loss": 0.3013,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26768216490745544,
"step": 1950,
"valid_targets_mean": 6097.7,
"valid_targets_min": 1161
},
{
"epoch": 3.163430420711974,
"grad_norm": 0.487336193105687,
"learning_rate": 2.6733285491079453e-05,
"loss": 0.2994,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33538806438446045,
"step": 1955,
"valid_targets_mean": 6649.2,
"valid_targets_min": 2993
},
{
"epoch": 3.1715210355987056,
"grad_norm": 0.4703762210934678,
"learning_rate": 2.6657243180399373e-05,
"loss": 0.2997,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2592100501060486,
"step": 1960,
"valid_targets_mean": 6283.1,
"valid_targets_min": 2278
},
{
"epoch": 3.179611650485437,
"grad_norm": 0.5068944167952791,
"learning_rate": 2.658109248581814e-05,
"loss": 0.3136,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30327221751213074,
"step": 1965,
"valid_targets_mean": 7856.1,
"valid_targets_min": 3609
},
{
"epoch": 3.1877022653721685,
"grad_norm": 0.47468151640087014,
"learning_rate": 2.650483464711462e-05,
"loss": 0.2941,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3432081341743469,
"step": 1970,
"valid_targets_mean": 8008.8,
"valid_targets_min": 1165
},
{
"epoch": 3.1957928802588995,
"grad_norm": 0.5084724878869032,
"learning_rate": 2.6428470905812047e-05,
"loss": 0.2661,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23990876972675323,
"step": 1975,
"valid_targets_mean": 7456.1,
"valid_targets_min": 2778
},
{
"epoch": 3.203883495145631,
"grad_norm": 0.6172383982749374,
"learning_rate": 2.6352002505157802e-05,
"loss": 0.3143,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3006366491317749,
"step": 1980,
"valid_targets_mean": 4243.0,
"valid_targets_min": 1153
},
{
"epoch": 3.2119741100323624,
"grad_norm": 0.7978962996020116,
"learning_rate": 2.6275430690103188e-05,
"loss": 0.4157,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.43584519624710083,
"step": 1985,
"valid_targets_mean": 2861.2,
"valid_targets_min": 1460
},
{
"epoch": 3.220064724919094,
"grad_norm": 0.9313628986194699,
"learning_rate": 2.6198756707283153e-05,
"loss": 0.4145,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4482871890068054,
"step": 1990,
"valid_targets_mean": 2436.8,
"valid_targets_min": 1108
},
{
"epoch": 3.2281553398058254,
"grad_norm": 0.7634666137781282,
"learning_rate": 2.612198180499601e-05,
"loss": 0.3616,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3643973171710968,
"step": 1995,
"valid_targets_mean": 3268.4,
"valid_targets_min": 1157
},
{
"epoch": 3.236245954692557,
"grad_norm": 0.8517352332533736,
"learning_rate": 2.604510723318309e-05,
"loss": 0.4081,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4433375895023346,
"step": 2000,
"valid_targets_mean": 2590.0,
"valid_targets_min": 872
},
{
"epoch": 3.244336569579288,
"grad_norm": 0.7252301434029291,
"learning_rate": 2.5968134243408405e-05,
"loss": 0.3972,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39637094736099243,
"step": 2005,
"valid_targets_mean": 3088.1,
"valid_targets_min": 1500
},
{
"epoch": 3.2524271844660193,
"grad_norm": 0.8139379244117145,
"learning_rate": 2.5891064088838278e-05,
"loss": 0.3925,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3841778039932251,
"step": 2010,
"valid_targets_mean": 2681.4,
"valid_targets_min": 1213
},
{
"epoch": 3.2605177993527508,
"grad_norm": 0.7212261838585554,
"learning_rate": 2.5813898024220912e-05,
"loss": 0.3925,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3293357491493225,
"step": 2015,
"valid_targets_mean": 3165.6,
"valid_targets_min": 1467
},
{
"epoch": 3.2686084142394822,
"grad_norm": 0.7493586150342039,
"learning_rate": 2.573663730586601e-05,
"loss": 0.3873,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.40346598625183105,
"step": 2020,
"valid_targets_mean": 3995.6,
"valid_targets_min": 1173
},
{
"epoch": 3.2766990291262137,
"grad_norm": 0.8133579178643173,
"learning_rate": 2.5659283191624277e-05,
"loss": 0.377,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4063666760921478,
"step": 2025,
"valid_targets_mean": 3736.4,
"valid_targets_min": 1311
},
{
"epoch": 3.284789644012945,
"grad_norm": 0.9016208263184244,
"learning_rate": 2.5581836940866967e-05,
"loss": 0.4024,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.41699790954589844,
"step": 2030,
"valid_targets_mean": 3050.8,
"valid_targets_min": 1126
},
{
"epoch": 3.292880258899676,
"grad_norm": 0.7467519616638045,
"learning_rate": 2.550429981446537e-05,
"loss": 0.3821,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37695205211639404,
"step": 2035,
"valid_targets_mean": 2968.2,
"valid_targets_min": 1254
},
{
"epoch": 3.3009708737864076,
"grad_norm": 0.679997759441785,
"learning_rate": 2.542667307477027e-05,
"loss": 0.3803,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3674064576625824,
"step": 2040,
"valid_targets_mean": 3811.7,
"valid_targets_min": 1619
},
{
"epoch": 3.309061488673139,
"grad_norm": 0.7019193542215713,
"learning_rate": 2.534895798559144e-05,
"loss": 0.3669,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3509365916252136,
"step": 2045,
"valid_targets_mean": 4138.7,
"valid_targets_min": 1290
},
{
"epoch": 3.3171521035598706,
"grad_norm": 0.7644981967082519,
"learning_rate": 2.527115581217702e-05,
"loss": 0.3554,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36790961027145386,
"step": 2050,
"valid_targets_mean": 3372.7,
"valid_targets_min": 1693
},
{
"epoch": 3.325242718446602,
"grad_norm": 0.8324542130119277,
"learning_rate": 2.5193267821192914e-05,
"loss": 0.3739,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3999173045158386,
"step": 2055,
"valid_targets_mean": 2886.9,
"valid_targets_min": 1027
},
{
"epoch": 3.3333333333333335,
"grad_norm": 0.7251311605581526,
"learning_rate": 2.5115295280702222e-05,
"loss": 0.3637,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35481077432632446,
"step": 2060,
"valid_targets_mean": 3630.1,
"valid_targets_min": 1032
},
{
"epoch": 3.341423948220065,
"grad_norm": 0.8994421585493918,
"learning_rate": 2.5037239460144534e-05,
"loss": 0.3703,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.348206490278244,
"step": 2065,
"valid_targets_mean": 2775.9,
"valid_targets_min": 1173
},
{
"epoch": 3.349514563106796,
"grad_norm": 0.796492511881728,
"learning_rate": 2.4959101630315315e-05,
"loss": 0.3693,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.362110435962677,
"step": 2070,
"valid_targets_mean": 3605.9,
"valid_targets_min": 1897
},
{
"epoch": 3.3576051779935274,
"grad_norm": 1.3034529810821374,
"learning_rate": 2.4880883063345157e-05,
"loss": 0.3767,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.366311252117157,
"step": 2075,
"valid_targets_mean": 2585.5,
"valid_targets_min": 1140
},
{
"epoch": 3.365695792880259,
"grad_norm": 0.8660088681232742,
"learning_rate": 2.480258503267912e-05,
"loss": 0.3744,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39507314562797546,
"step": 2080,
"valid_targets_mean": 2860.4,
"valid_targets_min": 1009
},
{
"epoch": 3.3737864077669903,
"grad_norm": 0.6972722103618133,
"learning_rate": 2.472420881305599e-05,
"loss": 0.3603,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3619586229324341,
"step": 2085,
"valid_targets_mean": 3527.3,
"valid_targets_min": 1380
},
{
"epoch": 3.381877022653722,
"grad_norm": 0.7218193777112525,
"learning_rate": 2.4645755680487497e-05,
"loss": 0.3873,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3706960082054138,
"step": 2090,
"valid_targets_mean": 3451.2,
"valid_targets_min": 1500
},
{
"epoch": 3.389967637540453,
"grad_norm": 0.8084142195670189,
"learning_rate": 2.4567226912237566e-05,
"loss": 0.3871,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35703185200691223,
"step": 2095,
"valid_targets_mean": 2787.2,
"valid_targets_min": 1151
},
{
"epoch": 3.3980582524271843,
"grad_norm": 0.6964508405963089,
"learning_rate": 2.4488623786801523e-05,
"loss": 0.3759,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3755350112915039,
"step": 2100,
"valid_targets_mean": 4092.3,
"valid_targets_min": 1302
},
{
"epoch": 3.4061488673139158,
"grad_norm": 0.8107522604064265,
"learning_rate": 2.4409947583885272e-05,
"loss": 0.3584,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3875834345817566,
"step": 2105,
"valid_targets_mean": 2659.3,
"valid_targets_min": 1435
},
{
"epoch": 3.414239482200647,
"grad_norm": 0.7797309552660957,
"learning_rate": 2.4331199584384448e-05,
"loss": 0.37,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.41315728425979614,
"step": 2110,
"valid_targets_mean": 3654.5,
"valid_targets_min": 2036
},
{
"epoch": 3.4223300970873787,
"grad_norm": 0.7938288617184067,
"learning_rate": 2.425238107036359e-05,
"loss": 0.3757,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3548850119113922,
"step": 2115,
"valid_targets_mean": 2510.2,
"valid_targets_min": 1118
},
{
"epoch": 3.43042071197411,
"grad_norm": 0.9298235923393635,
"learning_rate": 2.4173493325035255e-05,
"loss": 0.3677,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37875327467918396,
"step": 2120,
"valid_targets_mean": 2486.3,
"valid_targets_min": 1216
},
{
"epoch": 3.4385113268608416,
"grad_norm": 0.793729423432582,
"learning_rate": 2.4094537632739126e-05,
"loss": 0.3659,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35467851161956787,
"step": 2125,
"valid_targets_mean": 3492.1,
"valid_targets_min": 1260
},
{
"epoch": 3.4466019417475726,
"grad_norm": 0.7849821970563073,
"learning_rate": 2.40155152789211e-05,
"loss": 0.3563,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34691619873046875,
"step": 2130,
"valid_targets_mean": 2875.5,
"valid_targets_min": 1062
},
{
"epoch": 3.454692556634304,
"grad_norm": 0.7693298480722005,
"learning_rate": 2.3936427550112375e-05,
"loss": 0.3574,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.40094462037086487,
"step": 2135,
"valid_targets_mean": 3563.5,
"valid_targets_min": 1491
},
{
"epoch": 3.4627831715210355,
"grad_norm": 0.6373126854145776,
"learning_rate": 2.3857275733908476e-05,
"loss": 0.3352,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33306121826171875,
"step": 2140,
"valid_targets_mean": 4153.3,
"valid_targets_min": 1248
},
{
"epoch": 3.470873786407767,
"grad_norm": 0.7673184920625664,
"learning_rate": 2.377806111894832e-05,
"loss": 0.3478,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.40561556816101074,
"step": 2145,
"valid_targets_mean": 3383.9,
"valid_targets_min": 1266
},
{
"epoch": 3.4789644012944985,
"grad_norm": 0.6215117682240084,
"learning_rate": 2.3698784994893214e-05,
"loss": 0.338,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3328400254249573,
"step": 2150,
"valid_targets_mean": 4350.6,
"valid_targets_min": 1351
},
{
"epoch": 3.48705501618123,
"grad_norm": 0.77504169798237,
"learning_rate": 2.3619448652405885e-05,
"loss": 0.3318,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32707396149635315,
"step": 2155,
"valid_targets_mean": 4064.1,
"valid_targets_min": 1670
},
{
"epoch": 3.4951456310679614,
"grad_norm": 0.5917729762982872,
"learning_rate": 2.3540053383129458e-05,
"loss": 0.3229,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.313139945268631,
"step": 2160,
"valid_targets_mean": 4482.6,
"valid_targets_min": 1115
},
{
"epoch": 3.5032362459546924,
"grad_norm": 0.7182867250889213,
"learning_rate": 2.346060047966638e-05,
"loss": 0.3691,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3666308522224426,
"step": 2165,
"valid_targets_mean": 3469.6,
"valid_targets_min": 1529
},
{
"epoch": 3.511326860841424,
"grad_norm": 0.6390375106609838,
"learning_rate": 2.3381091235557475e-05,
"loss": 0.3458,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3377194404602051,
"step": 2170,
"valid_targets_mean": 3768.1,
"valid_targets_min": 349
},
{
"epoch": 3.5194174757281553,
"grad_norm": 0.654587158888464,
"learning_rate": 2.330152694526077e-05,
"loss": 0.3184,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33807533979415894,
"step": 2175,
"valid_targets_mean": 4148.2,
"valid_targets_min": 1399
},
{
"epoch": 3.527508090614887,
"grad_norm": 0.6152407643263405,
"learning_rate": 2.322190890413053e-05,
"loss": 0.3224,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30578580498695374,
"step": 2180,
"valid_targets_mean": 4575.1,
"valid_targets_min": 1130
},
{
"epoch": 3.5355987055016183,
"grad_norm": 0.6712841496569436,
"learning_rate": 2.3142238408396076e-05,
"loss": 0.3475,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3307744860649109,
"step": 2185,
"valid_targets_mean": 4259.9,
"valid_targets_min": 1158
},
{
"epoch": 3.5436893203883493,
"grad_norm": 0.672919162530352,
"learning_rate": 2.3062516755140733e-05,
"loss": 0.3256,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.339915931224823,
"step": 2190,
"valid_targets_mean": 4558.8,
"valid_targets_min": 1336
},
{
"epoch": 3.551779935275081,
"grad_norm": 0.7516148005411548,
"learning_rate": 2.2982745242280716e-05,
"loss": 0.3257,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34565508365631104,
"step": 2195,
"valid_targets_mean": 4438.0,
"valid_targets_min": 1266
},
{
"epoch": 3.559870550161812,
"grad_norm": 0.6032399842230928,
"learning_rate": 2.290292516854396e-05,
"loss": 0.3194,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31961023807525635,
"step": 2200,
"valid_targets_mean": 4544.9,
"valid_targets_min": 1267
},
{
"epoch": 3.5679611650485437,
"grad_norm": 0.6327368151188703,
"learning_rate": 2.2823057833449013e-05,
"loss": 0.336,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3518397808074951,
"step": 2205,
"valid_targets_mean": 4132.3,
"valid_targets_min": 1142
},
{
"epoch": 3.576051779935275,
"grad_norm": 0.5907129322549025,
"learning_rate": 2.274314453728386e-05,
"loss": 0.3344,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2956004738807678,
"step": 2210,
"valid_targets_mean": 4665.3,
"valid_targets_min": 1871
},
{
"epoch": 3.5841423948220066,
"grad_norm": 0.5773586353010518,
"learning_rate": 2.2663186581084777e-05,
"loss": 0.315,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30565541982650757,
"step": 2215,
"valid_targets_mean": 5279.4,
"valid_targets_min": 1157
},
{
"epoch": 3.592233009708738,
"grad_norm": 0.6978125591124367,
"learning_rate": 2.258318526661511e-05,
"loss": 0.3,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29132378101348877,
"step": 2220,
"valid_targets_mean": 3529.3,
"valid_targets_min": 1433
},
{
"epoch": 3.600323624595469,
"grad_norm": 0.7250064098063926,
"learning_rate": 2.250314189634412e-05,
"loss": 0.3619,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35525816679000854,
"step": 2225,
"valid_targets_mean": 3208.6,
"valid_targets_min": 1345
},
{
"epoch": 3.6084142394822005,
"grad_norm": 0.6810472579293779,
"learning_rate": 2.2423057773425745e-05,
"loss": 0.3143,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32046782970428467,
"step": 2230,
"valid_targets_mean": 3731.8,
"valid_targets_min": 1124
},
{
"epoch": 3.616504854368932,
"grad_norm": 0.6576908902184688,
"learning_rate": 2.2342934201677422e-05,
"loss": 0.339,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33715614676475525,
"step": 2235,
"valid_targets_mean": 4375.0,
"valid_targets_min": 368
},
{
"epoch": 3.6245954692556634,
"grad_norm": 0.8395915796514543,
"learning_rate": 2.2262772485558814e-05,
"loss": 0.3304,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3146824240684509,
"step": 2240,
"valid_targets_mean": 2428.5,
"valid_targets_min": 895
},
{
"epoch": 3.632686084142395,
"grad_norm": 0.7431826617479385,
"learning_rate": 2.218257393015062e-05,
"loss": 0.3391,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33532094955444336,
"step": 2245,
"valid_targets_mean": 3131.6,
"valid_targets_min": 1451
},
{
"epoch": 3.6407766990291264,
"grad_norm": 0.6622130333948848,
"learning_rate": 2.2102339841133285e-05,
"loss": 0.3193,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3246265649795532,
"step": 2250,
"valid_targets_mean": 4755.8,
"valid_targets_min": 1169
},
{
"epoch": 3.648867313915858,
"grad_norm": 0.6260074949359321,
"learning_rate": 2.2022071524765786e-05,
"loss": 0.3034,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29530560970306396,
"step": 2255,
"valid_targets_mean": 4335.2,
"valid_targets_min": 1644
},
{
"epoch": 3.656957928802589,
"grad_norm": 0.6440630664498894,
"learning_rate": 2.1941770287864315e-05,
"loss": 0.31,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28719133138656616,
"step": 2260,
"valid_targets_mean": 3863.4,
"valid_targets_min": 1861
},
{
"epoch": 3.6650485436893203,
"grad_norm": 0.6126886249442058,
"learning_rate": 2.1861437437781045e-05,
"loss": 0.3118,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3384862244129181,
"step": 2265,
"valid_targets_mean": 4486.1,
"valid_targets_min": 1413
},
{
"epoch": 3.6731391585760518,
"grad_norm": 0.7024210805695811,
"learning_rate": 2.1781074282382834e-05,
"loss": 0.3034,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33213749527931213,
"step": 2270,
"valid_targets_mean": 3520.7,
"valid_targets_min": 1401
},
{
"epoch": 3.6812297734627832,
"grad_norm": 0.7445912146264361,
"learning_rate": 2.170068213002992e-05,
"loss": 0.3059,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32845768332481384,
"step": 2275,
"valid_targets_mean": 3274.1,
"valid_targets_min": 1012
},
{
"epoch": 3.6893203883495147,
"grad_norm": 0.7396134273791413,
"learning_rate": 2.1620262289554628e-05,
"loss": 0.327,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3479768633842468,
"step": 2280,
"valid_targets_mean": 3706.2,
"valid_targets_min": 1061
},
{
"epoch": 3.6974110032362457,
"grad_norm": 0.6430183101362507,
"learning_rate": 2.1539816070240062e-05,
"loss": 0.3149,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28230059146881104,
"step": 2285,
"valid_targets_mean": 3550.2,
"valid_targets_min": 1327
},
{
"epoch": 3.705501618122977,
"grad_norm": 0.6548295376788589,
"learning_rate": 2.1459344781798807e-05,
"loss": 0.3331,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32259976863861084,
"step": 2290,
"valid_targets_mean": 4379.5,
"valid_targets_min": 1476
},
{
"epoch": 3.7135922330097086,
"grad_norm": 0.5791411549074513,
"learning_rate": 2.1378849734351565e-05,
"loss": 0.2894,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30870115756988525,
"step": 2295,
"valid_targets_mean": 5011.4,
"valid_targets_min": 311
},
{
"epoch": 3.72168284789644,
"grad_norm": 0.6686774018016203,
"learning_rate": 2.1298332238405856e-05,
"loss": 0.2997,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3138067126274109,
"step": 2300,
"valid_targets_mean": 3748.7,
"valid_targets_min": 1322
},
{
"epoch": 3.7297734627831716,
"grad_norm": 0.6176250019902619,
"learning_rate": 2.1217793604834687e-05,
"loss": 0.3208,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28627514839172363,
"step": 2305,
"valid_targets_mean": 4047.9,
"valid_targets_min": 1854
},
{
"epoch": 3.737864077669903,
"grad_norm": 0.6392998919122899,
"learning_rate": 2.1137235144855177e-05,
"loss": 0.3205,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30675268173217773,
"step": 2310,
"valid_targets_mean": 3985.9,
"valid_targets_min": 1189
},
{
"epoch": 3.7459546925566345,
"grad_norm": 0.6810561058243152,
"learning_rate": 2.1056658170007247e-05,
"loss": 0.3127,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32047516107559204,
"step": 2315,
"valid_targets_mean": 4031.6,
"valid_targets_min": 1708
},
{
"epoch": 3.7540453074433655,
"grad_norm": 0.5224360936076557,
"learning_rate": 2.0976063992132252e-05,
"loss": 0.2486,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21849115192890167,
"step": 2320,
"valid_targets_mean": 6091.9,
"valid_targets_min": 1642
},
{
"epoch": 3.762135922330097,
"grad_norm": 0.5087393518020041,
"learning_rate": 2.0895453923351613e-05,
"loss": 0.2107,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1869930475950241,
"step": 2325,
"valid_targets_mean": 5424.1,
"valid_targets_min": 4057
},
{
"epoch": 3.7702265372168284,
"grad_norm": 0.4499642484406925,
"learning_rate": 2.0814829276045465e-05,
"loss": 0.2086,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2276923507452011,
"step": 2330,
"valid_targets_mean": 5988.4,
"valid_targets_min": 1506
},
{
"epoch": 3.77831715210356,
"grad_norm": 0.49784474395857836,
"learning_rate": 2.0734191362831294e-05,
"loss": 0.2003,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22134488821029663,
"step": 2335,
"valid_targets_mean": 5366.7,
"valid_targets_min": 361
},
{
"epoch": 3.7864077669902914,
"grad_norm": 0.4512208729363229,
"learning_rate": 2.0653541496542566e-05,
"loss": 0.2173,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16249793767929077,
"step": 2340,
"valid_targets_mean": 6226.6,
"valid_targets_min": 317
},
{
"epoch": 3.794498381877023,
"grad_norm": 0.5065208653158666,
"learning_rate": 2.0572880990207343e-05,
"loss": 0.1874,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22169040143489838,
"step": 2345,
"valid_targets_mean": 5491.7,
"valid_targets_min": 2967
},
{
"epoch": 3.8025889967637543,
"grad_norm": 0.7330612173972851,
"learning_rate": 2.049221115702692e-05,
"loss": 0.1967,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19703437387943268,
"step": 2350,
"valid_targets_mean": 5216.8,
"valid_targets_min": 716
},
{
"epoch": 3.8106796116504853,
"grad_norm": 0.5442930834831672,
"learning_rate": 2.0411533310354433e-05,
"loss": 0.1947,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23777084052562714,
"step": 2355,
"valid_targets_mean": 5939.6,
"valid_targets_min": 314
},
{
"epoch": 3.8187702265372168,
"grad_norm": 0.5018825408101142,
"learning_rate": 2.0330848763673484e-05,
"loss": 0.2097,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22420501708984375,
"step": 2360,
"valid_targets_mean": 5939.4,
"valid_targets_min": 2599
},
{
"epoch": 3.8268608414239482,
"grad_norm": 0.4970494413717442,
"learning_rate": 2.0250158830576764e-05,
"loss": 0.1857,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20009323954582214,
"step": 2365,
"valid_targets_mean": 6258.1,
"valid_targets_min": 1956
},
{
"epoch": 3.8349514563106797,
"grad_norm": 0.44923834669987023,
"learning_rate": 2.0169464824744636e-05,
"loss": 0.1981,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1759965568780899,
"step": 2370,
"valid_targets_mean": 6348.2,
"valid_targets_min": 2993
},
{
"epoch": 3.843042071197411,
"grad_norm": 0.4495132904363796,
"learning_rate": 2.0088768059923795e-05,
"loss": 0.1933,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19953864812850952,
"step": 2375,
"valid_targets_mean": 6097.6,
"valid_targets_min": 1803
},
{
"epoch": 3.851132686084142,
"grad_norm": 0.5096333824884599,
"learning_rate": 2.0008069849905847e-05,
"loss": 0.22,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24274849891662598,
"step": 2380,
"valid_targets_mean": 6063.0,
"valid_targets_min": 620
},
{
"epoch": 3.8592233009708736,
"grad_norm": 0.4745564296696438,
"learning_rate": 1.9927371508505915e-05,
"loss": 0.1962,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21321144700050354,
"step": 2385,
"valid_targets_mean": 5397.2,
"valid_targets_min": 2991
},
{
"epoch": 3.867313915857605,
"grad_norm": 0.4561833046514106,
"learning_rate": 1.984667434954126e-05,
"loss": 0.2364,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23293474316596985,
"step": 2390,
"valid_targets_mean": 6302.4,
"valid_targets_min": 587
},
{
"epoch": 3.8754045307443366,
"grad_norm": 0.48692062588305735,
"learning_rate": 1.9765979686809912e-05,
"loss": 0.1988,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20418483018875122,
"step": 2395,
"valid_targets_mean": 5835.7,
"valid_targets_min": 1488
},
{
"epoch": 3.883495145631068,
"grad_norm": 0.5760245409491545,
"learning_rate": 1.968528883406925e-05,
"loss": 0.1985,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20110785961151123,
"step": 2400,
"valid_targets_mean": 6698.3,
"valid_targets_min": 1041
},
{
"epoch": 3.8915857605177995,
"grad_norm": 0.455942195772971,
"learning_rate": 1.9604603105014616e-05,
"loss": 0.2206,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19040292501449585,
"step": 2405,
"valid_targets_mean": 6100.8,
"valid_targets_min": 3304
},
{
"epoch": 3.899676375404531,
"grad_norm": 0.43188977809199325,
"learning_rate": 1.9523923813257957e-05,
"loss": 0.227,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18241921067237854,
"step": 2410,
"valid_targets_mean": 7247.2,
"valid_targets_min": 3122
},
{
"epoch": 3.907766990291262,
"grad_norm": 0.438052906217528,
"learning_rate": 1.9443252272306384e-05,
"loss": 0.1975,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2029222548007965,
"step": 2415,
"valid_targets_mean": 6403.1,
"valid_targets_min": 3898
},
{
"epoch": 3.9158576051779934,
"grad_norm": 0.47333386859383014,
"learning_rate": 1.9362589795540852e-05,
"loss": 0.2015,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1605544537305832,
"step": 2420,
"valid_targets_mean": 5129.8,
"valid_targets_min": 1379
},
{
"epoch": 3.923948220064725,
"grad_norm": 0.5199177948375372,
"learning_rate": 1.9281937696194723e-05,
"loss": 0.1831,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19830086827278137,
"step": 2425,
"valid_targets_mean": 5376.5,
"valid_targets_min": 2363
},
{
"epoch": 3.9320388349514563,
"grad_norm": 0.5206001127949775,
"learning_rate": 1.9201297287332428e-05,
"loss": 0.1963,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1985754817724228,
"step": 2430,
"valid_targets_mean": 5625.6,
"valid_targets_min": 1809
},
{
"epoch": 3.940129449838188,
"grad_norm": 0.5033961651148904,
"learning_rate": 1.912066988182806e-05,
"loss": 0.2091,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20823442935943604,
"step": 2435,
"valid_targets_mean": 6466.5,
"valid_targets_min": 3494
},
{
"epoch": 3.948220064724919,
"grad_norm": 0.4571578459678172,
"learning_rate": 1.9040056792344005e-05,
"loss": 0.1795,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19116318225860596,
"step": 2440,
"valid_targets_mean": 6313.9,
"valid_targets_min": 1775
},
{
"epoch": 3.9563106796116507,
"grad_norm": 0.44341434436450294,
"learning_rate": 1.8959459331309576e-05,
"loss": 0.2044,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19575943052768707,
"step": 2445,
"valid_targets_mean": 6352.2,
"valid_targets_min": 1426
},
{
"epoch": 3.9644012944983817,
"grad_norm": 0.45862690264733,
"learning_rate": 1.8878878810899653e-05,
"loss": 0.1959,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17178326845169067,
"step": 2450,
"valid_targets_mean": 6052.2,
"valid_targets_min": 3261
},
{
"epoch": 3.972491909385113,
"grad_norm": 0.47784816019033394,
"learning_rate": 1.8798316543013317e-05,
"loss": 0.2259,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21690775454044342,
"step": 2455,
"valid_targets_mean": 5542.8,
"valid_targets_min": 361
},
{
"epoch": 3.9805825242718447,
"grad_norm": 0.4393081044956994,
"learning_rate": 1.8717773839252477e-05,
"loss": 0.1967,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17442364990711212,
"step": 2460,
"valid_targets_mean": 5560.8,
"valid_targets_min": 1301
},
{
"epoch": 3.988673139158576,
"grad_norm": 0.4967733193720244,
"learning_rate": 1.8637252010900515e-05,
"loss": 0.2095,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19287577271461487,
"step": 2465,
"valid_targets_mean": 5077.6,
"valid_targets_min": 422
},
{
"epoch": 3.9967637540453076,
"grad_norm": 0.5150380483343356,
"learning_rate": 1.8556752368900972e-05,
"loss": 0.2011,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16168953478336334,
"step": 2470,
"valid_targets_mean": 5078.6,
"valid_targets_min": 310
},
{
"epoch": 4.004854368932039,
"grad_norm": 0.5006842825532989,
"learning_rate": 1.8476276223836177e-05,
"loss": 0.2593,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28505608439445496,
"step": 2475,
"valid_targets_mean": 7461.8,
"valid_targets_min": 4222
},
{
"epoch": 4.0129449838187705,
"grad_norm": 0.4449390233467316,
"learning_rate": 1.8395824885905898e-05,
"loss": 0.2862,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3080679178237915,
"step": 2480,
"valid_targets_mean": 8813.2,
"valid_targets_min": 3435
},
{
"epoch": 4.0210355987055015,
"grad_norm": 0.45517804304428394,
"learning_rate": 1.8315399664906062e-05,
"loss": 0.2869,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30526304244995117,
"step": 2485,
"valid_targets_mean": 8051.2,
"valid_targets_min": 2932
},
{
"epoch": 4.029126213592233,
"grad_norm": 0.46941839918358313,
"learning_rate": 1.823500187020735e-05,
"loss": 0.2901,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32779282331466675,
"step": 2490,
"valid_targets_mean": 8165.1,
"valid_targets_min": 2978
},
{
"epoch": 4.0372168284789645,
"grad_norm": 0.4965357687908804,
"learning_rate": 1.815463281073396e-05,
"loss": 0.2765,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27793848514556885,
"step": 2495,
"valid_targets_mean": 7405.6,
"valid_targets_min": 3938
},
{
"epoch": 4.0453074433656955,
"grad_norm": 0.5034223412827382,
"learning_rate": 1.8074293794942262e-05,
"loss": 0.2797,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26466065645217896,
"step": 2500,
"valid_targets_mean": 6687.1,
"valid_targets_min": 2974
},
{
"epoch": 4.053398058252427,
"grad_norm": 0.440367832467616,
"learning_rate": 1.7993986130799477e-05,
"loss": 0.3048,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32282423973083496,
"step": 2505,
"valid_targets_mean": 7811.5,
"valid_targets_min": 3018
},
{
"epoch": 4.061488673139158,
"grad_norm": 0.48021732325557415,
"learning_rate": 1.7913711125762435e-05,
"loss": 0.2872,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25816529989242554,
"step": 2510,
"valid_targets_mean": 6452.9,
"valid_targets_min": 956
},
{
"epoch": 4.06957928802589,
"grad_norm": 0.4512446325214269,
"learning_rate": 1.7833470086756214e-05,
"loss": 0.2651,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2777278423309326,
"step": 2515,
"valid_targets_mean": 7293.6,
"valid_targets_min": 4247
},
{
"epoch": 4.077669902912621,
"grad_norm": 0.42845468052968455,
"learning_rate": 1.7753264320152934e-05,
"loss": 0.2651,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2563123106956482,
"step": 2520,
"valid_targets_mean": 7259.2,
"valid_targets_min": 2191
},
{
"epoch": 4.085760517799352,
"grad_norm": 0.4894422981849186,
"learning_rate": 1.7673095131750454e-05,
"loss": 0.2813,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2566876709461212,
"step": 2525,
"valid_targets_mean": 6200.4,
"valid_targets_min": 2703
},
{
"epoch": 4.093851132686084,
"grad_norm": 0.5167026880546517,
"learning_rate": 1.759296382675112e-05,
"loss": 0.3038,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32553917169570923,
"step": 2530,
"valid_targets_mean": 6045.4,
"valid_targets_min": 1991
},
{
"epoch": 4.101941747572815,
"grad_norm": 0.456225396026587,
"learning_rate": 1.7512871709740515e-05,
"loss": 0.2879,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3135607838630676,
"step": 2535,
"valid_targets_mean": 8484.8,
"valid_targets_min": 4321
},
{
"epoch": 4.110032362459547,
"grad_norm": 0.4359728834305482,
"learning_rate": 1.743282008466619e-05,
"loss": 0.2665,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.257236123085022,
"step": 2540,
"valid_targets_mean": 6967.7,
"valid_targets_min": 3742
},
{
"epoch": 4.118122977346278,
"grad_norm": 0.47833998100504577,
"learning_rate": 1.7352810254816498e-05,
"loss": 0.2912,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34937071800231934,
"step": 2545,
"valid_targets_mean": 8730.6,
"valid_targets_min": 4829
},
{
"epoch": 4.12621359223301,
"grad_norm": 0.4507590764600118,
"learning_rate": 1.727284352279934e-05,
"loss": 0.3133,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.338039368391037,
"step": 2550,
"valid_targets_mean": 8258.9,
"valid_targets_min": 2392
},
{
"epoch": 4.134304207119741,
"grad_norm": 0.46815652183190226,
"learning_rate": 1.7192921190520936e-05,
"loss": 0.2719,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2833985984325409,
"step": 2555,
"valid_targets_mean": 7541.9,
"valid_targets_min": 4054
},
{
"epoch": 4.142394822006472,
"grad_norm": 0.7041539993056743,
"learning_rate": 1.7113044559164657e-05,
"loss": 0.26,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2381104826927185,
"step": 2560,
"valid_targets_mean": 6805.5,
"valid_targets_min": 3012
},
{
"epoch": 4.150485436893204,
"grad_norm": 0.45520173715987966,
"learning_rate": 1.7033214929169847e-05,
"loss": 0.2864,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3208598494529724,
"step": 2565,
"valid_targets_mean": 8233.7,
"valid_targets_min": 3694
},
{
"epoch": 4.158576051779935,
"grad_norm": 0.4763941474946576,
"learning_rate": 1.695343360021064e-05,
"loss": 0.284,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28221839666366577,
"step": 2570,
"valid_targets_mean": 6891.4,
"valid_targets_min": 3734
},
{
"epoch": 4.166666666666667,
"grad_norm": 0.4372845011040278,
"learning_rate": 1.6873701871174782e-05,
"loss": 0.2888,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.316440224647522,
"step": 2575,
"valid_targets_mean": 8462.8,
"valid_targets_min": 2285
},
{
"epoch": 4.174757281553398,
"grad_norm": 0.4319984625589556,
"learning_rate": 1.6794021040142534e-05,
"loss": 0.2798,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2788882851600647,
"step": 2580,
"valid_targets_mean": 7721.5,
"valid_targets_min": 4003
},
{
"epoch": 4.18284789644013,
"grad_norm": 0.4459508263295891,
"learning_rate": 1.6714392404365467e-05,
"loss": 0.2874,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29237473011016846,
"step": 2585,
"valid_targets_mean": 7546.4,
"valid_targets_min": 3816
},
{
"epoch": 4.190938511326861,
"grad_norm": 0.44578985610791283,
"learning_rate": 1.6634817260245417e-05,
"loss": 0.2739,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26097139716148376,
"step": 2590,
"valid_targets_mean": 7171.8,
"valid_targets_min": 2549
},
{
"epoch": 4.199029126213592,
"grad_norm": 0.4837956443790072,
"learning_rate": 1.655529690331332e-05,
"loss": 0.2742,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2902294993400574,
"step": 2595,
"valid_targets_mean": 6778.6,
"valid_targets_min": 2080
},
{
"epoch": 4.207119741100324,
"grad_norm": 0.8167988548284764,
"learning_rate": 1.6475832628208165e-05,
"loss": 0.3336,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.42150378227233887,
"step": 2600,
"valid_targets_mean": 3177.8,
"valid_targets_min": 1294
},
{
"epoch": 4.215210355987055,
"grad_norm": 0.7615957557370234,
"learning_rate": 1.6396425728655874e-05,
"loss": 0.3736,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37615785002708435,
"step": 2605,
"valid_targets_mean": 3481.9,
"valid_targets_min": 1415
},
{
"epoch": 4.223300970873787,
"grad_norm": 0.7887356809021314,
"learning_rate": 1.6317077497448278e-05,
"loss": 0.3611,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32747870683670044,
"step": 2610,
"valid_targets_mean": 2773.0,
"valid_targets_min": 1253
},
{
"epoch": 4.231391585760518,
"grad_norm": 0.7388958962034481,
"learning_rate": 1.6237789226422033e-05,
"loss": 0.3449,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3640366196632385,
"step": 2615,
"valid_targets_mean": 3517.6,
"valid_targets_min": 977
},
{
"epoch": 4.239482200647249,
"grad_norm": 0.8211350839413274,
"learning_rate": 1.6158562206437634e-05,
"loss": 0.3689,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3327547311782837,
"step": 2620,
"valid_targets_mean": 2927.6,
"valid_targets_min": 1136
},
{
"epoch": 4.247572815533981,
"grad_norm": 0.8017947866736652,
"learning_rate": 1.6079397727358345e-05,
"loss": 0.3635,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33964037895202637,
"step": 2625,
"valid_targets_mean": 3221.8,
"valid_targets_min": 1246
},
{
"epoch": 4.255663430420712,
"grad_norm": 0.8231664391013209,
"learning_rate": 1.6000297078029256e-05,
"loss": 0.3763,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.41385623812675476,
"step": 2630,
"valid_targets_mean": 3345.7,
"valid_targets_min": 1123
},
{
"epoch": 4.263754045307444,
"grad_norm": 0.807482211440655,
"learning_rate": 1.5921261546256236e-05,
"loss": 0.3429,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3225884735584259,
"step": 2635,
"valid_targets_mean": 2662.1,
"valid_targets_min": 1310
},
{
"epoch": 4.271844660194175,
"grad_norm": 0.7308639134760625,
"learning_rate": 1.5842292418785026e-05,
"loss": 0.341,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3007241189479828,
"step": 2640,
"valid_targets_mean": 3257.6,
"valid_targets_min": 1319
},
{
"epoch": 4.2799352750809065,
"grad_norm": 0.805650608661951,
"learning_rate": 1.5763390981280258e-05,
"loss": 0.3678,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39171522855758667,
"step": 2645,
"valid_targets_mean": 3564.8,
"valid_targets_min": 1082
},
{
"epoch": 4.288025889967638,
"grad_norm": 0.8261461823177421,
"learning_rate": 1.568455851830453e-05,
"loss": 0.3474,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.318564772605896,
"step": 2650,
"valid_targets_mean": 2672.8,
"valid_targets_min": 1292
},
{
"epoch": 4.296116504854369,
"grad_norm": 0.8080317661606545,
"learning_rate": 1.5605796313297502e-05,
"loss": 0.3602,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36015939712524414,
"step": 2655,
"valid_targets_mean": 3064.9,
"valid_targets_min": 977
},
{
"epoch": 4.3042071197411005,
"grad_norm": 0.6955171780036041,
"learning_rate": 1.552710564855498e-05,
"loss": 0.3383,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3366152048110962,
"step": 2660,
"valid_targets_mean": 3880.6,
"valid_targets_min": 877
},
{
"epoch": 4.3122977346278315,
"grad_norm": 0.7976014610219154,
"learning_rate": 1.5448487805208047e-05,
"loss": 0.334,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3383542001247406,
"step": 2665,
"valid_targets_mean": 3467.2,
"valid_targets_min": 1475
},
{
"epoch": 4.320388349514563,
"grad_norm": 0.7704921245778071,
"learning_rate": 1.5369944063202228e-05,
"loss": 0.3292,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3546125292778015,
"step": 2670,
"valid_targets_mean": 3955.9,
"valid_targets_min": 1137
},
{
"epoch": 4.328478964401294,
"grad_norm": 0.8636778847639369,
"learning_rate": 1.529147570127663e-05,
"loss": 0.3414,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35152947902679443,
"step": 2675,
"valid_targets_mean": 3870.5,
"valid_targets_min": 1294
},
{
"epoch": 4.336569579288026,
"grad_norm": 0.781729212171773,
"learning_rate": 1.5213083996943124e-05,
"loss": 0.3304,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3037518858909607,
"step": 2680,
"valid_targets_mean": 3128.0,
"valid_targets_min": 1222
},
{
"epoch": 4.344660194174757,
"grad_norm": 0.8221148280461172,
"learning_rate": 1.5134770226465533e-05,
"loss": 0.3461,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34873682260513306,
"step": 2685,
"valid_targets_mean": 3277.3,
"valid_targets_min": 1140
},
{
"epoch": 4.352750809061488,
"grad_norm": 0.9288812715286362,
"learning_rate": 1.5056535664838894e-05,
"loss": 0.3252,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3221864700317383,
"step": 2690,
"valid_targets_mean": 3244.1,
"valid_targets_min": 1388
},
{
"epoch": 4.36084142394822,
"grad_norm": 0.9070208170441065,
"learning_rate": 1.4978381585768676e-05,
"loss": 0.3611,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3749698996543884,
"step": 2695,
"valid_targets_mean": 2561.9,
"valid_targets_min": 1129
},
{
"epoch": 4.368932038834951,
"grad_norm": 1.0518568013946572,
"learning_rate": 1.490030926165002e-05,
"loss": 0.3364,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3401104807853699,
"step": 2700,
"valid_targets_mean": 1831.4,
"valid_targets_min": 1013
},
{
"epoch": 4.377022653721683,
"grad_norm": 0.8470545820516009,
"learning_rate": 1.4822319963547083e-05,
"loss": 0.3453,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34943297505378723,
"step": 2705,
"valid_targets_mean": 2959.6,
"valid_targets_min": 1689
},
{
"epoch": 4.385113268608414,
"grad_norm": 0.8641001873331948,
"learning_rate": 1.4744414961172267e-05,
"loss": 0.3528,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3659989833831787,
"step": 2710,
"valid_targets_mean": 3059.9,
"valid_targets_min": 910
},
{
"epoch": 4.393203883495145,
"grad_norm": 0.88611420485447,
"learning_rate": 1.4666595522865628e-05,
"loss": 0.3404,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34444698691368103,
"step": 2715,
"valid_targets_mean": 2292.4,
"valid_targets_min": 1128
},
{
"epoch": 4.401294498381877,
"grad_norm": 1.3843610065295007,
"learning_rate": 1.4588862915574158e-05,
"loss": 0.3398,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3170504570007324,
"step": 2720,
"valid_targets_mean": 3623.2,
"valid_targets_min": 999
},
{
"epoch": 4.409385113268608,
"grad_norm": 0.7553534225613581,
"learning_rate": 1.4511218404831208e-05,
"loss": 0.328,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32873186469078064,
"step": 2725,
"valid_targets_mean": 3616.4,
"valid_targets_min": 1483
},
{
"epoch": 4.41747572815534,
"grad_norm": 0.8279883071817279,
"learning_rate": 1.4433663254735868e-05,
"loss": 0.3529,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39501428604125977,
"step": 2730,
"valid_targets_mean": 3939.2,
"valid_targets_min": 1255
},
{
"epoch": 4.425566343042071,
"grad_norm": 0.8436452088585356,
"learning_rate": 1.4356198727932357e-05,
"loss": 0.3353,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3371664583683014,
"step": 2735,
"valid_targets_mean": 3482.7,
"valid_targets_min": 1309
},
{
"epoch": 4.433656957928803,
"grad_norm": 0.8425594216816737,
"learning_rate": 1.427882608558951e-05,
"loss": 0.3438,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3945726752281189,
"step": 2740,
"valid_targets_mean": 3203.9,
"valid_targets_min": 1117
},
{
"epoch": 4.441747572815534,
"grad_norm": 0.8552168356844453,
"learning_rate": 1.420154658738023e-05,
"loss": 0.3254,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31872445344924927,
"step": 2745,
"valid_targets_mean": 3138.2,
"valid_targets_min": 1094
},
{
"epoch": 4.449838187702265,
"grad_norm": 0.7442574111597251,
"learning_rate": 1.4124361491460979e-05,
"loss": 0.3182,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3369321823120117,
"step": 2750,
"valid_targets_mean": 3830.7,
"valid_targets_min": 1383
},
{
"epoch": 4.457928802588997,
"grad_norm": 0.7566819794836184,
"learning_rate": 1.4047272054451288e-05,
"loss": 0.3232,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3010716438293457,
"step": 2755,
"valid_targets_mean": 3429.1,
"valid_targets_min": 1021
},
{
"epoch": 4.466019417475728,
"grad_norm": 0.6907319746727313,
"learning_rate": 1.397027953141329e-05,
"loss": 0.3168,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2925443649291992,
"step": 2760,
"valid_targets_mean": 3514.2,
"valid_targets_min": 946
},
{
"epoch": 4.47411003236246,
"grad_norm": 0.6438477052295435,
"learning_rate": 1.3893385175831326e-05,
"loss": 0.3221,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3193925619125366,
"step": 2765,
"valid_targets_mean": 3938.4,
"valid_targets_min": 1167
},
{
"epoch": 4.482200647249191,
"grad_norm": 0.6045823119652175,
"learning_rate": 1.3816590239591502e-05,
"loss": 0.3221,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3105623126029968,
"step": 2770,
"valid_targets_mean": 5108.3,
"valid_targets_min": 1959
},
{
"epoch": 4.490291262135923,
"grad_norm": 0.7509833584246006,
"learning_rate": 1.3739895972961312e-05,
"loss": 0.299,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3150097131729126,
"step": 2775,
"valid_targets_mean": 3583.8,
"valid_targets_min": 660
},
{
"epoch": 4.498381877022654,
"grad_norm": 0.7392542720919617,
"learning_rate": 1.3663303624569303e-05,
"loss": 0.3232,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3625081181526184,
"step": 2780,
"valid_targets_mean": 3303.5,
"valid_targets_min": 1571
},
{
"epoch": 4.506472491909385,
"grad_norm": 0.7497171068842345,
"learning_rate": 1.3586814441384707e-05,
"loss": 0.3279,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32502812147140503,
"step": 2785,
"valid_targets_mean": 3323.2,
"valid_targets_min": 1681
},
{
"epoch": 4.514563106796117,
"grad_norm": 0.631259857417725,
"learning_rate": 1.3510429668697188e-05,
"loss": 0.3042,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28541266918182373,
"step": 2790,
"valid_targets_mean": 4724.1,
"valid_targets_min": 1245
},
{
"epoch": 4.522653721682848,
"grad_norm": 0.6720103718042312,
"learning_rate": 1.3434150550096534e-05,
"loss": 0.3051,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3023044764995575,
"step": 2795,
"valid_targets_mean": 3885.1,
"valid_targets_min": 1146
},
{
"epoch": 4.53074433656958,
"grad_norm": 0.7672977115433848,
"learning_rate": 1.3357978327452425e-05,
"loss": 0.3197,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3622583746910095,
"step": 2800,
"valid_targets_mean": 4696.1,
"valid_targets_min": 1528
},
{
"epoch": 4.538834951456311,
"grad_norm": 0.70767106431573,
"learning_rate": 1.3281914240894218e-05,
"loss": 0.3106,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.307115375995636,
"step": 2805,
"valid_targets_mean": 4114.5,
"valid_targets_min": 1384
},
{
"epoch": 4.546925566343042,
"grad_norm": 0.6165219862728282,
"learning_rate": 1.320595952879073e-05,
"loss": 0.3044,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30621129274368286,
"step": 2810,
"valid_targets_mean": 4788.4,
"valid_targets_min": 1569
},
{
"epoch": 4.555016181229774,
"grad_norm": 0.653761496025403,
"learning_rate": 1.3130115427730106e-05,
"loss": 0.2966,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2891233265399933,
"step": 2815,
"valid_targets_mean": 3966.3,
"valid_targets_min": 406
},
{
"epoch": 4.563106796116505,
"grad_norm": 0.7130430735759704,
"learning_rate": 1.3054383172499688e-05,
"loss": 0.3099,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2976634204387665,
"step": 2820,
"valid_targets_mean": 3847.1,
"valid_targets_min": 815
},
{
"epoch": 4.5711974110032365,
"grad_norm": 0.709782236189302,
"learning_rate": 1.2978763996065888e-05,
"loss": 0.3168,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3229979872703552,
"step": 2825,
"valid_targets_mean": 3528.3,
"valid_targets_min": 838
},
{
"epoch": 4.5792880258899675,
"grad_norm": 0.6662440633945301,
"learning_rate": 1.2903259129554138e-05,
"loss": 0.2897,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2709886431694031,
"step": 2830,
"valid_targets_mean": 3431.5,
"valid_targets_min": 1564
},
{
"epoch": 4.5873786407766985,
"grad_norm": 0.7092538828288426,
"learning_rate": 1.2827869802228816e-05,
"loss": 0.2963,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2797761559486389,
"step": 2835,
"valid_targets_mean": 3251.3,
"valid_targets_min": 1109
},
{
"epoch": 4.5954692556634305,
"grad_norm": 0.7572676051927053,
"learning_rate": 1.2752597241473273e-05,
"loss": 0.2869,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3064771294593811,
"step": 2840,
"valid_targets_mean": 3475.8,
"valid_targets_min": 1415
},
{
"epoch": 4.6035598705501615,
"grad_norm": 0.7552895417197777,
"learning_rate": 1.2677442672769832e-05,
"loss": 0.3289,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2986189126968384,
"step": 2845,
"valid_targets_mean": 3176.6,
"valid_targets_min": 1211
},
{
"epoch": 4.611650485436893,
"grad_norm": 1.5698337614598337,
"learning_rate": 1.2602407319679822e-05,
"loss": 0.3024,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3134298622608185,
"step": 2850,
"valid_targets_mean": 3906.7,
"valid_targets_min": 1499
},
{
"epoch": 4.619741100323624,
"grad_norm": 0.8306746135033737,
"learning_rate": 1.2527492403823664e-05,
"loss": 0.3168,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3346129059791565,
"step": 2855,
"valid_targets_mean": 3102.3,
"valid_targets_min": 1104
},
{
"epoch": 4.627831715210356,
"grad_norm": 0.7384107704279723,
"learning_rate": 1.2452699144861012e-05,
"loss": 0.3154,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3285127878189087,
"step": 2860,
"valid_targets_mean": 3321.5,
"valid_targets_min": 1397
},
{
"epoch": 4.635922330097087,
"grad_norm": 0.7333343742356498,
"learning_rate": 1.237802876047086e-05,
"loss": 0.3056,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2842520773410797,
"step": 2865,
"valid_targets_mean": 3407.2,
"valid_targets_min": 1416
},
{
"epoch": 4.644012944983819,
"grad_norm": 0.684739860910513,
"learning_rate": 1.2303482466331727e-05,
"loss": 0.2893,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27704834938049316,
"step": 2870,
"valid_targets_mean": 4077.6,
"valid_targets_min": 1619
},
{
"epoch": 4.65210355987055,
"grad_norm": 0.774294316328799,
"learning_rate": 1.2229061476101883e-05,
"loss": 0.2847,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31210005283355713,
"step": 2875,
"valid_targets_mean": 3397.1,
"valid_targets_min": 1294
},
{
"epoch": 4.660194174757281,
"grad_norm": 0.5794806170925674,
"learning_rate": 1.2154767001399551e-05,
"loss": 0.2817,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2938528060913086,
"step": 2880,
"valid_targets_mean": 5222.0,
"valid_targets_min": 1125
},
{
"epoch": 4.668284789644013,
"grad_norm": 0.5590770240692666,
"learning_rate": 1.2080600251783233e-05,
"loss": 0.2919,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2748606503009796,
"step": 2885,
"valid_targets_mean": 4730.9,
"valid_targets_min": 1312
},
{
"epoch": 4.676375404530744,
"grad_norm": 0.6572005056341561,
"learning_rate": 1.2006562434731968e-05,
"loss": 0.2809,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2911245822906494,
"step": 2890,
"valid_targets_mean": 3836.6,
"valid_targets_min": 1517
},
{
"epoch": 4.684466019417476,
"grad_norm": 0.6985233617878603,
"learning_rate": 1.193265475562571e-05,
"loss": 0.2981,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.325228214263916,
"step": 2895,
"valid_targets_mean": 4618.6,
"valid_targets_min": 1383
},
{
"epoch": 4.692556634304207,
"grad_norm": 0.874595786129551,
"learning_rate": 1.1858878417725683e-05,
"loss": 0.2979,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28530287742614746,
"step": 2900,
"valid_targets_mean": 4125.9,
"valid_targets_min": 1398
},
{
"epoch": 4.700647249190938,
"grad_norm": 0.6429408856747463,
"learning_rate": 1.1785234622154797e-05,
"loss": 0.2957,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.262306272983551,
"step": 2905,
"valid_targets_mean": 3722.9,
"valid_targets_min": 1407
},
{
"epoch": 4.70873786407767,
"grad_norm": 0.8608469799248508,
"learning_rate": 1.1711724567878095e-05,
"loss": 0.2979,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2957187592983246,
"step": 2910,
"valid_targets_mean": 3904.0,
"valid_targets_min": 1895
},
{
"epoch": 4.716828478964401,
"grad_norm": 0.7159209130807689,
"learning_rate": 1.1638349451683237e-05,
"loss": 0.2712,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2613191604614258,
"step": 2915,
"valid_targets_mean": 3557.5,
"valid_targets_min": 1695
},
{
"epoch": 4.724919093851133,
"grad_norm": 0.7446038352770069,
"learning_rate": 1.1565110468160996e-05,
"loss": 0.2959,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3005721867084503,
"step": 2920,
"valid_targets_mean": 3607.1,
"valid_targets_min": 1348
},
{
"epoch": 4.733009708737864,
"grad_norm": 0.7521397453688494,
"learning_rate": 1.1492008809685856e-05,
"loss": 0.295,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2908332347869873,
"step": 2925,
"valid_targets_mean": 3941.3,
"valid_targets_min": 1811
},
{
"epoch": 4.741100323624595,
"grad_norm": 0.8564547437417241,
"learning_rate": 1.141904566639652e-05,
"loss": 0.2934,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27682605385780334,
"step": 2930,
"valid_targets_mean": 2807.7,
"valid_targets_min": 431
},
{
"epoch": 4.749190938511327,
"grad_norm": 0.5946145119748939,
"learning_rate": 1.1346222226176606e-05,
"loss": 0.2838,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2541586458683014,
"step": 2935,
"valid_targets_mean": 5157.0,
"valid_targets_min": 1680
},
{
"epoch": 4.757281553398058,
"grad_norm": 0.532503556021208,
"learning_rate": 1.1273539674635296e-05,
"loss": 0.2004,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22031345963478088,
"step": 2940,
"valid_targets_mean": 5799.4,
"valid_targets_min": 2379
},
{
"epoch": 4.76537216828479,
"grad_norm": 0.4872712728960179,
"learning_rate": 1.1200999195088e-05,
"loss": 0.1858,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1671465039253235,
"step": 2945,
"valid_targets_mean": 6073.6,
"valid_targets_min": 950
},
{
"epoch": 4.773462783171521,
"grad_norm": 0.51692554376425,
"learning_rate": 1.1128601968537111e-05,
"loss": 0.2031,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19749924540519714,
"step": 2950,
"valid_targets_mean": 5545.0,
"valid_targets_min": 2475
},
{
"epoch": 4.781553398058253,
"grad_norm": 0.654761675129204,
"learning_rate": 1.1056349173652791e-05,
"loss": 0.1983,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26196080446243286,
"step": 2955,
"valid_targets_mean": 6686.8,
"valid_targets_min": 3124
},
{
"epoch": 4.789644012944984,
"grad_norm": 0.516926906571057,
"learning_rate": 1.098424198675375e-05,
"loss": 0.1785,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16444584727287292,
"step": 2960,
"valid_targets_mean": 4961.1,
"valid_targets_min": 587
},
{
"epoch": 4.797734627831716,
"grad_norm": 0.47172896644965434,
"learning_rate": 1.0912281581788138e-05,
"loss": 0.1764,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16139261424541473,
"step": 2965,
"valid_targets_mean": 6079.8,
"valid_targets_min": 1883
},
{
"epoch": 4.805825242718447,
"grad_norm": 0.5379469984334276,
"learning_rate": 1.0840469130314382e-05,
"loss": 0.1885,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18077893555164337,
"step": 2970,
"valid_targets_mean": 4933.7,
"valid_targets_min": 502
},
{
"epoch": 4.813915857605178,
"grad_norm": 0.5230760700961994,
"learning_rate": 1.0768805801482151e-05,
"loss": 0.1802,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18261444568634033,
"step": 2975,
"valid_targets_mean": 5915.8,
"valid_targets_min": 3455
},
{
"epoch": 4.82200647249191,
"grad_norm": 0.4689333862630784,
"learning_rate": 1.0697292762013304e-05,
"loss": 0.1958,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18166537582874298,
"step": 2980,
"valid_targets_mean": 6650.1,
"valid_targets_min": 2561
},
{
"epoch": 4.830097087378641,
"grad_norm": 0.49323440105643984,
"learning_rate": 1.0625931176182905e-05,
"loss": 0.1871,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20641836524009705,
"step": 2985,
"valid_targets_mean": 6220.2,
"valid_targets_min": 2745
},
{
"epoch": 4.8381877022653725,
"grad_norm": 0.42657327738024303,
"learning_rate": 1.0554722205800245e-05,
"loss": 0.161,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13979557156562805,
"step": 2990,
"valid_targets_mean": 6391.6,
"valid_targets_min": 2620
},
{
"epoch": 4.8462783171521036,
"grad_norm": 0.5850989160038047,
"learning_rate": 1.0483667010189973e-05,
"loss": 0.1896,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16110314428806305,
"step": 2995,
"valid_targets_mean": 5823.4,
"valid_targets_min": 2335
},
{
"epoch": 4.854368932038835,
"grad_norm": 0.4719018359213774,
"learning_rate": 1.0412766746173168e-05,
"loss": 0.2088,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19897709786891937,
"step": 3000,
"valid_targets_mean": 6701.3,
"valid_targets_min": 3184
},
{
"epoch": 4.8624595469255665,
"grad_norm": 0.4917541720726889,
"learning_rate": 1.0342022568048543e-05,
"loss": 0.1911,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20104116201400757,
"step": 3005,
"valid_targets_mean": 5738.4,
"valid_targets_min": 324
},
{
"epoch": 4.8705501618122975,
"grad_norm": 0.554594476082386,
"learning_rate": 1.0271435627573631e-05,
"loss": 0.2127,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21018058061599731,
"step": 3010,
"valid_targets_mean": 5771.9,
"valid_targets_min": 353
},
{
"epoch": 4.878640776699029,
"grad_norm": 0.458194799353725,
"learning_rate": 1.0201007073946041e-05,
"loss": 0.1745,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18960902094841003,
"step": 3015,
"valid_targets_mean": 6883.7,
"valid_targets_min": 405
},
{
"epoch": 4.88673139158576,
"grad_norm": 0.4901772432602992,
"learning_rate": 1.0130738053784768e-05,
"loss": 0.2035,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20777735114097595,
"step": 3020,
"valid_targets_mean": 5864.7,
"valid_targets_min": 922
},
{
"epoch": 4.894822006472491,
"grad_norm": 0.4858932378674697,
"learning_rate": 1.0060629711111494e-05,
"loss": 0.2267,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21894928812980652,
"step": 3025,
"valid_targets_mean": 6462.8,
"valid_targets_min": 3448
},
{
"epoch": 4.902912621359223,
"grad_norm": 0.505821195385407,
"learning_rate": 9.99068318733195e-06,
"loss": 0.1856,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21098601818084717,
"step": 3030,
"valid_targets_mean": 6119.8,
"valid_targets_min": 351
},
{
"epoch": 4.911003236245954,
"grad_norm": 0.48153855254257244,
"learning_rate": 9.92089962121741e-06,
"loss": 0.1844,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22040508687496185,
"step": 3035,
"valid_targets_mean": 5484.6,
"valid_targets_min": 484
},
{
"epoch": 4.919093851132686,
"grad_norm": 0.49628525274695584,
"learning_rate": 9.851280148886061e-06,
"loss": 0.1837,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15337306261062622,
"step": 3040,
"valid_targets_mean": 6356.4,
"valid_targets_min": 3465
},
{
"epoch": 4.927184466019417,
"grad_norm": 0.4569887725574397,
"learning_rate": 9.78182590378455e-06,
"loss": 0.1705,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1723887175321579,
"step": 3045,
"valid_targets_mean": 7204.9,
"valid_targets_min": 2930
},
{
"epoch": 4.935275080906149,
"grad_norm": 0.5296992143508796,
"learning_rate": 9.712538016669557e-06,
"loss": 0.1973,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18016985058784485,
"step": 3050,
"valid_targets_mean": 4959.0,
"valid_targets_min": 475
},
{
"epoch": 4.94336569579288,
"grad_norm": 0.46605102810031673,
"learning_rate": 9.643417615589299e-06,
"loss": 0.1702,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13274593651294708,
"step": 3055,
"valid_targets_mean": 5758.4,
"valid_targets_min": 3177
},
{
"epoch": 4.951456310679612,
"grad_norm": 0.4714801915792423,
"learning_rate": 9.574465825865276e-06,
"loss": 0.1797,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20519624650478363,
"step": 3060,
"valid_targets_mean": 6073.0,
"valid_targets_min": 2860
},
{
"epoch": 4.959546925566343,
"grad_norm": 0.45620286660464315,
"learning_rate": 9.50568377007386e-06,
"loss": 0.1813,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15038716793060303,
"step": 3065,
"valid_targets_mean": 5933.8,
"valid_targets_min": 3933
},
{
"epoch": 4.967637540453074,
"grad_norm": 0.4825590764718128,
"learning_rate": 9.43707256802806e-06,
"loss": 0.203,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.191915825009346,
"step": 3070,
"valid_targets_mean": 6224.9,
"valid_targets_min": 418
},
{
"epoch": 4.975728155339806,
"grad_norm": 0.49435258210955274,
"learning_rate": 9.368633336759292e-06,
"loss": 0.2068,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2108960747718811,
"step": 3075,
"valid_targets_mean": 6257.8,
"valid_targets_min": 2511
},
{
"epoch": 4.983818770226537,
"grad_norm": 0.5386278923623121,
"learning_rate": 9.300367190499178e-06,
"loss": 0.1952,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2313598096370697,
"step": 3080,
"valid_targets_mean": 5614.5,
"valid_targets_min": 4016
},
{
"epoch": 4.991909385113269,
"grad_norm": 0.43193135908684027,
"learning_rate": 9.232275240661403e-06,
"loss": 0.1901,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2286348193883896,
"step": 3085,
"valid_targets_mean": 7461.4,
"valid_targets_min": 3296
},
{
"epoch": 5.0,
"grad_norm": 0.5212733592125819,
"learning_rate": 9.164358595823661e-06,
"loss": 0.1827,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21457836031913757,
"step": 3090,
"valid_targets_mean": 6528.7,
"valid_targets_min": 1969
},
{
"epoch": 5.008090614886731,
"grad_norm": 0.5319495569626199,
"learning_rate": 9.096618361709545e-06,
"loss": 0.2744,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3067016005516052,
"step": 3095,
"valid_targets_mean": 7367.1,
"valid_targets_min": 1791
},
{
"epoch": 5.016181229773463,
"grad_norm": 0.5211577495479047,
"learning_rate": 9.029055641170588e-06,
"loss": 0.2771,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2768145203590393,
"step": 3100,
"valid_targets_mean": 8089.4,
"valid_targets_min": 5145
},
{
"epoch": 5.024271844660194,
"grad_norm": 0.5295823335577148,
"learning_rate": 8.961671534168292e-06,
"loss": 0.2793,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2725014388561249,
"step": 3105,
"valid_targets_mean": 7736.6,
"valid_targets_min": 2978
},
{
"epoch": 5.032362459546926,
"grad_norm": 0.7263128119198212,
"learning_rate": 8.894467137756228e-06,
"loss": 0.2731,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3000566363334656,
"step": 3110,
"valid_targets_mean": 7745.0,
"valid_targets_min": 2988
},
{
"epoch": 5.040453074433657,
"grad_norm": 0.45728545699209733,
"learning_rate": 8.827443546062165e-06,
"loss": 0.2602,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2903977036476135,
"step": 3115,
"valid_targets_mean": 7508.9,
"valid_targets_min": 3292
},
{
"epoch": 5.048543689320389,
"grad_norm": 0.46957717103053953,
"learning_rate": 8.760601850270277e-06,
"loss": 0.29,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30360230803489685,
"step": 3120,
"valid_targets_mean": 7365.6,
"valid_targets_min": 3274
},
{
"epoch": 5.05663430420712,
"grad_norm": 0.5000349877363641,
"learning_rate": 8.69394313860335e-06,
"loss": 0.2778,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3295597732067108,
"step": 3125,
"valid_targets_mean": 7283.9,
"valid_targets_min": 2285
},
{
"epoch": 5.064724919093851,
"grad_norm": 0.4761118410851209,
"learning_rate": 8.62746849630508e-06,
"loss": 0.2668,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27158045768737793,
"step": 3130,
"valid_targets_mean": 7289.2,
"valid_targets_min": 2822
},
{
"epoch": 5.072815533980583,
"grad_norm": 0.45387036145946663,
"learning_rate": 8.561179005622411e-06,
"loss": 0.2436,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25855568051338196,
"step": 3135,
"valid_targets_mean": 7387.5,
"valid_targets_min": 3823
},
{
"epoch": 5.080906148867314,
"grad_norm": 0.5514967218526795,
"learning_rate": 8.495075745787895e-06,
"loss": 0.2666,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2519291341304779,
"step": 3140,
"valid_targets_mean": 6462.8,
"valid_targets_min": 1285
},
{
"epoch": 5.088996763754046,
"grad_norm": 0.48360092752777134,
"learning_rate": 8.429159793002164e-06,
"loss": 0.2782,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31536170840263367,
"step": 3145,
"valid_targets_mean": 9115.1,
"valid_targets_min": 5927
},
{
"epoch": 5.097087378640777,
"grad_norm": 0.506081856785789,
"learning_rate": 8.363432220416336e-06,
"loss": 0.2914,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3049050569534302,
"step": 3150,
"valid_targets_mean": 7797.2,
"valid_targets_min": 1985
},
{
"epoch": 5.105177993527508,
"grad_norm": 0.5176036211803096,
"learning_rate": 8.297894098114612e-06,
"loss": 0.2665,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24461714923381805,
"step": 3155,
"valid_targets_mean": 7330.4,
"valid_targets_min": 2779
},
{
"epoch": 5.11326860841424,
"grad_norm": 0.45319450230478064,
"learning_rate": 8.232546493096836e-06,
"loss": 0.2545,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2451840341091156,
"step": 3160,
"valid_targets_mean": 7086.4,
"valid_targets_min": 2870
},
{
"epoch": 5.121359223300971,
"grad_norm": 0.5013359160427914,
"learning_rate": 8.167390469261105e-06,
"loss": 0.2906,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31205499172210693,
"step": 3165,
"valid_targets_mean": 8391.3,
"valid_targets_min": 880
},
{
"epoch": 5.1294498381877025,
"grad_norm": 0.48835871990641466,
"learning_rate": 8.102427087386457e-06,
"loss": 0.2891,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24966265261173248,
"step": 3170,
"valid_targets_mean": 6497.2,
"valid_targets_min": 3127
},
{
"epoch": 5.1375404530744335,
"grad_norm": 0.47289910533912854,
"learning_rate": 8.037657405115611e-06,
"loss": 0.2583,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2476363182067871,
"step": 3175,
"valid_targets_mean": 6541.8,
"valid_targets_min": 3567
},
{
"epoch": 5.145631067961165,
"grad_norm": 0.47539629536114814,
"learning_rate": 7.973082476937728e-06,
"loss": 0.2499,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2635002136230469,
"step": 3180,
"valid_targets_mean": 7617.8,
"valid_targets_min": 3885
},
{
"epoch": 5.1537216828478964,
"grad_norm": 0.5585549485849161,
"learning_rate": 7.908703354171283e-06,
"loss": 0.2897,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30579209327697754,
"step": 3185,
"valid_targets_mean": 5710.0,
"valid_targets_min": 284
},
{
"epoch": 5.1618122977346275,
"grad_norm": 0.44686022386718305,
"learning_rate": 7.844521084946895e-06,
"loss": 0.2588,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1834941804409027,
"step": 3190,
"valid_targets_mean": 6085.1,
"valid_targets_min": 3073
},
{
"epoch": 5.169902912621359,
"grad_norm": 0.4676860962444573,
"learning_rate": 7.780536714190298e-06,
"loss": 0.2881,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26917046308517456,
"step": 3195,
"valid_targets_mean": 7739.5,
"valid_targets_min": 3524
},
{
"epoch": 5.17799352750809,
"grad_norm": 0.4986507281328184,
"learning_rate": 7.716751283605324e-06,
"loss": 0.2788,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29654639959335327,
"step": 3200,
"valid_targets_mean": 7832.8,
"valid_targets_min": 2404
},
{
"epoch": 5.186084142394822,
"grad_norm": 0.47522046433557813,
"learning_rate": 7.653165831656937e-06,
"loss": 0.2598,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2719336450099945,
"step": 3205,
"valid_targets_mean": 6810.3,
"valid_targets_min": 3979
},
{
"epoch": 5.194174757281553,
"grad_norm": 0.4476741173784591,
"learning_rate": 7.589781393554321e-06,
"loss": 0.2614,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2759358584880829,
"step": 3210,
"valid_targets_mean": 7624.2,
"valid_targets_min": 3905
},
{
"epoch": 5.202265372168285,
"grad_norm": 0.5411741804025072,
"learning_rate": 7.526599001234058e-06,
"loss": 0.2776,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2656782269477844,
"step": 3215,
"valid_targets_mean": 6795.1,
"valid_targets_min": 3148
},
{
"epoch": 5.210355987055016,
"grad_norm": 0.8063416501663134,
"learning_rate": 7.463619683343284e-06,
"loss": 0.3344,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3292917013168335,
"step": 3220,
"valid_targets_mean": 3099.5,
"valid_targets_min": 1256
},
{
"epoch": 5.218446601941747,
"grad_norm": 0.7523254899644706,
"learning_rate": 7.400844465222963e-06,
"loss": 0.355,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3488837480545044,
"step": 3225,
"valid_targets_mean": 3709.8,
"valid_targets_min": 1344
},
{
"epoch": 5.226537216828479,
"grad_norm": 0.8129960141626508,
"learning_rate": 7.338274368891198e-06,
"loss": 0.3212,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29325389862060547,
"step": 3230,
"valid_targets_mean": 2654.6,
"valid_targets_min": 1082
},
{
"epoch": 5.23462783171521,
"grad_norm": 0.84891707484108,
"learning_rate": 7.275910413026579e-06,
"loss": 0.3384,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32466965913772583,
"step": 3235,
"valid_targets_mean": 2991.8,
"valid_targets_min": 1159
},
{
"epoch": 5.242718446601942,
"grad_norm": 0.8728926495709631,
"learning_rate": 7.213753612951624e-06,
"loss": 0.3494,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38176876306533813,
"step": 3240,
"valid_targets_mean": 3261.2,
"valid_targets_min": 1281
},
{
"epoch": 5.250809061488673,
"grad_norm": 0.8433417368439166,
"learning_rate": 7.1518049806162196e-06,
"loss": 0.338,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35416272282600403,
"step": 3245,
"valid_targets_mean": 3676.6,
"valid_targets_min": 1603
},
{
"epoch": 5.258899676375404,
"grad_norm": 0.8489581240200976,
"learning_rate": 7.090065524581136e-06,
"loss": 0.3485,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3246349096298218,
"step": 3250,
"valid_targets_mean": 3011.1,
"valid_targets_min": 1422
},
{
"epoch": 5.266990291262136,
"grad_norm": 0.8018879913146477,
"learning_rate": 7.0285362500016675e-06,
"loss": 0.3137,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29004016518592834,
"step": 3255,
"valid_targets_mean": 3071.8,
"valid_targets_min": 1277
},
{
"epoch": 5.275080906148867,
"grad_norm": 0.8444531679837199,
"learning_rate": 6.967218158611202e-06,
"loss": 0.3161,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3274296522140503,
"step": 3260,
"valid_targets_mean": 3090.8,
"valid_targets_min": 1079
},
{
"epoch": 5.283171521035599,
"grad_norm": 1.4990565330268864,
"learning_rate": 6.906112248704939e-06,
"loss": 0.3458,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3334260582923889,
"step": 3265,
"valid_targets_mean": 3369.2,
"valid_targets_min": 1104
},
{
"epoch": 5.29126213592233,
"grad_norm": 0.8525857578497839,
"learning_rate": 6.845219515123667e-06,
"loss": 0.3356,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38606202602386475,
"step": 3270,
"valid_targets_mean": 3657.6,
"valid_targets_min": 1556
},
{
"epoch": 5.299352750809062,
"grad_norm": 1.0945788176494664,
"learning_rate": 6.784540949237484e-06,
"loss": 0.3261,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3346405625343323,
"step": 3275,
"valid_targets_mean": 2946.7,
"valid_targets_min": 860
},
{
"epoch": 5.307443365695793,
"grad_norm": 0.7396805936736428,
"learning_rate": 6.724077538929759e-06,
"loss": 0.3146,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3220456838607788,
"step": 3280,
"valid_targets_mean": 3523.2,
"valid_targets_min": 1404
},
{
"epoch": 5.315533980582524,
"grad_norm": 0.6013604910785784,
"learning_rate": 6.663830268580971e-06,
"loss": 0.3049,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2951660752296448,
"step": 3285,
"valid_targets_mean": 5521.4,
"valid_targets_min": 1360
},
{
"epoch": 5.323624595469256,
"grad_norm": 0.8298768134992649,
"learning_rate": 6.6038001190527146e-06,
"loss": 0.3154,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3154316246509552,
"step": 3290,
"valid_targets_mean": 3396.9,
"valid_targets_min": 1336
},
{
"epoch": 5.331715210355987,
"grad_norm": 0.738625989323921,
"learning_rate": 6.543988067671752e-06,
"loss": 0.319,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32287925481796265,
"step": 3295,
"valid_targets_mean": 3617.4,
"valid_targets_min": 1726
},
{
"epoch": 5.339805825242719,
"grad_norm": 0.7679103475244519,
"learning_rate": 6.484395088214037e-06,
"loss": 0.3181,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35048407316207886,
"step": 3300,
"valid_targets_mean": 4753.2,
"valid_targets_min": 1146
},
{
"epoch": 5.34789644012945,
"grad_norm": 0.7895088467002501,
"learning_rate": 6.425022150888924e-06,
"loss": 0.3117,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2957543730735779,
"step": 3305,
"valid_targets_mean": 2988.0,
"valid_targets_min": 1665
},
{
"epoch": 5.355987055016181,
"grad_norm": 0.8257566232159592,
"learning_rate": 6.36587022232336e-06,
"loss": 0.3257,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3673299551010132,
"step": 3310,
"valid_targets_mean": 3400.9,
"valid_targets_min": 985
},
{
"epoch": 5.364077669902913,
"grad_norm": 0.7185396884990038,
"learning_rate": 6.306940265546117e-06,
"loss": 0.3203,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3062174320220947,
"step": 3315,
"valid_targets_mean": 3745.3,
"valid_targets_min": 1398
},
{
"epoch": 5.372168284789644,
"grad_norm": 0.733095396914552,
"learning_rate": 6.248233239972144e-06,
"loss": 0.3116,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2923792600631714,
"step": 3320,
"valid_targets_mean": 3360.9,
"valid_targets_min": 1133
},
{
"epoch": 5.380258899676376,
"grad_norm": 0.8773111466520589,
"learning_rate": 6.189750101386931e-06,
"loss": 0.3291,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35776978731155396,
"step": 3325,
"valid_targets_mean": 3318.2,
"valid_targets_min": 1383
},
{
"epoch": 5.388349514563107,
"grad_norm": 0.8173794193078433,
"learning_rate": 6.1314918019309535e-06,
"loss": 0.333,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33896470069885254,
"step": 3330,
"valid_targets_mean": 3564.1,
"valid_targets_min": 1035
},
{
"epoch": 5.3964401294498385,
"grad_norm": 1.189059892174759,
"learning_rate": 6.073459290084185e-06,
"loss": 0.3134,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.303739458322525,
"step": 3335,
"valid_targets_mean": 2470.4,
"valid_targets_min": 1285
},
{
"epoch": 5.4045307443365695,
"grad_norm": 0.7616019973262189,
"learning_rate": 6.01565351065063e-06,
"loss": 0.3099,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26032713055610657,
"step": 3340,
"valid_targets_mean": 3419.8,
"valid_targets_min": 1415
},
{
"epoch": 5.412621359223301,
"grad_norm": 0.6846961329277493,
"learning_rate": 5.958075404742951e-06,
"loss": 0.3137,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30751484632492065,
"step": 3345,
"valid_targets_mean": 3587.9,
"valid_targets_min": 1375
},
{
"epoch": 5.4207119741100325,
"grad_norm": 0.8653748694772552,
"learning_rate": 5.900725909767155e-06,
"loss": 0.3355,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2950606048107147,
"step": 3350,
"valid_targets_mean": 2614.4,
"valid_targets_min": 1066
},
{
"epoch": 5.4288025889967635,
"grad_norm": 0.7715947516706176,
"learning_rate": 5.843605959407326e-06,
"loss": 0.3092,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31399863958358765,
"step": 3355,
"valid_targets_mean": 3381.9,
"valid_targets_min": 1125
},
{
"epoch": 5.436893203883495,
"grad_norm": 0.8373987039194564,
"learning_rate": 5.7867164836104174e-06,
"loss": 0.3163,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.279275119304657,
"step": 3360,
"valid_targets_mean": 3233.6,
"valid_targets_min": 1199
},
{
"epoch": 5.444983818770226,
"grad_norm": 0.9106273725610025,
"learning_rate": 5.730058408571135e-06,
"loss": 0.3104,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3223729729652405,
"step": 3365,
"valid_targets_mean": 3305.2,
"valid_targets_min": 1344
},
{
"epoch": 5.453074433656958,
"grad_norm": 0.7994891025143966,
"learning_rate": 5.673632656716825e-06,
"loss": 0.296,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31081345677375793,
"step": 3370,
"valid_targets_mean": 3871.6,
"valid_targets_min": 1205
},
{
"epoch": 5.461165048543689,
"grad_norm": 0.7624042577791246,
"learning_rate": 5.617440146692485e-06,
"loss": 0.3069,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30954042077064514,
"step": 3375,
"valid_targets_mean": 3910.4,
"valid_targets_min": 1450
},
{
"epoch": 5.46925566343042,
"grad_norm": 0.7095484444373912,
"learning_rate": 5.561481793345786e-06,
"loss": 0.2977,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2747786045074463,
"step": 3380,
"valid_targets_mean": 4702.8,
"valid_targets_min": 2246
},
{
"epoch": 5.477346278317152,
"grad_norm": 0.7902102023863703,
"learning_rate": 5.505758507712196e-06,
"loss": 0.3146,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31908634305000305,
"step": 3385,
"valid_targets_mean": 3323.4,
"valid_targets_min": 1348
},
{
"epoch": 5.485436893203883,
"grad_norm": 0.7074947155569701,
"learning_rate": 5.450271197000128e-06,
"loss": 0.2976,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28372061252593994,
"step": 3390,
"valid_targets_mean": 3920.9,
"valid_targets_min": 1318
},
{
"epoch": 5.493527508090615,
"grad_norm": 0.6367141439259998,
"learning_rate": 5.395020764576211e-06,
"loss": 0.2876,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3219951093196869,
"step": 3395,
"valid_targets_mean": 4233.6,
"valid_targets_min": 1361
},
{
"epoch": 5.501618122977346,
"grad_norm": 0.7259097102070373,
"learning_rate": 5.340008109950512e-06,
"loss": 0.3182,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3297671675682068,
"step": 3400,
"valid_targets_mean": 3595.1,
"valid_targets_min": 1368
},
{
"epoch": 5.509708737864077,
"grad_norm": 0.9618474062674968,
"learning_rate": 5.285234128761969e-06,
"loss": 0.3086,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30990469455718994,
"step": 3405,
"valid_targets_mean": 3354.8,
"valid_targets_min": 1186
},
{
"epoch": 5.517799352750809,
"grad_norm": 0.6714184926341713,
"learning_rate": 5.230699712763758e-06,
"loss": 0.2823,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2863173484802246,
"step": 3410,
"valid_targets_mean": 4103.5,
"valid_targets_min": 1405
},
{
"epoch": 5.52588996763754,
"grad_norm": 0.8589890875883771,
"learning_rate": 5.176405749808786e-06,
"loss": 0.2911,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28313857316970825,
"step": 3415,
"valid_targets_mean": 4204.2,
"valid_targets_min": 941
},
{
"epoch": 5.533980582524272,
"grad_norm": 0.6924780807211832,
"learning_rate": 5.122353123835262e-06,
"loss": 0.3075,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.309023916721344,
"step": 3420,
"valid_targets_mean": 4473.8,
"valid_targets_min": 1696
},
{
"epoch": 5.542071197411003,
"grad_norm": 0.8142961750957524,
"learning_rate": 5.068542714852254e-06,
"loss": 0.2861,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.273823082447052,
"step": 3425,
"valid_targets_mean": 2837.8,
"valid_targets_min": 1330
},
{
"epoch": 5.550161812297735,
"grad_norm": 0.6118772127551925,
"learning_rate": 5.014975398925408e-06,
"loss": 0.2901,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26475781202316284,
"step": 3430,
"valid_targets_mean": 4635.1,
"valid_targets_min": 1166
},
{
"epoch": 5.558252427184466,
"grad_norm": 0.7697161843514183,
"learning_rate": 4.9616520481626794e-06,
"loss": 0.2882,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.329695463180542,
"step": 3435,
"valid_targets_mean": 3667.0,
"valid_targets_min": 1395
},
{
"epoch": 5.566343042071198,
"grad_norm": 0.6704301668195795,
"learning_rate": 4.908573530700111e-06,
"loss": 0.2935,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28023281693458557,
"step": 3440,
"valid_targets_mean": 4262.1,
"valid_targets_min": 940
},
{
"epoch": 5.574433656957929,
"grad_norm": 0.7411191986928855,
"learning_rate": 4.8557407106877175e-06,
"loss": 0.3049,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2993595004081726,
"step": 3445,
"valid_targets_mean": 3191.4,
"valid_targets_min": 1688
},
{
"epoch": 5.58252427184466,
"grad_norm": 0.6780175654020204,
"learning_rate": 4.8031544482754136e-06,
"loss": 0.2772,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27136701345443726,
"step": 3450,
"valid_targets_mean": 3711.2,
"valid_targets_min": 1280
},
{
"epoch": 5.590614886731392,
"grad_norm": 0.6656730656773023,
"learning_rate": 4.7508155995989944e-06,
"loss": 0.2699,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25287604331970215,
"step": 3455,
"valid_targets_mean": 4141.0,
"valid_targets_min": 1576
},
{
"epoch": 5.598705501618123,
"grad_norm": 0.7430435623053471,
"learning_rate": 4.6987250167662435e-06,
"loss": 0.3089,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3740665316581726,
"step": 3460,
"valid_targets_mean": 3920.6,
"valid_targets_min": 993
},
{
"epoch": 5.606796116504855,
"grad_norm": 0.8089842814454896,
"learning_rate": 4.6468835478430045e-06,
"loss": 0.2806,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27529019117355347,
"step": 3465,
"valid_targets_mean": 2930.4,
"valid_targets_min": 1271
},
{
"epoch": 5.614886731391586,
"grad_norm": 0.7119442724378142,
"learning_rate": 4.595292036839383e-06,
"loss": 0.3004,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3111814856529236,
"step": 3470,
"valid_targets_mean": 3889.4,
"valid_targets_min": 1109
},
{
"epoch": 5.622977346278317,
"grad_norm": 0.6843256595943354,
"learning_rate": 4.543951323696058e-06,
"loss": 0.3006,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2997050881385803,
"step": 3475,
"valid_targets_mean": 4169.0,
"valid_targets_min": 1262
},
{
"epoch": 5.631067961165049,
"grad_norm": 0.9105040696365415,
"learning_rate": 4.492862244270544e-06,
"loss": 0.2942,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28833556175231934,
"step": 3480,
"valid_targets_mean": 2340.9,
"valid_targets_min": 1380
},
{
"epoch": 5.63915857605178,
"grad_norm": 0.8519710587688972,
"learning_rate": 4.442025630323607e-06,
"loss": 0.2839,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2577669322490692,
"step": 3485,
"valid_targets_mean": 3383.8,
"valid_targets_min": 1136
},
{
"epoch": 5.647249190938512,
"grad_norm": 0.6327989909826687,
"learning_rate": 4.3914423095057516e-06,
"loss": 0.2747,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2794429659843445,
"step": 3490,
"valid_targets_mean": 4683.7,
"valid_targets_min": 1129
},
{
"epoch": 5.655339805825243,
"grad_norm": 0.7673156000554755,
"learning_rate": 4.341113105343673e-06,
"loss": 0.277,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29908567667007446,
"step": 3495,
"valid_targets_mean": 3994.8,
"valid_targets_min": 1930
},
{
"epoch": 5.663430420711974,
"grad_norm": 0.6723541515246171,
"learning_rate": 4.291038837226935e-06,
"loss": 0.2665,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26810508966445923,
"step": 3500,
"valid_targets_mean": 3837.7,
"valid_targets_min": 1419
},
{
"epoch": 5.671521035598706,
"grad_norm": 0.9407028763902802,
"learning_rate": 4.241220320394574e-06,
"loss": 0.2709,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2722015082836151,
"step": 3505,
"valid_targets_mean": 3206.0,
"valid_targets_min": 849
},
{
"epoch": 5.679611650485437,
"grad_norm": 0.7507137274318326,
"learning_rate": 4.191658365921838e-06,
"loss": 0.2687,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24956271052360535,
"step": 3510,
"valid_targets_mean": 3158.6,
"valid_targets_min": 1188
},
{
"epoch": 5.6877022653721685,
"grad_norm": 0.633710354363695,
"learning_rate": 4.1423537807070065e-06,
"loss": 0.2869,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28306400775909424,
"step": 3515,
"valid_targets_mean": 4985.4,
"valid_targets_min": 1162
},
{
"epoch": 5.6957928802588995,
"grad_norm": 0.7106919845148538,
"learning_rate": 4.0933073674582054e-06,
"loss": 0.2942,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28822749853134155,
"step": 3520,
"valid_targets_mean": 3605.8,
"valid_targets_min": 1229
},
{
"epoch": 5.703883495145631,
"grad_norm": 0.7709486431215857,
"learning_rate": 4.044519924680379e-06,
"loss": 0.2891,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3167271018028259,
"step": 3525,
"valid_targets_mean": 3628.4,
"valid_targets_min": 1204
},
{
"epoch": 5.711974110032362,
"grad_norm": 0.6752644698813571,
"learning_rate": 3.99599224666229e-06,
"loss": 0.2582,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25341057777404785,
"step": 3530,
"valid_targets_mean": 4005.9,
"valid_targets_min": 1431
},
{
"epoch": 5.720064724919094,
"grad_norm": 0.6562003474426554,
"learning_rate": 3.947725123463559e-06,
"loss": 0.2627,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.236685648560524,
"step": 3535,
"valid_targets_mean": 3881.7,
"valid_targets_min": 1211
},
{
"epoch": 5.728155339805825,
"grad_norm": 0.7556232041762883,
"learning_rate": 3.8997193409018245e-06,
"loss": 0.289,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27064526081085205,
"step": 3540,
"valid_targets_mean": 3740.8,
"valid_targets_min": 1231
},
{
"epoch": 5.736245954692556,
"grad_norm": 0.7338747249872632,
"learning_rate": 3.851975680539941e-06,
"loss": 0.2786,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25058260560035706,
"step": 3545,
"valid_targets_mean": 3616.2,
"valid_targets_min": 1364
},
{
"epoch": 5.744336569579288,
"grad_norm": 0.6512233633964314,
"learning_rate": 3.804494919673254e-06,
"loss": 0.274,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25747865438461304,
"step": 3550,
"valid_targets_mean": 3856.8,
"valid_targets_min": 1141
},
{
"epoch": 5.752427184466019,
"grad_norm": 0.5877368860493349,
"learning_rate": 3.757277831316961e-06,
"loss": 0.239,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17853707075119019,
"step": 3555,
"valid_targets_mean": 6443.2,
"valid_targets_min": 2485
},
{
"epoch": 5.760517799352751,
"grad_norm": 0.5882911139733148,
"learning_rate": 3.7103251841934993e-06,
"loss": 0.1935,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1725941300392151,
"step": 3560,
"valid_targets_mean": 5332.4,
"valid_targets_min": 824
},
{
"epoch": 5.768608414239482,
"grad_norm": 0.5213804910886257,
"learning_rate": 3.663637742720052e-06,
"loss": 0.181,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20349499583244324,
"step": 3565,
"valid_targets_mean": 6187.7,
"valid_targets_min": 2207
},
{
"epoch": 5.776699029126213,
"grad_norm": 0.4967460727403076,
"learning_rate": 3.617216266996093e-06,
"loss": 0.1791,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14877915382385254,
"step": 3570,
"valid_targets_mean": 5631.6,
"valid_targets_min": 2795
},
{
"epoch": 5.784789644012945,
"grad_norm": 0.46520895730300954,
"learning_rate": 3.571061512791012e-06,
"loss": 0.2074,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2052791714668274,
"step": 3575,
"valid_targets_mean": 7407.4,
"valid_targets_min": 1902
},
{
"epoch": 5.792880258899676,
"grad_norm": 0.605749686688732,
"learning_rate": 3.525174231531814e-06,
"loss": 0.1533,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17778176069259644,
"step": 3580,
"valid_targets_mean": 5209.8,
"valid_targets_min": 2991
},
{
"epoch": 5.800970873786408,
"grad_norm": 0.5738206053924397,
"learning_rate": 3.4795551702908935e-06,
"loss": 0.181,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23292459547519684,
"step": 3585,
"valid_targets_mean": 6012.4,
"valid_targets_min": 3782
},
{
"epoch": 5.809061488673139,
"grad_norm": 0.6919134158935569,
"learning_rate": 3.434205071773855e-06,
"loss": 0.1651,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15268674492835999,
"step": 3590,
"valid_targets_mean": 5490.8,
"valid_targets_min": 3401
},
{
"epoch": 5.81715210355987,
"grad_norm": 0.525226561251439,
"learning_rate": 3.3891246743074245e-06,
"loss": 0.1917,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1895448863506317,
"step": 3595,
"valid_targets_mean": 5865.4,
"valid_targets_min": 4021
},
{
"epoch": 5.825242718446602,
"grad_norm": 1.6748639613941427,
"learning_rate": 3.344314711827441e-06,
"loss": 0.1686,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1472940295934677,
"step": 3600,
"valid_targets_mean": 5680.2,
"valid_targets_min": 379
},
{
"epoch": 5.833333333333333,
"grad_norm": 0.45456760472205415,
"learning_rate": 3.299775913866894e-06,
"loss": 0.1816,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14308935403823853,
"step": 3605,
"valid_targets_mean": 5873.6,
"valid_targets_min": 1280
},
{
"epoch": 5.841423948220065,
"grad_norm": 0.5630454379610851,
"learning_rate": 3.255509005544062e-06,
"loss": 0.1661,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21299272775650024,
"step": 3610,
"valid_targets_mean": 4735.3,
"valid_targets_min": 392
},
{
"epoch": 5.849514563106796,
"grad_norm": 0.5764483473368531,
"learning_rate": 3.2115147075506957e-06,
"loss": 0.1878,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1859305202960968,
"step": 3615,
"valid_targets_mean": 5192.4,
"valid_targets_min": 647
},
{
"epoch": 5.857605177993528,
"grad_norm": 0.5025174908790243,
"learning_rate": 3.1677937361402654e-06,
"loss": 0.1784,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15480957925319672,
"step": 3620,
"valid_targets_mean": 5253.4,
"valid_targets_min": 253
},
{
"epoch": 5.865695792880259,
"grad_norm": 0.5379455694292067,
"learning_rate": 3.124346803116354e-06,
"loss": 0.2101,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2440945953130722,
"step": 3625,
"valid_targets_mean": 5694.6,
"valid_targets_min": 503
},
{
"epoch": 5.87378640776699,
"grad_norm": 0.5382994407776523,
"learning_rate": 3.0811746158210165e-06,
"loss": 0.1834,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19144295156002045,
"step": 3630,
"valid_targets_mean": 5798.9,
"valid_targets_min": 1824
},
{
"epoch": 5.881877022653722,
"grad_norm": 0.6049388573466525,
"learning_rate": 3.0382778771232766e-06,
"loss": 0.1787,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1829536110162735,
"step": 3635,
"valid_targets_mean": 6017.6,
"valid_targets_min": 2360
},
{
"epoch": 5.889967637540453,
"grad_norm": 1.0647486504663568,
"learning_rate": 2.9956572854077205e-06,
"loss": 0.2025,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24133262038230896,
"step": 3640,
"valid_targets_mean": 7051.8,
"valid_targets_min": 3489
},
{
"epoch": 5.898058252427185,
"grad_norm": 0.5096369018693362,
"learning_rate": 2.9533135345630536e-06,
"loss": 0.2075,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21242384612560272,
"step": 3645,
"valid_targets_mean": 6098.8,
"valid_targets_min": 1470
},
{
"epoch": 5.906148867313916,
"grad_norm": 0.5494897013669703,
"learning_rate": 2.911247313970882e-06,
"loss": 0.1728,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16211332380771637,
"step": 3650,
"valid_targets_mean": 4782.9,
"valid_targets_min": 366
},
{
"epoch": 5.914239482200648,
"grad_norm": 0.5116839125190226,
"learning_rate": 2.8694593084944356e-06,
"loss": 0.1879,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16128423810005188,
"step": 3655,
"valid_targets_mean": 5752.4,
"valid_targets_min": 3100
},
{
"epoch": 5.922330097087379,
"grad_norm": 0.5133859926626013,
"learning_rate": 2.8279501984674396e-06,
"loss": 0.1548,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12045817077159882,
"step": 3660,
"valid_targets_mean": 6254.7,
"valid_targets_min": 2156
},
{
"epoch": 5.93042071197411,
"grad_norm": 0.5696448579606227,
"learning_rate": 2.7867206596830355e-06,
"loss": 0.175,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20523615181446075,
"step": 3665,
"valid_targets_mean": 5049.7,
"valid_targets_min": 295
},
{
"epoch": 5.938511326860842,
"grad_norm": 0.4904852898035377,
"learning_rate": 2.7457713633827763e-06,
"loss": 0.1856,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18365246057510376,
"step": 3670,
"valid_targets_mean": 6636.9,
"valid_targets_min": 333
},
{
"epoch": 5.946601941747573,
"grad_norm": 0.5282042145989304,
"learning_rate": 2.705102976245697e-06,
"loss": 0.1618,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16423557698726654,
"step": 3675,
"valid_targets_mean": 5273.4,
"valid_targets_min": 2580
},
{
"epoch": 5.9546925566343045,
"grad_norm": 0.5154717781682355,
"learning_rate": 2.6647161603774763e-06,
"loss": 0.1824,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18065178394317627,
"step": 3680,
"valid_targets_mean": 5552.4,
"valid_targets_min": 396
},
{
"epoch": 5.9627831715210355,
"grad_norm": 0.48478327032359064,
"learning_rate": 2.624611573299629e-06,
"loss": 0.1796,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23541313409805298,
"step": 3685,
"valid_targets_mean": 7252.6,
"valid_targets_min": 4266
},
{
"epoch": 5.970873786407767,
"grad_norm": 0.539425851785002,
"learning_rate": 2.5847898679388217e-06,
"loss": 0.1968,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19013917446136475,
"step": 3690,
"valid_targets_mean": 5798.0,
"valid_targets_min": 2925
},
{
"epoch": 5.9789644012944985,
"grad_norm": 0.5429501981383015,
"learning_rate": 2.5452516926162394e-06,
"loss": 0.1838,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16128823161125183,
"step": 3695,
"valid_targets_mean": 6265.6,
"valid_targets_min": 2353
},
{
"epoch": 5.9870550161812295,
"grad_norm": 0.5651497028720758,
"learning_rate": 2.5059976910370255e-06,
"loss": 0.1851,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18095943331718445,
"step": 3700,
"valid_targets_mean": 5500.2,
"valid_targets_min": 2785
},
{
"epoch": 5.995145631067961,
"grad_norm": 0.5098750853748499,
"learning_rate": 2.467028502279802e-06,
"loss": 0.1873,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18532708287239075,
"step": 3705,
"valid_targets_mean": 6825.4,
"valid_targets_min": 2113
},
{
"epoch": 6.003236245954692,
"grad_norm": 0.6429110805047797,
"learning_rate": 2.428344760786283e-06,
"loss": 0.2118,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3460083305835724,
"step": 3710,
"valid_targets_mean": 8109.9,
"valid_targets_min": 2721
},
{
"epoch": 6.011326860841424,
"grad_norm": 0.617993460237832,
"learning_rate": 2.389947096350913e-06,
"loss": 0.2625,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27906131744384766,
"step": 3715,
"valid_targets_mean": 7440.1,
"valid_targets_min": 295
},
{
"epoch": 6.019417475728155,
"grad_norm": 0.5342153883227024,
"learning_rate": 2.3518361341106366e-06,
"loss": 0.2706,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2538403868675232,
"step": 3720,
"valid_targets_mean": 6666.0,
"valid_targets_min": 436
},
{
"epoch": 6.027508090614886,
"grad_norm": 0.49092970456222856,
"learning_rate": 2.3140124945347188e-06,
"loss": 0.2682,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2011633813381195,
"step": 3725,
"valid_targets_mean": 6712.9,
"valid_targets_min": 2430
},
{
"epoch": 6.035598705501618,
"grad_norm": 0.4772774830924541,
"learning_rate": 2.2764767934146304e-06,
"loss": 0.2691,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27531710267066956,
"step": 3730,
"valid_targets_mean": 7593.6,
"valid_targets_min": 2385
},
{
"epoch": 6.043689320388349,
"grad_norm": 0.4885723859576736,
"learning_rate": 2.2392296418540527e-06,
"loss": 0.2647,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31475353240966797,
"step": 3735,
"valid_targets_mean": 8572.8,
"valid_targets_min": 3812
},
{
"epoch": 6.051779935275081,
"grad_norm": 0.46349461761945754,
"learning_rate": 2.20227164625888e-06,
"loss": 0.2752,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23537136614322662,
"step": 3740,
"valid_targets_mean": 7005.8,
"valid_targets_min": 2432
},
{
"epoch": 6.059870550161812,
"grad_norm": 0.5143036769044641,
"learning_rate": 2.165603408327386e-06,
"loss": 0.2824,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2768769860267639,
"step": 3745,
"valid_targets_mean": 7800.5,
"valid_targets_min": 2317
},
{
"epoch": 6.067961165048544,
"grad_norm": 0.46034482764138784,
"learning_rate": 2.129225525040428e-06,
"loss": 0.244,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25223392248153687,
"step": 3750,
"valid_targets_mean": 7407.8,
"valid_targets_min": 3408
},
{
"epoch": 6.076051779935275,
"grad_norm": 0.48621110957683666,
"learning_rate": 2.0931385886517043e-06,
"loss": 0.2526,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2531178593635559,
"step": 3755,
"valid_targets_mean": 7218.2,
"valid_targets_min": 3958
},
{
"epoch": 6.084142394822006,
"grad_norm": 0.5155976217240823,
"learning_rate": 2.05734318667812e-06,
"loss": 0.2634,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27418065071105957,
"step": 3760,
"valid_targets_mean": 6286.2,
"valid_targets_min": 2470
},
{
"epoch": 6.092233009708738,
"grad_norm": 0.48664238742645205,
"learning_rate": 2.0218399018902368e-06,
"loss": 0.2731,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3080136477947235,
"step": 3765,
"valid_targets_mean": 8067.4,
"valid_targets_min": 3465
},
{
"epoch": 6.100323624595469,
"grad_norm": 0.46352182330349134,
"learning_rate": 1.986629312302759e-06,
"loss": 0.2725,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24487361311912537,
"step": 3770,
"valid_targets_mean": 7811.1,
"valid_targets_min": 3446
},
{
"epoch": 6.108414239482201,
"grad_norm": 0.47902814582303754,
"learning_rate": 1.9517119911651594e-06,
"loss": 0.2611,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27173787355422974,
"step": 3775,
"valid_targets_mean": 7021.4,
"valid_targets_min": 3473
},
{
"epoch": 6.116504854368932,
"grad_norm": 0.48426838259458393,
"learning_rate": 1.917088506952307e-06,
"loss": 0.2548,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21929030120372772,
"step": 3780,
"valid_targets_mean": 5997.2,
"valid_targets_min": 987
},
{
"epoch": 6.124595469255663,
"grad_norm": 0.5379855412992037,
"learning_rate": 1.8827594233552338e-06,
"loss": 0.298,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2751188278198242,
"step": 3785,
"valid_targets_mean": 7148.6,
"valid_targets_min": 4702
},
{
"epoch": 6.132686084142395,
"grad_norm": 0.4577375186919723,
"learning_rate": 1.8487252992719562e-06,
"loss": 0.2656,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24760842323303223,
"step": 3790,
"valid_targets_mean": 7563.4,
"valid_targets_min": 2494
},
{
"epoch": 6.140776699029126,
"grad_norm": 0.6351508094968208,
"learning_rate": 1.8149866887983747e-06,
"loss": 0.2526,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24771344661712646,
"step": 3795,
"valid_targets_mean": 7400.8,
"valid_targets_min": 2898
},
{
"epoch": 6.148867313915858,
"grad_norm": 0.4709978586642668,
"learning_rate": 1.7815441412192447e-06,
"loss": 0.2535,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23811772465705872,
"step": 3800,
"valid_targets_mean": 6554.0,
"valid_targets_min": 2859
},
{
"epoch": 6.156957928802589,
"grad_norm": 0.48529604703966406,
"learning_rate": 1.7483982009992506e-06,
"loss": 0.2742,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2738912105560303,
"step": 3805,
"valid_targets_mean": 8087.6,
"valid_targets_min": 3121
},
{
"epoch": 6.165048543689321,
"grad_norm": 0.5094951979756573,
"learning_rate": 1.715549407774124e-06,
"loss": 0.2645,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26680633425712585,
"step": 3810,
"valid_targets_mean": 7483.6,
"valid_targets_min": 2526
},
{
"epoch": 6.173139158576052,
"grad_norm": 0.49094410985136205,
"learning_rate": 1.6829982963418667e-06,
"loss": 0.2706,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2834646701812744,
"step": 3815,
"valid_targets_mean": 7937.6,
"valid_targets_min": 2332
},
{
"epoch": 6.181229773462783,
"grad_norm": 0.4943073784626869,
"learning_rate": 1.6507453966540454e-06,
"loss": 0.2681,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21011626720428467,
"step": 3820,
"valid_targets_mean": 5858.5,
"valid_targets_min": 1991
},
{
"epoch": 6.189320388349515,
"grad_norm": 0.5144149277940221,
"learning_rate": 1.6187912338071577e-06,
"loss": 0.2636,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21853004395961761,
"step": 3825,
"valid_targets_mean": 6832.9,
"valid_targets_min": 2464
},
{
"epoch": 6.197411003236246,
"grad_norm": 0.4876684368823754,
"learning_rate": 1.5871363280340913e-06,
"loss": 0.2515,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29543834924697876,
"step": 3830,
"valid_targets_mean": 7922.1,
"valid_targets_min": 3838
},
{
"epoch": 6.205501618122978,
"grad_norm": 0.8665595775858145,
"learning_rate": 1.555781194695649e-06,
"loss": 0.2853,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3264833092689514,
"step": 3835,
"valid_targets_mean": 3412.1,
"valid_targets_min": 1423
},
{
"epoch": 6.213592233009709,
"grad_norm": 0.892049887510929,
"learning_rate": 1.5247263442721494e-06,
"loss": 0.3463,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33291494846343994,
"step": 3840,
"valid_targets_mean": 3334.9,
"valid_targets_min": 1457
},
{
"epoch": 6.2216828478964405,
"grad_norm": 0.7890194853199695,
"learning_rate": 1.4939722823551428e-06,
"loss": 0.3381,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2830268442630768,
"step": 3845,
"valid_targets_mean": 3261.9,
"valid_targets_min": 1130
},
{
"epoch": 6.229773462783172,
"grad_norm": 0.9008470932667201,
"learning_rate": 1.4635195096391463e-06,
"loss": 0.304,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32268476486206055,
"step": 3850,
"valid_targets_mean": 3196.9,
"valid_targets_min": 1352
},
{
"epoch": 6.237864077669903,
"grad_norm": 0.8472773074650307,
"learning_rate": 1.4333685219135163e-06,
"loss": 0.3449,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3363885283470154,
"step": 3855,
"valid_targets_mean": 3218.4,
"valid_targets_min": 1283
},
{
"epoch": 6.2459546925566345,
"grad_norm": 0.8552973048647464,
"learning_rate": 1.403519810054379e-06,
"loss": 0.3296,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3232272267341614,
"step": 3860,
"valid_targets_mean": 3128.2,
"valid_targets_min": 1174
},
{
"epoch": 6.2540453074433655,
"grad_norm": 0.7934267015934255,
"learning_rate": 1.373973860016602e-06,
"loss": 0.3281,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3452760577201843,
"step": 3865,
"valid_targets_mean": 3595.7,
"valid_targets_min": 1167
},
{
"epoch": 6.262135922330097,
"grad_norm": 0.9335558226534135,
"learning_rate": 1.3447311528259354e-06,
"loss": 0.3284,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3375539779663086,
"step": 3870,
"valid_targets_mean": 2384.2,
"valid_targets_min": 1050
},
{
"epoch": 6.270226537216828,
"grad_norm": 1.020746618496496,
"learning_rate": 1.3157921645711436e-06,
"loss": 0.3124,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3059931993484497,
"step": 3875,
"valid_targets_mean": 2044.2,
"valid_targets_min": 1031
},
{
"epoch": 6.2783171521035595,
"grad_norm": 0.9350202814104195,
"learning_rate": 1.2871573663962611e-06,
"loss": 0.315,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34296131134033203,
"step": 3880,
"valid_targets_mean": 2718.1,
"valid_targets_min": 1454
},
{
"epoch": 6.286407766990291,
"grad_norm": 0.8146668135738933,
"learning_rate": 1.2588272244929401e-06,
"loss": 0.3302,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30769336223602295,
"step": 3885,
"valid_targets_mean": 3258.4,
"valid_targets_min": 1497
},
{
"epoch": 6.294498381877022,
"grad_norm": 0.8273218896381229,
"learning_rate": 1.2308022000928287e-06,
"loss": 0.3191,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3195771872997284,
"step": 3890,
"valid_targets_mean": 3150.2,
"valid_targets_min": 1604
},
{
"epoch": 6.302588996763754,
"grad_norm": 0.8419774148102896,
"learning_rate": 1.203082749460085e-06,
"loss": 0.3106,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2897275388240814,
"step": 3895,
"valid_targets_mean": 2876.9,
"valid_targets_min": 1155
},
{
"epoch": 6.310679611650485,
"grad_norm": 1.050868420114631,
"learning_rate": 1.1756693238839566e-06,
"loss": 0.3047,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29404884576797485,
"step": 3900,
"valid_targets_mean": 4079.6,
"valid_targets_min": 1052
},
{
"epoch": 6.318770226537217,
"grad_norm": 0.801631926562582,
"learning_rate": 1.1485623696714043e-06,
"loss": 0.2975,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28582143783569336,
"step": 3905,
"valid_targets_mean": 3415.6,
"valid_targets_min": 1602
},
{
"epoch": 6.326860841423948,
"grad_norm": 0.7993792702234223,
"learning_rate": 1.1217623281398571e-06,
"loss": 0.31,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2818544805049896,
"step": 3910,
"valid_targets_mean": 3181.6,
"valid_targets_min": 1316
},
{
"epoch": 6.334951456310679,
"grad_norm": 0.8511495939913303,
"learning_rate": 1.0952696356100234e-06,
"loss": 0.3094,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3155943751335144,
"step": 3915,
"valid_targets_mean": 3121.9,
"valid_targets_min": 1419
},
{
"epoch": 6.343042071197411,
"grad_norm": 0.7964448416131412,
"learning_rate": 1.069084723398781e-06,
"loss": 0.3071,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3194991946220398,
"step": 3920,
"valid_targets_mean": 3586.2,
"valid_targets_min": 1317
},
{
"epoch": 6.351132686084142,
"grad_norm": 1.895989148097138,
"learning_rate": 1.0432080178121695e-06,
"loss": 0.3055,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2887115478515625,
"step": 3925,
"valid_targets_mean": 2831.5,
"valid_targets_min": 970
},
{
"epoch": 6.359223300970874,
"grad_norm": 0.8254121060367813,
"learning_rate": 1.0176399401384306e-06,
"loss": 0.3191,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30215805768966675,
"step": 3930,
"valid_targets_mean": 3350.7,
"valid_targets_min": 1482
},
{
"epoch": 6.367313915857605,
"grad_norm": 0.8600251391796992,
"learning_rate": 9.92380906641166e-07,
"loss": 0.3095,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2902137339115143,
"step": 3935,
"valid_targets_mean": 3731.3,
"valid_targets_min": 2450
},
{
"epoch": 6.375404530744337,
"grad_norm": 0.8998136566486831,
"learning_rate": 9.674313285525484e-07,
"loss": 0.3088,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3461061716079712,
"step": 3940,
"valid_targets_mean": 2778.6,
"valid_targets_min": 1161
},
{
"epoch": 6.383495145631068,
"grad_norm": 0.9099848810975844,
"learning_rate": 9.427916120666314e-07,
"loss": 0.3182,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32288292050361633,
"step": 3945,
"valid_targets_mean": 2516.2,
"valid_targets_min": 1147
},
{
"epoch": 6.391585760517799,
"grad_norm": 0.9030343212723014,
"learning_rate": 9.18462158332738e-07,
"loss": 0.3118,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29295065999031067,
"step": 3950,
"valid_targets_mean": 2672.7,
"valid_targets_min": 1160
},
{
"epoch": 6.399676375404531,
"grad_norm": 1.0808970579643715,
"learning_rate": 8.944433634489335e-07,
"loss": 0.3125,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31745681166648865,
"step": 3955,
"valid_targets_mean": 3144.7,
"valid_targets_min": 1229
},
{
"epoch": 6.407766990291262,
"grad_norm": 0.8902905271705912,
"learning_rate": 8.707356184555626e-07,
"loss": 0.3006,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.307051420211792,
"step": 3960,
"valid_targets_mean": 2757.4,
"valid_targets_min": 1187
},
{
"epoch": 6.415857605177994,
"grad_norm": 0.8492882495541785,
"learning_rate": 8.473393093288962e-07,
"loss": 0.3102,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30651533603668213,
"step": 3965,
"valid_targets_mean": 3186.5,
"valid_targets_min": 1140
},
{
"epoch": 6.423948220064725,
"grad_norm": 0.8938811801174615,
"learning_rate": 8.242548169748388e-07,
"loss": 0.3147,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30959033966064453,
"step": 3970,
"valid_targets_mean": 2945.1,
"valid_targets_min": 1342
},
{
"epoch": 6.432038834951456,
"grad_norm": 0.8851063163539813,
"learning_rate": 8.014825172227359e-07,
"loss": 0.3006,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2955814003944397,
"step": 3975,
"valid_targets_mean": 2664.8,
"valid_targets_min": 1158
},
{
"epoch": 6.440129449838188,
"grad_norm": 0.8471775153920295,
"learning_rate": 7.790227808192497e-07,
"loss": 0.3096,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32479000091552734,
"step": 3980,
"valid_targets_mean": 3277.8,
"valid_targets_min": 905
},
{
"epoch": 6.448220064724919,
"grad_norm": 0.7712971413979559,
"learning_rate": 7.568759734223263e-07,
"loss": 0.2849,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26132726669311523,
"step": 3985,
"valid_targets_mean": 3435.2,
"valid_targets_min": 1523
},
{
"epoch": 6.456310679611651,
"grad_norm": 0.7960120633487386,
"learning_rate": 7.350424555952318e-07,
"loss": 0.3044,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2780383825302124,
"step": 3990,
"valid_targets_mean": 4198.9,
"valid_targets_min": 916
},
{
"epoch": 6.464401294498382,
"grad_norm": 0.7940656209613582,
"learning_rate": 7.135225828007009e-07,
"loss": 0.2947,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3192026615142822,
"step": 3995,
"valid_targets_mean": 4307.2,
"valid_targets_min": 1372
},
{
"epoch": 6.472491909385114,
"grad_norm": 0.8659078167481403,
"learning_rate": 6.92316705395133e-07,
"loss": 0.2949,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2758025527000427,
"step": 4000,
"valid_targets_mean": 4283.3,
"valid_targets_min": 965
},
{
"epoch": 6.480582524271845,
"grad_norm": 0.7520716674040167,
"learning_rate": 6.714251686228968e-07,
"loss": 0.3044,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3214672803878784,
"step": 4005,
"valid_targets_mean": 4556.1,
"valid_targets_min": 1616
},
{
"epoch": 6.488673139158576,
"grad_norm": 0.8133648933005242,
"learning_rate": 6.508483126107146e-07,
"loss": 0.2774,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.255154550075531,
"step": 4010,
"valid_targets_mean": 3447.2,
"valid_targets_min": 1306
},
{
"epoch": 6.496763754045308,
"grad_norm": 0.7949247419294541,
"learning_rate": 6.305864723621025e-07,
"loss": 0.2933,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3274669647216797,
"step": 4015,
"valid_targets_mean": 4328.6,
"valid_targets_min": 1066
},
{
"epoch": 6.504854368932039,
"grad_norm": 0.7110098139561425,
"learning_rate": 6.10639977751939e-07,
"loss": 0.3131,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28492259979248047,
"step": 4020,
"valid_targets_mean": 3835.6,
"valid_targets_min": 265
},
{
"epoch": 6.5129449838187705,
"grad_norm": 0.7126645911750137,
"learning_rate": 5.91009153521096e-07,
"loss": 0.2889,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24657857418060303,
"step": 4025,
"valid_targets_mean": 3986.9,
"valid_targets_min": 1113
},
{
"epoch": 6.5210355987055015,
"grad_norm": 0.7110478416139949,
"learning_rate": 5.716943192711277e-07,
"loss": 0.2818,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26910921931266785,
"step": 4030,
"valid_targets_mean": 4109.8,
"valid_targets_min": 1541
},
{
"epoch": 6.529126213592233,
"grad_norm": 0.7449519077071346,
"learning_rate": 5.526957894590923e-07,
"loss": 0.2875,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3063822388648987,
"step": 4035,
"valid_targets_mean": 4168.6,
"valid_targets_min": 2291
},
{
"epoch": 6.5372168284789645,
"grad_norm": 0.7021399739407856,
"learning_rate": 5.340138733924161e-07,
"loss": 0.3026,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2863706052303314,
"step": 4040,
"valid_targets_mean": 4216.5,
"valid_targets_min": 1752
},
{
"epoch": 6.5453074433656955,
"grad_norm": 0.7735052174852324,
"learning_rate": 5.156488752238708e-07,
"loss": 0.2843,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29372304677963257,
"step": 4045,
"valid_targets_mean": 3781.9,
"valid_targets_min": 1305
},
{
"epoch": 6.553398058252427,
"grad_norm": 0.763189708006023,
"learning_rate": 4.976010939466136e-07,
"loss": 0.2811,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.265279620885849,
"step": 4050,
"valid_targets_mean": 3348.1,
"valid_targets_min": 1135
},
{
"epoch": 6.561488673139158,
"grad_norm": 0.6971921406699557,
"learning_rate": 4.798708233893168e-07,
"loss": 0.2893,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3288305401802063,
"step": 4055,
"valid_targets_mean": 4481.9,
"valid_targets_min": 1322
},
{
"epoch": 6.56957928802589,
"grad_norm": 0.7843790286009376,
"learning_rate": 4.624583522113879e-07,
"loss": 0.2906,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31674474477767944,
"step": 4060,
"valid_targets_mean": 3422.4,
"valid_targets_min": 1174
},
{
"epoch": 6.577669902912621,
"grad_norm": 0.6898905734307865,
"learning_rate": 4.4536396389827986e-07,
"loss": 0.2808,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2700502872467041,
"step": 4065,
"valid_targets_mean": 3936.9,
"valid_targets_min": 991
},
{
"epoch": 6.585760517799352,
"grad_norm": 0.6732046516074872,
"learning_rate": 4.285879367568546e-07,
"loss": 0.2755,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2750830054283142,
"step": 4070,
"valid_targets_mean": 3986.6,
"valid_targets_min": 1735
},
{
"epoch": 6.593851132686084,
"grad_norm": 0.7679798193130004,
"learning_rate": 4.1213054391086914e-07,
"loss": 0.2622,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28283199667930603,
"step": 4075,
"valid_targets_mean": 3311.6,
"valid_targets_min": 1092
},
{
"epoch": 6.601941747572815,
"grad_norm": 0.6026507323893453,
"learning_rate": 3.959920532965278e-07,
"loss": 0.3089,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2601849436759949,
"step": 4080,
"valid_targets_mean": 4680.1,
"valid_targets_min": 1798
},
{
"epoch": 6.610032362459547,
"grad_norm": 0.7227252220712441,
"learning_rate": 3.8017272765810795e-07,
"loss": 0.278,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30186226963996887,
"step": 4085,
"valid_targets_mean": 4138.6,
"valid_targets_min": 1094
},
{
"epoch": 6.618122977346278,
"grad_norm": 0.6797239186310708,
"learning_rate": 3.646728245436926e-07,
"loss": 0.2947,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2772945761680603,
"step": 4090,
"valid_targets_mean": 3797.0,
"valid_targets_min": 1324
},
{
"epoch": 6.62621359223301,
"grad_norm": 0.6566219650337652,
"learning_rate": 3.4949259630097985e-07,
"loss": 0.295,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31445634365081787,
"step": 4095,
"valid_targets_mean": 4714.8,
"valid_targets_min": 1255
},
{
"epoch": 6.634304207119741,
"grad_norm": 0.7855187195704445,
"learning_rate": 3.346322900731602e-07,
"loss": 0.2921,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3059901297092438,
"step": 4100,
"valid_targets_mean": 3223.0,
"valid_targets_min": 1392
},
{
"epoch": 6.642394822006472,
"grad_norm": 0.687926997782234,
"learning_rate": 3.2009214779491703e-07,
"loss": 0.2714,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2721381187438965,
"step": 4105,
"valid_targets_mean": 3943.1,
"valid_targets_min": 1237
},
{
"epoch": 6.650485436893204,
"grad_norm": 0.6262388534931846,
"learning_rate": 3.0587240618845437e-07,
"loss": 0.2595,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2525428533554077,
"step": 4110,
"valid_targets_mean": 4954.7,
"valid_targets_min": 706
},
{
"epoch": 6.658576051779935,
"grad_norm": 0.7958100221453792,
"learning_rate": 2.9197329675967556e-07,
"loss": 0.266,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23203250765800476,
"step": 4115,
"valid_targets_mean": 3676.8,
"valid_targets_min": 1093
},
{
"epoch": 6.666666666666667,
"grad_norm": 0.6670568718226326,
"learning_rate": 2.7839504579439734e-07,
"loss": 0.277,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2591486871242523,
"step": 4120,
"valid_targets_mean": 4621.4,
"valid_targets_min": 1738
},
{
"epoch": 6.674757281553398,
"grad_norm": 0.6841964897124194,
"learning_rate": 2.651378743546662e-07,
"loss": 0.2584,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23089730739593506,
"step": 4125,
"valid_targets_mean": 3523.9,
"valid_targets_min": 1856
},
{
"epoch": 6.68284789644013,
"grad_norm": 0.7736922565372187,
"learning_rate": 2.5220199827516335e-07,
"loss": 0.2707,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2762467861175537,
"step": 4130,
"valid_targets_mean": 3767.3,
"valid_targets_min": 1039
},
{
"epoch": 6.690938511326861,
"grad_norm": 0.6878220159499924,
"learning_rate": 2.395876281596898e-07,
"loss": 0.2884,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.286093533039093,
"step": 4135,
"valid_targets_mean": 4240.9,
"valid_targets_min": 995
},
{
"epoch": 6.699029126213592,
"grad_norm": 0.6785912150782965,
"learning_rate": 2.2729496937773375e-07,
"loss": 0.2825,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3174231946468353,
"step": 4140,
"valid_targets_mean": 5330.5,
"valid_targets_min": 1212
},
{
"epoch": 6.707119741100324,
"grad_norm": 0.6514244014519243,
"learning_rate": 2.1532422206113957e-07,
"loss": 0.2717,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21629130840301514,
"step": 4145,
"valid_targets_mean": 3586.9,
"valid_targets_min": 1172
},
{
"epoch": 6.715210355987055,
"grad_norm": 0.7503383439275698,
"learning_rate": 2.036755811008284e-07,
"loss": 0.2603,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.261480450630188,
"step": 4150,
"valid_targets_mean": 3200.2,
"valid_targets_min": 1561
},
{
"epoch": 6.723300970873787,
"grad_norm": 0.7498083689815956,
"learning_rate": 1.9234923614364298e-07,
"loss": 0.2688,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31724271178245544,
"step": 4155,
"valid_targets_mean": 3854.4,
"valid_targets_min": 1217
},
{
"epoch": 6.731391585760518,
"grad_norm": 0.8416117264342016,
"learning_rate": 1.813453715892588e-07,
"loss": 0.2766,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30290308594703674,
"step": 4160,
"valid_targets_mean": 2972.9,
"valid_targets_min": 333
},
{
"epoch": 6.739482200647249,
"grad_norm": 0.7415989066146672,
"learning_rate": 1.706641665871689e-07,
"loss": 0.2747,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.292361855506897,
"step": 4165,
"valid_targets_mean": 3447.4,
"valid_targets_min": 1280
},
{
"epoch": 6.747572815533981,
"grad_norm": 0.7261344570096327,
"learning_rate": 1.603057950337794e-07,
"loss": 0.2685,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2824702262878418,
"step": 4170,
"valid_targets_mean": 3488.9,
"valid_targets_min": 1389
},
{
"epoch": 6.755663430420712,
"grad_norm": 0.5981854317735275,
"learning_rate": 1.5027042556958083e-07,
"loss": 0.195,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16710269451141357,
"step": 4175,
"valid_targets_mean": 6022.9,
"valid_targets_min": 2384
},
{
"epoch": 6.763754045307444,
"grad_norm": 0.6204828785463561,
"learning_rate": 1.4055822157638566e-07,
"loss": 0.1855,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17309242486953735,
"step": 4180,
"valid_targets_mean": 6773.4,
"valid_targets_min": 1712
},
{
"epoch": 6.771844660194175,
"grad_norm": 0.6175696916898002,
"learning_rate": 1.3116934117468617e-07,
"loss": 0.1864,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1712668240070343,
"step": 4185,
"valid_targets_mean": 5853.4,
"valid_targets_min": 2336
},
{
"epoch": 6.779935275080906,
"grad_norm": 0.6110178559303455,
"learning_rate": 1.2210393722106973e-07,
"loss": 0.1748,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16805970668792725,
"step": 4190,
"valid_targets_mean": 5625.0,
"valid_targets_min": 341
},
{
"epoch": 6.788025889967638,
"grad_norm": 0.5850597980478186,
"learning_rate": 1.1336215730573863e-07,
"loss": 0.1884,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.141169935464859,
"step": 4195,
"valid_targets_mean": 4999.9,
"valid_targets_min": 546
},
{
"epoch": 6.796116504854369,
"grad_norm": 0.5304772632067583,
"learning_rate": 1.0494414375009642e-07,
"loss": 0.1677,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16190440952777863,
"step": 4200,
"valid_targets_mean": 5886.6,
"valid_targets_min": 362
},
{
"epoch": 6.8042071197411005,
"grad_norm": 0.7157488847124063,
"learning_rate": 9.68500336044409e-08,
"loss": 0.1746,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16354969143867493,
"step": 4205,
"valid_targets_mean": 5545.2,
"valid_targets_min": 349
},
{
"epoch": 6.8122977346278315,
"grad_norm": 0.6188536501701989,
"learning_rate": 8.907995864572583e-08,
"loss": 0.1707,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1599283516407013,
"step": 4210,
"valid_targets_mean": 5221.4,
"valid_targets_min": 685
},
{
"epoch": 6.820388349514563,
"grad_norm": 0.6051646108971138,
"learning_rate": 8.16340453754183e-08,
"loss": 0.1865,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15831029415130615,
"step": 4215,
"valid_targets_mean": 6906.4,
"valid_targets_min": 3688
},
{
"epoch": 6.828478964401294,
"grad_norm": 0.6843142673349079,
"learning_rate": 7.451241501744255e-08,
"loss": 0.1734,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2084500789642334,
"step": 4220,
"valid_targets_mean": 5886.7,
"valid_targets_min": 3248
},
{
"epoch": 6.836569579288026,
"grad_norm": 0.8169465061204166,
"learning_rate": 6.771518351619932e-08,
"loss": 0.165,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1563340127468109,
"step": 4225,
"valid_targets_mean": 5565.2,
"valid_targets_min": 849
},
{
"epoch": 6.844660194174757,
"grad_norm": 0.6240263655362814,
"learning_rate": 6.124246153468516e-08,
"loss": 0.1757,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18898531794548035,
"step": 4230,
"valid_targets_mean": 4495.2,
"valid_targets_min": 1104
},
{
"epoch": 6.852750809061488,
"grad_norm": 0.6165610195908027,
"learning_rate": 5.5094354452684964e-08,
"loss": 0.1912,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17224600911140442,
"step": 4235,
"valid_targets_mean": 5532.5,
"valid_targets_min": 3084
},
{
"epoch": 6.86084142394822,
"grad_norm": 0.5752785701802093,
"learning_rate": 4.927096236505779e-08,
"loss": 0.1809,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22186093032360077,
"step": 4240,
"valid_targets_mean": 6345.2,
"valid_targets_min": 2085
},
{
"epoch": 6.868932038834951,
"grad_norm": 0.6268844620559095,
"learning_rate": 4.3772380080111534e-08,
"loss": 0.2009,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1646140217781067,
"step": 4245,
"valid_targets_mean": 6782.8,
"valid_targets_min": 4896
},
{
"epoch": 6.877022653721683,
"grad_norm": 0.546664853489719,
"learning_rate": 3.85986971180552e-08,
"loss": 0.1696,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12946677207946777,
"step": 4250,
"valid_targets_mean": 4796.1,
"valid_targets_min": 1174
},
{
"epoch": 6.885113268608414,
"grad_norm": 0.6505927779685415,
"learning_rate": 3.374999770954013e-08,
"loss": 0.1907,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1995866596698761,
"step": 4255,
"valid_targets_mean": 6176.4,
"valid_targets_min": 2462
},
{
"epoch": 6.893203883495145,
"grad_norm": 0.6100138602783509,
"learning_rate": 2.9226360794296638e-08,
"loss": 0.2156,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28793472051620483,
"step": 4260,
"valid_targets_mean": 5792.8,
"valid_targets_min": 3198
},
{
"epoch": 6.901294498381877,
"grad_norm": 0.5130289551978165,
"learning_rate": 2.502786001983726e-08,
"loss": 0.1784,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15492425858974457,
"step": 4265,
"valid_targets_mean": 6734.0,
"valid_targets_min": 3363
},
{
"epoch": 6.909385113268608,
"grad_norm": 0.5083619319200668,
"learning_rate": 2.1154563740266588e-08,
"loss": 0.173,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1484774798154831,
"step": 4270,
"valid_targets_mean": 6156.2,
"valid_targets_min": 3554
},
{
"epoch": 6.91747572815534,
"grad_norm": 0.5437899387117957,
"learning_rate": 1.7606535015164405e-08,
"loss": 0.1874,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19615788757801056,
"step": 4275,
"valid_targets_mean": 6275.4,
"valid_targets_min": 521
},
{
"epoch": 6.925566343042071,
"grad_norm": 0.535514833773013,
"learning_rate": 1.4383831608562048e-08,
"loss": 0.1581,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18205270171165466,
"step": 4280,
"valid_targets_mean": 6298.0,
"valid_targets_min": 437
},
{
"epoch": 6.933656957928802,
"grad_norm": 0.5176082517371361,
"learning_rate": 1.14865059879965e-08,
"loss": 0.1864,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24456022679805756,
"step": 4285,
"valid_targets_mean": 6639.6,
"valid_targets_min": 2502
},
{
"epoch": 6.941747572815534,
"grad_norm": 0.5795990513548355,
"learning_rate": 8.914605323664394e-09,
"loss": 0.1704,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16445422172546387,
"step": 4290,
"valid_targets_mean": 5588.2,
"valid_targets_min": 3131
},
{
"epoch": 6.949838187702265,
"grad_norm": 0.6200044961722991,
"learning_rate": 6.66817148764487e-09,
"loss": 0.1564,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16037827730178833,
"step": 4295,
"valid_targets_mean": 5546.2,
"valid_targets_min": 892
},
{
"epoch": 6.957928802588997,
"grad_norm": 0.6945388564726743,
"learning_rate": 4.7472410532245495e-09,
"loss": 0.1825,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16633108258247375,
"step": 4300,
"valid_targets_mean": 5383.6,
"valid_targets_min": 632
},
{
"epoch": 6.966019417475728,
"grad_norm": 0.5779686340710244,
"learning_rate": 3.151845294302458e-09,
"loss": 0.1862,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22585266828536987,
"step": 4305,
"valid_targets_mean": 5866.8,
"valid_targets_min": 523
},
{
"epoch": 6.97411003236246,
"grad_norm": 0.5613541281121649,
"learning_rate": 1.882010184874883e-09,
"loss": 0.1936,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1740507185459137,
"step": 4310,
"valid_targets_mean": 5499.6,
"valid_targets_min": 1071
},
{
"epoch": 6.982200647249191,
"grad_norm": 0.5251874269236045,
"learning_rate": 9.377563986157078e-10,
"loss": 0.1831,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2157984972000122,
"step": 4315,
"valid_targets_mean": 6634.6,
"valid_targets_min": 910
},
{
"epoch": 6.990291262135923,
"grad_norm": 0.515253369974493,
"learning_rate": 3.1909930854112646e-10,
"loss": 0.1816,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1872372180223465,
"step": 4320,
"valid_targets_mean": 5642.3,
"valid_targets_min": 409
},
{
"epoch": 6.998381877022654,
"grad_norm": 0.5332063951683166,
"learning_rate": 2.6048986760951466e-11,
"loss": 0.177,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17377439141273499,
"step": 4325,
"valid_targets_mean": 5486.1,
"valid_targets_min": 628
},
{
"epoch": 7.0,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20184344053268433,
"step": 4326,
"total_flos": 1656860604825600.0,
"train_loss": 0.3245428150801321,
"train_runtime": 27498.7411,
"train_samples_per_second": 2.513,
"train_steps_per_second": 0.157,
"valid_targets_mean": 6528.7,
"valid_targets_min": 1969
}
],
"logging_steps": 5,
"max_steps": 4326,
"num_input_tokens_seen": 0,
"num_train_epochs": 7,
"save_steps": 1500,
"stateful_callbacks": {
"TrainerControl": {
"args": {
"should_epoch_stop": false,
"should_evaluate": false,
"should_log": false,
"should_save": true,
"should_training_stop": true
},
"attributes": {}
}
},
"total_flos": 1656860604825600.0,
"train_batch_size": 1,
"trial_name": null,
"trial_params": null
}