Files
a1-repo_scaffold/trainer_state.json
ModelHub XC 99e13f2d72 初始化项目,由ModelHub XC社区提供模型
Model: DCAgent/a1-repo_scaffold
Source: Original Platform
2026-05-13 15:45:12 +08:00

9695 lines
269 KiB
JSON

{
"best_global_step": null,
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 7.0,
"eval_steps": 500,
"global_step": 4389,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.007974481658692184,
"grad_norm": 22.539601593654673,
"learning_rate": 3.644646924829157e-07,
"loss": 0.7236,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.7600098848342896,
"step": 5,
"valid_targets_mean": 4851.9,
"valid_targets_min": 237
},
{
"epoch": 0.01594896331738437,
"grad_norm": 23.275682007480874,
"learning_rate": 8.200455580865605e-07,
"loss": 0.7422,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.7550889253616333,
"step": 10,
"valid_targets_mean": 4153.7,
"valid_targets_min": 269
},
{
"epoch": 0.023923444976076555,
"grad_norm": 21.554468206830432,
"learning_rate": 1.2756264236902052e-06,
"loss": 0.7207,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.7336411476135254,
"step": 15,
"valid_targets_mean": 5106.7,
"valid_targets_min": 266
},
{
"epoch": 0.03189792663476874,
"grad_norm": 17.34512536090768,
"learning_rate": 1.7312072892938498e-06,
"loss": 0.6838,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.7120847702026367,
"step": 20,
"valid_targets_mean": 4411.2,
"valid_targets_min": 235
},
{
"epoch": 0.03987240829346093,
"grad_norm": 9.588441353519025,
"learning_rate": 2.1867881548974945e-06,
"loss": 0.6246,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6012063026428223,
"step": 25,
"valid_targets_mean": 4489.4,
"valid_targets_min": 200
},
{
"epoch": 0.04784688995215311,
"grad_norm": 4.870389531616145,
"learning_rate": 2.642369020501139e-06,
"loss": 0.5402,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4939027726650238,
"step": 30,
"valid_targets_mean": 5847.0,
"valid_targets_min": 315
},
{
"epoch": 0.05582137161084529,
"grad_norm": 2.7658562996335365,
"learning_rate": 3.0979498861047843e-06,
"loss": 0.5073,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4871441423892975,
"step": 35,
"valid_targets_mean": 5392.2,
"valid_targets_min": 495
},
{
"epoch": 0.06379585326953748,
"grad_norm": 1.6108362387448016,
"learning_rate": 3.5535307517084285e-06,
"loss": 0.4935,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.47061264514923096,
"step": 40,
"valid_targets_mean": 5388.4,
"valid_targets_min": 208
},
{
"epoch": 0.07177033492822966,
"grad_norm": 1.3386250154648769,
"learning_rate": 4.009111617312073e-06,
"loss": 0.4709,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4864431619644165,
"step": 45,
"valid_targets_mean": 4927.4,
"valid_targets_min": 817
},
{
"epoch": 0.07974481658692185,
"grad_norm": 0.9037410217035577,
"learning_rate": 4.464692482915718e-06,
"loss": 0.436,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37901973724365234,
"step": 50,
"valid_targets_mean": 5363.9,
"valid_targets_min": 344
},
{
"epoch": 0.08771929824561403,
"grad_norm": 0.8962668028470888,
"learning_rate": 4.920273348519363e-06,
"loss": 0.4353,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.42550718784332275,
"step": 55,
"valid_targets_mean": 4650.9,
"valid_targets_min": 214
},
{
"epoch": 0.09569377990430622,
"grad_norm": 0.7175155926848071,
"learning_rate": 5.375854214123008e-06,
"loss": 0.3996,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.379960298538208,
"step": 60,
"valid_targets_mean": 5349.0,
"valid_targets_min": 1052
},
{
"epoch": 0.10366826156299841,
"grad_norm": 0.6623643426461047,
"learning_rate": 5.831435079726651e-06,
"loss": 0.4053,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.43091630935668945,
"step": 65,
"valid_targets_mean": 5121.9,
"valid_targets_min": 207
},
{
"epoch": 0.11164274322169059,
"grad_norm": 0.6754894343009573,
"learning_rate": 6.287015945330297e-06,
"loss": 0.3789,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.43398618698120117,
"step": 70,
"valid_targets_mean": 4971.6,
"valid_targets_min": 290
},
{
"epoch": 0.11961722488038277,
"grad_norm": 0.5515059112771347,
"learning_rate": 6.742596810933942e-06,
"loss": 0.377,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36535507440567017,
"step": 75,
"valid_targets_mean": 5889.2,
"valid_targets_min": 237
},
{
"epoch": 0.12759170653907495,
"grad_norm": 0.5773732873387002,
"learning_rate": 7.1981776765375854e-06,
"loss": 0.3822,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3957010507583618,
"step": 80,
"valid_targets_mean": 5604.6,
"valid_targets_min": 1493
},
{
"epoch": 0.13556618819776714,
"grad_norm": 0.551936709789771,
"learning_rate": 7.65375854214123e-06,
"loss": 0.367,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3580014705657959,
"step": 85,
"valid_targets_mean": 5206.6,
"valid_targets_min": 239
},
{
"epoch": 0.14354066985645933,
"grad_norm": 0.5490810118496819,
"learning_rate": 8.109339407744875e-06,
"loss": 0.3317,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33477139472961426,
"step": 90,
"valid_targets_mean": 5279.1,
"valid_targets_min": 366
},
{
"epoch": 0.15151515151515152,
"grad_norm": 0.5212462100646008,
"learning_rate": 8.564920273348521e-06,
"loss": 0.3344,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3179510235786438,
"step": 95,
"valid_targets_mean": 5520.1,
"valid_targets_min": 551
},
{
"epoch": 0.1594896331738437,
"grad_norm": 0.5483602561286001,
"learning_rate": 9.020501138952164e-06,
"loss": 0.3226,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3079075217247009,
"step": 100,
"valid_targets_mean": 4469.1,
"valid_targets_min": 247
},
{
"epoch": 0.1674641148325359,
"grad_norm": 0.5163840976300561,
"learning_rate": 9.47608200455581e-06,
"loss": 0.3105,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2911684513092041,
"step": 105,
"valid_targets_mean": 4836.1,
"valid_targets_min": 245
},
{
"epoch": 0.17543859649122806,
"grad_norm": 0.49241293958882054,
"learning_rate": 9.931662870159453e-06,
"loss": 0.3284,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32421791553497314,
"step": 110,
"valid_targets_mean": 4989.3,
"valid_targets_min": 259
},
{
"epoch": 0.18341307814992025,
"grad_norm": 0.6731661811960075,
"learning_rate": 1.03872437357631e-05,
"loss": 0.3137,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3411160111427307,
"step": 115,
"valid_targets_mean": 3303.2,
"valid_targets_min": 220
},
{
"epoch": 0.19138755980861244,
"grad_norm": 0.6093925029848669,
"learning_rate": 1.0842824601366744e-05,
"loss": 0.3187,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30621105432510376,
"step": 120,
"valid_targets_mean": 5066.4,
"valid_targets_min": 269
},
{
"epoch": 0.19936204146730463,
"grad_norm": 0.5593908924009113,
"learning_rate": 1.1298405466970387e-05,
"loss": 0.3142,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3183234632015228,
"step": 125,
"valid_targets_mean": 6049.1,
"valid_targets_min": 346
},
{
"epoch": 0.20733652312599682,
"grad_norm": 0.6050357561923428,
"learning_rate": 1.1753986332574032e-05,
"loss": 0.3054,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3018328547477722,
"step": 130,
"valid_targets_mean": 4385.7,
"valid_targets_min": 241
},
{
"epoch": 0.215311004784689,
"grad_norm": 0.49058884266137975,
"learning_rate": 1.2209567198177677e-05,
"loss": 0.2968,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29568153619766235,
"step": 135,
"valid_targets_mean": 5280.4,
"valid_targets_min": 260
},
{
"epoch": 0.22328548644338117,
"grad_norm": 0.4997292646119957,
"learning_rate": 1.2665148063781323e-05,
"loss": 0.3086,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3315421938896179,
"step": 140,
"valid_targets_mean": 6060.2,
"valid_targets_min": 237
},
{
"epoch": 0.23125996810207336,
"grad_norm": 0.5787387582389717,
"learning_rate": 1.3120728929384968e-05,
"loss": 0.3011,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29679274559020996,
"step": 145,
"valid_targets_mean": 3525.4,
"valid_targets_min": 226
},
{
"epoch": 0.23923444976076555,
"grad_norm": 0.5372974158957257,
"learning_rate": 1.357630979498861e-05,
"loss": 0.3089,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28743451833724976,
"step": 150,
"valid_targets_mean": 4102.1,
"valid_targets_min": 224
},
{
"epoch": 0.24720893141945774,
"grad_norm": 0.4870503108003043,
"learning_rate": 1.4031890660592255e-05,
"loss": 0.2994,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2642919421195984,
"step": 155,
"valid_targets_mean": 5220.6,
"valid_targets_min": 253
},
{
"epoch": 0.2551834130781499,
"grad_norm": 0.5266528254525839,
"learning_rate": 1.4487471526195902e-05,
"loss": 0.2805,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28630515933036804,
"step": 160,
"valid_targets_mean": 5168.8,
"valid_targets_min": 255
},
{
"epoch": 0.2631578947368421,
"grad_norm": 0.5363668887252679,
"learning_rate": 1.4943052391799546e-05,
"loss": 0.281,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2562587559223175,
"step": 165,
"valid_targets_mean": 4222.8,
"valid_targets_min": 229
},
{
"epoch": 0.2711323763955343,
"grad_norm": 0.5652284763255125,
"learning_rate": 1.539863325740319e-05,
"loss": 0.2808,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27037516236305237,
"step": 170,
"valid_targets_mean": 4190.6,
"valid_targets_min": 206
},
{
"epoch": 0.27910685805422647,
"grad_norm": 0.5317822792661527,
"learning_rate": 1.5854214123006836e-05,
"loss": 0.2886,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2907927334308624,
"step": 175,
"valid_targets_mean": 5068.0,
"valid_targets_min": 161
},
{
"epoch": 0.28708133971291866,
"grad_norm": 0.5849656228564338,
"learning_rate": 1.630979498861048e-05,
"loss": 0.2857,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30426454544067383,
"step": 180,
"valid_targets_mean": 4185.5,
"valid_targets_min": 437
},
{
"epoch": 0.29505582137161085,
"grad_norm": 0.43284955804317315,
"learning_rate": 1.6765375854214125e-05,
"loss": 0.2777,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2738342881202698,
"step": 185,
"valid_targets_mean": 6524.4,
"valid_targets_min": 245
},
{
"epoch": 0.30303030303030304,
"grad_norm": 0.5173143108613342,
"learning_rate": 1.722095671981777e-05,
"loss": 0.2886,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29575982689857483,
"step": 190,
"valid_targets_mean": 4829.8,
"valid_targets_min": 238
},
{
"epoch": 0.31100478468899523,
"grad_norm": 0.4761442663752431,
"learning_rate": 1.7676537585421415e-05,
"loss": 0.2853,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29583317041397095,
"step": 195,
"valid_targets_mean": 5772.1,
"valid_targets_min": 1205
},
{
"epoch": 0.3189792663476874,
"grad_norm": 0.5018234043143022,
"learning_rate": 1.813211845102506e-05,
"loss": 0.2836,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31572768092155457,
"step": 200,
"valid_targets_mean": 5848.1,
"valid_targets_min": 763
},
{
"epoch": 0.3269537480063796,
"grad_norm": 0.5455291918243139,
"learning_rate": 1.8587699316628704e-05,
"loss": 0.275,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2614780366420746,
"step": 205,
"valid_targets_mean": 4031.1,
"valid_targets_min": 234
},
{
"epoch": 0.3349282296650718,
"grad_norm": 0.5022211222995883,
"learning_rate": 1.904328018223235e-05,
"loss": 0.2829,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27170923352241516,
"step": 210,
"valid_targets_mean": 5658.9,
"valid_targets_min": 683
},
{
"epoch": 0.34290271132376393,
"grad_norm": 0.5363369685681201,
"learning_rate": 1.9498861047835993e-05,
"loss": 0.2654,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27169087529182434,
"step": 215,
"valid_targets_mean": 5476.3,
"valid_targets_min": 3242
},
{
"epoch": 0.3508771929824561,
"grad_norm": 0.5138610867517525,
"learning_rate": 1.9954441913439638e-05,
"loss": 0.2785,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24844178557395935,
"step": 220,
"valid_targets_mean": 4867.3,
"valid_targets_min": 222
},
{
"epoch": 0.3588516746411483,
"grad_norm": 0.45211684676685016,
"learning_rate": 2.0410022779043283e-05,
"loss": 0.2635,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25427666306495667,
"step": 225,
"valid_targets_mean": 6399.5,
"valid_targets_min": 1011
},
{
"epoch": 0.3668261562998405,
"grad_norm": 0.5281985035133087,
"learning_rate": 2.0865603644646927e-05,
"loss": 0.2784,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26478126645088196,
"step": 230,
"valid_targets_mean": 4467.6,
"valid_targets_min": 234
},
{
"epoch": 0.3748006379585327,
"grad_norm": 0.49350328076325595,
"learning_rate": 2.1321184510250572e-05,
"loss": 0.2785,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2781916856765747,
"step": 235,
"valid_targets_mean": 5363.7,
"valid_targets_min": 308
},
{
"epoch": 0.3827751196172249,
"grad_norm": 0.5171735546449495,
"learning_rate": 2.1776765375854217e-05,
"loss": 0.2594,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2462097555398941,
"step": 240,
"valid_targets_mean": 4708.7,
"valid_targets_min": 283
},
{
"epoch": 0.39074960127591707,
"grad_norm": 0.5406966523586195,
"learning_rate": 2.223234624145786e-05,
"loss": 0.2584,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27877381443977356,
"step": 245,
"valid_targets_mean": 4887.6,
"valid_targets_min": 309
},
{
"epoch": 0.39872408293460926,
"grad_norm": 0.6896080417250773,
"learning_rate": 2.2687927107061506e-05,
"loss": 0.2626,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2548321783542633,
"step": 250,
"valid_targets_mean": 5287.0,
"valid_targets_min": 239
},
{
"epoch": 0.40669856459330145,
"grad_norm": 0.5173014170367707,
"learning_rate": 2.314350797266515e-05,
"loss": 0.2683,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25407731533050537,
"step": 255,
"valid_targets_mean": 5538.5,
"valid_targets_min": 224
},
{
"epoch": 0.41467304625199364,
"grad_norm": 0.5161188756710522,
"learning_rate": 2.3599088838268792e-05,
"loss": 0.2675,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23988167941570282,
"step": 260,
"valid_targets_mean": 4940.8,
"valid_targets_min": 271
},
{
"epoch": 0.4226475279106858,
"grad_norm": 0.6956583936758113,
"learning_rate": 2.4054669703872436e-05,
"loss": 0.25,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24012714624404907,
"step": 265,
"valid_targets_mean": 3144.9,
"valid_targets_min": 248
},
{
"epoch": 0.430622009569378,
"grad_norm": 0.7718804998493908,
"learning_rate": 2.4510250569476085e-05,
"loss": 0.2637,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2716878056526184,
"step": 270,
"valid_targets_mean": 5462.4,
"valid_targets_min": 3412
},
{
"epoch": 0.43859649122807015,
"grad_norm": 0.5600994786468025,
"learning_rate": 2.496583143507973e-05,
"loss": 0.2562,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2530458867549896,
"step": 275,
"valid_targets_mean": 4378.4,
"valid_targets_min": 235
},
{
"epoch": 0.44657097288676234,
"grad_norm": 0.5749427915716706,
"learning_rate": 2.5421412300683374e-05,
"loss": 0.251,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26579219102859497,
"step": 280,
"valid_targets_mean": 4329.8,
"valid_targets_min": 243
},
{
"epoch": 0.45454545454545453,
"grad_norm": 0.5715496983969146,
"learning_rate": 2.587699316628702e-05,
"loss": 0.2645,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2740967571735382,
"step": 285,
"valid_targets_mean": 4174.0,
"valid_targets_min": 466
},
{
"epoch": 0.4625199362041467,
"grad_norm": 0.5046434387262629,
"learning_rate": 2.6332574031890663e-05,
"loss": 0.2637,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2572627663612366,
"step": 290,
"valid_targets_mean": 5345.4,
"valid_targets_min": 285
},
{
"epoch": 0.4704944178628389,
"grad_norm": 0.4924149138472084,
"learning_rate": 2.6788154897494308e-05,
"loss": 0.265,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25392043590545654,
"step": 295,
"valid_targets_mean": 4933.1,
"valid_targets_min": 209
},
{
"epoch": 0.4784688995215311,
"grad_norm": 0.6346007282511187,
"learning_rate": 2.7243735763097953e-05,
"loss": 0.2578,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26829683780670166,
"step": 300,
"valid_targets_mean": 4915.8,
"valid_targets_min": 628
},
{
"epoch": 0.4864433811802233,
"grad_norm": 0.5963249286669925,
"learning_rate": 2.7699316628701597e-05,
"loss": 0.2702,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2773645520210266,
"step": 305,
"valid_targets_mean": 4269.3,
"valid_targets_min": 188
},
{
"epoch": 0.4944178628389155,
"grad_norm": 0.4926305295857678,
"learning_rate": 2.815489749430524e-05,
"loss": 0.2518,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2462100088596344,
"step": 310,
"valid_targets_mean": 5357.4,
"valid_targets_min": 447
},
{
"epoch": 0.5023923444976076,
"grad_norm": 0.6162803917326616,
"learning_rate": 2.8610478359908883e-05,
"loss": 0.2793,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2961190640926361,
"step": 315,
"valid_targets_mean": 4947.2,
"valid_targets_min": 353
},
{
"epoch": 0.5103668261562998,
"grad_norm": 0.4585210580601163,
"learning_rate": 2.906605922551253e-05,
"loss": 0.2474,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2386709600687027,
"step": 320,
"valid_targets_mean": 6055.6,
"valid_targets_min": 901
},
{
"epoch": 0.518341307814992,
"grad_norm": 0.47805452614285815,
"learning_rate": 2.9521640091116176e-05,
"loss": 0.2436,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2311428189277649,
"step": 325,
"valid_targets_mean": 5337.5,
"valid_targets_min": 550
},
{
"epoch": 0.5263157894736842,
"grad_norm": 0.567045162516125,
"learning_rate": 2.997722095671982e-05,
"loss": 0.2544,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24028460681438446,
"step": 330,
"valid_targets_mean": 4772.8,
"valid_targets_min": 214
},
{
"epoch": 0.5342902711323764,
"grad_norm": 0.5319903869888214,
"learning_rate": 3.0432801822323465e-05,
"loss": 0.262,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26871269941329956,
"step": 335,
"valid_targets_mean": 5710.7,
"valid_targets_min": 1852
},
{
"epoch": 0.5422647527910686,
"grad_norm": 0.5268481071254558,
"learning_rate": 3.088838268792711e-05,
"loss": 0.2539,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25552791357040405,
"step": 340,
"valid_targets_mean": 4551.9,
"valid_targets_min": 239
},
{
"epoch": 0.5502392344497608,
"grad_norm": 0.5246127684755286,
"learning_rate": 3.1343963553530755e-05,
"loss": 0.2513,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24578902125358582,
"step": 345,
"valid_targets_mean": 4407.8,
"valid_targets_min": 245
},
{
"epoch": 0.5582137161084529,
"grad_norm": 0.5463821322401736,
"learning_rate": 3.17995444191344e-05,
"loss": 0.2686,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2530014216899872,
"step": 350,
"valid_targets_mean": 5196.0,
"valid_targets_min": 258
},
{
"epoch": 0.5661881977671451,
"grad_norm": 0.5577611010208283,
"learning_rate": 3.2255125284738044e-05,
"loss": 0.2642,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2547740340232849,
"step": 355,
"valid_targets_mean": 4768.6,
"valid_targets_min": 255
},
{
"epoch": 0.5741626794258373,
"grad_norm": 0.5348299340224125,
"learning_rate": 3.271070615034169e-05,
"loss": 0.2508,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24138829112052917,
"step": 360,
"valid_targets_mean": 6000.2,
"valid_targets_min": 4248
},
{
"epoch": 0.5821371610845295,
"grad_norm": 0.5208781233506476,
"learning_rate": 3.316628701594533e-05,
"loss": 0.2476,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25419485569000244,
"step": 365,
"valid_targets_mean": 5256.7,
"valid_targets_min": 439
},
{
"epoch": 0.5901116427432217,
"grad_norm": 0.49107029316580497,
"learning_rate": 3.362186788154898e-05,
"loss": 0.2506,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2487025111913681,
"step": 370,
"valid_targets_mean": 5005.3,
"valid_targets_min": 252
},
{
"epoch": 0.5980861244019139,
"grad_norm": 0.6062940329738492,
"learning_rate": 3.407744874715262e-05,
"loss": 0.2525,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24524852633476257,
"step": 375,
"valid_targets_mean": 4933.1,
"valid_targets_min": 377
},
{
"epoch": 0.6060606060606061,
"grad_norm": 0.5256030165269368,
"learning_rate": 3.453302961275627e-05,
"loss": 0.2568,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22848409414291382,
"step": 380,
"valid_targets_mean": 4897.2,
"valid_targets_min": 337
},
{
"epoch": 0.6140350877192983,
"grad_norm": 0.7317569754705133,
"learning_rate": 3.498861047835991e-05,
"loss": 0.2546,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2637185752391815,
"step": 385,
"valid_targets_mean": 3556.1,
"valid_targets_min": 748
},
{
"epoch": 0.6220095693779905,
"grad_norm": 0.450094616900918,
"learning_rate": 3.5444191343963557e-05,
"loss": 0.2413,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2506665587425232,
"step": 390,
"valid_targets_mean": 6679.1,
"valid_targets_min": 2470
},
{
"epoch": 0.6299840510366826,
"grad_norm": 0.5519907109153948,
"learning_rate": 3.58997722095672e-05,
"loss": 0.2519,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2557337284088135,
"step": 395,
"valid_targets_mean": 4688.7,
"valid_targets_min": 276
},
{
"epoch": 0.6379585326953748,
"grad_norm": 0.4923228611797438,
"learning_rate": 3.6355353075170846e-05,
"loss": 0.2468,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2390061914920807,
"step": 400,
"valid_targets_mean": 4348.0,
"valid_targets_min": 235
},
{
"epoch": 0.645933014354067,
"grad_norm": 0.58492013354936,
"learning_rate": 3.681093394077449e-05,
"loss": 0.2499,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23605602979660034,
"step": 405,
"valid_targets_mean": 3866.8,
"valid_targets_min": 263
},
{
"epoch": 0.6539074960127592,
"grad_norm": 0.5800372174854277,
"learning_rate": 3.7266514806378135e-05,
"loss": 0.237,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2580878436565399,
"step": 410,
"valid_targets_mean": 4487.8,
"valid_targets_min": 728
},
{
"epoch": 0.6618819776714514,
"grad_norm": 0.5700368613429726,
"learning_rate": 3.772209567198178e-05,
"loss": 0.2499,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24940025806427002,
"step": 415,
"valid_targets_mean": 4252.4,
"valid_targets_min": 185
},
{
"epoch": 0.6698564593301436,
"grad_norm": 0.5691664020081905,
"learning_rate": 3.8177676537585425e-05,
"loss": 0.2427,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23814374208450317,
"step": 420,
"valid_targets_mean": 4767.3,
"valid_targets_min": 226
},
{
"epoch": 0.6778309409888357,
"grad_norm": 0.5041552220249231,
"learning_rate": 3.863325740318907e-05,
"loss": 0.2569,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26317381858825684,
"step": 425,
"valid_targets_mean": 5216.6,
"valid_targets_min": 213
},
{
"epoch": 0.6858054226475279,
"grad_norm": 0.5191567542690365,
"learning_rate": 3.9088838268792714e-05,
"loss": 0.2376,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2395055890083313,
"step": 430,
"valid_targets_mean": 4498.9,
"valid_targets_min": 606
},
{
"epoch": 0.69377990430622,
"grad_norm": 0.507951082676675,
"learning_rate": 3.954441913439636e-05,
"loss": 0.231,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23812133073806763,
"step": 435,
"valid_targets_mean": 4862.8,
"valid_targets_min": 599
},
{
"epoch": 0.7017543859649122,
"grad_norm": 0.4415015257689068,
"learning_rate": 4e-05,
"loss": 0.26,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.284793496131897,
"step": 440,
"valid_targets_mean": 7053.9,
"valid_targets_min": 726
},
{
"epoch": 0.7097288676236044,
"grad_norm": 0.4687788595713669,
"learning_rate": 3.9999841858814384e-05,
"loss": 0.2429,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22677697241306305,
"step": 445,
"valid_targets_mean": 5137.8,
"valid_targets_min": 332
},
{
"epoch": 0.7177033492822966,
"grad_norm": 0.4729761272261808,
"learning_rate": 3.999936743775839e-05,
"loss": 0.2354,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.208622008562088,
"step": 450,
"valid_targets_mean": 4527.2,
"valid_targets_min": 238
},
{
"epoch": 0.7256778309409888,
"grad_norm": 0.555015237464751,
"learning_rate": 3.9998576744334574e-05,
"loss": 0.2428,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21826383471488953,
"step": 455,
"valid_targets_mean": 4742.9,
"valid_targets_min": 302
},
{
"epoch": 0.733652312599681,
"grad_norm": 0.5310365582781416,
"learning_rate": 3.999746979104705e-05,
"loss": 0.2393,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25395524501800537,
"step": 460,
"valid_targets_mean": 5156.8,
"valid_targets_min": 237
},
{
"epoch": 0.7416267942583732,
"grad_norm": 0.4553894968924494,
"learning_rate": 3.999604659540131e-05,
"loss": 0.2519,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2229715883731842,
"step": 465,
"valid_targets_mean": 5806.7,
"valid_targets_min": 227
},
{
"epoch": 0.7496012759170654,
"grad_norm": 0.553859237915477,
"learning_rate": 3.999430717990395e-05,
"loss": 0.2467,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24489501118659973,
"step": 470,
"valid_targets_mean": 4576.5,
"valid_targets_min": 393
},
{
"epoch": 0.7575757575757576,
"grad_norm": 0.5150108769606636,
"learning_rate": 3.999225157206228e-05,
"loss": 0.2369,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23615041375160217,
"step": 475,
"valid_targets_mean": 5394.9,
"valid_targets_min": 426
},
{
"epoch": 0.7655502392344498,
"grad_norm": 0.6385286959140647,
"learning_rate": 3.998987980438393e-05,
"loss": 0.2286,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22305330634117126,
"step": 480,
"valid_targets_mean": 5164.2,
"valid_targets_min": 223
},
{
"epoch": 0.773524720893142,
"grad_norm": 0.4830051792435215,
"learning_rate": 3.9987191914376306e-05,
"loss": 0.2385,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2323000133037567,
"step": 485,
"valid_targets_mean": 4675.6,
"valid_targets_min": 242
},
{
"epoch": 0.7814992025518341,
"grad_norm": 0.5028756759202847,
"learning_rate": 3.998418794454604e-05,
"loss": 0.2311,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21495231986045837,
"step": 490,
"valid_targets_mean": 4435.6,
"valid_targets_min": 253
},
{
"epoch": 0.7894736842105263,
"grad_norm": 0.5087547658254494,
"learning_rate": 3.998086794239825e-05,
"loss": 0.2352,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23997387290000916,
"step": 495,
"valid_targets_mean": 5214.6,
"valid_targets_min": 252
},
{
"epoch": 0.7974481658692185,
"grad_norm": 0.4669380659732096,
"learning_rate": 3.997723196043585e-05,
"loss": 0.2308,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22620384395122528,
"step": 500,
"valid_targets_mean": 4997.2,
"valid_targets_min": 220
},
{
"epoch": 0.8054226475279107,
"grad_norm": 0.5551348865851036,
"learning_rate": 3.9973280056158695e-05,
"loss": 0.2466,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25103485584259033,
"step": 505,
"valid_targets_mean": 5329.7,
"valid_targets_min": 243
},
{
"epoch": 0.8133971291866029,
"grad_norm": 0.49318722832524914,
"learning_rate": 3.9969012292062655e-05,
"loss": 0.2472,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25136399269104004,
"step": 510,
"valid_targets_mean": 5802.3,
"valid_targets_min": 342
},
{
"epoch": 0.8213716108452951,
"grad_norm": 0.5198628597650791,
"learning_rate": 3.996442873563866e-05,
"loss": 0.2298,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2384355366230011,
"step": 515,
"valid_targets_mean": 5362.5,
"valid_targets_min": 256
},
{
"epoch": 0.8293460925039873,
"grad_norm": 0.5205934398395562,
"learning_rate": 3.9959529459371624e-05,
"loss": 0.2508,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2787361443042755,
"step": 520,
"valid_targets_mean": 5885.7,
"valid_targets_min": 228
},
{
"epoch": 0.8373205741626795,
"grad_norm": 0.5252409924659849,
"learning_rate": 3.9954314540739284e-05,
"loss": 0.2467,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2512431740760803,
"step": 525,
"valid_targets_mean": 5641.8,
"valid_targets_min": 1587
},
{
"epoch": 0.8452950558213717,
"grad_norm": 0.4704007226125745,
"learning_rate": 3.994878406221097e-05,
"loss": 0.2277,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23621171712875366,
"step": 530,
"valid_targets_mean": 5600.2,
"valid_targets_min": 536
},
{
"epoch": 0.8532695374800638,
"grad_norm": 0.6083127057740186,
"learning_rate": 3.994293811124632e-05,
"loss": 0.2325,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2614426612854004,
"step": 535,
"valid_targets_mean": 5253.0,
"valid_targets_min": 238
},
{
"epoch": 0.861244019138756,
"grad_norm": 0.4746686115421954,
"learning_rate": 3.993677678029392e-05,
"loss": 0.2363,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24418990314006805,
"step": 540,
"valid_targets_mean": 5040.0,
"valid_targets_min": 1001
},
{
"epoch": 0.8692185007974481,
"grad_norm": 0.49549218402068856,
"learning_rate": 3.9930300166789765e-05,
"loss": 0.2377,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25148677825927734,
"step": 545,
"valid_targets_mean": 5570.9,
"valid_targets_min": 319
},
{
"epoch": 0.8771929824561403,
"grad_norm": 0.5269114935537167,
"learning_rate": 3.992350837315581e-05,
"loss": 0.2454,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2529415786266327,
"step": 550,
"valid_targets_mean": 4481.4,
"valid_targets_min": 418
},
{
"epoch": 0.8851674641148325,
"grad_norm": 0.4966140006866359,
"learning_rate": 3.991640150679826e-05,
"loss": 0.2427,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23965132236480713,
"step": 555,
"valid_targets_mean": 4778.5,
"valid_targets_min": 193
},
{
"epoch": 0.8931419457735247,
"grad_norm": 0.46356963034858145,
"learning_rate": 3.990897968010596e-05,
"loss": 0.2335,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22081106901168823,
"step": 560,
"valid_targets_mean": 4536.8,
"valid_targets_min": 318
},
{
"epoch": 0.9011164274322169,
"grad_norm": 0.5158811337778442,
"learning_rate": 3.990124301044855e-05,
"loss": 0.2425,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25084495544433594,
"step": 565,
"valid_targets_mean": 5180.1,
"valid_targets_min": 262
},
{
"epoch": 0.9090909090909091,
"grad_norm": 0.4577837821562966,
"learning_rate": 3.989319162017465e-05,
"loss": 0.2462,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23798081278800964,
"step": 570,
"valid_targets_mean": 5647.1,
"valid_targets_min": 292
},
{
"epoch": 0.9170653907496013,
"grad_norm": 0.44187500790924766,
"learning_rate": 3.988482563660989e-05,
"loss": 0.2329,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23343367874622345,
"step": 575,
"valid_targets_mean": 5496.6,
"valid_targets_min": 179
},
{
"epoch": 0.9250398724082934,
"grad_norm": 0.5270106574297865,
"learning_rate": 3.987614519205493e-05,
"loss": 0.2376,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23939090967178345,
"step": 580,
"valid_targets_mean": 5919.2,
"valid_targets_min": 1221
},
{
"epoch": 0.9330143540669856,
"grad_norm": 0.463729984008716,
"learning_rate": 3.986715042378334e-05,
"loss": 0.223,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22995294630527496,
"step": 585,
"valid_targets_mean": 5917.2,
"valid_targets_min": 852
},
{
"epoch": 0.9409888357256778,
"grad_norm": 0.47283664295456057,
"learning_rate": 3.985784147403947e-05,
"loss": 0.2434,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2240312099456787,
"step": 590,
"valid_targets_mean": 5174.1,
"valid_targets_min": 536
},
{
"epoch": 0.94896331738437,
"grad_norm": 0.5658848917368027,
"learning_rate": 3.9848218490036144e-05,
"loss": 0.2318,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.232914000749588,
"step": 595,
"valid_targets_mean": 5265.4,
"valid_targets_min": 732
},
{
"epoch": 0.9569377990430622,
"grad_norm": 0.4239055430774934,
"learning_rate": 3.983828162395238e-05,
"loss": 0.2299,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20710644125938416,
"step": 600,
"valid_targets_mean": 6367.3,
"valid_targets_min": 1579
},
{
"epoch": 0.9649122807017544,
"grad_norm": 0.44068282934869724,
"learning_rate": 3.9828031032930944e-05,
"loss": 0.2381,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23547522723674774,
"step": 605,
"valid_targets_mean": 5768.8,
"valid_targets_min": 342
},
{
"epoch": 0.9728867623604466,
"grad_norm": 0.4301339156888651,
"learning_rate": 3.98174668790759e-05,
"loss": 0.2346,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22576510906219482,
"step": 610,
"valid_targets_mean": 5758.6,
"valid_targets_min": 250
},
{
"epoch": 0.9808612440191388,
"grad_norm": 0.4083465304334347,
"learning_rate": 3.9806589329450045e-05,
"loss": 0.2266,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21958738565444946,
"step": 615,
"valid_targets_mean": 6139.3,
"valid_targets_min": 258
},
{
"epoch": 0.988835725677831,
"grad_norm": 0.5589998597597372,
"learning_rate": 3.979539855607222e-05,
"loss": 0.2419,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2316368967294693,
"step": 620,
"valid_targets_mean": 4443.0,
"valid_targets_min": 293
},
{
"epoch": 0.9968102073365231,
"grad_norm": 0.49386174717125697,
"learning_rate": 3.9783894735914646e-05,
"loss": 0.2376,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23019137978553772,
"step": 625,
"valid_targets_mean": 5904.1,
"valid_targets_min": 407
},
{
"epoch": 1.0047846889952152,
"grad_norm": 0.44385071840879137,
"learning_rate": 3.9772078050900105e-05,
"loss": 0.2167,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19644610583782196,
"step": 630,
"valid_targets_mean": 5611.9,
"valid_targets_min": 342
},
{
"epoch": 1.0127591706539074,
"grad_norm": 0.48156890413963743,
"learning_rate": 3.9759948687899055e-05,
"loss": 0.2338,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2283916473388672,
"step": 635,
"valid_targets_mean": 4642.0,
"valid_targets_min": 226
},
{
"epoch": 1.0207336523125996,
"grad_norm": 0.5551974573135551,
"learning_rate": 3.974750683872667e-05,
"loss": 0.2355,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2257927656173706,
"step": 640,
"valid_targets_mean": 4712.1,
"valid_targets_min": 253
},
{
"epoch": 1.0287081339712918,
"grad_norm": 0.5112679546587456,
"learning_rate": 3.973475270013984e-05,
"loss": 0.2084,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2036946564912796,
"step": 645,
"valid_targets_mean": 3350.3,
"valid_targets_min": 220
},
{
"epoch": 1.036682615629984,
"grad_norm": 0.5657504932352997,
"learning_rate": 3.972168647383402e-05,
"loss": 0.2221,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2104548066854477,
"step": 650,
"valid_targets_mean": 5710.1,
"valid_targets_min": 975
},
{
"epoch": 1.0446570972886762,
"grad_norm": 0.498819802151185,
"learning_rate": 3.970830836644006e-05,
"loss": 0.2293,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2443195879459381,
"step": 655,
"valid_targets_mean": 4341.6,
"valid_targets_min": 237
},
{
"epoch": 1.0526315789473684,
"grad_norm": 0.4777708787250058,
"learning_rate": 3.9694618589520945e-05,
"loss": 0.2214,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21855522692203522,
"step": 660,
"valid_targets_mean": 6137.1,
"valid_targets_min": 3874
},
{
"epoch": 1.0606060606060606,
"grad_norm": 0.42516424950849196,
"learning_rate": 3.9680617359568414e-05,
"loss": 0.2276,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22529324889183044,
"step": 665,
"valid_targets_mean": 5659.9,
"valid_targets_min": 265
},
{
"epoch": 1.0685805422647527,
"grad_norm": 0.43957454727525247,
"learning_rate": 3.966630489799959e-05,
"loss": 0.2146,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20638194680213928,
"step": 670,
"valid_targets_mean": 5418.2,
"valid_targets_min": 605
},
{
"epoch": 1.076555023923445,
"grad_norm": 0.480992229013917,
"learning_rate": 3.9651681431153445e-05,
"loss": 0.2214,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21741151809692383,
"step": 675,
"valid_targets_mean": 5676.9,
"valid_targets_min": 653
},
{
"epoch": 1.0845295055821371,
"grad_norm": 0.5286831646993043,
"learning_rate": 3.96367471902872e-05,
"loss": 0.2179,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22559064626693726,
"step": 680,
"valid_targets_mean": 4749.8,
"valid_targets_min": 1138
},
{
"epoch": 1.0925039872408293,
"grad_norm": 0.48401700631042965,
"learning_rate": 3.9621502411572705e-05,
"loss": 0.2281,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21404454112052917,
"step": 685,
"valid_targets_mean": 5151.9,
"valid_targets_min": 492
},
{
"epoch": 1.1004784688995215,
"grad_norm": 0.49933746338574914,
"learning_rate": 3.960594733609273e-05,
"loss": 0.2256,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24951139092445374,
"step": 690,
"valid_targets_mean": 5677.1,
"valid_targets_min": 414
},
{
"epoch": 1.1084529505582137,
"grad_norm": 0.5374555564691006,
"learning_rate": 3.9590082209837054e-05,
"loss": 0.2358,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23958654701709747,
"step": 695,
"valid_targets_mean": 4576.1,
"valid_targets_min": 250
},
{
"epoch": 1.1164274322169059,
"grad_norm": 0.43156726192991535,
"learning_rate": 3.957390728369867e-05,
"loss": 0.2239,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22211644053459167,
"step": 700,
"valid_targets_mean": 5652.7,
"valid_targets_min": 240
},
{
"epoch": 1.124401913875598,
"grad_norm": 0.5290650459685178,
"learning_rate": 3.955742281346979e-05,
"loss": 0.2223,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24193495512008667,
"step": 705,
"valid_targets_mean": 4738.0,
"valid_targets_min": 1201
},
{
"epoch": 1.1323763955342903,
"grad_norm": 0.4590727414985068,
"learning_rate": 3.9540629059837767e-05,
"loss": 0.2187,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20210333168506622,
"step": 710,
"valid_targets_mean": 5049.0,
"valid_targets_min": 386
},
{
"epoch": 1.1403508771929824,
"grad_norm": 0.5441856418870333,
"learning_rate": 3.952352628838102e-05,
"loss": 0.2215,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20969565212726593,
"step": 715,
"valid_targets_mean": 4226.9,
"valid_targets_min": 249
},
{
"epoch": 1.1483253588516746,
"grad_norm": 0.5380939962565157,
"learning_rate": 3.95061147695648e-05,
"loss": 0.2278,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.240693137049675,
"step": 720,
"valid_targets_mean": 4818.9,
"valid_targets_min": 549
},
{
"epoch": 1.1562998405103668,
"grad_norm": 0.5686689166363135,
"learning_rate": 3.9488394778736935e-05,
"loss": 0.2306,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24537625908851624,
"step": 725,
"valid_targets_mean": 3922.4,
"valid_targets_min": 129
},
{
"epoch": 1.164274322169059,
"grad_norm": 0.4593411130317016,
"learning_rate": 3.947036659612345e-05,
"loss": 0.2152,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20501753687858582,
"step": 730,
"valid_targets_mean": 4789.3,
"valid_targets_min": 242
},
{
"epoch": 1.1722488038277512,
"grad_norm": 0.5929679220372989,
"learning_rate": 3.945203050682418e-05,
"loss": 0.2225,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2176203429698944,
"step": 735,
"valid_targets_mean": 5827.9,
"valid_targets_min": 1421
},
{
"epoch": 1.1802232854864434,
"grad_norm": 0.49571444514839247,
"learning_rate": 3.94333868008082e-05,
"loss": 0.2285,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22823849320411682,
"step": 740,
"valid_targets_mean": 4559.8,
"valid_targets_min": 955
},
{
"epoch": 1.1881977671451356,
"grad_norm": 0.47051475648971036,
"learning_rate": 3.94144357729093e-05,
"loss": 0.2413,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21944183111190796,
"step": 745,
"valid_targets_mean": 5556.9,
"valid_targets_min": 241
},
{
"epoch": 1.1961722488038278,
"grad_norm": 0.4545193137066266,
"learning_rate": 3.939517772282127e-05,
"loss": 0.226,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2306528091430664,
"step": 750,
"valid_targets_mean": 5773.1,
"valid_targets_min": 339
},
{
"epoch": 1.20414673046252,
"grad_norm": 0.5070293389053494,
"learning_rate": 3.93756129550932e-05,
"loss": 0.22,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2366933524608612,
"step": 755,
"valid_targets_mean": 4809.0,
"valid_targets_min": 225
},
{
"epoch": 1.2121212121212122,
"grad_norm": 0.4581327620567569,
"learning_rate": 3.935574177912465e-05,
"loss": 0.2217,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23561245203018188,
"step": 760,
"valid_targets_mean": 5730.1,
"valid_targets_min": 431
},
{
"epoch": 1.2200956937799043,
"grad_norm": 0.44689390466942713,
"learning_rate": 3.9335564509160746e-05,
"loss": 0.2294,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25527051091194153,
"step": 765,
"valid_targets_mean": 5937.5,
"valid_targets_min": 308
},
{
"epoch": 1.2280701754385965,
"grad_norm": 0.5105030340361397,
"learning_rate": 3.931508146428724e-05,
"loss": 0.2228,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21357367932796478,
"step": 770,
"valid_targets_mean": 4240.1,
"valid_targets_min": 238
},
{
"epoch": 1.2360446570972887,
"grad_norm": 0.4285106295808272,
"learning_rate": 3.929429296842542e-05,
"loss": 0.2216,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22223004698753357,
"step": 775,
"valid_targets_mean": 5140.4,
"valid_targets_min": 207
},
{
"epoch": 1.244019138755981,
"grad_norm": 0.5033088319271173,
"learning_rate": 3.927319935032703e-05,
"loss": 0.2244,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2382790595293045,
"step": 780,
"valid_targets_mean": 4656.1,
"valid_targets_min": 190
},
{
"epoch": 1.251993620414673,
"grad_norm": 0.4832920433952073,
"learning_rate": 3.925180094356905e-05,
"loss": 0.2183,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22841961681842804,
"step": 785,
"valid_targets_mean": 4821.2,
"valid_targets_min": 332
},
{
"epoch": 1.2599681020733653,
"grad_norm": 0.5541953861894534,
"learning_rate": 3.9230098086548414e-05,
"loss": 0.2138,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22924378514289856,
"step": 790,
"valid_targets_mean": 5035.1,
"valid_targets_min": 387
},
{
"epoch": 1.2679425837320575,
"grad_norm": 0.45492743605486735,
"learning_rate": 3.920809112247668e-05,
"loss": 0.2249,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2217010259628296,
"step": 795,
"valid_targets_mean": 5301.2,
"valid_targets_min": 280
},
{
"epoch": 1.2759170653907497,
"grad_norm": 0.4050403811606527,
"learning_rate": 3.918578039937459e-05,
"loss": 0.2214,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20149385929107666,
"step": 800,
"valid_targets_mean": 6168.7,
"valid_targets_min": 3585
},
{
"epoch": 1.2838915470494419,
"grad_norm": 0.49884758775784616,
"learning_rate": 3.916316627006656e-05,
"loss": 0.218,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22389544546604156,
"step": 805,
"valid_targets_mean": 4229.8,
"valid_targets_min": 205
},
{
"epoch": 1.291866028708134,
"grad_norm": 0.5437724639192097,
"learning_rate": 3.914024909217511e-05,
"loss": 0.2186,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21842722594738007,
"step": 810,
"valid_targets_mean": 5059.4,
"valid_targets_min": 261
},
{
"epoch": 1.2998405103668262,
"grad_norm": 0.4614914901673496,
"learning_rate": 3.911702922811522e-05,
"loss": 0.2129,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22969508171081543,
"step": 815,
"valid_targets_mean": 5216.5,
"valid_targets_min": 944
},
{
"epoch": 1.3078149920255182,
"grad_norm": 0.41670448262684845,
"learning_rate": 3.909350704508856e-05,
"loss": 0.2196,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21079647541046143,
"step": 820,
"valid_targets_mean": 5512.1,
"valid_targets_min": 985
},
{
"epoch": 1.3157894736842106,
"grad_norm": 0.4532640251959151,
"learning_rate": 3.906968291507773e-05,
"loss": 0.21,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2069890946149826,
"step": 825,
"valid_targets_mean": 4720.1,
"valid_targets_min": 223
},
{
"epoch": 1.3237639553429026,
"grad_norm": 0.5068128448354305,
"learning_rate": 3.904555721484034e-05,
"loss": 0.2205,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22296027839183807,
"step": 830,
"valid_targets_mean": 4510.1,
"valid_targets_min": 213
},
{
"epoch": 1.331738437001595,
"grad_norm": 0.44758555237161834,
"learning_rate": 3.9021130325903076e-05,
"loss": 0.2124,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22679689526557922,
"step": 835,
"valid_targets_mean": 4813.0,
"valid_targets_min": 491
},
{
"epoch": 1.339712918660287,
"grad_norm": 0.4343562516139951,
"learning_rate": 3.899640263455566e-05,
"loss": 0.2251,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20167089998722076,
"step": 840,
"valid_targets_mean": 5034.6,
"valid_targets_min": 250
},
{
"epoch": 1.3476874003189794,
"grad_norm": 0.4572454435644633,
"learning_rate": 3.897137453184472e-05,
"loss": 0.2187,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20767706632614136,
"step": 845,
"valid_targets_mean": 5134.5,
"valid_targets_min": 278
},
{
"epoch": 1.3556618819776713,
"grad_norm": 0.5014219811560465,
"learning_rate": 3.894604641356767e-05,
"loss": 0.2398,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20389358699321747,
"step": 850,
"valid_targets_mean": 3887.2,
"valid_targets_min": 210
},
{
"epoch": 1.3636363636363638,
"grad_norm": 0.48510005391738675,
"learning_rate": 3.8920418680266346e-05,
"loss": 0.2184,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22810472548007965,
"step": 855,
"valid_targets_mean": 5032.4,
"valid_targets_min": 391
},
{
"epoch": 1.3716108452950557,
"grad_norm": 0.5183414139626299,
"learning_rate": 3.889449173722077e-05,
"loss": 0.2163,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2274407297372818,
"step": 860,
"valid_targets_mean": 4475.8,
"valid_targets_min": 272
},
{
"epoch": 1.3795853269537481,
"grad_norm": 0.5158129823910096,
"learning_rate": 3.8868265994442694e-05,
"loss": 0.2221,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2289605587720871,
"step": 865,
"valid_targets_mean": 4482.9,
"valid_targets_min": 298
},
{
"epoch": 1.38755980861244,
"grad_norm": 0.46178793662898315,
"learning_rate": 3.8841741866669126e-05,
"loss": 0.2158,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20329372584819794,
"step": 870,
"valid_targets_mean": 4624.8,
"valid_targets_min": 201
},
{
"epoch": 1.3955342902711323,
"grad_norm": 0.43110143764599795,
"learning_rate": 3.881491977335577e-05,
"loss": 0.2145,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2101316750049591,
"step": 875,
"valid_targets_mean": 5321.4,
"valid_targets_min": 213
},
{
"epoch": 1.4035087719298245,
"grad_norm": 0.503740796436895,
"learning_rate": 3.878780013867038e-05,
"loss": 0.2139,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20829784870147705,
"step": 880,
"valid_targets_mean": 4938.4,
"valid_targets_min": 208
},
{
"epoch": 1.4114832535885167,
"grad_norm": 0.46875611927410893,
"learning_rate": 3.8760383391486074e-05,
"loss": 0.2159,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2217826247215271,
"step": 885,
"valid_targets_mean": 5166.4,
"valid_targets_min": 1977
},
{
"epoch": 1.4194577352472089,
"grad_norm": 0.40715680224468764,
"learning_rate": 3.873266996537456e-05,
"loss": 0.2223,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2007824033498764,
"step": 890,
"valid_targets_mean": 6011.9,
"valid_targets_min": 1107
},
{
"epoch": 1.427432216905901,
"grad_norm": 0.4538795595368198,
"learning_rate": 3.8704660298599225e-05,
"loss": 0.2182,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19974635541439056,
"step": 895,
"valid_targets_mean": 5461.1,
"valid_targets_min": 233
},
{
"epoch": 1.4354066985645932,
"grad_norm": 0.3925116796629304,
"learning_rate": 3.867635483410827e-05,
"loss": 0.2176,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19021229445934296,
"step": 900,
"valid_targets_mean": 5960.0,
"valid_targets_min": 287
},
{
"epoch": 1.4433811802232854,
"grad_norm": 0.4526958366149273,
"learning_rate": 3.864775401952767e-05,
"loss": 0.2162,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.224770188331604,
"step": 905,
"valid_targets_mean": 4794.1,
"valid_targets_min": 385
},
{
"epoch": 1.4513556618819776,
"grad_norm": 0.47739345174396636,
"learning_rate": 3.8618858307154085e-05,
"loss": 0.2207,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21421770751476288,
"step": 910,
"valid_targets_mean": 4971.1,
"valid_targets_min": 229
},
{
"epoch": 1.4593301435406698,
"grad_norm": 0.48441435233113955,
"learning_rate": 3.8589668153947743e-05,
"loss": 0.2103,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2115284949541092,
"step": 915,
"valid_targets_mean": 4584.6,
"valid_targets_min": 613
},
{
"epoch": 1.467304625199362,
"grad_norm": 0.48463948682962943,
"learning_rate": 3.8560184021525194e-05,
"loss": 0.211,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21348783373832703,
"step": 920,
"valid_targets_mean": 4442.5,
"valid_targets_min": 192
},
{
"epoch": 1.4752791068580542,
"grad_norm": 0.4451502603868636,
"learning_rate": 3.853040637615199e-05,
"loss": 0.2228,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23046502470970154,
"step": 925,
"valid_targets_mean": 4936.4,
"valid_targets_min": 395
},
{
"epoch": 1.4832535885167464,
"grad_norm": 0.40199972450433025,
"learning_rate": 3.850033568873536e-05,
"loss": 0.2083,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19406135380268097,
"step": 930,
"valid_targets_mean": 5947.2,
"valid_targets_min": 479
},
{
"epoch": 1.4912280701754386,
"grad_norm": 0.5368761175611442,
"learning_rate": 3.8469972434816706e-05,
"loss": 0.2023,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21021592617034912,
"step": 935,
"valid_targets_mean": 4767.3,
"valid_targets_min": 243
},
{
"epoch": 1.4992025518341308,
"grad_norm": 0.3986721112323499,
"learning_rate": 3.843931709456414e-05,
"loss": 0.2082,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19780415296554565,
"step": 940,
"valid_targets_mean": 5795.1,
"valid_targets_min": 861
},
{
"epoch": 1.507177033492823,
"grad_norm": 0.4587666035993858,
"learning_rate": 3.840837015276483e-05,
"loss": 0.2194,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22320160269737244,
"step": 945,
"valid_targets_mean": 5755.1,
"valid_targets_min": 941
},
{
"epoch": 1.5151515151515151,
"grad_norm": 0.45703951269412757,
"learning_rate": 3.83771320988174e-05,
"loss": 0.2238,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22210641205310822,
"step": 950,
"valid_targets_mean": 4737.4,
"valid_targets_min": 399
},
{
"epoch": 1.5231259968102073,
"grad_norm": 0.48709993942146484,
"learning_rate": 3.834560342672413e-05,
"loss": 0.2219,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22919026017189026,
"step": 955,
"valid_targets_mean": 5368.0,
"valid_targets_min": 471
},
{
"epoch": 1.5311004784688995,
"grad_norm": 0.5327015189373576,
"learning_rate": 3.831378463508318e-05,
"loss": 0.211,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20985502004623413,
"step": 960,
"valid_targets_mean": 3672.7,
"valid_targets_min": 255
},
{
"epoch": 1.5390749601275917,
"grad_norm": 0.4889458724924527,
"learning_rate": 3.8281676227080694e-05,
"loss": 0.2207,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23470205068588257,
"step": 965,
"valid_targets_mean": 4279.4,
"valid_targets_min": 545
},
{
"epoch": 1.547049441786284,
"grad_norm": 0.4816208661066147,
"learning_rate": 3.824927871048284e-05,
"loss": 0.2105,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22319866716861725,
"step": 970,
"valid_targets_mean": 5811.1,
"valid_targets_min": 691
},
{
"epoch": 1.555023923444976,
"grad_norm": 0.49629303617677123,
"learning_rate": 3.8216592597627797e-05,
"loss": 0.2097,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20921722054481506,
"step": 975,
"valid_targets_mean": 4481.5,
"valid_targets_min": 458
},
{
"epoch": 1.5629984051036683,
"grad_norm": 0.4486748383761303,
"learning_rate": 3.818361840541761e-05,
"loss": 0.2232,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2034325897693634,
"step": 980,
"valid_targets_mean": 5753.4,
"valid_targets_min": 249
},
{
"epoch": 1.5709728867623605,
"grad_norm": 0.4704184941444946,
"learning_rate": 3.815035665531008e-05,
"loss": 0.2154,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2329174280166626,
"step": 985,
"valid_targets_mean": 5679.9,
"valid_targets_min": 794
},
{
"epoch": 1.5789473684210527,
"grad_norm": 0.7126080076891846,
"learning_rate": 3.811680787331047e-05,
"loss": 0.2114,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20356056094169617,
"step": 990,
"valid_targets_mean": 4500.5,
"valid_targets_min": 200
},
{
"epoch": 1.5869218500797448,
"grad_norm": 0.4362810483573207,
"learning_rate": 3.8082972589963175e-05,
"loss": 0.221,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25651684403419495,
"step": 995,
"valid_targets_mean": 5741.7,
"valid_targets_min": 485
},
{
"epoch": 1.594896331738437,
"grad_norm": 0.5308816657896737,
"learning_rate": 3.80488513403434e-05,
"loss": 0.2149,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22023651003837585,
"step": 1000,
"valid_targets_mean": 3424.5,
"valid_targets_min": 259
},
{
"epoch": 1.6028708133971292,
"grad_norm": 0.4510219809474634,
"learning_rate": 3.8014444664048616e-05,
"loss": 0.2197,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21104635298252106,
"step": 1005,
"valid_targets_mean": 5196.3,
"valid_targets_min": 240
},
{
"epoch": 1.6108452950558214,
"grad_norm": 0.4803455404102778,
"learning_rate": 3.797975310519009e-05,
"loss": 0.2168,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21788547933101654,
"step": 1010,
"valid_targets_mean": 4816.5,
"valid_targets_min": 274
},
{
"epoch": 1.6188197767145136,
"grad_norm": 0.47472698938848756,
"learning_rate": 3.794477721238425e-05,
"loss": 0.2243,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23355194926261902,
"step": 1015,
"valid_targets_mean": 4637.8,
"valid_targets_min": 234
},
{
"epoch": 1.6267942583732058,
"grad_norm": 0.4147989370142633,
"learning_rate": 3.7909517538744e-05,
"loss": 0.2116,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19726088643074036,
"step": 1020,
"valid_targets_mean": 5528.1,
"valid_targets_min": 713
},
{
"epoch": 1.6347687400318978,
"grad_norm": 0.43057872861456375,
"learning_rate": 3.7873974641870006e-05,
"loss": 0.2224,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23569004237651825,
"step": 1025,
"valid_targets_mean": 5202.3,
"valid_targets_min": 429
},
{
"epoch": 1.6427432216905902,
"grad_norm": 0.4944214692564835,
"learning_rate": 3.7838149083841856e-05,
"loss": 0.2137,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22196251153945923,
"step": 1030,
"valid_targets_mean": 4496.9,
"valid_targets_min": 367
},
{
"epoch": 1.6507177033492821,
"grad_norm": 0.484950405225721,
"learning_rate": 3.7802041431209166e-05,
"loss": 0.2114,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22201311588287354,
"step": 1035,
"valid_targets_mean": 5337.4,
"valid_targets_min": 276
},
{
"epoch": 1.6586921850079746,
"grad_norm": 0.46643309909033687,
"learning_rate": 3.776565225498264e-05,
"loss": 0.225,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20948752760887146,
"step": 1040,
"valid_targets_mean": 5726.2,
"valid_targets_min": 216
},
{
"epoch": 1.6666666666666665,
"grad_norm": 0.4505057278309987,
"learning_rate": 3.7728982130625025e-05,
"loss": 0.2078,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21404105424880981,
"step": 1045,
"valid_targets_mean": 5463.8,
"valid_targets_min": 624
},
{
"epoch": 1.674641148325359,
"grad_norm": 0.4632571232381542,
"learning_rate": 3.769203163804202e-05,
"loss": 0.2185,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2386375069618225,
"step": 1050,
"valid_targets_mean": 4372.1,
"valid_targets_min": 212
},
{
"epoch": 1.682615629984051,
"grad_norm": 0.5885949234294394,
"learning_rate": 3.7654801361573076e-05,
"loss": 0.2053,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2116532027721405,
"step": 1055,
"valid_targets_mean": 3293.9,
"valid_targets_min": 164
},
{
"epoch": 1.6905901116427433,
"grad_norm": 0.476396006242146,
"learning_rate": 3.761729188998222e-05,
"loss": 0.2122,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2132015824317932,
"step": 1060,
"valid_targets_mean": 4883.0,
"valid_targets_min": 234
},
{
"epoch": 1.6985645933014353,
"grad_norm": 0.4415064752469964,
"learning_rate": 3.757950381644868e-05,
"loss": 0.2159,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18930253386497498,
"step": 1065,
"valid_targets_mean": 4347.8,
"valid_targets_min": 201
},
{
"epoch": 1.7065390749601277,
"grad_norm": 0.4918318431688853,
"learning_rate": 3.7541437738557524e-05,
"loss": 0.2149,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22140301764011383,
"step": 1070,
"valid_targets_mean": 4014.4,
"valid_targets_min": 266
},
{
"epoch": 1.7145135566188197,
"grad_norm": 0.4757910103440479,
"learning_rate": 3.750309425829022e-05,
"loss": 0.2108,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22511640191078186,
"step": 1075,
"valid_targets_mean": 4329.7,
"valid_targets_min": 234
},
{
"epoch": 1.722488038277512,
"grad_norm": 0.418880480295893,
"learning_rate": 3.746447398201512e-05,
"loss": 0.209,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2123282253742218,
"step": 1080,
"valid_targets_mean": 6908.0,
"valid_targets_min": 4942
},
{
"epoch": 1.730462519936204,
"grad_norm": 0.49617766079766823,
"learning_rate": 3.7425577520477846e-05,
"loss": 0.2081,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21871669590473175,
"step": 1085,
"valid_targets_mean": 4811.3,
"valid_targets_min": 198
},
{
"epoch": 1.7384370015948964,
"grad_norm": 0.4598780604045823,
"learning_rate": 3.738640548879166e-05,
"loss": 0.2136,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20024099946022034,
"step": 1090,
"valid_targets_mean": 4600.0,
"valid_targets_min": 295
},
{
"epoch": 1.7464114832535884,
"grad_norm": 0.4184329372379239,
"learning_rate": 3.7346958506427696e-05,
"loss": 0.2174,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20633798837661743,
"step": 1095,
"valid_targets_mean": 6165.7,
"valid_targets_min": 4183
},
{
"epoch": 1.7543859649122808,
"grad_norm": 0.4797137007699827,
"learning_rate": 3.730723719720523e-05,
"loss": 0.2141,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21521145105361938,
"step": 1100,
"valid_targets_mean": 4948.5,
"valid_targets_min": 238
},
{
"epoch": 1.7623604465709728,
"grad_norm": 0.464012546044584,
"learning_rate": 3.7267242189281746e-05,
"loss": 0.213,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2169262021780014,
"step": 1105,
"valid_targets_mean": 6075.7,
"valid_targets_min": 2766
},
{
"epoch": 1.7703349282296652,
"grad_norm": 0.47591074751434326,
"learning_rate": 3.722697411514305e-05,
"loss": 0.2158,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22949981689453125,
"step": 1110,
"valid_targets_mean": 5401.1,
"valid_targets_min": 251
},
{
"epoch": 1.7783094098883572,
"grad_norm": 0.4993896425623004,
"learning_rate": 3.7186433611593225e-05,
"loss": 0.2052,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1904512345790863,
"step": 1115,
"valid_targets_mean": 5432.9,
"valid_targets_min": 238
},
{
"epoch": 1.7862838915470496,
"grad_norm": 0.45815865946027584,
"learning_rate": 3.7145621319744614e-05,
"loss": 0.2192,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2207677662372589,
"step": 1120,
"valid_targets_mean": 5302.4,
"valid_targets_min": 193
},
{
"epoch": 1.7942583732057416,
"grad_norm": 0.4341993760317199,
"learning_rate": 3.7104537885007635e-05,
"loss": 0.2176,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21209567785263062,
"step": 1125,
"valid_targets_mean": 5470.0,
"valid_targets_min": 291
},
{
"epoch": 1.802232854864434,
"grad_norm": 0.4329735980280842,
"learning_rate": 3.7063183957080594e-05,
"loss": 0.2219,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21948090195655823,
"step": 1130,
"valid_targets_mean": 6026.4,
"valid_targets_min": 971
},
{
"epoch": 1.810207336523126,
"grad_norm": 0.4481414703783188,
"learning_rate": 3.7021560189939416e-05,
"loss": 0.2191,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2207806408405304,
"step": 1135,
"valid_targets_mean": 5682.9,
"valid_targets_min": 1396
},
{
"epoch": 1.8181818181818183,
"grad_norm": 0.522534265852767,
"learning_rate": 3.697966724182729e-05,
"loss": 0.2026,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21881750226020813,
"step": 1140,
"valid_targets_mean": 5429.8,
"valid_targets_min": 447
},
{
"epoch": 1.8261562998405103,
"grad_norm": 0.4974497276431288,
"learning_rate": 3.6937505775244246e-05,
"loss": 0.1947,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.190834641456604,
"step": 1145,
"valid_targets_mean": 4105.1,
"valid_targets_min": 215
},
{
"epoch": 1.8341307814992025,
"grad_norm": 0.4079277949685025,
"learning_rate": 3.689507645693674e-05,
"loss": 0.2247,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22405077517032623,
"step": 1150,
"valid_targets_mean": 5792.1,
"valid_targets_min": 686
},
{
"epoch": 1.8421052631578947,
"grad_norm": 0.49811626292486966,
"learning_rate": 3.6852379957887025e-05,
"loss": 0.2173,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2030624896287918,
"step": 1155,
"valid_targets_mean": 5252.1,
"valid_targets_min": 455
},
{
"epoch": 1.8500797448165869,
"grad_norm": 0.4204561756675584,
"learning_rate": 3.6809416953302606e-05,
"loss": 0.2132,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20025420188903809,
"step": 1160,
"valid_targets_mean": 5681.7,
"valid_targets_min": 1357
},
{
"epoch": 1.858054226475279,
"grad_norm": 0.44519682325171034,
"learning_rate": 3.676618812260553e-05,
"loss": 0.1999,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21237683296203613,
"step": 1165,
"valid_targets_mean": 5172.7,
"valid_targets_min": 315
},
{
"epoch": 1.8660287081339713,
"grad_norm": 0.39822025331588046,
"learning_rate": 3.672269414942166e-05,
"loss": 0.2119,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20583263039588928,
"step": 1170,
"valid_targets_mean": 6143.7,
"valid_targets_min": 4416
},
{
"epoch": 1.8740031897926634,
"grad_norm": 0.4171821917382488,
"learning_rate": 3.6678935721569825e-05,
"loss": 0.2015,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19881102442741394,
"step": 1175,
"valid_targets_mean": 5497.3,
"valid_targets_min": 315
},
{
"epoch": 1.8819776714513556,
"grad_norm": 0.4738173624083104,
"learning_rate": 3.663491353105101e-05,
"loss": 0.2101,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21670684218406677,
"step": 1180,
"valid_targets_mean": 4734.4,
"valid_targets_min": 252
},
{
"epoch": 1.8899521531100478,
"grad_norm": 0.38986990747488626,
"learning_rate": 3.659062827403735e-05,
"loss": 0.2035,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19631826877593994,
"step": 1185,
"valid_targets_mean": 5470.2,
"valid_targets_min": 544
},
{
"epoch": 1.89792663476874,
"grad_norm": 0.43069168920501544,
"learning_rate": 3.654608065086115e-05,
"loss": 0.2265,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22201283276081085,
"step": 1190,
"valid_targets_mean": 5315.6,
"valid_targets_min": 1025
},
{
"epoch": 1.9059011164274322,
"grad_norm": 0.4756282213697449,
"learning_rate": 3.650127136600379e-05,
"loss": 0.2121,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20297697186470032,
"step": 1195,
"valid_targets_mean": 4748.2,
"valid_targets_min": 220
},
{
"epoch": 1.9138755980861244,
"grad_norm": 0.42489920562160244,
"learning_rate": 3.645620112808464e-05,
"loss": 0.2062,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20593520998954773,
"step": 1200,
"valid_targets_mean": 5418.3,
"valid_targets_min": 253
},
{
"epoch": 1.9218500797448166,
"grad_norm": 0.4334876163320044,
"learning_rate": 3.641087064984977e-05,
"loss": 0.2315,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22070161998271942,
"step": 1205,
"valid_targets_mean": 4694.1,
"valid_targets_min": 258
},
{
"epoch": 1.9298245614035088,
"grad_norm": 0.4516336012066562,
"learning_rate": 3.636528064816073e-05,
"loss": 0.2119,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20581312477588654,
"step": 1210,
"valid_targets_mean": 4649.5,
"valid_targets_min": 401
},
{
"epoch": 1.937799043062201,
"grad_norm": 0.4767246444943567,
"learning_rate": 3.6319431843983223e-05,
"loss": 0.2086,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21031825244426727,
"step": 1215,
"valid_targets_mean": 5190.2,
"valid_targets_min": 1234
},
{
"epoch": 1.9457735247208932,
"grad_norm": 0.4411208057237242,
"learning_rate": 3.6273324962375676e-05,
"loss": 0.2169,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20570659637451172,
"step": 1220,
"valid_targets_mean": 4742.9,
"valid_targets_min": 277
},
{
"epoch": 1.9537480063795853,
"grad_norm": 0.43422619282432606,
"learning_rate": 3.622696073247777e-05,
"loss": 0.2223,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23021955788135529,
"step": 1225,
"valid_targets_mean": 5510.6,
"valid_targets_min": 220
},
{
"epoch": 1.9617224880382775,
"grad_norm": 0.3958863238593673,
"learning_rate": 3.6180339887498953e-05,
"loss": 0.2082,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21620529890060425,
"step": 1230,
"valid_targets_mean": 5932.4,
"valid_targets_min": 3927
},
{
"epoch": 1.9696969696969697,
"grad_norm": 0.450040729571919,
"learning_rate": 3.613346316470678e-05,
"loss": 0.2142,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21761035919189453,
"step": 1235,
"valid_targets_mean": 5147.7,
"valid_targets_min": 197
},
{
"epoch": 1.977671451355662,
"grad_norm": 0.41291052485814267,
"learning_rate": 3.60863313054153e-05,
"loss": 0.2093,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2143172323703766,
"step": 1240,
"valid_targets_mean": 5364.6,
"valid_targets_min": 198
},
{
"epoch": 1.985645933014354,
"grad_norm": 0.4220642316941175,
"learning_rate": 3.6038945054973334e-05,
"loss": 0.2027,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18891289830207825,
"step": 1245,
"valid_targets_mean": 4778.4,
"valid_targets_min": 350
},
{
"epoch": 1.9936204146730463,
"grad_norm": 0.41397715465144314,
"learning_rate": 3.599130516275266e-05,
"loss": 0.2081,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21088147163391113,
"step": 1250,
"valid_targets_mean": 5391.7,
"valid_targets_min": 1017
},
{
"epoch": 2.0015948963317385,
"grad_norm": 0.3643446187203916,
"learning_rate": 3.594341238213618e-05,
"loss": 0.2026,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.199854776263237,
"step": 1255,
"valid_targets_mean": 7008.9,
"valid_targets_min": 1310
},
{
"epoch": 2.0095693779904304,
"grad_norm": 0.5089005502007752,
"learning_rate": 3.589526747050601e-05,
"loss": 0.1978,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19922807812690735,
"step": 1260,
"valid_targets_mean": 5693.9,
"valid_targets_min": 253
},
{
"epoch": 2.017543859649123,
"grad_norm": 0.503959442172207,
"learning_rate": 3.584687118923149e-05,
"loss": 0.1918,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1943974494934082,
"step": 1265,
"valid_targets_mean": 4555.7,
"valid_targets_min": 294
},
{
"epoch": 2.025518341307815,
"grad_norm": 0.479827670134503,
"learning_rate": 3.579822430365714e-05,
"loss": 0.2024,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20069649815559387,
"step": 1270,
"valid_targets_mean": 5865.2,
"valid_targets_min": 319
},
{
"epoch": 2.0334928229665072,
"grad_norm": 0.531555659296794,
"learning_rate": 3.57493275830906e-05,
"loss": 0.2025,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18816310167312622,
"step": 1275,
"valid_targets_mean": 4013.8,
"valid_targets_min": 257
},
{
"epoch": 2.041467304625199,
"grad_norm": 0.4535957632544287,
"learning_rate": 3.570018180079037e-05,
"loss": 0.1963,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.182516947388649,
"step": 1280,
"valid_targets_mean": 4548.5,
"valid_targets_min": 404
},
{
"epoch": 2.0494417862838916,
"grad_norm": 0.4102394127837868,
"learning_rate": 3.5650787733953715e-05,
"loss": 0.1967,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1951259821653366,
"step": 1285,
"valid_targets_mean": 5618.1,
"valid_targets_min": 485
},
{
"epoch": 2.0574162679425836,
"grad_norm": 0.4455885359883081,
"learning_rate": 3.560114616370425e-05,
"loss": 0.1901,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18562662601470947,
"step": 1290,
"valid_targets_mean": 5641.9,
"valid_targets_min": 1013
},
{
"epoch": 2.065390749601276,
"grad_norm": 0.428626874635782,
"learning_rate": 3.555125787507964e-05,
"loss": 0.1904,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18140408396720886,
"step": 1295,
"valid_targets_mean": 5703.9,
"valid_targets_min": 880
},
{
"epoch": 2.073365231259968,
"grad_norm": 0.4584548418763648,
"learning_rate": 3.550112365701921e-05,
"loss": 0.1934,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18239644169807434,
"step": 1300,
"valid_targets_mean": 4791.1,
"valid_targets_min": 306
},
{
"epoch": 2.0813397129186604,
"grad_norm": 0.43039743066547864,
"learning_rate": 3.545074430235142e-05,
"loss": 0.1952,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17609882354736328,
"step": 1305,
"valid_targets_mean": 5186.6,
"valid_targets_min": 993
},
{
"epoch": 2.0893141945773523,
"grad_norm": 0.570297651690843,
"learning_rate": 3.540012060778137e-05,
"loss": 0.1953,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1940477192401886,
"step": 1310,
"valid_targets_mean": 5585.9,
"valid_targets_min": 2335
},
{
"epoch": 2.0972886762360448,
"grad_norm": 0.5667347176037617,
"learning_rate": 3.534925337387816e-05,
"loss": 0.2077,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23207005858421326,
"step": 1315,
"valid_targets_mean": 4650.1,
"valid_targets_min": 988
},
{
"epoch": 2.1052631578947367,
"grad_norm": 0.437965181451973,
"learning_rate": 3.529814340506226e-05,
"loss": 0.1944,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18409255146980286,
"step": 1320,
"valid_targets_mean": 5324.3,
"valid_targets_min": 498
},
{
"epoch": 2.113237639553429,
"grad_norm": 0.48750716332724386,
"learning_rate": 3.524679150959277e-05,
"loss": 0.2052,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19646605849266052,
"step": 1325,
"valid_targets_mean": 5267.9,
"valid_targets_min": 242
},
{
"epoch": 2.121212121212121,
"grad_norm": 0.4674875720772593,
"learning_rate": 3.519519849955466e-05,
"loss": 0.1934,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.184675931930542,
"step": 1330,
"valid_targets_mean": 5060.6,
"valid_targets_min": 231
},
{
"epoch": 2.1291866028708135,
"grad_norm": 0.412128726013319,
"learning_rate": 3.514336519084591e-05,
"loss": 0.2034,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19906136393547058,
"step": 1335,
"valid_targets_mean": 6195.8,
"valid_targets_min": 1126
},
{
"epoch": 2.1371610845295055,
"grad_norm": 0.454372966625409,
"learning_rate": 3.509129240316461e-05,
"loss": 0.1961,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1770518273115158,
"step": 1340,
"valid_targets_mean": 4886.6,
"valid_targets_min": 229
},
{
"epoch": 2.145135566188198,
"grad_norm": 0.41470060548444787,
"learning_rate": 3.5038980959995985e-05,
"loss": 0.2001,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21732914447784424,
"step": 1345,
"valid_targets_mean": 5456.9,
"valid_targets_min": 431
},
{
"epoch": 2.15311004784689,
"grad_norm": 0.5082279794924567,
"learning_rate": 3.498643168859941e-05,
"loss": 0.195,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2050442099571228,
"step": 1350,
"valid_targets_mean": 3737.6,
"valid_targets_min": 237
},
{
"epoch": 2.1610845295055823,
"grad_norm": 0.4465994627612317,
"learning_rate": 3.493364541999529e-05,
"loss": 0.1982,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1864827573299408,
"step": 1355,
"valid_targets_mean": 5549.5,
"valid_targets_min": 265
},
{
"epoch": 2.1690590111642742,
"grad_norm": 0.4959175879648974,
"learning_rate": 3.488062298895194e-05,
"loss": 0.1926,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19287291169166565,
"step": 1360,
"valid_targets_mean": 5856.5,
"valid_targets_min": 187
},
{
"epoch": 2.1770334928229667,
"grad_norm": 0.44527239357999826,
"learning_rate": 3.482736523397237e-05,
"loss": 0.1966,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1782650649547577,
"step": 1365,
"valid_targets_mean": 6042.2,
"valid_targets_min": 283
},
{
"epoch": 2.1850079744816586,
"grad_norm": 0.48649563144503055,
"learning_rate": 3.4773872997281026e-05,
"loss": 0.1998,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19013699889183044,
"step": 1370,
"valid_targets_mean": 4519.7,
"valid_targets_min": 234
},
{
"epoch": 2.192982456140351,
"grad_norm": 0.45009208736512063,
"learning_rate": 3.472014712481048e-05,
"loss": 0.2011,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20921623706817627,
"step": 1375,
"valid_targets_mean": 5785.2,
"valid_targets_min": 1188
},
{
"epoch": 2.200956937799043,
"grad_norm": 0.47367304566980717,
"learning_rate": 3.466618846618806e-05,
"loss": 0.1865,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19029450416564941,
"step": 1380,
"valid_targets_mean": 4545.1,
"valid_targets_min": 218
},
{
"epoch": 2.2089314194577354,
"grad_norm": 0.44532555731302303,
"learning_rate": 3.461199787472238e-05,
"loss": 0.1949,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2194649875164032,
"step": 1385,
"valid_targets_mean": 6045.2,
"valid_targets_min": 353
},
{
"epoch": 2.2169059011164274,
"grad_norm": 0.4574540062857725,
"learning_rate": 3.455757620738989e-05,
"loss": 0.2019,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2010454535484314,
"step": 1390,
"valid_targets_mean": 5319.1,
"valid_targets_min": 192
},
{
"epoch": 2.22488038277512,
"grad_norm": 0.4137662066758735,
"learning_rate": 3.450292432482127e-05,
"loss": 0.1936,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1860542595386505,
"step": 1395,
"valid_targets_mean": 5334.2,
"valid_targets_min": 254
},
{
"epoch": 2.2328548644338118,
"grad_norm": 0.5266331960391181,
"learning_rate": 3.444804309128789e-05,
"loss": 0.19,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20332130789756775,
"step": 1400,
"valid_targets_mean": 4094.9,
"valid_targets_min": 276
},
{
"epoch": 2.240829346092504,
"grad_norm": 0.4275504408813166,
"learning_rate": 3.439293337468808e-05,
"loss": 0.1886,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20420581102371216,
"step": 1405,
"valid_targets_mean": 5697.4,
"valid_targets_min": 280
},
{
"epoch": 2.248803827751196,
"grad_norm": 0.6098551773610512,
"learning_rate": 3.4337596046533426e-05,
"loss": 0.2025,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2192438542842865,
"step": 1410,
"valid_targets_mean": 4067.2,
"valid_targets_min": 273
},
{
"epoch": 2.2567783094098885,
"grad_norm": 0.46223066080996034,
"learning_rate": 3.4282031981935e-05,
"loss": 0.1949,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19895970821380615,
"step": 1415,
"valid_targets_mean": 5468.5,
"valid_targets_min": 241
},
{
"epoch": 2.2647527910685805,
"grad_norm": 0.4816233736428177,
"learning_rate": 3.42262420595895e-05,
"loss": 0.1914,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20274695754051208,
"step": 1420,
"valid_targets_mean": 4453.4,
"valid_targets_min": 243
},
{
"epoch": 2.2727272727272725,
"grad_norm": 0.5447011231170933,
"learning_rate": 3.417022716176539e-05,
"loss": 0.1957,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23817561566829681,
"step": 1425,
"valid_targets_mean": 4389.7,
"valid_targets_min": 207
},
{
"epoch": 2.280701754385965,
"grad_norm": 0.4065575430290217,
"learning_rate": 3.411398817428889e-05,
"loss": 0.2022,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17134660482406616,
"step": 1430,
"valid_targets_mean": 5676.4,
"valid_targets_min": 287
},
{
"epoch": 2.2886762360446573,
"grad_norm": 0.42839943743721853,
"learning_rate": 3.4057525986530016e-05,
"loss": 0.1921,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1901647001504898,
"step": 1435,
"valid_targets_mean": 5106.8,
"valid_targets_min": 231
},
{
"epoch": 2.2966507177033493,
"grad_norm": 0.5843289079352976,
"learning_rate": 3.400084149138851e-05,
"loss": 0.1981,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19277843832969666,
"step": 1440,
"valid_targets_mean": 5061.8,
"valid_targets_min": 248
},
{
"epoch": 2.3046251993620412,
"grad_norm": 0.41359975340834615,
"learning_rate": 3.394393558527969e-05,
"loss": 0.189,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1865783929824829,
"step": 1445,
"valid_targets_mean": 4914.6,
"valid_targets_min": 215
},
{
"epoch": 2.3125996810207337,
"grad_norm": 0.8413467284644864,
"learning_rate": 3.388680916812031e-05,
"loss": 0.1935,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19681130349636078,
"step": 1450,
"valid_targets_mean": 3662.1,
"valid_targets_min": 231
},
{
"epoch": 2.320574162679426,
"grad_norm": 0.42971911311204314,
"learning_rate": 3.382946314331429e-05,
"loss": 0.2018,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1996922791004181,
"step": 1455,
"valid_targets_mean": 5618.2,
"valid_targets_min": 238
},
{
"epoch": 2.328548644338118,
"grad_norm": 0.44153231073372906,
"learning_rate": 3.377189841773848e-05,
"loss": 0.1869,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1980620175600052,
"step": 1460,
"valid_targets_mean": 6170.3,
"valid_targets_min": 231
},
{
"epoch": 2.33652312599681,
"grad_norm": 0.5293878213403573,
"learning_rate": 3.371411590172827e-05,
"loss": 0.1906,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18319925665855408,
"step": 1465,
"valid_targets_mean": 5088.3,
"valid_targets_min": 293
},
{
"epoch": 2.3444976076555024,
"grad_norm": 0.6426703391266552,
"learning_rate": 3.365611650906321e-05,
"loss": 0.2076,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20919805765151978,
"step": 1470,
"valid_targets_mean": 4000.6,
"valid_targets_min": 245
},
{
"epoch": 2.352472089314195,
"grad_norm": 0.3978379280431999,
"learning_rate": 3.359790115695259e-05,
"loss": 0.1828,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18329757452011108,
"step": 1475,
"valid_targets_mean": 5595.2,
"valid_targets_min": 236
},
{
"epoch": 2.360446570972887,
"grad_norm": 0.4545853833674734,
"learning_rate": 3.353947076602088e-05,
"loss": 0.1964,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20800280570983887,
"step": 1480,
"valid_targets_mean": 4826.0,
"valid_targets_min": 240
},
{
"epoch": 2.3684210526315788,
"grad_norm": 0.44645999692405564,
"learning_rate": 3.34808262602932e-05,
"loss": 0.2067,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20406398177146912,
"step": 1485,
"valid_targets_mean": 5473.4,
"valid_targets_min": 352
},
{
"epoch": 2.376395534290271,
"grad_norm": 0.445133870638968,
"learning_rate": 3.342196856718074e-05,
"loss": 0.196,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2017001211643219,
"step": 1490,
"valid_targets_mean": 6088.2,
"valid_targets_min": 661
},
{
"epoch": 2.384370015948963,
"grad_norm": 0.597332937011485,
"learning_rate": 3.336289861746602e-05,
"loss": 0.1933,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19852346181869507,
"step": 1495,
"valid_targets_mean": 4930.6,
"valid_targets_min": 234
},
{
"epoch": 2.3923444976076556,
"grad_norm": 0.45394616672617394,
"learning_rate": 3.330361734528823e-05,
"loss": 0.2008,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.190562903881073,
"step": 1500,
"valid_targets_mean": 4513.7,
"valid_targets_min": 471
},
{
"epoch": 2.4003189792663475,
"grad_norm": 0.4805966610484533,
"learning_rate": 3.324412568812844e-05,
"loss": 0.1841,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20358845591545105,
"step": 1505,
"valid_targets_mean": 4287.1,
"valid_targets_min": 242
},
{
"epoch": 2.40829346092504,
"grad_norm": 0.42131026059287974,
"learning_rate": 3.318442458679477e-05,
"loss": 0.2057,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19886666536331177,
"step": 1510,
"valid_targets_mean": 5740.6,
"valid_targets_min": 1204
},
{
"epoch": 2.416267942583732,
"grad_norm": 0.4625097603216523,
"learning_rate": 3.312451498540751e-05,
"loss": 0.2086,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2181396782398224,
"step": 1515,
"valid_targets_mean": 4945.9,
"valid_targets_min": 208
},
{
"epoch": 2.4242424242424243,
"grad_norm": 0.7157764991804577,
"learning_rate": 3.306439783138421e-05,
"loss": 0.2016,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18493902683258057,
"step": 1520,
"valid_targets_mean": 4290.6,
"valid_targets_min": 233
},
{
"epoch": 2.4322169059011163,
"grad_norm": 0.48585805226131235,
"learning_rate": 3.3004074075424666e-05,
"loss": 0.1971,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1977916955947876,
"step": 1525,
"valid_targets_mean": 4688.1,
"valid_targets_min": 371
},
{
"epoch": 2.4401913875598087,
"grad_norm": 0.4127665889358799,
"learning_rate": 3.29435446714959e-05,
"loss": 0.1918,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21614857017993927,
"step": 1530,
"valid_targets_mean": 5571.1,
"valid_targets_min": 247
},
{
"epoch": 2.4481658692185007,
"grad_norm": 0.42425666745682966,
"learning_rate": 3.288281057681709e-05,
"loss": 0.2026,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20173463225364685,
"step": 1535,
"valid_targets_mean": 5986.9,
"valid_targets_min": 3398
},
{
"epoch": 2.456140350877193,
"grad_norm": 0.4248076718805002,
"learning_rate": 3.28218727518444e-05,
"loss": 0.1986,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1972285509109497,
"step": 1540,
"valid_targets_mean": 6004.7,
"valid_targets_min": 312
},
{
"epoch": 2.464114832535885,
"grad_norm": 0.3922347541694817,
"learning_rate": 3.2760732160255835e-05,
"loss": 0.191,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18398353457450867,
"step": 1545,
"valid_targets_mean": 5221.8,
"valid_targets_min": 257
},
{
"epoch": 2.4720893141945774,
"grad_norm": 0.4303243717469087,
"learning_rate": 3.269938976893595e-05,
"loss": 0.2019,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21553900837898254,
"step": 1550,
"valid_targets_mean": 5332.7,
"valid_targets_min": 385
},
{
"epoch": 2.4800637958532694,
"grad_norm": 0.4854770545469238,
"learning_rate": 3.2637846547960596e-05,
"loss": 0.1945,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17565301060676575,
"step": 1555,
"valid_targets_mean": 4513.3,
"valid_targets_min": 265
},
{
"epoch": 2.488038277511962,
"grad_norm": 0.43977338387056625,
"learning_rate": 3.2576103470581564e-05,
"loss": 0.188,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19088605046272278,
"step": 1560,
"valid_targets_mean": 4912.8,
"valid_targets_min": 237
},
{
"epoch": 2.496012759170654,
"grad_norm": 0.4520785254838387,
"learning_rate": 3.25141615132112e-05,
"loss": 0.191,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20245029032230377,
"step": 1565,
"valid_targets_mean": 5112.1,
"valid_targets_min": 897
},
{
"epoch": 2.503987240829346,
"grad_norm": 0.5068509455429572,
"learning_rate": 3.245202165540697e-05,
"loss": 0.1907,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19341543316841125,
"step": 1570,
"valid_targets_mean": 4056.7,
"valid_targets_min": 234
},
{
"epoch": 2.511961722488038,
"grad_norm": 0.5435007785354973,
"learning_rate": 3.238968487985594e-05,
"loss": 0.2003,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22572636604309082,
"step": 1575,
"valid_targets_mean": 5079.7,
"valid_targets_min": 470
},
{
"epoch": 2.5199362041467306,
"grad_norm": 0.45017998405884907,
"learning_rate": 3.232715217235927e-05,
"loss": 0.1912,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1891011893749237,
"step": 1580,
"valid_targets_mean": 4659.2,
"valid_targets_min": 269
},
{
"epoch": 2.5279106858054226,
"grad_norm": 0.46614430155117725,
"learning_rate": 3.226442452181662e-05,
"loss": 0.1958,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21900171041488647,
"step": 1585,
"valid_targets_mean": 4712.8,
"valid_targets_min": 290
},
{
"epoch": 2.535885167464115,
"grad_norm": 0.4179797529076482,
"learning_rate": 3.220150292021049e-05,
"loss": 0.2014,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20042002201080322,
"step": 1590,
"valid_targets_mean": 5453.1,
"valid_targets_min": 397
},
{
"epoch": 2.543859649122807,
"grad_norm": 0.3941065291864704,
"learning_rate": 3.213838836259055e-05,
"loss": 0.1877,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1991400420665741,
"step": 1595,
"valid_targets_mean": 6182.4,
"valid_targets_min": 1366
},
{
"epoch": 2.5518341307814993,
"grad_norm": 0.5251204241670916,
"learning_rate": 3.2075081847057886e-05,
"loss": 0.192,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1915452778339386,
"step": 1600,
"valid_targets_mean": 5069.6,
"valid_targets_min": 315
},
{
"epoch": 2.5598086124401913,
"grad_norm": 0.4344757969866471,
"learning_rate": 3.201158437474925e-05,
"loss": 0.2098,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20345640182495117,
"step": 1605,
"valid_targets_mean": 5158.1,
"valid_targets_min": 291
},
{
"epoch": 2.5677830940988837,
"grad_norm": 0.486960352408697,
"learning_rate": 3.194789694982119e-05,
"loss": 0.2066,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20748808979988098,
"step": 1610,
"valid_targets_mean": 4422.7,
"valid_targets_min": 313
},
{
"epoch": 2.5757575757575757,
"grad_norm": 0.40817659538238277,
"learning_rate": 3.1884020579434216e-05,
"loss": 0.1962,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19428619742393494,
"step": 1615,
"valid_targets_mean": 5725.4,
"valid_targets_min": 1368
},
{
"epoch": 2.583732057416268,
"grad_norm": 0.5274105752709692,
"learning_rate": 3.181995627373679e-05,
"loss": 0.2008,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1966966688632965,
"step": 1620,
"valid_targets_mean": 4958.5,
"valid_targets_min": 244
},
{
"epoch": 2.59170653907496,
"grad_norm": 0.6069953846941016,
"learning_rate": 3.1755705045849465e-05,
"loss": 0.2006,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21730463206768036,
"step": 1625,
"valid_targets_mean": 5876.8,
"valid_targets_min": 231
},
{
"epoch": 2.5996810207336525,
"grad_norm": 0.4266434532453334,
"learning_rate": 3.1691267911848765e-05,
"loss": 0.1997,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19540351629257202,
"step": 1630,
"valid_targets_mean": 6337.5,
"valid_targets_min": 1361
},
{
"epoch": 2.6076555023923444,
"grad_norm": 0.4740580478639372,
"learning_rate": 3.1626645890751167e-05,
"loss": 0.194,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20163899660110474,
"step": 1635,
"valid_targets_mean": 4218.8,
"valid_targets_min": 375
},
{
"epoch": 2.6156299840510364,
"grad_norm": 0.45637845415807304,
"learning_rate": 3.156184000449697e-05,
"loss": 0.1913,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20877380669116974,
"step": 1640,
"valid_targets_mean": 5568.1,
"valid_targets_min": 1781
},
{
"epoch": 2.623604465709729,
"grad_norm": 0.4308877600902401,
"learning_rate": 3.149685127793415e-05,
"loss": 0.2019,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18682101368904114,
"step": 1645,
"valid_targets_mean": 5184.0,
"valid_targets_min": 234
},
{
"epoch": 2.6315789473684212,
"grad_norm": 0.4189163208718231,
"learning_rate": 3.143168073880214e-05,
"loss": 0.1924,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18947117030620575,
"step": 1650,
"valid_targets_mean": 7086.4,
"valid_targets_min": 3741
},
{
"epoch": 2.639553429027113,
"grad_norm": 0.5597913294956877,
"learning_rate": 3.1366329417715556e-05,
"loss": 0.1994,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20389412343502045,
"step": 1655,
"valid_targets_mean": 2807.3,
"valid_targets_min": 245
},
{
"epoch": 2.647527910685805,
"grad_norm": 0.4577649992315954,
"learning_rate": 3.1300798348147954e-05,
"loss": 0.203,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21411626040935516,
"step": 1660,
"valid_targets_mean": 4915.6,
"valid_targets_min": 244
},
{
"epoch": 2.6555023923444976,
"grad_norm": 0.5697741917006428,
"learning_rate": 3.123508856641542e-05,
"loss": 0.1887,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18438398838043213,
"step": 1665,
"valid_targets_mean": 2729.6,
"valid_targets_min": 212
},
{
"epoch": 2.66347687400319,
"grad_norm": 0.4954551623019788,
"learning_rate": 3.116920111166025e-05,
"loss": 0.1923,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19248652458190918,
"step": 1670,
"valid_targets_mean": 5454.8,
"valid_targets_min": 1300
},
{
"epoch": 2.671451355661882,
"grad_norm": 0.6574670833738052,
"learning_rate": 3.1103137025834456e-05,
"loss": 0.1985,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20095154643058777,
"step": 1675,
"valid_targets_mean": 4381.1,
"valid_targets_min": 227
},
{
"epoch": 2.679425837320574,
"grad_norm": 0.5132611155528096,
"learning_rate": 3.103689735368333e-05,
"loss": 0.1927,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1844911277294159,
"step": 1680,
"valid_targets_mean": 5391.4,
"valid_targets_min": 252
},
{
"epoch": 2.6874003189792663,
"grad_norm": 0.4212211839126058,
"learning_rate": 3.097048314272889e-05,
"loss": 0.1864,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18505148589611053,
"step": 1685,
"valid_targets_mean": 5102.6,
"valid_targets_min": 300
},
{
"epoch": 2.6953748006379588,
"grad_norm": 0.4423902059794495,
"learning_rate": 3.090389544325335e-05,
"loss": 0.1873,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1688818335533142,
"step": 1690,
"valid_targets_mean": 4878.3,
"valid_targets_min": 324
},
{
"epoch": 2.7033492822966507,
"grad_norm": 0.5581123858755366,
"learning_rate": 3.08371353082825e-05,
"loss": 0.1986,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19731852412223816,
"step": 1695,
"valid_targets_mean": 3715.7,
"valid_targets_min": 251
},
{
"epoch": 2.7113237639553427,
"grad_norm": 0.42350710595986724,
"learning_rate": 3.0770203793568994e-05,
"loss": 0.1864,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16717937588691711,
"step": 1700,
"valid_targets_mean": 4077.0,
"valid_targets_min": 233
},
{
"epoch": 2.719298245614035,
"grad_norm": 0.49090848376444596,
"learning_rate": 3.0703101957575765e-05,
"loss": 0.1815,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15885134041309357,
"step": 1705,
"valid_targets_mean": 4482.4,
"valid_targets_min": 243
},
{
"epoch": 2.7272727272727275,
"grad_norm": 0.6436929861619126,
"learning_rate": 3.0635830861459204e-05,
"loss": 0.1885,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18233323097229004,
"step": 1710,
"valid_targets_mean": 4834.9,
"valid_targets_min": 195
},
{
"epoch": 2.7352472089314195,
"grad_norm": 0.46088720776870845,
"learning_rate": 3.056839156905239e-05,
"loss": 0.1983,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1806366741657257,
"step": 1715,
"valid_targets_mean": 4546.9,
"valid_targets_min": 237
},
{
"epoch": 2.7432216905901115,
"grad_norm": 0.4474922756938493,
"learning_rate": 3.0500785146848303e-05,
"loss": 0.1911,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22203987836837769,
"step": 1720,
"valid_targets_mean": 5486.4,
"valid_targets_min": 3263
},
{
"epoch": 2.751196172248804,
"grad_norm": 0.4954321658053421,
"learning_rate": 3.04330126639829e-05,
"loss": 0.1929,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19901606440544128,
"step": 1725,
"valid_targets_mean": 4870.5,
"valid_targets_min": 344
},
{
"epoch": 2.7591706539074963,
"grad_norm": 0.4289601290987771,
"learning_rate": 3.0365075192218278e-05,
"loss": 0.1855,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18361328542232513,
"step": 1730,
"valid_targets_mean": 5532.9,
"valid_targets_min": 361
},
{
"epoch": 2.7671451355661882,
"grad_norm": 0.43515257338738716,
"learning_rate": 3.0296973805925663e-05,
"loss": 0.1953,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1985451728105545,
"step": 1735,
"valid_targets_mean": 4923.9,
"valid_targets_min": 205
},
{
"epoch": 2.77511961722488,
"grad_norm": 0.49286906233457306,
"learning_rate": 3.022870958206845e-05,
"loss": 0.1901,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22014012932777405,
"step": 1740,
"valid_targets_mean": 4225.8,
"valid_targets_min": 241
},
{
"epoch": 2.7830940988835726,
"grad_norm": 0.46268729106701734,
"learning_rate": 3.0160283600185168e-05,
"loss": 0.1977,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1991043984889984,
"step": 1745,
"valid_targets_mean": 5857.8,
"valid_targets_min": 2502
},
{
"epoch": 2.7910685805422646,
"grad_norm": 0.43987550309271245,
"learning_rate": 3.0091696942372412e-05,
"loss": 0.1939,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22454778850078583,
"step": 1750,
"valid_targets_mean": 5287.6,
"valid_targets_min": 426
},
{
"epoch": 2.799043062200957,
"grad_norm": 0.3909802203598762,
"learning_rate": 3.002295069326772e-05,
"loss": 0.1953,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18474428355693817,
"step": 1755,
"valid_targets_mean": 6217.1,
"valid_targets_min": 798
},
{
"epoch": 2.807017543859649,
"grad_norm": 0.4519033373142686,
"learning_rate": 2.9954045940032423e-05,
"loss": 0.1995,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2228385955095291,
"step": 1760,
"valid_targets_mean": 4893.2,
"valid_targets_min": 796
},
{
"epoch": 2.8149920255183414,
"grad_norm": 0.443167897058933,
"learning_rate": 2.988498377233446e-05,
"loss": 0.1957,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19619905948638916,
"step": 1765,
"valid_targets_mean": 4660.5,
"valid_targets_min": 537
},
{
"epoch": 2.8229665071770333,
"grad_norm": 0.40577323628578027,
"learning_rate": 2.981576528233114e-05,
"loss": 0.1875,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1754124015569687,
"step": 1770,
"valid_targets_mean": 5301.9,
"valid_targets_min": 1010
},
{
"epoch": 2.8309409888357258,
"grad_norm": 0.7482306867842724,
"learning_rate": 2.9746391564651867e-05,
"loss": 0.1858,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19741225242614746,
"step": 1775,
"valid_targets_mean": 5149.7,
"valid_targets_min": 442
},
{
"epoch": 2.8389154704944177,
"grad_norm": 0.4247278253753553,
"learning_rate": 2.9676863716380845e-05,
"loss": 0.1809,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17590616643428802,
"step": 1780,
"valid_targets_mean": 4805.6,
"valid_targets_min": 245
},
{
"epoch": 2.84688995215311,
"grad_norm": 0.3967661509113751,
"learning_rate": 2.9607182837039697e-05,
"loss": 0.1945,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19023631513118744,
"step": 1785,
"valid_targets_mean": 5670.9,
"valid_targets_min": 342
},
{
"epoch": 2.854864433811802,
"grad_norm": 0.469096556872057,
"learning_rate": 2.9537350028570126e-05,
"loss": 0.1982,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1898074746131897,
"step": 1790,
"valid_targets_mean": 5681.8,
"valid_targets_min": 589
},
{
"epoch": 2.8628389154704945,
"grad_norm": 0.47473047259461487,
"learning_rate": 2.946736639531643e-05,
"loss": 0.1922,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18150553107261658,
"step": 1795,
"valid_targets_mean": 3808.1,
"valid_targets_min": 222
},
{
"epoch": 2.8708133971291865,
"grad_norm": 0.5204904028442524,
"learning_rate": 2.9397233044008092e-05,
"loss": 0.1949,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23707595467567444,
"step": 1800,
"valid_targets_mean": 4178.8,
"valid_targets_min": 220
},
{
"epoch": 2.878787878787879,
"grad_norm": 0.47501836141359854,
"learning_rate": 2.9326951083742243e-05,
"loss": 0.1874,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19446857273578644,
"step": 1805,
"valid_targets_mean": 4535.6,
"valid_targets_min": 389
},
{
"epoch": 2.886762360446571,
"grad_norm": 0.42948864890631583,
"learning_rate": 2.925652162596613e-05,
"loss": 0.1808,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17343220114707947,
"step": 1810,
"valid_targets_mean": 4889.4,
"valid_targets_min": 236
},
{
"epoch": 2.8947368421052633,
"grad_norm": 0.5059534986758673,
"learning_rate": 2.9185945784459558e-05,
"loss": 0.1953,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2241000235080719,
"step": 1815,
"valid_targets_mean": 5150.2,
"valid_targets_min": 330
},
{
"epoch": 2.9027113237639552,
"grad_norm": 0.47658050657237366,
"learning_rate": 2.9115224675317252e-05,
"loss": 0.1884,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21023055911064148,
"step": 1820,
"valid_targets_mean": 4221.5,
"valid_targets_min": 214
},
{
"epoch": 2.9106858054226477,
"grad_norm": 0.41994426403573426,
"learning_rate": 2.9044359416931206e-05,
"loss": 0.1975,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1868569403886795,
"step": 1825,
"valid_targets_mean": 5305.3,
"valid_targets_min": 350
},
{
"epoch": 2.9186602870813396,
"grad_norm": 0.41704691170495495,
"learning_rate": 2.897335112997302e-05,
"loss": 0.1977,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18512971699237823,
"step": 1830,
"valid_targets_mean": 5721.6,
"valid_targets_min": 1638
},
{
"epoch": 2.926634768740032,
"grad_norm": 0.44070738637909757,
"learning_rate": 2.8902200937376173e-05,
"loss": 0.196,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.187473863363266,
"step": 1835,
"valid_targets_mean": 4991.3,
"valid_targets_min": 220
},
{
"epoch": 2.934609250398724,
"grad_norm": 0.41564417066878323,
"learning_rate": 2.8830909964318242e-05,
"loss": 0.1865,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1944010853767395,
"step": 1840,
"valid_targets_mean": 5204.4,
"valid_targets_min": 254
},
{
"epoch": 2.9425837320574164,
"grad_norm": 0.4711330801343301,
"learning_rate": 2.875947933820312e-05,
"loss": 0.1909,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18439987301826477,
"step": 1845,
"valid_targets_mean": 4334.9,
"valid_targets_min": 358
},
{
"epoch": 2.9505582137161084,
"grad_norm": 0.4312204583935454,
"learning_rate": 2.868791018864321e-05,
"loss": 0.1933,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2141954004764557,
"step": 1850,
"valid_targets_mean": 5918.7,
"valid_targets_min": 729
},
{
"epoch": 2.958532695374801,
"grad_norm": 0.3992293087829351,
"learning_rate": 2.861620364744151e-05,
"loss": 0.1956,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1783233880996704,
"step": 1855,
"valid_targets_mean": 5647.2,
"valid_targets_min": 265
},
{
"epoch": 2.9665071770334928,
"grad_norm": 0.4507956223008353,
"learning_rate": 2.854436084857379e-05,
"loss": 0.186,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17667381465435028,
"step": 1860,
"valid_targets_mean": 4852.1,
"valid_targets_min": 213
},
{
"epoch": 2.974481658692185,
"grad_norm": 0.4773163155858111,
"learning_rate": 2.847238292817057e-05,
"loss": 0.1976,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20969876646995544,
"step": 1865,
"valid_targets_mean": 4586.2,
"valid_targets_min": 445
},
{
"epoch": 2.982456140350877,
"grad_norm": 0.4528434719614539,
"learning_rate": 2.8400271024499212e-05,
"loss": 0.1935,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2054166942834854,
"step": 1870,
"valid_targets_mean": 4955.4,
"valid_targets_min": 226
},
{
"epoch": 2.990430622009569,
"grad_norm": 0.3885619872358622,
"learning_rate": 2.832802627794593e-05,
"loss": 0.1919,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1787319779396057,
"step": 1875,
"valid_targets_mean": 5796.7,
"valid_targets_min": 237
},
{
"epoch": 2.9984051036682615,
"grad_norm": 0.42804120084625014,
"learning_rate": 2.8255649830997704e-05,
"loss": 0.1853,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17473948001861572,
"step": 1880,
"valid_targets_mean": 5018.7,
"valid_targets_min": 268
},
{
"epoch": 3.006379585326954,
"grad_norm": 0.433732961845131,
"learning_rate": 2.8183142828224238e-05,
"loss": 0.1856,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17086060345172882,
"step": 1885,
"valid_targets_mean": 5365.8,
"valid_targets_min": 974
},
{
"epoch": 3.014354066985646,
"grad_norm": 0.4863024499849261,
"learning_rate": 2.811050641625988e-05,
"loss": 0.1787,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.191526398062706,
"step": 1890,
"valid_targets_mean": 5307.4,
"valid_targets_min": 280
},
{
"epoch": 3.0223285486443383,
"grad_norm": 0.4706758519016476,
"learning_rate": 2.8037741743785458e-05,
"loss": 0.1817,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18275225162506104,
"step": 1895,
"valid_targets_mean": 5210.0,
"valid_targets_min": 1063
},
{
"epoch": 3.0303030303030303,
"grad_norm": 0.48525571024905406,
"learning_rate": 2.796484996151013e-05,
"loss": 0.1832,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1842869222164154,
"step": 1900,
"valid_targets_mean": 4938.5,
"valid_targets_min": 346
},
{
"epoch": 3.0382775119617227,
"grad_norm": 0.412438730549393,
"learning_rate": 2.7891832222153188e-05,
"loss": 0.1752,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17894425988197327,
"step": 1905,
"valid_targets_mean": 6566.9,
"valid_targets_min": 3239
},
{
"epoch": 3.0462519936204147,
"grad_norm": 0.4304985686601505,
"learning_rate": 2.7818689680425807e-05,
"loss": 0.1746,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17525765299797058,
"step": 1910,
"valid_targets_mean": 5481.5,
"valid_targets_min": 217
},
{
"epoch": 3.054226475279107,
"grad_norm": 0.3943796487066891,
"learning_rate": 2.7745423493012827e-05,
"loss": 0.1758,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17475299537181854,
"step": 1915,
"valid_targets_mean": 5954.4,
"valid_targets_min": 286
},
{
"epoch": 3.062200956937799,
"grad_norm": 0.4539894149791786,
"learning_rate": 2.767203481855441e-05,
"loss": 0.1799,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19275791943073273,
"step": 1920,
"valid_targets_mean": 5459.8,
"valid_targets_min": 715
},
{
"epoch": 3.0701754385964914,
"grad_norm": 0.5140612143362417,
"learning_rate": 2.7598524817627764e-05,
"loss": 0.1778,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18038983643054962,
"step": 1925,
"valid_targets_mean": 5190.4,
"valid_targets_min": 253
},
{
"epoch": 3.0781499202551834,
"grad_norm": 0.5065917391396272,
"learning_rate": 2.7524894652728754e-05,
"loss": 0.1739,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17167213559150696,
"step": 1930,
"valid_targets_mean": 5318.8,
"valid_targets_min": 210
},
{
"epoch": 3.0861244019138754,
"grad_norm": 0.4869400509228171,
"learning_rate": 2.7451145488253544e-05,
"loss": 0.1774,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19056691229343414,
"step": 1935,
"valid_targets_mean": 4080.8,
"valid_targets_min": 198
},
{
"epoch": 3.094098883572568,
"grad_norm": 0.43805490959459653,
"learning_rate": 2.7377278490480157e-05,
"loss": 0.1741,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18080243468284607,
"step": 1940,
"valid_targets_mean": 5616.9,
"valid_targets_min": 1092
},
{
"epoch": 3.1020733652312598,
"grad_norm": 0.5757191060457126,
"learning_rate": 2.730329482755006e-05,
"loss": 0.1829,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19692851603031158,
"step": 1945,
"valid_targets_mean": 4502.3,
"valid_targets_min": 285
},
{
"epoch": 3.110047846889952,
"grad_norm": 0.4558677202034122,
"learning_rate": 2.7229195669449667e-05,
"loss": 0.1938,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19101294875144958,
"step": 1950,
"valid_targets_mean": 5041.2,
"valid_targets_min": 213
},
{
"epoch": 3.118022328548644,
"grad_norm": 0.5737066377290475,
"learning_rate": 2.7154982187991855e-05,
"loss": 0.1745,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17446887493133545,
"step": 1955,
"valid_targets_mean": 4123.6,
"valid_targets_min": 164
},
{
"epoch": 3.1259968102073366,
"grad_norm": 0.4748676581841484,
"learning_rate": 2.7080655556797406e-05,
"loss": 0.1726,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1776636242866516,
"step": 1960,
"valid_targets_mean": 4680.4,
"valid_targets_min": 277
},
{
"epoch": 3.1339712918660285,
"grad_norm": 0.6049727128355192,
"learning_rate": 2.700621695127649e-05,
"loss": 0.1865,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19648462533950806,
"step": 1965,
"valid_targets_mean": 3179.7,
"valid_targets_min": 239
},
{
"epoch": 3.141945773524721,
"grad_norm": 0.904407825912653,
"learning_rate": 2.693166754861003e-05,
"loss": 0.1773,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16663089394569397,
"step": 1970,
"valid_targets_mean": 5391.8,
"valid_targets_min": 944
},
{
"epoch": 3.149920255183413,
"grad_norm": 0.4709363791045733,
"learning_rate": 2.685700852773113e-05,
"loss": 0.187,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18905910849571228,
"step": 1975,
"valid_targets_mean": 4695.8,
"valid_targets_min": 229
},
{
"epoch": 3.1578947368421053,
"grad_norm": 0.42759989366433276,
"learning_rate": 2.6782241069306395e-05,
"loss": 0.1835,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15810883045196533,
"step": 1980,
"valid_targets_mean": 4624.4,
"valid_targets_min": 264
},
{
"epoch": 3.1658692185007973,
"grad_norm": 0.5668755951710633,
"learning_rate": 2.6707366355717268e-05,
"loss": 0.1752,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19498129189014435,
"step": 1985,
"valid_targets_mean": 3415.8,
"valid_targets_min": 237
},
{
"epoch": 3.1738437001594897,
"grad_norm": 0.5117307401139212,
"learning_rate": 2.663238557104136e-05,
"loss": 0.175,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18552227318286896,
"step": 1990,
"valid_targets_mean": 5261.2,
"valid_targets_min": 1556
},
{
"epoch": 3.1818181818181817,
"grad_norm": 0.4511472489219715,
"learning_rate": 2.655729990103368e-05,
"loss": 0.1814,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19818511605262756,
"step": 1995,
"valid_targets_mean": 4634.6,
"valid_targets_min": 238
},
{
"epoch": 3.189792663476874,
"grad_norm": 0.45119915336535704,
"learning_rate": 2.648211053310792e-05,
"loss": 0.1748,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17265570163726807,
"step": 2000,
"valid_targets_mean": 4349.8,
"valid_targets_min": 274
},
{
"epoch": 3.197767145135566,
"grad_norm": 0.5099187438099473,
"learning_rate": 2.6406818656317654e-05,
"loss": 0.176,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18631012737751007,
"step": 2005,
"valid_targets_mean": 5041.1,
"valid_targets_min": 186
},
{
"epoch": 3.2057416267942584,
"grad_norm": 0.43152334301712886,
"learning_rate": 2.6331425461337557e-05,
"loss": 0.1785,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20323804020881653,
"step": 2010,
"valid_targets_mean": 5194.4,
"valid_targets_min": 363
},
{
"epoch": 3.2137161084529504,
"grad_norm": 0.5058093159841838,
"learning_rate": 2.6255932140444546e-05,
"loss": 0.1807,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1969982385635376,
"step": 2015,
"valid_targets_mean": 4715.8,
"valid_targets_min": 564
},
{
"epoch": 3.221690590111643,
"grad_norm": 0.5417933534703635,
"learning_rate": 2.618033988749895e-05,
"loss": 0.1774,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17095516622066498,
"step": 2020,
"valid_targets_mean": 5090.6,
"valid_targets_min": 549
},
{
"epoch": 3.229665071770335,
"grad_norm": 0.5215923504113277,
"learning_rate": 2.6104649897925622e-05,
"loss": 0.1812,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18847623467445374,
"step": 2025,
"valid_targets_mean": 4847.3,
"valid_targets_min": 250
},
{
"epoch": 3.237639553429027,
"grad_norm": 0.4854778649654015,
"learning_rate": 2.602886336869503e-05,
"loss": 0.1845,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18689140677452087,
"step": 2030,
"valid_targets_mean": 4723.2,
"valid_targets_min": 696
},
{
"epoch": 3.245614035087719,
"grad_norm": 0.41371731832822933,
"learning_rate": 2.595298149830433e-05,
"loss": 0.1725,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.168317049741745,
"step": 2035,
"valid_targets_mean": 5431.8,
"valid_targets_min": 449
},
{
"epoch": 3.2535885167464116,
"grad_norm": 0.4766656293066071,
"learning_rate": 2.5877005486758424e-05,
"loss": 0.1788,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16988810896873474,
"step": 2040,
"valid_targets_mean": 4498.4,
"valid_targets_min": 259
},
{
"epoch": 3.2615629984051036,
"grad_norm": 0.4657699021786932,
"learning_rate": 2.5800936535550954e-05,
"loss": 0.1811,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19996368885040283,
"step": 2045,
"valid_targets_mean": 5065.3,
"valid_targets_min": 389
},
{
"epoch": 3.269537480063796,
"grad_norm": 0.579537992120868,
"learning_rate": 2.5724775847645345e-05,
"loss": 0.1866,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1846703290939331,
"step": 2050,
"valid_targets_mean": 3962.0,
"valid_targets_min": 356
},
{
"epoch": 3.277511961722488,
"grad_norm": 0.43962432468601853,
"learning_rate": 2.5648524627455738e-05,
"loss": 0.1696,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17168590426445007,
"step": 2055,
"valid_targets_mean": 4880.3,
"valid_targets_min": 241
},
{
"epoch": 3.2854864433811803,
"grad_norm": 0.43976364075492486,
"learning_rate": 2.557218408082798e-05,
"loss": 0.1633,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17411866784095764,
"step": 2060,
"valid_targets_mean": 5362.1,
"valid_targets_min": 842
},
{
"epoch": 3.2934609250398723,
"grad_norm": 0.4166736194901456,
"learning_rate": 2.5495755415020504e-05,
"loss": 0.1835,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17816022038459778,
"step": 2065,
"valid_targets_mean": 5734.4,
"valid_targets_min": 905
},
{
"epoch": 3.3014354066985647,
"grad_norm": 0.4697125475765612,
"learning_rate": 2.5419239838685325e-05,
"loss": 0.185,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1751966029405594,
"step": 2070,
"valid_targets_mean": 4562.7,
"valid_targets_min": 285
},
{
"epoch": 3.3094098883572567,
"grad_norm": 0.4671449458327588,
"learning_rate": 2.5342638561848817e-05,
"loss": 0.1792,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16543221473693848,
"step": 2075,
"valid_targets_mean": 4974.4,
"valid_targets_min": 226
},
{
"epoch": 3.317384370015949,
"grad_norm": 0.40997152428438766,
"learning_rate": 2.526595279589265e-05,
"loss": 0.1721,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1541728526353836,
"step": 2080,
"valid_targets_mean": 4638.1,
"valid_targets_min": 226
},
{
"epoch": 3.325358851674641,
"grad_norm": 0.4771138092691609,
"learning_rate": 2.5189183753534634e-05,
"loss": 0.1837,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1681135892868042,
"step": 2085,
"valid_targets_mean": 4536.9,
"valid_targets_min": 210
},
{
"epoch": 3.3333333333333335,
"grad_norm": 0.43928713346598164,
"learning_rate": 2.5112332648809495e-05,
"loss": 0.1681,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14815892279148102,
"step": 2090,
"valid_targets_mean": 5117.4,
"valid_targets_min": 229
},
{
"epoch": 3.3413078149920254,
"grad_norm": 0.4313014172799839,
"learning_rate": 2.503540069704973e-05,
"loss": 0.1772,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17248690128326416,
"step": 2095,
"valid_targets_mean": 4849.8,
"valid_targets_min": 241
},
{
"epoch": 3.349282296650718,
"grad_norm": 0.4133044248197675,
"learning_rate": 2.4958389114866326e-05,
"loss": 0.1712,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17558759450912476,
"step": 2100,
"valid_targets_mean": 5708.4,
"valid_targets_min": 266
},
{
"epoch": 3.35725677830941,
"grad_norm": 0.4626815305223826,
"learning_rate": 2.488129912012958e-05,
"loss": 0.1806,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18145158886909485,
"step": 2105,
"valid_targets_mean": 5372.7,
"valid_targets_min": 290
},
{
"epoch": 3.3652312599681022,
"grad_norm": 0.5376199276841933,
"learning_rate": 2.4804131931949823e-05,
"loss": 0.1848,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20464350283145905,
"step": 2110,
"valid_targets_mean": 3939.8,
"valid_targets_min": 471
},
{
"epoch": 3.373205741626794,
"grad_norm": 0.39017410377798123,
"learning_rate": 2.4726888770658103e-05,
"loss": 0.1717,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16700437664985657,
"step": 2115,
"valid_targets_mean": 6394.6,
"valid_targets_min": 239
},
{
"epoch": 3.3811802232854866,
"grad_norm": 0.4501347693294624,
"learning_rate": 2.4649570857786928e-05,
"loss": 0.1804,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18887585401535034,
"step": 2120,
"valid_targets_mean": 5312.3,
"valid_targets_min": 257
},
{
"epoch": 3.3891547049441786,
"grad_norm": 0.3953602084293926,
"learning_rate": 2.4572179416050953e-05,
"loss": 0.1792,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16343992948532104,
"step": 2125,
"valid_targets_mean": 5817.3,
"valid_targets_min": 243
},
{
"epoch": 3.397129186602871,
"grad_norm": 0.5007835737617361,
"learning_rate": 2.449471566932761e-05,
"loss": 0.1856,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17662839591503143,
"step": 2130,
"valid_targets_mean": 4295.5,
"valid_targets_min": 226
},
{
"epoch": 3.405103668261563,
"grad_norm": 0.4957544588950391,
"learning_rate": 2.4417180842637764e-05,
"loss": 0.1749,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17977860569953918,
"step": 2135,
"valid_targets_mean": 3976.7,
"valid_targets_min": 194
},
{
"epoch": 3.4130781499202554,
"grad_norm": 0.38831190373740015,
"learning_rate": 2.4339576162126362e-05,
"loss": 0.1686,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16816681623458862,
"step": 2140,
"valid_targets_mean": 5675.8,
"valid_targets_min": 319
},
{
"epoch": 3.4210526315789473,
"grad_norm": 0.9616520701738128,
"learning_rate": 2.4261902855043027e-05,
"loss": 0.1753,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17975673079490662,
"step": 2145,
"valid_targets_mean": 4098.2,
"valid_targets_min": 603
},
{
"epoch": 3.4290271132376393,
"grad_norm": 0.4782879314316972,
"learning_rate": 2.418416214972265e-05,
"loss": 0.186,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17841896414756775,
"step": 2150,
"valid_targets_mean": 4659.6,
"valid_targets_min": 223
},
{
"epoch": 3.4370015948963317,
"grad_norm": 0.4811275110351178,
"learning_rate": 2.4106355275565937e-05,
"loss": 0.1706,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17591729760169983,
"step": 2155,
"valid_targets_mean": 4179.1,
"valid_targets_min": 238
},
{
"epoch": 3.444976076555024,
"grad_norm": 0.3982427739209225,
"learning_rate": 2.4028483463020053e-05,
"loss": 0.1743,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15703259408473969,
"step": 2160,
"valid_targets_mean": 5950.8,
"valid_targets_min": 3447
},
{
"epoch": 3.452950558213716,
"grad_norm": 0.4924681333200768,
"learning_rate": 2.3950547943559056e-05,
"loss": 0.1721,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16207414865493774,
"step": 2165,
"valid_targets_mean": 5059.4,
"valid_targets_min": 244
},
{
"epoch": 3.460925039872408,
"grad_norm": 0.4085937153688259,
"learning_rate": 2.3872549949664493e-05,
"loss": 0.1785,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17049971222877502,
"step": 2170,
"valid_targets_mean": 5347.9,
"valid_targets_min": 283
},
{
"epoch": 3.4688995215311005,
"grad_norm": 0.4421895807116598,
"learning_rate": 2.3794490714805897e-05,
"loss": 0.1826,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17558689415454865,
"step": 2175,
"valid_targets_mean": 5187.2,
"valid_targets_min": 381
},
{
"epoch": 3.476874003189793,
"grad_norm": 0.419246164689495,
"learning_rate": 2.3716371473421242e-05,
"loss": 0.1803,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20042678713798523,
"step": 2180,
"valid_targets_mean": 5921.3,
"valid_targets_min": 705
},
{
"epoch": 3.484848484848485,
"grad_norm": 0.4534306165338507,
"learning_rate": 2.36381934608975e-05,
"loss": 0.1808,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17749859392642975,
"step": 2185,
"valid_targets_mean": 5067.5,
"valid_targets_min": 230
},
{
"epoch": 3.492822966507177,
"grad_norm": 0.5306038480542064,
"learning_rate": 2.3559957913551014e-05,
"loss": 0.1767,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18456803262233734,
"step": 2190,
"valid_targets_mean": 5680.9,
"valid_targets_min": 237
},
{
"epoch": 3.5007974481658692,
"grad_norm": 0.49172607407811136,
"learning_rate": 2.3481666068607994e-05,
"loss": 0.1818,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1954020857810974,
"step": 2195,
"valid_targets_mean": 4640.9,
"valid_targets_min": 357
},
{
"epoch": 3.5087719298245617,
"grad_norm": 0.41516895750937666,
"learning_rate": 2.3403319164184986e-05,
"loss": 0.1794,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15638519823551178,
"step": 2200,
"valid_targets_mean": 5532.4,
"valid_targets_min": 958
},
{
"epoch": 3.5167464114832536,
"grad_norm": 0.4251311303323281,
"learning_rate": 2.3324918439269206e-05,
"loss": 0.1783,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1633860468864441,
"step": 2205,
"valid_targets_mean": 5711.6,
"valid_targets_min": 3042
},
{
"epoch": 3.5247208931419456,
"grad_norm": 0.41401228714505406,
"learning_rate": 2.3246465133699024e-05,
"loss": 0.1724,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15223251283168793,
"step": 2210,
"valid_targets_mean": 5461.5,
"valid_targets_min": 1728
},
{
"epoch": 3.532695374800638,
"grad_norm": 0.43338985811687897,
"learning_rate": 2.31679604881443e-05,
"loss": 0.1881,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23456290364265442,
"step": 2215,
"valid_targets_mean": 6196.2,
"valid_targets_min": 234
},
{
"epoch": 3.5406698564593304,
"grad_norm": 0.4391172774731024,
"learning_rate": 2.3089405744086823e-05,
"loss": 0.1807,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16365471482276917,
"step": 2220,
"valid_targets_mean": 4690.2,
"valid_targets_min": 237
},
{
"epoch": 3.5486443381180224,
"grad_norm": 0.41279470884015235,
"learning_rate": 2.3010802143800626e-05,
"loss": 0.1673,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17660290002822876,
"step": 2225,
"valid_targets_mean": 5499.1,
"valid_targets_min": 255
},
{
"epoch": 3.5566188197767143,
"grad_norm": 0.4616887719700764,
"learning_rate": 2.2932150930332363e-05,
"loss": 0.1808,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1628832221031189,
"step": 2230,
"valid_targets_mean": 4519.4,
"valid_targets_min": 236
},
{
"epoch": 3.5645933014354068,
"grad_norm": 0.4143421206391745,
"learning_rate": 2.2853453347481635e-05,
"loss": 0.1806,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17244276404380798,
"step": 2235,
"valid_targets_mean": 5402.8,
"valid_targets_min": 227
},
{
"epoch": 3.5725677830940987,
"grad_norm": 0.4491746905194006,
"learning_rate": 2.277471063978137e-05,
"loss": 0.1872,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15876632928848267,
"step": 2240,
"valid_targets_mean": 4808.6,
"valid_targets_min": 231
},
{
"epoch": 3.580542264752791,
"grad_norm": 0.5060019043175118,
"learning_rate": 2.2695924052478065e-05,
"loss": 0.1723,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17421862483024597,
"step": 2245,
"valid_targets_mean": 4258.2,
"valid_targets_min": 260
},
{
"epoch": 3.588516746411483,
"grad_norm": 0.41387766339051296,
"learning_rate": 2.2617094831512167e-05,
"loss": 0.1765,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17327752709388733,
"step": 2250,
"valid_targets_mean": 6265.3,
"valid_targets_min": 2950
},
{
"epoch": 3.5964912280701755,
"grad_norm": 0.4611729813954408,
"learning_rate": 2.253822422349831e-05,
"loss": 0.1805,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1817869246006012,
"step": 2255,
"valid_targets_mean": 4701.2,
"valid_targets_min": 397
},
{
"epoch": 3.6044657097288675,
"grad_norm": 0.43026115082741934,
"learning_rate": 2.2459313475705645e-05,
"loss": 0.1748,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1769014596939087,
"step": 2260,
"valid_targets_mean": 5325.2,
"valid_targets_min": 205
},
{
"epoch": 3.61244019138756,
"grad_norm": 0.5249375671075871,
"learning_rate": 2.23803638360381e-05,
"loss": 0.1838,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18358995020389557,
"step": 2265,
"valid_targets_mean": 3656.4,
"valid_targets_min": 199
},
{
"epoch": 3.620414673046252,
"grad_norm": 0.4541299825413091,
"learning_rate": 2.2301376553014625e-05,
"loss": 0.1812,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1612316220998764,
"step": 2270,
"valid_targets_mean": 4446.9,
"valid_targets_min": 245
},
{
"epoch": 3.6283891547049443,
"grad_norm": 0.5119351564216902,
"learning_rate": 2.2222352875749493e-05,
"loss": 0.1797,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19726499915122986,
"step": 2275,
"valid_targets_mean": 5226.8,
"valid_targets_min": 395
},
{
"epoch": 3.6363636363636362,
"grad_norm": 0.4597152452341196,
"learning_rate": 2.214329405393249e-05,
"loss": 0.1721,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1666208803653717,
"step": 2280,
"valid_targets_mean": 4824.7,
"valid_targets_min": 1500
},
{
"epoch": 3.6443381180223287,
"grad_norm": 0.41930922950793337,
"learning_rate": 2.2064201337809212e-05,
"loss": 0.1704,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17563220858573914,
"step": 2285,
"valid_targets_mean": 5103.7,
"valid_targets_min": 2380
},
{
"epoch": 3.6523125996810206,
"grad_norm": 0.551536941032092,
"learning_rate": 2.1985075978161236e-05,
"loss": 0.1731,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1810903698205948,
"step": 2290,
"valid_targets_mean": 4225.5,
"valid_targets_min": 238
},
{
"epoch": 3.660287081339713,
"grad_norm": 0.46416383882322815,
"learning_rate": 2.1905919226286385e-05,
"loss": 0.1836,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1780536025762558,
"step": 2295,
"valid_targets_mean": 4323.2,
"valid_targets_min": 349
},
{
"epoch": 3.668261562998405,
"grad_norm": 0.4379742235735547,
"learning_rate": 2.1826732333978924e-05,
"loss": 0.1733,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1874227225780487,
"step": 2300,
"valid_targets_mean": 4977.4,
"valid_targets_min": 236
},
{
"epoch": 3.6762360446570974,
"grad_norm": 0.4619563699283561,
"learning_rate": 2.1747516553509755e-05,
"loss": 0.183,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17133791744709015,
"step": 2305,
"valid_targets_mean": 4711.6,
"valid_targets_min": 245
},
{
"epoch": 3.6842105263157894,
"grad_norm": 0.489064170185469,
"learning_rate": 2.166827313760662e-05,
"loss": 0.1765,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1689237505197525,
"step": 2310,
"valid_targets_mean": 4220.6,
"valid_targets_min": 358
},
{
"epoch": 3.692185007974482,
"grad_norm": 0.44106248237446816,
"learning_rate": 2.1589003339434292e-05,
"loss": 0.1692,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1686490774154663,
"step": 2315,
"valid_targets_mean": 4874.4,
"valid_targets_min": 216
},
{
"epoch": 3.7001594896331738,
"grad_norm": 0.44652285565230415,
"learning_rate": 2.150970841257476e-05,
"loss": 0.1722,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18092358112335205,
"step": 2320,
"valid_targets_mean": 4935.1,
"valid_targets_min": 242
},
{
"epoch": 3.708133971291866,
"grad_norm": 0.41008613997039367,
"learning_rate": 2.1430389611007393e-05,
"loss": 0.1727,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1724787950515747,
"step": 2325,
"valid_targets_mean": 5347.4,
"valid_targets_min": 306
},
{
"epoch": 3.716108452950558,
"grad_norm": 0.4552446615706991,
"learning_rate": 2.135104818908913e-05,
"loss": 0.1812,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17449814081192017,
"step": 2330,
"valid_targets_mean": 5358.0,
"valid_targets_min": 258
},
{
"epoch": 3.7240829346092506,
"grad_norm": 0.5705362385621706,
"learning_rate": 2.1271685401534617e-05,
"loss": 0.1702,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17245930433273315,
"step": 2335,
"valid_targets_mean": 5281.9,
"valid_targets_min": 252
},
{
"epoch": 3.7320574162679425,
"grad_norm": 0.45629997713629283,
"learning_rate": 2.11923025033964e-05,
"loss": 0.1787,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18641863763332367,
"step": 2340,
"valid_targets_mean": 4875.7,
"valid_targets_min": 244
},
{
"epoch": 3.740031897926635,
"grad_norm": 0.5004011387408458,
"learning_rate": 2.111290075004503e-05,
"loss": 0.1702,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1716715544462204,
"step": 2345,
"valid_targets_mean": 3934.6,
"valid_targets_min": 242
},
{
"epoch": 3.748006379585327,
"grad_norm": 0.46246492036373593,
"learning_rate": 2.103348139714925e-05,
"loss": 0.1797,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1724526733160019,
"step": 2350,
"valid_targets_mean": 4492.5,
"valid_targets_min": 238
},
{
"epoch": 3.7559808612440193,
"grad_norm": 0.5448173548752107,
"learning_rate": 2.0954045700656126e-05,
"loss": 0.1844,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17832358181476593,
"step": 2355,
"valid_targets_mean": 3425.9,
"valid_targets_min": 205
},
{
"epoch": 3.7639553429027113,
"grad_norm": 0.5015418002105231,
"learning_rate": 2.0874594916771174e-05,
"loss": 0.1756,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18966464698314667,
"step": 2360,
"valid_targets_mean": 4649.9,
"valid_targets_min": 428
},
{
"epoch": 3.7719298245614032,
"grad_norm": 0.4569286157077601,
"learning_rate": 2.079513030193852e-05,
"loss": 0.176,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15085861086845398,
"step": 2365,
"valid_targets_mean": 4497.1,
"valid_targets_min": 650
},
{
"epoch": 3.7799043062200957,
"grad_norm": 0.5131210924769427,
"learning_rate": 2.071565311282099e-05,
"loss": 0.1745,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16978487372398376,
"step": 2370,
"valid_targets_mean": 3804.6,
"valid_targets_min": 255
},
{
"epoch": 3.787878787878788,
"grad_norm": 0.4053676310724288,
"learning_rate": 2.063616460628029e-05,
"loss": 0.1798,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1770038604736328,
"step": 2375,
"valid_targets_mean": 5768.6,
"valid_targets_min": 227
},
{
"epoch": 3.79585326953748,
"grad_norm": 0.4533781362163844,
"learning_rate": 2.0556666039357084e-05,
"loss": 0.1764,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17858347296714783,
"step": 2380,
"valid_targets_mean": 5566.5,
"valid_targets_min": 252
},
{
"epoch": 3.803827751196172,
"grad_norm": 0.4188217594597362,
"learning_rate": 2.047715866925113e-05,
"loss": 0.1786,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18884845077991486,
"step": 2385,
"valid_targets_mean": 5425.9,
"valid_targets_min": 259
},
{
"epoch": 3.8118022328548644,
"grad_norm": 0.4764124493876062,
"learning_rate": 2.0397643753301403e-05,
"loss": 0.1749,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16345086693763733,
"step": 2390,
"valid_targets_mean": 5698.1,
"valid_targets_min": 286
},
{
"epoch": 3.819776714513557,
"grad_norm": 0.48932350458239837,
"learning_rate": 2.0318122548966225e-05,
"loss": 0.1733,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17059862613677979,
"step": 2395,
"valid_targets_mean": 4492.2,
"valid_targets_min": 427
},
{
"epoch": 3.827751196172249,
"grad_norm": 0.4210708424627556,
"learning_rate": 2.0238596313803337e-05,
"loss": 0.1834,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16127406060695648,
"step": 2400,
"valid_targets_mean": 6233.4,
"valid_targets_min": 4329
},
{
"epoch": 3.8357256778309408,
"grad_norm": 0.46048380449758947,
"learning_rate": 2.015906630545005e-05,
"loss": 0.1731,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19462665915489197,
"step": 2405,
"valid_targets_mean": 4631.4,
"valid_targets_min": 409
},
{
"epoch": 3.843700159489633,
"grad_norm": 0.42862173152229316,
"learning_rate": 2.0079533781603352e-05,
"loss": 0.1756,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18994180858135223,
"step": 2410,
"valid_targets_mean": 4918.5,
"valid_targets_min": 332
},
{
"epoch": 3.8516746411483256,
"grad_norm": 0.5010059874905928,
"learning_rate": 2e-05,
"loss": 0.1844,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20106858015060425,
"step": 2415,
"valid_targets_mean": 4281.1,
"valid_targets_min": 262
},
{
"epoch": 3.8596491228070176,
"grad_norm": 0.4072491507266973,
"learning_rate": 1.9920466218396655e-05,
"loss": 0.1761,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16354908049106598,
"step": 2420,
"valid_targets_mean": 4883.2,
"valid_targets_min": 245
},
{
"epoch": 3.8676236044657095,
"grad_norm": 0.4810942686183941,
"learning_rate": 1.9840933694549956e-05,
"loss": 0.1837,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18778419494628906,
"step": 2425,
"valid_targets_mean": 4466.9,
"valid_targets_min": 240
},
{
"epoch": 3.875598086124402,
"grad_norm": 0.4057684960139382,
"learning_rate": 1.976140368619667e-05,
"loss": 0.1713,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1536000519990921,
"step": 2430,
"valid_targets_mean": 5985.8,
"valid_targets_min": 244
},
{
"epoch": 3.8835725677830943,
"grad_norm": 0.4211890086346668,
"learning_rate": 1.9681877451033778e-05,
"loss": 0.1789,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17464828491210938,
"step": 2435,
"valid_targets_mean": 5423.5,
"valid_targets_min": 373
},
{
"epoch": 3.8915470494417863,
"grad_norm": 0.47758132116301366,
"learning_rate": 1.9602356246698597e-05,
"loss": 0.1881,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19579948484897614,
"step": 2440,
"valid_targets_mean": 4473.9,
"valid_targets_min": 211
},
{
"epoch": 3.8995215311004783,
"grad_norm": 0.43785459648367925,
"learning_rate": 1.9522841330748877e-05,
"loss": 0.1714,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16913919150829315,
"step": 2445,
"valid_targets_mean": 5518.2,
"valid_targets_min": 876
},
{
"epoch": 3.9074960127591707,
"grad_norm": 0.4718315228758523,
"learning_rate": 1.944333396064292e-05,
"loss": 0.1763,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16812896728515625,
"step": 2450,
"valid_targets_mean": 4544.7,
"valid_targets_min": 228
},
{
"epoch": 3.915470494417863,
"grad_norm": 0.41246881276557107,
"learning_rate": 1.936383539371971e-05,
"loss": 0.1774,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.186811625957489,
"step": 2455,
"valid_targets_mean": 5773.6,
"valid_targets_min": 244
},
{
"epoch": 3.923444976076555,
"grad_norm": 0.4236112780842354,
"learning_rate": 1.9284346887179016e-05,
"loss": 0.1748,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1823834776878357,
"step": 2460,
"valid_targets_mean": 5392.7,
"valid_targets_min": 269
},
{
"epoch": 3.931419457735247,
"grad_norm": 0.48575329642988746,
"learning_rate": 1.9204869698061493e-05,
"loss": 0.1741,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17913323640823364,
"step": 2465,
"valid_targets_mean": 4545.8,
"valid_targets_min": 189
},
{
"epoch": 3.9393939393939394,
"grad_norm": 0.4391863078677367,
"learning_rate": 1.9125405083228833e-05,
"loss": 0.1893,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18172624707221985,
"step": 2470,
"valid_targets_mean": 5295.9,
"valid_targets_min": 250
},
{
"epoch": 3.9473684210526314,
"grad_norm": 0.43686870532771416,
"learning_rate": 1.9045954299343884e-05,
"loss": 0.1892,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18156322836875916,
"step": 2475,
"valid_targets_mean": 5534.2,
"valid_targets_min": 735
},
{
"epoch": 3.955342902711324,
"grad_norm": 0.4410672277323973,
"learning_rate": 1.896651860285076e-05,
"loss": 0.1782,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16273203492164612,
"step": 2480,
"valid_targets_mean": 5046.9,
"valid_targets_min": 244
},
{
"epoch": 3.963317384370016,
"grad_norm": 0.4379301215701126,
"learning_rate": 1.8887099249954976e-05,
"loss": 0.1868,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18227660655975342,
"step": 2485,
"valid_targets_mean": 5287.8,
"valid_targets_min": 1155
},
{
"epoch": 3.971291866028708,
"grad_norm": 0.41662085884964606,
"learning_rate": 1.8807697496603604e-05,
"loss": 0.171,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1678864061832428,
"step": 2490,
"valid_targets_mean": 5324.2,
"valid_targets_min": 445
},
{
"epoch": 3.9792663476874,
"grad_norm": 0.4373979648967585,
"learning_rate": 1.8728314598465386e-05,
"loss": 0.1731,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18611688911914825,
"step": 2495,
"valid_targets_mean": 5373.3,
"valid_targets_min": 382
},
{
"epoch": 3.9872408293460926,
"grad_norm": 0.457053493882227,
"learning_rate": 1.8648951810910878e-05,
"loss": 0.1798,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1983267068862915,
"step": 2500,
"valid_targets_mean": 5981.6,
"valid_targets_min": 342
},
{
"epoch": 3.9952153110047846,
"grad_norm": 0.43207203226320035,
"learning_rate": 1.856961038899261e-05,
"loss": 0.1737,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1594964861869812,
"step": 2505,
"valid_targets_mean": 4767.2,
"valid_targets_min": 248
},
{
"epoch": 4.003189792663477,
"grad_norm": 0.44162771304729975,
"learning_rate": 1.849029158742525e-05,
"loss": 0.1662,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17399078607559204,
"step": 2510,
"valid_targets_mean": 4869.1,
"valid_targets_min": 259
},
{
"epoch": 4.011164274322169,
"grad_norm": 0.4100149325744668,
"learning_rate": 1.8410996660565714e-05,
"loss": 0.167,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16074588894844055,
"step": 2515,
"valid_targets_mean": 5768.7,
"valid_targets_min": 495
},
{
"epoch": 4.019138755980861,
"grad_norm": 0.4871133329160863,
"learning_rate": 1.8331726862393385e-05,
"loss": 0.1723,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16799892485141754,
"step": 2520,
"valid_targets_mean": 5172.4,
"valid_targets_min": 980
},
{
"epoch": 4.027113237639553,
"grad_norm": 0.46342804287893813,
"learning_rate": 1.8252483446490245e-05,
"loss": 0.1701,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1649300903081894,
"step": 2525,
"valid_targets_mean": 5258.1,
"valid_targets_min": 226
},
{
"epoch": 4.035087719298246,
"grad_norm": 0.4888182281978054,
"learning_rate": 1.8173267666021075e-05,
"loss": 0.1685,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13286834955215454,
"step": 2530,
"valid_targets_mean": 3738.4,
"valid_targets_min": 225
},
{
"epoch": 4.043062200956938,
"grad_norm": 0.439511550487397,
"learning_rate": 1.8094080773713615e-05,
"loss": 0.1647,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16421306133270264,
"step": 2535,
"valid_targets_mean": 5328.5,
"valid_targets_min": 248
},
{
"epoch": 4.05103668261563,
"grad_norm": 0.39916496188969774,
"learning_rate": 1.8014924021838774e-05,
"loss": 0.1624,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19473597407341003,
"step": 2540,
"valid_targets_mean": 6501.2,
"valid_targets_min": 798
},
{
"epoch": 4.059011164274322,
"grad_norm": 0.45532784154246636,
"learning_rate": 1.7935798662190798e-05,
"loss": 0.1671,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18312832713127136,
"step": 2545,
"valid_targets_mean": 5164.4,
"valid_targets_min": 1592
},
{
"epoch": 4.0669856459330145,
"grad_norm": 0.39457706368906487,
"learning_rate": 1.785670594606752e-05,
"loss": 0.1632,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14157655835151672,
"step": 2550,
"valid_targets_mean": 5789.8,
"valid_targets_min": 241
},
{
"epoch": 4.074960127591707,
"grad_norm": 0.44152278033105163,
"learning_rate": 1.777764712425052e-05,
"loss": 0.1627,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16815263032913208,
"step": 2555,
"valid_targets_mean": 5426.9,
"valid_targets_min": 362
},
{
"epoch": 4.082934609250398,
"grad_norm": 0.4297478681585869,
"learning_rate": 1.7698623446985378e-05,
"loss": 0.1646,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1471405178308487,
"step": 2560,
"valid_targets_mean": 5570.6,
"valid_targets_min": 221
},
{
"epoch": 4.090909090909091,
"grad_norm": 0.443891814693673,
"learning_rate": 1.7619636163961907e-05,
"loss": 0.162,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15766510367393494,
"step": 2565,
"valid_targets_mean": 5007.6,
"valid_targets_min": 243
},
{
"epoch": 4.098883572567783,
"grad_norm": 0.6970765377465047,
"learning_rate": 1.754068652429436e-05,
"loss": 0.1604,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15241992473602295,
"step": 2570,
"valid_targets_mean": 4964.9,
"valid_targets_min": 257
},
{
"epoch": 4.106858054226476,
"grad_norm": 0.5016042784027481,
"learning_rate": 1.74617757765017e-05,
"loss": 0.1696,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15563294291496277,
"step": 2575,
"valid_targets_mean": 4340.1,
"valid_targets_min": 200
},
{
"epoch": 4.114832535885167,
"grad_norm": 0.4424438379039299,
"learning_rate": 1.738290516848784e-05,
"loss": 0.1683,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17813259363174438,
"step": 2580,
"valid_targets_mean": 5369.1,
"valid_targets_min": 251
},
{
"epoch": 4.12280701754386,
"grad_norm": 0.45797415814975423,
"learning_rate": 1.730407594752194e-05,
"loss": 0.1627,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16528105735778809,
"step": 2585,
"valid_targets_mean": 5390.3,
"valid_targets_min": 269
},
{
"epoch": 4.130781499202552,
"grad_norm": 0.5111816555204367,
"learning_rate": 1.722528936021864e-05,
"loss": 0.165,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1601203978061676,
"step": 2590,
"valid_targets_mean": 3531.6,
"valid_targets_min": 315
},
{
"epoch": 4.138755980861244,
"grad_norm": 0.3767954932539586,
"learning_rate": 1.714654665251837e-05,
"loss": 0.1704,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1518028825521469,
"step": 2595,
"valid_targets_mean": 6542.2,
"valid_targets_min": 1157
},
{
"epoch": 4.146730462519936,
"grad_norm": 0.46197127874950683,
"learning_rate": 1.7067849069667644e-05,
"loss": 0.1679,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1635223627090454,
"step": 2600,
"valid_targets_mean": 4890.6,
"valid_targets_min": 538
},
{
"epoch": 4.154704944178628,
"grad_norm": 0.590965129504492,
"learning_rate": 1.6989197856199377e-05,
"loss": 0.1627,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14913973212242126,
"step": 2605,
"valid_targets_mean": 5326.4,
"valid_targets_min": 255
},
{
"epoch": 4.162679425837321,
"grad_norm": 0.4398420111040478,
"learning_rate": 1.6910594255913177e-05,
"loss": 0.1611,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16554518043994904,
"step": 2610,
"valid_targets_mean": 5232.0,
"valid_targets_min": 911
},
{
"epoch": 4.170653907496013,
"grad_norm": 1.2896108249705025,
"learning_rate": 1.6832039511855702e-05,
"loss": 0.1641,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1797063648700714,
"step": 2615,
"valid_targets_mean": 4964.2,
"valid_targets_min": 252
},
{
"epoch": 4.178628389154705,
"grad_norm": 0.4916215767968524,
"learning_rate": 1.6753534866300983e-05,
"loss": 0.1618,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.162457674741745,
"step": 2620,
"valid_targets_mean": 4723.4,
"valid_targets_min": 525
},
{
"epoch": 4.186602870813397,
"grad_norm": 0.436093385151016,
"learning_rate": 1.6675081560730804e-05,
"loss": 0.1672,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1415684074163437,
"step": 2625,
"valid_targets_mean": 4707.8,
"valid_targets_min": 245
},
{
"epoch": 4.1945773524720895,
"grad_norm": 0.3767766840818539,
"learning_rate": 1.6596680835815024e-05,
"loss": 0.1628,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15540149807929993,
"step": 2630,
"valid_targets_mean": 7057.1,
"valid_targets_min": 4854
},
{
"epoch": 4.202551834130782,
"grad_norm": 0.5066458024848639,
"learning_rate": 1.651833393139201e-05,
"loss": 0.1641,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16125883162021637,
"step": 2635,
"valid_targets_mean": 3526.9,
"valid_targets_min": 238
},
{
"epoch": 4.2105263157894735,
"grad_norm": 0.4523713268939122,
"learning_rate": 1.6440042086449e-05,
"loss": 0.169,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16887378692626953,
"step": 2640,
"valid_targets_mean": 5442.1,
"valid_targets_min": 1251
},
{
"epoch": 4.218500797448166,
"grad_norm": 0.4669348386422092,
"learning_rate": 1.6361806539102508e-05,
"loss": 0.1691,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16306337714195251,
"step": 2645,
"valid_targets_mean": 5191.7,
"valid_targets_min": 232
},
{
"epoch": 4.226475279106858,
"grad_norm": 0.44072670778662126,
"learning_rate": 1.628362852657876e-05,
"loss": 0.1595,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1595107614994049,
"step": 2650,
"valid_targets_mean": 5289.1,
"valid_targets_min": 377
},
{
"epoch": 4.23444976076555,
"grad_norm": 0.4181461806366608,
"learning_rate": 1.620550928519411e-05,
"loss": 0.1577,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15849584341049194,
"step": 2655,
"valid_targets_mean": 4996.6,
"valid_targets_min": 378
},
{
"epoch": 4.242424242424242,
"grad_norm": 0.43195277822271283,
"learning_rate": 1.612745005033551e-05,
"loss": 0.1672,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16953721642494202,
"step": 2660,
"valid_targets_mean": 5369.8,
"valid_targets_min": 243
},
{
"epoch": 4.250398724082935,
"grad_norm": 0.41229933540536656,
"learning_rate": 1.6049452056440948e-05,
"loss": 0.1676,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17528899013996124,
"step": 2665,
"valid_targets_mean": 6492.4,
"valid_targets_min": 3730
},
{
"epoch": 4.258373205741627,
"grad_norm": 0.4711001749394507,
"learning_rate": 1.597151653697995e-05,
"loss": 0.16,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.156410813331604,
"step": 2670,
"valid_targets_mean": 4710.2,
"valid_targets_min": 329
},
{
"epoch": 4.266347687400319,
"grad_norm": 0.42542209328206093,
"learning_rate": 1.5893644724434066e-05,
"loss": 0.1637,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16571450233459473,
"step": 2675,
"valid_targets_mean": 5378.8,
"valid_targets_min": 393
},
{
"epoch": 4.274322169059011,
"grad_norm": 0.6303378780815382,
"learning_rate": 1.581583785027736e-05,
"loss": 0.1649,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1706840693950653,
"step": 2680,
"valid_targets_mean": 4807.1,
"valid_targets_min": 235
},
{
"epoch": 4.282296650717703,
"grad_norm": 0.48966028379629584,
"learning_rate": 1.5738097144956976e-05,
"loss": 0.1607,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15253716707229614,
"step": 2685,
"valid_targets_mean": 4374.9,
"valid_targets_min": 287
},
{
"epoch": 4.290271132376396,
"grad_norm": 0.41033469363863073,
"learning_rate": 1.566042383787364e-05,
"loss": 0.1665,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15829625725746155,
"step": 2690,
"valid_targets_mean": 6175.6,
"valid_targets_min": 224
},
{
"epoch": 4.298245614035087,
"grad_norm": 0.40731073913252946,
"learning_rate": 1.558281915736224e-05,
"loss": 0.1582,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14746209979057312,
"step": 2695,
"valid_targets_mean": 5612.4,
"valid_targets_min": 245
},
{
"epoch": 4.30622009569378,
"grad_norm": 0.5078322157963522,
"learning_rate": 1.550528433067239e-05,
"loss": 0.1662,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16952064633369446,
"step": 2700,
"valid_targets_mean": 5778.9,
"valid_targets_min": 878
},
{
"epoch": 4.314194577352472,
"grad_norm": 0.5507289227344653,
"learning_rate": 1.5427820583949054e-05,
"loss": 0.157,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15994137525558472,
"step": 2705,
"valid_targets_mean": 4218.4,
"valid_targets_min": 239
},
{
"epoch": 4.3221690590111645,
"grad_norm": 0.408459346880975,
"learning_rate": 1.5350429142213075e-05,
"loss": 0.1572,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14765138924121857,
"step": 2710,
"valid_targets_mean": 5390.0,
"valid_targets_min": 272
},
{
"epoch": 4.330143540669856,
"grad_norm": 0.4621251709763953,
"learning_rate": 1.5273111229341907e-05,
"loss": 0.1633,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16809380054473877,
"step": 2715,
"valid_targets_mean": 4960.4,
"valid_targets_min": 251
},
{
"epoch": 4.3381180223285485,
"grad_norm": 0.4859821294927119,
"learning_rate": 1.5195868068050185e-05,
"loss": 0.1654,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15256614983081818,
"step": 2720,
"valid_targets_mean": 4789.8,
"valid_targets_min": 265
},
{
"epoch": 4.346092503987241,
"grad_norm": 0.44208802195312985,
"learning_rate": 1.5118700879870426e-05,
"loss": 0.1698,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16697990894317627,
"step": 2725,
"valid_targets_mean": 5019.8,
"valid_targets_min": 227
},
{
"epoch": 4.354066985645933,
"grad_norm": 0.39327145737658015,
"learning_rate": 1.5041610885133681e-05,
"loss": 0.1671,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17563647031784058,
"step": 2730,
"valid_targets_mean": 6262.4,
"valid_targets_min": 4299
},
{
"epoch": 4.362041467304625,
"grad_norm": 0.5020697131026288,
"learning_rate": 1.496459930295028e-05,
"loss": 0.1608,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.158511221408844,
"step": 2735,
"valid_targets_mean": 5749.7,
"valid_targets_min": 347
},
{
"epoch": 4.370015948963317,
"grad_norm": 0.435040583369635,
"learning_rate": 1.4887667351190508e-05,
"loss": 0.1564,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15348437428474426,
"step": 2740,
"valid_targets_mean": 5452.8,
"valid_targets_min": 866
},
{
"epoch": 4.37799043062201,
"grad_norm": 0.4713309684053475,
"learning_rate": 1.4810816246465374e-05,
"loss": 0.1678,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18029925227165222,
"step": 2745,
"valid_targets_mean": 4950.2,
"valid_targets_min": 238
},
{
"epoch": 4.385964912280702,
"grad_norm": 0.4989171949325947,
"learning_rate": 1.4734047204107358e-05,
"loss": 0.1574,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.162031888961792,
"step": 2750,
"valid_targets_mean": 5264.2,
"valid_targets_min": 797
},
{
"epoch": 4.393939393939394,
"grad_norm": 0.4481729316372481,
"learning_rate": 1.4657361438151192e-05,
"loss": 0.156,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17081616818904877,
"step": 2755,
"valid_targets_mean": 4965.4,
"valid_targets_min": 281
},
{
"epoch": 4.401913875598086,
"grad_norm": 0.5035101448803713,
"learning_rate": 1.458076016131468e-05,
"loss": 0.1644,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17901387810707092,
"step": 2760,
"valid_targets_mean": 4425.4,
"valid_targets_min": 230
},
{
"epoch": 4.409888357256778,
"grad_norm": 0.439004055065166,
"learning_rate": 1.4504244584979494e-05,
"loss": 0.1681,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1770099699497223,
"step": 2765,
"valid_targets_mean": 5970.6,
"valid_targets_min": 280
},
{
"epoch": 4.417862838915471,
"grad_norm": 0.4559810410634476,
"learning_rate": 1.442781591917203e-05,
"loss": 0.1709,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16673271358013153,
"step": 2770,
"valid_targets_mean": 5037.8,
"valid_targets_min": 342
},
{
"epoch": 4.425837320574162,
"grad_norm": 0.49141320176391684,
"learning_rate": 1.4351475372544262e-05,
"loss": 0.177,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17553502321243286,
"step": 2775,
"valid_targets_mean": 5215.1,
"valid_targets_min": 241
},
{
"epoch": 4.433811802232855,
"grad_norm": 0.4548580416328493,
"learning_rate": 1.4275224152354658e-05,
"loss": 0.1599,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15424610674381256,
"step": 2780,
"valid_targets_mean": 5256.7,
"valid_targets_min": 227
},
{
"epoch": 4.441786283891547,
"grad_norm": 0.43788067033156486,
"learning_rate": 1.4199063464449047e-05,
"loss": 0.1635,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14916040003299713,
"step": 2785,
"valid_targets_mean": 5186.2,
"valid_targets_min": 530
},
{
"epoch": 4.44976076555024,
"grad_norm": 0.4517238770171476,
"learning_rate": 1.4122994513241587e-05,
"loss": 0.1634,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15957307815551758,
"step": 2790,
"valid_targets_mean": 4431.6,
"valid_targets_min": 311
},
{
"epoch": 4.457735247208931,
"grad_norm": 0.4470813659837837,
"learning_rate": 1.4047018501695677e-05,
"loss": 0.1679,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16156211495399475,
"step": 2795,
"valid_targets_mean": 4721.2,
"valid_targets_min": 361
},
{
"epoch": 4.4657097288676235,
"grad_norm": 0.48463023071484423,
"learning_rate": 1.3971136631304978e-05,
"loss": 0.1736,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17857998609542847,
"step": 2800,
"valid_targets_mean": 4501.1,
"valid_targets_min": 721
},
{
"epoch": 4.473684210526316,
"grad_norm": 0.463251002628163,
"learning_rate": 1.3895350102074386e-05,
"loss": 0.1639,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17204450070858002,
"step": 2805,
"valid_targets_mean": 5583.7,
"valid_targets_min": 237
},
{
"epoch": 4.481658692185008,
"grad_norm": 0.43951674293696763,
"learning_rate": 1.3819660112501054e-05,
"loss": 0.1591,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15155509114265442,
"step": 2810,
"valid_targets_mean": 5825.9,
"valid_targets_min": 897
},
{
"epoch": 4.4896331738437,
"grad_norm": 0.48668589039422894,
"learning_rate": 1.3744067859555461e-05,
"loss": 0.167,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16631749272346497,
"step": 2815,
"valid_targets_mean": 4816.9,
"valid_targets_min": 250
},
{
"epoch": 4.497607655502392,
"grad_norm": 0.4474999184326488,
"learning_rate": 1.3668574538662451e-05,
"loss": 0.1627,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17684899270534515,
"step": 2820,
"valid_targets_mean": 5176.1,
"valid_targets_min": 243
},
{
"epoch": 4.505582137161085,
"grad_norm": 0.4462277446311322,
"learning_rate": 1.3593181343682353e-05,
"loss": 0.1635,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16628840565681458,
"step": 2825,
"valid_targets_mean": 5292.2,
"valid_targets_min": 309
},
{
"epoch": 4.513556618819777,
"grad_norm": 0.5107987331641045,
"learning_rate": 1.3517889466892085e-05,
"loss": 0.1605,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15675923228263855,
"step": 2830,
"valid_targets_mean": 3909.9,
"valid_targets_min": 296
},
{
"epoch": 4.521531100478469,
"grad_norm": 0.46641473919470094,
"learning_rate": 1.3442700098966326e-05,
"loss": 0.1576,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16455984115600586,
"step": 2835,
"valid_targets_mean": 4710.5,
"valid_targets_min": 298
},
{
"epoch": 4.529505582137161,
"grad_norm": 0.5015636399760796,
"learning_rate": 1.3367614428958646e-05,
"loss": 0.1605,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17463116347789764,
"step": 2840,
"valid_targets_mean": 4366.3,
"valid_targets_min": 265
},
{
"epoch": 4.5374800637958534,
"grad_norm": 0.5206414572728846,
"learning_rate": 1.3292633644282735e-05,
"loss": 0.172,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18271681666374207,
"step": 2845,
"valid_targets_mean": 4655.6,
"valid_targets_min": 237
},
{
"epoch": 4.545454545454545,
"grad_norm": 0.612470158692335,
"learning_rate": 1.3217758930693608e-05,
"loss": 0.1578,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15408973395824432,
"step": 2850,
"valid_targets_mean": 4344.2,
"valid_targets_min": 234
},
{
"epoch": 4.553429027113237,
"grad_norm": 0.38141520226279213,
"learning_rate": 1.314299147226887e-05,
"loss": 0.1555,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14755874872207642,
"step": 2855,
"valid_targets_mean": 5986.4,
"valid_targets_min": 880
},
{
"epoch": 4.56140350877193,
"grad_norm": 0.4310034608873921,
"learning_rate": 1.3068332451389969e-05,
"loss": 0.1539,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1514865756034851,
"step": 2860,
"valid_targets_mean": 6271.6,
"valid_targets_min": 4306
},
{
"epoch": 4.569377990430622,
"grad_norm": 0.4356530709450213,
"learning_rate": 1.2993783048723515e-05,
"loss": 0.1615,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15877559781074524,
"step": 2865,
"valid_targets_mean": 5407.3,
"valid_targets_min": 399
},
{
"epoch": 4.577352472089315,
"grad_norm": 0.564670837742309,
"learning_rate": 1.2919344443202602e-05,
"loss": 0.1612,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14960314333438873,
"step": 2870,
"valid_targets_mean": 3163.2,
"valid_targets_min": 218
},
{
"epoch": 4.585326953748006,
"grad_norm": 0.4785084988426857,
"learning_rate": 1.2845017812008158e-05,
"loss": 0.1628,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1763634979724884,
"step": 2875,
"valid_targets_mean": 4772.2,
"valid_targets_min": 222
},
{
"epoch": 4.5933014354066986,
"grad_norm": 0.42494589929233484,
"learning_rate": 1.277080433055034e-05,
"loss": 0.1615,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16085359454154968,
"step": 2880,
"valid_targets_mean": 5689.2,
"valid_targets_min": 225
},
{
"epoch": 4.601275917065391,
"grad_norm": 0.47807251510580745,
"learning_rate": 1.2696705172449944e-05,
"loss": 0.1578,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15512213110923767,
"step": 2885,
"valid_targets_mean": 4743.9,
"valid_targets_min": 185
},
{
"epoch": 4.6092503987240825,
"grad_norm": 0.45580307365244943,
"learning_rate": 1.2622721509519846e-05,
"loss": 0.1674,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17423364520072937,
"step": 2890,
"valid_targets_mean": 4932.5,
"valid_targets_min": 373
},
{
"epoch": 4.617224880382775,
"grad_norm": 0.5794992528529187,
"learning_rate": 1.2548854511746461e-05,
"loss": 0.1649,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17313656210899353,
"step": 2895,
"valid_targets_mean": 4594.8,
"valid_targets_min": 223
},
{
"epoch": 4.625199362041467,
"grad_norm": 0.4094555332819473,
"learning_rate": 1.247510534727125e-05,
"loss": 0.1663,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15635088086128235,
"step": 2900,
"valid_targets_mean": 5626.6,
"valid_targets_min": 414
},
{
"epoch": 4.63317384370016,
"grad_norm": 0.4677979868665022,
"learning_rate": 1.240147518237224e-05,
"loss": 0.1615,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1597626507282257,
"step": 2905,
"valid_targets_mean": 4849.3,
"valid_targets_min": 258
},
{
"epoch": 4.641148325358852,
"grad_norm": 0.4603270505711866,
"learning_rate": 1.2327965181445593e-05,
"loss": 0.1637,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16551506519317627,
"step": 2910,
"valid_targets_mean": 5237.4,
"valid_targets_min": 2288
},
{
"epoch": 4.649122807017544,
"grad_norm": 0.4366408749058765,
"learning_rate": 1.2254576506987182e-05,
"loss": 0.1649,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1736927628517151,
"step": 2915,
"valid_targets_mean": 5546.3,
"valid_targets_min": 350
},
{
"epoch": 4.657097288676236,
"grad_norm": 0.43355175444421734,
"learning_rate": 1.21813103195742e-05,
"loss": 0.1643,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15354032814502716,
"step": 2920,
"valid_targets_mean": 5324.1,
"valid_targets_min": 218
},
{
"epoch": 4.6650717703349285,
"grad_norm": 0.5608093339511655,
"learning_rate": 1.2108167777846815e-05,
"loss": 0.1684,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16178153455257416,
"step": 2925,
"valid_targets_mean": 5233.4,
"valid_targets_min": 242
},
{
"epoch": 4.67304625199362,
"grad_norm": 0.5169396036803482,
"learning_rate": 1.203515003848987e-05,
"loss": 0.1746,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18358519673347473,
"step": 2930,
"valid_targets_mean": 4139.6,
"valid_targets_min": 333
},
{
"epoch": 4.681020733652312,
"grad_norm": 0.5322766631274986,
"learning_rate": 1.1962258256214545e-05,
"loss": 0.1664,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16810274124145508,
"step": 2935,
"valid_targets_mean": 3680.1,
"valid_targets_min": 235
},
{
"epoch": 4.688995215311005,
"grad_norm": 0.4507589408310588,
"learning_rate": 1.1889493583740124e-05,
"loss": 0.1639,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14625227451324463,
"step": 2940,
"valid_targets_mean": 5085.9,
"valid_targets_min": 234
},
{
"epoch": 4.696969696969697,
"grad_norm": 0.5558750405081903,
"learning_rate": 1.1816857171775767e-05,
"loss": 0.1615,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1795760989189148,
"step": 2945,
"valid_targets_mean": 5080.6,
"valid_targets_min": 226
},
{
"epoch": 4.70494417862839,
"grad_norm": 0.481514040881239,
"learning_rate": 1.1744350169002308e-05,
"loss": 0.172,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16550910472869873,
"step": 2950,
"valid_targets_mean": 4276.0,
"valid_targets_min": 220
},
{
"epoch": 4.712918660287081,
"grad_norm": 0.46285391513788915,
"learning_rate": 1.1671973722054077e-05,
"loss": 0.1631,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15627330541610718,
"step": 2955,
"valid_targets_mean": 5210.4,
"valid_targets_min": 325
},
{
"epoch": 4.720893141945774,
"grad_norm": 0.4381563224190673,
"learning_rate": 1.159972897550079e-05,
"loss": 0.1648,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16192206740379333,
"step": 2960,
"valid_targets_mean": 5571.1,
"valid_targets_min": 1626
},
{
"epoch": 4.728867623604466,
"grad_norm": 0.5236440592598125,
"learning_rate": 1.1527617071829447e-05,
"loss": 0.1532,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1626909375190735,
"step": 2965,
"valid_targets_mean": 5419.7,
"valid_targets_min": 732
},
{
"epoch": 4.7368421052631575,
"grad_norm": 0.6260805242947385,
"learning_rate": 1.145563915142622e-05,
"loss": 0.1634,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17754967510700226,
"step": 2970,
"valid_targets_mean": 4668.6,
"valid_targets_min": 214
},
{
"epoch": 4.74481658692185,
"grad_norm": 0.43717068230202355,
"learning_rate": 1.1383796352558489e-05,
"loss": 0.1621,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1576494425535202,
"step": 2975,
"valid_targets_mean": 5962.7,
"valid_targets_min": 235
},
{
"epoch": 4.752791068580542,
"grad_norm": 0.5329045016777196,
"learning_rate": 1.1312089811356803e-05,
"loss": 0.1748,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1734808087348938,
"step": 2980,
"valid_targets_mean": 4494.7,
"valid_targets_min": 327
},
{
"epoch": 4.760765550239235,
"grad_norm": 0.46495559769894873,
"learning_rate": 1.1240520661796882e-05,
"loss": 0.162,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16236670315265656,
"step": 2985,
"valid_targets_mean": 4686.7,
"valid_targets_min": 200
},
{
"epoch": 4.768740031897926,
"grad_norm": 0.43626568077375366,
"learning_rate": 1.1169090035681772e-05,
"loss": 0.1652,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1571044623851776,
"step": 2990,
"valid_targets_mean": 5496.3,
"valid_targets_min": 190
},
{
"epoch": 4.776714513556619,
"grad_norm": 0.45169170298100625,
"learning_rate": 1.109779906262383e-05,
"loss": 0.1649,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15914367139339447,
"step": 2995,
"valid_targets_mean": 5026.9,
"valid_targets_min": 238
},
{
"epoch": 4.784688995215311,
"grad_norm": 0.4655091549732474,
"learning_rate": 1.102664887002698e-05,
"loss": 0.1681,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16559766232967377,
"step": 3000,
"valid_targets_mean": 4727.7,
"valid_targets_min": 817
},
{
"epoch": 4.7926634768740035,
"grad_norm": 0.5136371479792501,
"learning_rate": 1.0955640583068802e-05,
"loss": 0.1693,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1526031494140625,
"step": 3005,
"valid_targets_mean": 4957.2,
"valid_targets_min": 224
},
{
"epoch": 4.800637958532695,
"grad_norm": 0.5016448829784496,
"learning_rate": 1.0884775324682755e-05,
"loss": 0.1664,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17114630341529846,
"step": 3010,
"valid_targets_mean": 4075.6,
"valid_targets_min": 191
},
{
"epoch": 4.8086124401913874,
"grad_norm": 0.444367284493778,
"learning_rate": 1.081405421554044e-05,
"loss": 0.1647,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16200141608715057,
"step": 3015,
"valid_targets_mean": 6258.1,
"valid_targets_min": 388
},
{
"epoch": 4.81658692185008,
"grad_norm": 0.4237329819210327,
"learning_rate": 1.074347837403387e-05,
"loss": 0.1667,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15558627247810364,
"step": 3020,
"valid_targets_mean": 5657.1,
"valid_targets_min": 349
},
{
"epoch": 4.824561403508772,
"grad_norm": 0.5176039560323095,
"learning_rate": 1.067304891625776e-05,
"loss": 0.1724,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16431066393852234,
"step": 3025,
"valid_targets_mean": 4240.2,
"valid_targets_min": 296
},
{
"epoch": 4.832535885167464,
"grad_norm": 0.528814370807462,
"learning_rate": 1.0602766955991913e-05,
"loss": 0.1607,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1717158555984497,
"step": 3030,
"valid_targets_mean": 4902.6,
"valid_targets_min": 492
},
{
"epoch": 4.840510366826156,
"grad_norm": 0.44331350492759686,
"learning_rate": 1.053263360468358e-05,
"loss": 0.1623,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16708722710609436,
"step": 3035,
"valid_targets_mean": 5435.2,
"valid_targets_min": 246
},
{
"epoch": 4.848484848484849,
"grad_norm": 0.44468265380219274,
"learning_rate": 1.0462649971429884e-05,
"loss": 0.1595,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16008290648460388,
"step": 3040,
"valid_targets_mean": 5562.2,
"valid_targets_min": 237
},
{
"epoch": 4.856459330143541,
"grad_norm": 0.465252421331791,
"learning_rate": 1.0392817162960304e-05,
"loss": 0.1571,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.159569650888443,
"step": 3045,
"valid_targets_mean": 4934.4,
"valid_targets_min": 779
},
{
"epoch": 4.8644338118022326,
"grad_norm": 0.5128838331578629,
"learning_rate": 1.0323136283619167e-05,
"loss": 0.1704,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1651550829410553,
"step": 3050,
"valid_targets_mean": 4564.1,
"valid_targets_min": 215
},
{
"epoch": 4.872408293460925,
"grad_norm": 0.45912144059548055,
"learning_rate": 1.0253608435348136e-05,
"loss": 0.1668,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16643419861793518,
"step": 3055,
"valid_targets_mean": 5427.7,
"valid_targets_min": 229
},
{
"epoch": 4.880382775119617,
"grad_norm": 0.4460208854541763,
"learning_rate": 1.0184234717668867e-05,
"loss": 0.1644,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16689209640026093,
"step": 3060,
"valid_targets_mean": 4700.7,
"valid_targets_min": 230
},
{
"epoch": 4.88835725677831,
"grad_norm": 0.4135934097283204,
"learning_rate": 1.0115016227665544e-05,
"loss": 0.1609,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13867491483688354,
"step": 3065,
"valid_targets_mean": 5309.3,
"valid_targets_min": 577
},
{
"epoch": 4.896331738437001,
"grad_norm": 0.47533139658434936,
"learning_rate": 1.0045954059967577e-05,
"loss": 0.158,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15308788418769836,
"step": 3070,
"valid_targets_mean": 4834.2,
"valid_targets_min": 390
},
{
"epoch": 4.904306220095694,
"grad_norm": 0.5327287831119275,
"learning_rate": 9.977049306732287e-06,
"loss": 0.1649,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17162764072418213,
"step": 3075,
"valid_targets_mean": 4897.1,
"valid_targets_min": 238
},
{
"epoch": 4.912280701754386,
"grad_norm": 0.4904017524563081,
"learning_rate": 9.908303057627591e-06,
"loss": 0.1534,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14119388163089752,
"step": 3080,
"valid_targets_mean": 4725.4,
"valid_targets_min": 228
},
{
"epoch": 4.920255183413078,
"grad_norm": 0.4970617612422358,
"learning_rate": 9.83971639981484e-06,
"loss": 0.1605,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15496879816055298,
"step": 3085,
"valid_targets_mean": 4607.4,
"valid_targets_min": 408
},
{
"epoch": 4.92822966507177,
"grad_norm": 0.45864620988450583,
"learning_rate": 9.771290417931559e-06,
"loss": 0.1724,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17323030531406403,
"step": 3090,
"valid_targets_mean": 5090.6,
"valid_targets_min": 293
},
{
"epoch": 4.9362041467304625,
"grad_norm": 0.42808519157930736,
"learning_rate": 9.703026194074342e-06,
"loss": 0.1612,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1540815681219101,
"step": 3095,
"valid_targets_mean": 5067.4,
"valid_targets_min": 327
},
{
"epoch": 4.944178628389155,
"grad_norm": 0.5865902968093246,
"learning_rate": 9.634924807781729e-06,
"loss": 0.168,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1912127435207367,
"step": 3100,
"valid_targets_mean": 5640.5,
"valid_targets_min": 246
},
{
"epoch": 4.952153110047847,
"grad_norm": 0.4717173764137801,
"learning_rate": 9.566987336017102e-06,
"loss": 0.1613,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16661816835403442,
"step": 3105,
"valid_targets_mean": 4765.6,
"valid_targets_min": 311
},
{
"epoch": 4.960127591706539,
"grad_norm": 0.40260436168463637,
"learning_rate": 9.499214853151699e-06,
"loss": 0.1621,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1473720371723175,
"step": 3110,
"valid_targets_mean": 5560.6,
"valid_targets_min": 229
},
{
"epoch": 4.968102073365231,
"grad_norm": 0.6016222748580632,
"learning_rate": 9.431608430947619e-06,
"loss": 0.1639,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16205176711082458,
"step": 3115,
"valid_targets_mean": 4679.3,
"valid_targets_min": 252
},
{
"epoch": 4.976076555023924,
"grad_norm": 0.5889165021406836,
"learning_rate": 9.364169138540805e-06,
"loss": 0.1639,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17166294157505035,
"step": 3120,
"valid_targets_mean": 5065.7,
"valid_targets_min": 407
},
{
"epoch": 4.984051036682615,
"grad_norm": 0.4790845449767566,
"learning_rate": 9.296898042424237e-06,
"loss": 0.1676,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18419404327869415,
"step": 3125,
"valid_targets_mean": 4631.6,
"valid_targets_min": 286
},
{
"epoch": 4.992025518341308,
"grad_norm": 0.598447892968231,
"learning_rate": 9.229796206431015e-06,
"loss": 0.1657,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18810789287090302,
"step": 3130,
"valid_targets_mean": 5094.1,
"valid_targets_min": 294
},
{
"epoch": 5.0,
"grad_norm": 0.4721586914499431,
"learning_rate": 9.162864691717513e-06,
"loss": 0.1626,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15202680230140686,
"step": 3135,
"valid_targets_mean": 4077.1,
"valid_targets_min": 246
},
{
"epoch": 5.007974481658692,
"grad_norm": 0.45686843030415786,
"learning_rate": 9.096104556746654e-06,
"loss": 0.1565,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14485131204128265,
"step": 3140,
"valid_targets_mean": 4520.2,
"valid_targets_min": 212
},
{
"epoch": 5.015948963317384,
"grad_norm": 0.4413073850480446,
"learning_rate": 9.029516857271115e-06,
"loss": 0.1667,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16614249348640442,
"step": 3145,
"valid_targets_mean": 5247.7,
"valid_targets_min": 407
},
{
"epoch": 5.023923444976076,
"grad_norm": 0.45791139693185595,
"learning_rate": 8.963102646316677e-06,
"loss": 0.1553,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14995019137859344,
"step": 3150,
"valid_targets_mean": 5282.4,
"valid_targets_min": 241
},
{
"epoch": 5.031897926634769,
"grad_norm": 0.5267991798971836,
"learning_rate": 8.896862974165553e-06,
"loss": 0.1506,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15393409132957458,
"step": 3155,
"valid_targets_mean": 3715.2,
"valid_targets_min": 223
},
{
"epoch": 5.039872408293461,
"grad_norm": 0.4667594466034452,
"learning_rate": 8.830798888339756e-06,
"loss": 0.1537,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14532789587974548,
"step": 3160,
"valid_targets_mean": 4772.7,
"valid_targets_min": 203
},
{
"epoch": 5.047846889952153,
"grad_norm": 0.443279890846053,
"learning_rate": 8.764911433584581e-06,
"loss": 0.1437,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14291726052761078,
"step": 3165,
"valid_targets_mean": 5765.4,
"valid_targets_min": 538
},
{
"epoch": 5.055821371610845,
"grad_norm": 0.5471455934145786,
"learning_rate": 8.699201651852056e-06,
"loss": 0.1605,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1686840057373047,
"step": 3170,
"valid_targets_mean": 4019.4,
"valid_targets_min": 373
},
{
"epoch": 5.0637958532695375,
"grad_norm": 0.49683984011851123,
"learning_rate": 8.633670582284446e-06,
"loss": 0.1501,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15907122194766998,
"step": 3175,
"valid_targets_mean": 5820.6,
"valid_targets_min": 540
},
{
"epoch": 5.07177033492823,
"grad_norm": 0.5606716282540908,
"learning_rate": 8.56831926119787e-06,
"loss": 0.1582,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14971384406089783,
"step": 3180,
"valid_targets_mean": 3764.8,
"valid_targets_min": 225
},
{
"epoch": 5.0797448165869215,
"grad_norm": 0.43047185858023407,
"learning_rate": 8.503148722065851e-06,
"loss": 0.1504,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13558684289455414,
"step": 3185,
"valid_targets_mean": 5010.2,
"valid_targets_min": 243
},
{
"epoch": 5.087719298245614,
"grad_norm": 0.46301730293349586,
"learning_rate": 8.43815999550303e-06,
"loss": 0.1468,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14114761352539062,
"step": 3190,
"valid_targets_mean": 4802.3,
"valid_targets_min": 650
},
{
"epoch": 5.095693779904306,
"grad_norm": 0.46169394066738256,
"learning_rate": 8.373354109248842e-06,
"loss": 0.1588,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17059487104415894,
"step": 3195,
"valid_targets_mean": 5362.9,
"valid_targets_min": 477
},
{
"epoch": 5.103668261562999,
"grad_norm": 0.4737706843985567,
"learning_rate": 8.308732088151245e-06,
"loss": 0.1471,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14929816126823425,
"step": 3200,
"valid_targets_mean": 5279.0,
"valid_targets_min": 1123
},
{
"epoch": 5.11164274322169,
"grad_norm": 0.558320078734975,
"learning_rate": 8.24429495415054e-06,
"loss": 0.1611,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14897915720939636,
"step": 3205,
"valid_targets_mean": 3327.8,
"valid_targets_min": 198
},
{
"epoch": 5.119617224880383,
"grad_norm": 0.4969563956951489,
"learning_rate": 8.180043726263216e-06,
"loss": 0.1538,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1674622893333435,
"step": 3210,
"valid_targets_mean": 4794.8,
"valid_targets_min": 234
},
{
"epoch": 5.127591706539075,
"grad_norm": 0.4433365316202014,
"learning_rate": 8.115979420565794e-06,
"loss": 0.1548,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14808738231658936,
"step": 3215,
"valid_targets_mean": 5291.6,
"valid_targets_min": 448
},
{
"epoch": 5.1355661881977674,
"grad_norm": 0.4863373730285094,
"learning_rate": 8.052103050178806e-06,
"loss": 0.1667,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1640024185180664,
"step": 3220,
"valid_targets_mean": 5062.5,
"valid_targets_min": 760
},
{
"epoch": 5.143540669856459,
"grad_norm": 0.4930454760697995,
"learning_rate": 7.988415625250755e-06,
"loss": 0.1458,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14119328558444977,
"step": 3225,
"valid_targets_mean": 4849.4,
"valid_targets_min": 258
},
{
"epoch": 5.151515151515151,
"grad_norm": 0.4113425375075243,
"learning_rate": 7.924918152942117e-06,
"loss": 0.1469,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13915401697158813,
"step": 3230,
"valid_targets_mean": 5780.1,
"valid_targets_min": 1144
},
{
"epoch": 5.159489633173844,
"grad_norm": 0.4727008507251189,
"learning_rate": 7.861611637409462e-06,
"loss": 0.157,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16318866610527039,
"step": 3235,
"valid_targets_mean": 4842.1,
"valid_targets_min": 586
},
{
"epoch": 5.167464114832536,
"grad_norm": 0.4828095943833063,
"learning_rate": 7.798497079789513e-06,
"loss": 0.1554,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16433711349964142,
"step": 3240,
"valid_targets_mean": 4624.4,
"valid_targets_min": 274
},
{
"epoch": 5.175438596491228,
"grad_norm": 0.4744135193352567,
"learning_rate": 7.735575478183381e-06,
"loss": 0.1473,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1755599081516266,
"step": 3245,
"valid_targets_mean": 5212.1,
"valid_targets_min": 333
},
{
"epoch": 5.18341307814992,
"grad_norm": 0.4581602183709319,
"learning_rate": 7.672847827640735e-06,
"loss": 0.1507,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14598888158798218,
"step": 3250,
"valid_targets_mean": 4947.1,
"valid_targets_min": 367
},
{
"epoch": 5.1913875598086126,
"grad_norm": 0.44432426152642096,
"learning_rate": 7.610315120144067e-06,
"loss": 0.1494,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15802133083343506,
"step": 3255,
"valid_targets_mean": 5613.7,
"valid_targets_min": 230
},
{
"epoch": 5.199362041467305,
"grad_norm": 0.45090931602424295,
"learning_rate": 7.5479783445930414e-06,
"loss": 0.1508,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14497801661491394,
"step": 3260,
"valid_targets_mean": 5019.5,
"valid_targets_min": 241
},
{
"epoch": 5.2073365231259965,
"grad_norm": 0.48834864182029514,
"learning_rate": 7.485838486788803e-06,
"loss": 0.1606,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15974393486976624,
"step": 3265,
"valid_targets_mean": 6540.7,
"valid_targets_min": 4632
},
{
"epoch": 5.215311004784689,
"grad_norm": 0.4491148244141114,
"learning_rate": 7.4238965294184374e-06,
"loss": 0.1452,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14351961016654968,
"step": 3270,
"valid_targets_mean": 5034.4,
"valid_targets_min": 207
},
{
"epoch": 5.223285486443381,
"grad_norm": 0.4459921331500691,
"learning_rate": 7.362153452039409e-06,
"loss": 0.1579,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1467072069644928,
"step": 3275,
"valid_targets_mean": 5784.2,
"valid_targets_min": 993
},
{
"epoch": 5.231259968102074,
"grad_norm": 0.48106320041218886,
"learning_rate": 7.300610231064056e-06,
"loss": 0.1491,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14502954483032227,
"step": 3280,
"valid_targets_mean": 4507.9,
"valid_targets_min": 236
},
{
"epoch": 5.239234449760765,
"grad_norm": 0.4864889224714647,
"learning_rate": 7.239267839744166e-06,
"loss": 0.1576,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16197340190410614,
"step": 3285,
"valid_targets_mean": 4953.2,
"valid_targets_min": 255
},
{
"epoch": 5.247208931419458,
"grad_norm": 0.4604998630393094,
"learning_rate": 7.178127248155604e-06,
"loss": 0.1547,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14153867959976196,
"step": 3290,
"valid_targets_mean": 4488.4,
"valid_targets_min": 272
},
{
"epoch": 5.25518341307815,
"grad_norm": 0.49236439922059083,
"learning_rate": 7.117189423182917e-06,
"loss": 0.1592,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15775446593761444,
"step": 3295,
"valid_targets_mean": 5084.4,
"valid_targets_min": 210
},
{
"epoch": 5.2631578947368425,
"grad_norm": 0.47838707598832375,
"learning_rate": 7.056455328504104e-06,
"loss": 0.164,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15875396132469177,
"step": 3300,
"valid_targets_mean": 4948.1,
"valid_targets_min": 215
},
{
"epoch": 5.271132376395534,
"grad_norm": 0.5433755427176816,
"learning_rate": 6.995925924575342e-06,
"loss": 0.15,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13437744975090027,
"step": 3305,
"valid_targets_mean": 4722.6,
"valid_targets_min": 222
},
{
"epoch": 5.279106858054226,
"grad_norm": 0.4815763895098848,
"learning_rate": 6.935602168615792e-06,
"loss": 0.1527,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14211152493953705,
"step": 3310,
"valid_targets_mean": 4732.8,
"valid_targets_min": 221
},
{
"epoch": 5.287081339712919,
"grad_norm": 0.4447410196842261,
"learning_rate": 6.875485014592493e-06,
"loss": 0.1503,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14757999777793884,
"step": 3315,
"valid_targets_mean": 5167.4,
"valid_targets_min": 363
},
{
"epoch": 5.295055821371611,
"grad_norm": 0.4251332258800115,
"learning_rate": 6.815575413205235e-06,
"loss": 0.1469,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13727967441082,
"step": 3320,
"valid_targets_mean": 5821.2,
"valid_targets_min": 240
},
{
"epoch": 5.303030303030303,
"grad_norm": 0.49143529385732765,
"learning_rate": 6.755874311871562e-06,
"loss": 0.1582,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14603282511234283,
"step": 3325,
"valid_targets_mean": 5343.0,
"valid_targets_min": 235
},
{
"epoch": 5.311004784688995,
"grad_norm": 0.4426387776988706,
"learning_rate": 6.696382654711777e-06,
"loss": 0.1596,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15520070493221283,
"step": 3330,
"valid_targets_mean": 5272.8,
"valid_targets_min": 235
},
{
"epoch": 5.318979266347688,
"grad_norm": 0.4049094841075801,
"learning_rate": 6.637101382533986e-06,
"loss": 0.1498,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14739316701889038,
"step": 3335,
"valid_targets_mean": 6374.6,
"valid_targets_min": 402
},
{
"epoch": 5.32695374800638,
"grad_norm": 0.4913045824856341,
"learning_rate": 6.578031432819263e-06,
"loss": 0.1597,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1726195514202118,
"step": 3340,
"valid_targets_mean": 5006.8,
"valid_targets_min": 314
},
{
"epoch": 5.3349282296650715,
"grad_norm": 0.4627985926205782,
"learning_rate": 6.5191737397068015e-06,
"loss": 0.1514,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1454908698797226,
"step": 3345,
"valid_targets_mean": 5310.7,
"valid_targets_min": 589
},
{
"epoch": 5.342902711323764,
"grad_norm": 0.5210475663646326,
"learning_rate": 6.460529233979127e-06,
"loss": 0.1496,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15867014229297638,
"step": 3350,
"valid_targets_mean": 4499.4,
"valid_targets_min": 248
},
{
"epoch": 5.350877192982456,
"grad_norm": 0.49981873498821056,
"learning_rate": 6.402098843047417e-06,
"loss": 0.1511,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1456516683101654,
"step": 3355,
"valid_targets_mean": 5316.4,
"valid_targets_min": 598
},
{
"epoch": 5.358851674641148,
"grad_norm": 0.5064676891648265,
"learning_rate": 6.343883490936791e-06,
"loss": 0.1562,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1448066532611847,
"step": 3360,
"valid_targets_mean": 4308.1,
"valid_targets_min": 233
},
{
"epoch": 5.36682615629984,
"grad_norm": 0.47905838596998346,
"learning_rate": 6.285884098271739e-06,
"loss": 0.1645,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15558141469955444,
"step": 3365,
"valid_targets_mean": 5043.6,
"valid_targets_min": 243
},
{
"epoch": 5.374800637958533,
"grad_norm": 0.48629149557224766,
"learning_rate": 6.228101582261532e-06,
"loss": 0.154,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16721400618553162,
"step": 3370,
"valid_targets_mean": 4973.9,
"valid_targets_min": 497
},
{
"epoch": 5.382775119617225,
"grad_norm": 0.4850858183720529,
"learning_rate": 6.170536856685716e-06,
"loss": 0.1535,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15335974097251892,
"step": 3375,
"valid_targets_mean": 4478.9,
"valid_targets_min": 223
},
{
"epoch": 5.3907496012759175,
"grad_norm": 0.4833072145728141,
"learning_rate": 6.113190831879698e-06,
"loss": 0.1616,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16516146063804626,
"step": 3380,
"valid_targets_mean": 5205.5,
"valid_targets_min": 235
},
{
"epoch": 5.398724082934609,
"grad_norm": 0.4835288113090004,
"learning_rate": 6.056064414720317e-06,
"loss": 0.1565,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16842329502105713,
"step": 3385,
"valid_targets_mean": 5243.1,
"valid_targets_min": 411
},
{
"epoch": 5.4066985645933014,
"grad_norm": 0.43313320847470577,
"learning_rate": 5.999158508611496e-06,
"loss": 0.1511,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1504177451133728,
"step": 3390,
"valid_targets_mean": 5215.4,
"valid_targets_min": 465
},
{
"epoch": 5.414673046251994,
"grad_norm": 0.49036685155823234,
"learning_rate": 5.942474013469983e-06,
"loss": 0.1526,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1608334183692932,
"step": 3395,
"valid_targets_mean": 4751.9,
"valid_targets_min": 285
},
{
"epoch": 5.422647527910685,
"grad_norm": 0.574663879399246,
"learning_rate": 5.886011825711117e-06,
"loss": 0.1466,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15289413928985596,
"step": 3400,
"valid_targets_mean": 5535.6,
"valid_targets_min": 242
},
{
"epoch": 5.430622009569378,
"grad_norm": 0.5322494164948655,
"learning_rate": 5.829772838234615e-06,
"loss": 0.1546,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15102876722812653,
"step": 3405,
"valid_targets_mean": 3683.2,
"valid_targets_min": 240
},
{
"epoch": 5.43859649122807,
"grad_norm": 0.5187498623215531,
"learning_rate": 5.773757940410503e-06,
"loss": 0.153,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14615221321582794,
"step": 3410,
"valid_targets_mean": 4623.8,
"valid_targets_min": 346
},
{
"epoch": 5.446570972886763,
"grad_norm": 0.4685828114508998,
"learning_rate": 5.7179680180650055e-06,
"loss": 0.1611,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15752843022346497,
"step": 3415,
"valid_targets_mean": 5684.5,
"valid_targets_min": 300
},
{
"epoch": 5.454545454545454,
"grad_norm": 0.522889077511281,
"learning_rate": 5.6624039534665775e-06,
"loss": 0.162,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1590261310338974,
"step": 3420,
"valid_targets_mean": 4173.8,
"valid_targets_min": 233
},
{
"epoch": 5.4625199362041466,
"grad_norm": 0.4756762932324726,
"learning_rate": 5.607066625311925e-06,
"loss": 0.1549,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19886696338653564,
"step": 3425,
"valid_targets_mean": 5566.5,
"valid_targets_min": 164
},
{
"epoch": 5.470494417862839,
"grad_norm": 0.47917438890986686,
"learning_rate": 5.55195690871211e-06,
"loss": 0.1565,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.160795658826828,
"step": 3430,
"valid_targets_mean": 4546.6,
"valid_targets_min": 446
},
{
"epoch": 5.478468899521531,
"grad_norm": 0.7787098363738806,
"learning_rate": 5.497075675178727e-06,
"loss": 0.157,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1853606253862381,
"step": 3435,
"valid_targets_mean": 4119.0,
"valid_targets_min": 224
},
{
"epoch": 5.486443381180223,
"grad_norm": 0.5471104540057793,
"learning_rate": 5.442423792610118e-06,
"loss": 0.1521,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13731586933135986,
"step": 3440,
"valid_targets_mean": 4580.0,
"valid_targets_min": 238
},
{
"epoch": 5.494417862838915,
"grad_norm": 0.43633058177704404,
"learning_rate": 5.388002125277627e-06,
"loss": 0.1529,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1393011510372162,
"step": 3445,
"valid_targets_mean": 5709.1,
"valid_targets_min": 2356
},
{
"epoch": 5.502392344497608,
"grad_norm": 0.500544121947255,
"learning_rate": 5.333811533811945e-06,
"loss": 0.1525,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16812501847743988,
"step": 3450,
"valid_targets_mean": 4662.3,
"valid_targets_min": 404
},
{
"epoch": 5.5103668261563,
"grad_norm": 0.4321968671668473,
"learning_rate": 5.2798528751895265e-06,
"loss": 0.1565,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1472059190273285,
"step": 3455,
"valid_targets_mean": 5412.5,
"valid_targets_min": 260
},
{
"epoch": 5.518341307814992,
"grad_norm": 0.516188282731035,
"learning_rate": 5.226127002718984e-06,
"loss": 0.1507,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1455184817314148,
"step": 3460,
"valid_targets_mean": 4234.6,
"valid_targets_min": 243
},
{
"epoch": 5.526315789473684,
"grad_norm": 0.4966018837171216,
"learning_rate": 5.1726347660276424e-06,
"loss": 0.1562,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1486985981464386,
"step": 3465,
"valid_targets_mean": 5566.6,
"valid_targets_min": 226
},
{
"epoch": 5.5342902711323765,
"grad_norm": 0.4791331897643804,
"learning_rate": 5.119377011048066e-06,
"loss": 0.1548,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13465863466262817,
"step": 3470,
"valid_targets_mean": 3971.8,
"valid_targets_min": 239
},
{
"epoch": 5.542264752791069,
"grad_norm": 0.6285282708036979,
"learning_rate": 5.066354580004713e-06,
"loss": 0.1599,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15100893378257751,
"step": 3475,
"valid_targets_mean": 3005.4,
"valid_targets_min": 269
},
{
"epoch": 5.55023923444976,
"grad_norm": 0.4915313605987961,
"learning_rate": 5.013568311400599e-06,
"loss": 0.1529,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14344826340675354,
"step": 3480,
"valid_targets_mean": 6651.2,
"valid_targets_min": 236
},
{
"epoch": 5.558213716108453,
"grad_norm": 0.5181311764118561,
"learning_rate": 4.96101904000402e-06,
"loss": 0.1522,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16833406686782837,
"step": 3485,
"valid_targets_mean": 4451.7,
"valid_targets_min": 298
},
{
"epoch": 5.566188197767145,
"grad_norm": 0.44911434199256317,
"learning_rate": 4.908707596835396e-06,
"loss": 0.1565,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16398075222969055,
"step": 3490,
"valid_targets_mean": 5795.6,
"valid_targets_min": 243
},
{
"epoch": 5.574162679425838,
"grad_norm": 0.48887673542216,
"learning_rate": 4.856634809154093e-06,
"loss": 0.1555,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14630258083343506,
"step": 3495,
"valid_targets_mean": 4798.6,
"valid_targets_min": 395
},
{
"epoch": 5.582137161084529,
"grad_norm": 0.4795845324226209,
"learning_rate": 4.804801500445338e-06,
"loss": 0.1548,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16289225220680237,
"step": 3500,
"valid_targets_mean": 4453.1,
"valid_targets_min": 245
},
{
"epoch": 5.590111642743222,
"grad_norm": 0.49292253026437766,
"learning_rate": 4.753208490407233e-06,
"loss": 0.1631,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18191534280776978,
"step": 3505,
"valid_targets_mean": 4498.8,
"valid_targets_min": 489
},
{
"epoch": 5.598086124401914,
"grad_norm": 0.5089760135607062,
"learning_rate": 4.701856594937744e-06,
"loss": 0.1556,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13293233513832092,
"step": 3510,
"valid_targets_mean": 3764.9,
"valid_targets_min": 215
},
{
"epoch": 5.606060606060606,
"grad_norm": 0.4746190959310646,
"learning_rate": 4.650746626121838e-06,
"loss": 0.1544,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13995599746704102,
"step": 3515,
"valid_targets_mean": 4787.4,
"valid_targets_min": 199
},
{
"epoch": 5.614035087719298,
"grad_norm": 0.5034639146801175,
"learning_rate": 4.5998793922186315e-06,
"loss": 0.1543,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15416234731674194,
"step": 3520,
"valid_targets_mean": 4616.1,
"valid_targets_min": 246
},
{
"epoch": 5.62200956937799,
"grad_norm": 0.46111743578791226,
"learning_rate": 4.549255697648576e-06,
"loss": 0.1604,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.152305006980896,
"step": 3525,
"valid_targets_mean": 4995.6,
"valid_targets_min": 227
},
{
"epoch": 5.629984051036683,
"grad_norm": 0.4608602450555988,
"learning_rate": 4.498876342980796e-06,
"loss": 0.1472,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1579793095588684,
"step": 3530,
"valid_targets_mean": 5248.8,
"valid_targets_min": 255
},
{
"epoch": 5.637958532695375,
"grad_norm": 0.4733308675485752,
"learning_rate": 4.448742124920368e-06,
"loss": 0.1536,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14798873662948608,
"step": 3535,
"valid_targets_mean": 5376.5,
"valid_targets_min": 221
},
{
"epoch": 5.645933014354067,
"grad_norm": 0.6093609437426408,
"learning_rate": 4.39885383629576e-06,
"loss": 0.1576,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16494160890579224,
"step": 3540,
"valid_targets_mean": 5107.6,
"valid_targets_min": 242
},
{
"epoch": 5.653907496012759,
"grad_norm": 0.4704193599073439,
"learning_rate": 4.349212266046285e-06,
"loss": 0.1586,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16326230764389038,
"step": 3545,
"valid_targets_mean": 5324.4,
"valid_targets_min": 269
},
{
"epoch": 5.6618819776714515,
"grad_norm": 0.4657747975162824,
"learning_rate": 4.299818199209629e-06,
"loss": 0.1603,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17422260344028473,
"step": 3550,
"valid_targets_mean": 4970.7,
"valid_targets_min": 1396
},
{
"epoch": 5.669856459330144,
"grad_norm": 0.420515044849732,
"learning_rate": 4.250672416909407e-06,
"loss": 0.15,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1514442265033722,
"step": 3555,
"valid_targets_mean": 5760.6,
"valid_targets_min": 1570
},
{
"epoch": 5.6778309409888355,
"grad_norm": 0.41516338928503643,
"learning_rate": 4.201775696342862e-06,
"loss": 0.1545,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16060051321983337,
"step": 3560,
"valid_targets_mean": 6413.8,
"valid_targets_min": 3600
},
{
"epoch": 5.685805422647528,
"grad_norm": 0.46906623700170114,
"learning_rate": 4.153128810768517e-06,
"loss": 0.153,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16279572248458862,
"step": 3565,
"valid_targets_mean": 4736.4,
"valid_targets_min": 208
},
{
"epoch": 5.69377990430622,
"grad_norm": 0.5015754356988779,
"learning_rate": 4.104732529493991e-06,
"loss": 0.1576,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18926894664764404,
"step": 3570,
"valid_targets_mean": 4425.1,
"valid_targets_min": 227
},
{
"epoch": 5.701754385964913,
"grad_norm": 0.45105806384824143,
"learning_rate": 4.056587617863825e-06,
"loss": 0.1578,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17029494047164917,
"step": 3575,
"valid_targets_mean": 5617.8,
"valid_targets_min": 460
},
{
"epoch": 5.709728867623604,
"grad_norm": 0.49175639523779135,
"learning_rate": 4.008694837247345e-06,
"loss": 0.1582,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18568654358386993,
"step": 3580,
"valid_targets_mean": 6270.6,
"valid_targets_min": 244
},
{
"epoch": 5.717703349282297,
"grad_norm": 0.6769881677170507,
"learning_rate": 3.961054945026674e-06,
"loss": 0.1507,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1355312615633011,
"step": 3585,
"valid_targets_mean": 4165.9,
"valid_targets_min": 218
},
{
"epoch": 5.725677830940989,
"grad_norm": 0.5133023315898203,
"learning_rate": 3.913668694584705e-06,
"loss": 0.154,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15609794855117798,
"step": 3590,
"valid_targets_mean": 4151.4,
"valid_targets_min": 220
},
{
"epoch": 5.733652312599681,
"grad_norm": 0.44064504684893196,
"learning_rate": 3.866536835293227e-06,
"loss": 0.1506,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14749088883399963,
"step": 3595,
"valid_targets_mean": 5171.5,
"valid_targets_min": 281
},
{
"epoch": 5.741626794258373,
"grad_norm": 0.4520697005826577,
"learning_rate": 3.819660112501053e-06,
"loss": 0.1526,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14739054441452026,
"step": 3600,
"valid_targets_mean": 5231.6,
"valid_targets_min": 227
},
{
"epoch": 5.749601275917065,
"grad_norm": 0.4991227138203837,
"learning_rate": 3.773039267522227e-06,
"loss": 0.1542,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16402383148670197,
"step": 3605,
"valid_targets_mean": 4534.4,
"valid_targets_min": 625
},
{
"epoch": 5.757575757575758,
"grad_norm": 0.4986065297798539,
"learning_rate": 3.72667503762433e-06,
"loss": 0.153,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1630692034959793,
"step": 3610,
"valid_targets_mean": 5159.6,
"valid_targets_min": 389
},
{
"epoch": 5.76555023923445,
"grad_norm": 0.4049459898514612,
"learning_rate": 3.680568156016786e-06,
"loss": 0.1556,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1414915919303894,
"step": 3615,
"valid_targets_mean": 6273.9,
"valid_targets_min": 3956
},
{
"epoch": 5.773524720893142,
"grad_norm": 0.543662044908981,
"learning_rate": 3.6347193518392776e-06,
"loss": 0.1488,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1631641983985901,
"step": 3620,
"valid_targets_mean": 3520.4,
"valid_targets_min": 242
},
{
"epoch": 5.781499202551834,
"grad_norm": 0.5132679429264033,
"learning_rate": 3.58912935015024e-06,
"loss": 0.1588,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17440487444400787,
"step": 3625,
"valid_targets_mean": 4255.1,
"valid_targets_min": 328
},
{
"epoch": 5.7894736842105265,
"grad_norm": 0.5053310023786863,
"learning_rate": 3.543798871915367e-06,
"loss": 0.1522,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15172672271728516,
"step": 3630,
"valid_targets_mean": 4452.2,
"valid_targets_min": 227
},
{
"epoch": 5.797448165869218,
"grad_norm": 0.4684784598941,
"learning_rate": 3.498728633996209e-06,
"loss": 0.1592,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14971506595611572,
"step": 3635,
"valid_targets_mean": 5225.2,
"valid_targets_min": 230
},
{
"epoch": 5.8054226475279105,
"grad_norm": 0.46115162406236737,
"learning_rate": 3.453919349138859e-06,
"loss": 0.1486,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14659349620342255,
"step": 3640,
"valid_targets_mean": 5709.1,
"valid_targets_min": 299
},
{
"epoch": 5.813397129186603,
"grad_norm": 0.46020022381518416,
"learning_rate": 3.4093717259626514e-06,
"loss": 0.1611,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13591623306274414,
"step": 3645,
"valid_targets_mean": 4973.1,
"valid_targets_min": 765
},
{
"epoch": 5.821371610845295,
"grad_norm": 0.47367553344910285,
"learning_rate": 3.365086468948988e-06,
"loss": 0.1543,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1700918823480606,
"step": 3650,
"valid_targets_mean": 5319.5,
"valid_targets_min": 225
},
{
"epoch": 5.829346092503988,
"grad_norm": 0.6505180384813233,
"learning_rate": 3.321064278430175e-06,
"loss": 0.1543,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1515679657459259,
"step": 3655,
"valid_targets_mean": 4172.9,
"valid_targets_min": 212
},
{
"epoch": 5.837320574162679,
"grad_norm": 0.49312956238364775,
"learning_rate": 3.277305850578345e-06,
"loss": 0.1566,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14799179136753082,
"step": 3660,
"valid_targets_mean": 4885.3,
"valid_targets_min": 227
},
{
"epoch": 5.845295055821372,
"grad_norm": 0.4184102214187514,
"learning_rate": 3.2338118773944684e-06,
"loss": 0.1507,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1451129913330078,
"step": 3665,
"valid_targets_mean": 6137.9,
"valid_targets_min": 2702
},
{
"epoch": 5.853269537480064,
"grad_norm": 0.4917317516199451,
"learning_rate": 3.1905830466973975e-06,
"loss": 0.1502,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15702003240585327,
"step": 3670,
"valid_targets_mean": 5106.1,
"valid_targets_min": 264
},
{
"epoch": 5.861244019138756,
"grad_norm": 0.4628847616665014,
"learning_rate": 3.14762004211298e-06,
"loss": 0.1559,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16175755858421326,
"step": 3675,
"valid_targets_mean": 5198.9,
"valid_targets_min": 214
},
{
"epoch": 5.869218500797448,
"grad_norm": 0.47601217080416275,
"learning_rate": 3.1049235430632696e-06,
"loss": 0.1471,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15074549615383148,
"step": 3680,
"valid_targets_mean": 4520.1,
"valid_targets_min": 233
},
{
"epoch": 5.87719298245614,
"grad_norm": 0.5834218075207638,
"learning_rate": 3.062494224755759e-06,
"loss": 0.1689,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2231508493423462,
"step": 3685,
"valid_targets_mean": 4244.4,
"valid_targets_min": 232
},
{
"epoch": 5.885167464114833,
"grad_norm": 0.4766868558186829,
"learning_rate": 3.0203327581727195e-06,
"loss": 0.1539,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1613055020570755,
"step": 3690,
"valid_targets_mean": 4811.6,
"valid_targets_min": 255
},
{
"epoch": 5.893141945773524,
"grad_norm": 0.44876715014880975,
"learning_rate": 2.9784398100605937e-06,
"loss": 0.1504,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14462366700172424,
"step": 3695,
"valid_targets_mean": 5235.1,
"valid_targets_min": 278
},
{
"epoch": 5.901116427432217,
"grad_norm": 0.4510142737031215,
"learning_rate": 2.9368160429194127e-06,
"loss": 0.1481,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13386178016662598,
"step": 3700,
"valid_targets_mean": 5353.9,
"valid_targets_min": 283
},
{
"epoch": 5.909090909090909,
"grad_norm": 0.4556921018996119,
"learning_rate": 2.895462114992371e-06,
"loss": 0.1607,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17346566915512085,
"step": 3705,
"valid_targets_mean": 5930.0,
"valid_targets_min": 252
},
{
"epoch": 5.917065390749602,
"grad_norm": 0.4682379596121741,
"learning_rate": 2.8543786802553943e-06,
"loss": 0.152,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1504223793745041,
"step": 3710,
"valid_targets_mean": 4891.8,
"valid_targets_min": 244
},
{
"epoch": 5.925039872408293,
"grad_norm": 0.5028889161289527,
"learning_rate": 2.813566388406781e-06,
"loss": 0.1594,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16947460174560547,
"step": 3715,
"valid_targets_mean": 5198.4,
"valid_targets_min": 238
},
{
"epoch": 5.9330143540669855,
"grad_norm": 0.42820894853940544,
"learning_rate": 2.773025884856957e-06,
"loss": 0.1558,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14061594009399414,
"step": 3720,
"valid_targets_mean": 5816.4,
"valid_targets_min": 469
},
{
"epoch": 5.940988835725678,
"grad_norm": 0.4664774104232858,
"learning_rate": 2.7327578107182585e-06,
"loss": 0.1464,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13510872423648834,
"step": 3725,
"valid_targets_mean": 5545.6,
"valid_targets_min": 273
},
{
"epoch": 5.94896331738437,
"grad_norm": 0.5238401849218677,
"learning_rate": 2.692762802794775e-06,
"loss": 0.158,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16264596581459045,
"step": 3730,
"valid_targets_mean": 4376.4,
"valid_targets_min": 230
},
{
"epoch": 5.956937799043062,
"grad_norm": 0.45087693055845296,
"learning_rate": 2.6530414935723104e-06,
"loss": 0.156,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1532100886106491,
"step": 3735,
"valid_targets_mean": 4878.6,
"valid_targets_min": 259
},
{
"epoch": 5.964912280701754,
"grad_norm": 0.4438179509578052,
"learning_rate": 2.6135945112083506e-06,
"loss": 0.1464,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14241643249988556,
"step": 3740,
"valid_targets_mean": 4956.2,
"valid_targets_min": 379
},
{
"epoch": 5.972886762360447,
"grad_norm": 0.5549037871035863,
"learning_rate": 2.574422479522156e-06,
"loss": 0.1524,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1596030294895172,
"step": 3745,
"valid_targets_mean": 4997.6,
"valid_targets_min": 549
},
{
"epoch": 5.980861244019139,
"grad_norm": 0.5895868584381605,
"learning_rate": 2.535526017984884e-06,
"loss": 0.1604,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16880738735198975,
"step": 3750,
"valid_targets_mean": 3346.3,
"valid_targets_min": 199
},
{
"epoch": 5.988835725677831,
"grad_norm": 0.5130364660857234,
"learning_rate": 2.4969057417097807e-06,
"loss": 0.1555,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15060560405254364,
"step": 3755,
"valid_targets_mean": 3963.4,
"valid_targets_min": 314
},
{
"epoch": 5.996810207336523,
"grad_norm": 0.4976543721703397,
"learning_rate": 2.458562261442483e-06,
"loss": 0.1487,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13388743996620178,
"step": 3760,
"valid_targets_mean": 5151.2,
"valid_targets_min": 245
},
{
"epoch": 6.0047846889952154,
"grad_norm": 0.44928966826086414,
"learning_rate": 2.4204961835513263e-06,
"loss": 0.1572,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16202214360237122,
"step": 3765,
"valid_targets_mean": 5942.7,
"valid_targets_min": 388
},
{
"epoch": 6.012759170653908,
"grad_norm": 0.4062032075083199,
"learning_rate": 2.3827081100177797e-06,
"loss": 0.1532,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1397780179977417,
"step": 3770,
"valid_targets_mean": 6125.1,
"valid_targets_min": 223
},
{
"epoch": 6.020733652312599,
"grad_norm": 0.44993434313584385,
"learning_rate": 2.3451986384269266e-06,
"loss": 0.1517,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1594015508890152,
"step": 3775,
"valid_targets_mean": 5130.2,
"valid_targets_min": 269
},
{
"epoch": 6.028708133971292,
"grad_norm": 0.4875301922172514,
"learning_rate": 2.307968361957993e-06,
"loss": 0.1533,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14149093627929688,
"step": 3780,
"valid_targets_mean": 4876.2,
"valid_targets_min": 404
},
{
"epoch": 6.036682615629984,
"grad_norm": 0.4629594770445272,
"learning_rate": 2.2710178693749805e-06,
"loss": 0.15,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16642490029335022,
"step": 3785,
"valid_targets_mean": 4987.9,
"valid_targets_min": 254
},
{
"epoch": 6.044657097288677,
"grad_norm": 0.5166944673117188,
"learning_rate": 2.2343477450173665e-06,
"loss": 0.149,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17281094193458557,
"step": 3790,
"valid_targets_mean": 4621.1,
"valid_targets_min": 215
},
{
"epoch": 6.052631578947368,
"grad_norm": 0.47068452452288745,
"learning_rate": 2.197958568790839e-06,
"loss": 0.1486,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15370580554008484,
"step": 3795,
"valid_targets_mean": 4905.4,
"valid_targets_min": 912
},
{
"epoch": 6.0606060606060606,
"grad_norm": 0.4549056607289303,
"learning_rate": 2.161850916158148e-06,
"loss": 0.1492,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16554537415504456,
"step": 3800,
"valid_targets_mean": 5324.4,
"valid_targets_min": 240
},
{
"epoch": 6.068580542264753,
"grad_norm": 0.4845167729156862,
"learning_rate": 2.1260253581299996e-06,
"loss": 0.1534,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14590927958488464,
"step": 3805,
"valid_targets_mean": 4456.4,
"valid_targets_min": 545
},
{
"epoch": 6.076555023923445,
"grad_norm": 0.4653335767771134,
"learning_rate": 2.0904824612560046e-06,
"loss": 0.1508,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1586759090423584,
"step": 3810,
"valid_targets_mean": 4953.6,
"valid_targets_min": 407
},
{
"epoch": 6.084529505582137,
"grad_norm": 0.48055135656708736,
"learning_rate": 2.0552227876157536e-06,
"loss": 0.1545,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13218027353286743,
"step": 3815,
"valid_targets_mean": 5003.9,
"valid_targets_min": 205
},
{
"epoch": 6.092503987240829,
"grad_norm": 0.4867289410365764,
"learning_rate": 2.020246894809912e-06,
"loss": 0.1431,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14842218160629272,
"step": 3820,
"valid_targets_mean": 4870.1,
"valid_targets_min": 223
},
{
"epoch": 6.100478468899522,
"grad_norm": 0.4788267536406092,
"learning_rate": 1.9855553359513836e-06,
"loss": 0.1476,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16526566445827484,
"step": 3825,
"valid_targets_mean": 4967.4,
"valid_targets_min": 347
},
{
"epoch": 6.108452950558214,
"grad_norm": 0.44362145470110076,
"learning_rate": 1.9511486596566054e-06,
"loss": 0.1456,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13952435553073883,
"step": 3830,
"valid_targets_mean": 5323.2,
"valid_targets_min": 732
},
{
"epoch": 6.116427432216906,
"grad_norm": 0.44421535025224507,
"learning_rate": 1.917027410036825e-06,
"loss": 0.1534,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15196619927883148,
"step": 3835,
"valid_targets_mean": 5453.3,
"valid_targets_min": 680
},
{
"epoch": 6.124401913875598,
"grad_norm": 0.48619880208308525,
"learning_rate": 1.8831921266895348e-06,
"loss": 0.1531,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1549423336982727,
"step": 3840,
"valid_targets_mean": 4936.4,
"valid_targets_min": 292
},
{
"epoch": 6.1323763955342905,
"grad_norm": 0.4933266469826171,
"learning_rate": 1.8496433446899197e-06,
"loss": 0.146,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14725814759731293,
"step": 3845,
"valid_targets_mean": 4630.4,
"valid_targets_min": 371
},
{
"epoch": 6.140350877192983,
"grad_norm": 0.4355406021657482,
"learning_rate": 1.8163815945823881e-06,
"loss": 0.1407,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13551683723926544,
"step": 3850,
"valid_targets_mean": 6277.8,
"valid_targets_min": 369
},
{
"epoch": 6.148325358851674,
"grad_norm": 0.44639648871243803,
"learning_rate": 1.7834074023722082e-06,
"loss": 0.1484,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13991107046604156,
"step": 3855,
"valid_targets_mean": 5152.2,
"valid_targets_min": 231
},
{
"epoch": 6.156299840510367,
"grad_norm": 0.489541279190905,
"learning_rate": 1.7507212895171632e-06,
"loss": 0.1532,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15481799840927124,
"step": 3860,
"valid_targets_mean": 5027.0,
"valid_targets_min": 318
},
{
"epoch": 6.164274322169059,
"grad_norm": 0.5049501309051616,
"learning_rate": 1.7183237729193081e-06,
"loss": 0.148,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16344068944454193,
"step": 3865,
"valid_targets_mean": 4705.1,
"valid_targets_min": 444
},
{
"epoch": 6.172248803827751,
"grad_norm": 0.5079803335616084,
"learning_rate": 1.6862153649168211e-06,
"loss": 0.1471,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15662287175655365,
"step": 3870,
"valid_targets_mean": 4186.4,
"valid_targets_min": 241
},
{
"epoch": 6.180223285486443,
"grad_norm": 0.5116936150655245,
"learning_rate": 1.6543965732758737e-06,
"loss": 0.1454,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1334778070449829,
"step": 3875,
"valid_targets_mean": 4322.1,
"valid_targets_min": 326
},
{
"epoch": 6.188197767145136,
"grad_norm": 0.45160368109673826,
"learning_rate": 1.6228679011826032e-06,
"loss": 0.1491,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16378632187843323,
"step": 3880,
"valid_targets_mean": 5385.4,
"valid_targets_min": 547
},
{
"epoch": 6.196172248803828,
"grad_norm": 0.4571770596267456,
"learning_rate": 1.591629847235172e-06,
"loss": 0.1476,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14328834414482117,
"step": 3885,
"valid_targets_mean": 5291.6,
"valid_targets_min": 598
},
{
"epoch": 6.2041467304625195,
"grad_norm": 0.4692079789797092,
"learning_rate": 1.5606829054358686e-06,
"loss": 0.1419,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.150887131690979,
"step": 3890,
"valid_targets_mean": 5435.4,
"valid_targets_min": 1139
},
{
"epoch": 6.212121212121212,
"grad_norm": 0.426069274473679,
"learning_rate": 1.5300275651832963e-06,
"loss": 0.1517,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14551419019699097,
"step": 3895,
"valid_targets_mean": 6428.3,
"valid_targets_min": 1623
},
{
"epoch": 6.220095693779904,
"grad_norm": 0.6045869058817608,
"learning_rate": 1.499664311264648e-06,
"loss": 0.1423,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14620190858840942,
"step": 3900,
"valid_targets_mean": 4127.7,
"valid_targets_min": 252
},
{
"epoch": 6.228070175438597,
"grad_norm": 0.5782970704223566,
"learning_rate": 1.4695936238480135e-06,
"loss": 0.1515,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1496705263853073,
"step": 3905,
"valid_targets_mean": 3291.6,
"valid_targets_min": 240
},
{
"epoch": 6.236044657097288,
"grad_norm": 0.47876040223726124,
"learning_rate": 1.4398159784748144e-06,
"loss": 0.1464,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15745174884796143,
"step": 3910,
"valid_targets_mean": 5079.1,
"valid_targets_min": 266
},
{
"epoch": 6.244019138755981,
"grad_norm": 0.5126346829344415,
"learning_rate": 1.4103318460522598e-06,
"loss": 0.1527,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16566559672355652,
"step": 3915,
"valid_targets_mean": 4192.6,
"valid_targets_min": 273
},
{
"epoch": 6.251993620414673,
"grad_norm": 0.5416124300618265,
"learning_rate": 1.3811416928459177e-06,
"loss": 0.1492,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15463967621326447,
"step": 3920,
"valid_targets_mean": 4478.5,
"valid_targets_min": 272
},
{
"epoch": 6.2599681020733655,
"grad_norm": 0.4448108644678357,
"learning_rate": 1.3522459804723353e-06,
"loss": 0.1464,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1516856849193573,
"step": 3925,
"valid_targets_mean": 5685.1,
"valid_targets_min": 711
},
{
"epoch": 6.267942583732057,
"grad_norm": 0.4289450178961959,
"learning_rate": 1.3236451658917293e-06,
"loss": 0.1466,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15075251460075378,
"step": 3930,
"valid_targets_mean": 5997.5,
"valid_targets_min": 2915
},
{
"epoch": 6.2759170653907494,
"grad_norm": 0.46681109243000163,
"learning_rate": 1.2953397014007728e-06,
"loss": 0.1524,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14777758717536926,
"step": 3935,
"valid_targets_mean": 5023.1,
"valid_targets_min": 390
},
{
"epoch": 6.283891547049442,
"grad_norm": 0.42835960080586744,
"learning_rate": 1.2673300346254447e-06,
"loss": 0.1415,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13789385557174683,
"step": 3940,
"valid_targets_mean": 5225.6,
"valid_targets_min": 289
},
{
"epoch": 6.291866028708134,
"grad_norm": 0.5196426280217668,
"learning_rate": 1.239616608513925e-06,
"loss": 0.1535,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15100279450416565,
"step": 3945,
"valid_targets_mean": 4081.2,
"valid_targets_min": 286
},
{
"epoch": 6.299840510366826,
"grad_norm": 0.5022813022318281,
"learning_rate": 1.2121998613296259e-06,
"loss": 0.1531,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14675407111644745,
"step": 3950,
"valid_targets_mean": 5395.9,
"valid_targets_min": 412
},
{
"epoch": 6.307814992025518,
"grad_norm": 0.44890211526343465,
"learning_rate": 1.1850802266442396e-06,
"loss": 0.1531,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1509132981300354,
"step": 3955,
"valid_targets_mean": 5812.4,
"valid_targets_min": 2642
},
{
"epoch": 6.315789473684211,
"grad_norm": 0.5061776876413504,
"learning_rate": 1.1582581333308784e-06,
"loss": 0.1557,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14476345479488373,
"step": 3960,
"valid_targets_mean": 4706.8,
"valid_targets_min": 408
},
{
"epoch": 6.323763955342903,
"grad_norm": 0.5217658882608658,
"learning_rate": 1.1317340055573122e-06,
"loss": 0.144,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14775893092155457,
"step": 3965,
"valid_targets_mean": 3739.5,
"valid_targets_min": 199
},
{
"epoch": 6.3317384370015946,
"grad_norm": 0.5118859450723333,
"learning_rate": 1.1055082627792357e-06,
"loss": 0.1483,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16105467081069946,
"step": 3970,
"valid_targets_mean": 4756.9,
"valid_targets_min": 293
},
{
"epoch": 6.339712918660287,
"grad_norm": 0.5054678322271705,
"learning_rate": 1.0795813197336602e-06,
"loss": 0.1506,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12841784954071045,
"step": 3975,
"valid_targets_mean": 4324.1,
"valid_targets_min": 251
},
{
"epoch": 6.347687400318979,
"grad_norm": 0.5102069371772863,
"learning_rate": 1.0539535864323391e-06,
"loss": 0.1466,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.164170041680336,
"step": 3980,
"valid_targets_mean": 4642.5,
"valid_targets_min": 212
},
{
"epoch": 6.355661881977672,
"grad_norm": 0.47695267618075876,
"learning_rate": 1.0286254681552777e-06,
"loss": 0.1519,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15313708782196045,
"step": 3985,
"valid_targets_mean": 5626.9,
"valid_targets_min": 273
},
{
"epoch": 6.363636363636363,
"grad_norm": 0.43091234410044393,
"learning_rate": 1.0035973654443466e-06,
"loss": 0.1469,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15081724524497986,
"step": 3990,
"valid_targets_mean": 5959.9,
"valid_targets_min": 284
},
{
"epoch": 6.371610845295056,
"grad_norm": 0.5340840931679183,
"learning_rate": 9.788696740969295e-07,
"loss": 0.1516,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14918410778045654,
"step": 3995,
"valid_targets_mean": 4531.4,
"valid_targets_min": 1210
},
{
"epoch": 6.379585326953748,
"grad_norm": 0.4247409219481503,
"learning_rate": 9.544427851596661e-07,
"loss": 0.1501,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14433777332305908,
"step": 4000,
"valid_targets_mean": 6152.6,
"valid_targets_min": 241
},
{
"epoch": 6.3875598086124405,
"grad_norm": 0.4895024880775478,
"learning_rate": 9.303170849222764e-07,
"loss": 0.1469,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1440003663301468,
"step": 4005,
"valid_targets_mean": 4668.4,
"valid_targets_min": 300
},
{
"epoch": 6.395534290271132,
"grad_norm": 0.429988312127633,
"learning_rate": 9.064929549114421e-07,
"loss": 0.161,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1483185589313507,
"step": 4010,
"valid_targets_mean": 6485.9,
"valid_targets_min": 3764
},
{
"epoch": 6.4035087719298245,
"grad_norm": 0.46137829910478273,
"learning_rate": 8.829707718847835e-07,
"loss": 0.1584,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15009953081607819,
"step": 4015,
"valid_targets_mean": 5219.5,
"valid_targets_min": 341
},
{
"epoch": 6.411483253588517,
"grad_norm": 0.47612714642052334,
"learning_rate": 8.597509078248923e-07,
"loss": 0.1408,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14877188205718994,
"step": 4020,
"valid_targets_mean": 5458.4,
"valid_targets_min": 263
},
{
"epoch": 6.419457735247209,
"grad_norm": 0.4790590020325636,
"learning_rate": 8.368337299334461e-07,
"loss": 0.1494,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14202189445495605,
"step": 4025,
"valid_targets_mean": 4610.4,
"valid_targets_min": 221
},
{
"epoch": 6.427432216905901,
"grad_norm": 0.43486828774128805,
"learning_rate": 8.142196006254144e-07,
"loss": 0.1528,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14796648919582367,
"step": 4030,
"valid_targets_mean": 5326.4,
"valid_targets_min": 357
},
{
"epoch": 6.435406698564593,
"grad_norm": 0.4703735281341048,
"learning_rate": 7.919088775233264e-07,
"loss": 0.1494,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.155422180891037,
"step": 4035,
"valid_targets_mean": 5504.8,
"valid_targets_min": 220
},
{
"epoch": 6.443381180223286,
"grad_norm": 0.535947939565035,
"learning_rate": 7.699019134515917e-07,
"loss": 0.1526,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15502360463142395,
"step": 4040,
"valid_targets_mean": 4319.9,
"valid_targets_min": 285
},
{
"epoch": 6.451355661881978,
"grad_norm": 0.4818703555632311,
"learning_rate": 7.48199056430956e-07,
"loss": 0.1559,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1630256175994873,
"step": 4045,
"valid_targets_mean": 5285.6,
"valid_targets_min": 208
},
{
"epoch": 6.45933014354067,
"grad_norm": 0.5035873377823161,
"learning_rate": 7.268006496729762e-07,
"loss": 0.1496,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15067459642887115,
"step": 4050,
"valid_targets_mean": 5337.9,
"valid_targets_min": 174
},
{
"epoch": 6.467304625199362,
"grad_norm": 0.502747428173728,
"learning_rate": 7.057070315745851e-07,
"loss": 0.1486,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1535114347934723,
"step": 4055,
"valid_targets_mean": 4404.4,
"valid_targets_min": 201
},
{
"epoch": 6.475279106858054,
"grad_norm": 0.4016268682691944,
"learning_rate": 6.849185357127686e-07,
"loss": 0.1524,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1472223699092865,
"step": 4060,
"valid_targets_mean": 5625.4,
"valid_targets_min": 252
},
{
"epoch": 6.483253588516747,
"grad_norm": 0.500867474532203,
"learning_rate": 6.64435490839257e-07,
"loss": 0.1468,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15104928612709045,
"step": 4065,
"valid_targets_mean": 5525.7,
"valid_targets_min": 233
},
{
"epoch": 6.491228070175438,
"grad_norm": 0.4376815836110299,
"learning_rate": 6.442582208753578e-07,
"loss": 0.1541,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15212634205818176,
"step": 4070,
"valid_targets_mean": 6167.4,
"valid_targets_min": 372
},
{
"epoch": 6.499202551834131,
"grad_norm": 0.4925011711593379,
"learning_rate": 6.243870449068068e-07,
"loss": 0.1485,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13938778638839722,
"step": 4075,
"valid_targets_mean": 4858.9,
"valid_targets_min": 293
},
{
"epoch": 6.507177033492823,
"grad_norm": 0.5028373020409859,
"learning_rate": 6.048222771787382e-07,
"loss": 0.1514,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14744833111763,
"step": 4080,
"valid_targets_mean": 4449.3,
"valid_targets_min": 285
},
{
"epoch": 6.515151515151516,
"grad_norm": 0.4451538888037021,
"learning_rate": 5.85564227090707e-07,
"loss": 0.1558,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15033164620399475,
"step": 4085,
"valid_targets_mean": 5139.9,
"valid_targets_min": 227
},
{
"epoch": 6.523125996810207,
"grad_norm": 0.49448838566482495,
"learning_rate": 5.666131991917989e-07,
"loss": 0.1485,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14017827808856964,
"step": 4090,
"valid_targets_mean": 5041.9,
"valid_targets_min": 233
},
{
"epoch": 6.5311004784688995,
"grad_norm": 0.5416350180533349,
"learning_rate": 5.479694931758194e-07,
"loss": 0.1503,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1785852611064911,
"step": 4095,
"valid_targets_mean": 5573.2,
"valid_targets_min": 437
},
{
"epoch": 6.539074960127592,
"grad_norm": 0.5628948990040651,
"learning_rate": 5.296334038765483e-07,
"loss": 0.1567,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1577194631099701,
"step": 4100,
"valid_targets_mean": 4427.6,
"valid_targets_min": 477
},
{
"epoch": 6.5470494417862835,
"grad_norm": 0.48315562844847276,
"learning_rate": 5.116052212630696e-07,
"loss": 0.1493,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14190314710140228,
"step": 4105,
"valid_targets_mean": 4638.1,
"valid_targets_min": 238
},
{
"epoch": 6.555023923444976,
"grad_norm": 0.4649105580146512,
"learning_rate": 4.938852304352026e-07,
"loss": 0.1542,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1748298704624176,
"step": 4110,
"valid_targets_mean": 6575.4,
"valid_targets_min": 783
},
{
"epoch": 6.562998405103668,
"grad_norm": 0.4586563960264318,
"learning_rate": 4.7647371161898547e-07,
"loss": 0.1491,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14360040426254272,
"step": 4115,
"valid_targets_mean": 5360.1,
"valid_targets_min": 332
},
{
"epoch": 6.570972886762361,
"grad_norm": 0.45085707891473675,
"learning_rate": 4.593709401622359e-07,
"loss": 0.1556,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1483638733625412,
"step": 4120,
"valid_targets_mean": 5548.3,
"valid_targets_min": 283
},
{
"epoch": 6.578947368421053,
"grad_norm": 0.46458186030605464,
"learning_rate": 4.425771865302153e-07,
"loss": 0.1394,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13930150866508484,
"step": 4125,
"valid_targets_mean": 5190.6,
"valid_targets_min": 350
},
{
"epoch": 6.586921850079745,
"grad_norm": 0.43541944344062583,
"learning_rate": 4.2609271630133174e-07,
"loss": 0.1569,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1533948928117752,
"step": 4130,
"valid_targets_mean": 5871.0,
"valid_targets_min": 231
},
{
"epoch": 6.594896331738437,
"grad_norm": 0.5031511197247889,
"learning_rate": 4.099177901629525e-07,
"loss": 0.1611,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.139293372631073,
"step": 4135,
"valid_targets_mean": 3976.4,
"valid_targets_min": 185
},
{
"epoch": 6.6028708133971294,
"grad_norm": 0.5019363115194629,
"learning_rate": 3.9405266390727836e-07,
"loss": 0.1515,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16090963780879974,
"step": 4140,
"valid_targets_mean": 5086.2,
"valid_targets_min": 195
},
{
"epoch": 6.610845295055821,
"grad_norm": 0.4844497814826883,
"learning_rate": 3.7849758842729344e-07,
"loss": 0.1531,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16627800464630127,
"step": 4145,
"valid_targets_mean": 5407.1,
"valid_targets_min": 199
},
{
"epoch": 6.618819776714513,
"grad_norm": 0.4591731715598886,
"learning_rate": 3.632528097128085e-07,
"loss": 0.1521,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14857414364814758,
"step": 4150,
"valid_targets_mean": 5256.8,
"valid_targets_min": 229
},
{
"epoch": 6.626794258373206,
"grad_norm": 0.5202929604535261,
"learning_rate": 3.48318568846564e-07,
"loss": 0.1494,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1455889195203781,
"step": 4155,
"valid_targets_mean": 4872.8,
"valid_targets_min": 247
},
{
"epoch": 6.634768740031898,
"grad_norm": 0.4705904446828977,
"learning_rate": 3.336951020004087e-07,
"loss": 0.1433,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14285165071487427,
"step": 4160,
"valid_targets_mean": 5109.5,
"valid_targets_min": 200
},
{
"epoch": 6.64274322169059,
"grad_norm": 0.45577635857265425,
"learning_rate": 3.1938264043158694e-07,
"loss": 0.1504,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13021527230739594,
"step": 4165,
"valid_targets_mean": 4774.4,
"valid_targets_min": 435
},
{
"epoch": 6.650717703349282,
"grad_norm": 0.4486128504903437,
"learning_rate": 3.05381410479062e-07,
"loss": 0.1398,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1472494751214981,
"step": 4170,
"valid_targets_mean": 5558.4,
"valid_targets_min": 536
},
{
"epoch": 6.6586921850079746,
"grad_norm": 0.4535891529882187,
"learning_rate": 2.916916335599407e-07,
"loss": 0.1479,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1309969127178192,
"step": 4175,
"valid_targets_mean": 5063.6,
"valid_targets_min": 443
},
{
"epoch": 6.666666666666667,
"grad_norm": 0.5137615372694194,
"learning_rate": 2.783135261659831e-07,
"loss": 0.1438,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.131601944565773,
"step": 4180,
"valid_targets_mean": 4253.1,
"valid_targets_min": 180
},
{
"epoch": 6.6746411483253585,
"grad_norm": 0.4956512141213648,
"learning_rate": 2.6524729986016293e-07,
"loss": 0.1581,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1345309317111969,
"step": 4185,
"valid_targets_mean": 4681.8,
"valid_targets_min": 370
},
{
"epoch": 6.682615629984051,
"grad_norm": 0.4322804982850078,
"learning_rate": 2.524931612733328e-07,
"loss": 0.1503,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1334218680858612,
"step": 4190,
"valid_targets_mean": 5158.1,
"valid_targets_min": 1221
},
{
"epoch": 6.690590111642743,
"grad_norm": 0.5524770921264247,
"learning_rate": 2.400513121009529e-07,
"loss": 0.1473,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13881897926330566,
"step": 4195,
"valid_targets_mean": 5170.0,
"valid_targets_min": 217
},
{
"epoch": 6.698564593301436,
"grad_norm": 0.4416808616196191,
"learning_rate": 2.279219490998985e-07,
"loss": 0.1484,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14825358986854553,
"step": 4200,
"valid_targets_mean": 5345.4,
"valid_targets_min": 192
},
{
"epoch": 6.706539074960127,
"grad_norm": 0.41557160123119896,
"learning_rate": 2.161052640853578e-07,
"loss": 0.1471,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15103837847709656,
"step": 4205,
"valid_targets_mean": 6218.0,
"valid_targets_min": 3267
},
{
"epoch": 6.71451355661882,
"grad_norm": 0.4665005539147527,
"learning_rate": 2.0460144392778768e-07,
"loss": 0.1423,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14628729224205017,
"step": 4210,
"valid_targets_mean": 5114.4,
"valid_targets_min": 184
},
{
"epoch": 6.722488038277512,
"grad_norm": 0.41678070100960785,
"learning_rate": 1.9341067054996277e-07,
"loss": 0.1538,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13423167169094086,
"step": 4215,
"valid_targets_mean": 6462.1,
"valid_targets_min": 707
},
{
"epoch": 6.7304625199362045,
"grad_norm": 0.5329553956676955,
"learning_rate": 1.8253312092409992e-07,
"loss": 0.1441,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16593559086322784,
"step": 4220,
"valid_targets_mean": 4739.5,
"valid_targets_min": 458
},
{
"epoch": 6.738437001594896,
"grad_norm": 0.4077664732039775,
"learning_rate": 1.7196896706906273e-07,
"loss": 0.1493,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14922519028186798,
"step": 4225,
"valid_targets_mean": 6259.2,
"valid_targets_min": 1201
},
{
"epoch": 6.746411483253588,
"grad_norm": 0.4572419979041358,
"learning_rate": 1.6171837604762597e-07,
"loss": 0.142,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14641094207763672,
"step": 4230,
"valid_targets_mean": 5254.2,
"valid_targets_min": 598
},
{
"epoch": 6.754385964912281,
"grad_norm": 0.494702420453681,
"learning_rate": 1.5178150996385755e-07,
"loss": 0.1516,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1475975215435028,
"step": 4235,
"valid_targets_mean": 4546.5,
"valid_targets_min": 232
},
{
"epoch": 6.762360446570973,
"grad_norm": 0.4796385200530194,
"learning_rate": 1.421585259605318e-07,
"loss": 0.1478,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1568702608346939,
"step": 4240,
"valid_targets_mean": 5172.8,
"valid_targets_min": 260
},
{
"epoch": 6.770334928229665,
"grad_norm": 0.43075191213287334,
"learning_rate": 1.3284957621666039e-07,
"loss": 0.1412,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14368301630020142,
"step": 4245,
"valid_targets_mean": 5836.8,
"valid_targets_min": 1704
},
{
"epoch": 6.778309409888357,
"grad_norm": 0.4851600090501543,
"learning_rate": 1.2385480794507853e-07,
"loss": 0.1531,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13613252341747284,
"step": 4250,
"valid_targets_mean": 5194.1,
"valid_targets_min": 224
},
{
"epoch": 6.78628389154705,
"grad_norm": 0.49076420450563607,
"learning_rate": 1.1517436339011589e-07,
"loss": 0.1597,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1567186713218689,
"step": 4255,
"valid_targets_mean": 4560.8,
"valid_targets_min": 306
},
{
"epoch": 6.794258373205742,
"grad_norm": 0.481268750942527,
"learning_rate": 1.0680837982535607e-07,
"loss": 0.1517,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13878720998764038,
"step": 4260,
"valid_targets_mean": 5214.8,
"valid_targets_min": 247
},
{
"epoch": 6.8022328548644335,
"grad_norm": 0.525692133957443,
"learning_rate": 9.875698955145174e-08,
"loss": 0.1463,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12678062915802002,
"step": 4265,
"valid_targets_mean": 4339.8,
"valid_targets_min": 242
},
{
"epoch": 6.810207336523126,
"grad_norm": 0.42621079495304015,
"learning_rate": 9.102031989404403e-08,
"loss": 0.1599,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1495763659477234,
"step": 4270,
"valid_targets_mean": 5675.7,
"valid_targets_min": 642
},
{
"epoch": 6.818181818181818,
"grad_norm": 0.4580655646450462,
"learning_rate": 8.359849320174196e-08,
"loss": 0.1499,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15296252071857452,
"step": 4275,
"valid_targets_mean": 5290.6,
"valid_targets_min": 261
},
{
"epoch": 6.826156299840511,
"grad_norm": 0.424793015484167,
"learning_rate": 7.649162684419731e-08,
"loss": 0.1459,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1285790205001831,
"step": 4280,
"valid_targets_mean": 5851.7,
"valid_targets_min": 997
},
{
"epoch": 6.834130781499202,
"grad_norm": 0.6009179207598535,
"learning_rate": 6.969983321023499e-08,
"loss": 0.1455,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15977022051811218,
"step": 4285,
"valid_targets_mean": 4550.5,
"valid_targets_min": 446
},
{
"epoch": 6.842105263157895,
"grad_norm": 0.43101483729428003,
"learning_rate": 6.322321970608337e-08,
"loss": 0.1429,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13828077912330627,
"step": 4290,
"valid_targets_mean": 6386.3,
"valid_targets_min": 205
},
{
"epoch": 6.850079744816587,
"grad_norm": 0.4465415769876545,
"learning_rate": 5.7061888753677796e-08,
"loss": 0.1473,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1383409947156906,
"step": 4295,
"valid_targets_mean": 5717.8,
"valid_targets_min": 262
},
{
"epoch": 6.858054226475279,
"grad_norm": 0.5473085555335196,
"learning_rate": 5.121593778903755e-08,
"loss": 0.1451,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14721372723579407,
"step": 4300,
"valid_targets_mean": 4142.8,
"valid_targets_min": 239
},
{
"epoch": 6.866028708133971,
"grad_norm": 0.4853378564035753,
"learning_rate": 4.5685459260722544e-08,
"loss": 0.1539,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15751667320728302,
"step": 4305,
"valid_targets_mean": 5418.1,
"valid_targets_min": 238
},
{
"epoch": 6.8740031897926634,
"grad_norm": 0.4931042806071698,
"learning_rate": 4.047054062837452e-08,
"loss": 0.1523,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14012879133224487,
"step": 4310,
"valid_targets_mean": 4697.9,
"valid_targets_min": 230
},
{
"epoch": 6.881977671451356,
"grad_norm": 0.8971037686738282,
"learning_rate": 3.55712643613404e-08,
"loss": 0.1549,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15433238446712494,
"step": 4315,
"valid_targets_mean": 4864.7,
"valid_targets_min": 205
},
{
"epoch": 6.889952153110048,
"grad_norm": 0.4692472893763074,
"learning_rate": 3.0987707937351066e-08,
"loss": 0.1539,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1405605673789978,
"step": 4320,
"valid_targets_mean": 4847.9,
"valid_targets_min": 302
},
{
"epoch": 6.89792663476874,
"grad_norm": 0.47088407985998104,
"learning_rate": 2.6719943841311268e-08,
"loss": 0.1397,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14168399572372437,
"step": 4325,
"valid_targets_mean": 4563.3,
"valid_targets_min": 186
},
{
"epoch": 6.905901116427432,
"grad_norm": 0.4156838063505349,
"learning_rate": 2.2768039564151635e-08,
"loss": 0.1483,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1466359794139862,
"step": 4330,
"valid_targets_mean": 6131.1,
"valid_targets_min": 222
},
{
"epoch": 6.913875598086125,
"grad_norm": 0.45459420575813153,
"learning_rate": 1.913205760175174e-08,
"loss": 0.1477,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1472633183002472,
"step": 4335,
"valid_targets_mean": 5499.1,
"valid_targets_min": 918
},
{
"epoch": 6.921850079744816,
"grad_norm": 0.5393281054744222,
"learning_rate": 1.5812055453963136e-08,
"loss": 0.1507,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1455461084842682,
"step": 4340,
"valid_targets_mean": 4090.8,
"valid_targets_min": 223
},
{
"epoch": 6.9298245614035086,
"grad_norm": 0.4636075944477561,
"learning_rate": 1.280808562369229e-08,
"loss": 0.1462,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15545576810836792,
"step": 4345,
"valid_targets_mean": 5444.2,
"valid_targets_min": 306
},
{
"epoch": 6.937799043062201,
"grad_norm": 0.4669452035057073,
"learning_rate": 1.01201956160768e-08,
"loss": 0.1512,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16182288527488708,
"step": 4350,
"valid_targets_mean": 5502.8,
"valid_targets_min": 237
},
{
"epoch": 6.945773524720893,
"grad_norm": 0.5151990228437675,
"learning_rate": 7.74842793772601e-09,
"loss": 0.1502,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16319866478443146,
"step": 4355,
"valid_targets_mean": 4926.0,
"valid_targets_min": 294
},
{
"epoch": 6.953748006379586,
"grad_norm": 0.4990613508241575,
"learning_rate": 5.692820096054874e-09,
"loss": 0.1568,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18269044160842896,
"step": 4360,
"valid_targets_mean": 5456.6,
"valid_targets_min": 353
},
{
"epoch": 6.961722488038277,
"grad_norm": 0.4688789910525006,
"learning_rate": 3.9534045986888706e-09,
"loss": 0.144,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1274082511663437,
"step": 4365,
"valid_targets_mean": 4650.2,
"valid_targets_min": 253
},
{
"epoch": 6.96969696969697,
"grad_norm": 0.47324806337291064,
"learning_rate": 2.530208952953306e-09,
"loss": 0.1482,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16023960709571838,
"step": 4370,
"valid_targets_mean": 5175.2,
"valid_targets_min": 188
},
{
"epoch": 6.977671451355662,
"grad_norm": 0.5245943580661637,
"learning_rate": 1.4232556654314445e-09,
"loss": 0.1481,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14867472648620605,
"step": 4375,
"valid_targets_mean": 4396.8,
"valid_targets_min": 217
},
{
"epoch": 6.985645933014354,
"grad_norm": 0.49879412018200225,
"learning_rate": 6.325622416136767e-10,
"loss": 0.1505,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16116350889205933,
"step": 4380,
"valid_targets_mean": 5194.9,
"valid_targets_min": 606
},
{
"epoch": 6.993620414673046,
"grad_norm": 0.5977785482250375,
"learning_rate": 1.581411856199644e-10,
"loss": 0.1541,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16265273094177246,
"step": 4385,
"valid_targets_mean": 4349.9,
"valid_targets_min": 237
},
{
"epoch": 7.0,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1386960744857788,
"step": 4389,
"total_flos": 1630450968166400.0,
"train_loss": 0.1932186623672386,
"train_runtime": 23240.6244,
"train_samples_per_second": 3.017,
"train_steps_per_second": 0.189,
"valid_targets_mean": 4301.4,
"valid_targets_min": 221
}
],
"logging_steps": 5,
"max_steps": 4389,
"num_input_tokens_seen": 0,
"num_train_epochs": 7,
"save_steps": 1500,
"stateful_callbacks": {
"TrainerControl": {
"args": {
"should_epoch_stop": false,
"should_evaluate": false,
"should_log": false,
"should_save": true,
"should_training_stop": true
},
"attributes": {}
}
},
"total_flos": 1630450968166400.0,
"train_batch_size": 1,
"trial_name": null,
"trial_params": null
}