Files
a1-curriculum_easy/trainer_state.json
ModelHub XC 79b9c7fc7b 初始化项目,由ModelHub XC社区提供模型
Model: DCAgent/a1-curriculum_easy
Source: Original Platform
2026-05-13 12:40:16 +08:00

9101 lines
253 KiB
JSON

{
"best_global_step": null,
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 7.0,
"eval_steps": 500,
"global_step": 4116,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.008503401360544218,
"grad_norm": 16.284088332723297,
"learning_rate": 3.883495145631068e-07,
"loss": 0.7008,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6880989074707031,
"step": 5,
"valid_targets_mean": 3394.2,
"valid_targets_min": 1520
},
{
"epoch": 0.017006802721088437,
"grad_norm": 14.839739819166988,
"learning_rate": 8.737864077669904e-07,
"loss": 0.6754,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6068336367607117,
"step": 10,
"valid_targets_mean": 3490.3,
"valid_targets_min": 1012
},
{
"epoch": 0.025510204081632654,
"grad_norm": 13.952466669607169,
"learning_rate": 1.359223300970874e-06,
"loss": 0.6342,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6203460693359375,
"step": 15,
"valid_targets_mean": 3233.2,
"valid_targets_min": 1535
},
{
"epoch": 0.034013605442176874,
"grad_norm": 12.6446610614783,
"learning_rate": 1.8446601941747574e-06,
"loss": 0.6454,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6516385674476624,
"step": 20,
"valid_targets_mean": 3449.2,
"valid_targets_min": 1103
},
{
"epoch": 0.04251700680272109,
"grad_norm": 8.19224953585781,
"learning_rate": 2.330097087378641e-06,
"loss": 0.5636,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5059263110160828,
"step": 25,
"valid_targets_mean": 3176.9,
"valid_targets_min": 1296
},
{
"epoch": 0.05102040816326531,
"grad_norm": 5.247631542695172,
"learning_rate": 2.8155339805825245e-06,
"loss": 0.5175,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4891727566719055,
"step": 30,
"valid_targets_mean": 3418.7,
"valid_targets_min": 1376
},
{
"epoch": 0.05952380952380952,
"grad_norm": 3.1552727841621153,
"learning_rate": 3.300970873786408e-06,
"loss": 0.4638,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4893268942832947,
"step": 35,
"valid_targets_mean": 3089.0,
"valid_targets_min": 1058
},
{
"epoch": 0.06802721088435375,
"grad_norm": 1.6068476825700668,
"learning_rate": 3.7864077669902915e-06,
"loss": 0.4355,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4086935222148895,
"step": 40,
"valid_targets_mean": 4035.6,
"valid_targets_min": 1506
},
{
"epoch": 0.07653061224489796,
"grad_norm": 1.2002679568552468,
"learning_rate": 4.271844660194175e-06,
"loss": 0.3964,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.403389573097229,
"step": 45,
"valid_targets_mean": 3934.1,
"valid_targets_min": 1328
},
{
"epoch": 0.08503401360544217,
"grad_norm": 0.9667513884903771,
"learning_rate": 4.7572815533980585e-06,
"loss": 0.3921,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39787787199020386,
"step": 50,
"valid_targets_mean": 4216.1,
"valid_targets_min": 1416
},
{
"epoch": 0.0935374149659864,
"grad_norm": 0.8925696727275947,
"learning_rate": 5.242718446601942e-06,
"loss": 0.3858,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.46847638487815857,
"step": 55,
"valid_targets_mean": 4303.9,
"valid_targets_min": 1352
},
{
"epoch": 0.10204081632653061,
"grad_norm": 0.8357941987187405,
"learning_rate": 5.728155339805825e-06,
"loss": 0.3561,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3789106011390686,
"step": 60,
"valid_targets_mean": 3574.6,
"valid_targets_min": 1645
},
{
"epoch": 0.11054421768707483,
"grad_norm": 0.7397059160537327,
"learning_rate": 6.213592233009709e-06,
"loss": 0.3645,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.42246219515800476,
"step": 65,
"valid_targets_mean": 3720.4,
"valid_targets_min": 1078
},
{
"epoch": 0.11904761904761904,
"grad_norm": 1.126422671830154,
"learning_rate": 6.6990291262135935e-06,
"loss": 0.3923,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3333202600479126,
"step": 70,
"valid_targets_mean": 3193.3,
"valid_targets_min": 1204
},
{
"epoch": 0.12755102040816327,
"grad_norm": 0.632940371104463,
"learning_rate": 7.184466019417476e-06,
"loss": 0.3502,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33268964290618896,
"step": 75,
"valid_targets_mean": 3355.2,
"valid_targets_min": 1090
},
{
"epoch": 0.1360544217687075,
"grad_norm": 0.6098061945319946,
"learning_rate": 7.66990291262136e-06,
"loss": 0.3143,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3157602846622467,
"step": 80,
"valid_targets_mean": 3896.2,
"valid_targets_min": 1676
},
{
"epoch": 0.1445578231292517,
"grad_norm": 0.6247199509119066,
"learning_rate": 8.155339805825243e-06,
"loss": 0.3412,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38960957527160645,
"step": 85,
"valid_targets_mean": 3736.6,
"valid_targets_min": 793
},
{
"epoch": 0.15306122448979592,
"grad_norm": 0.7385270073420317,
"learning_rate": 8.640776699029127e-06,
"loss": 0.3213,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33316653966903687,
"step": 90,
"valid_targets_mean": 2948.8,
"valid_targets_min": 1070
},
{
"epoch": 0.16156462585034015,
"grad_norm": 0.492100707949269,
"learning_rate": 9.12621359223301e-06,
"loss": 0.3177,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2514708340167999,
"step": 95,
"valid_targets_mean": 4425.4,
"valid_targets_min": 1240
},
{
"epoch": 0.17006802721088435,
"grad_norm": 0.5951003547593199,
"learning_rate": 9.611650485436894e-06,
"loss": 0.3373,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2692122757434845,
"step": 100,
"valid_targets_mean": 2710.9,
"valid_targets_min": 1322
},
{
"epoch": 0.17857142857142858,
"grad_norm": 0.7613709438724316,
"learning_rate": 1.0097087378640778e-05,
"loss": 0.3134,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38309434056282043,
"step": 105,
"valid_targets_mean": 3319.0,
"valid_targets_min": 1125
},
{
"epoch": 0.1870748299319728,
"grad_norm": 0.5914325453792764,
"learning_rate": 1.0582524271844662e-05,
"loss": 0.2831,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25947824120521545,
"step": 110,
"valid_targets_mean": 2820.6,
"valid_targets_min": 690
},
{
"epoch": 0.195578231292517,
"grad_norm": 0.6002580182988407,
"learning_rate": 1.1067961165048544e-05,
"loss": 0.3157,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35196587443351746,
"step": 115,
"valid_targets_mean": 3586.2,
"valid_targets_min": 668
},
{
"epoch": 0.20408163265306123,
"grad_norm": 0.5372570805761464,
"learning_rate": 1.1553398058252427e-05,
"loss": 0.2864,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28968310356140137,
"step": 120,
"valid_targets_mean": 4067.5,
"valid_targets_min": 1436
},
{
"epoch": 0.21258503401360543,
"grad_norm": 0.5237896767254485,
"learning_rate": 1.2038834951456311e-05,
"loss": 0.3084,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32339826226234436,
"step": 125,
"valid_targets_mean": 4317.6,
"valid_targets_min": 1065
},
{
"epoch": 0.22108843537414966,
"grad_norm": 0.5670068619189014,
"learning_rate": 1.2524271844660197e-05,
"loss": 0.3131,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3546511232852936,
"step": 130,
"valid_targets_mean": 3980.6,
"valid_targets_min": 758
},
{
"epoch": 0.22959183673469388,
"grad_norm": 0.5255698995362615,
"learning_rate": 1.300970873786408e-05,
"loss": 0.2865,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28089749813079834,
"step": 135,
"valid_targets_mean": 4137.8,
"valid_targets_min": 804
},
{
"epoch": 0.23809523809523808,
"grad_norm": 0.5595742490638705,
"learning_rate": 1.3495145631067962e-05,
"loss": 0.2783,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.267475962638855,
"step": 140,
"valid_targets_mean": 3784.4,
"valid_targets_min": 1328
},
{
"epoch": 0.2465986394557823,
"grad_norm": 0.588682917285768,
"learning_rate": 1.3980582524271846e-05,
"loss": 0.2872,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28826704621315,
"step": 145,
"valid_targets_mean": 3321.7,
"valid_targets_min": 1237
},
{
"epoch": 0.25510204081632654,
"grad_norm": 0.6379265355221891,
"learning_rate": 1.446601941747573e-05,
"loss": 0.2927,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3119679093360901,
"step": 150,
"valid_targets_mean": 3228.9,
"valid_targets_min": 1314
},
{
"epoch": 0.26360544217687076,
"grad_norm": 1.1311868788928263,
"learning_rate": 1.4951456310679614e-05,
"loss": 0.2733,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28038668632507324,
"step": 155,
"valid_targets_mean": 3130.2,
"valid_targets_min": 1197
},
{
"epoch": 0.272108843537415,
"grad_norm": 0.5961390202565682,
"learning_rate": 1.5436893203883496e-05,
"loss": 0.2739,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23698543012142181,
"step": 160,
"valid_targets_mean": 3128.9,
"valid_targets_min": 1230
},
{
"epoch": 0.28061224489795916,
"grad_norm": 0.748114955090481,
"learning_rate": 1.592233009708738e-05,
"loss": 0.2787,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2971285581588745,
"step": 165,
"valid_targets_mean": 3631.0,
"valid_targets_min": 1322
},
{
"epoch": 0.2891156462585034,
"grad_norm": 0.5913012294912496,
"learning_rate": 1.6407766990291263e-05,
"loss": 0.267,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2528142035007477,
"step": 170,
"valid_targets_mean": 3472.6,
"valid_targets_min": 1044
},
{
"epoch": 0.2976190476190476,
"grad_norm": 0.6335415710139134,
"learning_rate": 1.6893203883495145e-05,
"loss": 0.2912,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3000209629535675,
"step": 175,
"valid_targets_mean": 3211.1,
"valid_targets_min": 951
},
{
"epoch": 0.30612244897959184,
"grad_norm": 0.5716361790983413,
"learning_rate": 1.737864077669903e-05,
"loss": 0.2688,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25265321135520935,
"step": 180,
"valid_targets_mean": 3723.9,
"valid_targets_min": 1553
},
{
"epoch": 0.31462585034013607,
"grad_norm": 0.5461651660212551,
"learning_rate": 1.7864077669902916e-05,
"loss": 0.2591,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22830471396446228,
"step": 185,
"valid_targets_mean": 3600.1,
"valid_targets_min": 277
},
{
"epoch": 0.3231292517006803,
"grad_norm": 0.6266878783879113,
"learning_rate": 1.8349514563106798e-05,
"loss": 0.2765,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27608734369277954,
"step": 190,
"valid_targets_mean": 3576.2,
"valid_targets_min": 1838
},
{
"epoch": 0.33163265306122447,
"grad_norm": 0.6262564074677799,
"learning_rate": 1.883495145631068e-05,
"loss": 0.2895,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33075207471847534,
"step": 195,
"valid_targets_mean": 3644.2,
"valid_targets_min": 1408
},
{
"epoch": 0.3401360544217687,
"grad_norm": 0.6222343963607243,
"learning_rate": 1.9320388349514565e-05,
"loss": 0.2896,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28491562604904175,
"step": 200,
"valid_targets_mean": 3473.6,
"valid_targets_min": 1591
},
{
"epoch": 0.3486394557823129,
"grad_norm": 0.5692531688349544,
"learning_rate": 1.9805825242718447e-05,
"loss": 0.2575,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2638142704963684,
"step": 205,
"valid_targets_mean": 4383.2,
"valid_targets_min": 1505
},
{
"epoch": 0.35714285714285715,
"grad_norm": 0.6016824349437719,
"learning_rate": 2.0291262135922333e-05,
"loss": 0.2622,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2720300257205963,
"step": 210,
"valid_targets_mean": 3857.2,
"valid_targets_min": 1115
},
{
"epoch": 0.3656462585034014,
"grad_norm": 0.5660323710291796,
"learning_rate": 2.0776699029126215e-05,
"loss": 0.2289,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20892475545406342,
"step": 215,
"valid_targets_mean": 3352.7,
"valid_targets_min": 1090
},
{
"epoch": 0.3741496598639456,
"grad_norm": 0.5397652134256967,
"learning_rate": 2.1262135922330097e-05,
"loss": 0.2622,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2417203038930893,
"step": 220,
"valid_targets_mean": 3862.2,
"valid_targets_min": 1166
},
{
"epoch": 0.3826530612244898,
"grad_norm": 0.9020207934335027,
"learning_rate": 2.1747572815533982e-05,
"loss": 0.2535,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2550874948501587,
"step": 225,
"valid_targets_mean": 4108.3,
"valid_targets_min": 1093
},
{
"epoch": 0.391156462585034,
"grad_norm": 0.5496806077798531,
"learning_rate": 2.2233009708737864e-05,
"loss": 0.2535,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2542770206928253,
"step": 230,
"valid_targets_mean": 3857.4,
"valid_targets_min": 1737
},
{
"epoch": 0.39965986394557823,
"grad_norm": 0.5786260227985688,
"learning_rate": 2.271844660194175e-05,
"loss": 0.249,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23735564947128296,
"step": 235,
"valid_targets_mean": 3291.6,
"valid_targets_min": 1552
},
{
"epoch": 0.40816326530612246,
"grad_norm": 0.624916105565735,
"learning_rate": 2.3203883495145632e-05,
"loss": 0.2673,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25283026695251465,
"step": 240,
"valid_targets_mean": 3140.6,
"valid_targets_min": 1101
},
{
"epoch": 0.4166666666666667,
"grad_norm": 0.6230467099115211,
"learning_rate": 2.3689320388349514e-05,
"loss": 0.2554,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23698002099990845,
"step": 245,
"valid_targets_mean": 3379.9,
"valid_targets_min": 868
},
{
"epoch": 0.42517006802721086,
"grad_norm": 0.5654277458214261,
"learning_rate": 2.41747572815534e-05,
"loss": 0.2563,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25777631998062134,
"step": 250,
"valid_targets_mean": 4212.4,
"valid_targets_min": 1376
},
{
"epoch": 0.4336734693877551,
"grad_norm": 0.845325859827072,
"learning_rate": 2.466019417475728e-05,
"loss": 0.2738,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28165894746780396,
"step": 255,
"valid_targets_mean": 3721.9,
"valid_targets_min": 1469
},
{
"epoch": 0.4421768707482993,
"grad_norm": 0.5477155296016747,
"learning_rate": 2.514563106796117e-05,
"loss": 0.2401,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22638031840324402,
"step": 260,
"valid_targets_mean": 3850.2,
"valid_targets_min": 1020
},
{
"epoch": 0.45068027210884354,
"grad_norm": 0.590971583313143,
"learning_rate": 2.5631067961165052e-05,
"loss": 0.2419,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25587913393974304,
"step": 265,
"valid_targets_mean": 3664.8,
"valid_targets_min": 1193
},
{
"epoch": 0.45918367346938777,
"grad_norm": 0.7112768961498113,
"learning_rate": 2.6116504854368934e-05,
"loss": 0.2481,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2385358214378357,
"step": 270,
"valid_targets_mean": 3111.2,
"valid_targets_min": 738
},
{
"epoch": 0.467687074829932,
"grad_norm": 0.5301764242793776,
"learning_rate": 2.660194174757282e-05,
"loss": 0.2667,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.267933189868927,
"step": 275,
"valid_targets_mean": 4447.9,
"valid_targets_min": 1926
},
{
"epoch": 0.47619047619047616,
"grad_norm": 0.5551111127425339,
"learning_rate": 2.7087378640776702e-05,
"loss": 0.2395,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21886155009269714,
"step": 280,
"valid_targets_mean": 3772.6,
"valid_targets_min": 1751
},
{
"epoch": 0.4846938775510204,
"grad_norm": 0.5167918851842331,
"learning_rate": 2.7572815533980587e-05,
"loss": 0.2642,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27086275815963745,
"step": 285,
"valid_targets_mean": 4184.1,
"valid_targets_min": 1025
},
{
"epoch": 0.4931972789115646,
"grad_norm": 0.7009839725364524,
"learning_rate": 2.805825242718447e-05,
"loss": 0.2415,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23540431261062622,
"step": 290,
"valid_targets_mean": 3462.0,
"valid_targets_min": 1618
},
{
"epoch": 0.5017006802721088,
"grad_norm": 0.6603793288831256,
"learning_rate": 2.854368932038835e-05,
"loss": 0.2556,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22473765909671783,
"step": 295,
"valid_targets_mean": 2997.2,
"valid_targets_min": 1662
},
{
"epoch": 0.5102040816326531,
"grad_norm": 0.5472173526564987,
"learning_rate": 2.9029126213592237e-05,
"loss": 0.2277,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2626279294490814,
"step": 300,
"valid_targets_mean": 4095.4,
"valid_targets_min": 1374
},
{
"epoch": 0.5187074829931972,
"grad_norm": 0.583901679673355,
"learning_rate": 2.951456310679612e-05,
"loss": 0.2396,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25624722242355347,
"step": 305,
"valid_targets_mean": 3267.6,
"valid_targets_min": 1342
},
{
"epoch": 0.5272108843537415,
"grad_norm": 0.5974779827455141,
"learning_rate": 3.0000000000000004e-05,
"loss": 0.2447,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29399585723876953,
"step": 310,
"valid_targets_mean": 3656.5,
"valid_targets_min": 1623
},
{
"epoch": 0.5357142857142857,
"grad_norm": 0.5848328720235239,
"learning_rate": 3.0485436893203886e-05,
"loss": 0.2321,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22116899490356445,
"step": 315,
"valid_targets_mean": 3654.2,
"valid_targets_min": 1822
},
{
"epoch": 0.54421768707483,
"grad_norm": 0.5219255102519595,
"learning_rate": 3.097087378640777e-05,
"loss": 0.2471,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.269960880279541,
"step": 320,
"valid_targets_mean": 4145.9,
"valid_targets_min": 1355
},
{
"epoch": 0.5527210884353742,
"grad_norm": 0.5503971512937593,
"learning_rate": 3.1456310679611654e-05,
"loss": 0.216,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24401246011257172,
"step": 325,
"valid_targets_mean": 4419.8,
"valid_targets_min": 1234
},
{
"epoch": 0.5612244897959183,
"grad_norm": 0.5701637940871919,
"learning_rate": 3.194174757281554e-05,
"loss": 0.2373,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21285384893417358,
"step": 330,
"valid_targets_mean": 3603.2,
"valid_targets_min": 1061
},
{
"epoch": 0.5697278911564626,
"grad_norm": 0.616506008664278,
"learning_rate": 3.242718446601942e-05,
"loss": 0.2503,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27921557426452637,
"step": 335,
"valid_targets_mean": 3437.5,
"valid_targets_min": 1340
},
{
"epoch": 0.5782312925170068,
"grad_norm": 0.6116541556683032,
"learning_rate": 3.29126213592233e-05,
"loss": 0.2414,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24892035126686096,
"step": 340,
"valid_targets_mean": 3190.8,
"valid_targets_min": 1245
},
{
"epoch": 0.5867346938775511,
"grad_norm": 0.5147623109762519,
"learning_rate": 3.339805825242719e-05,
"loss": 0.2365,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2467966079711914,
"step": 345,
"valid_targets_mean": 4105.7,
"valid_targets_min": 2111
},
{
"epoch": 0.5952380952380952,
"grad_norm": 0.5560814376438035,
"learning_rate": 3.388349514563107e-05,
"loss": 0.2548,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26886463165283203,
"step": 350,
"valid_targets_mean": 3899.1,
"valid_targets_min": 792
},
{
"epoch": 0.6037414965986394,
"grad_norm": 0.5999655031743574,
"learning_rate": 3.436893203883495e-05,
"loss": 0.2874,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39038926362991333,
"step": 355,
"valid_targets_mean": 4675.1,
"valid_targets_min": 1261
},
{
"epoch": 0.6122448979591837,
"grad_norm": 0.5430030557117063,
"learning_rate": 3.485436893203884e-05,
"loss": 0.2428,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2600330114364624,
"step": 360,
"valid_targets_mean": 3977.9,
"valid_targets_min": 1596
},
{
"epoch": 0.6207482993197279,
"grad_norm": 0.5731887626204569,
"learning_rate": 3.5339805825242724e-05,
"loss": 0.2201,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22550851106643677,
"step": 365,
"valid_targets_mean": 3385.5,
"valid_targets_min": 1171
},
{
"epoch": 0.6292517006802721,
"grad_norm": 0.5627496362039582,
"learning_rate": 3.582524271844661e-05,
"loss": 0.2356,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2910814881324768,
"step": 370,
"valid_targets_mean": 4556.4,
"valid_targets_min": 1882
},
{
"epoch": 0.6377551020408163,
"grad_norm": 0.5991575814558935,
"learning_rate": 3.631067961165049e-05,
"loss": 0.2216,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.211978018283844,
"step": 375,
"valid_targets_mean": 3452.8,
"valid_targets_min": 1318
},
{
"epoch": 0.6462585034013606,
"grad_norm": 0.6102343665862296,
"learning_rate": 3.679611650485437e-05,
"loss": 0.2219,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21666033565998077,
"step": 380,
"valid_targets_mean": 3131.9,
"valid_targets_min": 1314
},
{
"epoch": 0.6547619047619048,
"grad_norm": 0.5948668213611634,
"learning_rate": 3.728155339805826e-05,
"loss": 0.2512,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24347296357154846,
"step": 385,
"valid_targets_mean": 3611.2,
"valid_targets_min": 883
},
{
"epoch": 0.6632653061224489,
"grad_norm": 0.6047163659117363,
"learning_rate": 3.776699029126214e-05,
"loss": 0.232,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2162351906299591,
"step": 390,
"valid_targets_mean": 3810.4,
"valid_targets_min": 771
},
{
"epoch": 0.6717687074829932,
"grad_norm": 0.5375529397120948,
"learning_rate": 3.825242718446602e-05,
"loss": 0.2218,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22332267463207245,
"step": 395,
"valid_targets_mean": 3901.6,
"valid_targets_min": 773
},
{
"epoch": 0.6802721088435374,
"grad_norm": 1.0342771407751923,
"learning_rate": 3.873786407766991e-05,
"loss": 0.2152,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1947087049484253,
"step": 400,
"valid_targets_mean": 3132.8,
"valid_targets_min": 1457
},
{
"epoch": 0.6887755102040817,
"grad_norm": 0.5626435257811521,
"learning_rate": 3.9223300970873787e-05,
"loss": 0.2262,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2347477376461029,
"step": 405,
"valid_targets_mean": 3649.8,
"valid_targets_min": 1331
},
{
"epoch": 0.6972789115646258,
"grad_norm": 0.569318137076344,
"learning_rate": 3.970873786407767e-05,
"loss": 0.2262,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20133861899375916,
"step": 410,
"valid_targets_mean": 3133.1,
"valid_targets_min": 1569
},
{
"epoch": 0.70578231292517,
"grad_norm": 1.0743284208556751,
"learning_rate": 3.9999971224844676e-05,
"loss": 0.2245,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24629156291484833,
"step": 415,
"valid_targets_mean": 3826.4,
"valid_targets_min": 1325
},
{
"epoch": 0.7142857142857143,
"grad_norm": 0.6635319496766661,
"learning_rate": 3.9999647505298214e-05,
"loss": 0.2134,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18993477523326874,
"step": 420,
"valid_targets_mean": 2720.0,
"valid_targets_min": 1349
},
{
"epoch": 0.7227891156462585,
"grad_norm": 0.6170915333057738,
"learning_rate": 3.999896410310244e-05,
"loss": 0.2168,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22692041099071503,
"step": 425,
"valid_targets_mean": 3027.8,
"valid_targets_min": 726
},
{
"epoch": 0.7312925170068028,
"grad_norm": 0.5463223980088899,
"learning_rate": 3.9997921030547975e-05,
"loss": 0.2399,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2502792477607727,
"step": 430,
"valid_targets_mean": 4274.4,
"valid_targets_min": 1318
},
{
"epoch": 0.7397959183673469,
"grad_norm": 0.6317330429857803,
"learning_rate": 3.9996518306393906e-05,
"loss": 0.2123,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2522296607494354,
"step": 435,
"valid_targets_mean": 4349.2,
"valid_targets_min": 1531
},
{
"epoch": 0.7482993197278912,
"grad_norm": 0.5589182010307014,
"learning_rate": 3.999475595586746e-05,
"loss": 0.2106,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22174233198165894,
"step": 440,
"valid_targets_mean": 3621.8,
"valid_targets_min": 1171
},
{
"epoch": 0.7568027210884354,
"grad_norm": 0.6274192316998353,
"learning_rate": 3.9992634010663535e-05,
"loss": 0.2243,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19328610599040985,
"step": 445,
"valid_targets_mean": 3207.5,
"valid_targets_min": 1380
},
{
"epoch": 0.7653061224489796,
"grad_norm": 0.7143188282236254,
"learning_rate": 3.999015250894415e-05,
"loss": 0.2237,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24878516793251038,
"step": 450,
"valid_targets_mean": 2905.9,
"valid_targets_min": 704
},
{
"epoch": 0.7738095238095238,
"grad_norm": 0.6357498516540245,
"learning_rate": 3.998731149533774e-05,
"loss": 0.2312,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2257612943649292,
"step": 455,
"valid_targets_mean": 4270.8,
"valid_targets_min": 1016
},
{
"epoch": 0.782312925170068,
"grad_norm": 0.608459313439396,
"learning_rate": 3.9984111020938376e-05,
"loss": 0.2273,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23315557837486267,
"step": 460,
"valid_targets_mean": 3114.2,
"valid_targets_min": 468
},
{
"epoch": 0.7908163265306123,
"grad_norm": 0.5311014249453725,
"learning_rate": 3.998055114330483e-05,
"loss": 0.2279,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22066374123096466,
"step": 465,
"valid_targets_mean": 4115.8,
"valid_targets_min": 237
},
{
"epoch": 0.7993197278911565,
"grad_norm": 0.5517724265625736,
"learning_rate": 3.9976631926459536e-05,
"loss": 0.2132,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21982333064079285,
"step": 470,
"valid_targets_mean": 3534.5,
"valid_targets_min": 1529
},
{
"epoch": 0.8078231292517006,
"grad_norm": 0.5625719777203932,
"learning_rate": 3.997235344088747e-05,
"loss": 0.22,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19416046142578125,
"step": 475,
"valid_targets_mean": 3017.0,
"valid_targets_min": 740
},
{
"epoch": 0.8163265306122449,
"grad_norm": 0.6799480818848552,
"learning_rate": 3.9967715763534805e-05,
"loss": 0.2076,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2595263123512268,
"step": 480,
"valid_targets_mean": 3761.9,
"valid_targets_min": 1567
},
{
"epoch": 0.8248299319727891,
"grad_norm": 0.6509377180428996,
"learning_rate": 3.9962718977807637e-05,
"loss": 0.2198,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21661224961280823,
"step": 485,
"valid_targets_mean": 3430.8,
"valid_targets_min": 516
},
{
"epoch": 0.8333333333333334,
"grad_norm": 0.6165176687499115,
"learning_rate": 3.995736317357041e-05,
"loss": 0.2113,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20129480957984924,
"step": 490,
"valid_targets_mean": 3195.6,
"valid_targets_min": 864
},
{
"epoch": 0.8418367346938775,
"grad_norm": 0.5318159802711743,
"learning_rate": 3.9951648447144305e-05,
"loss": 0.2445,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27752143144607544,
"step": 495,
"valid_targets_mean": 4461.1,
"valid_targets_min": 1431
},
{
"epoch": 0.8503401360544217,
"grad_norm": 0.5556209073828486,
"learning_rate": 3.9945574901305534e-05,
"loss": 0.2148,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.202958345413208,
"step": 500,
"valid_targets_mean": 3815.9,
"valid_targets_min": 1488
},
{
"epoch": 0.858843537414966,
"grad_norm": 1.0342886678960757,
"learning_rate": 3.9939142645283475e-05,
"loss": 0.2137,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19952651858329773,
"step": 505,
"valid_targets_mean": 2500.6,
"valid_targets_min": 844
},
{
"epoch": 0.8673469387755102,
"grad_norm": 0.5402963048438412,
"learning_rate": 3.9932351794758705e-05,
"loss": 0.2414,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27289947867393494,
"step": 510,
"valid_targets_mean": 4066.7,
"valid_targets_min": 1590
},
{
"epoch": 0.8758503401360545,
"grad_norm": 0.4961205211173556,
"learning_rate": 3.992520247186094e-05,
"loss": 0.2206,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20045743882656097,
"step": 515,
"valid_targets_mean": 3896.8,
"valid_targets_min": 1635
},
{
"epoch": 0.8843537414965986,
"grad_norm": 0.5120923461971542,
"learning_rate": 3.991769480516681e-05,
"loss": 0.2099,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18355634808540344,
"step": 520,
"valid_targets_mean": 3659.9,
"valid_targets_min": 1564
},
{
"epoch": 0.8928571428571429,
"grad_norm": 0.5623713120504147,
"learning_rate": 3.9909828929697575e-05,
"loss": 0.2189,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22784064710140228,
"step": 525,
"valid_targets_mean": 3482.8,
"valid_targets_min": 1422
},
{
"epoch": 0.9013605442176871,
"grad_norm": 0.7661825249423273,
"learning_rate": 3.9901604986916666e-05,
"loss": 0.2076,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24556386470794678,
"step": 530,
"valid_targets_mean": 4166.4,
"valid_targets_min": 656
},
{
"epoch": 0.9098639455782312,
"grad_norm": 0.5954424304699879,
"learning_rate": 3.9893023124727176e-05,
"loss": 0.2128,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2076413780450821,
"step": 535,
"valid_targets_mean": 3791.6,
"valid_targets_min": 1222
},
{
"epoch": 0.9183673469387755,
"grad_norm": 0.5761225149341407,
"learning_rate": 3.988408349746916e-05,
"loss": 0.2261,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1701766699552536,
"step": 540,
"valid_targets_mean": 3159.8,
"valid_targets_min": 292
},
{
"epoch": 0.9268707482993197,
"grad_norm": 0.6231094057313721,
"learning_rate": 3.9874786265916895e-05,
"loss": 0.2256,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19349026679992676,
"step": 545,
"valid_targets_mean": 3046.1,
"valid_targets_min": 1543
},
{
"epoch": 0.935374149659864,
"grad_norm": 0.5278032564391175,
"learning_rate": 3.986513159727598e-05,
"loss": 0.2176,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22423487901687622,
"step": 550,
"valid_targets_mean": 3591.6,
"valid_targets_min": 1361
},
{
"epoch": 0.9438775510204082,
"grad_norm": 0.5593996618941262,
"learning_rate": 3.985511966518031e-05,
"loss": 0.2187,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21108989417552948,
"step": 555,
"valid_targets_mean": 3543.1,
"valid_targets_min": 785
},
{
"epoch": 0.9523809523809523,
"grad_norm": 0.6004996101097438,
"learning_rate": 3.984475064968897e-05,
"loss": 0.207,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20403581857681274,
"step": 560,
"valid_targets_mean": 2996.8,
"valid_targets_min": 1127
},
{
"epoch": 0.9608843537414966,
"grad_norm": 0.5607013766195372,
"learning_rate": 3.9834024737282994e-05,
"loss": 0.228,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2213515192270279,
"step": 565,
"valid_targets_mean": 3813.0,
"valid_targets_min": 712
},
{
"epoch": 0.9693877551020408,
"grad_norm": 0.5378418432619649,
"learning_rate": 3.9822942120862016e-05,
"loss": 0.2059,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22113119065761566,
"step": 570,
"valid_targets_mean": 3979.8,
"valid_targets_min": 1487
},
{
"epoch": 0.9778911564625851,
"grad_norm": 0.5155096520501556,
"learning_rate": 3.981150299974079e-05,
"loss": 0.2035,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17551299929618835,
"step": 575,
"valid_targets_mean": 4004.7,
"valid_targets_min": 1841
},
{
"epoch": 0.9863945578231292,
"grad_norm": 1.0096571246008348,
"learning_rate": 3.979970757964561e-05,
"loss": 0.2042,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19910582900047302,
"step": 580,
"valid_targets_mean": 4383.6,
"valid_targets_min": 1271
},
{
"epoch": 0.9948979591836735,
"grad_norm": 0.4896747460569099,
"learning_rate": 3.978755607271061e-05,
"loss": 0.2054,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23156213760375977,
"step": 585,
"valid_targets_mean": 4823.2,
"valid_targets_min": 1267
},
{
"epoch": 1.0034013605442176,
"grad_norm": 0.5672962424422774,
"learning_rate": 3.977504869747395e-05,
"loss": 0.2216,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22572076320648193,
"step": 590,
"valid_targets_mean": 3516.4,
"valid_targets_min": 345
},
{
"epoch": 1.0119047619047619,
"grad_norm": 0.5312338195955498,
"learning_rate": 3.976218567887389e-05,
"loss": 0.2189,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20064997673034668,
"step": 595,
"valid_targets_mean": 3369.6,
"valid_targets_min": 791
},
{
"epoch": 1.0204081632653061,
"grad_norm": 0.5907568049016817,
"learning_rate": 3.974896724824475e-05,
"loss": 0.191,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1838887631893158,
"step": 600,
"valid_targets_mean": 3293.3,
"valid_targets_min": 1016
},
{
"epoch": 1.0289115646258504,
"grad_norm": 0.5741661915632267,
"learning_rate": 3.97353936433127e-05,
"loss": 0.1928,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22130995988845825,
"step": 605,
"valid_targets_mean": 3553.5,
"valid_targets_min": 1363
},
{
"epoch": 1.0374149659863945,
"grad_norm": 0.5548887515405546,
"learning_rate": 3.972146510819158e-05,
"loss": 0.203,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20798607170581818,
"step": 610,
"valid_targets_mean": 3264.7,
"valid_targets_min": 759
},
{
"epoch": 1.0459183673469388,
"grad_norm": 0.48775913922713154,
"learning_rate": 3.970718189337841e-05,
"loss": 0.1997,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1696465015411377,
"step": 615,
"valid_targets_mean": 3921.0,
"valid_targets_min": 1030
},
{
"epoch": 1.054421768707483,
"grad_norm": 0.5390452642348323,
"learning_rate": 3.969254425574895e-05,
"loss": 0.2243,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27588415145874023,
"step": 620,
"valid_targets_mean": 3971.6,
"valid_targets_min": 1047
},
{
"epoch": 1.0629251700680271,
"grad_norm": 0.5601492770617569,
"learning_rate": 3.9677552458553046e-05,
"loss": 0.1932,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1914624273777008,
"step": 625,
"valid_targets_mean": 3866.6,
"valid_targets_min": 1334
},
{
"epoch": 1.0714285714285714,
"grad_norm": 0.5372040764678854,
"learning_rate": 3.9662206771409925e-05,
"loss": 0.2036,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18735885620117188,
"step": 630,
"valid_targets_mean": 3296.4,
"valid_targets_min": 1828
},
{
"epoch": 1.0799319727891157,
"grad_norm": 0.4929419148783689,
"learning_rate": 3.964650747030332e-05,
"loss": 0.207,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2222883701324463,
"step": 635,
"valid_targets_mean": 4493.8,
"valid_targets_min": 766
},
{
"epoch": 1.08843537414966,
"grad_norm": 0.5087861156990097,
"learning_rate": 3.963045483757652e-05,
"loss": 0.2088,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2039588987827301,
"step": 640,
"valid_targets_mean": 3933.9,
"valid_targets_min": 1732
},
{
"epoch": 1.096938775510204,
"grad_norm": 0.5471473406579418,
"learning_rate": 3.961404916192728e-05,
"loss": 0.2013,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1703445315361023,
"step": 645,
"valid_targets_mean": 3236.4,
"valid_targets_min": 1522
},
{
"epoch": 1.1054421768707483,
"grad_norm": 0.601726665077757,
"learning_rate": 3.959729073840265e-05,
"loss": 0.1958,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2089315801858902,
"step": 650,
"valid_targets_mean": 2669.9,
"valid_targets_min": 771
},
{
"epoch": 1.1139455782312926,
"grad_norm": 0.5342431672997215,
"learning_rate": 3.958017986839364e-05,
"loss": 0.1903,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16569793224334717,
"step": 655,
"valid_targets_mean": 4190.9,
"valid_targets_min": 1653
},
{
"epoch": 1.1224489795918366,
"grad_norm": 0.47771373985756477,
"learning_rate": 3.956271685962985e-05,
"loss": 0.1867,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18933849036693573,
"step": 660,
"valid_targets_mean": 4276.8,
"valid_targets_min": 1203
},
{
"epoch": 1.130952380952381,
"grad_norm": 0.5180075636533443,
"learning_rate": 3.954490202617385e-05,
"loss": 0.2032,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20420797169208527,
"step": 665,
"valid_targets_mean": 3466.0,
"valid_targets_min": 1387
},
{
"epoch": 1.1394557823129252,
"grad_norm": 0.4810886562810522,
"learning_rate": 3.9526735688415624e-05,
"loss": 0.1952,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14678673446178436,
"step": 670,
"valid_targets_mean": 3429.4,
"valid_targets_min": 1151
},
{
"epoch": 1.1479591836734695,
"grad_norm": 0.43889872604968944,
"learning_rate": 3.9508218173066766e-05,
"loss": 0.2169,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18565359711647034,
"step": 675,
"valid_targets_mean": 4528.4,
"valid_targets_min": 1485
},
{
"epoch": 1.1564625850340136,
"grad_norm": 0.5494878687879327,
"learning_rate": 3.948934981315457e-05,
"loss": 0.1962,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21876271069049835,
"step": 680,
"valid_targets_mean": 3376.0,
"valid_targets_min": 1641
},
{
"epoch": 1.1649659863945578,
"grad_norm": 0.5527438745919528,
"learning_rate": 3.947013094801612e-05,
"loss": 0.2118,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18596649169921875,
"step": 685,
"valid_targets_mean": 3657.0,
"valid_targets_min": 1586
},
{
"epoch": 1.1734693877551021,
"grad_norm": 0.5825833837175836,
"learning_rate": 3.945056192329212e-05,
"loss": 0.1898,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1742013394832611,
"step": 690,
"valid_targets_mean": 2917.1,
"valid_targets_min": 1281
},
{
"epoch": 1.1819727891156462,
"grad_norm": 0.503721095345985,
"learning_rate": 3.9430643090920705e-05,
"loss": 0.1904,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2232275754213333,
"step": 695,
"valid_targets_mean": 4089.5,
"valid_targets_min": 1418
},
{
"epoch": 1.1904761904761905,
"grad_norm": 0.5218165403092541,
"learning_rate": 3.941037480913111e-05,
"loss": 0.2082,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1619264781475067,
"step": 700,
"valid_targets_mean": 3523.6,
"valid_targets_min": 1437
},
{
"epoch": 1.1989795918367347,
"grad_norm": 0.5281430386469016,
"learning_rate": 3.9389757442437214e-05,
"loss": 0.1795,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17680522799491882,
"step": 705,
"valid_targets_mean": 3565.9,
"valid_targets_min": 1325
},
{
"epoch": 1.2074829931972788,
"grad_norm": 0.5235289654221893,
"learning_rate": 3.936879136163102e-05,
"loss": 0.1936,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17753741145133972,
"step": 710,
"valid_targets_mean": 3354.5,
"valid_targets_min": 861
},
{
"epoch": 1.215986394557823,
"grad_norm": 0.5243131901993361,
"learning_rate": 3.934747694377594e-05,
"loss": 0.1889,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17617300152778625,
"step": 715,
"valid_targets_mean": 3630.2,
"valid_targets_min": 740
},
{
"epoch": 1.2244897959183674,
"grad_norm": 0.507546135504406,
"learning_rate": 3.932581457220004e-05,
"loss": 0.1918,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20022642612457275,
"step": 720,
"valid_targets_mean": 3641.4,
"valid_targets_min": 1358
},
{
"epoch": 1.2329931972789117,
"grad_norm": 0.4976716238444004,
"learning_rate": 3.9303804636489165e-05,
"loss": 0.2011,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1976463496685028,
"step": 725,
"valid_targets_mean": 4419.9,
"valid_targets_min": 1633
},
{
"epoch": 1.2414965986394557,
"grad_norm": 0.5483850422579489,
"learning_rate": 3.928144753247987e-05,
"loss": 0.1897,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1868499368429184,
"step": 730,
"valid_targets_mean": 3198.6,
"valid_targets_min": 1518
},
{
"epoch": 1.25,
"grad_norm": 0.5488817504510112,
"learning_rate": 3.925874366225237e-05,
"loss": 0.1963,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1806359589099884,
"step": 735,
"valid_targets_mean": 3055.3,
"valid_targets_min": 1080
},
{
"epoch": 1.2585034013605443,
"grad_norm": 0.5066572269595151,
"learning_rate": 3.923569343412327e-05,
"loss": 0.168,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1659495234489441,
"step": 740,
"valid_targets_mean": 3302.1,
"valid_targets_min": 1180
},
{
"epoch": 1.2670068027210886,
"grad_norm": 0.5849934441349959,
"learning_rate": 3.921229726263824e-05,
"loss": 0.2012,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1774701178073883,
"step": 745,
"valid_targets_mean": 2528.7,
"valid_targets_min": 1202
},
{
"epoch": 1.2755102040816326,
"grad_norm": 0.49696403833836683,
"learning_rate": 3.918855556856453e-05,
"loss": 0.1937,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18610414862632751,
"step": 750,
"valid_targets_mean": 3840.2,
"valid_targets_min": 1166
},
{
"epoch": 1.284013605442177,
"grad_norm": 0.51760011092419,
"learning_rate": 3.916446877888345e-05,
"loss": 0.1867,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.152181014418602,
"step": 755,
"valid_targets_mean": 3712.1,
"valid_targets_min": 1562
},
{
"epoch": 1.2925170068027212,
"grad_norm": 0.5197150478352947,
"learning_rate": 3.914003732678264e-05,
"loss": 0.1886,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17886745929718018,
"step": 760,
"valid_targets_mean": 3652.8,
"valid_targets_min": 1389
},
{
"epoch": 1.3010204081632653,
"grad_norm": 0.6469050227526758,
"learning_rate": 3.911526165164831e-05,
"loss": 0.1903,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18235021829605103,
"step": 765,
"valid_targets_mean": 3708.6,
"valid_targets_min": 1362
},
{
"epoch": 1.3095238095238095,
"grad_norm": 0.49033685187396464,
"learning_rate": 3.909014219905736e-05,
"loss": 0.1738,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17945152521133423,
"step": 770,
"valid_targets_mean": 4450.9,
"valid_targets_min": 1164
},
{
"epoch": 1.3180272108843538,
"grad_norm": 0.48357041587084415,
"learning_rate": 3.906467942076929e-05,
"loss": 0.1763,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16390027105808258,
"step": 775,
"valid_targets_mean": 3853.2,
"valid_targets_min": 261
},
{
"epoch": 1.3265306122448979,
"grad_norm": 0.5416106118859744,
"learning_rate": 3.903887377471816e-05,
"loss": 0.1819,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1834583282470703,
"step": 780,
"valid_targets_mean": 3806.6,
"valid_targets_min": 626
},
{
"epoch": 1.3350340136054422,
"grad_norm": 0.5709573952961344,
"learning_rate": 3.901272572500431e-05,
"loss": 0.2081,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2096044272184372,
"step": 785,
"valid_targets_mean": 3210.9,
"valid_targets_min": 1076
},
{
"epoch": 1.3435374149659864,
"grad_norm": 0.49261093365090397,
"learning_rate": 3.8986235741886016e-05,
"loss": 0.1834,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19666042923927307,
"step": 790,
"valid_targets_mean": 4010.6,
"valid_targets_min": 1349
},
{
"epoch": 1.3520408163265305,
"grad_norm": 0.5295408603491522,
"learning_rate": 3.8959404301771035e-05,
"loss": 0.1794,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17796075344085693,
"step": 795,
"valid_targets_mean": 3584.5,
"valid_targets_min": 1196
},
{
"epoch": 1.3605442176870748,
"grad_norm": 0.5009867989877805,
"learning_rate": 3.893223188720804e-05,
"loss": 0.191,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16877491772174835,
"step": 800,
"valid_targets_mean": 3927.5,
"valid_targets_min": 1379
},
{
"epoch": 1.369047619047619,
"grad_norm": 0.5414078300255754,
"learning_rate": 3.890471898687797e-05,
"loss": 0.1871,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19157296419143677,
"step": 805,
"valid_targets_mean": 3358.6,
"valid_targets_min": 1356
},
{
"epoch": 1.3775510204081631,
"grad_norm": 0.5222165452421504,
"learning_rate": 3.887686609558516e-05,
"loss": 0.1932,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23859623074531555,
"step": 810,
"valid_targets_mean": 4134.9,
"valid_targets_min": 1487
},
{
"epoch": 1.3860544217687074,
"grad_norm": 0.5217149334650539,
"learning_rate": 3.8848673714248545e-05,
"loss": 0.2087,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26612165570259094,
"step": 815,
"valid_targets_mean": 4028.3,
"valid_targets_min": 1564
},
{
"epoch": 1.3945578231292517,
"grad_norm": 0.5170659251716594,
"learning_rate": 3.882014234989258e-05,
"loss": 0.1922,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22827790677547455,
"step": 820,
"valid_targets_mean": 3701.8,
"valid_targets_min": 1093
},
{
"epoch": 1.403061224489796,
"grad_norm": 0.4688236578703589,
"learning_rate": 3.879127251563814e-05,
"loss": 0.2077,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2379659116268158,
"step": 825,
"valid_targets_mean": 4414.6,
"valid_targets_min": 602
},
{
"epoch": 1.4115646258503403,
"grad_norm": 0.49118587067228825,
"learning_rate": 3.87620647306933e-05,
"loss": 0.1828,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15896081924438477,
"step": 830,
"valid_targets_mean": 3619.9,
"valid_targets_min": 872
},
{
"epoch": 1.4200680272108843,
"grad_norm": 0.5821773109112104,
"learning_rate": 3.873251952034398e-05,
"loss": 0.2015,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18274542689323425,
"step": 835,
"valid_targets_mean": 2929.2,
"valid_targets_min": 656
},
{
"epoch": 1.4285714285714286,
"grad_norm": 0.5452331430405628,
"learning_rate": 3.8702637415944554e-05,
"loss": 0.1851,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17982515692710876,
"step": 840,
"valid_targets_mean": 3342.9,
"valid_targets_min": 1236
},
{
"epoch": 1.4370748299319729,
"grad_norm": 0.46140086600989344,
"learning_rate": 3.867241895490818e-05,
"loss": 0.1874,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1850546896457672,
"step": 845,
"valid_targets_mean": 4547.8,
"valid_targets_min": 1230
},
{
"epoch": 1.445578231292517,
"grad_norm": 0.6096456433047177,
"learning_rate": 3.864186468069727e-05,
"loss": 0.1956,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20062093436717987,
"step": 850,
"valid_targets_mean": 3861.6,
"valid_targets_min": 1361
},
{
"epoch": 1.4540816326530612,
"grad_norm": 0.4585502938921594,
"learning_rate": 3.86109751428136e-05,
"loss": 0.1859,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22109025716781616,
"step": 855,
"valid_targets_mean": 4631.1,
"valid_targets_min": 649
},
{
"epoch": 1.4625850340136055,
"grad_norm": 0.6500708452308398,
"learning_rate": 3.8579750896788526e-05,
"loss": 0.194,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19890360534191132,
"step": 860,
"valid_targets_mean": 3457.9,
"valid_targets_min": 1516
},
{
"epoch": 1.4710884353741496,
"grad_norm": 0.5301669401019695,
"learning_rate": 3.8548192504172905e-05,
"loss": 0.1898,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16666162014007568,
"step": 865,
"valid_targets_mean": 3235.4,
"valid_targets_min": 1496
},
{
"epoch": 1.4795918367346939,
"grad_norm": 0.5003852480841234,
"learning_rate": 3.851630053252706e-05,
"loss": 0.1958,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19342686235904694,
"step": 870,
"valid_targets_mean": 3817.6,
"valid_targets_min": 1010
},
{
"epoch": 1.4880952380952381,
"grad_norm": 0.7206386070487517,
"learning_rate": 3.848407555541054e-05,
"loss": 0.1766,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1805090308189392,
"step": 875,
"valid_targets_mean": 3128.2,
"valid_targets_min": 1237
},
{
"epoch": 1.4965986394557822,
"grad_norm": 0.5325698260432379,
"learning_rate": 3.845151815237183e-05,
"loss": 0.1986,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22101525962352753,
"step": 880,
"valid_targets_mean": 3731.1,
"valid_targets_min": 1267
},
{
"epoch": 1.5051020408163265,
"grad_norm": 0.49784608869204255,
"learning_rate": 3.841862890893787e-05,
"loss": 0.1953,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21092960238456726,
"step": 885,
"valid_targets_mean": 4910.1,
"valid_targets_min": 2027
},
{
"epoch": 1.5136054421768708,
"grad_norm": 0.5139966586488321,
"learning_rate": 3.838540841660363e-05,
"loss": 0.187,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17927789688110352,
"step": 890,
"valid_targets_mean": 3502.6,
"valid_targets_min": 1390
},
{
"epoch": 1.5221088435374148,
"grad_norm": 0.5753720323032561,
"learning_rate": 3.835185727282135e-05,
"loss": 0.1865,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17120110988616943,
"step": 895,
"valid_targets_mean": 3286.3,
"valid_targets_min": 1413
},
{
"epoch": 1.5306122448979593,
"grad_norm": 0.47592158361035486,
"learning_rate": 3.8317976080989884e-05,
"loss": 0.2031,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.163374125957489,
"step": 900,
"valid_targets_mean": 3801.1,
"valid_targets_min": 1384
},
{
"epoch": 1.5391156462585034,
"grad_norm": 0.5502887147122869,
"learning_rate": 3.828376545044381e-05,
"loss": 0.1673,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1637812852859497,
"step": 905,
"valid_targets_mean": 3125.3,
"valid_targets_min": 1185
},
{
"epoch": 1.5476190476190477,
"grad_norm": 0.49349113517485865,
"learning_rate": 3.824922599644249e-05,
"loss": 0.1961,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1690322607755661,
"step": 910,
"valid_targets_mean": 3258.8,
"valid_targets_min": 1083
},
{
"epoch": 1.556122448979592,
"grad_norm": 0.5864646081268652,
"learning_rate": 3.8214358340159e-05,
"loss": 0.196,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19114357233047485,
"step": 915,
"valid_targets_mean": 2737.2,
"valid_targets_min": 294
},
{
"epoch": 1.564625850340136,
"grad_norm": 0.6146750809665836,
"learning_rate": 3.817916310866892e-05,
"loss": 0.1902,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2137393355369568,
"step": 920,
"valid_targets_mean": 3575.6,
"valid_targets_min": 1833
},
{
"epoch": 1.5731292517006803,
"grad_norm": 0.5497560800319427,
"learning_rate": 3.814364093493912e-05,
"loss": 0.1855,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1964998096227646,
"step": 925,
"valid_targets_mean": 3551.7,
"valid_targets_min": 1423
},
{
"epoch": 1.5816326530612246,
"grad_norm": 0.5252883761247669,
"learning_rate": 3.810779245781633e-05,
"loss": 0.1804,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1650836169719696,
"step": 930,
"valid_targets_mean": 3089.8,
"valid_targets_min": 1403
},
{
"epoch": 1.5901360544217686,
"grad_norm": 0.5121570735439744,
"learning_rate": 3.807161832201569e-05,
"loss": 0.1853,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19136366248130798,
"step": 935,
"valid_targets_mean": 4138.2,
"valid_targets_min": 1424
},
{
"epoch": 1.598639455782313,
"grad_norm": 0.5958778544952104,
"learning_rate": 3.80351191781091e-05,
"loss": 0.1897,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19539722800254822,
"step": 940,
"valid_targets_mean": 3694.7,
"valid_targets_min": 1215
},
{
"epoch": 1.6071428571428572,
"grad_norm": 0.46321527919315125,
"learning_rate": 3.799829568251358e-05,
"loss": 0.1802,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1710878312587738,
"step": 945,
"valid_targets_mean": 4287.4,
"valid_targets_min": 1580
},
{
"epoch": 1.6156462585034013,
"grad_norm": 0.4474705462489259,
"learning_rate": 3.7961148497479414e-05,
"loss": 0.1862,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14631542563438416,
"step": 950,
"valid_targets_mean": 3635.0,
"valid_targets_min": 1443
},
{
"epoch": 1.6241496598639455,
"grad_norm": 0.41640737339744915,
"learning_rate": 3.792367829107828e-05,
"loss": 0.1871,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16833257675170898,
"step": 955,
"valid_targets_mean": 4065.6,
"valid_targets_min": 870
},
{
"epoch": 1.6326530612244898,
"grad_norm": 0.5577723930562095,
"learning_rate": 3.7885885737191214e-05,
"loss": 0.1915,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20395566523075104,
"step": 960,
"valid_targets_mean": 3751.8,
"valid_targets_min": 773
},
{
"epoch": 1.641156462585034,
"grad_norm": 0.5370007375191718,
"learning_rate": 3.784777151549648e-05,
"loss": 0.2057,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23845341801643372,
"step": 965,
"valid_targets_mean": 3401.8,
"valid_targets_min": 1196
},
{
"epoch": 1.6496598639455784,
"grad_norm": 0.4890736313125839,
"learning_rate": 3.780933631145738e-05,
"loss": 0.1735,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19676534831523895,
"step": 970,
"valid_targets_mean": 4242.6,
"valid_targets_min": 1641
},
{
"epoch": 1.6581632653061225,
"grad_norm": 0.5462693213339227,
"learning_rate": 3.777058081630989e-05,
"loss": 0.1635,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1821269541978836,
"step": 975,
"valid_targets_mean": 2902.4,
"valid_targets_min": 758
},
{
"epoch": 1.6666666666666665,
"grad_norm": 0.8337967865673986,
"learning_rate": 3.773150572705026e-05,
"loss": 0.1775,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20385128259658813,
"step": 980,
"valid_targets_mean": 2980.2,
"valid_targets_min": 1114
},
{
"epoch": 1.675170068027211,
"grad_norm": 0.5621665933713426,
"learning_rate": 3.769211174642245e-05,
"loss": 0.1891,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18322809040546417,
"step": 985,
"valid_targets_mean": 3570.9,
"valid_targets_min": 1141
},
{
"epoch": 1.683673469387755,
"grad_norm": 0.5494341598343004,
"learning_rate": 3.765239958290551e-05,
"loss": 0.1759,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19005733728408813,
"step": 990,
"valid_targets_mean": 3032.7,
"valid_targets_min": 1423
},
{
"epoch": 1.6921768707482994,
"grad_norm": 0.48352418832732824,
"learning_rate": 3.761236995070086e-05,
"loss": 0.1897,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16157102584838867,
"step": 995,
"valid_targets_mean": 3347.1,
"valid_targets_min": 1193
},
{
"epoch": 1.7006802721088436,
"grad_norm": 0.5632869048679273,
"learning_rate": 3.757202356971937e-05,
"loss": 0.1819,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18931040167808533,
"step": 1000,
"valid_targets_mean": 3152.6,
"valid_targets_min": 1561
},
{
"epoch": 1.7091836734693877,
"grad_norm": 0.5192329176419131,
"learning_rate": 3.75313611655685e-05,
"loss": 0.1927,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21477651596069336,
"step": 1005,
"valid_targets_mean": 3273.4,
"valid_targets_min": 1808
},
{
"epoch": 1.717687074829932,
"grad_norm": 0.537867998522921,
"learning_rate": 3.74903834695392e-05,
"loss": 0.1794,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20665214955806732,
"step": 1010,
"valid_targets_mean": 2862.1,
"valid_targets_min": 1222
},
{
"epoch": 1.7261904761904763,
"grad_norm": 0.4845497530535329,
"learning_rate": 3.7449091218592765e-05,
"loss": 0.1713,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17452441155910492,
"step": 1015,
"valid_targets_mean": 3869.9,
"valid_targets_min": 820
},
{
"epoch": 1.7346938775510203,
"grad_norm": 0.6076016507448156,
"learning_rate": 3.740748515534761e-05,
"loss": 0.1692,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17511403560638428,
"step": 1020,
"valid_targets_mean": 3225.7,
"valid_targets_min": 1603
},
{
"epoch": 1.7431972789115646,
"grad_norm": 0.4883623691095037,
"learning_rate": 3.736556602806587e-05,
"loss": 0.1892,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.172734797000885,
"step": 1025,
"valid_targets_mean": 3836.9,
"valid_targets_min": 2000
},
{
"epoch": 1.751700680272109,
"grad_norm": 0.46550827165041286,
"learning_rate": 3.732333459063995e-05,
"loss": 0.1916,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.199026957154274,
"step": 1030,
"valid_targets_mean": 4062.8,
"valid_targets_min": 1556
},
{
"epoch": 1.760204081632653,
"grad_norm": 0.5129468567005807,
"learning_rate": 3.728079160257903e-05,
"loss": 0.1874,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14423376321792603,
"step": 1035,
"valid_targets_mean": 2858.1,
"valid_targets_min": 1339
},
{
"epoch": 1.7687074829931972,
"grad_norm": 0.5574813775362133,
"learning_rate": 3.723793782899531e-05,
"loss": 0.1776,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18245592713356018,
"step": 1040,
"valid_targets_mean": 3276.6,
"valid_targets_min": 670
},
{
"epoch": 1.7772108843537415,
"grad_norm": 0.4670140940140349,
"learning_rate": 3.719477404059032e-05,
"loss": 0.1911,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1462934911251068,
"step": 1045,
"valid_targets_mean": 3054.8,
"valid_targets_min": 1503
},
{
"epoch": 1.7857142857142856,
"grad_norm": 0.46194682964420647,
"learning_rate": 3.715130101364103e-05,
"loss": 0.193,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16554617881774902,
"step": 1050,
"valid_targets_mean": 3644.1,
"valid_targets_min": 1373
},
{
"epoch": 1.79421768707483,
"grad_norm": 0.5984466271446732,
"learning_rate": 3.710751952998591e-05,
"loss": 0.189,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2118651270866394,
"step": 1055,
"valid_targets_mean": 4197.6,
"valid_targets_min": 1768
},
{
"epoch": 1.8027210884353742,
"grad_norm": 0.5456400454044104,
"learning_rate": 3.7063430377010804e-05,
"loss": 0.1761,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17311958968639374,
"step": 1060,
"valid_targets_mean": 2987.2,
"valid_targets_min": 1077
},
{
"epoch": 1.8112244897959182,
"grad_norm": 0.4767702066385362,
"learning_rate": 3.7019034347634884e-05,
"loss": 0.1918,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19531995058059692,
"step": 1065,
"valid_targets_mean": 3875.5,
"valid_targets_min": 656
},
{
"epoch": 1.8197278911564627,
"grad_norm": 0.5195825806924265,
"learning_rate": 3.6974332240296285e-05,
"loss": 0.1652,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16434217989444733,
"step": 1070,
"valid_targets_mean": 3075.5,
"valid_targets_min": 272
},
{
"epoch": 1.8282312925170068,
"grad_norm": 0.49345991558681523,
"learning_rate": 3.692932485893779e-05,
"loss": 0.2053,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20877480506896973,
"step": 1075,
"valid_targets_mean": 3642.0,
"valid_targets_min": 1468
},
{
"epoch": 1.836734693877551,
"grad_norm": 0.47208468050600655,
"learning_rate": 3.6884013012992384e-05,
"loss": 0.1708,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17622429132461548,
"step": 1080,
"valid_targets_mean": 4071.4,
"valid_targets_min": 1942
},
{
"epoch": 1.8452380952380953,
"grad_norm": 0.48753304789559393,
"learning_rate": 3.683839751736866e-05,
"loss": 0.2042,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18847878277301788,
"step": 1085,
"valid_targets_mean": 3604.7,
"valid_targets_min": 1249
},
{
"epoch": 1.8537414965986394,
"grad_norm": 0.5185334909460225,
"learning_rate": 3.67924791924362e-05,
"loss": 0.1999,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18857452273368835,
"step": 1090,
"valid_targets_mean": 3293.7,
"valid_targets_min": 1583
},
{
"epoch": 1.8622448979591837,
"grad_norm": 0.5361821399516076,
"learning_rate": 3.6746258864010804e-05,
"loss": 0.1913,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21333011984825134,
"step": 1095,
"valid_targets_mean": 3541.9,
"valid_targets_min": 1101
},
{
"epoch": 1.870748299319728,
"grad_norm": 0.5150375744442169,
"learning_rate": 3.669973736333961e-05,
"loss": 0.208,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18149079382419586,
"step": 1100,
"valid_targets_mean": 3461.7,
"valid_targets_min": 1551
},
{
"epoch": 1.879251700680272,
"grad_norm": 0.47641795347351734,
"learning_rate": 3.665291552708622e-05,
"loss": 0.1712,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16541434824466705,
"step": 1105,
"valid_targets_mean": 3537.1,
"valid_targets_min": 721
},
{
"epoch": 1.8877551020408163,
"grad_norm": 0.44107915244193463,
"learning_rate": 3.660579419731556e-05,
"loss": 0.1772,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17657120525836945,
"step": 1110,
"valid_targets_mean": 4444.3,
"valid_targets_min": 1768
},
{
"epoch": 1.8962585034013606,
"grad_norm": 0.4490354679780014,
"learning_rate": 3.655837422147881e-05,
"loss": 0.186,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18245811760425568,
"step": 1115,
"valid_targets_mean": 3821.4,
"valid_targets_min": 832
},
{
"epoch": 1.9047619047619047,
"grad_norm": 0.5471874801090619,
"learning_rate": 3.6510656452398124e-05,
"loss": 0.1797,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19018134474754333,
"step": 1120,
"valid_targets_mean": 3944.4,
"valid_targets_min": 704
},
{
"epoch": 1.913265306122449,
"grad_norm": 0.5210175865126913,
"learning_rate": 3.646264174825131e-05,
"loss": 0.1926,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1890740543603897,
"step": 1125,
"valid_targets_mean": 2996.8,
"valid_targets_min": 1240
},
{
"epoch": 1.9217687074829932,
"grad_norm": 0.44413848715103277,
"learning_rate": 3.6414330972556396e-05,
"loss": 0.1687,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1596677303314209,
"step": 1130,
"valid_targets_mean": 3841.4,
"valid_targets_min": 1839
},
{
"epoch": 1.9302721088435373,
"grad_norm": 0.5011986427153032,
"learning_rate": 3.6365724994156074e-05,
"loss": 0.1837,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1710270792245865,
"step": 1135,
"valid_targets_mean": 3877.1,
"valid_targets_min": 1103
},
{
"epoch": 1.9387755102040818,
"grad_norm": 0.507796898706084,
"learning_rate": 3.63168246872021e-05,
"loss": 0.1911,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19725248217582703,
"step": 1140,
"valid_targets_mean": 4247.8,
"valid_targets_min": 1249
},
{
"epoch": 1.9472789115646258,
"grad_norm": 0.44045711685293365,
"learning_rate": 3.626763093113959e-05,
"loss": 0.1788,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19037358462810516,
"step": 1145,
"valid_targets_mean": 3963.4,
"valid_targets_min": 1103
},
{
"epoch": 1.95578231292517,
"grad_norm": 0.47446755779794997,
"learning_rate": 3.621814461069114e-05,
"loss": 0.1822,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25513309240341187,
"step": 1150,
"valid_targets_mean": 5124.9,
"valid_targets_min": 1921
},
{
"epoch": 1.9642857142857144,
"grad_norm": 0.5301424189044126,
"learning_rate": 3.6168366615841e-05,
"loss": 0.1996,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22564446926116943,
"step": 1155,
"valid_targets_mean": 3610.2,
"valid_targets_min": 1429
},
{
"epoch": 1.9727891156462585,
"grad_norm": 0.45622538657301903,
"learning_rate": 3.6118297841818986e-05,
"loss": 0.175,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16688859462738037,
"step": 1160,
"valid_targets_mean": 3964.9,
"valid_targets_min": 1107
},
{
"epoch": 1.9812925170068028,
"grad_norm": 0.4665999563671873,
"learning_rate": 3.6067939189084446e-05,
"loss": 0.1895,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19204774498939514,
"step": 1165,
"valid_targets_mean": 4142.7,
"valid_targets_min": 1263
},
{
"epoch": 1.989795918367347,
"grad_norm": 0.6056661231032858,
"learning_rate": 3.6017291563310005e-05,
"loss": 0.1793,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19215795397758484,
"step": 1170,
"valid_targets_mean": 3911.9,
"valid_targets_min": 1572
},
{
"epoch": 1.998299319727891,
"grad_norm": 0.4928298103688405,
"learning_rate": 3.5966355875365344e-05,
"loss": 0.1748,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15711480379104614,
"step": 1175,
"valid_targets_mean": 3181.3,
"valid_targets_min": 1284
},
{
"epoch": 2.006802721088435,
"grad_norm": 0.5046280559739479,
"learning_rate": 3.591513304130076e-05,
"loss": 0.166,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1728023886680603,
"step": 1180,
"valid_targets_mean": 3395.6,
"valid_targets_min": 366
},
{
"epoch": 2.0153061224489797,
"grad_norm": 0.4858331630925101,
"learning_rate": 3.586362398233072e-05,
"loss": 0.174,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15058520436286926,
"step": 1185,
"valid_targets_mean": 3435.6,
"valid_targets_min": 1263
},
{
"epoch": 2.0238095238095237,
"grad_norm": 0.4598459736943386,
"learning_rate": 3.58118296248173e-05,
"loss": 0.1638,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1740441918373108,
"step": 1190,
"valid_targets_mean": 4536.1,
"valid_targets_min": 1025
},
{
"epoch": 2.0323129251700682,
"grad_norm": 0.5668851483118568,
"learning_rate": 3.57597509002535e-05,
"loss": 0.1599,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1615862250328064,
"step": 1195,
"valid_targets_mean": 3981.8,
"valid_targets_min": 1479
},
{
"epoch": 2.0408163265306123,
"grad_norm": 0.5400385121875237,
"learning_rate": 3.57073887452465e-05,
"loss": 0.1663,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18597358465194702,
"step": 1200,
"valid_targets_mean": 3258.4,
"valid_targets_min": 1617
},
{
"epoch": 2.0493197278911564,
"grad_norm": 0.5191849885658418,
"learning_rate": 3.565474410150083e-05,
"loss": 0.1622,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14795230329036713,
"step": 1205,
"valid_targets_mean": 3404.8,
"valid_targets_min": 1328
},
{
"epoch": 2.057823129251701,
"grad_norm": 0.5615079980327268,
"learning_rate": 3.560181791580144e-05,
"loss": 0.1726,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1724962741136551,
"step": 1210,
"valid_targets_mean": 3804.8,
"valid_targets_min": 1510
},
{
"epoch": 2.066326530612245,
"grad_norm": 0.5078447283351805,
"learning_rate": 3.5548611139996634e-05,
"loss": 0.1697,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18177998065948486,
"step": 1215,
"valid_targets_mean": 3558.1,
"valid_targets_min": 1636
},
{
"epoch": 2.074829931972789,
"grad_norm": 0.5101085621115222,
"learning_rate": 3.549512473098097e-05,
"loss": 0.1668,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17449212074279785,
"step": 1220,
"valid_targets_mean": 3910.8,
"valid_targets_min": 881
},
{
"epoch": 2.0833333333333335,
"grad_norm": 0.5548489837592624,
"learning_rate": 3.544135965067807e-05,
"loss": 0.1672,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1575036644935608,
"step": 1225,
"valid_targets_mean": 3391.7,
"valid_targets_min": 1339
},
{
"epoch": 2.0918367346938775,
"grad_norm": 0.4790386496422741,
"learning_rate": 3.5387316866023314e-05,
"loss": 0.1697,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16516387462615967,
"step": 1230,
"valid_targets_mean": 4590.2,
"valid_targets_min": 1000
},
{
"epoch": 2.1003401360544216,
"grad_norm": 0.5504333723509913,
"learning_rate": 3.533299734894642e-05,
"loss": 0.1667,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1627981960773468,
"step": 1235,
"valid_targets_mean": 3015.6,
"valid_targets_min": 1230
},
{
"epoch": 2.108843537414966,
"grad_norm": 0.5147065086665726,
"learning_rate": 3.527840207635399e-05,
"loss": 0.1526,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14713545143604279,
"step": 1240,
"valid_targets_mean": 3302.9,
"valid_targets_min": 1533
},
{
"epoch": 2.11734693877551,
"grad_norm": 0.49542337740054593,
"learning_rate": 3.522353203011197e-05,
"loss": 0.1683,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17458561062812805,
"step": 1245,
"valid_targets_mean": 3551.1,
"valid_targets_min": 740
},
{
"epoch": 2.1258503401360542,
"grad_norm": 0.5262275942748199,
"learning_rate": 3.5168388197027894e-05,
"loss": 0.1608,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19332650303840637,
"step": 1250,
"valid_targets_mean": 3784.7,
"valid_targets_min": 2209
},
{
"epoch": 2.1343537414965987,
"grad_norm": 0.5194049620721893,
"learning_rate": 3.5112971568833265e-05,
"loss": 0.1561,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1369602084159851,
"step": 1255,
"valid_targets_mean": 3164.5,
"valid_targets_min": 1186
},
{
"epoch": 2.142857142857143,
"grad_norm": 0.4894157553384943,
"learning_rate": 3.505728314216563e-05,
"loss": 0.1725,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1559082269668579,
"step": 1260,
"valid_targets_mean": 3526.8,
"valid_targets_min": 1441
},
{
"epoch": 2.1513605442176873,
"grad_norm": 0.5306280181793118,
"learning_rate": 3.500132391855067e-05,
"loss": 0.182,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1700558364391327,
"step": 1265,
"valid_targets_mean": 3411.9,
"valid_targets_min": 1526
},
{
"epoch": 2.1598639455782314,
"grad_norm": 0.5439788996564396,
"learning_rate": 3.494509490438422e-05,
"loss": 0.1745,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17945188283920288,
"step": 1270,
"valid_targets_mean": 3294.2,
"valid_targets_min": 1077
},
{
"epoch": 2.1683673469387754,
"grad_norm": 0.5426839393421363,
"learning_rate": 3.4888597110914155e-05,
"loss": 0.1702,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20356306433677673,
"step": 1275,
"valid_targets_mean": 3401.2,
"valid_targets_min": 766
},
{
"epoch": 2.17687074829932,
"grad_norm": 0.49376468682501007,
"learning_rate": 3.483183155422216e-05,
"loss": 0.1551,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1475028395652771,
"step": 1280,
"valid_targets_mean": 3422.0,
"valid_targets_min": 1364
},
{
"epoch": 2.185374149659864,
"grad_norm": 0.4822219704611301,
"learning_rate": 3.477479925520555e-05,
"loss": 0.1594,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18960726261138916,
"step": 1285,
"valid_targets_mean": 3851.6,
"valid_targets_min": 701
},
{
"epoch": 2.193877551020408,
"grad_norm": 0.5238254870802262,
"learning_rate": 3.471750123955878e-05,
"loss": 0.1569,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17107030749320984,
"step": 1290,
"valid_targets_mean": 4155.1,
"valid_targets_min": 1339
},
{
"epoch": 2.2023809523809526,
"grad_norm": 0.47745457726658785,
"learning_rate": 3.465993853775516e-05,
"loss": 0.1561,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15339364111423492,
"step": 1295,
"valid_targets_mean": 4033.9,
"valid_targets_min": 1507
},
{
"epoch": 2.2108843537414966,
"grad_norm": 0.44068028477047305,
"learning_rate": 3.460211218502815e-05,
"loss": 0.1692,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1628030687570572,
"step": 1300,
"valid_targets_mean": 4219.1,
"valid_targets_min": 1276
},
{
"epoch": 2.2193877551020407,
"grad_norm": 0.6017847646540015,
"learning_rate": 3.45440232213529e-05,
"loss": 0.1773,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17169851064682007,
"step": 1305,
"valid_targets_mean": 3840.2,
"valid_targets_min": 280
},
{
"epoch": 2.227891156462585,
"grad_norm": 0.54520808841801,
"learning_rate": 3.4485672691427416e-05,
"loss": 0.1648,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14305715262889862,
"step": 1310,
"valid_targets_mean": 2790.1,
"valid_targets_min": 1090
},
{
"epoch": 2.2363945578231292,
"grad_norm": 0.5069630613900863,
"learning_rate": 3.4427061644653873e-05,
"loss": 0.1803,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14984074234962463,
"step": 1315,
"valid_targets_mean": 3722.7,
"valid_targets_min": 1552
},
{
"epoch": 2.2448979591836733,
"grad_norm": 0.5074028738160252,
"learning_rate": 3.436819113511967e-05,
"loss": 0.1553,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1426405906677246,
"step": 1320,
"valid_targets_mean": 3276.1,
"valid_targets_min": 1724
},
{
"epoch": 2.253401360544218,
"grad_norm": 0.4860031673915145,
"learning_rate": 3.43090622215785e-05,
"loss": 0.1566,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13676658272743225,
"step": 1325,
"valid_targets_mean": 3905.1,
"valid_targets_min": 910
},
{
"epoch": 2.261904761904762,
"grad_norm": 0.4673453723403358,
"learning_rate": 3.4249675967431325e-05,
"loss": 0.1502,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15425705909729004,
"step": 1330,
"valid_targets_mean": 3778.6,
"valid_targets_min": 918
},
{
"epoch": 2.270408163265306,
"grad_norm": 0.5466310303785124,
"learning_rate": 3.419003344070723e-05,
"loss": 0.1571,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15783560276031494,
"step": 1335,
"valid_targets_mean": 2919.6,
"valid_targets_min": 1198
},
{
"epoch": 2.2789115646258504,
"grad_norm": 0.5031432547752726,
"learning_rate": 3.413013571404423e-05,
"loss": 0.1729,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13498738408088684,
"step": 1340,
"valid_targets_mean": 3161.5,
"valid_targets_min": 1101
},
{
"epoch": 2.2874149659863945,
"grad_norm": 0.4510753214929706,
"learning_rate": 3.406998386466995e-05,
"loss": 0.1503,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14579127728939056,
"step": 1345,
"valid_targets_mean": 4415.7,
"valid_targets_min": 1551
},
{
"epoch": 2.295918367346939,
"grad_norm": 0.48263377269745095,
"learning_rate": 3.400957897438229e-05,
"loss": 0.1607,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15821559727191925,
"step": 1350,
"valid_targets_mean": 4076.9,
"valid_targets_min": 1378
},
{
"epoch": 2.304421768707483,
"grad_norm": 0.5644267830161144,
"learning_rate": 3.3948922129529935e-05,
"loss": 0.1615,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19237931072711945,
"step": 1355,
"valid_targets_mean": 3423.6,
"valid_targets_min": 1047
},
{
"epoch": 2.312925170068027,
"grad_norm": 0.49196181950491424,
"learning_rate": 3.388801442099286e-05,
"loss": 0.1578,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1689063459634781,
"step": 1360,
"valid_targets_mean": 3449.7,
"valid_targets_min": 1569
},
{
"epoch": 2.3214285714285716,
"grad_norm": 0.7510781582658744,
"learning_rate": 3.3826856944162655e-05,
"loss": 0.1717,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1868104636669159,
"step": 1365,
"valid_targets_mean": 3785.6,
"valid_targets_min": 1125
},
{
"epoch": 2.3299319727891157,
"grad_norm": 0.4746939257817625,
"learning_rate": 3.376545079892288e-05,
"loss": 0.181,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18635499477386475,
"step": 1370,
"valid_targets_mean": 4005.7,
"valid_targets_min": 1397
},
{
"epoch": 2.3384353741496597,
"grad_norm": 0.47890327016140144,
"learning_rate": 3.3703797089629245e-05,
"loss": 0.1725,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15403881669044495,
"step": 1375,
"valid_targets_mean": 3932.6,
"valid_targets_min": 429
},
{
"epoch": 2.3469387755102042,
"grad_norm": 0.6080390195957247,
"learning_rate": 3.364189692508976e-05,
"loss": 0.1651,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20440378785133362,
"step": 1380,
"valid_targets_mean": 3630.7,
"valid_targets_min": 1517
},
{
"epoch": 2.3554421768707483,
"grad_norm": 0.5322930693149741,
"learning_rate": 3.357975141854482e-05,
"loss": 0.1837,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26613375544548035,
"step": 1385,
"valid_targets_mean": 3968.5,
"valid_targets_min": 1073
},
{
"epoch": 2.3639455782312924,
"grad_norm": 0.4547239931273904,
"learning_rate": 3.3517361687647136e-05,
"loss": 0.1622,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1697888970375061,
"step": 1390,
"valid_targets_mean": 4553.2,
"valid_targets_min": 1024
},
{
"epoch": 2.372448979591837,
"grad_norm": 0.5000330158435863,
"learning_rate": 3.3454728854441667e-05,
"loss": 0.1647,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15525534749031067,
"step": 1395,
"valid_targets_mean": 3786.2,
"valid_targets_min": 1926
},
{
"epoch": 2.380952380952381,
"grad_norm": 0.413483824010835,
"learning_rate": 3.3391854045345437e-05,
"loss": 0.166,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15179120004177094,
"step": 1400,
"valid_targets_mean": 4099.1,
"valid_targets_min": 1398
},
{
"epoch": 2.389455782312925,
"grad_norm": 0.554412863715429,
"learning_rate": 3.332873839112727e-05,
"loss": 0.1432,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15291377902030945,
"step": 1405,
"valid_targets_mean": 3096.1,
"valid_targets_min": 1376
},
{
"epoch": 2.3979591836734695,
"grad_norm": 0.48293985993173416,
"learning_rate": 3.3265383026887464e-05,
"loss": 0.149,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14159250259399414,
"step": 1410,
"valid_targets_mean": 3414.8,
"valid_targets_min": 1532
},
{
"epoch": 2.4064625850340136,
"grad_norm": 0.5300362438284278,
"learning_rate": 3.320178909203735e-05,
"loss": 0.1672,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17707979679107666,
"step": 1415,
"valid_targets_mean": 3817.1,
"valid_targets_min": 1698
},
{
"epoch": 2.4149659863945576,
"grad_norm": 0.6038778356769944,
"learning_rate": 3.313795773027885e-05,
"loss": 0.1639,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19175416231155396,
"step": 1420,
"valid_targets_mean": 3383.4,
"valid_targets_min": 590
},
{
"epoch": 2.423469387755102,
"grad_norm": 0.6333836363677777,
"learning_rate": 3.307389008958385e-05,
"loss": 0.1554,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16913290321826935,
"step": 1425,
"valid_targets_mean": 2575.2,
"valid_targets_min": 787
},
{
"epoch": 2.431972789115646,
"grad_norm": 0.47277667370501736,
"learning_rate": 3.30095873221736e-05,
"loss": 0.1547,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15604209899902344,
"step": 1430,
"valid_targets_mean": 3869.1,
"valid_targets_min": 1412
},
{
"epoch": 2.4404761904761907,
"grad_norm": 0.477865671202061,
"learning_rate": 3.294505058449797e-05,
"loss": 0.1695,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18286634981632233,
"step": 1435,
"valid_targets_mean": 5235.6,
"valid_targets_min": 1369
},
{
"epoch": 2.4489795918367347,
"grad_norm": 0.48362971440543534,
"learning_rate": 3.288028103721465e-05,
"loss": 0.1646,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15418080985546112,
"step": 1440,
"valid_targets_mean": 3559.9,
"valid_targets_min": 414
},
{
"epoch": 2.457482993197279,
"grad_norm": 0.5232022183706239,
"learning_rate": 3.2815279845168296e-05,
"loss": 0.1634,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18612605333328247,
"step": 1445,
"valid_targets_mean": 3365.7,
"valid_targets_min": 1283
},
{
"epoch": 2.4659863945578233,
"grad_norm": 0.506042116749104,
"learning_rate": 3.2750048177369554e-05,
"loss": 0.1527,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18770621716976166,
"step": 1450,
"valid_targets_mean": 3635.6,
"valid_targets_min": 1733
},
{
"epoch": 2.4744897959183674,
"grad_norm": 0.572670882166851,
"learning_rate": 3.268458720697406e-05,
"loss": 0.1677,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14232869446277618,
"step": 1455,
"valid_targets_mean": 2885.1,
"valid_targets_min": 1269
},
{
"epoch": 2.4829931972789114,
"grad_norm": 0.5196864471454508,
"learning_rate": 3.2618898111261316e-05,
"loss": 0.1659,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13820812106132507,
"step": 1460,
"valid_targets_mean": 3341.0,
"valid_targets_min": 820
},
{
"epoch": 2.491496598639456,
"grad_norm": 0.5015347039801419,
"learning_rate": 3.2552982071613555e-05,
"loss": 0.15,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13426734507083893,
"step": 1465,
"valid_targets_mean": 3133.6,
"valid_targets_min": 1657
},
{
"epoch": 2.5,
"grad_norm": 0.4921036727094327,
"learning_rate": 3.248684027349445e-05,
"loss": 0.1549,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14220476150512695,
"step": 1470,
"valid_targets_mean": 3232.5,
"valid_targets_min": 1359
},
{
"epoch": 2.508503401360544,
"grad_norm": 0.44217854739998835,
"learning_rate": 3.2420473906427824e-05,
"loss": 0.1635,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17743223905563354,
"step": 1475,
"valid_targets_mean": 4313.5,
"valid_targets_min": 1603
},
{
"epoch": 2.5170068027210886,
"grad_norm": 0.4778736306901132,
"learning_rate": 3.235388416397626e-05,
"loss": 0.1512,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16074007749557495,
"step": 1480,
"valid_targets_mean": 3948.7,
"valid_targets_min": 1540
},
{
"epoch": 2.5255102040816326,
"grad_norm": 0.6095052805264233,
"learning_rate": 3.228707224371961e-05,
"loss": 0.1599,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17271192371845245,
"step": 1485,
"valid_targets_mean": 3558.2,
"valid_targets_min": 1375
},
{
"epoch": 2.534013605442177,
"grad_norm": 0.45590045375975136,
"learning_rate": 3.222003934723347e-05,
"loss": 0.1654,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1279994696378708,
"step": 1490,
"valid_targets_mean": 3846.9,
"valid_targets_min": 1859
},
{
"epoch": 2.542517006802721,
"grad_norm": 0.49738813457635117,
"learning_rate": 3.215278668006757e-05,
"loss": 0.1636,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1717885434627533,
"step": 1495,
"valid_targets_mean": 3760.4,
"valid_targets_min": 1279
},
{
"epoch": 2.5510204081632653,
"grad_norm": 0.4090299383293233,
"learning_rate": 3.208531545172413e-05,
"loss": 0.1552,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15844562649726868,
"step": 1500,
"valid_targets_mean": 4329.8,
"valid_targets_min": 1368
},
{
"epoch": 2.5595238095238093,
"grad_norm": 0.5431786244764008,
"learning_rate": 3.2017626875636024e-05,
"loss": 0.1546,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14518578350543976,
"step": 1505,
"valid_targets_mean": 3229.6,
"valid_targets_min": 1434
},
{
"epoch": 2.568027210884354,
"grad_norm": 0.49615820264902144,
"learning_rate": 3.194972216914502e-05,
"loss": 0.1529,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1399931013584137,
"step": 1510,
"valid_targets_mean": 3413.1,
"valid_targets_min": 670
},
{
"epoch": 2.576530612244898,
"grad_norm": 0.9718435300877193,
"learning_rate": 3.18816025534799e-05,
"loss": 0.1888,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1514762043952942,
"step": 1515,
"valid_targets_mean": 3781.0,
"valid_targets_min": 1671
},
{
"epoch": 2.5850340136054424,
"grad_norm": 0.5068549521619831,
"learning_rate": 3.181326925373443e-05,
"loss": 0.177,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19092750549316406,
"step": 1520,
"valid_targets_mean": 4007.5,
"valid_targets_min": 1248
},
{
"epoch": 2.5935374149659864,
"grad_norm": 0.47078024333063895,
"learning_rate": 3.174472349884539e-05,
"loss": 0.1794,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13935624063014984,
"step": 1525,
"valid_targets_mean": 3828.7,
"valid_targets_min": 893
},
{
"epoch": 2.6020408163265305,
"grad_norm": 0.4738214558863609,
"learning_rate": 3.1675966521570444e-05,
"loss": 0.1616,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14629226922988892,
"step": 1530,
"valid_targets_mean": 3698.9,
"valid_targets_min": 1408
},
{
"epoch": 2.6105442176870746,
"grad_norm": 0.49017231137420236,
"learning_rate": 3.160699955846597e-05,
"loss": 0.1658,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15869465470314026,
"step": 1535,
"valid_targets_mean": 3895.1,
"valid_targets_min": 1622
},
{
"epoch": 2.619047619047619,
"grad_norm": 0.5202593666777702,
"learning_rate": 3.1537823849864834e-05,
"loss": 0.1703,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20912855863571167,
"step": 1540,
"valid_targets_mean": 3743.7,
"valid_targets_min": 912
},
{
"epoch": 2.627551020408163,
"grad_norm": 0.5005906380020121,
"learning_rate": 3.1468440639854056e-05,
"loss": 0.1535,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13278600573539734,
"step": 1545,
"valid_targets_mean": 3161.0,
"valid_targets_min": 1611
},
{
"epoch": 2.6360544217687076,
"grad_norm": 0.4999686965484099,
"learning_rate": 3.139885117625249e-05,
"loss": 0.1587,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15896578133106232,
"step": 1550,
"valid_targets_mean": 3742.4,
"valid_targets_min": 1355
},
{
"epoch": 2.6445578231292517,
"grad_norm": 0.5263565414304656,
"learning_rate": 3.132905671058831e-05,
"loss": 0.1594,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18690796196460724,
"step": 1555,
"valid_targets_mean": 4175.1,
"valid_targets_min": 1608
},
{
"epoch": 2.6530612244897958,
"grad_norm": 0.46022006535755816,
"learning_rate": 3.1259058498076554e-05,
"loss": 0.158,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1319347470998764,
"step": 1560,
"valid_targets_mean": 3780.4,
"valid_targets_min": 1459
},
{
"epoch": 2.6615646258503403,
"grad_norm": 0.48588937455117837,
"learning_rate": 3.1188857797596545e-05,
"loss": 0.1568,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12452636659145355,
"step": 1565,
"valid_targets_mean": 2937.5,
"valid_targets_min": 1096
},
{
"epoch": 2.6700680272108843,
"grad_norm": 0.5191575759086287,
"learning_rate": 3.111845587166922e-05,
"loss": 0.1654,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2404664009809494,
"step": 1570,
"valid_targets_mean": 4137.2,
"valid_targets_min": 1510
},
{
"epoch": 2.678571428571429,
"grad_norm": 0.5208651523922655,
"learning_rate": 3.104785398643447e-05,
"loss": 0.1648,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14865821599960327,
"step": 1575,
"valid_targets_mean": 2932.2,
"valid_targets_min": 292
},
{
"epoch": 2.687074829931973,
"grad_norm": 0.4114567953463469,
"learning_rate": 3.0977053411628315e-05,
"loss": 0.1462,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14979563653469086,
"step": 1580,
"valid_targets_mean": 4161.8,
"valid_targets_min": 1572
},
{
"epoch": 2.695578231292517,
"grad_norm": 0.4913074740374502,
"learning_rate": 3.090605542056013e-05,
"loss": 0.1776,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15900972485542297,
"step": 1585,
"valid_targets_mean": 3456.5,
"valid_targets_min": 1115
},
{
"epoch": 2.704081632653061,
"grad_norm": 0.4442392356579173,
"learning_rate": 3.083486129008967e-05,
"loss": 0.1664,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18399524688720703,
"step": 1590,
"valid_targets_mean": 4740.0,
"valid_targets_min": 1565
},
{
"epoch": 2.7125850340136055,
"grad_norm": 0.4754861826964586,
"learning_rate": 3.07634723006042e-05,
"loss": 0.1602,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1808849275112152,
"step": 1595,
"valid_targets_mean": 4251.0,
"valid_targets_min": 1249
},
{
"epoch": 2.7210884353741496,
"grad_norm": 0.4655468525053816,
"learning_rate": 3.069188973599538e-05,
"loss": 0.1513,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1294795274734497,
"step": 1600,
"valid_targets_mean": 3314.2,
"valid_targets_min": 723
},
{
"epoch": 2.729591836734694,
"grad_norm": 0.43464410382803953,
"learning_rate": 3.062011488363623e-05,
"loss": 0.1562,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.147240549325943,
"step": 1605,
"valid_targets_mean": 3935.8,
"valid_targets_min": 1130
},
{
"epoch": 2.738095238095238,
"grad_norm": 0.46040122910771636,
"learning_rate": 3.054814903435794e-05,
"loss": 0.1624,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14695018529891968,
"step": 1610,
"valid_targets_mean": 3722.0,
"valid_targets_min": 1673
},
{
"epoch": 2.746598639455782,
"grad_norm": 0.45733532745749556,
"learning_rate": 3.0475993482426695e-05,
"loss": 0.1705,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2099800556898117,
"step": 1615,
"valid_targets_mean": 4918.6,
"valid_targets_min": 1845
},
{
"epoch": 2.7551020408163263,
"grad_norm": 0.4956060655830285,
"learning_rate": 3.0403649525520374e-05,
"loss": 0.1727,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18889182806015015,
"step": 1620,
"valid_targets_mean": 3856.4,
"valid_targets_min": 988
},
{
"epoch": 2.7636054421768708,
"grad_norm": 0.4768716386514472,
"learning_rate": 3.033111846470521e-05,
"loss": 0.156,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15743374824523926,
"step": 1625,
"valid_targets_mean": 3608.8,
"valid_targets_min": 872
},
{
"epoch": 2.772108843537415,
"grad_norm": 0.525730309515445,
"learning_rate": 3.02584016044124e-05,
"loss": 0.1562,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15813755989074707,
"step": 1630,
"valid_targets_mean": 3100.8,
"valid_targets_min": 642
},
{
"epoch": 2.7806122448979593,
"grad_norm": 0.5351477674686339,
"learning_rate": 3.0185500252414633e-05,
"loss": 0.1613,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16096732020378113,
"step": 1635,
"valid_targets_mean": 3815.7,
"valid_targets_min": 1239
},
{
"epoch": 2.7891156462585034,
"grad_norm": 0.4716262544441501,
"learning_rate": 3.01124157198026e-05,
"loss": 0.1635,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1661742478609085,
"step": 1640,
"valid_targets_mean": 3724.4,
"valid_targets_min": 1140
},
{
"epoch": 2.7976190476190474,
"grad_norm": 0.4138239303384503,
"learning_rate": 3.003914932096137e-05,
"loss": 0.1554,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16232448816299438,
"step": 1645,
"valid_targets_mean": 4448.6,
"valid_targets_min": 1633
},
{
"epoch": 2.806122448979592,
"grad_norm": 0.46852819112237687,
"learning_rate": 2.99657023735468e-05,
"loss": 0.1726,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20756766200065613,
"step": 1650,
"valid_targets_mean": 4463.3,
"valid_targets_min": 1380
},
{
"epoch": 2.814625850340136,
"grad_norm": 0.39483602863790196,
"learning_rate": 2.9892076198461794e-05,
"loss": 0.153,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1203012689948082,
"step": 1655,
"valid_targets_mean": 4115.1,
"valid_targets_min": 859
},
{
"epoch": 2.8231292517006805,
"grad_norm": 0.48880278190048604,
"learning_rate": 2.9818272119832576e-05,
"loss": 0.1598,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17082348465919495,
"step": 1660,
"valid_targets_mean": 3551.8,
"valid_targets_min": 692
},
{
"epoch": 2.8316326530612246,
"grad_norm": 0.41769851905531785,
"learning_rate": 2.974429146498487e-05,
"loss": 0.1546,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1666543036699295,
"step": 1665,
"valid_targets_mean": 4539.7,
"valid_targets_min": 1299
},
{
"epoch": 2.8401360544217686,
"grad_norm": 0.5016505396489435,
"learning_rate": 2.9670135564420016e-05,
"loss": 0.1596,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1940472573041916,
"step": 1670,
"valid_targets_mean": 3977.4,
"valid_targets_min": 1537
},
{
"epoch": 2.8486394557823127,
"grad_norm": 0.5166302635070413,
"learning_rate": 2.9595805751791068e-05,
"loss": 0.1684,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17951983213424683,
"step": 1675,
"valid_targets_mean": 3933.2,
"valid_targets_min": 793
},
{
"epoch": 2.857142857142857,
"grad_norm": 0.5379845678232543,
"learning_rate": 2.9521303363878774e-05,
"loss": 0.152,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1659054160118103,
"step": 1680,
"valid_targets_mean": 2871.5,
"valid_targets_min": 1082
},
{
"epoch": 2.8656462585034013,
"grad_norm": 0.4656889105961351,
"learning_rate": 2.9446629740567566e-05,
"loss": 0.1741,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16753873229026794,
"step": 1685,
"valid_targets_mean": 3887.4,
"valid_targets_min": 795
},
{
"epoch": 2.8741496598639458,
"grad_norm": 0.4930852645072521,
"learning_rate": 2.9371786224821447e-05,
"loss": 0.1735,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16282245516777039,
"step": 1690,
"valid_targets_mean": 3396.2,
"valid_targets_min": 1712
},
{
"epoch": 2.88265306122449,
"grad_norm": 0.4445771945139776,
"learning_rate": 2.9296774162659836e-05,
"loss": 0.1749,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1767793595790863,
"step": 1695,
"valid_targets_mean": 4715.9,
"valid_targets_min": 1373
},
{
"epoch": 2.891156462585034,
"grad_norm": 0.543109477480171,
"learning_rate": 2.9221594903133385e-05,
"loss": 0.1592,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14414627850055695,
"step": 1700,
"valid_targets_mean": 3009.1,
"valid_targets_min": 325
},
{
"epoch": 2.8996598639455784,
"grad_norm": 0.5234711869685756,
"learning_rate": 2.9146249798299672e-05,
"loss": 0.162,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.160060852766037,
"step": 1705,
"valid_targets_mean": 3624.4,
"valid_targets_min": 1171
},
{
"epoch": 2.9081632653061225,
"grad_norm": 0.4908520083423699,
"learning_rate": 2.9070740203198927e-05,
"loss": 0.1741,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1625441312789917,
"step": 1710,
"valid_targets_mean": 3220.1,
"valid_targets_min": 1120
},
{
"epoch": 2.9166666666666665,
"grad_norm": 0.4785558145751867,
"learning_rate": 2.899506747582965e-05,
"loss": 0.1631,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17338773608207703,
"step": 1715,
"valid_targets_mean": 3640.5,
"valid_targets_min": 906
},
{
"epoch": 2.925170068027211,
"grad_norm": 0.5088298122894733,
"learning_rate": 2.8919232977124177e-05,
"loss": 0.1694,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1554885059595108,
"step": 1720,
"valid_targets_mean": 3226.2,
"valid_targets_min": 1437
},
{
"epoch": 2.933673469387755,
"grad_norm": 0.453368913569161,
"learning_rate": 2.884323807092423e-05,
"loss": 0.1602,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17843785881996155,
"step": 1725,
"valid_targets_mean": 4037.4,
"valid_targets_min": 1673
},
{
"epoch": 2.942176870748299,
"grad_norm": 0.5177514931490083,
"learning_rate": 2.8767084123956334e-05,
"loss": 0.1706,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.178394615650177,
"step": 1730,
"valid_targets_mean": 3508.4,
"valid_targets_min": 1662
},
{
"epoch": 2.9506802721088436,
"grad_norm": 0.5779374351888202,
"learning_rate": 2.8690772505807307e-05,
"loss": 0.173,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18779624998569489,
"step": 1735,
"valid_targets_mean": 3212.1,
"valid_targets_min": 1016
},
{
"epoch": 2.9591836734693877,
"grad_norm": 0.5146721357707493,
"learning_rate": 2.8614304588899588e-05,
"loss": 0.1467,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15629920363426208,
"step": 1740,
"valid_targets_mean": 4015.6,
"valid_targets_min": 1070
},
{
"epoch": 2.967687074829932,
"grad_norm": 0.5189251797092681,
"learning_rate": 2.8537681748466557e-05,
"loss": 0.1634,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1510303020477295,
"step": 1745,
"valid_targets_mean": 3674.2,
"valid_targets_min": 1773
},
{
"epoch": 2.9761904761904763,
"grad_norm": 0.46502180173420404,
"learning_rate": 2.8460905362527832e-05,
"loss": 0.149,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15194571018218994,
"step": 1750,
"valid_targets_mean": 3294.1,
"valid_targets_min": 1422
},
{
"epoch": 2.9846938775510203,
"grad_norm": 0.4304082658436519,
"learning_rate": 2.8383976811864416e-05,
"loss": 0.1708,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20454227924346924,
"step": 1755,
"valid_targets_mean": 4752.8,
"valid_targets_min": 1493
},
{
"epoch": 2.9931972789115644,
"grad_norm": 0.508324313644312,
"learning_rate": 2.8306897479993954e-05,
"loss": 0.1723,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18964369595050812,
"step": 1760,
"valid_targets_mean": 3695.0,
"valid_targets_min": 629
},
{
"epoch": 3.001700680272109,
"grad_norm": 0.4784598662881332,
"learning_rate": 2.8229668753145797e-05,
"loss": 0.1735,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1313592791557312,
"step": 1765,
"valid_targets_mean": 3611.9,
"valid_targets_min": 1092
},
{
"epoch": 3.010204081632653,
"grad_norm": 0.8446031086831215,
"learning_rate": 2.815229202023607e-05,
"loss": 0.1375,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1230715960264206,
"step": 1770,
"valid_targets_mean": 3435.1,
"valid_targets_min": 1306
},
{
"epoch": 3.0187074829931975,
"grad_norm": 0.492834562909989,
"learning_rate": 2.8074768672842716e-05,
"loss": 0.1425,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1337684690952301,
"step": 1775,
"valid_targets_mean": 4209.7,
"valid_targets_min": 1836
},
{
"epoch": 3.0272108843537415,
"grad_norm": 0.4601608816984647,
"learning_rate": 2.7997100105180455e-05,
"loss": 0.1358,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1252722293138504,
"step": 1780,
"valid_targets_mean": 4082.4,
"valid_targets_min": 1347
},
{
"epoch": 3.0357142857142856,
"grad_norm": 0.5489375507244738,
"learning_rate": 2.7919287714075714e-05,
"loss": 0.1546,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18662264943122864,
"step": 1785,
"valid_targets_mean": 3715.5,
"valid_targets_min": 1090
},
{
"epoch": 3.04421768707483,
"grad_norm": 0.5083714260327757,
"learning_rate": 2.7841332898941513e-05,
"loss": 0.1452,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16233694553375244,
"step": 1790,
"valid_targets_mean": 3814.8,
"valid_targets_min": 1574
},
{
"epoch": 3.052721088435374,
"grad_norm": 0.6619518014596226,
"learning_rate": 2.7763237061752276e-05,
"loss": 0.1309,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11884614080190659,
"step": 1795,
"valid_targets_mean": 3849.1,
"valid_targets_min": 1576
},
{
"epoch": 3.061224489795918,
"grad_norm": 0.4621308813867603,
"learning_rate": 2.768500160701864e-05,
"loss": 0.1377,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1337064951658249,
"step": 1800,
"valid_targets_mean": 4491.9,
"valid_targets_min": 1548
},
{
"epoch": 3.0697278911564627,
"grad_norm": 0.46021745248167184,
"learning_rate": 2.7606627941762186e-05,
"loss": 0.1333,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10864484310150146,
"step": 1805,
"valid_targets_mean": 3335.6,
"valid_targets_min": 1564
},
{
"epoch": 3.078231292517007,
"grad_norm": 0.5483839712270409,
"learning_rate": 2.752811747549013e-05,
"loss": 0.1512,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1714896559715271,
"step": 1810,
"valid_targets_mean": 3205.5,
"valid_targets_min": 1136
},
{
"epoch": 3.086734693877551,
"grad_norm": 0.5202727539029218,
"learning_rate": 2.7449471620169988e-05,
"loss": 0.149,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11642484366893768,
"step": 1815,
"valid_targets_mean": 3250.6,
"valid_targets_min": 826
},
{
"epoch": 3.0952380952380953,
"grad_norm": 0.5993960429294215,
"learning_rate": 2.7370691790204173e-05,
"loss": 0.1655,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14193883538246155,
"step": 1820,
"valid_targets_mean": 3056.0,
"valid_targets_min": 1417
},
{
"epoch": 3.1037414965986394,
"grad_norm": 0.4559839126604544,
"learning_rate": 2.7291779402404538e-05,
"loss": 0.1423,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1268749088048935,
"step": 1825,
"valid_targets_mean": 3777.4,
"valid_targets_min": 1210
},
{
"epoch": 3.1122448979591835,
"grad_norm": 0.5604579578162319,
"learning_rate": 2.7212735875966946e-05,
"loss": 0.1374,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12619996070861816,
"step": 1830,
"valid_targets_mean": 3083.2,
"valid_targets_min": 668
},
{
"epoch": 3.120748299319728,
"grad_norm": 0.5438820371018678,
"learning_rate": 2.713356263244569e-05,
"loss": 0.143,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1503400355577469,
"step": 1835,
"valid_targets_mean": 4212.8,
"valid_targets_min": 1288
},
{
"epoch": 3.129251700680272,
"grad_norm": 0.5195545679371458,
"learning_rate": 2.7054261095727977e-05,
"loss": 0.1494,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16384392976760864,
"step": 1840,
"valid_targets_mean": 3396.9,
"valid_targets_min": 1215
},
{
"epoch": 3.137755102040816,
"grad_norm": 0.5113512295726848,
"learning_rate": 2.6974832692008278e-05,
"loss": 0.1511,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14530371129512787,
"step": 1845,
"valid_targets_mean": 3812.4,
"valid_targets_min": 468
},
{
"epoch": 3.1462585034013606,
"grad_norm": 0.49306040169984283,
"learning_rate": 2.6895278849762694e-05,
"loss": 0.1409,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14059320092201233,
"step": 1850,
"valid_targets_mean": 4135.6,
"valid_targets_min": 1137
},
{
"epoch": 3.1547619047619047,
"grad_norm": 0.4826789386729217,
"learning_rate": 2.68156009997233e-05,
"loss": 0.1374,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12108274549245834,
"step": 1855,
"valid_targets_mean": 3404.0,
"valid_targets_min": 1535
},
{
"epoch": 3.163265306122449,
"grad_norm": 0.509069211171738,
"learning_rate": 2.673580057485234e-05,
"loss": 0.1376,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1607593148946762,
"step": 1860,
"valid_targets_mean": 3872.3,
"valid_targets_min": 1520
},
{
"epoch": 3.171768707482993,
"grad_norm": 0.5481617769731713,
"learning_rate": 2.6655879010316535e-05,
"loss": 0.1616,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19412599503993988,
"step": 1865,
"valid_targets_mean": 3780.2,
"valid_targets_min": 1849
},
{
"epoch": 3.1802721088435373,
"grad_norm": 0.4726239103908885,
"learning_rate": 2.657583774346121e-05,
"loss": 0.1426,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14381511509418488,
"step": 1870,
"valid_targets_mean": 4229.1,
"valid_targets_min": 1817
},
{
"epoch": 3.188775510204082,
"grad_norm": 0.5674638452522066,
"learning_rate": 2.649567821378449e-05,
"loss": 0.1439,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13234567642211914,
"step": 1875,
"valid_targets_mean": 2603.2,
"valid_targets_min": 1594
},
{
"epoch": 3.197278911564626,
"grad_norm": 0.4844284742271353,
"learning_rate": 2.641540186291138e-05,
"loss": 0.1321,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11232699453830719,
"step": 1880,
"valid_targets_mean": 3777.3,
"valid_targets_min": 414
},
{
"epoch": 3.20578231292517,
"grad_norm": 0.5928341730053119,
"learning_rate": 2.6335010134567852e-05,
"loss": 0.1446,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1312047839164734,
"step": 1885,
"valid_targets_mean": 3397.1,
"valid_targets_min": 1745
},
{
"epoch": 3.2142857142857144,
"grad_norm": 0.45839469775941877,
"learning_rate": 2.6254504474554883e-05,
"loss": 0.1567,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1701536476612091,
"step": 1890,
"valid_targets_mean": 4128.9,
"valid_targets_min": 1446
},
{
"epoch": 3.2227891156462585,
"grad_norm": 0.5008710719767632,
"learning_rate": 2.617388633072244e-05,
"loss": 0.1362,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15137995779514313,
"step": 1895,
"valid_targets_mean": 3451.7,
"valid_targets_min": 1403
},
{
"epoch": 3.2312925170068025,
"grad_norm": 0.5827041310129761,
"learning_rate": 2.609315715294346e-05,
"loss": 0.1451,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14786767959594727,
"step": 1900,
"valid_targets_mean": 3197.5,
"valid_targets_min": 844
},
{
"epoch": 3.239795918367347,
"grad_norm": 0.4774939218788078,
"learning_rate": 2.6012318393087754e-05,
"loss": 0.143,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12262146174907684,
"step": 1905,
"valid_targets_mean": 3974.2,
"valid_targets_min": 1129
},
{
"epoch": 3.248299319727891,
"grad_norm": 2.3012934366864584,
"learning_rate": 2.593137150499591e-05,
"loss": 0.1398,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16141125559806824,
"step": 1910,
"valid_targets_mean": 3124.3,
"valid_targets_min": 1540
},
{
"epoch": 3.2568027210884356,
"grad_norm": 0.5643599785855004,
"learning_rate": 2.5850317944453153e-05,
"loss": 0.1363,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12558527290821075,
"step": 1915,
"valid_targets_mean": 3054.8,
"valid_targets_min": 1355
},
{
"epoch": 3.2653061224489797,
"grad_norm": 0.47636899169835173,
"learning_rate": 2.5769159169163137e-05,
"loss": 0.146,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12280717492103577,
"step": 1920,
"valid_targets_mean": 4109.9,
"valid_targets_min": 738
},
{
"epoch": 3.2738095238095237,
"grad_norm": 0.5063508169912114,
"learning_rate": 2.568789663872175e-05,
"loss": 0.1353,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15989241003990173,
"step": 1925,
"valid_targets_mean": 3856.1,
"valid_targets_min": 1107
},
{
"epoch": 3.282312925170068,
"grad_norm": 0.4811148388189251,
"learning_rate": 2.5606531814590868e-05,
"loss": 0.1366,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1412792056798935,
"step": 1930,
"valid_targets_mean": 3863.6,
"valid_targets_min": 1217
},
{
"epoch": 3.2908163265306123,
"grad_norm": 0.49396827270191446,
"learning_rate": 2.552506616007205e-05,
"loss": 0.1629,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16188889741897583,
"step": 1935,
"valid_targets_mean": 4214.9,
"valid_targets_min": 1171
},
{
"epoch": 3.2993197278911564,
"grad_norm": 0.5027361991896958,
"learning_rate": 2.544350114028025e-05,
"loss": 0.1369,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12943832576274872,
"step": 1940,
"valid_targets_mean": 3637.8,
"valid_targets_min": 1012
},
{
"epoch": 3.307823129251701,
"grad_norm": 0.493648390936752,
"learning_rate": 2.5361838222117435e-05,
"loss": 0.1544,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1386047899723053,
"step": 1945,
"valid_targets_mean": 3566.7,
"valid_targets_min": 906
},
{
"epoch": 3.316326530612245,
"grad_norm": 0.4934917907617171,
"learning_rate": 2.5280078874246227e-05,
"loss": 0.1413,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1620742529630661,
"step": 1950,
"valid_targets_mean": 3895.6,
"valid_targets_min": 1382
},
{
"epoch": 3.324829931972789,
"grad_norm": 0.5812143740145603,
"learning_rate": 2.519822456706349e-05,
"loss": 0.1518,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17321470379829407,
"step": 1955,
"valid_targets_mean": 3244.1,
"valid_targets_min": 1364
},
{
"epoch": 3.3333333333333335,
"grad_norm": 0.5157880709455498,
"learning_rate": 2.5116276772673863e-05,
"loss": 0.1653,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23097273707389832,
"step": 1960,
"valid_targets_mean": 4115.7,
"valid_targets_min": 1517
},
{
"epoch": 3.3418367346938775,
"grad_norm": 0.44313842009506144,
"learning_rate": 2.503423696486332e-05,
"loss": 0.1388,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13994191586971283,
"step": 1965,
"valid_targets_mean": 4884.8,
"valid_targets_min": 868
},
{
"epoch": 3.3503401360544216,
"grad_norm": 0.4904305036943379,
"learning_rate": 2.495210661907263e-05,
"loss": 0.1395,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1328560709953308,
"step": 1970,
"valid_targets_mean": 3285.6,
"valid_targets_min": 506
},
{
"epoch": 3.358843537414966,
"grad_norm": 0.5443084350560426,
"learning_rate": 2.4869887212370847e-05,
"loss": 0.161,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12956424057483673,
"step": 1975,
"valid_targets_mean": 3053.5,
"valid_targets_min": 1435
},
{
"epoch": 3.36734693877551,
"grad_norm": 0.4573267525975133,
"learning_rate": 2.4787580223428736e-05,
"loss": 0.1337,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11794184893369675,
"step": 1980,
"valid_targets_mean": 3524.2,
"valid_targets_min": 1558
},
{
"epoch": 3.3758503401360542,
"grad_norm": 0.48589338823426165,
"learning_rate": 2.470518713249217e-05,
"loss": 0.1445,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14002826809883118,
"step": 1985,
"valid_targets_mean": 3914.6,
"valid_targets_min": 1507
},
{
"epoch": 3.3843537414965987,
"grad_norm": 0.5119561537935591,
"learning_rate": 2.4622709421355535e-05,
"loss": 0.1374,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15183639526367188,
"step": 1990,
"valid_targets_mean": 3411.4,
"valid_targets_min": 1311
},
{
"epoch": 3.392857142857143,
"grad_norm": 0.48761202799121056,
"learning_rate": 2.4540148573335057e-05,
"loss": 0.1305,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14358212053775787,
"step": 1995,
"valid_targets_mean": 3778.9,
"valid_targets_min": 1430
},
{
"epoch": 3.4013605442176873,
"grad_norm": 0.5091769846013783,
"learning_rate": 2.445750607324212e-05,
"loss": 0.1283,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12895150482654572,
"step": 2000,
"valid_targets_mean": 3439.9,
"valid_targets_min": 1228
},
{
"epoch": 3.4098639455782314,
"grad_norm": 0.46277855706597215,
"learning_rate": 2.4374783407356602e-05,
"loss": 0.1502,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13825930655002594,
"step": 2005,
"valid_targets_mean": 4161.5,
"valid_targets_min": 1542
},
{
"epoch": 3.4183673469387754,
"grad_norm": 0.5182823416136738,
"learning_rate": 2.4291982063400096e-05,
"loss": 0.1536,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15307000279426575,
"step": 2010,
"valid_targets_mean": 3669.1,
"valid_targets_min": 2351
},
{
"epoch": 3.4268707482993195,
"grad_norm": 0.48047265886653706,
"learning_rate": 2.4209103530509196e-05,
"loss": 0.1403,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1290254145860672,
"step": 2015,
"valid_targets_mean": 3352.1,
"valid_targets_min": 1254
},
{
"epoch": 3.435374149659864,
"grad_norm": 0.5466523776690688,
"learning_rate": 2.412614929920868e-05,
"loss": 0.1585,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17689591646194458,
"step": 2020,
"valid_targets_mean": 3302.2,
"valid_targets_min": 1393
},
{
"epoch": 3.443877551020408,
"grad_norm": 0.5840183574717508,
"learning_rate": 2.4043120861384723e-05,
"loss": 0.1496,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18398138880729675,
"step": 2025,
"valid_targets_mean": 3467.4,
"valid_targets_min": 1710
},
{
"epoch": 3.4523809523809526,
"grad_norm": 0.4786308924135924,
"learning_rate": 2.3960019710258068e-05,
"loss": 0.1489,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13967232406139374,
"step": 2030,
"valid_targets_mean": 4170.2,
"valid_targets_min": 1800
},
{
"epoch": 3.4608843537414966,
"grad_norm": 0.4724083960800044,
"learning_rate": 2.3876847340357164e-05,
"loss": 0.1635,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14074461162090302,
"step": 2035,
"valid_targets_mean": 3416.8,
"valid_targets_min": 1551
},
{
"epoch": 3.4693877551020407,
"grad_norm": 0.552558554312206,
"learning_rate": 2.3793605247491303e-05,
"loss": 0.1541,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20764395594596863,
"step": 2040,
"valid_targets_mean": 4187.3,
"valid_targets_min": 1424
},
{
"epoch": 3.477891156462585,
"grad_norm": 0.5163498510728093,
"learning_rate": 2.371029492872369e-05,
"loss": 0.1422,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14693160355091095,
"step": 2045,
"valid_targets_mean": 3235.4,
"valid_targets_min": 261
},
{
"epoch": 3.4863945578231292,
"grad_norm": 0.5013959306377093,
"learning_rate": 2.362691788234453e-05,
"loss": 0.1497,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12825211882591248,
"step": 2050,
"valid_targets_mean": 3316.6,
"valid_targets_min": 272
},
{
"epoch": 3.4948979591836733,
"grad_norm": 0.4607494767645447,
"learning_rate": 2.3543475607844105e-05,
"loss": 0.1536,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15415170788764954,
"step": 2055,
"valid_targets_mean": 4641.1,
"valid_targets_min": 1383
},
{
"epoch": 3.503401360544218,
"grad_norm": 0.4920567824742292,
"learning_rate": 2.3459969605885785e-05,
"loss": 0.151,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17793437838554382,
"step": 2060,
"valid_targets_mean": 4237.8,
"valid_targets_min": 648
},
{
"epoch": 3.511904761904762,
"grad_norm": 0.5174711622509411,
"learning_rate": 2.3376401378279037e-05,
"loss": 0.1324,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1297653764486313,
"step": 2065,
"valid_targets_mean": 2994.3,
"valid_targets_min": 1413
},
{
"epoch": 3.520408163265306,
"grad_norm": 0.5163717376042865,
"learning_rate": 2.329277242795243e-05,
"loss": 0.1431,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15077583491802216,
"step": 2070,
"valid_targets_mean": 3868.8,
"valid_targets_min": 804
},
{
"epoch": 3.5289115646258504,
"grad_norm": 0.5086218045854233,
"learning_rate": 2.320908425892658e-05,
"loss": 0.1497,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14013858139514923,
"step": 2075,
"valid_targets_mean": 2993.7,
"valid_targets_min": 649
},
{
"epoch": 3.5374149659863945,
"grad_norm": 0.5462773846852057,
"learning_rate": 2.3125338376287137e-05,
"loss": 0.1315,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14993932843208313,
"step": 2080,
"valid_targets_mean": 3203.9,
"valid_targets_min": 1236
},
{
"epoch": 3.545918367346939,
"grad_norm": 0.5093830788049976,
"learning_rate": 2.3041536286157706e-05,
"loss": 0.1451,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12546180188655853,
"step": 2085,
"valid_targets_mean": 3676.3,
"valid_targets_min": 1378
},
{
"epoch": 3.554421768707483,
"grad_norm": 0.5074306671591432,
"learning_rate": 2.295767949567272e-05,
"loss": 0.1455,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12795674800872803,
"step": 2090,
"valid_targets_mean": 3516.2,
"valid_targets_min": 844
},
{
"epoch": 3.562925170068027,
"grad_norm": 0.4896441751448396,
"learning_rate": 2.28737695129504e-05,
"loss": 0.1427,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1324068009853363,
"step": 2095,
"valid_targets_mean": 3447.2,
"valid_targets_min": 1590
},
{
"epoch": 3.571428571428571,
"grad_norm": 0.5013956210638618,
"learning_rate": 2.2789807847065574e-05,
"loss": 0.1375,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13823112845420837,
"step": 2100,
"valid_targets_mean": 3616.2,
"valid_targets_min": 777
},
{
"epoch": 3.5799319727891157,
"grad_norm": 0.5306077891974634,
"learning_rate": 2.2705796008022592e-05,
"loss": 0.1467,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14960964024066925,
"step": 2105,
"valid_targets_mean": 3087.6,
"valid_targets_min": 1262
},
{
"epoch": 3.5884353741496597,
"grad_norm": 0.44147190175386997,
"learning_rate": 2.2621735506728126e-05,
"loss": 0.1377,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11909447610378265,
"step": 2110,
"valid_targets_mean": 4089.0,
"valid_targets_min": 1714
},
{
"epoch": 3.5969387755102042,
"grad_norm": 0.44351920329660205,
"learning_rate": 2.2537627854963994e-05,
"loss": 0.1349,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12201227247714996,
"step": 2115,
"valid_targets_mean": 4485.5,
"valid_targets_min": 1318
},
{
"epoch": 3.6054421768707483,
"grad_norm": 0.5202268781406105,
"learning_rate": 2.2453474565360018e-05,
"loss": 0.1416,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13805070519447327,
"step": 2120,
"valid_targets_mean": 3141.2,
"valid_targets_min": 1354
},
{
"epoch": 3.6139455782312924,
"grad_norm": 0.486925624713484,
"learning_rate": 2.2369277151366776e-05,
"loss": 0.1434,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1417008936405182,
"step": 2125,
"valid_targets_mean": 3789.7,
"valid_targets_min": 1597
},
{
"epoch": 3.622448979591837,
"grad_norm": 0.569357943842269,
"learning_rate": 2.228503712722841e-05,
"loss": 0.1365,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11663225293159485,
"step": 2130,
"valid_targets_mean": 2776.4,
"valid_targets_min": 1020
},
{
"epoch": 3.630952380952381,
"grad_norm": 0.4708138592970684,
"learning_rate": 2.220075600795537e-05,
"loss": 0.1424,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12191980332136154,
"step": 2135,
"valid_targets_mean": 4152.0,
"valid_targets_min": 1693
},
{
"epoch": 3.6394557823129254,
"grad_norm": 0.46387557457924355,
"learning_rate": 2.2116435309297177e-05,
"loss": 0.1487,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13377505540847778,
"step": 2140,
"valid_targets_mean": 4785.8,
"valid_targets_min": 1441
},
{
"epoch": 3.6479591836734695,
"grad_norm": 0.5022621604582599,
"learning_rate": 2.203207654771519e-05,
"loss": 0.1558,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13495998084545135,
"step": 2145,
"valid_targets_mean": 3572.0,
"valid_targets_min": 1210
},
{
"epoch": 3.6564625850340136,
"grad_norm": 0.4991291175902639,
"learning_rate": 2.1947681240355266e-05,
"loss": 0.1641,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16433686017990112,
"step": 2150,
"valid_targets_mean": 4432.6,
"valid_targets_min": 1346
},
{
"epoch": 3.6649659863945576,
"grad_norm": 0.5458475179648687,
"learning_rate": 2.1863250905020566e-05,
"loss": 0.1526,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17905211448669434,
"step": 2155,
"valid_targets_mean": 3504.8,
"valid_targets_min": 626
},
{
"epoch": 3.673469387755102,
"grad_norm": 0.4828154132176292,
"learning_rate": 2.177878706014418e-05,
"loss": 0.1599,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1637372374534607,
"step": 2160,
"valid_targets_mean": 3928.8,
"valid_targets_min": 1146
},
{
"epoch": 3.681972789115646,
"grad_norm": 0.5626269965220437,
"learning_rate": 2.1694291224761845e-05,
"loss": 0.1354,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14788082242012024,
"step": 2165,
"valid_targets_mean": 3986.1,
"valid_targets_min": 1226
},
{
"epoch": 3.6904761904761907,
"grad_norm": 0.5570323579675244,
"learning_rate": 2.160976491848465e-05,
"loss": 0.1348,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13803161680698395,
"step": 2170,
"valid_targets_mean": 3307.8,
"valid_targets_min": 1231
},
{
"epoch": 3.6989795918367347,
"grad_norm": 0.5211299091365144,
"learning_rate": 2.1525209661471677e-05,
"loss": 0.1517,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24160908162593842,
"step": 2175,
"valid_targets_mean": 3941.2,
"valid_targets_min": 429
},
{
"epoch": 3.707482993197279,
"grad_norm": 0.5109203075204358,
"learning_rate": 2.1440626974402664e-05,
"loss": 0.1396,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11953634023666382,
"step": 2180,
"valid_targets_mean": 3233.4,
"valid_targets_min": 1336
},
{
"epoch": 3.715986394557823,
"grad_norm": 0.5740584045340128,
"learning_rate": 2.135601837845068e-05,
"loss": 0.1572,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13772159814834595,
"step": 2185,
"valid_targets_mean": 2741.2,
"valid_targets_min": 1184
},
{
"epoch": 3.7244897959183674,
"grad_norm": 0.43522753496781236,
"learning_rate": 2.1271385395254728e-05,
"loss": 0.1591,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12005556374788284,
"step": 2190,
"valid_targets_mean": 4175.4,
"valid_targets_min": 1728
},
{
"epoch": 3.7329931972789114,
"grad_norm": 0.5339718966786711,
"learning_rate": 2.118672954689242e-05,
"loss": 0.1394,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13433292508125305,
"step": 2195,
"valid_targets_mean": 2676.1,
"valid_targets_min": 1687
},
{
"epoch": 3.741496598639456,
"grad_norm": 0.5827904357101654,
"learning_rate": 2.1102052355852586e-05,
"loss": 0.1303,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11353085935115814,
"step": 2200,
"valid_targets_mean": 3892.6,
"valid_targets_min": 1375
},
{
"epoch": 3.75,
"grad_norm": 0.48888577042540315,
"learning_rate": 2.1017355345007883e-05,
"loss": 0.1533,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1756305694580078,
"step": 2205,
"valid_targets_mean": 4875.0,
"valid_targets_min": 1552
},
{
"epoch": 3.758503401360544,
"grad_norm": 0.49314576717231107,
"learning_rate": 2.093264003758742e-05,
"loss": 0.1385,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13882237672805786,
"step": 2210,
"valid_targets_mean": 3865.2,
"valid_targets_min": 1552
},
{
"epoch": 3.7670068027210886,
"grad_norm": 0.5227981614939449,
"learning_rate": 2.0847907957149348e-05,
"loss": 0.1637,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14849701523780823,
"step": 2215,
"valid_targets_mean": 4121.2,
"valid_targets_min": 1314
},
{
"epoch": 3.7755102040816326,
"grad_norm": 0.5361785337409101,
"learning_rate": 2.0763160627553502e-05,
"loss": 0.1374,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1522911787033081,
"step": 2220,
"valid_targets_mean": 3747.4,
"valid_targets_min": 804
},
{
"epoch": 3.784013605442177,
"grad_norm": 0.5108340377650004,
"learning_rate": 2.067839957293394e-05,
"loss": 0.1413,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1375730335712433,
"step": 2225,
"valid_targets_mean": 3813.8,
"valid_targets_min": 1223
},
{
"epoch": 3.792517006802721,
"grad_norm": 0.4981416024908662,
"learning_rate": 2.059362631767156e-05,
"loss": 0.1406,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11143091320991516,
"step": 2230,
"valid_targets_mean": 3263.8,
"valid_targets_min": 1356
},
{
"epoch": 3.8010204081632653,
"grad_norm": 0.529958261180386,
"learning_rate": 2.0508842386366687e-05,
"loss": 0.1441,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11649850755929947,
"step": 2235,
"valid_targets_mean": 3105.9,
"valid_targets_min": 1133
},
{
"epoch": 3.8095238095238093,
"grad_norm": 0.5691253179106762,
"learning_rate": 2.0424049303811637e-05,
"loss": 0.1484,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1666107028722763,
"step": 2240,
"valid_targets_mean": 3283.1,
"valid_targets_min": 758
},
{
"epoch": 3.818027210884354,
"grad_norm": 0.5412858572899136,
"learning_rate": 2.0339248594963326e-05,
"loss": 0.1371,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16017557680606842,
"step": 2245,
"valid_targets_mean": 3838.8,
"valid_targets_min": 1132
},
{
"epoch": 3.826530612244898,
"grad_norm": 0.5565546049385312,
"learning_rate": 2.025444178491582e-05,
"loss": 0.1464,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15504541993141174,
"step": 2250,
"valid_targets_mean": 3659.4,
"valid_targets_min": 1529
},
{
"epoch": 3.8350340136054424,
"grad_norm": 0.4904628959821808,
"learning_rate": 2.0169630398872897e-05,
"loss": 0.1465,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11968071758747101,
"step": 2255,
"valid_targets_mean": 3128.1,
"valid_targets_min": 1197
},
{
"epoch": 3.8435374149659864,
"grad_norm": 0.49816193763634675,
"learning_rate": 2.0084815962120644e-05,
"loss": 0.1418,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13853618502616882,
"step": 2260,
"valid_targets_mean": 3385.1,
"valid_targets_min": 698
},
{
"epoch": 3.8520408163265305,
"grad_norm": 0.5440701366673651,
"learning_rate": 2e-05,
"loss": 0.1431,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1894933581352234,
"step": 2265,
"valid_targets_mean": 4004.4,
"valid_targets_min": 1517
},
{
"epoch": 3.8605442176870746,
"grad_norm": 0.47898169059031503,
"learning_rate": 1.9915184037879362e-05,
"loss": 0.1474,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1556398719549179,
"step": 2270,
"valid_targets_mean": 3937.4,
"valid_targets_min": 971
},
{
"epoch": 3.869047619047619,
"grad_norm": 0.5521523760232286,
"learning_rate": 1.983036960112711e-05,
"loss": 0.1525,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1512027531862259,
"step": 2275,
"valid_targets_mean": 3351.7,
"valid_targets_min": 604
},
{
"epoch": 3.877551020408163,
"grad_norm": 0.47757110237107087,
"learning_rate": 1.9745558215084184e-05,
"loss": 0.1477,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17591100931167603,
"step": 2280,
"valid_targets_mean": 4062.6,
"valid_targets_min": 1438
},
{
"epoch": 3.8860544217687076,
"grad_norm": 0.583060688800655,
"learning_rate": 1.9660751405036677e-05,
"loss": 0.139,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1539376825094223,
"step": 2285,
"valid_targets_mean": 2743.6,
"valid_targets_min": 935
},
{
"epoch": 3.8945578231292517,
"grad_norm": 0.47798427896305834,
"learning_rate": 1.9575950696188367e-05,
"loss": 0.1515,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14273616671562195,
"step": 2290,
"valid_targets_mean": 3535.2,
"valid_targets_min": 1171
},
{
"epoch": 3.9030612244897958,
"grad_norm": 0.5667491614754994,
"learning_rate": 1.949115761363332e-05,
"loss": 0.1443,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12068904936313629,
"step": 2295,
"valid_targets_mean": 3373.4,
"valid_targets_min": 1811
},
{
"epoch": 3.9115646258503403,
"grad_norm": 0.5217945938589202,
"learning_rate": 1.9406373682328445e-05,
"loss": 0.1364,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1370539665222168,
"step": 2300,
"valid_targets_mean": 3699.2,
"valid_targets_min": 1000
},
{
"epoch": 3.9200680272108843,
"grad_norm": 0.6072733473428619,
"learning_rate": 1.932160042706607e-05,
"loss": 0.1533,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1537347286939621,
"step": 2305,
"valid_targets_mean": 3188.1,
"valid_targets_min": 507
},
{
"epoch": 3.928571428571429,
"grad_norm": 0.5533462927972612,
"learning_rate": 1.9236839372446504e-05,
"loss": 0.1441,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1640930473804474,
"step": 2310,
"valid_targets_mean": 3405.7,
"valid_targets_min": 1530
},
{
"epoch": 3.937074829931973,
"grad_norm": 0.5003163870992912,
"learning_rate": 1.9152092042850655e-05,
"loss": 0.1545,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13920584321022034,
"step": 2315,
"valid_targets_mean": 3497.1,
"valid_targets_min": 1151
},
{
"epoch": 3.945578231292517,
"grad_norm": 0.5477685325651052,
"learning_rate": 1.9067359962412588e-05,
"loss": 0.1422,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13287462294101715,
"step": 2320,
"valid_targets_mean": 2748.6,
"valid_targets_min": 1295
},
{
"epoch": 3.954081632653061,
"grad_norm": 0.5211036734731059,
"learning_rate": 1.8982644654992123e-05,
"loss": 0.1537,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15169015526771545,
"step": 2325,
"valid_targets_mean": 3769.6,
"valid_targets_min": 1234
},
{
"epoch": 3.9625850340136055,
"grad_norm": 0.4559337481019662,
"learning_rate": 1.8897947644147424e-05,
"loss": 0.1635,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18945789337158203,
"step": 2330,
"valid_targets_mean": 4717.9,
"valid_targets_min": 1539
},
{
"epoch": 3.9710884353741496,
"grad_norm": 0.5090040830343693,
"learning_rate": 1.8813270453107586e-05,
"loss": 0.1374,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15533599257469177,
"step": 2335,
"valid_targets_mean": 3687.2,
"valid_targets_min": 785
},
{
"epoch": 3.979591836734694,
"grad_norm": 0.49839328546501366,
"learning_rate": 1.872861460474528e-05,
"loss": 0.1535,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15626703202724457,
"step": 2340,
"valid_targets_mean": 3522.6,
"valid_targets_min": 755
},
{
"epoch": 3.988095238095238,
"grad_norm": 0.4804577717706921,
"learning_rate": 1.8643981621549325e-05,
"loss": 0.1489,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.126425102353096,
"step": 2345,
"valid_targets_mean": 3759.1,
"valid_targets_min": 1911
},
{
"epoch": 3.996598639455782,
"grad_norm": 0.482933524469188,
"learning_rate": 1.855937302559734e-05,
"loss": 0.1446,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16276368498802185,
"step": 2350,
"valid_targets_mean": 4038.2,
"valid_targets_min": 1268
},
{
"epoch": 4.005102040816326,
"grad_norm": 0.5023685365515297,
"learning_rate": 1.8474790338528336e-05,
"loss": 0.1119,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10188114643096924,
"step": 2355,
"valid_targets_mean": 2653.2,
"valid_targets_min": 1375
},
{
"epoch": 4.01360544217687,
"grad_norm": 0.41928203389131025,
"learning_rate": 1.839023508151536e-05,
"loss": 0.1308,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13987550139427185,
"step": 2360,
"valid_targets_mean": 5312.6,
"valid_targets_min": 1076
},
{
"epoch": 4.022108843537415,
"grad_norm": 0.5398436343258409,
"learning_rate": 1.8305708775238162e-05,
"loss": 0.141,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11938532441854477,
"step": 2365,
"valid_targets_mean": 3537.8,
"valid_targets_min": 1352
},
{
"epoch": 4.030612244897959,
"grad_norm": 0.5239289576849778,
"learning_rate": 1.822121293985583e-05,
"loss": 0.1317,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14157015085220337,
"step": 2370,
"valid_targets_mean": 4077.9,
"valid_targets_min": 1325
},
{
"epoch": 4.039115646258503,
"grad_norm": 0.5245260864178052,
"learning_rate": 1.813674909497944e-05,
"loss": 0.1207,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13017112016677856,
"step": 2375,
"valid_targets_mean": 3429.1,
"valid_targets_min": 1505
},
{
"epoch": 4.0476190476190474,
"grad_norm": 0.5522673431765818,
"learning_rate": 1.8052318759644744e-05,
"loss": 0.1263,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11945690214633942,
"step": 2380,
"valid_targets_mean": 3247.0,
"valid_targets_min": 912
},
{
"epoch": 4.0561224489795915,
"grad_norm": 0.5293497397934687,
"learning_rate": 1.7967923452284824e-05,
"loss": 0.125,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16374406218528748,
"step": 2385,
"valid_targets_mean": 4229.2,
"valid_targets_min": 872
},
{
"epoch": 4.0646258503401365,
"grad_norm": 0.5350434092704202,
"learning_rate": 1.7883564690702826e-05,
"loss": 0.1343,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14136750996112823,
"step": 2390,
"valid_targets_mean": 3507.5,
"valid_targets_min": 1377
},
{
"epoch": 4.0731292517006805,
"grad_norm": 0.4941976972197606,
"learning_rate": 1.7799243992044634e-05,
"loss": 0.1202,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12425091117620468,
"step": 2395,
"valid_targets_mean": 3654.2,
"valid_targets_min": 859
},
{
"epoch": 4.081632653061225,
"grad_norm": 0.5763725763447235,
"learning_rate": 1.7714962872771593e-05,
"loss": 0.1312,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12952286005020142,
"step": 2400,
"valid_targets_mean": 3387.6,
"valid_targets_min": 1323
},
{
"epoch": 4.090136054421769,
"grad_norm": 0.5277461938742322,
"learning_rate": 1.7630722848633234e-05,
"loss": 0.1193,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11460752785205841,
"step": 2405,
"valid_targets_mean": 3624.1,
"valid_targets_min": 918
},
{
"epoch": 4.098639455782313,
"grad_norm": 0.5275777309962448,
"learning_rate": 1.7546525434639992e-05,
"loss": 0.1503,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16966021060943604,
"step": 2410,
"valid_targets_mean": 3532.3,
"valid_targets_min": 1299
},
{
"epoch": 4.107142857142857,
"grad_norm": 0.5639072274949859,
"learning_rate": 1.7462372145036012e-05,
"loss": 0.1212,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14622849225997925,
"step": 2415,
"valid_targets_mean": 3383.2,
"valid_targets_min": 1356
},
{
"epoch": 4.115646258503402,
"grad_norm": 0.485846628966218,
"learning_rate": 1.737826449327188e-05,
"loss": 0.1224,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11411428451538086,
"step": 2420,
"valid_targets_mean": 4078.5,
"valid_targets_min": 1640
},
{
"epoch": 4.124149659863946,
"grad_norm": 0.758272632014816,
"learning_rate": 1.729420399197741e-05,
"loss": 0.1399,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.146653950214386,
"step": 2425,
"valid_targets_mean": 3492.2,
"valid_targets_min": 1527
},
{
"epoch": 4.13265306122449,
"grad_norm": 0.5290919750861747,
"learning_rate": 1.7210192152934423e-05,
"loss": 0.1416,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16026335954666138,
"step": 2430,
"valid_targets_mean": 3589.4,
"valid_targets_min": 1354
},
{
"epoch": 4.141156462585034,
"grad_norm": 0.5149616465912613,
"learning_rate": 1.712623048704961e-05,
"loss": 0.1297,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10995449870824814,
"step": 2435,
"valid_targets_mean": 3371.2,
"valid_targets_min": 1020
},
{
"epoch": 4.149659863945578,
"grad_norm": 0.5180400201990574,
"learning_rate": 1.7042320504327285e-05,
"loss": 0.1357,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12292209267616272,
"step": 2440,
"valid_targets_mean": 3585.6,
"valid_targets_min": 1436
},
{
"epoch": 4.158163265306122,
"grad_norm": 0.4402765691327618,
"learning_rate": 1.6958463713842298e-05,
"loss": 0.1307,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10848579555749893,
"step": 2445,
"valid_targets_mean": 4908.5,
"valid_targets_min": 1362
},
{
"epoch": 4.166666666666667,
"grad_norm": 0.583578753213086,
"learning_rate": 1.687466162371286e-05,
"loss": 0.1295,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14145049452781677,
"step": 2450,
"valid_targets_mean": 3251.1,
"valid_targets_min": 1552
},
{
"epoch": 4.175170068027211,
"grad_norm": 0.5123852752027489,
"learning_rate": 1.6790915741073418e-05,
"loss": 0.1386,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18500098586082458,
"step": 2455,
"valid_targets_mean": 4195.8,
"valid_targets_min": 1449
},
{
"epoch": 4.183673469387755,
"grad_norm": 0.5311552913814159,
"learning_rate": 1.670722757204758e-05,
"loss": 0.1264,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1071048229932785,
"step": 2460,
"valid_targets_mean": 3237.9,
"valid_targets_min": 1101
},
{
"epoch": 4.192176870748299,
"grad_norm": 0.4537481193241964,
"learning_rate": 1.6623598621720966e-05,
"loss": 0.1157,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09841416776180267,
"step": 2465,
"valid_targets_mean": 4214.3,
"valid_targets_min": 468
},
{
"epoch": 4.200680272108843,
"grad_norm": 0.600717141479778,
"learning_rate": 1.6540030394114218e-05,
"loss": 0.1206,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13270169496536255,
"step": 2470,
"valid_targets_mean": 2691.5,
"valid_targets_min": 1092
},
{
"epoch": 4.209183673469388,
"grad_norm": 0.4976204585645935,
"learning_rate": 1.64565243921559e-05,
"loss": 0.1265,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11785245686769485,
"step": 2475,
"valid_targets_mean": 4144.9,
"valid_targets_min": 1762
},
{
"epoch": 4.217687074829932,
"grad_norm": 0.5526481174319252,
"learning_rate": 1.6373082117655473e-05,
"loss": 0.1156,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11944583803415298,
"step": 2480,
"valid_targets_mean": 3328.4,
"valid_targets_min": 1197
},
{
"epoch": 4.226190476190476,
"grad_norm": 0.5185084228705585,
"learning_rate": 1.6289705071276323e-05,
"loss": 0.1315,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1478651762008667,
"step": 2485,
"valid_targets_mean": 4074.9,
"valid_targets_min": 1695
},
{
"epoch": 4.23469387755102,
"grad_norm": 0.5064058629657685,
"learning_rate": 1.62063947525087e-05,
"loss": 0.1428,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1256791353225708,
"step": 2490,
"valid_targets_mean": 3633.2,
"valid_targets_min": 1678
},
{
"epoch": 4.243197278911564,
"grad_norm": 0.5390030705626246,
"learning_rate": 1.612315265964284e-05,
"loss": 0.1261,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15357208251953125,
"step": 2495,
"valid_targets_mean": 3176.2,
"valid_targets_min": 1591
},
{
"epoch": 4.2517006802721085,
"grad_norm": 0.5406514616868823,
"learning_rate": 1.6039980289741935e-05,
"loss": 0.1387,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1449306309223175,
"step": 2500,
"valid_targets_mean": 3431.1,
"valid_targets_min": 1080
},
{
"epoch": 4.260204081632653,
"grad_norm": 0.6085265403782985,
"learning_rate": 1.595687913861528e-05,
"loss": 0.1217,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12832342088222504,
"step": 2505,
"valid_targets_mean": 2708.1,
"valid_targets_min": 883
},
{
"epoch": 4.2687074829931975,
"grad_norm": 0.9958125295487239,
"learning_rate": 1.587385070079133e-05,
"loss": 0.1496,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2037830352783203,
"step": 2510,
"valid_targets_mean": 4122.8,
"valid_targets_min": 940
},
{
"epoch": 4.2772108843537415,
"grad_norm": 0.4706952960241422,
"learning_rate": 1.5790896469490807e-05,
"loss": 0.1321,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12226849794387817,
"step": 2515,
"valid_targets_mean": 4755.2,
"valid_targets_min": 1755
},
{
"epoch": 4.285714285714286,
"grad_norm": 0.5054113047148475,
"learning_rate": 1.5708017936599908e-05,
"loss": 0.1353,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16386127471923828,
"step": 2520,
"valid_targets_mean": 4257.3,
"valid_targets_min": 1214
},
{
"epoch": 4.29421768707483,
"grad_norm": 0.6038493253323483,
"learning_rate": 1.56252165926434e-05,
"loss": 0.1249,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13769403100013733,
"step": 2525,
"valid_targets_mean": 3143.4,
"valid_targets_min": 1196
},
{
"epoch": 4.302721088435375,
"grad_norm": 0.4879214707147923,
"learning_rate": 1.554249392675788e-05,
"loss": 0.123,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14046776294708252,
"step": 2530,
"valid_targets_mean": 4527.4,
"valid_targets_min": 1950
},
{
"epoch": 4.311224489795919,
"grad_norm": 0.4465612512180996,
"learning_rate": 1.5459851426664956e-05,
"loss": 0.1318,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12744249403476715,
"step": 2535,
"valid_targets_mean": 5046.9,
"valid_targets_min": 1164
},
{
"epoch": 4.319727891156463,
"grad_norm": 0.4637284744313693,
"learning_rate": 1.5377290578644468e-05,
"loss": 0.1191,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10689014941453934,
"step": 2540,
"valid_targets_mean": 4280.3,
"valid_targets_min": 1835
},
{
"epoch": 4.328231292517007,
"grad_norm": 0.554279265133868,
"learning_rate": 1.5294812867507835e-05,
"loss": 0.1287,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1094164252281189,
"step": 2545,
"valid_targets_mean": 2614.7,
"valid_targets_min": 1672
},
{
"epoch": 4.336734693877551,
"grad_norm": 0.5440722163559888,
"learning_rate": 1.5212419776571267e-05,
"loss": 0.1393,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14824722707271576,
"step": 2550,
"valid_targets_mean": 3486.7,
"valid_targets_min": 604
},
{
"epoch": 4.345238095238095,
"grad_norm": 0.45930986665841933,
"learning_rate": 1.5130112787629152e-05,
"loss": 0.1229,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12556178867816925,
"step": 2555,
"valid_targets_mean": 4062.1,
"valid_targets_min": 1406
},
{
"epoch": 4.35374149659864,
"grad_norm": 0.5347300720312089,
"learning_rate": 1.5047893380927377e-05,
"loss": 0.1196,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11758849024772644,
"step": 2560,
"valid_targets_mean": 3016.2,
"valid_targets_min": 1447
},
{
"epoch": 4.362244897959184,
"grad_norm": 0.5810110341683714,
"learning_rate": 1.4965763035136687e-05,
"loss": 0.1259,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13106051087379456,
"step": 2565,
"valid_targets_mean": 2945.5,
"valid_targets_min": 877
},
{
"epoch": 4.370748299319728,
"grad_norm": 0.511549856319123,
"learning_rate": 1.4883723227326144e-05,
"loss": 0.1388,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12233540415763855,
"step": 2570,
"valid_targets_mean": 4416.4,
"valid_targets_min": 861
},
{
"epoch": 4.379251700680272,
"grad_norm": 0.6141891043153991,
"learning_rate": 1.4801775432936516e-05,
"loss": 0.1254,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11202485859394073,
"step": 2575,
"valid_targets_mean": 2762.6,
"valid_targets_min": 1015
},
{
"epoch": 4.387755102040816,
"grad_norm": 0.4476473551026391,
"learning_rate": 1.4719921125753773e-05,
"loss": 0.1213,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13985709846019745,
"step": 2580,
"valid_targets_mean": 5447.8,
"valid_targets_min": 982
},
{
"epoch": 4.39625850340136,
"grad_norm": 0.562406722078899,
"learning_rate": 1.4638161777882573e-05,
"loss": 0.1275,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11451070010662079,
"step": 2585,
"valid_targets_mean": 3943.8,
"valid_targets_min": 1210
},
{
"epoch": 4.404761904761905,
"grad_norm": 0.5416533168212995,
"learning_rate": 1.4556498859719756e-05,
"loss": 0.1245,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11477416008710861,
"step": 2590,
"valid_targets_mean": 3347.1,
"valid_targets_min": 1476
},
{
"epoch": 4.413265306122449,
"grad_norm": 0.5165893385108531,
"learning_rate": 1.4474933839927956e-05,
"loss": 0.1301,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16060087084770203,
"step": 2595,
"valid_targets_mean": 4232.8,
"valid_targets_min": 1464
},
{
"epoch": 4.421768707482993,
"grad_norm": 0.594151452327815,
"learning_rate": 1.4393468185409139e-05,
"loss": 0.1345,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1185787171125412,
"step": 2600,
"valid_targets_mean": 2734.9,
"valid_targets_min": 1044
},
{
"epoch": 4.430272108843537,
"grad_norm": 0.47620977994252855,
"learning_rate": 1.4312103361278254e-05,
"loss": 0.1266,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13598421216011047,
"step": 2605,
"valid_targets_mean": 4362.1,
"valid_targets_min": 1623
},
{
"epoch": 4.438775510204081,
"grad_norm": 0.5778604626245851,
"learning_rate": 1.4230840830836875e-05,
"loss": 0.1215,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0991811454296112,
"step": 2610,
"valid_targets_mean": 3185.3,
"valid_targets_min": 1047
},
{
"epoch": 4.447278911564625,
"grad_norm": 0.5095063044346275,
"learning_rate": 1.4149682055546854e-05,
"loss": 0.133,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16175615787506104,
"step": 2615,
"valid_targets_mean": 4249.7,
"valid_targets_min": 1393
},
{
"epoch": 4.45578231292517,
"grad_norm": 0.5230093792172238,
"learning_rate": 1.4068628495004095e-05,
"loss": 0.1311,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10372944176197052,
"step": 2620,
"valid_targets_mean": 3279.2,
"valid_targets_min": 429
},
{
"epoch": 4.464285714285714,
"grad_norm": 0.4978389319017629,
"learning_rate": 1.3987681606912254e-05,
"loss": 0.1257,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13917067646980286,
"step": 2625,
"valid_targets_mean": 4139.9,
"valid_targets_min": 1693
},
{
"epoch": 4.4727891156462585,
"grad_norm": 0.48805163978121935,
"learning_rate": 1.3906842847056546e-05,
"loss": 0.1454,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1258377879858017,
"step": 2630,
"valid_targets_mean": 4221.4,
"valid_targets_min": 1151
},
{
"epoch": 4.4812925170068025,
"grad_norm": 0.5309720392418742,
"learning_rate": 1.382611366927757e-05,
"loss": 0.1343,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12541979551315308,
"step": 2635,
"valid_targets_mean": 3300.1,
"valid_targets_min": 1103
},
{
"epoch": 4.489795918367347,
"grad_norm": 0.4925804697564766,
"learning_rate": 1.3745495525445126e-05,
"loss": 0.1309,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12611186504364014,
"step": 2640,
"valid_targets_mean": 3906.4,
"valid_targets_min": 864
},
{
"epoch": 4.4982993197278915,
"grad_norm": 0.5454905313244999,
"learning_rate": 1.3664989865432157e-05,
"loss": 0.1334,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10953294485807419,
"step": 2645,
"valid_targets_mean": 3340.1,
"valid_targets_min": 1733
},
{
"epoch": 4.506802721088436,
"grad_norm": 0.5252733550532073,
"learning_rate": 1.3584598137088625e-05,
"loss": 0.141,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15157128870487213,
"step": 2650,
"valid_targets_mean": 3560.9,
"valid_targets_min": 1273
},
{
"epoch": 4.51530612244898,
"grad_norm": 0.5198558545652678,
"learning_rate": 1.3504321786215514e-05,
"loss": 0.1192,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11329950392246246,
"step": 2655,
"valid_targets_mean": 3093.6,
"valid_targets_min": 881
},
{
"epoch": 4.523809523809524,
"grad_norm": 0.6002119548110341,
"learning_rate": 1.3424162256538797e-05,
"loss": 0.1421,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1460447907447815,
"step": 2660,
"valid_targets_mean": 2855.2,
"valid_targets_min": 1115
},
{
"epoch": 4.532312925170068,
"grad_norm": 0.4690919568996324,
"learning_rate": 1.3344120989683473e-05,
"loss": 0.1314,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11531253159046173,
"step": 2665,
"valid_targets_mean": 4137.5,
"valid_targets_min": 1170
},
{
"epoch": 4.540816326530612,
"grad_norm": 0.48345732018469006,
"learning_rate": 1.3264199425147667e-05,
"loss": 0.1361,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12812292575836182,
"step": 2670,
"valid_targets_mean": 4035.9,
"valid_targets_min": 1360
},
{
"epoch": 4.549319727891157,
"grad_norm": 0.6281667762967951,
"learning_rate": 1.3184399000276708e-05,
"loss": 0.16,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13768933713436127,
"step": 2675,
"valid_targets_mean": 2721.2,
"valid_targets_min": 759
},
{
"epoch": 4.557823129251701,
"grad_norm": 0.6020408443336502,
"learning_rate": 1.3104721150237305e-05,
"loss": 0.1162,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13107319176197052,
"step": 2680,
"valid_targets_mean": 3015.6,
"valid_targets_min": 1276
},
{
"epoch": 4.566326530612245,
"grad_norm": 0.5222297457955155,
"learning_rate": 1.3025167307991734e-05,
"loss": 0.1209,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11526221036911011,
"step": 2685,
"valid_targets_mean": 3457.8,
"valid_targets_min": 1537
},
{
"epoch": 4.574829931972789,
"grad_norm": 0.5399196254993844,
"learning_rate": 1.294573890427203e-05,
"loss": 0.1438,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16417351365089417,
"step": 2690,
"valid_targets_mean": 4152.0,
"valid_targets_min": 1388
},
{
"epoch": 4.583333333333333,
"grad_norm": 0.5453980131163246,
"learning_rate": 1.2866437367554313e-05,
"loss": 0.134,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13150575757026672,
"step": 2695,
"valid_targets_mean": 3255.8,
"valid_targets_min": 1080
},
{
"epoch": 4.591836734693878,
"grad_norm": 0.564868544100156,
"learning_rate": 1.278726412403306e-05,
"loss": 0.1198,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11302247643470764,
"step": 2700,
"valid_targets_mean": 2766.1,
"valid_targets_min": 288
},
{
"epoch": 4.600340136054422,
"grad_norm": 0.5570067708592675,
"learning_rate": 1.2708220597595462e-05,
"loss": 0.1357,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16181376576423645,
"step": 2705,
"valid_targets_mean": 3591.7,
"valid_targets_min": 1429
},
{
"epoch": 4.608843537414966,
"grad_norm": 0.4924894979414545,
"learning_rate": 1.2629308209795834e-05,
"loss": 0.1328,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13477236032485962,
"step": 2710,
"valid_targets_mean": 3979.9,
"valid_targets_min": 1277
},
{
"epoch": 4.61734693877551,
"grad_norm": 0.5395011939137863,
"learning_rate": 1.2550528379830019e-05,
"loss": 0.1406,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12093565613031387,
"step": 2715,
"valid_targets_mean": 3259.6,
"valid_targets_min": 869
},
{
"epoch": 4.625850340136054,
"grad_norm": 0.48613266875635563,
"learning_rate": 1.2471882524509873e-05,
"loss": 0.1412,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11778571456670761,
"step": 2720,
"valid_targets_mean": 4093.9,
"valid_targets_min": 1843
},
{
"epoch": 4.634353741496598,
"grad_norm": 0.5920343619245662,
"learning_rate": 1.2393372058237819e-05,
"loss": 0.1252,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12733955681324005,
"step": 2725,
"valid_targets_mean": 3063.2,
"valid_targets_min": 1169
},
{
"epoch": 4.642857142857143,
"grad_norm": 0.5038080159084226,
"learning_rate": 1.2314998392981364e-05,
"loss": 0.1313,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13160504400730133,
"step": 2730,
"valid_targets_mean": 4067.9,
"valid_targets_min": 1577
},
{
"epoch": 4.651360544217687,
"grad_norm": 0.5229519935844232,
"learning_rate": 1.2236762938247729e-05,
"loss": 0.1342,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1371050775051117,
"step": 2735,
"valid_targets_mean": 3716.6,
"valid_targets_min": 1169
},
{
"epoch": 4.659863945578231,
"grad_norm": 0.521745882443459,
"learning_rate": 1.2158667101058497e-05,
"loss": 0.134,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13528242707252502,
"step": 2740,
"valid_targets_mean": 3872.4,
"valid_targets_min": 1477
},
{
"epoch": 4.668367346938775,
"grad_norm": 0.4885511062328345,
"learning_rate": 1.208071228592429e-05,
"loss": 0.13,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15420043468475342,
"step": 2745,
"valid_targets_mean": 4217.5,
"valid_targets_min": 1480
},
{
"epoch": 4.6768707482993195,
"grad_norm": 0.4178757321541779,
"learning_rate": 1.2002899894819548e-05,
"loss": 0.125,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1247992143034935,
"step": 2750,
"valid_targets_mean": 4595.2,
"valid_targets_min": 1157
},
{
"epoch": 4.685374149659864,
"grad_norm": 0.6108750918194292,
"learning_rate": 1.1925231327157288e-05,
"loss": 0.1318,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12069522589445114,
"step": 2755,
"valid_targets_mean": 2943.6,
"valid_targets_min": 1366
},
{
"epoch": 4.6938775510204085,
"grad_norm": 0.5299847403293142,
"learning_rate": 1.1847707979763934e-05,
"loss": 0.1411,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20735841989517212,
"step": 2760,
"valid_targets_mean": 4586.6,
"valid_targets_min": 280
},
{
"epoch": 4.7023809523809526,
"grad_norm": 0.5262690909390965,
"learning_rate": 1.1770331246854211e-05,
"loss": 0.1252,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12230242788791656,
"step": 2765,
"valid_targets_mean": 3189.1,
"valid_targets_min": 1330
},
{
"epoch": 4.710884353741497,
"grad_norm": 0.44464404640066674,
"learning_rate": 1.169310252000605e-05,
"loss": 0.1222,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11267457902431488,
"step": 2770,
"valid_targets_mean": 4162.7,
"valid_targets_min": 1809
},
{
"epoch": 4.719387755102041,
"grad_norm": 0.5455599156674992,
"learning_rate": 1.1616023188135594e-05,
"loss": 0.1259,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10474415868520737,
"step": 2775,
"valid_targets_mean": 2892.6,
"valid_targets_min": 626
},
{
"epoch": 4.727891156462585,
"grad_norm": 0.5015898266496815,
"learning_rate": 1.1539094637472181e-05,
"loss": 0.1364,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17794445157051086,
"step": 2780,
"valid_targets_mean": 4521.5,
"valid_targets_min": 1553
},
{
"epoch": 4.736394557823129,
"grad_norm": 0.5508250011415522,
"learning_rate": 1.1462318251533442e-05,
"loss": 0.1375,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11678224056959152,
"step": 2785,
"valid_targets_mean": 3110.7,
"valid_targets_min": 1429
},
{
"epoch": 4.744897959183674,
"grad_norm": 0.622408173575908,
"learning_rate": 1.1385695411100424e-05,
"loss": 0.1179,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11828910559415817,
"step": 2790,
"valid_targets_mean": 3258.1,
"valid_targets_min": 1122
},
{
"epoch": 4.753401360544218,
"grad_norm": 0.5322995958406667,
"learning_rate": 1.1309227494192703e-05,
"loss": 0.1189,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13555939495563507,
"step": 2795,
"valid_targets_mean": 3526.5,
"valid_targets_min": 1328
},
{
"epoch": 4.761904761904762,
"grad_norm": 0.5756957552451561,
"learning_rate": 1.1232915876043673e-05,
"loss": 0.1433,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14180392026901245,
"step": 2800,
"valid_targets_mean": 3444.5,
"valid_targets_min": 1732
},
{
"epoch": 4.770408163265306,
"grad_norm": 0.503634481514556,
"learning_rate": 1.1156761929075777e-05,
"loss": 0.1469,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13477468490600586,
"step": 2805,
"valid_targets_mean": 3889.4,
"valid_targets_min": 345
},
{
"epoch": 4.77891156462585,
"grad_norm": 0.5122500311184057,
"learning_rate": 1.1080767022875816e-05,
"loss": 0.1257,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10373985022306442,
"step": 2810,
"valid_targets_mean": 3319.8,
"valid_targets_min": 534
},
{
"epoch": 4.787414965986395,
"grad_norm": 0.4711642587141199,
"learning_rate": 1.100493252417035e-05,
"loss": 0.1308,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11209157109260559,
"step": 2815,
"valid_targets_mean": 3830.2,
"valid_targets_min": 1861
},
{
"epoch": 4.795918367346939,
"grad_norm": 0.5123035748411254,
"learning_rate": 1.0929259796801075e-05,
"loss": 0.1401,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18172311782836914,
"step": 2820,
"valid_targets_mean": 4577.3,
"valid_targets_min": 1025
},
{
"epoch": 4.804421768707483,
"grad_norm": 0.5808435182317419,
"learning_rate": 1.085375020170034e-05,
"loss": 0.1308,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12455550581216812,
"step": 2825,
"valid_targets_mean": 3490.9,
"valid_targets_min": 1254
},
{
"epoch": 4.812925170068027,
"grad_norm": 0.5320315082614337,
"learning_rate": 1.0778405096866624e-05,
"loss": 0.1198,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13116773962974548,
"step": 2830,
"valid_targets_mean": 3979.3,
"valid_targets_min": 1469
},
{
"epoch": 4.821428571428571,
"grad_norm": 0.5385934682017872,
"learning_rate": 1.0703225837340166e-05,
"loss": 0.1299,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12079325318336487,
"step": 2835,
"valid_targets_mean": 3281.2,
"valid_targets_min": 795
},
{
"epoch": 4.829931972789115,
"grad_norm": 0.6106526535513195,
"learning_rate": 1.0628213775178561e-05,
"loss": 0.1218,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12414602935314178,
"step": 2840,
"valid_targets_mean": 2841.2,
"valid_targets_min": 602
},
{
"epoch": 4.83843537414966,
"grad_norm": 0.5093217844857241,
"learning_rate": 1.055337025943244e-05,
"loss": 0.1408,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.140962153673172,
"step": 2845,
"valid_targets_mean": 4046.6,
"valid_targets_min": 1090
},
{
"epoch": 4.846938775510204,
"grad_norm": 0.5601063982178885,
"learning_rate": 1.0478696636121231e-05,
"loss": 0.1236,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13058549165725708,
"step": 2850,
"valid_targets_mean": 2946.1,
"valid_targets_min": 787
},
{
"epoch": 4.855442176870748,
"grad_norm": 0.5490008558122706,
"learning_rate": 1.0404194248208934e-05,
"loss": 0.1326,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12004873156547546,
"step": 2855,
"valid_targets_mean": 3107.6,
"valid_targets_min": 1576
},
{
"epoch": 4.863945578231292,
"grad_norm": 0.5390824170618834,
"learning_rate": 1.0329864435579982e-05,
"loss": 0.1354,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1494147628545761,
"step": 2860,
"valid_targets_mean": 3607.8,
"valid_targets_min": 883
},
{
"epoch": 4.872448979591836,
"grad_norm": 0.507051514951129,
"learning_rate": 1.0255708535015137e-05,
"loss": 0.1287,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14024758338928223,
"step": 2865,
"valid_targets_mean": 3543.3,
"valid_targets_min": 1415
},
{
"epoch": 4.880952380952381,
"grad_norm": 0.4535295124880974,
"learning_rate": 1.0181727880167428e-05,
"loss": 0.1256,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11601919680833817,
"step": 2870,
"valid_targets_mean": 4292.6,
"valid_targets_min": 1658
},
{
"epoch": 4.889455782312925,
"grad_norm": 0.6284871405176786,
"learning_rate": 1.0107923801538215e-05,
"loss": 0.1276,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1566929817199707,
"step": 2875,
"valid_targets_mean": 3509.4,
"valid_targets_min": 1154
},
{
"epoch": 4.8979591836734695,
"grad_norm": 0.8017226677266484,
"learning_rate": 1.003429762645321e-05,
"loss": 0.1304,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12294437736272812,
"step": 2880,
"valid_targets_mean": 3937.1,
"valid_targets_min": 704
},
{
"epoch": 4.906462585034014,
"grad_norm": 0.49364696050021467,
"learning_rate": 9.960850679038632e-06,
"loss": 0.1307,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12457674741744995,
"step": 2885,
"valid_targets_mean": 3758.8,
"valid_targets_min": 1532
},
{
"epoch": 4.914965986394558,
"grad_norm": 0.4548630723446227,
"learning_rate": 9.887584280197411e-06,
"loss": 0.1363,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.159095898270607,
"step": 2890,
"valid_targets_mean": 4785.4,
"valid_targets_min": 1638
},
{
"epoch": 4.923469387755102,
"grad_norm": 0.5740124878344341,
"learning_rate": 9.814499747585373e-06,
"loss": 0.113,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13639631867408752,
"step": 2895,
"valid_targets_mean": 3424.3,
"valid_targets_min": 1593
},
{
"epoch": 4.931972789115647,
"grad_norm": 0.5928533009251364,
"learning_rate": 9.741598395587606e-06,
"loss": 0.1315,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1397685408592224,
"step": 2900,
"valid_targets_mean": 3337.0,
"valid_targets_min": 1140
},
{
"epoch": 4.940476190476191,
"grad_norm": 0.4832053251048456,
"learning_rate": 9.668881535294792e-06,
"loss": 0.1255,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11467613279819489,
"step": 2905,
"valid_targets_mean": 3527.8,
"valid_targets_min": 1355
},
{
"epoch": 4.948979591836735,
"grad_norm": 0.5194202009100961,
"learning_rate": 9.596350474479625e-06,
"loss": 0.1296,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17165853083133698,
"step": 2910,
"valid_targets_mean": 4053.4,
"valid_targets_min": 1254
},
{
"epoch": 4.957482993197279,
"grad_norm": 0.4710233237676264,
"learning_rate": 9.52400651757331e-06,
"loss": 0.1268,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13677963614463806,
"step": 2915,
"valid_targets_mean": 4633.2,
"valid_targets_min": 1389
},
{
"epoch": 4.965986394557823,
"grad_norm": 0.6026856180553531,
"learning_rate": 9.451850965642073e-06,
"loss": 0.1251,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16165249049663544,
"step": 2920,
"valid_targets_mean": 3169.5,
"valid_targets_min": 1016
},
{
"epoch": 4.974489795918368,
"grad_norm": 0.5579194459953276,
"learning_rate": 9.379885116363786e-06,
"loss": 0.1331,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13458088040351868,
"step": 2925,
"valid_targets_mean": 3184.6,
"valid_targets_min": 1217
},
{
"epoch": 4.982993197278912,
"grad_norm": 0.6099184803160398,
"learning_rate": 9.308110264004625e-06,
"loss": 0.1287,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13990472257137299,
"step": 2930,
"valid_targets_mean": 2672.0,
"valid_targets_min": 648
},
{
"epoch": 4.991496598639456,
"grad_norm": 0.5643685144945373,
"learning_rate": 9.236527699395803e-06,
"loss": 0.1286,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14728853106498718,
"step": 2935,
"valid_targets_mean": 3404.2,
"valid_targets_min": 1531
},
{
"epoch": 5.0,
"grad_norm": 0.49184592411521516,
"learning_rate": 9.165138709910338e-06,
"loss": 0.1223,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12404905259609222,
"step": 2940,
"valid_targets_mean": 3728.0,
"valid_targets_min": 1129
},
{
"epoch": 5.008503401360544,
"grad_norm": 0.460373687869048,
"learning_rate": 9.093944579439882e-06,
"loss": 0.1115,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11780281364917755,
"step": 2945,
"valid_targets_mean": 4433.4,
"valid_targets_min": 1551
},
{
"epoch": 5.017006802721088,
"grad_norm": 0.5141394604653041,
"learning_rate": 9.022946588371688e-06,
"loss": 0.1143,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11578322947025299,
"step": 2950,
"valid_targets_mean": 3810.8,
"valid_targets_min": 792
},
{
"epoch": 5.025510204081633,
"grad_norm": 0.6119126642644851,
"learning_rate": 8.952146013565532e-06,
"loss": 0.1291,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11888520419597626,
"step": 2955,
"valid_targets_mean": 3330.3,
"valid_targets_min": 1196
},
{
"epoch": 5.034013605442177,
"grad_norm": 0.5334163364241725,
"learning_rate": 8.881544128330777e-06,
"loss": 0.124,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10936582833528519,
"step": 2960,
"valid_targets_mean": 3843.6,
"valid_targets_min": 1332
},
{
"epoch": 5.042517006802721,
"grad_norm": 0.5207414438668616,
"learning_rate": 8.81114220240346e-06,
"loss": 0.1163,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09396034479141235,
"step": 2965,
"valid_targets_mean": 3615.5,
"valid_targets_min": 1598
},
{
"epoch": 5.051020408163265,
"grad_norm": 0.5325192027606288,
"learning_rate": 8.740941501923454e-06,
"loss": 0.1104,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11093772947788239,
"step": 2970,
"valid_targets_mean": 3633.8,
"valid_targets_min": 1334
},
{
"epoch": 5.059523809523809,
"grad_norm": 0.5227116634294291,
"learning_rate": 8.6709432894117e-06,
"loss": 0.1076,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11531760543584824,
"step": 2975,
"valid_targets_mean": 4427.8,
"valid_targets_min": 1586
},
{
"epoch": 5.068027210884353,
"grad_norm": 0.54169564088552,
"learning_rate": 8.601148823747516e-06,
"loss": 0.1112,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10472555458545685,
"step": 2980,
"valid_targets_mean": 3638.6,
"valid_targets_min": 1494
},
{
"epoch": 5.076530612244898,
"grad_norm": 0.614347963039127,
"learning_rate": 8.531559360145942e-06,
"loss": 0.1139,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11521926522254944,
"step": 2985,
"valid_targets_mean": 3453.6,
"valid_targets_min": 1551
},
{
"epoch": 5.085034013605442,
"grad_norm": 0.5700921400342378,
"learning_rate": 8.462176150135168e-06,
"loss": 0.1356,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11983014643192291,
"step": 2990,
"valid_targets_mean": 3673.4,
"valid_targets_min": 1312
},
{
"epoch": 5.093537414965986,
"grad_norm": 0.5606850774518538,
"learning_rate": 8.393000441534036e-06,
"loss": 0.1218,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1205582469701767,
"step": 2995,
"valid_targets_mean": 3382.2,
"valid_targets_min": 1572
},
{
"epoch": 5.1020408163265305,
"grad_norm": 0.58308967535263,
"learning_rate": 8.324033478429559e-06,
"loss": 0.1143,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10241550207138062,
"step": 3000,
"valid_targets_mean": 3517.1,
"valid_targets_min": 1789
},
{
"epoch": 5.110544217687075,
"grad_norm": 0.5010560317558209,
"learning_rate": 8.25527650115461e-06,
"loss": 0.1297,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14672619104385376,
"step": 3005,
"valid_targets_mean": 4090.6,
"valid_targets_min": 613
},
{
"epoch": 5.119047619047619,
"grad_norm": 0.5428848219846862,
"learning_rate": 8.186730746265577e-06,
"loss": 0.1186,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09942807257175446,
"step": 3010,
"valid_targets_mean": 3168.2,
"valid_targets_min": 1170
},
{
"epoch": 5.127551020408164,
"grad_norm": 0.51701896739521,
"learning_rate": 8.118397446520103e-06,
"loss": 0.1209,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11356031149625778,
"step": 3015,
"valid_targets_mean": 3822.1,
"valid_targets_min": 1330
},
{
"epoch": 5.136054421768708,
"grad_norm": 0.5610298521254529,
"learning_rate": 8.050277830854984e-06,
"loss": 0.1177,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10268589854240417,
"step": 3020,
"valid_targets_mean": 3365.3,
"valid_targets_min": 1473
},
{
"epoch": 5.144557823129252,
"grad_norm": 0.5147852147560592,
"learning_rate": 7.982373124363984e-06,
"loss": 0.1125,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11522484570741653,
"step": 3025,
"valid_targets_mean": 3669.4,
"valid_targets_min": 325
},
{
"epoch": 5.153061224489796,
"grad_norm": 0.5551663697519054,
"learning_rate": 7.914684548275875e-06,
"loss": 0.1094,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11051298677921295,
"step": 3030,
"valid_targets_mean": 3926.8,
"valid_targets_min": 861
},
{
"epoch": 5.16156462585034,
"grad_norm": 0.7995351940000094,
"learning_rate": 7.847213319932425e-06,
"loss": 0.1271,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12783026695251465,
"step": 3035,
"valid_targets_mean": 4223.2,
"valid_targets_min": 1160
},
{
"epoch": 5.170068027210885,
"grad_norm": 0.5433303920121849,
"learning_rate": 7.779960652766534e-06,
"loss": 0.1247,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11100686341524124,
"step": 3040,
"valid_targets_mean": 3678.4,
"valid_targets_min": 1334
},
{
"epoch": 5.178571428571429,
"grad_norm": 0.5233906234955884,
"learning_rate": 7.7129277562804e-06,
"loss": 0.1151,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12264975905418396,
"step": 3045,
"valid_targets_mean": 3809.6,
"valid_targets_min": 875
},
{
"epoch": 5.187074829931973,
"grad_norm": 0.5461499007910949,
"learning_rate": 7.646115836023744e-06,
"loss": 0.1157,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12836602330207825,
"step": 3050,
"valid_targets_mean": 4164.1,
"valid_targets_min": 1297
},
{
"epoch": 5.195578231292517,
"grad_norm": 0.4966515297253701,
"learning_rate": 7.5795260935721755e-06,
"loss": 0.1177,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12989744544029236,
"step": 3055,
"valid_targets_mean": 4977.2,
"valid_targets_min": 1325
},
{
"epoch": 5.204081632653061,
"grad_norm": 0.5603026881528321,
"learning_rate": 7.5131597265055585e-06,
"loss": 0.1146,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13274753093719482,
"step": 3060,
"valid_targets_mean": 3628.2,
"valid_targets_min": 1993
},
{
"epoch": 5.212585034013605,
"grad_norm": 0.4915563280912599,
"learning_rate": 7.447017928386453e-06,
"loss": 0.1291,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10731866955757141,
"step": 3065,
"valid_targets_mean": 3817.6,
"valid_targets_min": 1266
},
{
"epoch": 5.22108843537415,
"grad_norm": 0.5880203513035192,
"learning_rate": 7.381101888738693e-06,
"loss": 0.1172,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13712306320667267,
"step": 3070,
"valid_targets_mean": 3312.9,
"valid_targets_min": 429
},
{
"epoch": 5.229591836734694,
"grad_norm": 0.6452402993864961,
"learning_rate": 7.315412793025951e-06,
"loss": 0.1191,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11051145941019058,
"step": 3075,
"valid_targets_mean": 3440.4,
"valid_targets_min": 604
},
{
"epoch": 5.238095238095238,
"grad_norm": 0.47909386074241567,
"learning_rate": 7.24995182263045e-06,
"loss": 0.1125,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11070841550827026,
"step": 3080,
"valid_targets_mean": 4483.2,
"valid_targets_min": 1584
},
{
"epoch": 5.246598639455782,
"grad_norm": 0.5091807283304515,
"learning_rate": 7.184720154831706e-06,
"loss": 0.1371,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12383826076984406,
"step": 3085,
"valid_targets_mean": 4121.9,
"valid_targets_min": 1748
},
{
"epoch": 5.255102040816326,
"grad_norm": 0.5561391846264628,
"learning_rate": 7.119718962785349e-06,
"loss": 0.11,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10299091786146164,
"step": 3090,
"valid_targets_mean": 3107.9,
"valid_targets_min": 1591
},
{
"epoch": 5.263605442176871,
"grad_norm": 0.5439361172002423,
"learning_rate": 7.054949415502037e-06,
"loss": 0.1168,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14960172772407532,
"step": 3095,
"valid_targets_mean": 4154.1,
"valid_targets_min": 1514
},
{
"epoch": 5.272108843537415,
"grad_norm": 0.5055115783208214,
"learning_rate": 6.990412677826404e-06,
"loss": 0.1269,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13446712493896484,
"step": 3100,
"valid_targets_mean": 4222.0,
"valid_targets_min": 1577
},
{
"epoch": 5.280612244897959,
"grad_norm": 0.5051797282464314,
"learning_rate": 6.926109910416153e-06,
"loss": 0.1059,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11003969609737396,
"step": 3105,
"valid_targets_mean": 3936.0,
"valid_targets_min": 2152
},
{
"epoch": 5.289115646258503,
"grad_norm": 0.6721874443565838,
"learning_rate": 6.862042269721158e-06,
"loss": 0.1084,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11099831759929657,
"step": 3110,
"valid_targets_mean": 3415.6,
"valid_targets_min": 1058
},
{
"epoch": 5.2976190476190474,
"grad_norm": 0.5394489454464912,
"learning_rate": 6.798210907962655e-06,
"loss": 0.1177,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12719398736953735,
"step": 3115,
"valid_targets_mean": 3460.3,
"valid_targets_min": 1271
},
{
"epoch": 5.3061224489795915,
"grad_norm": 0.48288105959872535,
"learning_rate": 6.734616973112549e-06,
"loss": 0.1044,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10736523568630219,
"step": 3120,
"valid_targets_mean": 4715.4,
"valid_targets_min": 1485
},
{
"epoch": 5.3146258503401365,
"grad_norm": 0.5025747733371888,
"learning_rate": 6.671261608872737e-06,
"loss": 0.1082,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10189585387706757,
"step": 3125,
"valid_targets_mean": 3567.2,
"valid_targets_min": 1479
},
{
"epoch": 5.3231292517006805,
"grad_norm": 0.5985343176195231,
"learning_rate": 6.60814595465457e-06,
"loss": 0.1196,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11069802939891815,
"step": 3130,
"valid_targets_mean": 3020.3,
"valid_targets_min": 1210
},
{
"epoch": 5.331632653061225,
"grad_norm": 0.5711246776535795,
"learning_rate": 6.545271145558336e-06,
"loss": 0.1212,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1153416782617569,
"step": 3135,
"valid_targets_mean": 3687.6,
"valid_targets_min": 354
},
{
"epoch": 5.340136054421769,
"grad_norm": 0.5442736841286343,
"learning_rate": 6.482638312352867e-06,
"loss": 0.1162,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1518375724554062,
"step": 3140,
"valid_targets_mean": 3984.1,
"valid_targets_min": 1712
},
{
"epoch": 5.348639455782313,
"grad_norm": 0.5921573966375302,
"learning_rate": 6.420248581455184e-06,
"loss": 0.112,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12098226696252823,
"step": 3145,
"valid_targets_mean": 3470.0,
"valid_targets_min": 1603
},
{
"epoch": 5.357142857142857,
"grad_norm": 0.5697364605515239,
"learning_rate": 6.358103074910238e-06,
"loss": 0.1331,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13729847967624664,
"step": 3150,
"valid_targets_mean": 3894.2,
"valid_targets_min": 1645
},
{
"epoch": 5.365646258503402,
"grad_norm": 0.4871709662606649,
"learning_rate": 6.296202910370757e-06,
"loss": 0.1215,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13507282733917236,
"step": 3155,
"valid_targets_mean": 4424.4,
"valid_targets_min": 1180
},
{
"epoch": 5.374149659863946,
"grad_norm": 0.577744628501453,
"learning_rate": 6.234549201077124e-06,
"loss": 0.1104,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10959557443857193,
"step": 3160,
"valid_targets_mean": 3010.2,
"valid_targets_min": 1496
},
{
"epoch": 5.38265306122449,
"grad_norm": 0.5829555774391696,
"learning_rate": 6.173143055837345e-06,
"loss": 0.1092,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11792930960655212,
"step": 3165,
"valid_targets_mean": 3196.4,
"valid_targets_min": 721
},
{
"epoch": 5.391156462585034,
"grad_norm": 0.4993975366287769,
"learning_rate": 6.111985579007149e-06,
"loss": 0.1249,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12624284625053406,
"step": 3170,
"valid_targets_mean": 4134.6,
"valid_targets_min": 1236
},
{
"epoch": 5.399659863945578,
"grad_norm": 0.5107866919709771,
"learning_rate": 6.051077870470068e-06,
"loss": 0.1168,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11668853461742401,
"step": 3175,
"valid_targets_mean": 4047.1,
"valid_targets_min": 1577
},
{
"epoch": 5.408163265306122,
"grad_norm": 0.5252474663513425,
"learning_rate": 5.990421025617716e-06,
"loss": 0.1102,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09952177107334137,
"step": 3180,
"valid_targets_mean": 3666.6,
"valid_targets_min": 1741
},
{
"epoch": 5.416666666666667,
"grad_norm": 0.5015726628558949,
"learning_rate": 5.930016135330052e-06,
"loss": 0.1184,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11919872462749481,
"step": 3185,
"valid_targets_mean": 4237.8,
"valid_targets_min": 1198
},
{
"epoch": 5.425170068027211,
"grad_norm": 0.4769102709235795,
"learning_rate": 5.869864285955771e-06,
"loss": 0.1304,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10949502885341644,
"step": 3190,
"valid_targets_mean": 4599.4,
"valid_targets_min": 1069
},
{
"epoch": 5.433673469387755,
"grad_norm": 0.5498618632742693,
"learning_rate": 5.80996655929277e-06,
"loss": 0.1189,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12536795437335968,
"step": 3195,
"valid_targets_mean": 3588.6,
"valid_targets_min": 1136
},
{
"epoch": 5.442176870748299,
"grad_norm": 0.545561483870248,
"learning_rate": 5.750324032568677e-06,
"loss": 0.1206,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12246537208557129,
"step": 3200,
"valid_targets_mean": 3596.1,
"valid_targets_min": 1312
},
{
"epoch": 5.450680272108843,
"grad_norm": 0.6040925588691938,
"learning_rate": 5.6909377784215035e-06,
"loss": 0.1202,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10457558184862137,
"step": 3205,
"valid_targets_mean": 2857.7,
"valid_targets_min": 1024
},
{
"epoch": 5.459183673469388,
"grad_norm": 0.5913736902327493,
"learning_rate": 5.631808864880342e-06,
"loss": 0.1241,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11675500869750977,
"step": 3210,
"valid_targets_mean": 3617.6,
"valid_targets_min": 1573
},
{
"epoch": 5.467687074829932,
"grad_norm": 0.564857354499183,
"learning_rate": 5.5729383553461315e-06,
"loss": 0.1141,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10473236441612244,
"step": 3215,
"valid_targets_mean": 3246.6,
"valid_targets_min": 1352
},
{
"epoch": 5.476190476190476,
"grad_norm": 0.6156419129927186,
"learning_rate": 5.5143273085725894e-06,
"loss": 0.1397,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11393928527832031,
"step": 3220,
"valid_targets_mean": 2748.5,
"valid_targets_min": 1241
},
{
"epoch": 5.48469387755102,
"grad_norm": 0.45521005132445264,
"learning_rate": 5.45597677864711e-06,
"loss": 0.1118,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10282590985298157,
"step": 3225,
"valid_targets_mean": 4610.5,
"valid_targets_min": 1112
},
{
"epoch": 5.493197278911564,
"grad_norm": 0.5837854371759927,
"learning_rate": 5.397887814971854e-06,
"loss": 0.1219,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12497810274362564,
"step": 3230,
"valid_targets_mean": 3359.5,
"valid_targets_min": 1305
},
{
"epoch": 5.5017006802721085,
"grad_norm": 0.5527734282651293,
"learning_rate": 5.34006146224485e-06,
"loss": 0.1252,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1028062105178833,
"step": 3235,
"valid_targets_mean": 3404.5,
"valid_targets_min": 1249
},
{
"epoch": 5.510204081632653,
"grad_norm": 0.5266096072280819,
"learning_rate": 5.282498760441219e-06,
"loss": 0.1216,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11795396357774734,
"step": 3240,
"valid_targets_mean": 3558.4,
"valid_targets_min": 1270
},
{
"epoch": 5.5187074829931975,
"grad_norm": 0.540851535403909,
"learning_rate": 5.225200744794465e-06,
"loss": 0.1414,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17452237010002136,
"step": 3245,
"valid_targets_mean": 4261.2,
"valid_targets_min": 1507
},
{
"epoch": 5.5272108843537415,
"grad_norm": 0.5182603091934628,
"learning_rate": 5.168168445777839e-06,
"loss": 0.1297,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1529075652360916,
"step": 3250,
"valid_targets_mean": 4521.4,
"valid_targets_min": 389
},
{
"epoch": 5.535714285714286,
"grad_norm": 0.5805823631890119,
"learning_rate": 5.111402889085852e-06,
"loss": 0.1178,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14389967918395996,
"step": 3255,
"valid_targets_mean": 3602.2,
"valid_targets_min": 1451
},
{
"epoch": 5.54421768707483,
"grad_norm": 0.5729116752291277,
"learning_rate": 5.054905095615779e-06,
"loss": 0.1156,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11263558268547058,
"step": 3260,
"valid_targets_mean": 3662.2,
"valid_targets_min": 1362
},
{
"epoch": 5.552721088435375,
"grad_norm": 0.5902153815232817,
"learning_rate": 4.9986760814493315e-06,
"loss": 0.1151,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10420026630163193,
"step": 3265,
"valid_targets_mean": 3085.2,
"valid_targets_min": 1562
},
{
"epoch": 5.561224489795919,
"grad_norm": 0.5079041365032244,
"learning_rate": 4.94271685783438e-06,
"loss": 0.1285,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10216909646987915,
"step": 3270,
"valid_targets_mean": 3791.7,
"valid_targets_min": 1329
},
{
"epoch": 5.569727891156463,
"grad_norm": 0.5323053118094618,
"learning_rate": 4.88702843116674e-06,
"loss": 0.1108,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11844904720783234,
"step": 3275,
"valid_targets_mean": 4096.2,
"valid_targets_min": 717
},
{
"epoch": 5.578231292517007,
"grad_norm": 0.5913613540592834,
"learning_rate": 4.831611802972112e-06,
"loss": 0.1091,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12086708843708038,
"step": 3280,
"valid_targets_mean": 3125.9,
"valid_targets_min": 1140
},
{
"epoch": 5.586734693877551,
"grad_norm": 0.6067435787352505,
"learning_rate": 4.776467969888041e-06,
"loss": 0.1404,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1235356330871582,
"step": 3285,
"valid_targets_mean": 2861.3,
"valid_targets_min": 861
},
{
"epoch": 5.595238095238095,
"grad_norm": 0.6143172537137376,
"learning_rate": 4.721597923646008e-06,
"loss": 0.1218,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13739518821239471,
"step": 3290,
"valid_targets_mean": 3314.9,
"valid_targets_min": 724
},
{
"epoch": 5.603741496598639,
"grad_norm": 0.5285568105683806,
"learning_rate": 4.667002651053582e-06,
"loss": 0.1103,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10752934962511063,
"step": 3295,
"valid_targets_mean": 3720.3,
"valid_targets_min": 1406
},
{
"epoch": 5.612244897959184,
"grad_norm": 0.5479976862189573,
"learning_rate": 4.612683133976692e-06,
"loss": 0.128,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15180706977844238,
"step": 3300,
"valid_targets_mean": 3768.8,
"valid_targets_min": 1531
},
{
"epoch": 5.620748299319728,
"grad_norm": 0.5462163829552453,
"learning_rate": 4.5586403493219365e-06,
"loss": 0.1159,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10777892172336578,
"step": 3305,
"valid_targets_mean": 3076.4,
"valid_targets_min": 988
},
{
"epoch": 5.629251700680272,
"grad_norm": 0.5243365624661317,
"learning_rate": 4.504875269019038e-06,
"loss": 0.118,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1242019534111023,
"step": 3310,
"valid_targets_mean": 4469.8,
"valid_targets_min": 1440
},
{
"epoch": 5.637755102040816,
"grad_norm": 0.6223327575084228,
"learning_rate": 4.451388860003374e-06,
"loss": 0.119,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14461229741573334,
"step": 3315,
"valid_targets_mean": 3680.9,
"valid_targets_min": 759
},
{
"epoch": 5.646258503401361,
"grad_norm": 0.5627481662897891,
"learning_rate": 4.398182084198561e-06,
"loss": 0.1315,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11661049723625183,
"step": 3320,
"valid_targets_mean": 3855.8,
"valid_targets_min": 1624
},
{
"epoch": 5.654761904761905,
"grad_norm": 0.5770944346437502,
"learning_rate": 4.345255898499172e-06,
"loss": 0.1296,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13459742069244385,
"step": 3325,
"valid_targets_mean": 3598.4,
"valid_targets_min": 1468
},
{
"epoch": 5.663265306122449,
"grad_norm": 0.6063654059969268,
"learning_rate": 4.292611254753509e-06,
"loss": 0.1173,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1045822948217392,
"step": 3330,
"valid_targets_mean": 4255.0,
"valid_targets_min": 1895
},
{
"epoch": 5.671768707482993,
"grad_norm": 0.6199385704660482,
"learning_rate": 4.24024909974651e-06,
"loss": 0.1261,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11114975064992905,
"step": 3335,
"valid_targets_mean": 2667.2,
"valid_targets_min": 1101
},
{
"epoch": 5.680272108843537,
"grad_norm": 0.5741341263715167,
"learning_rate": 4.188170375182705e-06,
"loss": 0.1214,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13209852576255798,
"step": 3340,
"valid_targets_mean": 3331.6,
"valid_targets_min": 766
},
{
"epoch": 5.688775510204081,
"grad_norm": 0.5849953260351614,
"learning_rate": 4.136376017669281e-06,
"loss": 0.1384,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19509027898311615,
"step": 3345,
"valid_targets_mean": 4514.0,
"valid_targets_min": 1096
},
{
"epoch": 5.697278911564625,
"grad_norm": 0.5184855624946975,
"learning_rate": 4.084866958699247e-06,
"loss": 0.1187,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11184950917959213,
"step": 3350,
"valid_targets_mean": 3622.2,
"valid_targets_min": 1657
},
{
"epoch": 5.70578231292517,
"grad_norm": 0.4729255009742215,
"learning_rate": 4.0336441246346684e-06,
"loss": 0.121,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12170318514108658,
"step": 3355,
"valid_targets_mean": 4347.8,
"valid_targets_min": 1545
},
{
"epoch": 5.714285714285714,
"grad_norm": 0.4886970159573961,
"learning_rate": 3.982708436690001e-06,
"loss": 0.112,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10606701672077179,
"step": 3360,
"valid_targets_mean": 4402.9,
"valid_targets_min": 1266
},
{
"epoch": 5.7227891156462585,
"grad_norm": 0.5492917249221348,
"learning_rate": 3.932060810915563e-06,
"loss": 0.1298,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12230627238750458,
"step": 3365,
"valid_targets_mean": 3404.1,
"valid_targets_min": 1157
},
{
"epoch": 5.7312925170068025,
"grad_norm": 0.5515095288619949,
"learning_rate": 3.881702158181015e-06,
"loss": 0.1127,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09741039574146271,
"step": 3370,
"valid_targets_mean": 3078.1,
"valid_targets_min": 1540
},
{
"epoch": 5.739795918367347,
"grad_norm": 0.5994347022720987,
"learning_rate": 3.831633384159006e-06,
"loss": 0.114,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10247445851564407,
"step": 3375,
"valid_targets_mean": 2756.9,
"valid_targets_min": 750
},
{
"epoch": 5.7482993197278915,
"grad_norm": 0.5662527226383535,
"learning_rate": 3.7818553893088596e-06,
"loss": 0.1228,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1331837773323059,
"step": 3380,
"valid_targets_mean": 4074.8,
"valid_targets_min": 1109
},
{
"epoch": 5.756802721088436,
"grad_norm": 0.6312403630388446,
"learning_rate": 3.7323690688604153e-06,
"loss": 0.1137,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12030863016843796,
"step": 3385,
"valid_targets_mean": 2706.7,
"valid_targets_min": 1132
},
{
"epoch": 5.76530612244898,
"grad_norm": 0.4665440158007456,
"learning_rate": 3.6831753127978974e-06,
"loss": 0.1125,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11458925902843475,
"step": 3390,
"valid_targets_mean": 4522.5,
"valid_targets_min": 1805
},
{
"epoch": 5.773809523809524,
"grad_norm": 0.5271545621260861,
"learning_rate": 3.634275005843935e-06,
"loss": 0.1109,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09652923047542572,
"step": 3395,
"valid_targets_mean": 3248.9,
"valid_targets_min": 883
},
{
"epoch": 5.782312925170068,
"grad_norm": 0.5145222459804143,
"learning_rate": 3.585669027443608e-06,
"loss": 0.1164,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10808805376291275,
"step": 3400,
"valid_targets_mean": 3782.8,
"valid_targets_min": 294
},
{
"epoch": 5.790816326530612,
"grad_norm": 0.6087405762550093,
"learning_rate": 3.537358251748695e-06,
"loss": 0.1298,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15609332919120789,
"step": 3405,
"valid_targets_mean": 3078.8,
"valid_targets_min": 1245
},
{
"epoch": 5.799319727891157,
"grad_norm": 0.493673691287559,
"learning_rate": 3.489343547601882e-06,
"loss": 0.1193,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11217699944972992,
"step": 3410,
"valid_targets_mean": 4235.0,
"valid_targets_min": 1172
},
{
"epoch": 5.807823129251701,
"grad_norm": 0.5330291348481382,
"learning_rate": 3.4416257785211983e-06,
"loss": 0.1133,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08841429650783539,
"step": 3415,
"valid_targets_mean": 3745.4,
"valid_targets_min": 1474
},
{
"epoch": 5.816326530612245,
"grad_norm": 0.57971467987211,
"learning_rate": 3.3942058026844472e-06,
"loss": 0.126,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15836650133132935,
"step": 3420,
"valid_targets_mean": 3547.6,
"valid_targets_min": 1208
},
{
"epoch": 5.824829931972789,
"grad_norm": 0.47906681279107716,
"learning_rate": 3.3470844729137886e-06,
"loss": 0.1217,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10378694534301758,
"step": 3425,
"valid_targets_mean": 4480.3,
"valid_targets_min": 1556
},
{
"epoch": 5.833333333333333,
"grad_norm": 0.5967888879124165,
"learning_rate": 3.3002626366603896e-06,
"loss": 0.1225,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1304030567407608,
"step": 3430,
"valid_targets_mean": 3002.1,
"valid_targets_min": 333
},
{
"epoch": 5.841836734693878,
"grad_norm": 0.5315803544065215,
"learning_rate": 3.253741135989199e-06,
"loss": 0.1101,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11456482112407684,
"step": 3435,
"valid_targets_mean": 3406.2,
"valid_targets_min": 1408
},
{
"epoch": 5.850340136054422,
"grad_norm": 0.5617527254427237,
"learning_rate": 3.2075208075637953e-06,
"loss": 0.1518,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13196901977062225,
"step": 3440,
"valid_targets_mean": 3691.4,
"valid_targets_min": 1216
},
{
"epoch": 5.858843537414966,
"grad_norm": 0.5521550371634127,
"learning_rate": 3.161602482631343e-06,
"loss": 0.1162,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13317209482192993,
"step": 3445,
"valid_targets_mean": 4007.6,
"valid_targets_min": 1478
},
{
"epoch": 5.86734693877551,
"grad_norm": 1.6598007447933765,
"learning_rate": 3.115986987007622e-06,
"loss": 0.1189,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11910313367843628,
"step": 3450,
"valid_targets_mean": 3475.4,
"valid_targets_min": 1452
},
{
"epoch": 5.875850340136054,
"grad_norm": 0.5198857712479822,
"learning_rate": 3.0706751410622184e-06,
"loss": 0.116,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09872958809137344,
"step": 3455,
"valid_targets_mean": 3633.4,
"valid_targets_min": 1608
},
{
"epoch": 5.884353741496598,
"grad_norm": 0.6586650995065951,
"learning_rate": 3.0256677597037253e-06,
"loss": 0.1186,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15523600578308105,
"step": 3460,
"valid_targets_mean": 2631.6,
"valid_targets_min": 626
},
{
"epoch": 5.892857142857143,
"grad_norm": 0.5820548403555877,
"learning_rate": 2.980965652365122e-06,
"loss": 0.1219,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12451058626174927,
"step": 3465,
"valid_targets_mean": 3528.8,
"valid_targets_min": 1231
},
{
"epoch": 5.901360544217687,
"grad_norm": 0.5001256201730465,
"learning_rate": 2.936569622989198e-06,
"loss": 0.1044,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09069167822599411,
"step": 3470,
"valid_targets_mean": 3679.2,
"valid_targets_min": 1597
},
{
"epoch": 5.909863945578231,
"grad_norm": 0.6527876550739389,
"learning_rate": 2.892480470014101e-06,
"loss": 0.1173,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12368982285261154,
"step": 3475,
"valid_targets_mean": 2663.8,
"valid_targets_min": 1083
},
{
"epoch": 5.918367346938775,
"grad_norm": 0.6049378944092306,
"learning_rate": 2.8486989863589665e-06,
"loss": 0.1261,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16314776241779327,
"step": 3480,
"valid_targets_mean": 3331.4,
"valid_targets_min": 1199
},
{
"epoch": 5.9268707482993195,
"grad_norm": 0.5321145816925281,
"learning_rate": 2.8052259594096786e-06,
"loss": 0.1098,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10574959218502045,
"step": 3485,
"valid_targets_mean": 4042.9,
"valid_targets_min": 1737
},
{
"epoch": 5.935374149659864,
"grad_norm": 0.5249443175372537,
"learning_rate": 2.762062171004689e-06,
"loss": 0.1169,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13219550251960754,
"step": 3490,
"valid_targets_mean": 3747.8,
"valid_targets_min": 1114
},
{
"epoch": 5.9438775510204085,
"grad_norm": 0.5349877929860054,
"learning_rate": 2.719208397420976e-06,
"loss": 0.1135,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10431113094091415,
"step": 3495,
"valid_targets_mean": 4021.3,
"valid_targets_min": 1584
},
{
"epoch": 5.9523809523809526,
"grad_norm": 0.615252584404469,
"learning_rate": 2.6766654093600554e-06,
"loss": 0.1138,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10922113060951233,
"step": 3500,
"valid_targets_mean": 2900.0,
"valid_targets_min": 888
},
{
"epoch": 5.960884353741497,
"grad_norm": 0.5660078177837199,
"learning_rate": 2.634433971934145e-06,
"loss": 0.1291,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16342481970787048,
"step": 3505,
"valid_targets_mean": 4022.2,
"valid_targets_min": 1349
},
{
"epoch": 5.969387755102041,
"grad_norm": 0.5633990506355825,
"learning_rate": 2.592514844652396e-06,
"loss": 0.1157,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10728654265403748,
"step": 3510,
"valid_targets_mean": 3335.4,
"valid_targets_min": 893
},
{
"epoch": 5.977891156462585,
"grad_norm": 0.5618270096817878,
"learning_rate": 2.5509087814072373e-06,
"loss": 0.1139,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13099925220012665,
"step": 3515,
"valid_targets_mean": 3559.8,
"valid_targets_min": 1589
},
{
"epoch": 5.986394557823129,
"grad_norm": 0.5950284042429369,
"learning_rate": 2.5096165304608055e-06,
"loss": 0.129,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11572650074958801,
"step": 3520,
"valid_targets_mean": 3260.1,
"valid_targets_min": 1543
},
{
"epoch": 5.994897959183674,
"grad_norm": 0.6431959290467469,
"learning_rate": 2.468638834431507e-06,
"loss": 0.1137,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11295954883098602,
"step": 3525,
"valid_targets_mean": 2737.2,
"valid_targets_min": 1360
},
{
"epoch": 6.003401360544218,
"grad_norm": 0.477579265700717,
"learning_rate": 2.427976430280634e-06,
"loss": 0.1096,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10084202885627747,
"step": 3530,
"valid_targets_mean": 4324.1,
"valid_targets_min": 1427
},
{
"epoch": 6.011904761904762,
"grad_norm": 0.4454117266637318,
"learning_rate": 2.3876300492991456e-06,
"loss": 0.1012,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09745575487613678,
"step": 3535,
"valid_targets_mean": 4572.9,
"valid_targets_min": 1417
},
{
"epoch": 6.020408163265306,
"grad_norm": 0.478412233942278,
"learning_rate": 2.3476004170944843e-06,
"loss": 0.1137,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1278717815876007,
"step": 3540,
"valid_targets_mean": 4723.2,
"valid_targets_min": 1093
},
{
"epoch": 6.02891156462585,
"grad_norm": 0.5184477127041136,
"learning_rate": 2.307888253577557e-06,
"loss": 0.1101,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12066527456045151,
"step": 3545,
"valid_targets_mean": 4437.1,
"valid_targets_min": 1155
},
{
"epoch": 6.037414965986395,
"grad_norm": 0.5620893513671174,
"learning_rate": 2.2684942729497505e-06,
"loss": 0.1143,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11014530062675476,
"step": 3550,
"valid_targets_mean": 3719.1,
"valid_targets_min": 1521
},
{
"epoch": 6.045918367346939,
"grad_norm": 0.5352459906510691,
"learning_rate": 2.229419183690118e-06,
"loss": 0.1118,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10845694690942764,
"step": 3555,
"valid_targets_mean": 3726.8,
"valid_targets_min": 1406
},
{
"epoch": 6.054421768707483,
"grad_norm": 0.55710958865019,
"learning_rate": 2.1906636885426293e-06,
"loss": 0.1058,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1064843237400055,
"step": 3560,
"valid_targets_mean": 3575.5,
"valid_targets_min": 1709
},
{
"epoch": 6.062925170068027,
"grad_norm": 0.5432557912713459,
"learning_rate": 2.1522284845035246e-06,
"loss": 0.1056,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11107736825942993,
"step": 3565,
"valid_targets_mean": 3768.4,
"valid_targets_min": 738
},
{
"epoch": 6.071428571428571,
"grad_norm": 0.511605737896378,
"learning_rate": 2.1141142628087908e-06,
"loss": 0.1113,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15048445761203766,
"step": 3570,
"valid_targets_mean": 5072.7,
"valid_targets_min": 1249
},
{
"epoch": 6.079931972789115,
"grad_norm": 0.5766159647704026,
"learning_rate": 2.0763217089217204e-06,
"loss": 0.1226,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10604619234800339,
"step": 3575,
"valid_targets_mean": 3533.0,
"valid_targets_min": 1648
},
{
"epoch": 6.08843537414966,
"grad_norm": 0.5836072850396373,
"learning_rate": 2.0388515025205912e-06,
"loss": 0.1111,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12037845700979233,
"step": 3580,
"valid_targets_mean": 3252.4,
"valid_targets_min": 690
},
{
"epoch": 6.096938775510204,
"grad_norm": 0.6153532334687207,
"learning_rate": 2.0017043174864257e-06,
"loss": 0.1188,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11313758790493011,
"step": 3585,
"valid_targets_mean": 3177.9,
"valid_targets_min": 526
},
{
"epoch": 6.105442176870748,
"grad_norm": 0.6539832007276991,
"learning_rate": 1.9648808218909023e-06,
"loss": 0.1239,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11016803234815598,
"step": 3590,
"valid_targets_mean": 3561.9,
"valid_targets_min": 851
},
{
"epoch": 6.113945578231292,
"grad_norm": 0.5088070903468043,
"learning_rate": 1.928381677984319e-06,
"loss": 0.1424,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10234713554382324,
"step": 3595,
"valid_targets_mean": 3746.4,
"valid_targets_min": 1318
},
{
"epoch": 6.122448979591836,
"grad_norm": 0.5727361664596694,
"learning_rate": 1.8922075421836729e-06,
"loss": 0.1191,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1115289181470871,
"step": 3600,
"valid_targets_mean": 3681.5,
"valid_targets_min": 1477
},
{
"epoch": 6.130952380952381,
"grad_norm": 0.5703340884857128,
"learning_rate": 1.8563590650608908e-06,
"loss": 0.1085,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11293356120586395,
"step": 3605,
"valid_targets_mean": 3610.5,
"valid_targets_min": 1115
},
{
"epoch": 6.139455782312925,
"grad_norm": 0.5567638013057162,
"learning_rate": 1.8208368913310881e-06,
"loss": 0.1208,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1489240676164627,
"step": 3610,
"valid_targets_mean": 4215.0,
"valid_targets_min": 1364
},
{
"epoch": 6.1479591836734695,
"grad_norm": 0.5496607355990576,
"learning_rate": 1.7856416598410064e-06,
"loss": 0.1368,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08839699625968933,
"step": 3615,
"valid_targets_mean": 3228.2,
"valid_targets_min": 1349
},
{
"epoch": 6.156462585034014,
"grad_norm": 0.6666358234359487,
"learning_rate": 1.7507740035575049e-06,
"loss": 0.1143,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12748566269874573,
"step": 3620,
"valid_targets_mean": 2800.0,
"valid_targets_min": 288
},
{
"epoch": 6.164965986394558,
"grad_norm": 0.5782864339340296,
"learning_rate": 1.7162345495561905e-06,
"loss": 0.1288,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14760619401931763,
"step": 3625,
"valid_targets_mean": 3669.2,
"valid_targets_min": 1239
},
{
"epoch": 6.173469387755102,
"grad_norm": 0.5618155339533111,
"learning_rate": 1.682023919010125e-06,
"loss": 0.1312,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09852004796266556,
"step": 3630,
"valid_targets_mean": 3470.2,
"valid_targets_min": 1202
},
{
"epoch": 6.181972789115647,
"grad_norm": 0.598362631078015,
"learning_rate": 1.6481427271786588e-06,
"loss": 0.1118,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10615670680999756,
"step": 3635,
"valid_targets_mean": 3053.8,
"valid_targets_min": 814
},
{
"epoch": 6.190476190476191,
"grad_norm": 0.5591508889473271,
"learning_rate": 1.6145915833963788e-06,
"loss": 0.1153,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09319960325956345,
"step": 3640,
"valid_targets_mean": 3101.5,
"valid_targets_min": 1543
},
{
"epoch": 6.198979591836735,
"grad_norm": 0.5882835479569136,
"learning_rate": 1.5813710910621293e-06,
"loss": 0.1089,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11982224881649017,
"step": 3645,
"valid_targets_mean": 3055.9,
"valid_targets_min": 1361
},
{
"epoch": 6.207482993197279,
"grad_norm": 0.5792923656094919,
"learning_rate": 1.548481847628176e-06,
"loss": 0.1195,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11135858297348022,
"step": 3650,
"valid_targets_mean": 3600.5,
"valid_targets_min": 1127
},
{
"epoch": 6.215986394557823,
"grad_norm": 0.5892203254512576,
"learning_rate": 1.5159244445894605e-06,
"loss": 0.1135,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11109749972820282,
"step": 3655,
"valid_targets_mean": 3371.7,
"valid_targets_min": 1418
},
{
"epoch": 6.224489795918367,
"grad_norm": 0.527490492326501,
"learning_rate": 1.4836994674729433e-06,
"loss": 0.1075,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09896763414144516,
"step": 3660,
"valid_targets_mean": 3538.0,
"valid_targets_min": 1383
},
{
"epoch": 6.232993197278912,
"grad_norm": 0.563826301919356,
"learning_rate": 1.4518074958271e-06,
"loss": 0.1229,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13025017082691193,
"step": 3665,
"valid_targets_mean": 3828.9,
"valid_targets_min": 1612
},
{
"epoch": 6.241496598639456,
"grad_norm": 0.5606773143753264,
"learning_rate": 1.4202491032114797e-06,
"loss": 0.1133,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10734811425209045,
"step": 3670,
"valid_targets_mean": 3267.6,
"valid_targets_min": 1532
},
{
"epoch": 6.25,
"grad_norm": 0.5854260290454237,
"learning_rate": 1.389024857186403e-06,
"loss": 0.0964,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09467275440692902,
"step": 3675,
"valid_targets_mean": 3203.1,
"valid_targets_min": 668
},
{
"epoch": 6.258503401360544,
"grad_norm": 0.49104713182267146,
"learning_rate": 1.3581353193027424e-06,
"loss": 0.1201,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11616228520870209,
"step": 3680,
"valid_targets_mean": 4475.0,
"valid_targets_min": 294
},
{
"epoch": 6.267006802721088,
"grad_norm": 0.6050149142306898,
"learning_rate": 1.3275810450918257e-06,
"loss": 0.1149,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11099812388420105,
"step": 3685,
"valid_targets_mean": 3569.8,
"valid_targets_min": 1659
},
{
"epoch": 6.275510204081632,
"grad_norm": 0.562170069430547,
"learning_rate": 1.2973625840554593e-06,
"loss": 0.1125,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10738849639892578,
"step": 3690,
"valid_targets_mean": 3418.9,
"valid_targets_min": 1727
},
{
"epoch": 6.284013605442177,
"grad_norm": 0.5017474742394269,
"learning_rate": 1.2674804796560202e-06,
"loss": 0.1078,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12143012881278992,
"step": 3695,
"valid_targets_mean": 4531.0,
"valid_targets_min": 534
},
{
"epoch": 6.292517006802721,
"grad_norm": 0.5391996228968388,
"learning_rate": 1.237935269306707e-06,
"loss": 0.114,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11418686807155609,
"step": 3700,
"valid_targets_mean": 4400.1,
"valid_targets_min": 1657
},
{
"epoch": 6.301020408163265,
"grad_norm": 0.5104246666127118,
"learning_rate": 1.2087274843618668e-06,
"loss": 0.1067,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09506049752235413,
"step": 3705,
"valid_targets_mean": 3893.9,
"valid_targets_min": 1584
},
{
"epoch": 6.309523809523809,
"grad_norm": 0.5992141275873888,
"learning_rate": 1.1798576501074233e-06,
"loss": 0.1194,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10688906162977219,
"step": 3710,
"valid_targets_mean": 2873.1,
"valid_targets_min": 1624
},
{
"epoch": 6.318027210884353,
"grad_norm": 0.6627760286529151,
"learning_rate": 1.151326285751455e-06,
"loss": 0.1027,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10680701583623886,
"step": 3715,
"valid_targets_mean": 3383.1,
"valid_targets_min": 1469
},
{
"epoch": 6.326530612244898,
"grad_norm": 0.5143956921633834,
"learning_rate": 1.1231339044148393e-06,
"loss": 0.1114,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11333712935447693,
"step": 3720,
"valid_targets_mean": 4535.8,
"valid_targets_min": 1529
},
{
"epoch": 6.335034013605442,
"grad_norm": 0.5751586207418208,
"learning_rate": 1.095281013122036e-06,
"loss": 0.1169,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09510093927383423,
"step": 3725,
"valid_targets_mean": 3208.8,
"valid_targets_min": 1558
},
{
"epoch": 6.343537414965986,
"grad_norm": 0.9443328517820183,
"learning_rate": 1.0677681127919581e-06,
"loss": 0.1122,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12241110950708389,
"step": 3730,
"valid_targets_mean": 3732.4,
"valid_targets_min": 1114
},
{
"epoch": 6.3520408163265305,
"grad_norm": 0.5456126321948206,
"learning_rate": 1.04059569822897e-06,
"loss": 0.1037,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11154021322727203,
"step": 3735,
"valid_targets_mean": 3789.4,
"valid_targets_min": 1474
},
{
"epoch": 6.360544217687075,
"grad_norm": 0.6107837672044061,
"learning_rate": 1.0137642581139895e-06,
"loss": 0.1165,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11448526382446289,
"step": 3740,
"valid_targets_mean": 2861.9,
"valid_targets_min": 1011
},
{
"epoch": 6.369047619047619,
"grad_norm": 0.5550637999848018,
"learning_rate": 9.87274274995693e-07,
"loss": 0.1166,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1355058252811432,
"step": 3745,
"valid_targets_mean": 3923.8,
"valid_targets_min": 844
},
{
"epoch": 6.377551020408164,
"grad_norm": 0.5499184670462272,
"learning_rate": 9.61126225281841e-07,
"loss": 0.1265,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1835326850414276,
"step": 3750,
"valid_targets_mean": 4376.8,
"valid_targets_min": 1386
},
{
"epoch": 6.386054421768708,
"grad_norm": 0.5598653966572599,
"learning_rate": 9.353205792307163e-07,
"loss": 0.1168,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1339794397354126,
"step": 3755,
"valid_targets_mean": 3800.2,
"valid_targets_min": 1519
},
{
"epoch": 6.394557823129252,
"grad_norm": 0.6026219846226943,
"learning_rate": 9.098578009426484e-07,
"loss": 0.1063,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10622464120388031,
"step": 3760,
"valid_targets_mean": 3525.6,
"valid_targets_min": 799
},
{
"epoch": 6.403061224489796,
"grad_norm": 0.5525824324094764,
"learning_rate": 8.847383483516903e-07,
"loss": 0.1115,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11089949309825897,
"step": 3765,
"valid_targets_mean": 3808.2,
"valid_targets_min": 1801
},
{
"epoch": 6.41156462585034,
"grad_norm": 0.5806460615603857,
"learning_rate": 8.599626732173671e-07,
"loss": 0.1224,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11263792216777802,
"step": 3770,
"valid_targets_mean": 3948.2,
"valid_targets_min": 1166
},
{
"epoch": 6.420068027210885,
"grad_norm": 0.5218407093507026,
"learning_rate": 8.355312211165568e-07,
"loss": 0.1148,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12748584151268005,
"step": 3775,
"valid_targets_mean": 3853.9,
"valid_targets_min": 1617
},
{
"epoch": 6.428571428571429,
"grad_norm": 0.5270239739962835,
"learning_rate": 8.11444431435473e-07,
"loss": 0.1079,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1101468950510025,
"step": 3780,
"valid_targets_mean": 4074.8,
"valid_targets_min": 1047
},
{
"epoch": 6.437074829931973,
"grad_norm": 0.5563024099626601,
"learning_rate": 7.87702737361764e-07,
"loss": 0.1261,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10898242145776749,
"step": 3785,
"valid_targets_mean": 3889.8,
"valid_targets_min": 626
},
{
"epoch": 6.445578231292517,
"grad_norm": 0.46404697622035623,
"learning_rate": 7.643065658767312e-07,
"loss": 0.1173,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09871433675289154,
"step": 3790,
"valid_targets_mean": 4953.9,
"valid_targets_min": 1568
},
{
"epoch": 6.454081632653061,
"grad_norm": 0.4990012456904466,
"learning_rate": 7.412563377476312e-07,
"loss": 0.1138,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11271509528160095,
"step": 3795,
"valid_targets_mean": 4299.8,
"valid_targets_min": 1429
},
{
"epoch": 6.462585034013605,
"grad_norm": 0.5531901069965772,
"learning_rate": 7.185524675201328e-07,
"loss": 0.1159,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12225601822137833,
"step": 3800,
"valid_targets_mean": 4172.3,
"valid_targets_min": 1159
},
{
"epoch": 6.47108843537415,
"grad_norm": 0.5402043893820961,
"learning_rate": 6.961953635108409e-07,
"loss": 0.1231,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10706687718629837,
"step": 3805,
"valid_targets_mean": 3612.2,
"valid_targets_min": 1306
},
{
"epoch": 6.479591836734694,
"grad_norm": 0.5789107548087521,
"learning_rate": 6.741854277999583e-07,
"loss": 0.1016,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11366184055805206,
"step": 3810,
"valid_targets_mean": 3378.6,
"valid_targets_min": 1354
},
{
"epoch": 6.488095238095238,
"grad_norm": 0.4713440181846783,
"learning_rate": 6.525230562240636e-07,
"loss": 0.1169,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10541140288114548,
"step": 3815,
"valid_targets_mean": 4977.9,
"valid_targets_min": 1681
},
{
"epoch": 6.496598639455782,
"grad_norm": 0.5699975953341101,
"learning_rate": 6.312086383689831e-07,
"loss": 0.1139,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08873768895864487,
"step": 3820,
"valid_targets_mean": 3275.1,
"valid_targets_min": 1437
},
{
"epoch": 6.505102040816326,
"grad_norm": 0.5571386497340849,
"learning_rate": 6.10242557562788e-07,
"loss": 0.1008,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09184282273054123,
"step": 3825,
"valid_targets_mean": 3166.5,
"valid_targets_min": 429
},
{
"epoch": 6.513605442176871,
"grad_norm": 0.5624098278712437,
"learning_rate": 5.896251908688966e-07,
"loss": 0.0949,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10643933713436127,
"step": 3830,
"valid_targets_mean": 3651.6,
"valid_targets_min": 1300
},
{
"epoch": 6.522108843537415,
"grad_norm": 0.63514069662102,
"learning_rate": 5.693569090792972e-07,
"loss": 0.1091,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0915570929646492,
"step": 3835,
"valid_targets_mean": 2957.2,
"valid_targets_min": 1249
},
{
"epoch": 6.530612244897959,
"grad_norm": 0.5444838195618228,
"learning_rate": 5.494380767078822e-07,
"loss": 0.1113,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10774494707584381,
"step": 3840,
"valid_targets_mean": 3686.2,
"valid_targets_min": 2165
},
{
"epoch": 6.539115646258503,
"grad_norm": 0.5054912271298077,
"learning_rate": 5.298690519838823e-07,
"loss": 0.105,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0980135053396225,
"step": 3845,
"valid_targets_mean": 3616.6,
"valid_targets_min": 1167
},
{
"epoch": 6.5476190476190474,
"grad_norm": 0.5753976388948479,
"learning_rate": 5.106501868454317e-07,
"loss": 0.1032,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10707738250494003,
"step": 3850,
"valid_targets_mean": 3197.4,
"valid_targets_min": 1349
},
{
"epoch": 6.5561224489795915,
"grad_norm": 0.5292969551823501,
"learning_rate": 4.917818269332442e-07,
"loss": 0.1063,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10826131701469421,
"step": 3855,
"valid_targets_mean": 4322.6,
"valid_targets_min": 1402
},
{
"epoch": 6.564625850340136,
"grad_norm": 0.621615696636191,
"learning_rate": 4.7326431158437826e-07,
"loss": 0.1068,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10695119947195053,
"step": 3860,
"valid_targets_mean": 3007.0,
"valid_targets_min": 1378
},
{
"epoch": 6.5731292517006805,
"grad_norm": 0.509107661703464,
"learning_rate": 4.5509797382615517e-07,
"loss": 0.1015,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09450152516365051,
"step": 3865,
"valid_targets_mean": 3882.9,
"valid_targets_min": 1878
},
{
"epoch": 6.581632653061225,
"grad_norm": 0.5313107105149394,
"learning_rate": 4.372831403701572e-07,
"loss": 0.1039,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.094798743724823,
"step": 3870,
"valid_targets_mean": 3878.6,
"valid_targets_min": 1342
},
{
"epoch": 6.590136054421769,
"grad_norm": 0.4871663184954264,
"learning_rate": 4.198201316063566e-07,
"loss": 0.1107,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11148764193058014,
"step": 3875,
"valid_targets_mean": 4325.2,
"valid_targets_min": 1662
},
{
"epoch": 6.598639455782313,
"grad_norm": 0.579299905341723,
"learning_rate": 4.02709261597356e-07,
"loss": 0.1124,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09807397425174713,
"step": 3880,
"valid_targets_mean": 3303.0,
"valid_targets_min": 1271
},
{
"epoch": 6.607142857142857,
"grad_norm": 0.5720297842675975,
"learning_rate": 3.8595083807272393e-07,
"loss": 0.1261,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09346231073141098,
"step": 3885,
"valid_targets_mean": 3077.5,
"valid_targets_min": 1364
},
{
"epoch": 6.615646258503402,
"grad_norm": 0.5158229677829215,
"learning_rate": 3.695451624234836e-07,
"loss": 0.1048,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11520027369260788,
"step": 3890,
"valid_targets_mean": 4364.4,
"valid_targets_min": 1833
},
{
"epoch": 6.624149659863946,
"grad_norm": 0.5571817676018703,
"learning_rate": 3.5349252969667956e-07,
"loss": 0.1181,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11287274956703186,
"step": 3895,
"valid_targets_mean": 3659.2,
"valid_targets_min": 1374
},
{
"epoch": 6.63265306122449,
"grad_norm": 0.5405013862537791,
"learning_rate": 3.3779322859007536e-07,
"loss": 0.1207,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13448761403560638,
"step": 3900,
"valid_targets_mean": 3958.9,
"valid_targets_min": 1882
},
{
"epoch": 6.641156462585034,
"grad_norm": 0.5917561818550695,
"learning_rate": 3.224475414469552e-07,
"loss": 0.1351,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12737716734409332,
"step": 3905,
"valid_targets_mean": 4113.4,
"valid_targets_min": 1245
},
{
"epoch": 6.649659863945578,
"grad_norm": 0.557946447045777,
"learning_rate": 3.0745574425105505e-07,
"loss": 0.1207,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10673606395721436,
"step": 3910,
"valid_targets_mean": 4236.9,
"valid_targets_min": 1210
},
{
"epoch": 6.658163265306122,
"grad_norm": 0.5164919683603588,
"learning_rate": 2.928181066215929e-07,
"loss": 0.1101,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11876433342695236,
"step": 3915,
"valid_targets_mean": 4077.7,
"valid_targets_min": 940
},
{
"epoch": 6.666666666666667,
"grad_norm": 0.5499308726469657,
"learning_rate": 2.785348918084241e-07,
"loss": 0.132,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1489306092262268,
"step": 3920,
"valid_targets_mean": 3865.4,
"valid_targets_min": 1396
},
{
"epoch": 6.675170068027211,
"grad_norm": 0.5678142167877335,
"learning_rate": 2.6460635668730027e-07,
"loss": 0.1021,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09267286211252213,
"step": 3925,
"valid_targets_mean": 2827.5,
"valid_targets_min": 345
},
{
"epoch": 6.683673469387755,
"grad_norm": 0.6608311371489237,
"learning_rate": 2.5103275175526023e-07,
"loss": 0.1155,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14703533053398132,
"step": 3930,
"valid_targets_mean": 3164.3,
"valid_targets_min": 1164
},
{
"epoch": 6.692176870748299,
"grad_norm": 0.5221678778571415,
"learning_rate": 2.3781432112611303e-07,
"loss": 0.1097,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10101592540740967,
"step": 3935,
"valid_targets_mean": 3994.5,
"valid_targets_min": 1762
},
{
"epoch": 6.700680272108843,
"grad_norm": 0.5651651379644324,
"learning_rate": 2.2495130252605746e-07,
"loss": 0.1181,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11423544585704803,
"step": 3940,
"valid_targets_mean": 4024.6,
"valid_targets_min": 1439
},
{
"epoch": 6.709183673469388,
"grad_norm": 0.5199949463759391,
"learning_rate": 2.1244392728939857e-07,
"loss": 0.1187,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10502418875694275,
"step": 3945,
"valid_targets_mean": 3820.6,
"valid_targets_min": 1377
},
{
"epoch": 6.717687074829932,
"grad_norm": 0.583526962887543,
"learning_rate": 2.0029242035439768e-07,
"loss": 0.1312,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14046607911586761,
"step": 3950,
"valid_targets_mean": 3444.8,
"valid_targets_min": 1483
},
{
"epoch": 6.726190476190476,
"grad_norm": 0.5810830942373014,
"learning_rate": 1.8849700025921347e-07,
"loss": 0.1007,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10181055963039398,
"step": 3955,
"valid_targets_mean": 3560.2,
"valid_targets_min": 1243
},
{
"epoch": 6.73469387755102,
"grad_norm": 0.5491006914828277,
"learning_rate": 1.7705787913798734e-07,
"loss": 0.1117,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09634849429130554,
"step": 3960,
"valid_targets_mean": 3517.1,
"valid_targets_min": 1240
},
{
"epoch": 6.743197278911564,
"grad_norm": 0.511896203300437,
"learning_rate": 1.659752627170086e-07,
"loss": 0.1096,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10449256002902985,
"step": 3965,
"valid_targets_mean": 3527.1,
"valid_targets_min": 1141
},
{
"epoch": 6.7517006802721085,
"grad_norm": 0.5336137499248547,
"learning_rate": 1.5524935031103305e-07,
"loss": 0.116,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12154018133878708,
"step": 3970,
"valid_targets_mean": 3592.3,
"valid_targets_min": 1241
},
{
"epoch": 6.760204081632653,
"grad_norm": 0.5627708148417632,
"learning_rate": 1.4488033481969478e-07,
"loss": 0.1055,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09863865375518799,
"step": 3975,
"valid_targets_mean": 3483.6,
"valid_targets_min": 826
},
{
"epoch": 6.7687074829931975,
"grad_norm": 0.5196827469634108,
"learning_rate": 1.3486840272402213e-07,
"loss": 0.1212,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10619688779115677,
"step": 3980,
"valid_targets_mean": 3646.9,
"valid_targets_min": 1196
},
{
"epoch": 6.7772108843537415,
"grad_norm": 0.5718874037000535,
"learning_rate": 1.252137340831072e-07,
"loss": 0.1082,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1136164665222168,
"step": 3985,
"valid_targets_mean": 3522.7,
"valid_targets_min": 1267
},
{
"epoch": 6.785714285714286,
"grad_norm": 0.5816806292415059,
"learning_rate": 1.1591650253084619e-07,
"loss": 0.1044,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11231759190559387,
"step": 3990,
"valid_targets_mean": 3649.8,
"valid_targets_min": 1956
},
{
"epoch": 6.79421768707483,
"grad_norm": 0.5720471677766351,
"learning_rate": 1.0697687527283062e-07,
"loss": 0.1218,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08975514769554138,
"step": 3995,
"valid_targets_mean": 2904.6,
"valid_targets_min": 1441
},
{
"epoch": 6.802721088435375,
"grad_norm": 0.5465150224292055,
"learning_rate": 9.839501308333666e-08,
"loss": 0.1239,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12105758488178253,
"step": 4000,
"valid_targets_mean": 3943.8,
"valid_targets_min": 1551
},
{
"epoch": 6.811224489795919,
"grad_norm": 0.5775321617047376,
"learning_rate": 9.017107030242944e-08,
"loss": 0.1075,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10549725592136383,
"step": 4005,
"valid_targets_mean": 3177.4,
"valid_targets_min": 870
},
{
"epoch": 6.819727891156463,
"grad_norm": 0.5675733876780689,
"learning_rate": 8.230519483319211e-08,
"loss": 0.1166,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10369785130023956,
"step": 4010,
"valid_targets_mean": 3497.2,
"valid_targets_min": 1801
},
{
"epoch": 6.828231292517007,
"grad_norm": 0.5774913215786752,
"learning_rate": 7.479752813906338e-08,
"loss": 0.113,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12983883917331696,
"step": 4015,
"valid_targets_mean": 3454.6,
"valid_targets_min": 724
},
{
"epoch": 6.836734693877551,
"grad_norm": 0.5837816943629295,
"learning_rate": 6.764820524129745e-08,
"loss": 0.1131,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11133235692977905,
"step": 4020,
"valid_targets_mean": 3369.7,
"valid_targets_min": 1349
},
{
"epoch": 6.845238095238095,
"grad_norm": 0.5189943403965727,
"learning_rate": 6.085735471653032e-08,
"loss": 0.0981,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08331690728664398,
"step": 4025,
"valid_targets_mean": 3523.8,
"valid_targets_min": 1276
},
{
"epoch": 6.853741496598639,
"grad_norm": 0.5419837374263143,
"learning_rate": 5.442509869446833e-08,
"loss": 0.101,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11506151407957077,
"step": 4030,
"valid_targets_mean": 3857.5,
"valid_targets_min": 1666
},
{
"epoch": 6.862244897959184,
"grad_norm": 0.5684055839237468,
"learning_rate": 4.835155285569659e-08,
"loss": 0.1164,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09615157544612885,
"step": 4035,
"valid_targets_mean": 3268.4,
"valid_targets_min": 1424
},
{
"epoch": 6.870748299319728,
"grad_norm": 0.5365731291138811,
"learning_rate": 4.263682642959177e-08,
"loss": 0.1133,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10993782430887222,
"step": 4040,
"valid_targets_mean": 3738.6,
"valid_targets_min": 1367
},
{
"epoch": 6.879251700680272,
"grad_norm": 0.5476111470480821,
"learning_rate": 3.72810221923614e-08,
"loss": 0.1056,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09571518003940582,
"step": 4045,
"valid_targets_mean": 3979.3,
"valid_targets_min": 1498
},
{
"epoch": 6.887755102040816,
"grad_norm": 0.48869823313324573,
"learning_rate": 3.228423646519652e-08,
"loss": 0.1055,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10207545012235641,
"step": 4050,
"valid_targets_mean": 4221.0,
"valid_targets_min": 1183
},
{
"epoch": 6.896258503401361,
"grad_norm": 0.5769761101009117,
"learning_rate": 2.764655911253744e-08,
"loss": 0.1055,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10221989452838898,
"step": 4055,
"valid_targets_mean": 3082.2,
"valid_targets_min": 1526
},
{
"epoch": 6.904761904761905,
"grad_norm": 0.5304203511947876,
"learning_rate": 2.3368073540461778e-08,
"loss": 0.1093,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10058721154928207,
"step": 4060,
"valid_targets_mean": 3711.4,
"valid_targets_min": 1177
},
{
"epoch": 6.913265306122449,
"grad_norm": 0.5527928596168906,
"learning_rate": 1.944885669517005e-08,
"loss": 0.1197,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13187864422798157,
"step": 4065,
"valid_targets_mean": 3627.0,
"valid_targets_min": 1362
},
{
"epoch": 6.921768707482993,
"grad_norm": 0.5876230043161286,
"learning_rate": 1.5888979061624566e-08,
"loss": 0.1124,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11860952526330948,
"step": 4070,
"valid_targets_mean": 2997.6,
"valid_targets_min": 626
},
{
"epoch": 6.930272108843537,
"grad_norm": 0.5180428031623431,
"learning_rate": 1.268850466226379e-08,
"loss": 0.1041,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09902661293745041,
"step": 4075,
"valid_targets_mean": 3874.1,
"valid_targets_min": 1468
},
{
"epoch": 6.938775510204081,
"grad_norm": 0.5457182235510927,
"learning_rate": 9.847491055856583e-09,
"loss": 0.1179,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11753236502408981,
"step": 4080,
"valid_targets_mean": 3958.4,
"valid_targets_min": 1682
},
{
"epoch": 6.947278911564625,
"grad_norm": 0.5025326829506257,
"learning_rate": 7.365989336469704e-09,
"loss": 0.1135,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1078265979886055,
"step": 4085,
"valid_targets_mean": 4657.9,
"valid_targets_min": 1975
},
{
"epoch": 6.95578231292517,
"grad_norm": 0.47189441731529835,
"learning_rate": 5.244044132544091e-09,
"loss": 0.1099,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09616608917713165,
"step": 4090,
"valid_targets_mean": 4282.3,
"valid_targets_min": 2271
},
{
"epoch": 6.964285714285714,
"grad_norm": 0.5099985972571627,
"learning_rate": 3.481693606095515e-09,
"loss": 0.1205,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11529235541820526,
"step": 4095,
"valid_targets_mean": 4522.9,
"valid_targets_min": 1137
},
{
"epoch": 6.9727891156462585,
"grad_norm": 0.6013770623754892,
"learning_rate": 2.078969452030677e-09,
"loss": 0.1054,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11263397336006165,
"step": 4100,
"valid_targets_mean": 3301.1,
"valid_targets_min": 305
},
{
"epoch": 6.9812925170068025,
"grad_norm": 0.5717510938365082,
"learning_rate": 1.0358968975676675e-09,
"loss": 0.111,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10689924657344818,
"step": 4105,
"valid_targets_mean": 3414.9,
"valid_targets_min": 1270
},
{
"epoch": 6.989795918367347,
"grad_norm": 0.4870239489699717,
"learning_rate": 3.524947017941038e-10,
"loss": 0.1024,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1097535490989685,
"step": 4110,
"valid_targets_mean": 5220.9,
"valid_targets_min": 1480
},
{
"epoch": 6.9982993197278915,
"grad_norm": 0.638306218851505,
"learning_rate": 2.8775155322957604e-11,
"loss": 0.1074,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12985992431640625,
"step": 4115,
"valid_targets_mean": 2803.8,
"valid_targets_min": 861
},
{
"epoch": 7.0,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10281726717948914,
"step": 4116,
"total_flos": 1032895789924352.0,
"train_loss": 0.16274532378516346,
"train_runtime": 18062.791,
"train_samples_per_second": 3.643,
"train_steps_per_second": 0.228,
"valid_targets_mean": 3705.9,
"valid_targets_min": 1332
}
],
"logging_steps": 5,
"max_steps": 4116,
"num_input_tokens_seen": 0,
"num_train_epochs": 7,
"save_steps": 1500,
"stateful_callbacks": {
"TrainerControl": {
"args": {
"should_epoch_stop": false,
"should_evaluate": false,
"should_log": false,
"should_save": true,
"should_training_stop": true
},
"attributes": {}
}
},
"total_flos": 1032895789924352.0,
"train_batch_size": 1,
"trial_name": null,
"trial_params": null
}