{ "best_global_step": null, "best_metric": null, "best_model_checkpoint": null, "epoch": 7.0, "eval_steps": 500, "global_step": 4116, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.008503401360544218, "grad_norm": 16.284088332723297, "learning_rate": 3.883495145631068e-07, "loss": 0.7008, "loss_nan_ranks": 0, "loss_rank_avg": 0.6880989074707031, "step": 5, "valid_targets_mean": 3394.2, "valid_targets_min": 1520 }, { "epoch": 0.017006802721088437, "grad_norm": 14.839739819166988, "learning_rate": 8.737864077669904e-07, "loss": 0.6754, "loss_nan_ranks": 0, "loss_rank_avg": 0.6068336367607117, "step": 10, "valid_targets_mean": 3490.3, "valid_targets_min": 1012 }, { "epoch": 0.025510204081632654, "grad_norm": 13.952466669607169, "learning_rate": 1.359223300970874e-06, "loss": 0.6342, "loss_nan_ranks": 0, "loss_rank_avg": 0.6203460693359375, "step": 15, "valid_targets_mean": 3233.2, "valid_targets_min": 1535 }, { "epoch": 0.034013605442176874, "grad_norm": 12.6446610614783, "learning_rate": 1.8446601941747574e-06, "loss": 0.6454, "loss_nan_ranks": 0, "loss_rank_avg": 0.6516385674476624, "step": 20, "valid_targets_mean": 3449.2, "valid_targets_min": 1103 }, { "epoch": 0.04251700680272109, "grad_norm": 8.19224953585781, "learning_rate": 2.330097087378641e-06, "loss": 0.5636, "loss_nan_ranks": 0, "loss_rank_avg": 0.5059263110160828, "step": 25, "valid_targets_mean": 3176.9, "valid_targets_min": 1296 }, { "epoch": 0.05102040816326531, "grad_norm": 5.247631542695172, "learning_rate": 2.8155339805825245e-06, "loss": 0.5175, "loss_nan_ranks": 0, "loss_rank_avg": 0.4891727566719055, "step": 30, "valid_targets_mean": 3418.7, "valid_targets_min": 1376 }, { "epoch": 0.05952380952380952, "grad_norm": 3.1552727841621153, "learning_rate": 3.300970873786408e-06, "loss": 0.4638, "loss_nan_ranks": 0, "loss_rank_avg": 0.4893268942832947, "step": 35, "valid_targets_mean": 3089.0, "valid_targets_min": 1058 }, { "epoch": 0.06802721088435375, "grad_norm": 1.6068476825700668, "learning_rate": 3.7864077669902915e-06, "loss": 0.4355, "loss_nan_ranks": 0, "loss_rank_avg": 0.4086935222148895, "step": 40, "valid_targets_mean": 4035.6, "valid_targets_min": 1506 }, { "epoch": 0.07653061224489796, "grad_norm": 1.2002679568552468, "learning_rate": 4.271844660194175e-06, "loss": 0.3964, "loss_nan_ranks": 0, "loss_rank_avg": 0.403389573097229, "step": 45, "valid_targets_mean": 3934.1, "valid_targets_min": 1328 }, { "epoch": 0.08503401360544217, "grad_norm": 0.9667513884903771, "learning_rate": 4.7572815533980585e-06, "loss": 0.3921, "loss_nan_ranks": 0, "loss_rank_avg": 0.39787787199020386, "step": 50, "valid_targets_mean": 4216.1, "valid_targets_min": 1416 }, { "epoch": 0.0935374149659864, "grad_norm": 0.8925696727275947, "learning_rate": 5.242718446601942e-06, "loss": 0.3858, "loss_nan_ranks": 0, "loss_rank_avg": 0.46847638487815857, "step": 55, "valid_targets_mean": 4303.9, "valid_targets_min": 1352 }, { "epoch": 0.10204081632653061, "grad_norm": 0.8357941987187405, "learning_rate": 5.728155339805825e-06, "loss": 0.3561, "loss_nan_ranks": 0, "loss_rank_avg": 0.3789106011390686, "step": 60, "valid_targets_mean": 3574.6, "valid_targets_min": 1645 }, { "epoch": 0.11054421768707483, "grad_norm": 0.7397059160537327, "learning_rate": 6.213592233009709e-06, "loss": 0.3645, "loss_nan_ranks": 0, "loss_rank_avg": 0.42246219515800476, "step": 65, "valid_targets_mean": 3720.4, "valid_targets_min": 1078 }, { "epoch": 0.11904761904761904, "grad_norm": 1.126422671830154, "learning_rate": 6.6990291262135935e-06, "loss": 0.3923, "loss_nan_ranks": 0, "loss_rank_avg": 0.3333202600479126, "step": 70, "valid_targets_mean": 3193.3, "valid_targets_min": 1204 }, { "epoch": 0.12755102040816327, "grad_norm": 0.632940371104463, "learning_rate": 7.184466019417476e-06, "loss": 0.3502, "loss_nan_ranks": 0, "loss_rank_avg": 0.33268964290618896, "step": 75, "valid_targets_mean": 3355.2, "valid_targets_min": 1090 }, { "epoch": 0.1360544217687075, "grad_norm": 0.6098061945319946, "learning_rate": 7.66990291262136e-06, "loss": 0.3143, "loss_nan_ranks": 0, "loss_rank_avg": 0.3157602846622467, "step": 80, "valid_targets_mean": 3896.2, "valid_targets_min": 1676 }, { "epoch": 0.1445578231292517, "grad_norm": 0.6247199509119066, "learning_rate": 8.155339805825243e-06, "loss": 0.3412, "loss_nan_ranks": 0, "loss_rank_avg": 0.38960957527160645, "step": 85, "valid_targets_mean": 3736.6, "valid_targets_min": 793 }, { "epoch": 0.15306122448979592, "grad_norm": 0.7385270073420317, "learning_rate": 8.640776699029127e-06, "loss": 0.3213, "loss_nan_ranks": 0, "loss_rank_avg": 0.33316653966903687, "step": 90, "valid_targets_mean": 2948.8, "valid_targets_min": 1070 }, { "epoch": 0.16156462585034015, "grad_norm": 0.492100707949269, "learning_rate": 9.12621359223301e-06, "loss": 0.3177, "loss_nan_ranks": 0, "loss_rank_avg": 0.2514708340167999, "step": 95, "valid_targets_mean": 4425.4, "valid_targets_min": 1240 }, { "epoch": 0.17006802721088435, "grad_norm": 0.5951003547593199, "learning_rate": 9.611650485436894e-06, "loss": 0.3373, "loss_nan_ranks": 0, "loss_rank_avg": 0.2692122757434845, "step": 100, "valid_targets_mean": 2710.9, "valid_targets_min": 1322 }, { "epoch": 0.17857142857142858, "grad_norm": 0.7613709438724316, "learning_rate": 1.0097087378640778e-05, "loss": 0.3134, "loss_nan_ranks": 0, "loss_rank_avg": 0.38309434056282043, "step": 105, "valid_targets_mean": 3319.0, "valid_targets_min": 1125 }, { "epoch": 0.1870748299319728, "grad_norm": 0.5914325453792764, "learning_rate": 1.0582524271844662e-05, "loss": 0.2831, "loss_nan_ranks": 0, "loss_rank_avg": 0.25947824120521545, "step": 110, "valid_targets_mean": 2820.6, "valid_targets_min": 690 }, { "epoch": 0.195578231292517, "grad_norm": 0.6002580182988407, "learning_rate": 1.1067961165048544e-05, "loss": 0.3157, "loss_nan_ranks": 0, "loss_rank_avg": 0.35196587443351746, "step": 115, "valid_targets_mean": 3586.2, "valid_targets_min": 668 }, { "epoch": 0.20408163265306123, "grad_norm": 0.5372570805761464, "learning_rate": 1.1553398058252427e-05, "loss": 0.2864, "loss_nan_ranks": 0, "loss_rank_avg": 0.28968310356140137, "step": 120, "valid_targets_mean": 4067.5, "valid_targets_min": 1436 }, { "epoch": 0.21258503401360543, "grad_norm": 0.5237896767254485, "learning_rate": 1.2038834951456311e-05, "loss": 0.3084, "loss_nan_ranks": 0, "loss_rank_avg": 0.32339826226234436, "step": 125, "valid_targets_mean": 4317.6, "valid_targets_min": 1065 }, { "epoch": 0.22108843537414966, "grad_norm": 0.5670068619189014, "learning_rate": 1.2524271844660197e-05, "loss": 0.3131, "loss_nan_ranks": 0, "loss_rank_avg": 0.3546511232852936, "step": 130, "valid_targets_mean": 3980.6, "valid_targets_min": 758 }, { "epoch": 0.22959183673469388, "grad_norm": 0.5255698995362615, "learning_rate": 1.300970873786408e-05, "loss": 0.2865, "loss_nan_ranks": 0, "loss_rank_avg": 0.28089749813079834, "step": 135, "valid_targets_mean": 4137.8, "valid_targets_min": 804 }, { "epoch": 0.23809523809523808, "grad_norm": 0.5595742490638705, "learning_rate": 1.3495145631067962e-05, "loss": 0.2783, "loss_nan_ranks": 0, "loss_rank_avg": 0.267475962638855, "step": 140, "valid_targets_mean": 3784.4, "valid_targets_min": 1328 }, { "epoch": 0.2465986394557823, "grad_norm": 0.588682917285768, "learning_rate": 1.3980582524271846e-05, "loss": 0.2872, "loss_nan_ranks": 0, "loss_rank_avg": 0.28826704621315, "step": 145, "valid_targets_mean": 3321.7, "valid_targets_min": 1237 }, { "epoch": 0.25510204081632654, "grad_norm": 0.6379265355221891, "learning_rate": 1.446601941747573e-05, "loss": 0.2927, "loss_nan_ranks": 0, "loss_rank_avg": 0.3119679093360901, "step": 150, "valid_targets_mean": 3228.9, "valid_targets_min": 1314 }, { "epoch": 0.26360544217687076, "grad_norm": 1.1311868788928263, "learning_rate": 1.4951456310679614e-05, "loss": 0.2733, "loss_nan_ranks": 0, "loss_rank_avg": 0.28038668632507324, "step": 155, "valid_targets_mean": 3130.2, "valid_targets_min": 1197 }, { "epoch": 0.272108843537415, "grad_norm": 0.5961390202565682, "learning_rate": 1.5436893203883496e-05, "loss": 0.2739, "loss_nan_ranks": 0, "loss_rank_avg": 0.23698543012142181, "step": 160, "valid_targets_mean": 3128.9, "valid_targets_min": 1230 }, { "epoch": 0.28061224489795916, "grad_norm": 0.748114955090481, "learning_rate": 1.592233009708738e-05, "loss": 0.2787, "loss_nan_ranks": 0, "loss_rank_avg": 0.2971285581588745, "step": 165, "valid_targets_mean": 3631.0, "valid_targets_min": 1322 }, { "epoch": 0.2891156462585034, "grad_norm": 0.5913012294912496, "learning_rate": 1.6407766990291263e-05, "loss": 0.267, "loss_nan_ranks": 0, "loss_rank_avg": 0.2528142035007477, "step": 170, "valid_targets_mean": 3472.6, "valid_targets_min": 1044 }, { "epoch": 0.2976190476190476, "grad_norm": 0.6335415710139134, "learning_rate": 1.6893203883495145e-05, "loss": 0.2912, "loss_nan_ranks": 0, "loss_rank_avg": 0.3000209629535675, "step": 175, "valid_targets_mean": 3211.1, "valid_targets_min": 951 }, { "epoch": 0.30612244897959184, "grad_norm": 0.5716361790983413, "learning_rate": 1.737864077669903e-05, "loss": 0.2688, "loss_nan_ranks": 0, "loss_rank_avg": 0.25265321135520935, "step": 180, "valid_targets_mean": 3723.9, "valid_targets_min": 1553 }, { "epoch": 0.31462585034013607, "grad_norm": 0.5461651660212551, "learning_rate": 1.7864077669902916e-05, "loss": 0.2591, "loss_nan_ranks": 0, "loss_rank_avg": 0.22830471396446228, "step": 185, "valid_targets_mean": 3600.1, "valid_targets_min": 277 }, { "epoch": 0.3231292517006803, "grad_norm": 0.6266878783879113, "learning_rate": 1.8349514563106798e-05, "loss": 0.2765, "loss_nan_ranks": 0, "loss_rank_avg": 0.27608734369277954, "step": 190, "valid_targets_mean": 3576.2, "valid_targets_min": 1838 }, { "epoch": 0.33163265306122447, "grad_norm": 0.6262564074677799, "learning_rate": 1.883495145631068e-05, "loss": 0.2895, "loss_nan_ranks": 0, "loss_rank_avg": 0.33075207471847534, "step": 195, "valid_targets_mean": 3644.2, "valid_targets_min": 1408 }, { "epoch": 0.3401360544217687, "grad_norm": 0.6222343963607243, "learning_rate": 1.9320388349514565e-05, "loss": 0.2896, "loss_nan_ranks": 0, "loss_rank_avg": 0.28491562604904175, "step": 200, "valid_targets_mean": 3473.6, "valid_targets_min": 1591 }, { "epoch": 0.3486394557823129, "grad_norm": 0.5692531688349544, "learning_rate": 1.9805825242718447e-05, "loss": 0.2575, "loss_nan_ranks": 0, "loss_rank_avg": 0.2638142704963684, "step": 205, "valid_targets_mean": 4383.2, "valid_targets_min": 1505 }, { "epoch": 0.35714285714285715, "grad_norm": 0.6016824349437719, "learning_rate": 2.0291262135922333e-05, "loss": 0.2622, "loss_nan_ranks": 0, "loss_rank_avg": 0.2720300257205963, "step": 210, "valid_targets_mean": 3857.2, "valid_targets_min": 1115 }, { "epoch": 0.3656462585034014, "grad_norm": 0.5660323710291796, "learning_rate": 2.0776699029126215e-05, "loss": 0.2289, "loss_nan_ranks": 0, "loss_rank_avg": 0.20892475545406342, "step": 215, "valid_targets_mean": 3352.7, "valid_targets_min": 1090 }, { "epoch": 0.3741496598639456, "grad_norm": 0.5397652134256967, "learning_rate": 2.1262135922330097e-05, "loss": 0.2622, "loss_nan_ranks": 0, "loss_rank_avg": 0.2417203038930893, "step": 220, "valid_targets_mean": 3862.2, "valid_targets_min": 1166 }, { "epoch": 0.3826530612244898, "grad_norm": 0.9020207934335027, "learning_rate": 2.1747572815533982e-05, "loss": 0.2535, "loss_nan_ranks": 0, "loss_rank_avg": 0.2550874948501587, "step": 225, "valid_targets_mean": 4108.3, "valid_targets_min": 1093 }, { "epoch": 0.391156462585034, "grad_norm": 0.5496806077798531, "learning_rate": 2.2233009708737864e-05, "loss": 0.2535, "loss_nan_ranks": 0, "loss_rank_avg": 0.2542770206928253, "step": 230, "valid_targets_mean": 3857.4, "valid_targets_min": 1737 }, { "epoch": 0.39965986394557823, "grad_norm": 0.5786260227985688, "learning_rate": 2.271844660194175e-05, "loss": 0.249, "loss_nan_ranks": 0, "loss_rank_avg": 0.23735564947128296, "step": 235, "valid_targets_mean": 3291.6, "valid_targets_min": 1552 }, { "epoch": 0.40816326530612246, "grad_norm": 0.624916105565735, "learning_rate": 2.3203883495145632e-05, "loss": 0.2673, "loss_nan_ranks": 0, "loss_rank_avg": 0.25283026695251465, "step": 240, "valid_targets_mean": 3140.6, "valid_targets_min": 1101 }, { "epoch": 0.4166666666666667, "grad_norm": 0.6230467099115211, "learning_rate": 2.3689320388349514e-05, "loss": 0.2554, "loss_nan_ranks": 0, "loss_rank_avg": 0.23698002099990845, "step": 245, "valid_targets_mean": 3379.9, "valid_targets_min": 868 }, { "epoch": 0.42517006802721086, "grad_norm": 0.5654277458214261, "learning_rate": 2.41747572815534e-05, "loss": 0.2563, "loss_nan_ranks": 0, "loss_rank_avg": 0.25777631998062134, "step": 250, "valid_targets_mean": 4212.4, "valid_targets_min": 1376 }, { "epoch": 0.4336734693877551, "grad_norm": 0.845325859827072, "learning_rate": 2.466019417475728e-05, "loss": 0.2738, "loss_nan_ranks": 0, "loss_rank_avg": 0.28165894746780396, "step": 255, "valid_targets_mean": 3721.9, "valid_targets_min": 1469 }, { "epoch": 0.4421768707482993, "grad_norm": 0.5477155296016747, "learning_rate": 2.514563106796117e-05, "loss": 0.2401, "loss_nan_ranks": 0, "loss_rank_avg": 0.22638031840324402, "step": 260, "valid_targets_mean": 3850.2, "valid_targets_min": 1020 }, { "epoch": 0.45068027210884354, "grad_norm": 0.590971583313143, "learning_rate": 2.5631067961165052e-05, "loss": 0.2419, "loss_nan_ranks": 0, "loss_rank_avg": 0.25587913393974304, "step": 265, "valid_targets_mean": 3664.8, "valid_targets_min": 1193 }, { "epoch": 0.45918367346938777, "grad_norm": 0.7112768961498113, "learning_rate": 2.6116504854368934e-05, "loss": 0.2481, "loss_nan_ranks": 0, "loss_rank_avg": 0.2385358214378357, "step": 270, "valid_targets_mean": 3111.2, "valid_targets_min": 738 }, { "epoch": 0.467687074829932, "grad_norm": 0.5301764242793776, "learning_rate": 2.660194174757282e-05, "loss": 0.2667, "loss_nan_ranks": 0, "loss_rank_avg": 0.267933189868927, "step": 275, "valid_targets_mean": 4447.9, "valid_targets_min": 1926 }, { "epoch": 0.47619047619047616, "grad_norm": 0.5551111127425339, "learning_rate": 2.7087378640776702e-05, "loss": 0.2395, "loss_nan_ranks": 0, "loss_rank_avg": 0.21886155009269714, "step": 280, "valid_targets_mean": 3772.6, "valid_targets_min": 1751 }, { "epoch": 0.4846938775510204, "grad_norm": 0.5167918851842331, "learning_rate": 2.7572815533980587e-05, "loss": 0.2642, "loss_nan_ranks": 0, "loss_rank_avg": 0.27086275815963745, "step": 285, "valid_targets_mean": 4184.1, "valid_targets_min": 1025 }, { "epoch": 0.4931972789115646, "grad_norm": 0.7009839725364524, "learning_rate": 2.805825242718447e-05, "loss": 0.2415, "loss_nan_ranks": 0, "loss_rank_avg": 0.23540431261062622, "step": 290, "valid_targets_mean": 3462.0, "valid_targets_min": 1618 }, { "epoch": 0.5017006802721088, "grad_norm": 0.6603793288831256, "learning_rate": 2.854368932038835e-05, "loss": 0.2556, "loss_nan_ranks": 0, "loss_rank_avg": 0.22473765909671783, "step": 295, "valid_targets_mean": 2997.2, "valid_targets_min": 1662 }, { "epoch": 0.5102040816326531, "grad_norm": 0.5472173526564987, "learning_rate": 2.9029126213592237e-05, "loss": 0.2277, "loss_nan_ranks": 0, "loss_rank_avg": 0.2626279294490814, "step": 300, "valid_targets_mean": 4095.4, "valid_targets_min": 1374 }, { "epoch": 0.5187074829931972, "grad_norm": 0.583901679673355, "learning_rate": 2.951456310679612e-05, "loss": 0.2396, "loss_nan_ranks": 0, "loss_rank_avg": 0.25624722242355347, "step": 305, "valid_targets_mean": 3267.6, "valid_targets_min": 1342 }, { "epoch": 0.5272108843537415, "grad_norm": 0.5974779827455141, "learning_rate": 3.0000000000000004e-05, "loss": 0.2447, "loss_nan_ranks": 0, "loss_rank_avg": 0.29399585723876953, "step": 310, "valid_targets_mean": 3656.5, "valid_targets_min": 1623 }, { "epoch": 0.5357142857142857, "grad_norm": 0.5848328720235239, "learning_rate": 3.0485436893203886e-05, "loss": 0.2321, "loss_nan_ranks": 0, "loss_rank_avg": 0.22116899490356445, "step": 315, "valid_targets_mean": 3654.2, "valid_targets_min": 1822 }, { "epoch": 0.54421768707483, "grad_norm": 0.5219255102519595, "learning_rate": 3.097087378640777e-05, "loss": 0.2471, "loss_nan_ranks": 0, "loss_rank_avg": 0.269960880279541, "step": 320, "valid_targets_mean": 4145.9, "valid_targets_min": 1355 }, { "epoch": 0.5527210884353742, "grad_norm": 0.5503971512937593, "learning_rate": 3.1456310679611654e-05, "loss": 0.216, "loss_nan_ranks": 0, "loss_rank_avg": 0.24401246011257172, "step": 325, "valid_targets_mean": 4419.8, "valid_targets_min": 1234 }, { "epoch": 0.5612244897959183, "grad_norm": 0.5701637940871919, "learning_rate": 3.194174757281554e-05, "loss": 0.2373, "loss_nan_ranks": 0, "loss_rank_avg": 0.21285384893417358, "step": 330, "valid_targets_mean": 3603.2, "valid_targets_min": 1061 }, { "epoch": 0.5697278911564626, "grad_norm": 0.616506008664278, "learning_rate": 3.242718446601942e-05, "loss": 0.2503, "loss_nan_ranks": 0, "loss_rank_avg": 0.27921557426452637, "step": 335, "valid_targets_mean": 3437.5, "valid_targets_min": 1340 }, { "epoch": 0.5782312925170068, "grad_norm": 0.6116541556683032, "learning_rate": 3.29126213592233e-05, "loss": 0.2414, "loss_nan_ranks": 0, "loss_rank_avg": 0.24892035126686096, "step": 340, "valid_targets_mean": 3190.8, "valid_targets_min": 1245 }, { "epoch": 0.5867346938775511, "grad_norm": 0.5147623109762519, "learning_rate": 3.339805825242719e-05, "loss": 0.2365, "loss_nan_ranks": 0, "loss_rank_avg": 0.2467966079711914, "step": 345, "valid_targets_mean": 4105.7, "valid_targets_min": 2111 }, { "epoch": 0.5952380952380952, "grad_norm": 0.5560814376438035, "learning_rate": 3.388349514563107e-05, "loss": 0.2548, "loss_nan_ranks": 0, "loss_rank_avg": 0.26886463165283203, "step": 350, "valid_targets_mean": 3899.1, "valid_targets_min": 792 }, { "epoch": 0.6037414965986394, "grad_norm": 0.5999655031743574, "learning_rate": 3.436893203883495e-05, "loss": 0.2874, "loss_nan_ranks": 0, "loss_rank_avg": 0.39038926362991333, "step": 355, "valid_targets_mean": 4675.1, "valid_targets_min": 1261 }, { "epoch": 0.6122448979591837, "grad_norm": 0.5430030557117063, "learning_rate": 3.485436893203884e-05, "loss": 0.2428, "loss_nan_ranks": 0, "loss_rank_avg": 0.2600330114364624, "step": 360, "valid_targets_mean": 3977.9, "valid_targets_min": 1596 }, { "epoch": 0.6207482993197279, "grad_norm": 0.5731887626204569, "learning_rate": 3.5339805825242724e-05, "loss": 0.2201, "loss_nan_ranks": 0, "loss_rank_avg": 0.22550851106643677, "step": 365, "valid_targets_mean": 3385.5, "valid_targets_min": 1171 }, { "epoch": 0.6292517006802721, "grad_norm": 0.5627496362039582, "learning_rate": 3.582524271844661e-05, "loss": 0.2356, "loss_nan_ranks": 0, "loss_rank_avg": 0.2910814881324768, "step": 370, "valid_targets_mean": 4556.4, "valid_targets_min": 1882 }, { "epoch": 0.6377551020408163, "grad_norm": 0.5991575814558935, "learning_rate": 3.631067961165049e-05, "loss": 0.2216, "loss_nan_ranks": 0, "loss_rank_avg": 0.211978018283844, "step": 375, "valid_targets_mean": 3452.8, "valid_targets_min": 1318 }, { "epoch": 0.6462585034013606, "grad_norm": 0.6102343665862296, "learning_rate": 3.679611650485437e-05, "loss": 0.2219, "loss_nan_ranks": 0, "loss_rank_avg": 0.21666033565998077, "step": 380, "valid_targets_mean": 3131.9, "valid_targets_min": 1314 }, { "epoch": 0.6547619047619048, "grad_norm": 0.5948668213611634, "learning_rate": 3.728155339805826e-05, "loss": 0.2512, "loss_nan_ranks": 0, "loss_rank_avg": 0.24347296357154846, "step": 385, "valid_targets_mean": 3611.2, "valid_targets_min": 883 }, { "epoch": 0.6632653061224489, "grad_norm": 0.6047163659117363, "learning_rate": 3.776699029126214e-05, "loss": 0.232, "loss_nan_ranks": 0, "loss_rank_avg": 0.2162351906299591, "step": 390, "valid_targets_mean": 3810.4, "valid_targets_min": 771 }, { "epoch": 0.6717687074829932, "grad_norm": 0.5375529397120948, "learning_rate": 3.825242718446602e-05, "loss": 0.2218, "loss_nan_ranks": 0, "loss_rank_avg": 0.22332267463207245, "step": 395, "valid_targets_mean": 3901.6, "valid_targets_min": 773 }, { "epoch": 0.6802721088435374, "grad_norm": 1.0342771407751923, "learning_rate": 3.873786407766991e-05, "loss": 0.2152, "loss_nan_ranks": 0, "loss_rank_avg": 0.1947087049484253, "step": 400, "valid_targets_mean": 3132.8, "valid_targets_min": 1457 }, { "epoch": 0.6887755102040817, "grad_norm": 0.5626435257811521, "learning_rate": 3.9223300970873787e-05, "loss": 0.2262, "loss_nan_ranks": 0, "loss_rank_avg": 0.2347477376461029, "step": 405, "valid_targets_mean": 3649.8, "valid_targets_min": 1331 }, { "epoch": 0.6972789115646258, "grad_norm": 0.569318137076344, "learning_rate": 3.970873786407767e-05, "loss": 0.2262, "loss_nan_ranks": 0, "loss_rank_avg": 0.20133861899375916, "step": 410, "valid_targets_mean": 3133.1, "valid_targets_min": 1569 }, { "epoch": 0.70578231292517, "grad_norm": 1.0743284208556751, "learning_rate": 3.9999971224844676e-05, "loss": 0.2245, "loss_nan_ranks": 0, "loss_rank_avg": 0.24629156291484833, "step": 415, "valid_targets_mean": 3826.4, "valid_targets_min": 1325 }, { "epoch": 0.7142857142857143, "grad_norm": 0.6635319496766661, "learning_rate": 3.9999647505298214e-05, "loss": 0.2134, "loss_nan_ranks": 0, "loss_rank_avg": 0.18993477523326874, "step": 420, "valid_targets_mean": 2720.0, "valid_targets_min": 1349 }, { "epoch": 0.7227891156462585, "grad_norm": 0.6170915333057738, "learning_rate": 3.999896410310244e-05, "loss": 0.2168, "loss_nan_ranks": 0, "loss_rank_avg": 0.22692041099071503, "step": 425, "valid_targets_mean": 3027.8, "valid_targets_min": 726 }, { "epoch": 0.7312925170068028, "grad_norm": 0.5463223980088899, "learning_rate": 3.9997921030547975e-05, "loss": 0.2399, "loss_nan_ranks": 0, "loss_rank_avg": 0.2502792477607727, "step": 430, "valid_targets_mean": 4274.4, "valid_targets_min": 1318 }, { "epoch": 0.7397959183673469, "grad_norm": 0.6317330429857803, "learning_rate": 3.9996518306393906e-05, "loss": 0.2123, "loss_nan_ranks": 0, "loss_rank_avg": 0.2522296607494354, "step": 435, "valid_targets_mean": 4349.2, "valid_targets_min": 1531 }, { "epoch": 0.7482993197278912, "grad_norm": 0.5589182010307014, "learning_rate": 3.999475595586746e-05, "loss": 0.2106, "loss_nan_ranks": 0, "loss_rank_avg": 0.22174233198165894, "step": 440, "valid_targets_mean": 3621.8, "valid_targets_min": 1171 }, { "epoch": 0.7568027210884354, "grad_norm": 0.6274192316998353, "learning_rate": 3.9992634010663535e-05, "loss": 0.2243, "loss_nan_ranks": 0, "loss_rank_avg": 0.19328610599040985, "step": 445, "valid_targets_mean": 3207.5, "valid_targets_min": 1380 }, { "epoch": 0.7653061224489796, "grad_norm": 0.7143188282236254, "learning_rate": 3.999015250894415e-05, "loss": 0.2237, "loss_nan_ranks": 0, "loss_rank_avg": 0.24878516793251038, "step": 450, "valid_targets_mean": 2905.9, "valid_targets_min": 704 }, { "epoch": 0.7738095238095238, "grad_norm": 0.6357498516540245, "learning_rate": 3.998731149533774e-05, "loss": 0.2312, "loss_nan_ranks": 0, "loss_rank_avg": 0.2257612943649292, "step": 455, "valid_targets_mean": 4270.8, "valid_targets_min": 1016 }, { "epoch": 0.782312925170068, "grad_norm": 0.608459313439396, "learning_rate": 3.9984111020938376e-05, "loss": 0.2273, "loss_nan_ranks": 0, "loss_rank_avg": 0.23315557837486267, "step": 460, "valid_targets_mean": 3114.2, "valid_targets_min": 468 }, { "epoch": 0.7908163265306123, "grad_norm": 0.5311014249453725, "learning_rate": 3.998055114330483e-05, "loss": 0.2279, "loss_nan_ranks": 0, "loss_rank_avg": 0.22066374123096466, "step": 465, "valid_targets_mean": 4115.8, "valid_targets_min": 237 }, { "epoch": 0.7993197278911565, "grad_norm": 0.5517724265625736, "learning_rate": 3.9976631926459536e-05, "loss": 0.2132, "loss_nan_ranks": 0, "loss_rank_avg": 0.21982333064079285, "step": 470, "valid_targets_mean": 3534.5, "valid_targets_min": 1529 }, { "epoch": 0.8078231292517006, "grad_norm": 0.5625719777203932, "learning_rate": 3.997235344088747e-05, "loss": 0.22, "loss_nan_ranks": 0, "loss_rank_avg": 0.19416046142578125, "step": 475, "valid_targets_mean": 3017.0, "valid_targets_min": 740 }, { "epoch": 0.8163265306122449, "grad_norm": 0.6799480818848552, "learning_rate": 3.9967715763534805e-05, "loss": 0.2076, "loss_nan_ranks": 0, "loss_rank_avg": 0.2595263123512268, "step": 480, "valid_targets_mean": 3761.9, "valid_targets_min": 1567 }, { "epoch": 0.8248299319727891, "grad_norm": 0.6509377180428996, "learning_rate": 3.9962718977807637e-05, "loss": 0.2198, "loss_nan_ranks": 0, "loss_rank_avg": 0.21661224961280823, "step": 485, "valid_targets_mean": 3430.8, "valid_targets_min": 516 }, { "epoch": 0.8333333333333334, "grad_norm": 0.6165176687499115, "learning_rate": 3.995736317357041e-05, "loss": 0.2113, "loss_nan_ranks": 0, "loss_rank_avg": 0.20129480957984924, "step": 490, "valid_targets_mean": 3195.6, "valid_targets_min": 864 }, { "epoch": 0.8418367346938775, "grad_norm": 0.5318159802711743, "learning_rate": 3.9951648447144305e-05, "loss": 0.2445, "loss_nan_ranks": 0, "loss_rank_avg": 0.27752143144607544, "step": 495, "valid_targets_mean": 4461.1, "valid_targets_min": 1431 }, { "epoch": 0.8503401360544217, "grad_norm": 0.5556209073828486, "learning_rate": 3.9945574901305534e-05, "loss": 0.2148, "loss_nan_ranks": 0, "loss_rank_avg": 0.202958345413208, "step": 500, "valid_targets_mean": 3815.9, "valid_targets_min": 1488 }, { "epoch": 0.858843537414966, "grad_norm": 1.0342886678960757, "learning_rate": 3.9939142645283475e-05, "loss": 0.2137, "loss_nan_ranks": 0, "loss_rank_avg": 0.19952651858329773, "step": 505, "valid_targets_mean": 2500.6, "valid_targets_min": 844 }, { "epoch": 0.8673469387755102, "grad_norm": 0.5402963048438412, "learning_rate": 3.9932351794758705e-05, "loss": 0.2414, "loss_nan_ranks": 0, "loss_rank_avg": 0.27289947867393494, "step": 510, "valid_targets_mean": 4066.7, "valid_targets_min": 1590 }, { "epoch": 0.8758503401360545, "grad_norm": 0.4961205211173556, "learning_rate": 3.992520247186094e-05, "loss": 0.2206, "loss_nan_ranks": 0, "loss_rank_avg": 0.20045743882656097, "step": 515, "valid_targets_mean": 3896.8, "valid_targets_min": 1635 }, { "epoch": 0.8843537414965986, "grad_norm": 0.5120923461971542, "learning_rate": 3.991769480516681e-05, "loss": 0.2099, "loss_nan_ranks": 0, "loss_rank_avg": 0.18355634808540344, "step": 520, "valid_targets_mean": 3659.9, "valid_targets_min": 1564 }, { "epoch": 0.8928571428571429, "grad_norm": 0.5623713120504147, "learning_rate": 3.9909828929697575e-05, "loss": 0.2189, "loss_nan_ranks": 0, "loss_rank_avg": 0.22784064710140228, "step": 525, "valid_targets_mean": 3482.8, "valid_targets_min": 1422 }, { "epoch": 0.9013605442176871, "grad_norm": 0.7661825249423273, "learning_rate": 3.9901604986916666e-05, "loss": 0.2076, "loss_nan_ranks": 0, "loss_rank_avg": 0.24556386470794678, "step": 530, "valid_targets_mean": 4166.4, "valid_targets_min": 656 }, { "epoch": 0.9098639455782312, "grad_norm": 0.5954424304699879, "learning_rate": 3.9893023124727176e-05, "loss": 0.2128, "loss_nan_ranks": 0, "loss_rank_avg": 0.2076413780450821, "step": 535, "valid_targets_mean": 3791.6, "valid_targets_min": 1222 }, { "epoch": 0.9183673469387755, "grad_norm": 0.5761225149341407, "learning_rate": 3.988408349746916e-05, "loss": 0.2261, "loss_nan_ranks": 0, "loss_rank_avg": 0.1701766699552536, "step": 540, "valid_targets_mean": 3159.8, "valid_targets_min": 292 }, { "epoch": 0.9268707482993197, "grad_norm": 0.6231094057313721, "learning_rate": 3.9874786265916895e-05, "loss": 0.2256, "loss_nan_ranks": 0, "loss_rank_avg": 0.19349026679992676, "step": 545, "valid_targets_mean": 3046.1, "valid_targets_min": 1543 }, { "epoch": 0.935374149659864, "grad_norm": 0.5278032564391175, "learning_rate": 3.986513159727598e-05, "loss": 0.2176, "loss_nan_ranks": 0, "loss_rank_avg": 0.22423487901687622, "step": 550, "valid_targets_mean": 3591.6, "valid_targets_min": 1361 }, { "epoch": 0.9438775510204082, "grad_norm": 0.5593996618941262, "learning_rate": 3.985511966518031e-05, "loss": 0.2187, "loss_nan_ranks": 0, "loss_rank_avg": 0.21108989417552948, "step": 555, "valid_targets_mean": 3543.1, "valid_targets_min": 785 }, { "epoch": 0.9523809523809523, "grad_norm": 0.6004996101097438, "learning_rate": 3.984475064968897e-05, "loss": 0.207, "loss_nan_ranks": 0, "loss_rank_avg": 0.20403581857681274, "step": 560, "valid_targets_mean": 2996.8, "valid_targets_min": 1127 }, { "epoch": 0.9608843537414966, "grad_norm": 0.5607013766195372, "learning_rate": 3.9834024737282994e-05, "loss": 0.228, "loss_nan_ranks": 0, "loss_rank_avg": 0.2213515192270279, "step": 565, "valid_targets_mean": 3813.0, "valid_targets_min": 712 }, { "epoch": 0.9693877551020408, "grad_norm": 0.5378418432619649, "learning_rate": 3.9822942120862016e-05, "loss": 0.2059, "loss_nan_ranks": 0, "loss_rank_avg": 0.22113119065761566, "step": 570, "valid_targets_mean": 3979.8, "valid_targets_min": 1487 }, { "epoch": 0.9778911564625851, "grad_norm": 0.5155096520501556, "learning_rate": 3.981150299974079e-05, "loss": 0.2035, "loss_nan_ranks": 0, "loss_rank_avg": 0.17551299929618835, "step": 575, "valid_targets_mean": 4004.7, "valid_targets_min": 1841 }, { "epoch": 0.9863945578231292, "grad_norm": 1.0096571246008348, "learning_rate": 3.979970757964561e-05, "loss": 0.2042, "loss_nan_ranks": 0, "loss_rank_avg": 0.19910582900047302, "step": 580, "valid_targets_mean": 4383.6, "valid_targets_min": 1271 }, { "epoch": 0.9948979591836735, "grad_norm": 0.4896747460569099, "learning_rate": 3.978755607271061e-05, "loss": 0.2054, "loss_nan_ranks": 0, "loss_rank_avg": 0.23156213760375977, "step": 585, "valid_targets_mean": 4823.2, "valid_targets_min": 1267 }, { "epoch": 1.0034013605442176, "grad_norm": 0.5672962424422774, "learning_rate": 3.977504869747395e-05, "loss": 0.2216, "loss_nan_ranks": 0, "loss_rank_avg": 0.22572076320648193, "step": 590, "valid_targets_mean": 3516.4, "valid_targets_min": 345 }, { "epoch": 1.0119047619047619, "grad_norm": 0.5312338195955498, "learning_rate": 3.976218567887389e-05, "loss": 0.2189, "loss_nan_ranks": 0, "loss_rank_avg": 0.20064997673034668, "step": 595, "valid_targets_mean": 3369.6, "valid_targets_min": 791 }, { "epoch": 1.0204081632653061, "grad_norm": 0.5907568049016817, "learning_rate": 3.974896724824475e-05, "loss": 0.191, "loss_nan_ranks": 0, "loss_rank_avg": 0.1838887631893158, "step": 600, "valid_targets_mean": 3293.3, "valid_targets_min": 1016 }, { "epoch": 1.0289115646258504, "grad_norm": 0.5741661915632267, "learning_rate": 3.97353936433127e-05, "loss": 0.1928, "loss_nan_ranks": 0, "loss_rank_avg": 0.22130995988845825, "step": 605, "valid_targets_mean": 3553.5, "valid_targets_min": 1363 }, { "epoch": 1.0374149659863945, "grad_norm": 0.5548887515405546, "learning_rate": 3.972146510819158e-05, "loss": 0.203, "loss_nan_ranks": 0, "loss_rank_avg": 0.20798607170581818, "step": 610, "valid_targets_mean": 3264.7, "valid_targets_min": 759 }, { "epoch": 1.0459183673469388, "grad_norm": 0.48775913922713154, "learning_rate": 3.970718189337841e-05, "loss": 0.1997, "loss_nan_ranks": 0, "loss_rank_avg": 0.1696465015411377, "step": 615, "valid_targets_mean": 3921.0, "valid_targets_min": 1030 }, { "epoch": 1.054421768707483, "grad_norm": 0.5390452642348323, "learning_rate": 3.969254425574895e-05, "loss": 0.2243, "loss_nan_ranks": 0, "loss_rank_avg": 0.27588415145874023, "step": 620, "valid_targets_mean": 3971.6, "valid_targets_min": 1047 }, { "epoch": 1.0629251700680271, "grad_norm": 0.5601492770617569, "learning_rate": 3.9677552458553046e-05, "loss": 0.1932, "loss_nan_ranks": 0, "loss_rank_avg": 0.1914624273777008, "step": 625, "valid_targets_mean": 3866.6, "valid_targets_min": 1334 }, { "epoch": 1.0714285714285714, "grad_norm": 0.5372040764678854, "learning_rate": 3.9662206771409925e-05, "loss": 0.2036, "loss_nan_ranks": 0, "loss_rank_avg": 0.18735885620117188, "step": 630, "valid_targets_mean": 3296.4, "valid_targets_min": 1828 }, { "epoch": 1.0799319727891157, "grad_norm": 0.4929419148783689, "learning_rate": 3.964650747030332e-05, "loss": 0.207, "loss_nan_ranks": 0, "loss_rank_avg": 0.2222883701324463, "step": 635, "valid_targets_mean": 4493.8, "valid_targets_min": 766 }, { "epoch": 1.08843537414966, "grad_norm": 0.5087861156990097, "learning_rate": 3.963045483757652e-05, "loss": 0.2088, "loss_nan_ranks": 0, "loss_rank_avg": 0.2039588987827301, "step": 640, "valid_targets_mean": 3933.9, "valid_targets_min": 1732 }, { "epoch": 1.096938775510204, "grad_norm": 0.5471473406579418, "learning_rate": 3.961404916192728e-05, "loss": 0.2013, "loss_nan_ranks": 0, "loss_rank_avg": 0.1703445315361023, "step": 645, "valid_targets_mean": 3236.4, "valid_targets_min": 1522 }, { "epoch": 1.1054421768707483, "grad_norm": 0.601726665077757, "learning_rate": 3.959729073840265e-05, "loss": 0.1958, "loss_nan_ranks": 0, "loss_rank_avg": 0.2089315801858902, "step": 650, "valid_targets_mean": 2669.9, "valid_targets_min": 771 }, { "epoch": 1.1139455782312926, "grad_norm": 0.5342431672997215, "learning_rate": 3.958017986839364e-05, "loss": 0.1903, "loss_nan_ranks": 0, "loss_rank_avg": 0.16569793224334717, "step": 655, "valid_targets_mean": 4190.9, "valid_targets_min": 1653 }, { "epoch": 1.1224489795918366, "grad_norm": 0.47771373985756477, "learning_rate": 3.956271685962985e-05, "loss": 0.1867, "loss_nan_ranks": 0, "loss_rank_avg": 0.18933849036693573, "step": 660, "valid_targets_mean": 4276.8, "valid_targets_min": 1203 }, { "epoch": 1.130952380952381, "grad_norm": 0.5180075636533443, "learning_rate": 3.954490202617385e-05, "loss": 0.2032, "loss_nan_ranks": 0, "loss_rank_avg": 0.20420797169208527, "step": 665, "valid_targets_mean": 3466.0, "valid_targets_min": 1387 }, { "epoch": 1.1394557823129252, "grad_norm": 0.4810886562810522, "learning_rate": 3.9526735688415624e-05, "loss": 0.1952, "loss_nan_ranks": 0, "loss_rank_avg": 0.14678673446178436, "step": 670, "valid_targets_mean": 3429.4, "valid_targets_min": 1151 }, { "epoch": 1.1479591836734695, "grad_norm": 0.43889872604968944, "learning_rate": 3.9508218173066766e-05, "loss": 0.2169, "loss_nan_ranks": 0, "loss_rank_avg": 0.18565359711647034, "step": 675, "valid_targets_mean": 4528.4, "valid_targets_min": 1485 }, { "epoch": 1.1564625850340136, "grad_norm": 0.5494878687879327, "learning_rate": 3.948934981315457e-05, "loss": 0.1962, "loss_nan_ranks": 0, "loss_rank_avg": 0.21876271069049835, "step": 680, "valid_targets_mean": 3376.0, "valid_targets_min": 1641 }, { "epoch": 1.1649659863945578, "grad_norm": 0.5527438745919528, "learning_rate": 3.947013094801612e-05, "loss": 0.2118, "loss_nan_ranks": 0, "loss_rank_avg": 0.18596649169921875, "step": 685, "valid_targets_mean": 3657.0, "valid_targets_min": 1586 }, { "epoch": 1.1734693877551021, "grad_norm": 0.5825833837175836, "learning_rate": 3.945056192329212e-05, "loss": 0.1898, "loss_nan_ranks": 0, "loss_rank_avg": 0.1742013394832611, "step": 690, "valid_targets_mean": 2917.1, "valid_targets_min": 1281 }, { "epoch": 1.1819727891156462, "grad_norm": 0.503721095345985, "learning_rate": 3.9430643090920705e-05, "loss": 0.1904, "loss_nan_ranks": 0, "loss_rank_avg": 0.2232275754213333, "step": 695, "valid_targets_mean": 4089.5, "valid_targets_min": 1418 }, { "epoch": 1.1904761904761905, "grad_norm": 0.5218165403092541, "learning_rate": 3.941037480913111e-05, "loss": 0.2082, "loss_nan_ranks": 0, "loss_rank_avg": 0.1619264781475067, "step": 700, "valid_targets_mean": 3523.6, "valid_targets_min": 1437 }, { "epoch": 1.1989795918367347, "grad_norm": 0.5281430386469016, "learning_rate": 3.9389757442437214e-05, "loss": 0.1795, "loss_nan_ranks": 0, "loss_rank_avg": 0.17680522799491882, "step": 705, "valid_targets_mean": 3565.9, "valid_targets_min": 1325 }, { "epoch": 1.2074829931972788, "grad_norm": 0.5235289654221893, "learning_rate": 3.936879136163102e-05, "loss": 0.1936, "loss_nan_ranks": 0, "loss_rank_avg": 0.17753741145133972, "step": 710, "valid_targets_mean": 3354.5, "valid_targets_min": 861 }, { "epoch": 1.215986394557823, "grad_norm": 0.5243131901993361, "learning_rate": 3.934747694377594e-05, "loss": 0.1889, "loss_nan_ranks": 0, "loss_rank_avg": 0.17617300152778625, "step": 715, "valid_targets_mean": 3630.2, "valid_targets_min": 740 }, { "epoch": 1.2244897959183674, "grad_norm": 0.507546135504406, "learning_rate": 3.932581457220004e-05, "loss": 0.1918, "loss_nan_ranks": 0, "loss_rank_avg": 0.20022642612457275, "step": 720, "valid_targets_mean": 3641.4, "valid_targets_min": 1358 }, { "epoch": 1.2329931972789117, "grad_norm": 0.4976716238444004, "learning_rate": 3.9303804636489165e-05, "loss": 0.2011, "loss_nan_ranks": 0, "loss_rank_avg": 0.1976463496685028, "step": 725, "valid_targets_mean": 4419.9, "valid_targets_min": 1633 }, { "epoch": 1.2414965986394557, "grad_norm": 0.5483850422579489, "learning_rate": 3.928144753247987e-05, "loss": 0.1897, "loss_nan_ranks": 0, "loss_rank_avg": 0.1868499368429184, "step": 730, "valid_targets_mean": 3198.6, "valid_targets_min": 1518 }, { "epoch": 1.25, "grad_norm": 0.5488817504510112, "learning_rate": 3.925874366225237e-05, "loss": 0.1963, "loss_nan_ranks": 0, "loss_rank_avg": 0.1806359589099884, "step": 735, "valid_targets_mean": 3055.3, "valid_targets_min": 1080 }, { "epoch": 1.2585034013605443, "grad_norm": 0.5066572269595151, "learning_rate": 3.923569343412327e-05, "loss": 0.168, "loss_nan_ranks": 0, "loss_rank_avg": 0.1659495234489441, "step": 740, "valid_targets_mean": 3302.1, "valid_targets_min": 1180 }, { "epoch": 1.2670068027210886, "grad_norm": 0.5849934441349959, "learning_rate": 3.921229726263824e-05, "loss": 0.2012, "loss_nan_ranks": 0, "loss_rank_avg": 0.1774701178073883, "step": 745, "valid_targets_mean": 2528.7, "valid_targets_min": 1202 }, { "epoch": 1.2755102040816326, "grad_norm": 0.49696403833836683, "learning_rate": 3.918855556856453e-05, "loss": 0.1937, "loss_nan_ranks": 0, "loss_rank_avg": 0.18610414862632751, "step": 750, "valid_targets_mean": 3840.2, "valid_targets_min": 1166 }, { "epoch": 1.284013605442177, "grad_norm": 0.51760011092419, "learning_rate": 3.916446877888345e-05, "loss": 0.1867, "loss_nan_ranks": 0, "loss_rank_avg": 0.152181014418602, "step": 755, "valid_targets_mean": 3712.1, "valid_targets_min": 1562 }, { "epoch": 1.2925170068027212, "grad_norm": 0.5197150478352947, "learning_rate": 3.914003732678264e-05, "loss": 0.1886, "loss_nan_ranks": 0, "loss_rank_avg": 0.17886745929718018, "step": 760, "valid_targets_mean": 3652.8, "valid_targets_min": 1389 }, { "epoch": 1.3010204081632653, "grad_norm": 0.6469050227526758, "learning_rate": 3.911526165164831e-05, "loss": 0.1903, "loss_nan_ranks": 0, "loss_rank_avg": 0.18235021829605103, "step": 765, "valid_targets_mean": 3708.6, "valid_targets_min": 1362 }, { "epoch": 1.3095238095238095, "grad_norm": 0.49033685187396464, "learning_rate": 3.909014219905736e-05, "loss": 0.1738, "loss_nan_ranks": 0, "loss_rank_avg": 0.17945152521133423, "step": 770, "valid_targets_mean": 4450.9, "valid_targets_min": 1164 }, { "epoch": 1.3180272108843538, "grad_norm": 0.48357041587084415, "learning_rate": 3.906467942076929e-05, "loss": 0.1763, "loss_nan_ranks": 0, "loss_rank_avg": 0.16390027105808258, "step": 775, "valid_targets_mean": 3853.2, "valid_targets_min": 261 }, { "epoch": 1.3265306122448979, "grad_norm": 0.5416106118859744, "learning_rate": 3.903887377471816e-05, "loss": 0.1819, "loss_nan_ranks": 0, "loss_rank_avg": 0.1834583282470703, "step": 780, "valid_targets_mean": 3806.6, "valid_targets_min": 626 }, { "epoch": 1.3350340136054422, "grad_norm": 0.5709573952961344, "learning_rate": 3.901272572500431e-05, "loss": 0.2081, "loss_nan_ranks": 0, "loss_rank_avg": 0.2096044272184372, "step": 785, "valid_targets_mean": 3210.9, "valid_targets_min": 1076 }, { "epoch": 1.3435374149659864, "grad_norm": 0.49261093365090397, "learning_rate": 3.8986235741886016e-05, "loss": 0.1834, "loss_nan_ranks": 0, "loss_rank_avg": 0.19666042923927307, "step": 790, "valid_targets_mean": 4010.6, "valid_targets_min": 1349 }, { "epoch": 1.3520408163265305, "grad_norm": 0.5295408603491522, "learning_rate": 3.8959404301771035e-05, "loss": 0.1794, "loss_nan_ranks": 0, "loss_rank_avg": 0.17796075344085693, "step": 795, "valid_targets_mean": 3584.5, "valid_targets_min": 1196 }, { "epoch": 1.3605442176870748, "grad_norm": 0.5009867989877805, "learning_rate": 3.893223188720804e-05, "loss": 0.191, "loss_nan_ranks": 0, "loss_rank_avg": 0.16877491772174835, "step": 800, "valid_targets_mean": 3927.5, "valid_targets_min": 1379 }, { "epoch": 1.369047619047619, "grad_norm": 0.5414078300255754, "learning_rate": 3.890471898687797e-05, "loss": 0.1871, "loss_nan_ranks": 0, "loss_rank_avg": 0.19157296419143677, "step": 805, "valid_targets_mean": 3358.6, "valid_targets_min": 1356 }, { "epoch": 1.3775510204081631, "grad_norm": 0.5222165452421504, "learning_rate": 3.887686609558516e-05, "loss": 0.1932, "loss_nan_ranks": 0, "loss_rank_avg": 0.23859623074531555, "step": 810, "valid_targets_mean": 4134.9, "valid_targets_min": 1487 }, { "epoch": 1.3860544217687074, "grad_norm": 0.5217149334650539, "learning_rate": 3.8848673714248545e-05, "loss": 0.2087, "loss_nan_ranks": 0, "loss_rank_avg": 0.26612165570259094, "step": 815, "valid_targets_mean": 4028.3, "valid_targets_min": 1564 }, { "epoch": 1.3945578231292517, "grad_norm": 0.5170659251716594, "learning_rate": 3.882014234989258e-05, "loss": 0.1922, "loss_nan_ranks": 0, "loss_rank_avg": 0.22827790677547455, "step": 820, "valid_targets_mean": 3701.8, "valid_targets_min": 1093 }, { "epoch": 1.403061224489796, "grad_norm": 0.4688236578703589, "learning_rate": 3.879127251563814e-05, "loss": 0.2077, "loss_nan_ranks": 0, "loss_rank_avg": 0.2379659116268158, "step": 825, "valid_targets_mean": 4414.6, "valid_targets_min": 602 }, { "epoch": 1.4115646258503403, "grad_norm": 0.49118587067228825, "learning_rate": 3.87620647306933e-05, "loss": 0.1828, "loss_nan_ranks": 0, "loss_rank_avg": 0.15896081924438477, "step": 830, "valid_targets_mean": 3619.9, "valid_targets_min": 872 }, { "epoch": 1.4200680272108843, "grad_norm": 0.5821773109112104, "learning_rate": 3.873251952034398e-05, "loss": 0.2015, "loss_nan_ranks": 0, "loss_rank_avg": 0.18274542689323425, "step": 835, "valid_targets_mean": 2929.2, "valid_targets_min": 656 }, { "epoch": 1.4285714285714286, "grad_norm": 0.5452331430405628, "learning_rate": 3.8702637415944554e-05, "loss": 0.1851, "loss_nan_ranks": 0, "loss_rank_avg": 0.17982515692710876, "step": 840, "valid_targets_mean": 3342.9, "valid_targets_min": 1236 }, { "epoch": 1.4370748299319729, "grad_norm": 0.46140086600989344, "learning_rate": 3.867241895490818e-05, "loss": 0.1874, "loss_nan_ranks": 0, "loss_rank_avg": 0.1850546896457672, "step": 845, "valid_targets_mean": 4547.8, "valid_targets_min": 1230 }, { "epoch": 1.445578231292517, "grad_norm": 0.6096456433047177, "learning_rate": 3.864186468069727e-05, "loss": 0.1956, "loss_nan_ranks": 0, "loss_rank_avg": 0.20062093436717987, "step": 850, "valid_targets_mean": 3861.6, "valid_targets_min": 1361 }, { "epoch": 1.4540816326530612, "grad_norm": 0.4585502938921594, "learning_rate": 3.86109751428136e-05, "loss": 0.1859, "loss_nan_ranks": 0, "loss_rank_avg": 0.22109025716781616, "step": 855, "valid_targets_mean": 4631.1, "valid_targets_min": 649 }, { "epoch": 1.4625850340136055, "grad_norm": 0.6500708452308398, "learning_rate": 3.8579750896788526e-05, "loss": 0.194, "loss_nan_ranks": 0, "loss_rank_avg": 0.19890360534191132, "step": 860, "valid_targets_mean": 3457.9, "valid_targets_min": 1516 }, { "epoch": 1.4710884353741496, "grad_norm": 0.5301669401019695, "learning_rate": 3.8548192504172905e-05, "loss": 0.1898, "loss_nan_ranks": 0, "loss_rank_avg": 0.16666162014007568, "step": 865, "valid_targets_mean": 3235.4, "valid_targets_min": 1496 }, { "epoch": 1.4795918367346939, "grad_norm": 0.5003852480841234, "learning_rate": 3.851630053252706e-05, "loss": 0.1958, "loss_nan_ranks": 0, "loss_rank_avg": 0.19342686235904694, "step": 870, "valid_targets_mean": 3817.6, "valid_targets_min": 1010 }, { "epoch": 1.4880952380952381, "grad_norm": 0.7206386070487517, "learning_rate": 3.848407555541054e-05, "loss": 0.1766, "loss_nan_ranks": 0, "loss_rank_avg": 0.1805090308189392, "step": 875, "valid_targets_mean": 3128.2, "valid_targets_min": 1237 }, { "epoch": 1.4965986394557822, "grad_norm": 0.5325698260432379, "learning_rate": 3.845151815237183e-05, "loss": 0.1986, "loss_nan_ranks": 0, "loss_rank_avg": 0.22101525962352753, "step": 880, "valid_targets_mean": 3731.1, "valid_targets_min": 1267 }, { "epoch": 1.5051020408163265, "grad_norm": 0.49784608869204255, "learning_rate": 3.841862890893787e-05, "loss": 0.1953, "loss_nan_ranks": 0, "loss_rank_avg": 0.21092960238456726, "step": 885, "valid_targets_mean": 4910.1, "valid_targets_min": 2027 }, { "epoch": 1.5136054421768708, "grad_norm": 0.5139966586488321, "learning_rate": 3.838540841660363e-05, "loss": 0.187, "loss_nan_ranks": 0, "loss_rank_avg": 0.17927789688110352, "step": 890, "valid_targets_mean": 3502.6, "valid_targets_min": 1390 }, { "epoch": 1.5221088435374148, "grad_norm": 0.5753720323032561, "learning_rate": 3.835185727282135e-05, "loss": 0.1865, "loss_nan_ranks": 0, "loss_rank_avg": 0.17120110988616943, "step": 895, "valid_targets_mean": 3286.3, "valid_targets_min": 1413 }, { "epoch": 1.5306122448979593, "grad_norm": 0.47592158361035486, "learning_rate": 3.8317976080989884e-05, "loss": 0.2031, "loss_nan_ranks": 0, "loss_rank_avg": 0.163374125957489, "step": 900, "valid_targets_mean": 3801.1, "valid_targets_min": 1384 }, { "epoch": 1.5391156462585034, "grad_norm": 0.5502887147122869, "learning_rate": 3.828376545044381e-05, "loss": 0.1673, "loss_nan_ranks": 0, "loss_rank_avg": 0.1637812852859497, "step": 905, "valid_targets_mean": 3125.3, "valid_targets_min": 1185 }, { "epoch": 1.5476190476190477, "grad_norm": 0.49349113517485865, "learning_rate": 3.824922599644249e-05, "loss": 0.1961, "loss_nan_ranks": 0, "loss_rank_avg": 0.1690322607755661, "step": 910, "valid_targets_mean": 3258.8, "valid_targets_min": 1083 }, { "epoch": 1.556122448979592, "grad_norm": 0.5864646081268652, "learning_rate": 3.8214358340159e-05, "loss": 0.196, "loss_nan_ranks": 0, "loss_rank_avg": 0.19114357233047485, "step": 915, "valid_targets_mean": 2737.2, "valid_targets_min": 294 }, { "epoch": 1.564625850340136, "grad_norm": 0.6146750809665836, "learning_rate": 3.817916310866892e-05, "loss": 0.1902, "loss_nan_ranks": 0, "loss_rank_avg": 0.2137393355369568, "step": 920, "valid_targets_mean": 3575.6, "valid_targets_min": 1833 }, { "epoch": 1.5731292517006803, "grad_norm": 0.5497560800319427, "learning_rate": 3.814364093493912e-05, "loss": 0.1855, "loss_nan_ranks": 0, "loss_rank_avg": 0.1964998096227646, "step": 925, "valid_targets_mean": 3551.7, "valid_targets_min": 1423 }, { "epoch": 1.5816326530612246, "grad_norm": 0.5252883761247669, "learning_rate": 3.810779245781633e-05, "loss": 0.1804, "loss_nan_ranks": 0, "loss_rank_avg": 0.1650836169719696, "step": 930, "valid_targets_mean": 3089.8, "valid_targets_min": 1403 }, { "epoch": 1.5901360544217686, "grad_norm": 0.5121570735439744, "learning_rate": 3.807161832201569e-05, "loss": 0.1853, "loss_nan_ranks": 0, "loss_rank_avg": 0.19136366248130798, "step": 935, "valid_targets_mean": 4138.2, "valid_targets_min": 1424 }, { "epoch": 1.598639455782313, "grad_norm": 0.5958778544952104, "learning_rate": 3.80351191781091e-05, "loss": 0.1897, "loss_nan_ranks": 0, "loss_rank_avg": 0.19539722800254822, "step": 940, "valid_targets_mean": 3694.7, "valid_targets_min": 1215 }, { "epoch": 1.6071428571428572, "grad_norm": 0.46321527919315125, "learning_rate": 3.799829568251358e-05, "loss": 0.1802, "loss_nan_ranks": 0, "loss_rank_avg": 0.1710878312587738, "step": 945, "valid_targets_mean": 4287.4, "valid_targets_min": 1580 }, { "epoch": 1.6156462585034013, "grad_norm": 0.4474705462489259, "learning_rate": 3.7961148497479414e-05, "loss": 0.1862, "loss_nan_ranks": 0, "loss_rank_avg": 0.14631542563438416, "step": 950, "valid_targets_mean": 3635.0, "valid_targets_min": 1443 }, { "epoch": 1.6241496598639455, "grad_norm": 0.41640737339744915, "learning_rate": 3.792367829107828e-05, "loss": 0.1871, "loss_nan_ranks": 0, "loss_rank_avg": 0.16833257675170898, "step": 955, "valid_targets_mean": 4065.6, "valid_targets_min": 870 }, { "epoch": 1.6326530612244898, "grad_norm": 0.5577723930562095, "learning_rate": 3.7885885737191214e-05, "loss": 0.1915, "loss_nan_ranks": 0, "loss_rank_avg": 0.20395566523075104, "step": 960, "valid_targets_mean": 3751.8, "valid_targets_min": 773 }, { "epoch": 1.641156462585034, "grad_norm": 0.5370007375191718, "learning_rate": 3.784777151549648e-05, "loss": 0.2057, "loss_nan_ranks": 0, "loss_rank_avg": 0.23845341801643372, "step": 965, "valid_targets_mean": 3401.8, "valid_targets_min": 1196 }, { "epoch": 1.6496598639455784, "grad_norm": 0.4890736313125839, "learning_rate": 3.780933631145738e-05, "loss": 0.1735, "loss_nan_ranks": 0, "loss_rank_avg": 0.19676534831523895, "step": 970, "valid_targets_mean": 4242.6, "valid_targets_min": 1641 }, { "epoch": 1.6581632653061225, "grad_norm": 0.5462693213339227, "learning_rate": 3.777058081630989e-05, "loss": 0.1635, "loss_nan_ranks": 0, "loss_rank_avg": 0.1821269541978836, "step": 975, "valid_targets_mean": 2902.4, "valid_targets_min": 758 }, { "epoch": 1.6666666666666665, "grad_norm": 0.8337967865673986, "learning_rate": 3.773150572705026e-05, "loss": 0.1775, "loss_nan_ranks": 0, "loss_rank_avg": 0.20385128259658813, "step": 980, "valid_targets_mean": 2980.2, "valid_targets_min": 1114 }, { "epoch": 1.675170068027211, "grad_norm": 0.5621665933713426, "learning_rate": 3.769211174642245e-05, "loss": 0.1891, "loss_nan_ranks": 0, "loss_rank_avg": 0.18322809040546417, "step": 985, "valid_targets_mean": 3570.9, "valid_targets_min": 1141 }, { "epoch": 1.683673469387755, "grad_norm": 0.5494341598343004, "learning_rate": 3.765239958290551e-05, "loss": 0.1759, "loss_nan_ranks": 0, "loss_rank_avg": 0.19005733728408813, "step": 990, "valid_targets_mean": 3032.7, "valid_targets_min": 1423 }, { "epoch": 1.6921768707482994, "grad_norm": 0.48352418832732824, "learning_rate": 3.761236995070086e-05, "loss": 0.1897, "loss_nan_ranks": 0, "loss_rank_avg": 0.16157102584838867, "step": 995, "valid_targets_mean": 3347.1, "valid_targets_min": 1193 }, { "epoch": 1.7006802721088436, "grad_norm": 0.5632869048679273, "learning_rate": 3.757202356971937e-05, "loss": 0.1819, "loss_nan_ranks": 0, "loss_rank_avg": 0.18931040167808533, "step": 1000, "valid_targets_mean": 3152.6, "valid_targets_min": 1561 }, { "epoch": 1.7091836734693877, "grad_norm": 0.5192329176419131, "learning_rate": 3.75313611655685e-05, "loss": 0.1927, "loss_nan_ranks": 0, "loss_rank_avg": 0.21477651596069336, "step": 1005, "valid_targets_mean": 3273.4, "valid_targets_min": 1808 }, { "epoch": 1.717687074829932, "grad_norm": 0.537867998522921, "learning_rate": 3.74903834695392e-05, "loss": 0.1794, "loss_nan_ranks": 0, "loss_rank_avg": 0.20665214955806732, "step": 1010, "valid_targets_mean": 2862.1, "valid_targets_min": 1222 }, { "epoch": 1.7261904761904763, "grad_norm": 0.4845497530535329, "learning_rate": 3.7449091218592765e-05, "loss": 0.1713, "loss_nan_ranks": 0, "loss_rank_avg": 0.17452441155910492, "step": 1015, "valid_targets_mean": 3869.9, "valid_targets_min": 820 }, { "epoch": 1.7346938775510203, "grad_norm": 0.6076016507448156, "learning_rate": 3.740748515534761e-05, "loss": 0.1692, "loss_nan_ranks": 0, "loss_rank_avg": 0.17511403560638428, "step": 1020, "valid_targets_mean": 3225.7, "valid_targets_min": 1603 }, { "epoch": 1.7431972789115646, "grad_norm": 0.4883623691095037, "learning_rate": 3.736556602806587e-05, "loss": 0.1892, "loss_nan_ranks": 0, "loss_rank_avg": 0.172734797000885, "step": 1025, "valid_targets_mean": 3836.9, "valid_targets_min": 2000 }, { "epoch": 1.751700680272109, "grad_norm": 0.46550827165041286, "learning_rate": 3.732333459063995e-05, "loss": 0.1916, "loss_nan_ranks": 0, "loss_rank_avg": 0.199026957154274, "step": 1030, "valid_targets_mean": 4062.8, "valid_targets_min": 1556 }, { "epoch": 1.760204081632653, "grad_norm": 0.5129468567005807, "learning_rate": 3.728079160257903e-05, "loss": 0.1874, "loss_nan_ranks": 0, "loss_rank_avg": 0.14423376321792603, "step": 1035, "valid_targets_mean": 2858.1, "valid_targets_min": 1339 }, { "epoch": 1.7687074829931972, "grad_norm": 0.5574813775362133, "learning_rate": 3.723793782899531e-05, "loss": 0.1776, "loss_nan_ranks": 0, "loss_rank_avg": 0.18245592713356018, "step": 1040, "valid_targets_mean": 3276.6, "valid_targets_min": 670 }, { "epoch": 1.7772108843537415, "grad_norm": 0.4670140940140349, "learning_rate": 3.719477404059032e-05, "loss": 0.1911, "loss_nan_ranks": 0, "loss_rank_avg": 0.1462934911251068, "step": 1045, "valid_targets_mean": 3054.8, "valid_targets_min": 1503 }, { "epoch": 1.7857142857142856, "grad_norm": 0.46194682964420647, "learning_rate": 3.715130101364103e-05, "loss": 0.193, "loss_nan_ranks": 0, "loss_rank_avg": 0.16554617881774902, "step": 1050, "valid_targets_mean": 3644.1, "valid_targets_min": 1373 }, { "epoch": 1.79421768707483, "grad_norm": 0.5984466271446732, "learning_rate": 3.710751952998591e-05, "loss": 0.189, "loss_nan_ranks": 0, "loss_rank_avg": 0.2118651270866394, "step": 1055, "valid_targets_mean": 4197.6, "valid_targets_min": 1768 }, { "epoch": 1.8027210884353742, "grad_norm": 0.5456400454044104, "learning_rate": 3.7063430377010804e-05, "loss": 0.1761, "loss_nan_ranks": 0, "loss_rank_avg": 0.17311958968639374, "step": 1060, "valid_targets_mean": 2987.2, "valid_targets_min": 1077 }, { "epoch": 1.8112244897959182, "grad_norm": 0.4767702066385362, "learning_rate": 3.7019034347634884e-05, "loss": 0.1918, "loss_nan_ranks": 0, "loss_rank_avg": 0.19531995058059692, "step": 1065, "valid_targets_mean": 3875.5, "valid_targets_min": 656 }, { "epoch": 1.8197278911564627, "grad_norm": 0.5195825806924265, "learning_rate": 3.6974332240296285e-05, "loss": 0.1652, "loss_nan_ranks": 0, "loss_rank_avg": 0.16434217989444733, "step": 1070, "valid_targets_mean": 3075.5, "valid_targets_min": 272 }, { "epoch": 1.8282312925170068, "grad_norm": 0.49345991558681523, "learning_rate": 3.692932485893779e-05, "loss": 0.2053, "loss_nan_ranks": 0, "loss_rank_avg": 0.20877480506896973, "step": 1075, "valid_targets_mean": 3642.0, "valid_targets_min": 1468 }, { "epoch": 1.836734693877551, "grad_norm": 0.47208468050600655, "learning_rate": 3.6884013012992384e-05, "loss": 0.1708, "loss_nan_ranks": 0, "loss_rank_avg": 0.17622429132461548, "step": 1080, "valid_targets_mean": 4071.4, "valid_targets_min": 1942 }, { "epoch": 1.8452380952380953, "grad_norm": 0.48753304789559393, "learning_rate": 3.683839751736866e-05, "loss": 0.2042, "loss_nan_ranks": 0, "loss_rank_avg": 0.18847878277301788, "step": 1085, "valid_targets_mean": 3604.7, "valid_targets_min": 1249 }, { "epoch": 1.8537414965986394, "grad_norm": 0.5185334909460225, "learning_rate": 3.67924791924362e-05, "loss": 0.1999, "loss_nan_ranks": 0, "loss_rank_avg": 0.18857452273368835, "step": 1090, "valid_targets_mean": 3293.7, "valid_targets_min": 1583 }, { "epoch": 1.8622448979591837, "grad_norm": 0.5361821399516076, "learning_rate": 3.6746258864010804e-05, "loss": 0.1913, "loss_nan_ranks": 0, "loss_rank_avg": 0.21333011984825134, "step": 1095, "valid_targets_mean": 3541.9, "valid_targets_min": 1101 }, { "epoch": 1.870748299319728, "grad_norm": 0.5150375744442169, "learning_rate": 3.669973736333961e-05, "loss": 0.208, "loss_nan_ranks": 0, "loss_rank_avg": 0.18149079382419586, "step": 1100, "valid_targets_mean": 3461.7, "valid_targets_min": 1551 }, { "epoch": 1.879251700680272, "grad_norm": 0.47641795347351734, "learning_rate": 3.665291552708622e-05, "loss": 0.1712, "loss_nan_ranks": 0, "loss_rank_avg": 0.16541434824466705, "step": 1105, "valid_targets_mean": 3537.1, "valid_targets_min": 721 }, { "epoch": 1.8877551020408163, "grad_norm": 0.44107915244193463, "learning_rate": 3.660579419731556e-05, "loss": 0.1772, "loss_nan_ranks": 0, "loss_rank_avg": 0.17657120525836945, "step": 1110, "valid_targets_mean": 4444.3, "valid_targets_min": 1768 }, { "epoch": 1.8962585034013606, "grad_norm": 0.4490354679780014, "learning_rate": 3.655837422147881e-05, "loss": 0.186, "loss_nan_ranks": 0, "loss_rank_avg": 0.18245811760425568, "step": 1115, "valid_targets_mean": 3821.4, "valid_targets_min": 832 }, { "epoch": 1.9047619047619047, "grad_norm": 0.5471874801090619, "learning_rate": 3.6510656452398124e-05, "loss": 0.1797, "loss_nan_ranks": 0, "loss_rank_avg": 0.19018134474754333, "step": 1120, "valid_targets_mean": 3944.4, "valid_targets_min": 704 }, { "epoch": 1.913265306122449, "grad_norm": 0.5210175865126913, "learning_rate": 3.646264174825131e-05, "loss": 0.1926, "loss_nan_ranks": 0, "loss_rank_avg": 0.1890740543603897, "step": 1125, "valid_targets_mean": 2996.8, "valid_targets_min": 1240 }, { "epoch": 1.9217687074829932, "grad_norm": 0.44413848715103277, "learning_rate": 3.6414330972556396e-05, "loss": 0.1687, "loss_nan_ranks": 0, "loss_rank_avg": 0.1596677303314209, "step": 1130, "valid_targets_mean": 3841.4, "valid_targets_min": 1839 }, { "epoch": 1.9302721088435373, "grad_norm": 0.5011986427153032, "learning_rate": 3.6365724994156074e-05, "loss": 0.1837, "loss_nan_ranks": 0, "loss_rank_avg": 0.1710270792245865, "step": 1135, "valid_targets_mean": 3877.1, "valid_targets_min": 1103 }, { "epoch": 1.9387755102040818, "grad_norm": 0.507796898706084, "learning_rate": 3.63168246872021e-05, "loss": 0.1911, "loss_nan_ranks": 0, "loss_rank_avg": 0.19725248217582703, "step": 1140, "valid_targets_mean": 4247.8, "valid_targets_min": 1249 }, { "epoch": 1.9472789115646258, "grad_norm": 0.44045711685293365, "learning_rate": 3.626763093113959e-05, "loss": 0.1788, "loss_nan_ranks": 0, "loss_rank_avg": 0.19037358462810516, "step": 1145, "valid_targets_mean": 3963.4, "valid_targets_min": 1103 }, { "epoch": 1.95578231292517, "grad_norm": 0.47446755779794997, "learning_rate": 3.621814461069114e-05, "loss": 0.1822, "loss_nan_ranks": 0, "loss_rank_avg": 0.25513309240341187, "step": 1150, "valid_targets_mean": 5124.9, "valid_targets_min": 1921 }, { "epoch": 1.9642857142857144, "grad_norm": 0.5301424189044126, "learning_rate": 3.6168366615841e-05, "loss": 0.1996, "loss_nan_ranks": 0, "loss_rank_avg": 0.22564446926116943, "step": 1155, "valid_targets_mean": 3610.2, "valid_targets_min": 1429 }, { "epoch": 1.9727891156462585, "grad_norm": 0.45622538657301903, "learning_rate": 3.6118297841818986e-05, "loss": 0.175, "loss_nan_ranks": 0, "loss_rank_avg": 0.16688859462738037, "step": 1160, "valid_targets_mean": 3964.9, "valid_targets_min": 1107 }, { "epoch": 1.9812925170068028, "grad_norm": 0.4665999563671873, "learning_rate": 3.6067939189084446e-05, "loss": 0.1895, "loss_nan_ranks": 0, "loss_rank_avg": 0.19204774498939514, "step": 1165, "valid_targets_mean": 4142.7, "valid_targets_min": 1263 }, { "epoch": 1.989795918367347, "grad_norm": 0.6056661231032858, "learning_rate": 3.6017291563310005e-05, "loss": 0.1793, "loss_nan_ranks": 0, "loss_rank_avg": 0.19215795397758484, "step": 1170, "valid_targets_mean": 3911.9, "valid_targets_min": 1572 }, { "epoch": 1.998299319727891, "grad_norm": 0.4928298103688405, "learning_rate": 3.5966355875365344e-05, "loss": 0.1748, "loss_nan_ranks": 0, "loss_rank_avg": 0.15711480379104614, "step": 1175, "valid_targets_mean": 3181.3, "valid_targets_min": 1284 }, { "epoch": 2.006802721088435, "grad_norm": 0.5046280559739479, "learning_rate": 3.591513304130076e-05, "loss": 0.166, "loss_nan_ranks": 0, "loss_rank_avg": 0.1728023886680603, "step": 1180, "valid_targets_mean": 3395.6, "valid_targets_min": 366 }, { "epoch": 2.0153061224489797, "grad_norm": 0.4858331630925101, "learning_rate": 3.586362398233072e-05, "loss": 0.174, "loss_nan_ranks": 0, "loss_rank_avg": 0.15058520436286926, "step": 1185, "valid_targets_mean": 3435.6, "valid_targets_min": 1263 }, { "epoch": 2.0238095238095237, "grad_norm": 0.4598459736943386, "learning_rate": 3.58118296248173e-05, "loss": 0.1638, "loss_nan_ranks": 0, "loss_rank_avg": 0.1740441918373108, "step": 1190, "valid_targets_mean": 4536.1, "valid_targets_min": 1025 }, { "epoch": 2.0323129251700682, "grad_norm": 0.5668851483118568, "learning_rate": 3.57597509002535e-05, "loss": 0.1599, "loss_nan_ranks": 0, "loss_rank_avg": 0.1615862250328064, "step": 1195, "valid_targets_mean": 3981.8, "valid_targets_min": 1479 }, { "epoch": 2.0408163265306123, "grad_norm": 0.5400385121875237, "learning_rate": 3.57073887452465e-05, "loss": 0.1663, "loss_nan_ranks": 0, "loss_rank_avg": 0.18597358465194702, "step": 1200, "valid_targets_mean": 3258.4, "valid_targets_min": 1617 }, { "epoch": 2.0493197278911564, "grad_norm": 0.5191849885658418, "learning_rate": 3.565474410150083e-05, "loss": 0.1622, "loss_nan_ranks": 0, "loss_rank_avg": 0.14795230329036713, "step": 1205, "valid_targets_mean": 3404.8, "valid_targets_min": 1328 }, { "epoch": 2.057823129251701, "grad_norm": 0.5615079980327268, "learning_rate": 3.560181791580144e-05, "loss": 0.1726, "loss_nan_ranks": 0, "loss_rank_avg": 0.1724962741136551, "step": 1210, "valid_targets_mean": 3804.8, "valid_targets_min": 1510 }, { "epoch": 2.066326530612245, "grad_norm": 0.5078447283351805, "learning_rate": 3.5548611139996634e-05, "loss": 0.1697, "loss_nan_ranks": 0, "loss_rank_avg": 0.18177998065948486, "step": 1215, "valid_targets_mean": 3558.1, "valid_targets_min": 1636 }, { "epoch": 2.074829931972789, "grad_norm": 0.5101085621115222, "learning_rate": 3.549512473098097e-05, "loss": 0.1668, "loss_nan_ranks": 0, "loss_rank_avg": 0.17449212074279785, "step": 1220, "valid_targets_mean": 3910.8, "valid_targets_min": 881 }, { "epoch": 2.0833333333333335, "grad_norm": 0.5548489837592624, "learning_rate": 3.544135965067807e-05, "loss": 0.1672, "loss_nan_ranks": 0, "loss_rank_avg": 0.1575036644935608, "step": 1225, "valid_targets_mean": 3391.7, "valid_targets_min": 1339 }, { "epoch": 2.0918367346938775, "grad_norm": 0.4790386496422741, "learning_rate": 3.5387316866023314e-05, "loss": 0.1697, "loss_nan_ranks": 0, "loss_rank_avg": 0.16516387462615967, "step": 1230, "valid_targets_mean": 4590.2, "valid_targets_min": 1000 }, { "epoch": 2.1003401360544216, "grad_norm": 0.5504333723509913, "learning_rate": 3.533299734894642e-05, "loss": 0.1667, "loss_nan_ranks": 0, "loss_rank_avg": 0.1627981960773468, "step": 1235, "valid_targets_mean": 3015.6, "valid_targets_min": 1230 }, { "epoch": 2.108843537414966, "grad_norm": 0.5147065086665726, "learning_rate": 3.527840207635399e-05, "loss": 0.1526, "loss_nan_ranks": 0, "loss_rank_avg": 0.14713545143604279, "step": 1240, "valid_targets_mean": 3302.9, "valid_targets_min": 1533 }, { "epoch": 2.11734693877551, "grad_norm": 0.49542337740054593, "learning_rate": 3.522353203011197e-05, "loss": 0.1683, "loss_nan_ranks": 0, "loss_rank_avg": 0.17458561062812805, "step": 1245, "valid_targets_mean": 3551.1, "valid_targets_min": 740 }, { "epoch": 2.1258503401360542, "grad_norm": 0.5262275942748199, "learning_rate": 3.5168388197027894e-05, "loss": 0.1608, "loss_nan_ranks": 0, "loss_rank_avg": 0.19332650303840637, "step": 1250, "valid_targets_mean": 3784.7, "valid_targets_min": 2209 }, { "epoch": 2.1343537414965987, "grad_norm": 0.5194049620721893, "learning_rate": 3.5112971568833265e-05, "loss": 0.1561, "loss_nan_ranks": 0, "loss_rank_avg": 0.1369602084159851, "step": 1255, "valid_targets_mean": 3164.5, "valid_targets_min": 1186 }, { "epoch": 2.142857142857143, "grad_norm": 0.4894157553384943, "learning_rate": 3.505728314216563e-05, "loss": 0.1725, "loss_nan_ranks": 0, "loss_rank_avg": 0.1559082269668579, "step": 1260, "valid_targets_mean": 3526.8, "valid_targets_min": 1441 }, { "epoch": 2.1513605442176873, "grad_norm": 0.5306280181793118, "learning_rate": 3.500132391855067e-05, "loss": 0.182, "loss_nan_ranks": 0, "loss_rank_avg": 0.1700558364391327, "step": 1265, "valid_targets_mean": 3411.9, "valid_targets_min": 1526 }, { "epoch": 2.1598639455782314, "grad_norm": 0.5439788996564396, "learning_rate": 3.494509490438422e-05, "loss": 0.1745, "loss_nan_ranks": 0, "loss_rank_avg": 0.17945188283920288, "step": 1270, "valid_targets_mean": 3294.2, "valid_targets_min": 1077 }, { "epoch": 2.1683673469387754, "grad_norm": 0.5426839393421363, "learning_rate": 3.4888597110914155e-05, "loss": 0.1702, "loss_nan_ranks": 0, "loss_rank_avg": 0.20356306433677673, "step": 1275, "valid_targets_mean": 3401.2, "valid_targets_min": 766 }, { "epoch": 2.17687074829932, "grad_norm": 0.49376468682501007, "learning_rate": 3.483183155422216e-05, "loss": 0.1551, "loss_nan_ranks": 0, "loss_rank_avg": 0.1475028395652771, "step": 1280, "valid_targets_mean": 3422.0, "valid_targets_min": 1364 }, { "epoch": 2.185374149659864, "grad_norm": 0.4822219704611301, "learning_rate": 3.477479925520555e-05, "loss": 0.1594, "loss_nan_ranks": 0, "loss_rank_avg": 0.18960726261138916, "step": 1285, "valid_targets_mean": 3851.6, "valid_targets_min": 701 }, { "epoch": 2.193877551020408, "grad_norm": 0.5238254870802262, "learning_rate": 3.471750123955878e-05, "loss": 0.1569, "loss_nan_ranks": 0, "loss_rank_avg": 0.17107030749320984, "step": 1290, "valid_targets_mean": 4155.1, "valid_targets_min": 1339 }, { "epoch": 2.2023809523809526, "grad_norm": 0.47745457726658785, "learning_rate": 3.465993853775516e-05, "loss": 0.1561, "loss_nan_ranks": 0, "loss_rank_avg": 0.15339364111423492, "step": 1295, "valid_targets_mean": 4033.9, "valid_targets_min": 1507 }, { "epoch": 2.2108843537414966, "grad_norm": 0.44068028477047305, "learning_rate": 3.460211218502815e-05, "loss": 0.1692, "loss_nan_ranks": 0, "loss_rank_avg": 0.1628030687570572, "step": 1300, "valid_targets_mean": 4219.1, "valid_targets_min": 1276 }, { "epoch": 2.2193877551020407, "grad_norm": 0.6017847646540015, "learning_rate": 3.45440232213529e-05, "loss": 0.1773, "loss_nan_ranks": 0, "loss_rank_avg": 0.17169851064682007, "step": 1305, "valid_targets_mean": 3840.2, "valid_targets_min": 280 }, { "epoch": 2.227891156462585, "grad_norm": 0.54520808841801, "learning_rate": 3.4485672691427416e-05, "loss": 0.1648, "loss_nan_ranks": 0, "loss_rank_avg": 0.14305715262889862, "step": 1310, "valid_targets_mean": 2790.1, "valid_targets_min": 1090 }, { "epoch": 2.2363945578231292, "grad_norm": 0.5069630613900863, "learning_rate": 3.4427061644653873e-05, "loss": 0.1803, "loss_nan_ranks": 0, "loss_rank_avg": 0.14984074234962463, "step": 1315, "valid_targets_mean": 3722.7, "valid_targets_min": 1552 }, { "epoch": 2.2448979591836733, "grad_norm": 0.5074028738160252, "learning_rate": 3.436819113511967e-05, "loss": 0.1553, "loss_nan_ranks": 0, "loss_rank_avg": 0.1426405906677246, "step": 1320, "valid_targets_mean": 3276.1, "valid_targets_min": 1724 }, { "epoch": 2.253401360544218, "grad_norm": 0.4860031673915145, "learning_rate": 3.43090622215785e-05, "loss": 0.1566, "loss_nan_ranks": 0, "loss_rank_avg": 0.13676658272743225, "step": 1325, "valid_targets_mean": 3905.1, "valid_targets_min": 910 }, { "epoch": 2.261904761904762, "grad_norm": 0.4673453723403358, "learning_rate": 3.4249675967431325e-05, "loss": 0.1502, "loss_nan_ranks": 0, "loss_rank_avg": 0.15425705909729004, "step": 1330, "valid_targets_mean": 3778.6, "valid_targets_min": 918 }, { "epoch": 2.270408163265306, "grad_norm": 0.5466310303785124, "learning_rate": 3.419003344070723e-05, "loss": 0.1571, "loss_nan_ranks": 0, "loss_rank_avg": 0.15783560276031494, "step": 1335, "valid_targets_mean": 2919.6, "valid_targets_min": 1198 }, { "epoch": 2.2789115646258504, "grad_norm": 0.5031432547752726, "learning_rate": 3.413013571404423e-05, "loss": 0.1729, "loss_nan_ranks": 0, "loss_rank_avg": 0.13498738408088684, "step": 1340, "valid_targets_mean": 3161.5, "valid_targets_min": 1101 }, { "epoch": 2.2874149659863945, "grad_norm": 0.4510753214929706, "learning_rate": 3.406998386466995e-05, "loss": 0.1503, "loss_nan_ranks": 0, "loss_rank_avg": 0.14579127728939056, "step": 1345, "valid_targets_mean": 4415.7, "valid_targets_min": 1551 }, { "epoch": 2.295918367346939, "grad_norm": 0.48263377269745095, "learning_rate": 3.400957897438229e-05, "loss": 0.1607, "loss_nan_ranks": 0, "loss_rank_avg": 0.15821559727191925, "step": 1350, "valid_targets_mean": 4076.9, "valid_targets_min": 1378 }, { "epoch": 2.304421768707483, "grad_norm": 0.5644267830161144, "learning_rate": 3.3948922129529935e-05, "loss": 0.1615, "loss_nan_ranks": 0, "loss_rank_avg": 0.19237931072711945, "step": 1355, "valid_targets_mean": 3423.6, "valid_targets_min": 1047 }, { "epoch": 2.312925170068027, "grad_norm": 0.49196181950491424, "learning_rate": 3.388801442099286e-05, "loss": 0.1578, "loss_nan_ranks": 0, "loss_rank_avg": 0.1689063459634781, "step": 1360, "valid_targets_mean": 3449.7, "valid_targets_min": 1569 }, { "epoch": 2.3214285714285716, "grad_norm": 0.7510781582658744, "learning_rate": 3.3826856944162655e-05, "loss": 0.1717, "loss_nan_ranks": 0, "loss_rank_avg": 0.1868104636669159, "step": 1365, "valid_targets_mean": 3785.6, "valid_targets_min": 1125 }, { "epoch": 2.3299319727891157, "grad_norm": 0.4746939257817625, "learning_rate": 3.376545079892288e-05, "loss": 0.181, "loss_nan_ranks": 0, "loss_rank_avg": 0.18635499477386475, "step": 1370, "valid_targets_mean": 4005.7, "valid_targets_min": 1397 }, { "epoch": 2.3384353741496597, "grad_norm": 0.47890327016140144, "learning_rate": 3.3703797089629245e-05, "loss": 0.1725, "loss_nan_ranks": 0, "loss_rank_avg": 0.15403881669044495, "step": 1375, "valid_targets_mean": 3932.6, "valid_targets_min": 429 }, { "epoch": 2.3469387755102042, "grad_norm": 0.6080390195957247, "learning_rate": 3.364189692508976e-05, "loss": 0.1651, "loss_nan_ranks": 0, "loss_rank_avg": 0.20440378785133362, "step": 1380, "valid_targets_mean": 3630.7, "valid_targets_min": 1517 }, { "epoch": 2.3554421768707483, "grad_norm": 0.5322930693149741, "learning_rate": 3.357975141854482e-05, "loss": 0.1837, "loss_nan_ranks": 0, "loss_rank_avg": 0.26613375544548035, "step": 1385, "valid_targets_mean": 3968.5, "valid_targets_min": 1073 }, { "epoch": 2.3639455782312924, "grad_norm": 0.4547239931273904, "learning_rate": 3.3517361687647136e-05, "loss": 0.1622, "loss_nan_ranks": 0, "loss_rank_avg": 0.1697888970375061, "step": 1390, "valid_targets_mean": 4553.2, "valid_targets_min": 1024 }, { "epoch": 2.372448979591837, "grad_norm": 0.5000330158435863, "learning_rate": 3.3454728854441667e-05, "loss": 0.1647, "loss_nan_ranks": 0, "loss_rank_avg": 0.15525534749031067, "step": 1395, "valid_targets_mean": 3786.2, "valid_targets_min": 1926 }, { "epoch": 2.380952380952381, "grad_norm": 0.413483824010835, "learning_rate": 3.3391854045345437e-05, "loss": 0.166, "loss_nan_ranks": 0, "loss_rank_avg": 0.15179120004177094, "step": 1400, "valid_targets_mean": 4099.1, "valid_targets_min": 1398 }, { "epoch": 2.389455782312925, "grad_norm": 0.554412863715429, "learning_rate": 3.332873839112727e-05, "loss": 0.1432, "loss_nan_ranks": 0, "loss_rank_avg": 0.15291377902030945, "step": 1405, "valid_targets_mean": 3096.1, "valid_targets_min": 1376 }, { "epoch": 2.3979591836734695, "grad_norm": 0.48293985993173416, "learning_rate": 3.3265383026887464e-05, "loss": 0.149, "loss_nan_ranks": 0, "loss_rank_avg": 0.14159250259399414, "step": 1410, "valid_targets_mean": 3414.8, "valid_targets_min": 1532 }, { "epoch": 2.4064625850340136, "grad_norm": 0.5300362438284278, "learning_rate": 3.320178909203735e-05, "loss": 0.1672, "loss_nan_ranks": 0, "loss_rank_avg": 0.17707979679107666, "step": 1415, "valid_targets_mean": 3817.1, "valid_targets_min": 1698 }, { "epoch": 2.4149659863945576, "grad_norm": 0.6038778356769944, "learning_rate": 3.313795773027885e-05, "loss": 0.1639, "loss_nan_ranks": 0, "loss_rank_avg": 0.19175416231155396, "step": 1420, "valid_targets_mean": 3383.4, "valid_targets_min": 590 }, { "epoch": 2.423469387755102, "grad_norm": 0.6333836363677777, "learning_rate": 3.307389008958385e-05, "loss": 0.1554, "loss_nan_ranks": 0, "loss_rank_avg": 0.16913290321826935, "step": 1425, "valid_targets_mean": 2575.2, "valid_targets_min": 787 }, { "epoch": 2.431972789115646, "grad_norm": 0.47277667370501736, "learning_rate": 3.30095873221736e-05, "loss": 0.1547, "loss_nan_ranks": 0, "loss_rank_avg": 0.15604209899902344, "step": 1430, "valid_targets_mean": 3869.1, "valid_targets_min": 1412 }, { "epoch": 2.4404761904761907, "grad_norm": 0.477865671202061, "learning_rate": 3.294505058449797e-05, "loss": 0.1695, "loss_nan_ranks": 0, "loss_rank_avg": 0.18286634981632233, "step": 1435, "valid_targets_mean": 5235.6, "valid_targets_min": 1369 }, { "epoch": 2.4489795918367347, "grad_norm": 0.48362971440543534, "learning_rate": 3.288028103721465e-05, "loss": 0.1646, "loss_nan_ranks": 0, "loss_rank_avg": 0.15418080985546112, "step": 1440, "valid_targets_mean": 3559.9, "valid_targets_min": 414 }, { "epoch": 2.457482993197279, "grad_norm": 0.5232022183706239, "learning_rate": 3.2815279845168296e-05, "loss": 0.1634, "loss_nan_ranks": 0, "loss_rank_avg": 0.18612605333328247, "step": 1445, "valid_targets_mean": 3365.7, "valid_targets_min": 1283 }, { "epoch": 2.4659863945578233, "grad_norm": 0.506042116749104, "learning_rate": 3.2750048177369554e-05, "loss": 0.1527, "loss_nan_ranks": 0, "loss_rank_avg": 0.18770621716976166, "step": 1450, "valid_targets_mean": 3635.6, "valid_targets_min": 1733 }, { "epoch": 2.4744897959183674, "grad_norm": 0.572670882166851, "learning_rate": 3.268458720697406e-05, "loss": 0.1677, "loss_nan_ranks": 0, "loss_rank_avg": 0.14232869446277618, "step": 1455, "valid_targets_mean": 2885.1, "valid_targets_min": 1269 }, { "epoch": 2.4829931972789114, "grad_norm": 0.5196864471454508, "learning_rate": 3.2618898111261316e-05, "loss": 0.1659, "loss_nan_ranks": 0, "loss_rank_avg": 0.13820812106132507, "step": 1460, "valid_targets_mean": 3341.0, "valid_targets_min": 820 }, { "epoch": 2.491496598639456, "grad_norm": 0.5015347039801419, "learning_rate": 3.2552982071613555e-05, "loss": 0.15, "loss_nan_ranks": 0, "loss_rank_avg": 0.13426734507083893, "step": 1465, "valid_targets_mean": 3133.6, "valid_targets_min": 1657 }, { "epoch": 2.5, "grad_norm": 0.4921036727094327, "learning_rate": 3.248684027349445e-05, "loss": 0.1549, "loss_nan_ranks": 0, "loss_rank_avg": 0.14220476150512695, "step": 1470, "valid_targets_mean": 3232.5, "valid_targets_min": 1359 }, { "epoch": 2.508503401360544, "grad_norm": 0.44217854739998835, "learning_rate": 3.2420473906427824e-05, "loss": 0.1635, "loss_nan_ranks": 0, "loss_rank_avg": 0.17743223905563354, "step": 1475, "valid_targets_mean": 4313.5, "valid_targets_min": 1603 }, { "epoch": 2.5170068027210886, "grad_norm": 0.4778736306901132, "learning_rate": 3.235388416397626e-05, "loss": 0.1512, "loss_nan_ranks": 0, "loss_rank_avg": 0.16074007749557495, "step": 1480, "valid_targets_mean": 3948.7, "valid_targets_min": 1540 }, { "epoch": 2.5255102040816326, "grad_norm": 0.6095052805264233, "learning_rate": 3.228707224371961e-05, "loss": 0.1599, "loss_nan_ranks": 0, "loss_rank_avg": 0.17271192371845245, "step": 1485, "valid_targets_mean": 3558.2, "valid_targets_min": 1375 }, { "epoch": 2.534013605442177, "grad_norm": 0.45590045375975136, "learning_rate": 3.222003934723347e-05, "loss": 0.1654, "loss_nan_ranks": 0, "loss_rank_avg": 0.1279994696378708, "step": 1490, "valid_targets_mean": 3846.9, "valid_targets_min": 1859 }, { "epoch": 2.542517006802721, "grad_norm": 0.49738813457635117, "learning_rate": 3.215278668006757e-05, "loss": 0.1636, "loss_nan_ranks": 0, "loss_rank_avg": 0.1717885434627533, "step": 1495, "valid_targets_mean": 3760.4, "valid_targets_min": 1279 }, { "epoch": 2.5510204081632653, "grad_norm": 0.4090299383293233, "learning_rate": 3.208531545172413e-05, "loss": 0.1552, "loss_nan_ranks": 0, "loss_rank_avg": 0.15844562649726868, "step": 1500, "valid_targets_mean": 4329.8, "valid_targets_min": 1368 }, { "epoch": 2.5595238095238093, "grad_norm": 0.5431786244764008, "learning_rate": 3.2017626875636024e-05, "loss": 0.1546, "loss_nan_ranks": 0, "loss_rank_avg": 0.14518578350543976, "step": 1505, "valid_targets_mean": 3229.6, "valid_targets_min": 1434 }, { "epoch": 2.568027210884354, "grad_norm": 0.49615820264902144, "learning_rate": 3.194972216914502e-05, "loss": 0.1529, "loss_nan_ranks": 0, "loss_rank_avg": 0.1399931013584137, "step": 1510, "valid_targets_mean": 3413.1, "valid_targets_min": 670 }, { "epoch": 2.576530612244898, "grad_norm": 0.9718435300877193, "learning_rate": 3.18816025534799e-05, "loss": 0.1888, "loss_nan_ranks": 0, "loss_rank_avg": 0.1514762043952942, "step": 1515, "valid_targets_mean": 3781.0, "valid_targets_min": 1671 }, { "epoch": 2.5850340136054424, "grad_norm": 0.5068549521619831, "learning_rate": 3.181326925373443e-05, "loss": 0.177, "loss_nan_ranks": 0, "loss_rank_avg": 0.19092750549316406, "step": 1520, "valid_targets_mean": 4007.5, "valid_targets_min": 1248 }, { "epoch": 2.5935374149659864, "grad_norm": 0.47078024333063895, "learning_rate": 3.174472349884539e-05, "loss": 0.1794, "loss_nan_ranks": 0, "loss_rank_avg": 0.13935624063014984, "step": 1525, "valid_targets_mean": 3828.7, "valid_targets_min": 893 }, { "epoch": 2.6020408163265305, "grad_norm": 0.4738214558863609, "learning_rate": 3.1675966521570444e-05, "loss": 0.1616, "loss_nan_ranks": 0, "loss_rank_avg": 0.14629226922988892, "step": 1530, "valid_targets_mean": 3698.9, "valid_targets_min": 1408 }, { "epoch": 2.6105442176870746, "grad_norm": 0.49017231137420236, "learning_rate": 3.160699955846597e-05, "loss": 0.1658, "loss_nan_ranks": 0, "loss_rank_avg": 0.15869465470314026, "step": 1535, "valid_targets_mean": 3895.1, "valid_targets_min": 1622 }, { "epoch": 2.619047619047619, "grad_norm": 0.5202593666777702, "learning_rate": 3.1537823849864834e-05, "loss": 0.1703, "loss_nan_ranks": 0, "loss_rank_avg": 0.20912855863571167, "step": 1540, "valid_targets_mean": 3743.7, "valid_targets_min": 912 }, { "epoch": 2.627551020408163, "grad_norm": 0.5005906380020121, "learning_rate": 3.1468440639854056e-05, "loss": 0.1535, "loss_nan_ranks": 0, "loss_rank_avg": 0.13278600573539734, "step": 1545, "valid_targets_mean": 3161.0, "valid_targets_min": 1611 }, { "epoch": 2.6360544217687076, "grad_norm": 0.4999686965484099, "learning_rate": 3.139885117625249e-05, "loss": 0.1587, "loss_nan_ranks": 0, "loss_rank_avg": 0.15896578133106232, "step": 1550, "valid_targets_mean": 3742.4, "valid_targets_min": 1355 }, { "epoch": 2.6445578231292517, "grad_norm": 0.5263565414304656, "learning_rate": 3.132905671058831e-05, "loss": 0.1594, "loss_nan_ranks": 0, "loss_rank_avg": 0.18690796196460724, "step": 1555, "valid_targets_mean": 4175.1, "valid_targets_min": 1608 }, { "epoch": 2.6530612244897958, "grad_norm": 0.46022006535755816, "learning_rate": 3.1259058498076554e-05, "loss": 0.158, "loss_nan_ranks": 0, "loss_rank_avg": 0.1319347470998764, "step": 1560, "valid_targets_mean": 3780.4, "valid_targets_min": 1459 }, { "epoch": 2.6615646258503403, "grad_norm": 0.48588937455117837, "learning_rate": 3.1188857797596545e-05, "loss": 0.1568, "loss_nan_ranks": 0, "loss_rank_avg": 0.12452636659145355, "step": 1565, "valid_targets_mean": 2937.5, "valid_targets_min": 1096 }, { "epoch": 2.6700680272108843, "grad_norm": 0.5191575759086287, "learning_rate": 3.111845587166922e-05, "loss": 0.1654, "loss_nan_ranks": 0, "loss_rank_avg": 0.2404664009809494, "step": 1570, "valid_targets_mean": 4137.2, "valid_targets_min": 1510 }, { "epoch": 2.678571428571429, "grad_norm": 0.5208651523922655, "learning_rate": 3.104785398643447e-05, "loss": 0.1648, "loss_nan_ranks": 0, "loss_rank_avg": 0.14865821599960327, "step": 1575, "valid_targets_mean": 2932.2, "valid_targets_min": 292 }, { "epoch": 2.687074829931973, "grad_norm": 0.4114567953463469, "learning_rate": 3.0977053411628315e-05, "loss": 0.1462, "loss_nan_ranks": 0, "loss_rank_avg": 0.14979563653469086, "step": 1580, "valid_targets_mean": 4161.8, "valid_targets_min": 1572 }, { "epoch": 2.695578231292517, "grad_norm": 0.4913074740374502, "learning_rate": 3.090605542056013e-05, "loss": 0.1776, "loss_nan_ranks": 0, "loss_rank_avg": 0.15900972485542297, "step": 1585, "valid_targets_mean": 3456.5, "valid_targets_min": 1115 }, { "epoch": 2.704081632653061, "grad_norm": 0.4442392356579173, "learning_rate": 3.083486129008967e-05, "loss": 0.1664, "loss_nan_ranks": 0, "loss_rank_avg": 0.18399524688720703, "step": 1590, "valid_targets_mean": 4740.0, "valid_targets_min": 1565 }, { "epoch": 2.7125850340136055, "grad_norm": 0.4754861826964586, "learning_rate": 3.07634723006042e-05, "loss": 0.1602, "loss_nan_ranks": 0, "loss_rank_avg": 0.1808849275112152, "step": 1595, "valid_targets_mean": 4251.0, "valid_targets_min": 1249 }, { "epoch": 2.7210884353741496, "grad_norm": 0.4655468525053816, "learning_rate": 3.069188973599538e-05, "loss": 0.1513, "loss_nan_ranks": 0, "loss_rank_avg": 0.1294795274734497, "step": 1600, "valid_targets_mean": 3314.2, "valid_targets_min": 723 }, { "epoch": 2.729591836734694, "grad_norm": 0.43464410382803953, "learning_rate": 3.062011488363623e-05, "loss": 0.1562, "loss_nan_ranks": 0, "loss_rank_avg": 0.147240549325943, "step": 1605, "valid_targets_mean": 3935.8, "valid_targets_min": 1130 }, { "epoch": 2.738095238095238, "grad_norm": 0.46040122910771636, "learning_rate": 3.054814903435794e-05, "loss": 0.1624, "loss_nan_ranks": 0, "loss_rank_avg": 0.14695018529891968, "step": 1610, "valid_targets_mean": 3722.0, "valid_targets_min": 1673 }, { "epoch": 2.746598639455782, "grad_norm": 0.45733532745749556, "learning_rate": 3.0475993482426695e-05, "loss": 0.1705, "loss_nan_ranks": 0, "loss_rank_avg": 0.2099800556898117, "step": 1615, "valid_targets_mean": 4918.6, "valid_targets_min": 1845 }, { "epoch": 2.7551020408163263, "grad_norm": 0.4956060655830285, "learning_rate": 3.0403649525520374e-05, "loss": 0.1727, "loss_nan_ranks": 0, "loss_rank_avg": 0.18889182806015015, "step": 1620, "valid_targets_mean": 3856.4, "valid_targets_min": 988 }, { "epoch": 2.7636054421768708, "grad_norm": 0.4768716386514472, "learning_rate": 3.033111846470521e-05, "loss": 0.156, "loss_nan_ranks": 0, "loss_rank_avg": 0.15743374824523926, "step": 1625, "valid_targets_mean": 3608.8, "valid_targets_min": 872 }, { "epoch": 2.772108843537415, "grad_norm": 0.525730309515445, "learning_rate": 3.02584016044124e-05, "loss": 0.1562, "loss_nan_ranks": 0, "loss_rank_avg": 0.15813755989074707, "step": 1630, "valid_targets_mean": 3100.8, "valid_targets_min": 642 }, { "epoch": 2.7806122448979593, "grad_norm": 0.5351477674686339, "learning_rate": 3.0185500252414633e-05, "loss": 0.1613, "loss_nan_ranks": 0, "loss_rank_avg": 0.16096732020378113, "step": 1635, "valid_targets_mean": 3815.7, "valid_targets_min": 1239 }, { "epoch": 2.7891156462585034, "grad_norm": 0.4716262544441501, "learning_rate": 3.01124157198026e-05, "loss": 0.1635, "loss_nan_ranks": 0, "loss_rank_avg": 0.1661742478609085, "step": 1640, "valid_targets_mean": 3724.4, "valid_targets_min": 1140 }, { "epoch": 2.7976190476190474, "grad_norm": 0.4138239303384503, "learning_rate": 3.003914932096137e-05, "loss": 0.1554, "loss_nan_ranks": 0, "loss_rank_avg": 0.16232448816299438, "step": 1645, "valid_targets_mean": 4448.6, "valid_targets_min": 1633 }, { "epoch": 2.806122448979592, "grad_norm": 0.46852819112237687, "learning_rate": 2.99657023735468e-05, "loss": 0.1726, "loss_nan_ranks": 0, "loss_rank_avg": 0.20756766200065613, "step": 1650, "valid_targets_mean": 4463.3, "valid_targets_min": 1380 }, { "epoch": 2.814625850340136, "grad_norm": 0.39483602863790196, "learning_rate": 2.9892076198461794e-05, "loss": 0.153, "loss_nan_ranks": 0, "loss_rank_avg": 0.1203012689948082, "step": 1655, "valid_targets_mean": 4115.1, "valid_targets_min": 859 }, { "epoch": 2.8231292517006805, "grad_norm": 0.48880278190048604, "learning_rate": 2.9818272119832576e-05, "loss": 0.1598, "loss_nan_ranks": 0, "loss_rank_avg": 0.17082348465919495, "step": 1660, "valid_targets_mean": 3551.8, "valid_targets_min": 692 }, { "epoch": 2.8316326530612246, "grad_norm": 0.41769851905531785, "learning_rate": 2.974429146498487e-05, "loss": 0.1546, "loss_nan_ranks": 0, "loss_rank_avg": 0.1666543036699295, "step": 1665, "valid_targets_mean": 4539.7, "valid_targets_min": 1299 }, { "epoch": 2.8401360544217686, "grad_norm": 0.5016505396489435, "learning_rate": 2.9670135564420016e-05, "loss": 0.1596, "loss_nan_ranks": 0, "loss_rank_avg": 0.1940472573041916, "step": 1670, "valid_targets_mean": 3977.4, "valid_targets_min": 1537 }, { "epoch": 2.8486394557823127, "grad_norm": 0.5166302635070413, "learning_rate": 2.9595805751791068e-05, "loss": 0.1684, "loss_nan_ranks": 0, "loss_rank_avg": 0.17951983213424683, "step": 1675, "valid_targets_mean": 3933.2, "valid_targets_min": 793 }, { "epoch": 2.857142857142857, "grad_norm": 0.5379845678232543, "learning_rate": 2.9521303363878774e-05, "loss": 0.152, "loss_nan_ranks": 0, "loss_rank_avg": 0.1659054160118103, "step": 1680, "valid_targets_mean": 2871.5, "valid_targets_min": 1082 }, { "epoch": 2.8656462585034013, "grad_norm": 0.4656889105961351, "learning_rate": 2.9446629740567566e-05, "loss": 0.1741, "loss_nan_ranks": 0, "loss_rank_avg": 0.16753873229026794, "step": 1685, "valid_targets_mean": 3887.4, "valid_targets_min": 795 }, { "epoch": 2.8741496598639458, "grad_norm": 0.4930852645072521, "learning_rate": 2.9371786224821447e-05, "loss": 0.1735, "loss_nan_ranks": 0, "loss_rank_avg": 0.16282245516777039, "step": 1690, "valid_targets_mean": 3396.2, "valid_targets_min": 1712 }, { "epoch": 2.88265306122449, "grad_norm": 0.4445771945139776, "learning_rate": 2.9296774162659836e-05, "loss": 0.1749, "loss_nan_ranks": 0, "loss_rank_avg": 0.1767793595790863, "step": 1695, "valid_targets_mean": 4715.9, "valid_targets_min": 1373 }, { "epoch": 2.891156462585034, "grad_norm": 0.543109477480171, "learning_rate": 2.9221594903133385e-05, "loss": 0.1592, "loss_nan_ranks": 0, "loss_rank_avg": 0.14414627850055695, "step": 1700, "valid_targets_mean": 3009.1, "valid_targets_min": 325 }, { "epoch": 2.8996598639455784, "grad_norm": 0.5234711869685756, "learning_rate": 2.9146249798299672e-05, "loss": 0.162, "loss_nan_ranks": 0, "loss_rank_avg": 0.160060852766037, "step": 1705, "valid_targets_mean": 3624.4, "valid_targets_min": 1171 }, { "epoch": 2.9081632653061225, "grad_norm": 0.4908520083423699, "learning_rate": 2.9070740203198927e-05, "loss": 0.1741, "loss_nan_ranks": 0, "loss_rank_avg": 0.1625441312789917, "step": 1710, "valid_targets_mean": 3220.1, "valid_targets_min": 1120 }, { "epoch": 2.9166666666666665, "grad_norm": 0.4785558145751867, "learning_rate": 2.899506747582965e-05, "loss": 0.1631, "loss_nan_ranks": 0, "loss_rank_avg": 0.17338773608207703, "step": 1715, "valid_targets_mean": 3640.5, "valid_targets_min": 906 }, { "epoch": 2.925170068027211, "grad_norm": 0.5088298122894733, "learning_rate": 2.8919232977124177e-05, "loss": 0.1694, "loss_nan_ranks": 0, "loss_rank_avg": 0.1554885059595108, "step": 1720, "valid_targets_mean": 3226.2, "valid_targets_min": 1437 }, { "epoch": 2.933673469387755, "grad_norm": 0.453368913569161, "learning_rate": 2.884323807092423e-05, "loss": 0.1602, "loss_nan_ranks": 0, "loss_rank_avg": 0.17843785881996155, "step": 1725, "valid_targets_mean": 4037.4, "valid_targets_min": 1673 }, { "epoch": 2.942176870748299, "grad_norm": 0.5177514931490083, "learning_rate": 2.8767084123956334e-05, "loss": 0.1706, "loss_nan_ranks": 0, "loss_rank_avg": 0.178394615650177, "step": 1730, "valid_targets_mean": 3508.4, "valid_targets_min": 1662 }, { "epoch": 2.9506802721088436, "grad_norm": 0.5779374351888202, "learning_rate": 2.8690772505807307e-05, "loss": 0.173, "loss_nan_ranks": 0, "loss_rank_avg": 0.18779624998569489, "step": 1735, "valid_targets_mean": 3212.1, "valid_targets_min": 1016 }, { "epoch": 2.9591836734693877, "grad_norm": 0.5146721357707493, "learning_rate": 2.8614304588899588e-05, "loss": 0.1467, "loss_nan_ranks": 0, "loss_rank_avg": 0.15629920363426208, "step": 1740, "valid_targets_mean": 4015.6, "valid_targets_min": 1070 }, { "epoch": 2.967687074829932, "grad_norm": 0.5189251797092681, "learning_rate": 2.8537681748466557e-05, "loss": 0.1634, "loss_nan_ranks": 0, "loss_rank_avg": 0.1510303020477295, "step": 1745, "valid_targets_mean": 3674.2, "valid_targets_min": 1773 }, { "epoch": 2.9761904761904763, "grad_norm": 0.46502180173420404, "learning_rate": 2.8460905362527832e-05, "loss": 0.149, "loss_nan_ranks": 0, "loss_rank_avg": 0.15194571018218994, "step": 1750, "valid_targets_mean": 3294.1, "valid_targets_min": 1422 }, { "epoch": 2.9846938775510203, "grad_norm": 0.4304082658436519, "learning_rate": 2.8383976811864416e-05, "loss": 0.1708, "loss_nan_ranks": 0, "loss_rank_avg": 0.20454227924346924, "step": 1755, "valid_targets_mean": 4752.8, "valid_targets_min": 1493 }, { "epoch": 2.9931972789115644, "grad_norm": 0.508324313644312, "learning_rate": 2.8306897479993954e-05, "loss": 0.1723, "loss_nan_ranks": 0, "loss_rank_avg": 0.18964369595050812, "step": 1760, "valid_targets_mean": 3695.0, "valid_targets_min": 629 }, { "epoch": 3.001700680272109, "grad_norm": 0.4784598662881332, "learning_rate": 2.8229668753145797e-05, "loss": 0.1735, "loss_nan_ranks": 0, "loss_rank_avg": 0.1313592791557312, "step": 1765, "valid_targets_mean": 3611.9, "valid_targets_min": 1092 }, { "epoch": 3.010204081632653, "grad_norm": 0.8446031086831215, "learning_rate": 2.815229202023607e-05, "loss": 0.1375, "loss_nan_ranks": 0, "loss_rank_avg": 0.1230715960264206, "step": 1770, "valid_targets_mean": 3435.1, "valid_targets_min": 1306 }, { "epoch": 3.0187074829931975, "grad_norm": 0.492834562909989, "learning_rate": 2.8074768672842716e-05, "loss": 0.1425, "loss_nan_ranks": 0, "loss_rank_avg": 0.1337684690952301, "step": 1775, "valid_targets_mean": 4209.7, "valid_targets_min": 1836 }, { "epoch": 3.0272108843537415, "grad_norm": 0.4601608816984647, "learning_rate": 2.7997100105180455e-05, "loss": 0.1358, "loss_nan_ranks": 0, "loss_rank_avg": 0.1252722293138504, "step": 1780, "valid_targets_mean": 4082.4, "valid_targets_min": 1347 }, { "epoch": 3.0357142857142856, "grad_norm": 0.5489375507244738, "learning_rate": 2.7919287714075714e-05, "loss": 0.1546, "loss_nan_ranks": 0, "loss_rank_avg": 0.18662264943122864, "step": 1785, "valid_targets_mean": 3715.5, "valid_targets_min": 1090 }, { "epoch": 3.04421768707483, "grad_norm": 0.5083714260327757, "learning_rate": 2.7841332898941513e-05, "loss": 0.1452, "loss_nan_ranks": 0, "loss_rank_avg": 0.16233694553375244, "step": 1790, "valid_targets_mean": 3814.8, "valid_targets_min": 1574 }, { "epoch": 3.052721088435374, "grad_norm": 0.6619518014596226, "learning_rate": 2.7763237061752276e-05, "loss": 0.1309, "loss_nan_ranks": 0, "loss_rank_avg": 0.11884614080190659, "step": 1795, "valid_targets_mean": 3849.1, "valid_targets_min": 1576 }, { "epoch": 3.061224489795918, "grad_norm": 0.4621308813867603, "learning_rate": 2.768500160701864e-05, "loss": 0.1377, "loss_nan_ranks": 0, "loss_rank_avg": 0.1337064951658249, "step": 1800, "valid_targets_mean": 4491.9, "valid_targets_min": 1548 }, { "epoch": 3.0697278911564627, "grad_norm": 0.46021745248167184, "learning_rate": 2.7606627941762186e-05, "loss": 0.1333, "loss_nan_ranks": 0, "loss_rank_avg": 0.10864484310150146, "step": 1805, "valid_targets_mean": 3335.6, "valid_targets_min": 1564 }, { "epoch": 3.078231292517007, "grad_norm": 0.5483839712270409, "learning_rate": 2.752811747549013e-05, "loss": 0.1512, "loss_nan_ranks": 0, "loss_rank_avg": 0.1714896559715271, "step": 1810, "valid_targets_mean": 3205.5, "valid_targets_min": 1136 }, { "epoch": 3.086734693877551, "grad_norm": 0.5202727539029218, "learning_rate": 2.7449471620169988e-05, "loss": 0.149, "loss_nan_ranks": 0, "loss_rank_avg": 0.11642484366893768, "step": 1815, "valid_targets_mean": 3250.6, "valid_targets_min": 826 }, { "epoch": 3.0952380952380953, "grad_norm": 0.5993960429294215, "learning_rate": 2.7370691790204173e-05, "loss": 0.1655, "loss_nan_ranks": 0, "loss_rank_avg": 0.14193883538246155, "step": 1820, "valid_targets_mean": 3056.0, "valid_targets_min": 1417 }, { "epoch": 3.1037414965986394, "grad_norm": 0.4559839126604544, "learning_rate": 2.7291779402404538e-05, "loss": 0.1423, "loss_nan_ranks": 0, "loss_rank_avg": 0.1268749088048935, "step": 1825, "valid_targets_mean": 3777.4, "valid_targets_min": 1210 }, { "epoch": 3.1122448979591835, "grad_norm": 0.5604579578162319, "learning_rate": 2.7212735875966946e-05, "loss": 0.1374, "loss_nan_ranks": 0, "loss_rank_avg": 0.12619996070861816, "step": 1830, "valid_targets_mean": 3083.2, "valid_targets_min": 668 }, { "epoch": 3.120748299319728, "grad_norm": 0.5438820371018678, "learning_rate": 2.713356263244569e-05, "loss": 0.143, "loss_nan_ranks": 0, "loss_rank_avg": 0.1503400355577469, "step": 1835, "valid_targets_mean": 4212.8, "valid_targets_min": 1288 }, { "epoch": 3.129251700680272, "grad_norm": 0.5195545679371458, "learning_rate": 2.7054261095727977e-05, "loss": 0.1494, "loss_nan_ranks": 0, "loss_rank_avg": 0.16384392976760864, "step": 1840, "valid_targets_mean": 3396.9, "valid_targets_min": 1215 }, { "epoch": 3.137755102040816, "grad_norm": 0.5113512295726848, "learning_rate": 2.6974832692008278e-05, "loss": 0.1511, "loss_nan_ranks": 0, "loss_rank_avg": 0.14530371129512787, "step": 1845, "valid_targets_mean": 3812.4, "valid_targets_min": 468 }, { "epoch": 3.1462585034013606, "grad_norm": 0.49306040169984283, "learning_rate": 2.6895278849762694e-05, "loss": 0.1409, "loss_nan_ranks": 0, "loss_rank_avg": 0.14059320092201233, "step": 1850, "valid_targets_mean": 4135.6, "valid_targets_min": 1137 }, { "epoch": 3.1547619047619047, "grad_norm": 0.4826789386729217, "learning_rate": 2.68156009997233e-05, "loss": 0.1374, "loss_nan_ranks": 0, "loss_rank_avg": 0.12108274549245834, "step": 1855, "valid_targets_mean": 3404.0, "valid_targets_min": 1535 }, { "epoch": 3.163265306122449, "grad_norm": 0.509069211171738, "learning_rate": 2.673580057485234e-05, "loss": 0.1376, "loss_nan_ranks": 0, "loss_rank_avg": 0.1607593148946762, "step": 1860, "valid_targets_mean": 3872.3, "valid_targets_min": 1520 }, { "epoch": 3.171768707482993, "grad_norm": 0.5481617769731713, "learning_rate": 2.6655879010316535e-05, "loss": 0.1616, "loss_nan_ranks": 0, "loss_rank_avg": 0.19412599503993988, "step": 1865, "valid_targets_mean": 3780.2, "valid_targets_min": 1849 }, { "epoch": 3.1802721088435373, "grad_norm": 0.4726239103908885, "learning_rate": 2.657583774346121e-05, "loss": 0.1426, "loss_nan_ranks": 0, "loss_rank_avg": 0.14381511509418488, "step": 1870, "valid_targets_mean": 4229.1, "valid_targets_min": 1817 }, { "epoch": 3.188775510204082, "grad_norm": 0.5674638452522066, "learning_rate": 2.649567821378449e-05, "loss": 0.1439, "loss_nan_ranks": 0, "loss_rank_avg": 0.13234567642211914, "step": 1875, "valid_targets_mean": 2603.2, "valid_targets_min": 1594 }, { "epoch": 3.197278911564626, "grad_norm": 0.4844284742271353, "learning_rate": 2.641540186291138e-05, "loss": 0.1321, "loss_nan_ranks": 0, "loss_rank_avg": 0.11232699453830719, "step": 1880, "valid_targets_mean": 3777.3, "valid_targets_min": 414 }, { "epoch": 3.20578231292517, "grad_norm": 0.5928341730053119, "learning_rate": 2.6335010134567852e-05, "loss": 0.1446, "loss_nan_ranks": 0, "loss_rank_avg": 0.1312047839164734, "step": 1885, "valid_targets_mean": 3397.1, "valid_targets_min": 1745 }, { "epoch": 3.2142857142857144, "grad_norm": 0.45839469775941877, "learning_rate": 2.6254504474554883e-05, "loss": 0.1567, "loss_nan_ranks": 0, "loss_rank_avg": 0.1701536476612091, "step": 1890, "valid_targets_mean": 4128.9, "valid_targets_min": 1446 }, { "epoch": 3.2227891156462585, "grad_norm": 0.5008710719767632, "learning_rate": 2.617388633072244e-05, "loss": 0.1362, "loss_nan_ranks": 0, "loss_rank_avg": 0.15137995779514313, "step": 1895, "valid_targets_mean": 3451.7, "valid_targets_min": 1403 }, { "epoch": 3.2312925170068025, "grad_norm": 0.5827041310129761, "learning_rate": 2.609315715294346e-05, "loss": 0.1451, "loss_nan_ranks": 0, "loss_rank_avg": 0.14786767959594727, "step": 1900, "valid_targets_mean": 3197.5, "valid_targets_min": 844 }, { "epoch": 3.239795918367347, "grad_norm": 0.4774939218788078, "learning_rate": 2.6012318393087754e-05, "loss": 0.143, "loss_nan_ranks": 0, "loss_rank_avg": 0.12262146174907684, "step": 1905, "valid_targets_mean": 3974.2, "valid_targets_min": 1129 }, { "epoch": 3.248299319727891, "grad_norm": 2.3012934366864584, "learning_rate": 2.593137150499591e-05, "loss": 0.1398, "loss_nan_ranks": 0, "loss_rank_avg": 0.16141125559806824, "step": 1910, "valid_targets_mean": 3124.3, "valid_targets_min": 1540 }, { "epoch": 3.2568027210884356, "grad_norm": 0.5643599785855004, "learning_rate": 2.5850317944453153e-05, "loss": 0.1363, "loss_nan_ranks": 0, "loss_rank_avg": 0.12558527290821075, "step": 1915, "valid_targets_mean": 3054.8, "valid_targets_min": 1355 }, { "epoch": 3.2653061224489797, "grad_norm": 0.47636899169835173, "learning_rate": 2.5769159169163137e-05, "loss": 0.146, "loss_nan_ranks": 0, "loss_rank_avg": 0.12280717492103577, "step": 1920, "valid_targets_mean": 4109.9, "valid_targets_min": 738 }, { "epoch": 3.2738095238095237, "grad_norm": 0.5063508169912114, "learning_rate": 2.568789663872175e-05, "loss": 0.1353, "loss_nan_ranks": 0, "loss_rank_avg": 0.15989241003990173, "step": 1925, "valid_targets_mean": 3856.1, "valid_targets_min": 1107 }, { "epoch": 3.282312925170068, "grad_norm": 0.4811148388189251, "learning_rate": 2.5606531814590868e-05, "loss": 0.1366, "loss_nan_ranks": 0, "loss_rank_avg": 0.1412792056798935, "step": 1930, "valid_targets_mean": 3863.6, "valid_targets_min": 1217 }, { "epoch": 3.2908163265306123, "grad_norm": 0.49396827270191446, "learning_rate": 2.552506616007205e-05, "loss": 0.1629, "loss_nan_ranks": 0, "loss_rank_avg": 0.16188889741897583, "step": 1935, "valid_targets_mean": 4214.9, "valid_targets_min": 1171 }, { "epoch": 3.2993197278911564, "grad_norm": 0.5027361991896958, "learning_rate": 2.544350114028025e-05, "loss": 0.1369, "loss_nan_ranks": 0, "loss_rank_avg": 0.12943832576274872, "step": 1940, "valid_targets_mean": 3637.8, "valid_targets_min": 1012 }, { "epoch": 3.307823129251701, "grad_norm": 0.493648390936752, "learning_rate": 2.5361838222117435e-05, "loss": 0.1544, "loss_nan_ranks": 0, "loss_rank_avg": 0.1386047899723053, "step": 1945, "valid_targets_mean": 3566.7, "valid_targets_min": 906 }, { "epoch": 3.316326530612245, "grad_norm": 0.4934917907617171, "learning_rate": 2.5280078874246227e-05, "loss": 0.1413, "loss_nan_ranks": 0, "loss_rank_avg": 0.1620742529630661, "step": 1950, "valid_targets_mean": 3895.6, "valid_targets_min": 1382 }, { "epoch": 3.324829931972789, "grad_norm": 0.5812143740145603, "learning_rate": 2.519822456706349e-05, "loss": 0.1518, "loss_nan_ranks": 0, "loss_rank_avg": 0.17321470379829407, "step": 1955, "valid_targets_mean": 3244.1, "valid_targets_min": 1364 }, { "epoch": 3.3333333333333335, "grad_norm": 0.5157880709455498, "learning_rate": 2.5116276772673863e-05, "loss": 0.1653, "loss_nan_ranks": 0, "loss_rank_avg": 0.23097273707389832, "step": 1960, "valid_targets_mean": 4115.7, "valid_targets_min": 1517 }, { "epoch": 3.3418367346938775, "grad_norm": 0.44313842009506144, "learning_rate": 2.503423696486332e-05, "loss": 0.1388, "loss_nan_ranks": 0, "loss_rank_avg": 0.13994191586971283, "step": 1965, "valid_targets_mean": 4884.8, "valid_targets_min": 868 }, { "epoch": 3.3503401360544216, "grad_norm": 0.4904305036943379, "learning_rate": 2.495210661907263e-05, "loss": 0.1395, "loss_nan_ranks": 0, "loss_rank_avg": 0.1328560709953308, "step": 1970, "valid_targets_mean": 3285.6, "valid_targets_min": 506 }, { "epoch": 3.358843537414966, "grad_norm": 0.5443084350560426, "learning_rate": 2.4869887212370847e-05, "loss": 0.161, "loss_nan_ranks": 0, "loss_rank_avg": 0.12956424057483673, "step": 1975, "valid_targets_mean": 3053.5, "valid_targets_min": 1435 }, { "epoch": 3.36734693877551, "grad_norm": 0.4573267525975133, "learning_rate": 2.4787580223428736e-05, "loss": 0.1337, "loss_nan_ranks": 0, "loss_rank_avg": 0.11794184893369675, "step": 1980, "valid_targets_mean": 3524.2, "valid_targets_min": 1558 }, { "epoch": 3.3758503401360542, "grad_norm": 0.48589338823426165, "learning_rate": 2.470518713249217e-05, "loss": 0.1445, "loss_nan_ranks": 0, "loss_rank_avg": 0.14002826809883118, "step": 1985, "valid_targets_mean": 3914.6, "valid_targets_min": 1507 }, { "epoch": 3.3843537414965987, "grad_norm": 0.5119561537935591, "learning_rate": 2.4622709421355535e-05, "loss": 0.1374, "loss_nan_ranks": 0, "loss_rank_avg": 0.15183639526367188, "step": 1990, "valid_targets_mean": 3411.4, "valid_targets_min": 1311 }, { "epoch": 3.392857142857143, "grad_norm": 0.48761202799121056, "learning_rate": 2.4540148573335057e-05, "loss": 0.1305, "loss_nan_ranks": 0, "loss_rank_avg": 0.14358212053775787, "step": 1995, "valid_targets_mean": 3778.9, "valid_targets_min": 1430 }, { "epoch": 3.4013605442176873, "grad_norm": 0.5091769846013783, "learning_rate": 2.445750607324212e-05, "loss": 0.1283, "loss_nan_ranks": 0, "loss_rank_avg": 0.12895150482654572, "step": 2000, "valid_targets_mean": 3439.9, "valid_targets_min": 1228 }, { "epoch": 3.4098639455782314, "grad_norm": 0.46277855706597215, "learning_rate": 2.4374783407356602e-05, "loss": 0.1502, "loss_nan_ranks": 0, "loss_rank_avg": 0.13825930655002594, "step": 2005, "valid_targets_mean": 4161.5, "valid_targets_min": 1542 }, { "epoch": 3.4183673469387754, "grad_norm": 0.5182823416136738, "learning_rate": 2.4291982063400096e-05, "loss": 0.1536, "loss_nan_ranks": 0, "loss_rank_avg": 0.15307000279426575, "step": 2010, "valid_targets_mean": 3669.1, "valid_targets_min": 2351 }, { "epoch": 3.4268707482993195, "grad_norm": 0.48047265886653706, "learning_rate": 2.4209103530509196e-05, "loss": 0.1403, "loss_nan_ranks": 0, "loss_rank_avg": 0.1290254145860672, "step": 2015, "valid_targets_mean": 3352.1, "valid_targets_min": 1254 }, { "epoch": 3.435374149659864, "grad_norm": 0.5466523776690688, "learning_rate": 2.412614929920868e-05, "loss": 0.1585, "loss_nan_ranks": 0, "loss_rank_avg": 0.17689591646194458, "step": 2020, "valid_targets_mean": 3302.2, "valid_targets_min": 1393 }, { "epoch": 3.443877551020408, "grad_norm": 0.5840183574717508, "learning_rate": 2.4043120861384723e-05, "loss": 0.1496, "loss_nan_ranks": 0, "loss_rank_avg": 0.18398138880729675, "step": 2025, "valid_targets_mean": 3467.4, "valid_targets_min": 1710 }, { "epoch": 3.4523809523809526, "grad_norm": 0.4786308924135924, "learning_rate": 2.3960019710258068e-05, "loss": 0.1489, "loss_nan_ranks": 0, "loss_rank_avg": 0.13967232406139374, "step": 2030, "valid_targets_mean": 4170.2, "valid_targets_min": 1800 }, { "epoch": 3.4608843537414966, "grad_norm": 0.4724083960800044, "learning_rate": 2.3876847340357164e-05, "loss": 0.1635, "loss_nan_ranks": 0, "loss_rank_avg": 0.14074461162090302, "step": 2035, "valid_targets_mean": 3416.8, "valid_targets_min": 1551 }, { "epoch": 3.4693877551020407, "grad_norm": 0.552558554312206, "learning_rate": 2.3793605247491303e-05, "loss": 0.1541, "loss_nan_ranks": 0, "loss_rank_avg": 0.20764395594596863, "step": 2040, "valid_targets_mean": 4187.3, "valid_targets_min": 1424 }, { "epoch": 3.477891156462585, "grad_norm": 0.5163498510728093, "learning_rate": 2.371029492872369e-05, "loss": 0.1422, "loss_nan_ranks": 0, "loss_rank_avg": 0.14693160355091095, "step": 2045, "valid_targets_mean": 3235.4, "valid_targets_min": 261 }, { "epoch": 3.4863945578231292, "grad_norm": 0.5013959306377093, "learning_rate": 2.362691788234453e-05, "loss": 0.1497, "loss_nan_ranks": 0, "loss_rank_avg": 0.12825211882591248, "step": 2050, "valid_targets_mean": 3316.6, "valid_targets_min": 272 }, { "epoch": 3.4948979591836733, "grad_norm": 0.4607494767645447, "learning_rate": 2.3543475607844105e-05, "loss": 0.1536, "loss_nan_ranks": 0, "loss_rank_avg": 0.15415170788764954, "step": 2055, "valid_targets_mean": 4641.1, "valid_targets_min": 1383 }, { "epoch": 3.503401360544218, "grad_norm": 0.4920567824742292, "learning_rate": 2.3459969605885785e-05, "loss": 0.151, "loss_nan_ranks": 0, "loss_rank_avg": 0.17793437838554382, "step": 2060, "valid_targets_mean": 4237.8, "valid_targets_min": 648 }, { "epoch": 3.511904761904762, "grad_norm": 0.5174711622509411, "learning_rate": 2.3376401378279037e-05, "loss": 0.1324, "loss_nan_ranks": 0, "loss_rank_avg": 0.1297653764486313, "step": 2065, "valid_targets_mean": 2994.3, "valid_targets_min": 1413 }, { "epoch": 3.520408163265306, "grad_norm": 0.5163717376042865, "learning_rate": 2.329277242795243e-05, "loss": 0.1431, "loss_nan_ranks": 0, "loss_rank_avg": 0.15077583491802216, "step": 2070, "valid_targets_mean": 3868.8, "valid_targets_min": 804 }, { "epoch": 3.5289115646258504, "grad_norm": 0.5086218045854233, "learning_rate": 2.320908425892658e-05, "loss": 0.1497, "loss_nan_ranks": 0, "loss_rank_avg": 0.14013858139514923, "step": 2075, "valid_targets_mean": 2993.7, "valid_targets_min": 649 }, { "epoch": 3.5374149659863945, "grad_norm": 0.5462773846852057, "learning_rate": 2.3125338376287137e-05, "loss": 0.1315, "loss_nan_ranks": 0, "loss_rank_avg": 0.14993932843208313, "step": 2080, "valid_targets_mean": 3203.9, "valid_targets_min": 1236 }, { "epoch": 3.545918367346939, "grad_norm": 0.5093830788049976, "learning_rate": 2.3041536286157706e-05, "loss": 0.1451, "loss_nan_ranks": 0, "loss_rank_avg": 0.12546180188655853, "step": 2085, "valid_targets_mean": 3676.3, "valid_targets_min": 1378 }, { "epoch": 3.554421768707483, "grad_norm": 0.5074306671591432, "learning_rate": 2.295767949567272e-05, "loss": 0.1455, "loss_nan_ranks": 0, "loss_rank_avg": 0.12795674800872803, "step": 2090, "valid_targets_mean": 3516.2, "valid_targets_min": 844 }, { "epoch": 3.562925170068027, "grad_norm": 0.4896441751448396, "learning_rate": 2.28737695129504e-05, "loss": 0.1427, "loss_nan_ranks": 0, "loss_rank_avg": 0.1324068009853363, "step": 2095, "valid_targets_mean": 3447.2, "valid_targets_min": 1590 }, { "epoch": 3.571428571428571, "grad_norm": 0.5013956210638618, "learning_rate": 2.2789807847065574e-05, "loss": 0.1375, "loss_nan_ranks": 0, "loss_rank_avg": 0.13823112845420837, "step": 2100, "valid_targets_mean": 3616.2, "valid_targets_min": 777 }, { "epoch": 3.5799319727891157, "grad_norm": 0.5306077891974634, "learning_rate": 2.2705796008022592e-05, "loss": 0.1467, "loss_nan_ranks": 0, "loss_rank_avg": 0.14960964024066925, "step": 2105, "valid_targets_mean": 3087.6, "valid_targets_min": 1262 }, { "epoch": 3.5884353741496597, "grad_norm": 0.44147190175386997, "learning_rate": 2.2621735506728126e-05, "loss": 0.1377, "loss_nan_ranks": 0, "loss_rank_avg": 0.11909447610378265, "step": 2110, "valid_targets_mean": 4089.0, "valid_targets_min": 1714 }, { "epoch": 3.5969387755102042, "grad_norm": 0.44351920329660205, "learning_rate": 2.2537627854963994e-05, "loss": 0.1349, "loss_nan_ranks": 0, "loss_rank_avg": 0.12201227247714996, "step": 2115, "valid_targets_mean": 4485.5, "valid_targets_min": 1318 }, { "epoch": 3.6054421768707483, "grad_norm": 0.5202268781406105, "learning_rate": 2.2453474565360018e-05, "loss": 0.1416, "loss_nan_ranks": 0, "loss_rank_avg": 0.13805070519447327, "step": 2120, "valid_targets_mean": 3141.2, "valid_targets_min": 1354 }, { "epoch": 3.6139455782312924, "grad_norm": 0.486925624713484, "learning_rate": 2.2369277151366776e-05, "loss": 0.1434, "loss_nan_ranks": 0, "loss_rank_avg": 0.1417008936405182, "step": 2125, "valid_targets_mean": 3789.7, "valid_targets_min": 1597 }, { "epoch": 3.622448979591837, "grad_norm": 0.569357943842269, "learning_rate": 2.228503712722841e-05, "loss": 0.1365, "loss_nan_ranks": 0, "loss_rank_avg": 0.11663225293159485, "step": 2130, "valid_targets_mean": 2776.4, "valid_targets_min": 1020 }, { "epoch": 3.630952380952381, "grad_norm": 0.4708138592970684, "learning_rate": 2.220075600795537e-05, "loss": 0.1424, "loss_nan_ranks": 0, "loss_rank_avg": 0.12191980332136154, "step": 2135, "valid_targets_mean": 4152.0, "valid_targets_min": 1693 }, { "epoch": 3.6394557823129254, "grad_norm": 0.46387557457924355, "learning_rate": 2.2116435309297177e-05, "loss": 0.1487, "loss_nan_ranks": 0, "loss_rank_avg": 0.13377505540847778, "step": 2140, "valid_targets_mean": 4785.8, "valid_targets_min": 1441 }, { "epoch": 3.6479591836734695, "grad_norm": 0.5022621604582599, "learning_rate": 2.203207654771519e-05, "loss": 0.1558, "loss_nan_ranks": 0, "loss_rank_avg": 0.13495998084545135, "step": 2145, "valid_targets_mean": 3572.0, "valid_targets_min": 1210 }, { "epoch": 3.6564625850340136, "grad_norm": 0.4991291175902639, "learning_rate": 2.1947681240355266e-05, "loss": 0.1641, "loss_nan_ranks": 0, "loss_rank_avg": 0.16433686017990112, "step": 2150, "valid_targets_mean": 4432.6, "valid_targets_min": 1346 }, { "epoch": 3.6649659863945576, "grad_norm": 0.5458475179648687, "learning_rate": 2.1863250905020566e-05, "loss": 0.1526, "loss_nan_ranks": 0, "loss_rank_avg": 0.17905211448669434, "step": 2155, "valid_targets_mean": 3504.8, "valid_targets_min": 626 }, { "epoch": 3.673469387755102, "grad_norm": 0.4828154132176292, "learning_rate": 2.177878706014418e-05, "loss": 0.1599, "loss_nan_ranks": 0, "loss_rank_avg": 0.1637372374534607, "step": 2160, "valid_targets_mean": 3928.8, "valid_targets_min": 1146 }, { "epoch": 3.681972789115646, "grad_norm": 0.5626269965220437, "learning_rate": 2.1694291224761845e-05, "loss": 0.1354, "loss_nan_ranks": 0, "loss_rank_avg": 0.14788082242012024, "step": 2165, "valid_targets_mean": 3986.1, "valid_targets_min": 1226 }, { "epoch": 3.6904761904761907, "grad_norm": 0.5570323579675244, "learning_rate": 2.160976491848465e-05, "loss": 0.1348, "loss_nan_ranks": 0, "loss_rank_avg": 0.13803161680698395, "step": 2170, "valid_targets_mean": 3307.8, "valid_targets_min": 1231 }, { "epoch": 3.6989795918367347, "grad_norm": 0.5211299091365144, "learning_rate": 2.1525209661471677e-05, "loss": 0.1517, "loss_nan_ranks": 0, "loss_rank_avg": 0.24160908162593842, "step": 2175, "valid_targets_mean": 3941.2, "valid_targets_min": 429 }, { "epoch": 3.707482993197279, "grad_norm": 0.5109203075204358, "learning_rate": 2.1440626974402664e-05, "loss": 0.1396, "loss_nan_ranks": 0, "loss_rank_avg": 0.11953634023666382, "step": 2180, "valid_targets_mean": 3233.4, "valid_targets_min": 1336 }, { "epoch": 3.715986394557823, "grad_norm": 0.5740584045340128, "learning_rate": 2.135601837845068e-05, "loss": 0.1572, "loss_nan_ranks": 0, "loss_rank_avg": 0.13772159814834595, "step": 2185, "valid_targets_mean": 2741.2, "valid_targets_min": 1184 }, { "epoch": 3.7244897959183674, "grad_norm": 0.43522753496781236, "learning_rate": 2.1271385395254728e-05, "loss": 0.1591, "loss_nan_ranks": 0, "loss_rank_avg": 0.12005556374788284, "step": 2190, "valid_targets_mean": 4175.4, "valid_targets_min": 1728 }, { "epoch": 3.7329931972789114, "grad_norm": 0.5339718966786711, "learning_rate": 2.118672954689242e-05, "loss": 0.1394, "loss_nan_ranks": 0, "loss_rank_avg": 0.13433292508125305, "step": 2195, "valid_targets_mean": 2676.1, "valid_targets_min": 1687 }, { "epoch": 3.741496598639456, "grad_norm": 0.5827904357101654, "learning_rate": 2.1102052355852586e-05, "loss": 0.1303, "loss_nan_ranks": 0, "loss_rank_avg": 0.11353085935115814, "step": 2200, "valid_targets_mean": 3892.6, "valid_targets_min": 1375 }, { "epoch": 3.75, "grad_norm": 0.48888577042540315, "learning_rate": 2.1017355345007883e-05, "loss": 0.1533, "loss_nan_ranks": 0, "loss_rank_avg": 0.1756305694580078, "step": 2205, "valid_targets_mean": 4875.0, "valid_targets_min": 1552 }, { "epoch": 3.758503401360544, "grad_norm": 0.49314576717231107, "learning_rate": 2.093264003758742e-05, "loss": 0.1385, "loss_nan_ranks": 0, "loss_rank_avg": 0.13882237672805786, "step": 2210, "valid_targets_mean": 3865.2, "valid_targets_min": 1552 }, { "epoch": 3.7670068027210886, "grad_norm": 0.5227981614939449, "learning_rate": 2.0847907957149348e-05, "loss": 0.1637, "loss_nan_ranks": 0, "loss_rank_avg": 0.14849701523780823, "step": 2215, "valid_targets_mean": 4121.2, "valid_targets_min": 1314 }, { "epoch": 3.7755102040816326, "grad_norm": 0.5361785337409101, "learning_rate": 2.0763160627553502e-05, "loss": 0.1374, "loss_nan_ranks": 0, "loss_rank_avg": 0.1522911787033081, "step": 2220, "valid_targets_mean": 3747.4, "valid_targets_min": 804 }, { "epoch": 3.784013605442177, "grad_norm": 0.5108340377650004, "learning_rate": 2.067839957293394e-05, "loss": 0.1413, "loss_nan_ranks": 0, "loss_rank_avg": 0.1375730335712433, "step": 2225, "valid_targets_mean": 3813.8, "valid_targets_min": 1223 }, { "epoch": 3.792517006802721, "grad_norm": 0.4981416024908662, "learning_rate": 2.059362631767156e-05, "loss": 0.1406, "loss_nan_ranks": 0, "loss_rank_avg": 0.11143091320991516, "step": 2230, "valid_targets_mean": 3263.8, "valid_targets_min": 1356 }, { "epoch": 3.8010204081632653, "grad_norm": 0.529958261180386, "learning_rate": 2.0508842386366687e-05, "loss": 0.1441, "loss_nan_ranks": 0, "loss_rank_avg": 0.11649850755929947, "step": 2235, "valid_targets_mean": 3105.9, "valid_targets_min": 1133 }, { "epoch": 3.8095238095238093, "grad_norm": 0.5691253179106762, "learning_rate": 2.0424049303811637e-05, "loss": 0.1484, "loss_nan_ranks": 0, "loss_rank_avg": 0.1666107028722763, "step": 2240, "valid_targets_mean": 3283.1, "valid_targets_min": 758 }, { "epoch": 3.818027210884354, "grad_norm": 0.5412858572899136, "learning_rate": 2.0339248594963326e-05, "loss": 0.1371, "loss_nan_ranks": 0, "loss_rank_avg": 0.16017557680606842, "step": 2245, "valid_targets_mean": 3838.8, "valid_targets_min": 1132 }, { "epoch": 3.826530612244898, "grad_norm": 0.5565546049385312, "learning_rate": 2.025444178491582e-05, "loss": 0.1464, "loss_nan_ranks": 0, "loss_rank_avg": 0.15504541993141174, "step": 2250, "valid_targets_mean": 3659.4, "valid_targets_min": 1529 }, { "epoch": 3.8350340136054424, "grad_norm": 0.4904628959821808, "learning_rate": 2.0169630398872897e-05, "loss": 0.1465, "loss_nan_ranks": 0, "loss_rank_avg": 0.11968071758747101, "step": 2255, "valid_targets_mean": 3128.1, "valid_targets_min": 1197 }, { "epoch": 3.8435374149659864, "grad_norm": 0.49816193763634675, "learning_rate": 2.0084815962120644e-05, "loss": 0.1418, "loss_nan_ranks": 0, "loss_rank_avg": 0.13853618502616882, "step": 2260, "valid_targets_mean": 3385.1, "valid_targets_min": 698 }, { "epoch": 3.8520408163265305, "grad_norm": 0.5440701366673651, "learning_rate": 2e-05, "loss": 0.1431, "loss_nan_ranks": 0, "loss_rank_avg": 0.1894933581352234, "step": 2265, "valid_targets_mean": 4004.4, "valid_targets_min": 1517 }, { "epoch": 3.8605442176870746, "grad_norm": 0.47898169059031503, "learning_rate": 1.9915184037879362e-05, "loss": 0.1474, "loss_nan_ranks": 0, "loss_rank_avg": 0.1556398719549179, "step": 2270, "valid_targets_mean": 3937.4, "valid_targets_min": 971 }, { "epoch": 3.869047619047619, "grad_norm": 0.5521523760232286, "learning_rate": 1.983036960112711e-05, "loss": 0.1525, "loss_nan_ranks": 0, "loss_rank_avg": 0.1512027531862259, "step": 2275, "valid_targets_mean": 3351.7, "valid_targets_min": 604 }, { "epoch": 3.877551020408163, "grad_norm": 0.47757110237107087, "learning_rate": 1.9745558215084184e-05, "loss": 0.1477, "loss_nan_ranks": 0, "loss_rank_avg": 0.17591100931167603, "step": 2280, "valid_targets_mean": 4062.6, "valid_targets_min": 1438 }, { "epoch": 3.8860544217687076, "grad_norm": 0.583060688800655, "learning_rate": 1.9660751405036677e-05, "loss": 0.139, "loss_nan_ranks": 0, "loss_rank_avg": 0.1539376825094223, "step": 2285, "valid_targets_mean": 2743.6, "valid_targets_min": 935 }, { "epoch": 3.8945578231292517, "grad_norm": 0.47798427896305834, "learning_rate": 1.9575950696188367e-05, "loss": 0.1515, "loss_nan_ranks": 0, "loss_rank_avg": 0.14273616671562195, "step": 2290, "valid_targets_mean": 3535.2, "valid_targets_min": 1171 }, { "epoch": 3.9030612244897958, "grad_norm": 0.5667491614754994, "learning_rate": 1.949115761363332e-05, "loss": 0.1443, "loss_nan_ranks": 0, "loss_rank_avg": 0.12068904936313629, "step": 2295, "valid_targets_mean": 3373.4, "valid_targets_min": 1811 }, { "epoch": 3.9115646258503403, "grad_norm": 0.5217945938589202, "learning_rate": 1.9406373682328445e-05, "loss": 0.1364, "loss_nan_ranks": 0, "loss_rank_avg": 0.1370539665222168, "step": 2300, "valid_targets_mean": 3699.2, "valid_targets_min": 1000 }, { "epoch": 3.9200680272108843, "grad_norm": 0.6072733473428619, "learning_rate": 1.932160042706607e-05, "loss": 0.1533, "loss_nan_ranks": 0, "loss_rank_avg": 0.1537347286939621, "step": 2305, "valid_targets_mean": 3188.1, "valid_targets_min": 507 }, { "epoch": 3.928571428571429, "grad_norm": 0.5533462927972612, "learning_rate": 1.9236839372446504e-05, "loss": 0.1441, "loss_nan_ranks": 0, "loss_rank_avg": 0.1640930473804474, "step": 2310, "valid_targets_mean": 3405.7, "valid_targets_min": 1530 }, { "epoch": 3.937074829931973, "grad_norm": 0.5003163870992912, "learning_rate": 1.9152092042850655e-05, "loss": 0.1545, "loss_nan_ranks": 0, "loss_rank_avg": 0.13920584321022034, "step": 2315, "valid_targets_mean": 3497.1, "valid_targets_min": 1151 }, { "epoch": 3.945578231292517, "grad_norm": 0.5477685325651052, "learning_rate": 1.9067359962412588e-05, "loss": 0.1422, "loss_nan_ranks": 0, "loss_rank_avg": 0.13287462294101715, "step": 2320, "valid_targets_mean": 2748.6, "valid_targets_min": 1295 }, { "epoch": 3.954081632653061, "grad_norm": 0.5211036734731059, "learning_rate": 1.8982644654992123e-05, "loss": 0.1537, "loss_nan_ranks": 0, "loss_rank_avg": 0.15169015526771545, "step": 2325, "valid_targets_mean": 3769.6, "valid_targets_min": 1234 }, { "epoch": 3.9625850340136055, "grad_norm": 0.4559337481019662, "learning_rate": 1.8897947644147424e-05, "loss": 0.1635, "loss_nan_ranks": 0, "loss_rank_avg": 0.18945789337158203, "step": 2330, "valid_targets_mean": 4717.9, "valid_targets_min": 1539 }, { "epoch": 3.9710884353741496, "grad_norm": 0.5090040830343693, "learning_rate": 1.8813270453107586e-05, "loss": 0.1374, "loss_nan_ranks": 0, "loss_rank_avg": 0.15533599257469177, "step": 2335, "valid_targets_mean": 3687.2, "valid_targets_min": 785 }, { "epoch": 3.979591836734694, "grad_norm": 0.49839328546501366, "learning_rate": 1.872861460474528e-05, "loss": 0.1535, "loss_nan_ranks": 0, "loss_rank_avg": 0.15626703202724457, "step": 2340, "valid_targets_mean": 3522.6, "valid_targets_min": 755 }, { "epoch": 3.988095238095238, "grad_norm": 0.4804577717706921, "learning_rate": 1.8643981621549325e-05, "loss": 0.1489, "loss_nan_ranks": 0, "loss_rank_avg": 0.126425102353096, "step": 2345, "valid_targets_mean": 3759.1, "valid_targets_min": 1911 }, { "epoch": 3.996598639455782, "grad_norm": 0.482933524469188, "learning_rate": 1.855937302559734e-05, "loss": 0.1446, "loss_nan_ranks": 0, "loss_rank_avg": 0.16276368498802185, "step": 2350, "valid_targets_mean": 4038.2, "valid_targets_min": 1268 }, { "epoch": 4.005102040816326, "grad_norm": 0.5023685365515297, "learning_rate": 1.8474790338528336e-05, "loss": 0.1119, "loss_nan_ranks": 0, "loss_rank_avg": 0.10188114643096924, "step": 2355, "valid_targets_mean": 2653.2, "valid_targets_min": 1375 }, { "epoch": 4.01360544217687, "grad_norm": 0.41928203389131025, "learning_rate": 1.839023508151536e-05, "loss": 0.1308, "loss_nan_ranks": 0, "loss_rank_avg": 0.13987550139427185, "step": 2360, "valid_targets_mean": 5312.6, "valid_targets_min": 1076 }, { "epoch": 4.022108843537415, "grad_norm": 0.5398436343258409, "learning_rate": 1.8305708775238162e-05, "loss": 0.141, "loss_nan_ranks": 0, "loss_rank_avg": 0.11938532441854477, "step": 2365, "valid_targets_mean": 3537.8, "valid_targets_min": 1352 }, { "epoch": 4.030612244897959, "grad_norm": 0.5239289576849778, "learning_rate": 1.822121293985583e-05, "loss": 0.1317, "loss_nan_ranks": 0, "loss_rank_avg": 0.14157015085220337, "step": 2370, "valid_targets_mean": 4077.9, "valid_targets_min": 1325 }, { "epoch": 4.039115646258503, "grad_norm": 0.5245260864178052, "learning_rate": 1.813674909497944e-05, "loss": 0.1207, "loss_nan_ranks": 0, "loss_rank_avg": 0.13017112016677856, "step": 2375, "valid_targets_mean": 3429.1, "valid_targets_min": 1505 }, { "epoch": 4.0476190476190474, "grad_norm": 0.5522673431765818, "learning_rate": 1.8052318759644744e-05, "loss": 0.1263, "loss_nan_ranks": 0, "loss_rank_avg": 0.11945690214633942, "step": 2380, "valid_targets_mean": 3247.0, "valid_targets_min": 912 }, { "epoch": 4.0561224489795915, "grad_norm": 0.5293497397934687, "learning_rate": 1.7967923452284824e-05, "loss": 0.125, "loss_nan_ranks": 0, "loss_rank_avg": 0.16374406218528748, "step": 2385, "valid_targets_mean": 4229.2, "valid_targets_min": 872 }, { "epoch": 4.0646258503401365, "grad_norm": 0.5350434092704202, "learning_rate": 1.7883564690702826e-05, "loss": 0.1343, "loss_nan_ranks": 0, "loss_rank_avg": 0.14136750996112823, "step": 2390, "valid_targets_mean": 3507.5, "valid_targets_min": 1377 }, { "epoch": 4.0731292517006805, "grad_norm": 0.4941976972197606, "learning_rate": 1.7799243992044634e-05, "loss": 0.1202, "loss_nan_ranks": 0, "loss_rank_avg": 0.12425091117620468, "step": 2395, "valid_targets_mean": 3654.2, "valid_targets_min": 859 }, { "epoch": 4.081632653061225, "grad_norm": 0.5763725763447235, "learning_rate": 1.7714962872771593e-05, "loss": 0.1312, "loss_nan_ranks": 0, "loss_rank_avg": 0.12952286005020142, "step": 2400, "valid_targets_mean": 3387.6, "valid_targets_min": 1323 }, { "epoch": 4.090136054421769, "grad_norm": 0.5277461938742322, "learning_rate": 1.7630722848633234e-05, "loss": 0.1193, "loss_nan_ranks": 0, "loss_rank_avg": 0.11460752785205841, "step": 2405, "valid_targets_mean": 3624.1, "valid_targets_min": 918 }, { "epoch": 4.098639455782313, "grad_norm": 0.5275777309962448, "learning_rate": 1.7546525434639992e-05, "loss": 0.1503, "loss_nan_ranks": 0, "loss_rank_avg": 0.16966021060943604, "step": 2410, "valid_targets_mean": 3532.3, "valid_targets_min": 1299 }, { "epoch": 4.107142857142857, "grad_norm": 0.5639072274949859, "learning_rate": 1.7462372145036012e-05, "loss": 0.1212, "loss_nan_ranks": 0, "loss_rank_avg": 0.14622849225997925, "step": 2415, "valid_targets_mean": 3383.2, "valid_targets_min": 1356 }, { "epoch": 4.115646258503402, "grad_norm": 0.485846628966218, "learning_rate": 1.737826449327188e-05, "loss": 0.1224, "loss_nan_ranks": 0, "loss_rank_avg": 0.11411428451538086, "step": 2420, "valid_targets_mean": 4078.5, "valid_targets_min": 1640 }, { "epoch": 4.124149659863946, "grad_norm": 0.758272632014816, "learning_rate": 1.729420399197741e-05, "loss": 0.1399, "loss_nan_ranks": 0, "loss_rank_avg": 0.146653950214386, "step": 2425, "valid_targets_mean": 3492.2, "valid_targets_min": 1527 }, { "epoch": 4.13265306122449, "grad_norm": 0.5290919750861747, "learning_rate": 1.7210192152934423e-05, "loss": 0.1416, "loss_nan_ranks": 0, "loss_rank_avg": 0.16026335954666138, "step": 2430, "valid_targets_mean": 3589.4, "valid_targets_min": 1354 }, { "epoch": 4.141156462585034, "grad_norm": 0.5149616465912613, "learning_rate": 1.712623048704961e-05, "loss": 0.1297, "loss_nan_ranks": 0, "loss_rank_avg": 0.10995449870824814, "step": 2435, "valid_targets_mean": 3371.2, "valid_targets_min": 1020 }, { "epoch": 4.149659863945578, "grad_norm": 0.5180400201990574, "learning_rate": 1.7042320504327285e-05, "loss": 0.1357, "loss_nan_ranks": 0, "loss_rank_avg": 0.12292209267616272, "step": 2440, "valid_targets_mean": 3585.6, "valid_targets_min": 1436 }, { "epoch": 4.158163265306122, "grad_norm": 0.4402765691327618, "learning_rate": 1.6958463713842298e-05, "loss": 0.1307, "loss_nan_ranks": 0, "loss_rank_avg": 0.10848579555749893, "step": 2445, "valid_targets_mean": 4908.5, "valid_targets_min": 1362 }, { "epoch": 4.166666666666667, "grad_norm": 0.583578753213086, "learning_rate": 1.687466162371286e-05, "loss": 0.1295, "loss_nan_ranks": 0, "loss_rank_avg": 0.14145049452781677, "step": 2450, "valid_targets_mean": 3251.1, "valid_targets_min": 1552 }, { "epoch": 4.175170068027211, "grad_norm": 0.5123852752027489, "learning_rate": 1.6790915741073418e-05, "loss": 0.1386, "loss_nan_ranks": 0, "loss_rank_avg": 0.18500098586082458, "step": 2455, "valid_targets_mean": 4195.8, "valid_targets_min": 1449 }, { "epoch": 4.183673469387755, "grad_norm": 0.5311552913814159, "learning_rate": 1.670722757204758e-05, "loss": 0.1264, "loss_nan_ranks": 0, "loss_rank_avg": 0.1071048229932785, "step": 2460, "valid_targets_mean": 3237.9, "valid_targets_min": 1101 }, { "epoch": 4.192176870748299, "grad_norm": 0.4537481193241964, "learning_rate": 1.6623598621720966e-05, "loss": 0.1157, "loss_nan_ranks": 0, "loss_rank_avg": 0.09841416776180267, "step": 2465, "valid_targets_mean": 4214.3, "valid_targets_min": 468 }, { "epoch": 4.200680272108843, "grad_norm": 0.600717141479778, "learning_rate": 1.6540030394114218e-05, "loss": 0.1206, "loss_nan_ranks": 0, "loss_rank_avg": 0.13270169496536255, "step": 2470, "valid_targets_mean": 2691.5, "valid_targets_min": 1092 }, { "epoch": 4.209183673469388, "grad_norm": 0.4976204585645935, "learning_rate": 1.64565243921559e-05, "loss": 0.1265, "loss_nan_ranks": 0, "loss_rank_avg": 0.11785245686769485, "step": 2475, "valid_targets_mean": 4144.9, "valid_targets_min": 1762 }, { "epoch": 4.217687074829932, "grad_norm": 0.5526481174319252, "learning_rate": 1.6373082117655473e-05, "loss": 0.1156, "loss_nan_ranks": 0, "loss_rank_avg": 0.11944583803415298, "step": 2480, "valid_targets_mean": 3328.4, "valid_targets_min": 1197 }, { "epoch": 4.226190476190476, "grad_norm": 0.5185084228705585, "learning_rate": 1.6289705071276323e-05, "loss": 0.1315, "loss_nan_ranks": 0, "loss_rank_avg": 0.1478651762008667, "step": 2485, "valid_targets_mean": 4074.9, "valid_targets_min": 1695 }, { "epoch": 4.23469387755102, "grad_norm": 0.5064058629657685, "learning_rate": 1.62063947525087e-05, "loss": 0.1428, "loss_nan_ranks": 0, "loss_rank_avg": 0.1256791353225708, "step": 2490, "valid_targets_mean": 3633.2, "valid_targets_min": 1678 }, { "epoch": 4.243197278911564, "grad_norm": 0.5390030705626246, "learning_rate": 1.612315265964284e-05, "loss": 0.1261, "loss_nan_ranks": 0, "loss_rank_avg": 0.15357208251953125, "step": 2495, "valid_targets_mean": 3176.2, "valid_targets_min": 1591 }, { "epoch": 4.2517006802721085, "grad_norm": 0.5406514616868823, "learning_rate": 1.6039980289741935e-05, "loss": 0.1387, "loss_nan_ranks": 0, "loss_rank_avg": 0.1449306309223175, "step": 2500, "valid_targets_mean": 3431.1, "valid_targets_min": 1080 }, { "epoch": 4.260204081632653, "grad_norm": 0.6085265403782985, "learning_rate": 1.595687913861528e-05, "loss": 0.1217, "loss_nan_ranks": 0, "loss_rank_avg": 0.12832342088222504, "step": 2505, "valid_targets_mean": 2708.1, "valid_targets_min": 883 }, { "epoch": 4.2687074829931975, "grad_norm": 0.9958125295487239, "learning_rate": 1.587385070079133e-05, "loss": 0.1496, "loss_nan_ranks": 0, "loss_rank_avg": 0.2037830352783203, "step": 2510, "valid_targets_mean": 4122.8, "valid_targets_min": 940 }, { "epoch": 4.2772108843537415, "grad_norm": 0.4706952960241422, "learning_rate": 1.5790896469490807e-05, "loss": 0.1321, "loss_nan_ranks": 0, "loss_rank_avg": 0.12226849794387817, "step": 2515, "valid_targets_mean": 4755.2, "valid_targets_min": 1755 }, { "epoch": 4.285714285714286, "grad_norm": 0.5054113047148475, "learning_rate": 1.5708017936599908e-05, "loss": 0.1353, "loss_nan_ranks": 0, "loss_rank_avg": 0.16386127471923828, "step": 2520, "valid_targets_mean": 4257.3, "valid_targets_min": 1214 }, { "epoch": 4.29421768707483, "grad_norm": 0.6038493253323483, "learning_rate": 1.56252165926434e-05, "loss": 0.1249, "loss_nan_ranks": 0, "loss_rank_avg": 0.13769403100013733, "step": 2525, "valid_targets_mean": 3143.4, "valid_targets_min": 1196 }, { "epoch": 4.302721088435375, "grad_norm": 0.4879214707147923, "learning_rate": 1.554249392675788e-05, "loss": 0.123, "loss_nan_ranks": 0, "loss_rank_avg": 0.14046776294708252, "step": 2530, "valid_targets_mean": 4527.4, "valid_targets_min": 1950 }, { "epoch": 4.311224489795919, "grad_norm": 0.4465612512180996, "learning_rate": 1.5459851426664956e-05, "loss": 0.1318, "loss_nan_ranks": 0, "loss_rank_avg": 0.12744249403476715, "step": 2535, "valid_targets_mean": 5046.9, "valid_targets_min": 1164 }, { "epoch": 4.319727891156463, "grad_norm": 0.4637284744313693, "learning_rate": 1.5377290578644468e-05, "loss": 0.1191, "loss_nan_ranks": 0, "loss_rank_avg": 0.10689014941453934, "step": 2540, "valid_targets_mean": 4280.3, "valid_targets_min": 1835 }, { "epoch": 4.328231292517007, "grad_norm": 0.554279265133868, "learning_rate": 1.5294812867507835e-05, "loss": 0.1287, "loss_nan_ranks": 0, "loss_rank_avg": 0.1094164252281189, "step": 2545, "valid_targets_mean": 2614.7, "valid_targets_min": 1672 }, { "epoch": 4.336734693877551, "grad_norm": 0.5440722163559888, "learning_rate": 1.5212419776571267e-05, "loss": 0.1393, "loss_nan_ranks": 0, "loss_rank_avg": 0.14824722707271576, "step": 2550, "valid_targets_mean": 3486.7, "valid_targets_min": 604 }, { "epoch": 4.345238095238095, "grad_norm": 0.45930986665841933, "learning_rate": 1.5130112787629152e-05, "loss": 0.1229, "loss_nan_ranks": 0, "loss_rank_avg": 0.12556178867816925, "step": 2555, "valid_targets_mean": 4062.1, "valid_targets_min": 1406 }, { "epoch": 4.35374149659864, "grad_norm": 0.5347300720312089, "learning_rate": 1.5047893380927377e-05, "loss": 0.1196, "loss_nan_ranks": 0, "loss_rank_avg": 0.11758849024772644, "step": 2560, "valid_targets_mean": 3016.2, "valid_targets_min": 1447 }, { "epoch": 4.362244897959184, "grad_norm": 0.5810110341683714, "learning_rate": 1.4965763035136687e-05, "loss": 0.1259, "loss_nan_ranks": 0, "loss_rank_avg": 0.13106051087379456, "step": 2565, "valid_targets_mean": 2945.5, "valid_targets_min": 877 }, { "epoch": 4.370748299319728, "grad_norm": 0.511549856319123, "learning_rate": 1.4883723227326144e-05, "loss": 0.1388, "loss_nan_ranks": 0, "loss_rank_avg": 0.12233540415763855, "step": 2570, "valid_targets_mean": 4416.4, "valid_targets_min": 861 }, { "epoch": 4.379251700680272, "grad_norm": 0.6141891043153991, "learning_rate": 1.4801775432936516e-05, "loss": 0.1254, "loss_nan_ranks": 0, "loss_rank_avg": 0.11202485859394073, "step": 2575, "valid_targets_mean": 2762.6, "valid_targets_min": 1015 }, { "epoch": 4.387755102040816, "grad_norm": 0.4476473551026391, "learning_rate": 1.4719921125753773e-05, "loss": 0.1213, "loss_nan_ranks": 0, "loss_rank_avg": 0.13985709846019745, "step": 2580, "valid_targets_mean": 5447.8, "valid_targets_min": 982 }, { "epoch": 4.39625850340136, "grad_norm": 0.562406722078899, "learning_rate": 1.4638161777882573e-05, "loss": 0.1275, "loss_nan_ranks": 0, "loss_rank_avg": 0.11451070010662079, "step": 2585, "valid_targets_mean": 3943.8, "valid_targets_min": 1210 }, { "epoch": 4.404761904761905, "grad_norm": 0.5416533168212995, "learning_rate": 1.4556498859719756e-05, "loss": 0.1245, "loss_nan_ranks": 0, "loss_rank_avg": 0.11477416008710861, "step": 2590, "valid_targets_mean": 3347.1, "valid_targets_min": 1476 }, { "epoch": 4.413265306122449, "grad_norm": 0.5165893385108531, "learning_rate": 1.4474933839927956e-05, "loss": 0.1301, "loss_nan_ranks": 0, "loss_rank_avg": 0.16060087084770203, "step": 2595, "valid_targets_mean": 4232.8, "valid_targets_min": 1464 }, { "epoch": 4.421768707482993, "grad_norm": 0.594151452327815, "learning_rate": 1.4393468185409139e-05, "loss": 0.1345, "loss_nan_ranks": 0, "loss_rank_avg": 0.1185787171125412, "step": 2600, "valid_targets_mean": 2734.9, "valid_targets_min": 1044 }, { "epoch": 4.430272108843537, "grad_norm": 0.47620977994252855, "learning_rate": 1.4312103361278254e-05, "loss": 0.1266, "loss_nan_ranks": 0, "loss_rank_avg": 0.13598421216011047, "step": 2605, "valid_targets_mean": 4362.1, "valid_targets_min": 1623 }, { "epoch": 4.438775510204081, "grad_norm": 0.5778604626245851, "learning_rate": 1.4230840830836875e-05, "loss": 0.1215, "loss_nan_ranks": 0, "loss_rank_avg": 0.0991811454296112, "step": 2610, "valid_targets_mean": 3185.3, "valid_targets_min": 1047 }, { "epoch": 4.447278911564625, "grad_norm": 0.5095063044346275, "learning_rate": 1.4149682055546854e-05, "loss": 0.133, "loss_nan_ranks": 0, "loss_rank_avg": 0.16175615787506104, "step": 2615, "valid_targets_mean": 4249.7, "valid_targets_min": 1393 }, { "epoch": 4.45578231292517, "grad_norm": 0.5230093792172238, "learning_rate": 1.4068628495004095e-05, "loss": 0.1311, "loss_nan_ranks": 0, "loss_rank_avg": 0.10372944176197052, "step": 2620, "valid_targets_mean": 3279.2, "valid_targets_min": 429 }, { "epoch": 4.464285714285714, "grad_norm": 0.4978389319017629, "learning_rate": 1.3987681606912254e-05, "loss": 0.1257, "loss_nan_ranks": 0, "loss_rank_avg": 0.13917067646980286, "step": 2625, "valid_targets_mean": 4139.9, "valid_targets_min": 1693 }, { "epoch": 4.4727891156462585, "grad_norm": 0.48805163978121935, "learning_rate": 1.3906842847056546e-05, "loss": 0.1454, "loss_nan_ranks": 0, "loss_rank_avg": 0.1258377879858017, "step": 2630, "valid_targets_mean": 4221.4, "valid_targets_min": 1151 }, { "epoch": 4.4812925170068025, "grad_norm": 0.5309720392418742, "learning_rate": 1.382611366927757e-05, "loss": 0.1343, "loss_nan_ranks": 0, "loss_rank_avg": 0.12541979551315308, "step": 2635, "valid_targets_mean": 3300.1, "valid_targets_min": 1103 }, { "epoch": 4.489795918367347, "grad_norm": 0.4925804697564766, "learning_rate": 1.3745495525445126e-05, "loss": 0.1309, "loss_nan_ranks": 0, "loss_rank_avg": 0.12611186504364014, "step": 2640, "valid_targets_mean": 3906.4, "valid_targets_min": 864 }, { "epoch": 4.4982993197278915, "grad_norm": 0.5454905313244999, "learning_rate": 1.3664989865432157e-05, "loss": 0.1334, "loss_nan_ranks": 0, "loss_rank_avg": 0.10953294485807419, "step": 2645, "valid_targets_mean": 3340.1, "valid_targets_min": 1733 }, { "epoch": 4.506802721088436, "grad_norm": 0.5252733550532073, "learning_rate": 1.3584598137088625e-05, "loss": 0.141, "loss_nan_ranks": 0, "loss_rank_avg": 0.15157128870487213, "step": 2650, "valid_targets_mean": 3560.9, "valid_targets_min": 1273 }, { "epoch": 4.51530612244898, "grad_norm": 0.5198558545652678, "learning_rate": 1.3504321786215514e-05, "loss": 0.1192, "loss_nan_ranks": 0, "loss_rank_avg": 0.11329950392246246, "step": 2655, "valid_targets_mean": 3093.6, "valid_targets_min": 881 }, { "epoch": 4.523809523809524, "grad_norm": 0.6002119548110341, "learning_rate": 1.3424162256538797e-05, "loss": 0.1421, "loss_nan_ranks": 0, "loss_rank_avg": 0.1460447907447815, "step": 2660, "valid_targets_mean": 2855.2, "valid_targets_min": 1115 }, { "epoch": 4.532312925170068, "grad_norm": 0.4690919568996324, "learning_rate": 1.3344120989683473e-05, "loss": 0.1314, "loss_nan_ranks": 0, "loss_rank_avg": 0.11531253159046173, "step": 2665, "valid_targets_mean": 4137.5, "valid_targets_min": 1170 }, { "epoch": 4.540816326530612, "grad_norm": 0.48345732018469006, "learning_rate": 1.3264199425147667e-05, "loss": 0.1361, "loss_nan_ranks": 0, "loss_rank_avg": 0.12812292575836182, "step": 2670, "valid_targets_mean": 4035.9, "valid_targets_min": 1360 }, { "epoch": 4.549319727891157, "grad_norm": 0.6281667762967951, "learning_rate": 1.3184399000276708e-05, "loss": 0.16, "loss_nan_ranks": 0, "loss_rank_avg": 0.13768933713436127, "step": 2675, "valid_targets_mean": 2721.2, "valid_targets_min": 759 }, { "epoch": 4.557823129251701, "grad_norm": 0.6020408443336502, "learning_rate": 1.3104721150237305e-05, "loss": 0.1162, "loss_nan_ranks": 0, "loss_rank_avg": 0.13107319176197052, "step": 2680, "valid_targets_mean": 3015.6, "valid_targets_min": 1276 }, { "epoch": 4.566326530612245, "grad_norm": 0.5222297457955155, "learning_rate": 1.3025167307991734e-05, "loss": 0.1209, "loss_nan_ranks": 0, "loss_rank_avg": 0.11526221036911011, "step": 2685, "valid_targets_mean": 3457.8, "valid_targets_min": 1537 }, { "epoch": 4.574829931972789, "grad_norm": 0.5399196254993844, "learning_rate": 1.294573890427203e-05, "loss": 0.1438, "loss_nan_ranks": 0, "loss_rank_avg": 0.16417351365089417, "step": 2690, "valid_targets_mean": 4152.0, "valid_targets_min": 1388 }, { "epoch": 4.583333333333333, "grad_norm": 0.5453980131163246, "learning_rate": 1.2866437367554313e-05, "loss": 0.134, "loss_nan_ranks": 0, "loss_rank_avg": 0.13150575757026672, "step": 2695, "valid_targets_mean": 3255.8, "valid_targets_min": 1080 }, { "epoch": 4.591836734693878, "grad_norm": 0.564868544100156, "learning_rate": 1.278726412403306e-05, "loss": 0.1198, "loss_nan_ranks": 0, "loss_rank_avg": 0.11302247643470764, "step": 2700, "valid_targets_mean": 2766.1, "valid_targets_min": 288 }, { "epoch": 4.600340136054422, "grad_norm": 0.5570067708592675, "learning_rate": 1.2708220597595462e-05, "loss": 0.1357, "loss_nan_ranks": 0, "loss_rank_avg": 0.16181376576423645, "step": 2705, "valid_targets_mean": 3591.7, "valid_targets_min": 1429 }, { "epoch": 4.608843537414966, "grad_norm": 0.4924894979414545, "learning_rate": 1.2629308209795834e-05, "loss": 0.1328, "loss_nan_ranks": 0, "loss_rank_avg": 0.13477236032485962, "step": 2710, "valid_targets_mean": 3979.9, "valid_targets_min": 1277 }, { "epoch": 4.61734693877551, "grad_norm": 0.5395011939137863, "learning_rate": 1.2550528379830019e-05, "loss": 0.1406, "loss_nan_ranks": 0, "loss_rank_avg": 0.12093565613031387, "step": 2715, "valid_targets_mean": 3259.6, "valid_targets_min": 869 }, { "epoch": 4.625850340136054, "grad_norm": 0.48613266875635563, "learning_rate": 1.2471882524509873e-05, "loss": 0.1412, "loss_nan_ranks": 0, "loss_rank_avg": 0.11778571456670761, "step": 2720, "valid_targets_mean": 4093.9, "valid_targets_min": 1843 }, { "epoch": 4.634353741496598, "grad_norm": 0.5920343619245662, "learning_rate": 1.2393372058237819e-05, "loss": 0.1252, "loss_nan_ranks": 0, "loss_rank_avg": 0.12733955681324005, "step": 2725, "valid_targets_mean": 3063.2, "valid_targets_min": 1169 }, { "epoch": 4.642857142857143, "grad_norm": 0.5038080159084226, "learning_rate": 1.2314998392981364e-05, "loss": 0.1313, "loss_nan_ranks": 0, "loss_rank_avg": 0.13160504400730133, "step": 2730, "valid_targets_mean": 4067.9, "valid_targets_min": 1577 }, { "epoch": 4.651360544217687, "grad_norm": 0.5229519935844232, "learning_rate": 1.2236762938247729e-05, "loss": 0.1342, "loss_nan_ranks": 0, "loss_rank_avg": 0.1371050775051117, "step": 2735, "valid_targets_mean": 3716.6, "valid_targets_min": 1169 }, { "epoch": 4.659863945578231, "grad_norm": 0.521745882443459, "learning_rate": 1.2158667101058497e-05, "loss": 0.134, "loss_nan_ranks": 0, "loss_rank_avg": 0.13528242707252502, "step": 2740, "valid_targets_mean": 3872.4, "valid_targets_min": 1477 }, { "epoch": 4.668367346938775, "grad_norm": 0.4885511062328345, "learning_rate": 1.208071228592429e-05, "loss": 0.13, "loss_nan_ranks": 0, "loss_rank_avg": 0.15420043468475342, "step": 2745, "valid_targets_mean": 4217.5, "valid_targets_min": 1480 }, { "epoch": 4.6768707482993195, "grad_norm": 0.4178757321541779, "learning_rate": 1.2002899894819548e-05, "loss": 0.125, "loss_nan_ranks": 0, "loss_rank_avg": 0.1247992143034935, "step": 2750, "valid_targets_mean": 4595.2, "valid_targets_min": 1157 }, { "epoch": 4.685374149659864, "grad_norm": 0.6108750918194292, "learning_rate": 1.1925231327157288e-05, "loss": 0.1318, "loss_nan_ranks": 0, "loss_rank_avg": 0.12069522589445114, "step": 2755, "valid_targets_mean": 2943.6, "valid_targets_min": 1366 }, { "epoch": 4.6938775510204085, "grad_norm": 0.5299847403293142, "learning_rate": 1.1847707979763934e-05, "loss": 0.1411, "loss_nan_ranks": 0, "loss_rank_avg": 0.20735841989517212, "step": 2760, "valid_targets_mean": 4586.6, "valid_targets_min": 280 }, { "epoch": 4.7023809523809526, "grad_norm": 0.5262690909390965, "learning_rate": 1.1770331246854211e-05, "loss": 0.1252, "loss_nan_ranks": 0, "loss_rank_avg": 0.12230242788791656, "step": 2765, "valid_targets_mean": 3189.1, "valid_targets_min": 1330 }, { "epoch": 4.710884353741497, "grad_norm": 0.44464404640066674, "learning_rate": 1.169310252000605e-05, "loss": 0.1222, "loss_nan_ranks": 0, "loss_rank_avg": 0.11267457902431488, "step": 2770, "valid_targets_mean": 4162.7, "valid_targets_min": 1809 }, { "epoch": 4.719387755102041, "grad_norm": 0.5455599156674992, "learning_rate": 1.1616023188135594e-05, "loss": 0.1259, "loss_nan_ranks": 0, "loss_rank_avg": 0.10474415868520737, "step": 2775, "valid_targets_mean": 2892.6, "valid_targets_min": 626 }, { "epoch": 4.727891156462585, "grad_norm": 0.5015898266496815, "learning_rate": 1.1539094637472181e-05, "loss": 0.1364, "loss_nan_ranks": 0, "loss_rank_avg": 0.17794445157051086, "step": 2780, "valid_targets_mean": 4521.5, "valid_targets_min": 1553 }, { "epoch": 4.736394557823129, "grad_norm": 0.5508250011415522, "learning_rate": 1.1462318251533442e-05, "loss": 0.1375, "loss_nan_ranks": 0, "loss_rank_avg": 0.11678224056959152, "step": 2785, "valid_targets_mean": 3110.7, "valid_targets_min": 1429 }, { "epoch": 4.744897959183674, "grad_norm": 0.622408173575908, "learning_rate": 1.1385695411100424e-05, "loss": 0.1179, "loss_nan_ranks": 0, "loss_rank_avg": 0.11828910559415817, "step": 2790, "valid_targets_mean": 3258.1, "valid_targets_min": 1122 }, { "epoch": 4.753401360544218, "grad_norm": 0.5322995958406667, "learning_rate": 1.1309227494192703e-05, "loss": 0.1189, "loss_nan_ranks": 0, "loss_rank_avg": 0.13555939495563507, "step": 2795, "valid_targets_mean": 3526.5, "valid_targets_min": 1328 }, { "epoch": 4.761904761904762, "grad_norm": 0.5756957552451561, "learning_rate": 1.1232915876043673e-05, "loss": 0.1433, "loss_nan_ranks": 0, "loss_rank_avg": 0.14180392026901245, "step": 2800, "valid_targets_mean": 3444.5, "valid_targets_min": 1732 }, { "epoch": 4.770408163265306, "grad_norm": 0.503634481514556, "learning_rate": 1.1156761929075777e-05, "loss": 0.1469, "loss_nan_ranks": 0, "loss_rank_avg": 0.13477468490600586, "step": 2805, "valid_targets_mean": 3889.4, "valid_targets_min": 345 }, { "epoch": 4.77891156462585, "grad_norm": 0.5122500311184057, "learning_rate": 1.1080767022875816e-05, "loss": 0.1257, "loss_nan_ranks": 0, "loss_rank_avg": 0.10373985022306442, "step": 2810, "valid_targets_mean": 3319.8, "valid_targets_min": 534 }, { "epoch": 4.787414965986395, "grad_norm": 0.4711642587141199, "learning_rate": 1.100493252417035e-05, "loss": 0.1308, "loss_nan_ranks": 0, "loss_rank_avg": 0.11209157109260559, "step": 2815, "valid_targets_mean": 3830.2, "valid_targets_min": 1861 }, { "epoch": 4.795918367346939, "grad_norm": 0.5123035748411254, "learning_rate": 1.0929259796801075e-05, "loss": 0.1401, "loss_nan_ranks": 0, "loss_rank_avg": 0.18172311782836914, "step": 2820, "valid_targets_mean": 4577.3, "valid_targets_min": 1025 }, { "epoch": 4.804421768707483, "grad_norm": 0.5808435182317419, "learning_rate": 1.085375020170034e-05, "loss": 0.1308, "loss_nan_ranks": 0, "loss_rank_avg": 0.12455550581216812, "step": 2825, "valid_targets_mean": 3490.9, "valid_targets_min": 1254 }, { "epoch": 4.812925170068027, "grad_norm": 0.5320315082614337, "learning_rate": 1.0778405096866624e-05, "loss": 0.1198, "loss_nan_ranks": 0, "loss_rank_avg": 0.13116773962974548, "step": 2830, "valid_targets_mean": 3979.3, "valid_targets_min": 1469 }, { "epoch": 4.821428571428571, "grad_norm": 0.5385934682017872, "learning_rate": 1.0703225837340166e-05, "loss": 0.1299, "loss_nan_ranks": 0, "loss_rank_avg": 0.12079325318336487, "step": 2835, "valid_targets_mean": 3281.2, "valid_targets_min": 795 }, { "epoch": 4.829931972789115, "grad_norm": 0.6106526535513195, "learning_rate": 1.0628213775178561e-05, "loss": 0.1218, "loss_nan_ranks": 0, "loss_rank_avg": 0.12414602935314178, "step": 2840, "valid_targets_mean": 2841.2, "valid_targets_min": 602 }, { "epoch": 4.83843537414966, "grad_norm": 0.5093217844857241, "learning_rate": 1.055337025943244e-05, "loss": 0.1408, "loss_nan_ranks": 0, "loss_rank_avg": 0.140962153673172, "step": 2845, "valid_targets_mean": 4046.6, "valid_targets_min": 1090 }, { "epoch": 4.846938775510204, "grad_norm": 0.5601063982178885, "learning_rate": 1.0478696636121231e-05, "loss": 0.1236, "loss_nan_ranks": 0, "loss_rank_avg": 0.13058549165725708, "step": 2850, "valid_targets_mean": 2946.1, "valid_targets_min": 787 }, { "epoch": 4.855442176870748, "grad_norm": 0.5490008558122706, "learning_rate": 1.0404194248208934e-05, "loss": 0.1326, "loss_nan_ranks": 0, "loss_rank_avg": 0.12004873156547546, "step": 2855, "valid_targets_mean": 3107.6, "valid_targets_min": 1576 }, { "epoch": 4.863945578231292, "grad_norm": 0.5390824170618834, "learning_rate": 1.0329864435579982e-05, "loss": 0.1354, "loss_nan_ranks": 0, "loss_rank_avg": 0.1494147628545761, "step": 2860, "valid_targets_mean": 3607.8, "valid_targets_min": 883 }, { "epoch": 4.872448979591836, "grad_norm": 0.507051514951129, "learning_rate": 1.0255708535015137e-05, "loss": 0.1287, "loss_nan_ranks": 0, "loss_rank_avg": 0.14024758338928223, "step": 2865, "valid_targets_mean": 3543.3, "valid_targets_min": 1415 }, { "epoch": 4.880952380952381, "grad_norm": 0.4535295124880974, "learning_rate": 1.0181727880167428e-05, "loss": 0.1256, "loss_nan_ranks": 0, "loss_rank_avg": 0.11601919680833817, "step": 2870, "valid_targets_mean": 4292.6, "valid_targets_min": 1658 }, { "epoch": 4.889455782312925, "grad_norm": 0.6284871405176786, "learning_rate": 1.0107923801538215e-05, "loss": 0.1276, "loss_nan_ranks": 0, "loss_rank_avg": 0.1566929817199707, "step": 2875, "valid_targets_mean": 3509.4, "valid_targets_min": 1154 }, { "epoch": 4.8979591836734695, "grad_norm": 0.8017226677266484, "learning_rate": 1.003429762645321e-05, "loss": 0.1304, "loss_nan_ranks": 0, "loss_rank_avg": 0.12294437736272812, "step": 2880, "valid_targets_mean": 3937.1, "valid_targets_min": 704 }, { "epoch": 4.906462585034014, "grad_norm": 0.49364696050021467, "learning_rate": 9.960850679038632e-06, "loss": 0.1307, "loss_nan_ranks": 0, "loss_rank_avg": 0.12457674741744995, "step": 2885, "valid_targets_mean": 3758.8, "valid_targets_min": 1532 }, { "epoch": 4.914965986394558, "grad_norm": 0.4548630723446227, "learning_rate": 9.887584280197411e-06, "loss": 0.1363, "loss_nan_ranks": 0, "loss_rank_avg": 0.159095898270607, "step": 2890, "valid_targets_mean": 4785.4, "valid_targets_min": 1638 }, { "epoch": 4.923469387755102, "grad_norm": 0.5740124878344341, "learning_rate": 9.814499747585373e-06, "loss": 0.113, "loss_nan_ranks": 0, "loss_rank_avg": 0.13639631867408752, "step": 2895, "valid_targets_mean": 3424.3, "valid_targets_min": 1593 }, { "epoch": 4.931972789115647, "grad_norm": 0.5928533009251364, "learning_rate": 9.741598395587606e-06, "loss": 0.1315, "loss_nan_ranks": 0, "loss_rank_avg": 0.1397685408592224, "step": 2900, "valid_targets_mean": 3337.0, "valid_targets_min": 1140 }, { "epoch": 4.940476190476191, "grad_norm": 0.4832053251048456, "learning_rate": 9.668881535294792e-06, "loss": 0.1255, "loss_nan_ranks": 0, "loss_rank_avg": 0.11467613279819489, "step": 2905, "valid_targets_mean": 3527.8, "valid_targets_min": 1355 }, { "epoch": 4.948979591836735, "grad_norm": 0.5194202009100961, "learning_rate": 9.596350474479625e-06, "loss": 0.1296, "loss_nan_ranks": 0, "loss_rank_avg": 0.17165853083133698, "step": 2910, "valid_targets_mean": 4053.4, "valid_targets_min": 1254 }, { "epoch": 4.957482993197279, "grad_norm": 0.4710233237676264, "learning_rate": 9.52400651757331e-06, "loss": 0.1268, "loss_nan_ranks": 0, "loss_rank_avg": 0.13677963614463806, "step": 2915, "valid_targets_mean": 4633.2, "valid_targets_min": 1389 }, { "epoch": 4.965986394557823, "grad_norm": 0.6026856180553531, "learning_rate": 9.451850965642073e-06, "loss": 0.1251, "loss_nan_ranks": 0, "loss_rank_avg": 0.16165249049663544, "step": 2920, "valid_targets_mean": 3169.5, "valid_targets_min": 1016 }, { "epoch": 4.974489795918368, "grad_norm": 0.5579194459953276, "learning_rate": 9.379885116363786e-06, "loss": 0.1331, "loss_nan_ranks": 0, "loss_rank_avg": 0.13458088040351868, "step": 2925, "valid_targets_mean": 3184.6, "valid_targets_min": 1217 }, { "epoch": 4.982993197278912, "grad_norm": 0.6099184803160398, "learning_rate": 9.308110264004625e-06, "loss": 0.1287, "loss_nan_ranks": 0, "loss_rank_avg": 0.13990472257137299, "step": 2930, "valid_targets_mean": 2672.0, "valid_targets_min": 648 }, { "epoch": 4.991496598639456, "grad_norm": 0.5643685144945373, "learning_rate": 9.236527699395803e-06, "loss": 0.1286, "loss_nan_ranks": 0, "loss_rank_avg": 0.14728853106498718, "step": 2935, "valid_targets_mean": 3404.2, "valid_targets_min": 1531 }, { "epoch": 5.0, "grad_norm": 0.49184592411521516, "learning_rate": 9.165138709910338e-06, "loss": 0.1223, "loss_nan_ranks": 0, "loss_rank_avg": 0.12404905259609222, "step": 2940, "valid_targets_mean": 3728.0, "valid_targets_min": 1129 }, { "epoch": 5.008503401360544, "grad_norm": 0.460373687869048, "learning_rate": 9.093944579439882e-06, "loss": 0.1115, "loss_nan_ranks": 0, "loss_rank_avg": 0.11780281364917755, "step": 2945, "valid_targets_mean": 4433.4, "valid_targets_min": 1551 }, { "epoch": 5.017006802721088, "grad_norm": 0.5141394604653041, "learning_rate": 9.022946588371688e-06, "loss": 0.1143, "loss_nan_ranks": 0, "loss_rank_avg": 0.11578322947025299, "step": 2950, "valid_targets_mean": 3810.8, "valid_targets_min": 792 }, { "epoch": 5.025510204081633, "grad_norm": 0.6119126642644851, "learning_rate": 8.952146013565532e-06, "loss": 0.1291, "loss_nan_ranks": 0, "loss_rank_avg": 0.11888520419597626, "step": 2955, "valid_targets_mean": 3330.3, "valid_targets_min": 1196 }, { "epoch": 5.034013605442177, "grad_norm": 0.5334163364241725, "learning_rate": 8.881544128330777e-06, "loss": 0.124, "loss_nan_ranks": 0, "loss_rank_avg": 0.10936582833528519, "step": 2960, "valid_targets_mean": 3843.6, "valid_targets_min": 1332 }, { "epoch": 5.042517006802721, "grad_norm": 0.5207414438668616, "learning_rate": 8.81114220240346e-06, "loss": 0.1163, "loss_nan_ranks": 0, "loss_rank_avg": 0.09396034479141235, "step": 2965, "valid_targets_mean": 3615.5, "valid_targets_min": 1598 }, { "epoch": 5.051020408163265, "grad_norm": 0.5325192027606288, "learning_rate": 8.740941501923454e-06, "loss": 0.1104, "loss_nan_ranks": 0, "loss_rank_avg": 0.11093772947788239, "step": 2970, "valid_targets_mean": 3633.8, "valid_targets_min": 1334 }, { "epoch": 5.059523809523809, "grad_norm": 0.5227116634294291, "learning_rate": 8.6709432894117e-06, "loss": 0.1076, "loss_nan_ranks": 0, "loss_rank_avg": 0.11531760543584824, "step": 2975, "valid_targets_mean": 4427.8, "valid_targets_min": 1586 }, { "epoch": 5.068027210884353, "grad_norm": 0.54169564088552, "learning_rate": 8.601148823747516e-06, "loss": 0.1112, "loss_nan_ranks": 0, "loss_rank_avg": 0.10472555458545685, "step": 2980, "valid_targets_mean": 3638.6, "valid_targets_min": 1494 }, { "epoch": 5.076530612244898, "grad_norm": 0.614347963039127, "learning_rate": 8.531559360145942e-06, "loss": 0.1139, "loss_nan_ranks": 0, "loss_rank_avg": 0.11521926522254944, "step": 2985, "valid_targets_mean": 3453.6, "valid_targets_min": 1551 }, { "epoch": 5.085034013605442, "grad_norm": 0.5700921400342378, "learning_rate": 8.462176150135168e-06, "loss": 0.1356, "loss_nan_ranks": 0, "loss_rank_avg": 0.11983014643192291, "step": 2990, "valid_targets_mean": 3673.4, "valid_targets_min": 1312 }, { "epoch": 5.093537414965986, "grad_norm": 0.5606850774518538, "learning_rate": 8.393000441534036e-06, "loss": 0.1218, "loss_nan_ranks": 0, "loss_rank_avg": 0.1205582469701767, "step": 2995, "valid_targets_mean": 3382.2, "valid_targets_min": 1572 }, { "epoch": 5.1020408163265305, "grad_norm": 0.58308967535263, "learning_rate": 8.324033478429559e-06, "loss": 0.1143, "loss_nan_ranks": 0, "loss_rank_avg": 0.10241550207138062, "step": 3000, "valid_targets_mean": 3517.1, "valid_targets_min": 1789 }, { "epoch": 5.110544217687075, "grad_norm": 0.5010560317558209, "learning_rate": 8.25527650115461e-06, "loss": 0.1297, "loss_nan_ranks": 0, "loss_rank_avg": 0.14672619104385376, "step": 3005, "valid_targets_mean": 4090.6, "valid_targets_min": 613 }, { "epoch": 5.119047619047619, "grad_norm": 0.5428848219846862, "learning_rate": 8.186730746265577e-06, "loss": 0.1186, "loss_nan_ranks": 0, "loss_rank_avg": 0.09942807257175446, "step": 3010, "valid_targets_mean": 3168.2, "valid_targets_min": 1170 }, { "epoch": 5.127551020408164, "grad_norm": 0.51701896739521, "learning_rate": 8.118397446520103e-06, "loss": 0.1209, "loss_nan_ranks": 0, "loss_rank_avg": 0.11356031149625778, "step": 3015, "valid_targets_mean": 3822.1, "valid_targets_min": 1330 }, { "epoch": 5.136054421768708, "grad_norm": 0.5610298521254529, "learning_rate": 8.050277830854984e-06, "loss": 0.1177, "loss_nan_ranks": 0, "loss_rank_avg": 0.10268589854240417, "step": 3020, "valid_targets_mean": 3365.3, "valid_targets_min": 1473 }, { "epoch": 5.144557823129252, "grad_norm": 0.5147852147560592, "learning_rate": 7.982373124363984e-06, "loss": 0.1125, "loss_nan_ranks": 0, "loss_rank_avg": 0.11522484570741653, "step": 3025, "valid_targets_mean": 3669.4, "valid_targets_min": 325 }, { "epoch": 5.153061224489796, "grad_norm": 0.5551663697519054, "learning_rate": 7.914684548275875e-06, "loss": 0.1094, "loss_nan_ranks": 0, "loss_rank_avg": 0.11051298677921295, "step": 3030, "valid_targets_mean": 3926.8, "valid_targets_min": 861 }, { "epoch": 5.16156462585034, "grad_norm": 0.7995351940000094, "learning_rate": 7.847213319932425e-06, "loss": 0.1271, "loss_nan_ranks": 0, "loss_rank_avg": 0.12783026695251465, "step": 3035, "valid_targets_mean": 4223.2, "valid_targets_min": 1160 }, { "epoch": 5.170068027210885, "grad_norm": 0.5433303920121849, "learning_rate": 7.779960652766534e-06, "loss": 0.1247, "loss_nan_ranks": 0, "loss_rank_avg": 0.11100686341524124, "step": 3040, "valid_targets_mean": 3678.4, "valid_targets_min": 1334 }, { "epoch": 5.178571428571429, "grad_norm": 0.5233906234955884, "learning_rate": 7.7129277562804e-06, "loss": 0.1151, "loss_nan_ranks": 0, "loss_rank_avg": 0.12264975905418396, "step": 3045, "valid_targets_mean": 3809.6, "valid_targets_min": 875 }, { "epoch": 5.187074829931973, "grad_norm": 0.5461499007910949, "learning_rate": 7.646115836023744e-06, "loss": 0.1157, "loss_nan_ranks": 0, "loss_rank_avg": 0.12836602330207825, "step": 3050, "valid_targets_mean": 4164.1, "valid_targets_min": 1297 }, { "epoch": 5.195578231292517, "grad_norm": 0.4966515297253701, "learning_rate": 7.5795260935721755e-06, "loss": 0.1177, "loss_nan_ranks": 0, "loss_rank_avg": 0.12989744544029236, "step": 3055, "valid_targets_mean": 4977.2, "valid_targets_min": 1325 }, { "epoch": 5.204081632653061, "grad_norm": 0.5603026881528321, "learning_rate": 7.5131597265055585e-06, "loss": 0.1146, "loss_nan_ranks": 0, "loss_rank_avg": 0.13274753093719482, "step": 3060, "valid_targets_mean": 3628.2, "valid_targets_min": 1993 }, { "epoch": 5.212585034013605, "grad_norm": 0.4915563280912599, "learning_rate": 7.447017928386453e-06, "loss": 0.1291, "loss_nan_ranks": 0, "loss_rank_avg": 0.10731866955757141, "step": 3065, "valid_targets_mean": 3817.6, "valid_targets_min": 1266 }, { "epoch": 5.22108843537415, "grad_norm": 0.5880203513035192, "learning_rate": 7.381101888738693e-06, "loss": 0.1172, "loss_nan_ranks": 0, "loss_rank_avg": 0.13712306320667267, "step": 3070, "valid_targets_mean": 3312.9, "valid_targets_min": 429 }, { "epoch": 5.229591836734694, "grad_norm": 0.6452402993864961, "learning_rate": 7.315412793025951e-06, "loss": 0.1191, "loss_nan_ranks": 0, "loss_rank_avg": 0.11051145941019058, "step": 3075, "valid_targets_mean": 3440.4, "valid_targets_min": 604 }, { "epoch": 5.238095238095238, "grad_norm": 0.47909386074241567, "learning_rate": 7.24995182263045e-06, "loss": 0.1125, "loss_nan_ranks": 0, "loss_rank_avg": 0.11070841550827026, "step": 3080, "valid_targets_mean": 4483.2, "valid_targets_min": 1584 }, { "epoch": 5.246598639455782, "grad_norm": 0.5091807283304515, "learning_rate": 7.184720154831706e-06, "loss": 0.1371, "loss_nan_ranks": 0, "loss_rank_avg": 0.12383826076984406, "step": 3085, "valid_targets_mean": 4121.9, "valid_targets_min": 1748 }, { "epoch": 5.255102040816326, "grad_norm": 0.5561391846264628, "learning_rate": 7.119718962785349e-06, "loss": 0.11, "loss_nan_ranks": 0, "loss_rank_avg": 0.10299091786146164, "step": 3090, "valid_targets_mean": 3107.9, "valid_targets_min": 1591 }, { "epoch": 5.263605442176871, "grad_norm": 0.5439361172002423, "learning_rate": 7.054949415502037e-06, "loss": 0.1168, "loss_nan_ranks": 0, "loss_rank_avg": 0.14960172772407532, "step": 3095, "valid_targets_mean": 4154.1, "valid_targets_min": 1514 }, { "epoch": 5.272108843537415, "grad_norm": 0.5055115783208214, "learning_rate": 6.990412677826404e-06, "loss": 0.1269, "loss_nan_ranks": 0, "loss_rank_avg": 0.13446712493896484, "step": 3100, "valid_targets_mean": 4222.0, "valid_targets_min": 1577 }, { "epoch": 5.280612244897959, "grad_norm": 0.5051797282464314, "learning_rate": 6.926109910416153e-06, "loss": 0.1059, "loss_nan_ranks": 0, "loss_rank_avg": 0.11003969609737396, "step": 3105, "valid_targets_mean": 3936.0, "valid_targets_min": 2152 }, { "epoch": 5.289115646258503, "grad_norm": 0.6721874443565838, "learning_rate": 6.862042269721158e-06, "loss": 0.1084, "loss_nan_ranks": 0, "loss_rank_avg": 0.11099831759929657, "step": 3110, "valid_targets_mean": 3415.6, "valid_targets_min": 1058 }, { "epoch": 5.2976190476190474, "grad_norm": 0.5394489454464912, "learning_rate": 6.798210907962655e-06, "loss": 0.1177, "loss_nan_ranks": 0, "loss_rank_avg": 0.12719398736953735, "step": 3115, "valid_targets_mean": 3460.3, "valid_targets_min": 1271 }, { "epoch": 5.3061224489795915, "grad_norm": 0.48288105959872535, "learning_rate": 6.734616973112549e-06, "loss": 0.1044, "loss_nan_ranks": 0, "loss_rank_avg": 0.10736523568630219, "step": 3120, "valid_targets_mean": 4715.4, "valid_targets_min": 1485 }, { "epoch": 5.3146258503401365, "grad_norm": 0.5025747733371888, "learning_rate": 6.671261608872737e-06, "loss": 0.1082, "loss_nan_ranks": 0, "loss_rank_avg": 0.10189585387706757, "step": 3125, "valid_targets_mean": 3567.2, "valid_targets_min": 1479 }, { "epoch": 5.3231292517006805, "grad_norm": 0.5985343176195231, "learning_rate": 6.60814595465457e-06, "loss": 0.1196, "loss_nan_ranks": 0, "loss_rank_avg": 0.11069802939891815, "step": 3130, "valid_targets_mean": 3020.3, "valid_targets_min": 1210 }, { "epoch": 5.331632653061225, "grad_norm": 0.5711246776535795, "learning_rate": 6.545271145558336e-06, "loss": 0.1212, "loss_nan_ranks": 0, "loss_rank_avg": 0.1153416782617569, "step": 3135, "valid_targets_mean": 3687.6, "valid_targets_min": 354 }, { "epoch": 5.340136054421769, "grad_norm": 0.5442736841286343, "learning_rate": 6.482638312352867e-06, "loss": 0.1162, "loss_nan_ranks": 0, "loss_rank_avg": 0.1518375724554062, "step": 3140, "valid_targets_mean": 3984.1, "valid_targets_min": 1712 }, { "epoch": 5.348639455782313, "grad_norm": 0.5921573966375302, "learning_rate": 6.420248581455184e-06, "loss": 0.112, "loss_nan_ranks": 0, "loss_rank_avg": 0.12098226696252823, "step": 3145, "valid_targets_mean": 3470.0, "valid_targets_min": 1603 }, { "epoch": 5.357142857142857, "grad_norm": 0.5697364605515239, "learning_rate": 6.358103074910238e-06, "loss": 0.1331, "loss_nan_ranks": 0, "loss_rank_avg": 0.13729847967624664, "step": 3150, "valid_targets_mean": 3894.2, "valid_targets_min": 1645 }, { "epoch": 5.365646258503402, "grad_norm": 0.4871709662606649, "learning_rate": 6.296202910370757e-06, "loss": 0.1215, "loss_nan_ranks": 0, "loss_rank_avg": 0.13507282733917236, "step": 3155, "valid_targets_mean": 4424.4, "valid_targets_min": 1180 }, { "epoch": 5.374149659863946, "grad_norm": 0.577744628501453, "learning_rate": 6.234549201077124e-06, "loss": 0.1104, "loss_nan_ranks": 0, "loss_rank_avg": 0.10959557443857193, "step": 3160, "valid_targets_mean": 3010.2, "valid_targets_min": 1496 }, { "epoch": 5.38265306122449, "grad_norm": 0.5829555774391696, "learning_rate": 6.173143055837345e-06, "loss": 0.1092, "loss_nan_ranks": 0, "loss_rank_avg": 0.11792930960655212, "step": 3165, "valid_targets_mean": 3196.4, "valid_targets_min": 721 }, { "epoch": 5.391156462585034, "grad_norm": 0.4993975366287769, "learning_rate": 6.111985579007149e-06, "loss": 0.1249, "loss_nan_ranks": 0, "loss_rank_avg": 0.12624284625053406, "step": 3170, "valid_targets_mean": 4134.6, "valid_targets_min": 1236 }, { "epoch": 5.399659863945578, "grad_norm": 0.5107866919709771, "learning_rate": 6.051077870470068e-06, "loss": 0.1168, "loss_nan_ranks": 0, "loss_rank_avg": 0.11668853461742401, "step": 3175, "valid_targets_mean": 4047.1, "valid_targets_min": 1577 }, { "epoch": 5.408163265306122, "grad_norm": 0.5252474663513425, "learning_rate": 5.990421025617716e-06, "loss": 0.1102, "loss_nan_ranks": 0, "loss_rank_avg": 0.09952177107334137, "step": 3180, "valid_targets_mean": 3666.6, "valid_targets_min": 1741 }, { "epoch": 5.416666666666667, "grad_norm": 0.5015726628558949, "learning_rate": 5.930016135330052e-06, "loss": 0.1184, "loss_nan_ranks": 0, "loss_rank_avg": 0.11919872462749481, "step": 3185, "valid_targets_mean": 4237.8, "valid_targets_min": 1198 }, { "epoch": 5.425170068027211, "grad_norm": 0.4769102709235795, "learning_rate": 5.869864285955771e-06, "loss": 0.1304, "loss_nan_ranks": 0, "loss_rank_avg": 0.10949502885341644, "step": 3190, "valid_targets_mean": 4599.4, "valid_targets_min": 1069 }, { "epoch": 5.433673469387755, "grad_norm": 0.5498618632742693, "learning_rate": 5.80996655929277e-06, "loss": 0.1189, "loss_nan_ranks": 0, "loss_rank_avg": 0.12536795437335968, "step": 3195, "valid_targets_mean": 3588.6, "valid_targets_min": 1136 }, { "epoch": 5.442176870748299, "grad_norm": 0.545561483870248, "learning_rate": 5.750324032568677e-06, "loss": 0.1206, "loss_nan_ranks": 0, "loss_rank_avg": 0.12246537208557129, "step": 3200, "valid_targets_mean": 3596.1, "valid_targets_min": 1312 }, { "epoch": 5.450680272108843, "grad_norm": 0.6040925588691938, "learning_rate": 5.6909377784215035e-06, "loss": 0.1202, "loss_nan_ranks": 0, "loss_rank_avg": 0.10457558184862137, "step": 3205, "valid_targets_mean": 2857.7, "valid_targets_min": 1024 }, { "epoch": 5.459183673469388, "grad_norm": 0.5913736902327493, "learning_rate": 5.631808864880342e-06, "loss": 0.1241, "loss_nan_ranks": 0, "loss_rank_avg": 0.11675500869750977, "step": 3210, "valid_targets_mean": 3617.6, "valid_targets_min": 1573 }, { "epoch": 5.467687074829932, "grad_norm": 0.564857354499183, "learning_rate": 5.5729383553461315e-06, "loss": 0.1141, "loss_nan_ranks": 0, "loss_rank_avg": 0.10473236441612244, "step": 3215, "valid_targets_mean": 3246.6, "valid_targets_min": 1352 }, { "epoch": 5.476190476190476, "grad_norm": 0.6156419129927186, "learning_rate": 5.5143273085725894e-06, "loss": 0.1397, "loss_nan_ranks": 0, "loss_rank_avg": 0.11393928527832031, "step": 3220, "valid_targets_mean": 2748.5, "valid_targets_min": 1241 }, { "epoch": 5.48469387755102, "grad_norm": 0.45521005132445264, "learning_rate": 5.45597677864711e-06, "loss": 0.1118, "loss_nan_ranks": 0, "loss_rank_avg": 0.10282590985298157, "step": 3225, "valid_targets_mean": 4610.5, "valid_targets_min": 1112 }, { "epoch": 5.493197278911564, "grad_norm": 0.5837854371759927, "learning_rate": 5.397887814971854e-06, "loss": 0.1219, "loss_nan_ranks": 0, "loss_rank_avg": 0.12497810274362564, "step": 3230, "valid_targets_mean": 3359.5, "valid_targets_min": 1305 }, { "epoch": 5.5017006802721085, "grad_norm": 0.5527734282651293, "learning_rate": 5.34006146224485e-06, "loss": 0.1252, "loss_nan_ranks": 0, "loss_rank_avg": 0.1028062105178833, "step": 3235, "valid_targets_mean": 3404.5, "valid_targets_min": 1249 }, { "epoch": 5.510204081632653, "grad_norm": 0.5266096072280819, "learning_rate": 5.282498760441219e-06, "loss": 0.1216, "loss_nan_ranks": 0, "loss_rank_avg": 0.11795396357774734, "step": 3240, "valid_targets_mean": 3558.4, "valid_targets_min": 1270 }, { "epoch": 5.5187074829931975, "grad_norm": 0.540851535403909, "learning_rate": 5.225200744794465e-06, "loss": 0.1414, "loss_nan_ranks": 0, "loss_rank_avg": 0.17452237010002136, "step": 3245, "valid_targets_mean": 4261.2, "valid_targets_min": 1507 }, { "epoch": 5.5272108843537415, "grad_norm": 0.5182603091934628, "learning_rate": 5.168168445777839e-06, "loss": 0.1297, "loss_nan_ranks": 0, "loss_rank_avg": 0.1529075652360916, "step": 3250, "valid_targets_mean": 4521.4, "valid_targets_min": 389 }, { "epoch": 5.535714285714286, "grad_norm": 0.5805823631890119, "learning_rate": 5.111402889085852e-06, "loss": 0.1178, "loss_nan_ranks": 0, "loss_rank_avg": 0.14389967918395996, "step": 3255, "valid_targets_mean": 3602.2, "valid_targets_min": 1451 }, { "epoch": 5.54421768707483, "grad_norm": 0.5729116752291277, "learning_rate": 5.054905095615779e-06, "loss": 0.1156, "loss_nan_ranks": 0, "loss_rank_avg": 0.11263558268547058, "step": 3260, "valid_targets_mean": 3662.2, "valid_targets_min": 1362 }, { "epoch": 5.552721088435375, "grad_norm": 0.5902153815232817, "learning_rate": 4.9986760814493315e-06, "loss": 0.1151, "loss_nan_ranks": 0, "loss_rank_avg": 0.10420026630163193, "step": 3265, "valid_targets_mean": 3085.2, "valid_targets_min": 1562 }, { "epoch": 5.561224489795919, "grad_norm": 0.5079041365032244, "learning_rate": 4.94271685783438e-06, "loss": 0.1285, "loss_nan_ranks": 0, "loss_rank_avg": 0.10216909646987915, "step": 3270, "valid_targets_mean": 3791.7, "valid_targets_min": 1329 }, { "epoch": 5.569727891156463, "grad_norm": 0.5323053118094618, "learning_rate": 4.88702843116674e-06, "loss": 0.1108, "loss_nan_ranks": 0, "loss_rank_avg": 0.11844904720783234, "step": 3275, "valid_targets_mean": 4096.2, "valid_targets_min": 717 }, { "epoch": 5.578231292517007, "grad_norm": 0.5913613540592834, "learning_rate": 4.831611802972112e-06, "loss": 0.1091, "loss_nan_ranks": 0, "loss_rank_avg": 0.12086708843708038, "step": 3280, "valid_targets_mean": 3125.9, "valid_targets_min": 1140 }, { "epoch": 5.586734693877551, "grad_norm": 0.6067435787352505, "learning_rate": 4.776467969888041e-06, "loss": 0.1404, "loss_nan_ranks": 0, "loss_rank_avg": 0.1235356330871582, "step": 3285, "valid_targets_mean": 2861.3, "valid_targets_min": 861 }, { "epoch": 5.595238095238095, "grad_norm": 0.6143172537137376, "learning_rate": 4.721597923646008e-06, "loss": 0.1218, "loss_nan_ranks": 0, "loss_rank_avg": 0.13739518821239471, "step": 3290, "valid_targets_mean": 3314.9, "valid_targets_min": 724 }, { "epoch": 5.603741496598639, "grad_norm": 0.5285568105683806, "learning_rate": 4.667002651053582e-06, "loss": 0.1103, "loss_nan_ranks": 0, "loss_rank_avg": 0.10752934962511063, "step": 3295, "valid_targets_mean": 3720.3, "valid_targets_min": 1406 }, { "epoch": 5.612244897959184, "grad_norm": 0.5479976862189573, "learning_rate": 4.612683133976692e-06, "loss": 0.128, "loss_nan_ranks": 0, "loss_rank_avg": 0.15180706977844238, "step": 3300, "valid_targets_mean": 3768.8, "valid_targets_min": 1531 }, { "epoch": 5.620748299319728, "grad_norm": 0.5462163829552453, "learning_rate": 4.5586403493219365e-06, "loss": 0.1159, "loss_nan_ranks": 0, "loss_rank_avg": 0.10777892172336578, "step": 3305, "valid_targets_mean": 3076.4, "valid_targets_min": 988 }, { "epoch": 5.629251700680272, "grad_norm": 0.5243365624661317, "learning_rate": 4.504875269019038e-06, "loss": 0.118, "loss_nan_ranks": 0, "loss_rank_avg": 0.1242019534111023, "step": 3310, "valid_targets_mean": 4469.8, "valid_targets_min": 1440 }, { "epoch": 5.637755102040816, "grad_norm": 0.6223327575084228, "learning_rate": 4.451388860003374e-06, "loss": 0.119, "loss_nan_ranks": 0, "loss_rank_avg": 0.14461229741573334, "step": 3315, "valid_targets_mean": 3680.9, "valid_targets_min": 759 }, { "epoch": 5.646258503401361, "grad_norm": 0.5627481662897891, "learning_rate": 4.398182084198561e-06, "loss": 0.1315, "loss_nan_ranks": 0, "loss_rank_avg": 0.11661049723625183, "step": 3320, "valid_targets_mean": 3855.8, "valid_targets_min": 1624 }, { "epoch": 5.654761904761905, "grad_norm": 0.5770944346437502, "learning_rate": 4.345255898499172e-06, "loss": 0.1296, "loss_nan_ranks": 0, "loss_rank_avg": 0.13459742069244385, "step": 3325, "valid_targets_mean": 3598.4, "valid_targets_min": 1468 }, { "epoch": 5.663265306122449, "grad_norm": 0.6063654059969268, "learning_rate": 4.292611254753509e-06, "loss": 0.1173, "loss_nan_ranks": 0, "loss_rank_avg": 0.1045822948217392, "step": 3330, "valid_targets_mean": 4255.0, "valid_targets_min": 1895 }, { "epoch": 5.671768707482993, "grad_norm": 0.6199385704660482, "learning_rate": 4.24024909974651e-06, "loss": 0.1261, "loss_nan_ranks": 0, "loss_rank_avg": 0.11114975064992905, "step": 3335, "valid_targets_mean": 2667.2, "valid_targets_min": 1101 }, { "epoch": 5.680272108843537, "grad_norm": 0.5741341263715167, "learning_rate": 4.188170375182705e-06, "loss": 0.1214, "loss_nan_ranks": 0, "loss_rank_avg": 0.13209852576255798, "step": 3340, "valid_targets_mean": 3331.6, "valid_targets_min": 766 }, { "epoch": 5.688775510204081, "grad_norm": 0.5849953260351614, "learning_rate": 4.136376017669281e-06, "loss": 0.1384, "loss_nan_ranks": 0, "loss_rank_avg": 0.19509027898311615, "step": 3345, "valid_targets_mean": 4514.0, "valid_targets_min": 1096 }, { "epoch": 5.697278911564625, "grad_norm": 0.5184855624946975, "learning_rate": 4.084866958699247e-06, "loss": 0.1187, "loss_nan_ranks": 0, "loss_rank_avg": 0.11184950917959213, "step": 3350, "valid_targets_mean": 3622.2, "valid_targets_min": 1657 }, { "epoch": 5.70578231292517, "grad_norm": 0.4729255009742215, "learning_rate": 4.0336441246346684e-06, "loss": 0.121, "loss_nan_ranks": 0, "loss_rank_avg": 0.12170318514108658, "step": 3355, "valid_targets_mean": 4347.8, "valid_targets_min": 1545 }, { "epoch": 5.714285714285714, "grad_norm": 0.4886970159573961, "learning_rate": 3.982708436690001e-06, "loss": 0.112, "loss_nan_ranks": 0, "loss_rank_avg": 0.10606701672077179, "step": 3360, "valid_targets_mean": 4402.9, "valid_targets_min": 1266 }, { "epoch": 5.7227891156462585, "grad_norm": 0.5492917249221348, "learning_rate": 3.932060810915563e-06, "loss": 0.1298, "loss_nan_ranks": 0, "loss_rank_avg": 0.12230627238750458, "step": 3365, "valid_targets_mean": 3404.1, "valid_targets_min": 1157 }, { "epoch": 5.7312925170068025, "grad_norm": 0.5515095288619949, "learning_rate": 3.881702158181015e-06, "loss": 0.1127, "loss_nan_ranks": 0, "loss_rank_avg": 0.09741039574146271, "step": 3370, "valid_targets_mean": 3078.1, "valid_targets_min": 1540 }, { "epoch": 5.739795918367347, "grad_norm": 0.5994347022720987, "learning_rate": 3.831633384159006e-06, "loss": 0.114, "loss_nan_ranks": 0, "loss_rank_avg": 0.10247445851564407, "step": 3375, "valid_targets_mean": 2756.9, "valid_targets_min": 750 }, { "epoch": 5.7482993197278915, "grad_norm": 0.5662527226383535, "learning_rate": 3.7818553893088596e-06, "loss": 0.1228, "loss_nan_ranks": 0, "loss_rank_avg": 0.1331837773323059, "step": 3380, "valid_targets_mean": 4074.8, "valid_targets_min": 1109 }, { "epoch": 5.756802721088436, "grad_norm": 0.6312403630388446, "learning_rate": 3.7323690688604153e-06, "loss": 0.1137, "loss_nan_ranks": 0, "loss_rank_avg": 0.12030863016843796, "step": 3385, "valid_targets_mean": 2706.7, "valid_targets_min": 1132 }, { "epoch": 5.76530612244898, "grad_norm": 0.4665440158007456, "learning_rate": 3.6831753127978974e-06, "loss": 0.1125, "loss_nan_ranks": 0, "loss_rank_avg": 0.11458925902843475, "step": 3390, "valid_targets_mean": 4522.5, "valid_targets_min": 1805 }, { "epoch": 5.773809523809524, "grad_norm": 0.5271545621260861, "learning_rate": 3.634275005843935e-06, "loss": 0.1109, "loss_nan_ranks": 0, "loss_rank_avg": 0.09652923047542572, "step": 3395, "valid_targets_mean": 3248.9, "valid_targets_min": 883 }, { "epoch": 5.782312925170068, "grad_norm": 0.5145222459804143, "learning_rate": 3.585669027443608e-06, "loss": 0.1164, "loss_nan_ranks": 0, "loss_rank_avg": 0.10808805376291275, "step": 3400, "valid_targets_mean": 3782.8, "valid_targets_min": 294 }, { "epoch": 5.790816326530612, "grad_norm": 0.6087405762550093, "learning_rate": 3.537358251748695e-06, "loss": 0.1298, "loss_nan_ranks": 0, "loss_rank_avg": 0.15609332919120789, "step": 3405, "valid_targets_mean": 3078.8, "valid_targets_min": 1245 }, { "epoch": 5.799319727891157, "grad_norm": 0.493673691287559, "learning_rate": 3.489343547601882e-06, "loss": 0.1193, "loss_nan_ranks": 0, "loss_rank_avg": 0.11217699944972992, "step": 3410, "valid_targets_mean": 4235.0, "valid_targets_min": 1172 }, { "epoch": 5.807823129251701, "grad_norm": 0.5330291348481382, "learning_rate": 3.4416257785211983e-06, "loss": 0.1133, "loss_nan_ranks": 0, "loss_rank_avg": 0.08841429650783539, "step": 3415, "valid_targets_mean": 3745.4, "valid_targets_min": 1474 }, { "epoch": 5.816326530612245, "grad_norm": 0.57971467987211, "learning_rate": 3.3942058026844472e-06, "loss": 0.126, "loss_nan_ranks": 0, "loss_rank_avg": 0.15836650133132935, "step": 3420, "valid_targets_mean": 3547.6, "valid_targets_min": 1208 }, { "epoch": 5.824829931972789, "grad_norm": 0.47906681279107716, "learning_rate": 3.3470844729137886e-06, "loss": 0.1217, "loss_nan_ranks": 0, "loss_rank_avg": 0.10378694534301758, "step": 3425, "valid_targets_mean": 4480.3, "valid_targets_min": 1556 }, { "epoch": 5.833333333333333, "grad_norm": 0.5967888879124165, "learning_rate": 3.3002626366603896e-06, "loss": 0.1225, "loss_nan_ranks": 0, "loss_rank_avg": 0.1304030567407608, "step": 3430, "valid_targets_mean": 3002.1, "valid_targets_min": 333 }, { "epoch": 5.841836734693878, "grad_norm": 0.5315803544065215, "learning_rate": 3.253741135989199e-06, "loss": 0.1101, "loss_nan_ranks": 0, "loss_rank_avg": 0.11456482112407684, "step": 3435, "valid_targets_mean": 3406.2, "valid_targets_min": 1408 }, { "epoch": 5.850340136054422, "grad_norm": 0.5617527254427237, "learning_rate": 3.2075208075637953e-06, "loss": 0.1518, "loss_nan_ranks": 0, "loss_rank_avg": 0.13196901977062225, "step": 3440, "valid_targets_mean": 3691.4, "valid_targets_min": 1216 }, { "epoch": 5.858843537414966, "grad_norm": 0.5521550371634127, "learning_rate": 3.161602482631343e-06, "loss": 0.1162, "loss_nan_ranks": 0, "loss_rank_avg": 0.13317209482192993, "step": 3445, "valid_targets_mean": 4007.6, "valid_targets_min": 1478 }, { "epoch": 5.86734693877551, "grad_norm": 1.6598007447933765, "learning_rate": 3.115986987007622e-06, "loss": 0.1189, "loss_nan_ranks": 0, "loss_rank_avg": 0.11910313367843628, "step": 3450, "valid_targets_mean": 3475.4, "valid_targets_min": 1452 }, { "epoch": 5.875850340136054, "grad_norm": 0.5198857712479822, "learning_rate": 3.0706751410622184e-06, "loss": 0.116, "loss_nan_ranks": 0, "loss_rank_avg": 0.09872958809137344, "step": 3455, "valid_targets_mean": 3633.4, "valid_targets_min": 1608 }, { "epoch": 5.884353741496598, "grad_norm": 0.6586650995065951, "learning_rate": 3.0256677597037253e-06, "loss": 0.1186, "loss_nan_ranks": 0, "loss_rank_avg": 0.15523600578308105, "step": 3460, "valid_targets_mean": 2631.6, "valid_targets_min": 626 }, { "epoch": 5.892857142857143, "grad_norm": 0.5820548403555877, "learning_rate": 2.980965652365122e-06, "loss": 0.1219, "loss_nan_ranks": 0, "loss_rank_avg": 0.12451058626174927, "step": 3465, "valid_targets_mean": 3528.8, "valid_targets_min": 1231 }, { "epoch": 5.901360544217687, "grad_norm": 0.5001256201730465, "learning_rate": 2.936569622989198e-06, "loss": 0.1044, "loss_nan_ranks": 0, "loss_rank_avg": 0.09069167822599411, "step": 3470, "valid_targets_mean": 3679.2, "valid_targets_min": 1597 }, { "epoch": 5.909863945578231, "grad_norm": 0.6527876550739389, "learning_rate": 2.892480470014101e-06, "loss": 0.1173, "loss_nan_ranks": 0, "loss_rank_avg": 0.12368982285261154, "step": 3475, "valid_targets_mean": 2663.8, "valid_targets_min": 1083 }, { "epoch": 5.918367346938775, "grad_norm": 0.6049378944092306, "learning_rate": 2.8486989863589665e-06, "loss": 0.1261, "loss_nan_ranks": 0, "loss_rank_avg": 0.16314776241779327, "step": 3480, "valid_targets_mean": 3331.4, "valid_targets_min": 1199 }, { "epoch": 5.9268707482993195, "grad_norm": 0.5321145816925281, "learning_rate": 2.8052259594096786e-06, "loss": 0.1098, "loss_nan_ranks": 0, "loss_rank_avg": 0.10574959218502045, "step": 3485, "valid_targets_mean": 4042.9, "valid_targets_min": 1737 }, { "epoch": 5.935374149659864, "grad_norm": 0.5249443175372537, "learning_rate": 2.762062171004689e-06, "loss": 0.1169, "loss_nan_ranks": 0, "loss_rank_avg": 0.13219550251960754, "step": 3490, "valid_targets_mean": 3747.8, "valid_targets_min": 1114 }, { "epoch": 5.9438775510204085, "grad_norm": 0.5349877929860054, "learning_rate": 2.719208397420976e-06, "loss": 0.1135, "loss_nan_ranks": 0, "loss_rank_avg": 0.10431113094091415, "step": 3495, "valid_targets_mean": 4021.3, "valid_targets_min": 1584 }, { "epoch": 5.9523809523809526, "grad_norm": 0.615252584404469, "learning_rate": 2.6766654093600554e-06, "loss": 0.1138, "loss_nan_ranks": 0, "loss_rank_avg": 0.10922113060951233, "step": 3500, "valid_targets_mean": 2900.0, "valid_targets_min": 888 }, { "epoch": 5.960884353741497, "grad_norm": 0.5660078177837199, "learning_rate": 2.634433971934145e-06, "loss": 0.1291, "loss_nan_ranks": 0, "loss_rank_avg": 0.16342481970787048, "step": 3505, "valid_targets_mean": 4022.2, "valid_targets_min": 1349 }, { "epoch": 5.969387755102041, "grad_norm": 0.5633990506355825, "learning_rate": 2.592514844652396e-06, "loss": 0.1157, "loss_nan_ranks": 0, "loss_rank_avg": 0.10728654265403748, "step": 3510, "valid_targets_mean": 3335.4, "valid_targets_min": 893 }, { "epoch": 5.977891156462585, "grad_norm": 0.5618270096817878, "learning_rate": 2.5509087814072373e-06, "loss": 0.1139, "loss_nan_ranks": 0, "loss_rank_avg": 0.13099925220012665, "step": 3515, "valid_targets_mean": 3559.8, "valid_targets_min": 1589 }, { "epoch": 5.986394557823129, "grad_norm": 0.5950284042429369, "learning_rate": 2.5096165304608055e-06, "loss": 0.129, "loss_nan_ranks": 0, "loss_rank_avg": 0.11572650074958801, "step": 3520, "valid_targets_mean": 3260.1, "valid_targets_min": 1543 }, { "epoch": 5.994897959183674, "grad_norm": 0.6431959290467469, "learning_rate": 2.468638834431507e-06, "loss": 0.1137, "loss_nan_ranks": 0, "loss_rank_avg": 0.11295954883098602, "step": 3525, "valid_targets_mean": 2737.2, "valid_targets_min": 1360 }, { "epoch": 6.003401360544218, "grad_norm": 0.477579265700717, "learning_rate": 2.427976430280634e-06, "loss": 0.1096, "loss_nan_ranks": 0, "loss_rank_avg": 0.10084202885627747, "step": 3530, "valid_targets_mean": 4324.1, "valid_targets_min": 1427 }, { "epoch": 6.011904761904762, "grad_norm": 0.4454117266637318, "learning_rate": 2.3876300492991456e-06, "loss": 0.1012, "loss_nan_ranks": 0, "loss_rank_avg": 0.09745575487613678, "step": 3535, "valid_targets_mean": 4572.9, "valid_targets_min": 1417 }, { "epoch": 6.020408163265306, "grad_norm": 0.478412233942278, "learning_rate": 2.3476004170944843e-06, "loss": 0.1137, "loss_nan_ranks": 0, "loss_rank_avg": 0.1278717815876007, "step": 3540, "valid_targets_mean": 4723.2, "valid_targets_min": 1093 }, { "epoch": 6.02891156462585, "grad_norm": 0.5184477127041136, "learning_rate": 2.307888253577557e-06, "loss": 0.1101, "loss_nan_ranks": 0, "loss_rank_avg": 0.12066527456045151, "step": 3545, "valid_targets_mean": 4437.1, "valid_targets_min": 1155 }, { "epoch": 6.037414965986395, "grad_norm": 0.5620893513671174, "learning_rate": 2.2684942729497505e-06, "loss": 0.1143, "loss_nan_ranks": 0, "loss_rank_avg": 0.11014530062675476, "step": 3550, "valid_targets_mean": 3719.1, "valid_targets_min": 1521 }, { "epoch": 6.045918367346939, "grad_norm": 0.5352459906510691, "learning_rate": 2.229419183690118e-06, "loss": 0.1118, "loss_nan_ranks": 0, "loss_rank_avg": 0.10845694690942764, "step": 3555, "valid_targets_mean": 3726.8, "valid_targets_min": 1406 }, { "epoch": 6.054421768707483, "grad_norm": 0.55710958865019, "learning_rate": 2.1906636885426293e-06, "loss": 0.1058, "loss_nan_ranks": 0, "loss_rank_avg": 0.1064843237400055, "step": 3560, "valid_targets_mean": 3575.5, "valid_targets_min": 1709 }, { "epoch": 6.062925170068027, "grad_norm": 0.5432557912713459, "learning_rate": 2.1522284845035246e-06, "loss": 0.1056, "loss_nan_ranks": 0, "loss_rank_avg": 0.11107736825942993, "step": 3565, "valid_targets_mean": 3768.4, "valid_targets_min": 738 }, { "epoch": 6.071428571428571, "grad_norm": 0.511605737896378, "learning_rate": 2.1141142628087908e-06, "loss": 0.1113, "loss_nan_ranks": 0, "loss_rank_avg": 0.15048445761203766, "step": 3570, "valid_targets_mean": 5072.7, "valid_targets_min": 1249 }, { "epoch": 6.079931972789115, "grad_norm": 0.5766159647704026, "learning_rate": 2.0763217089217204e-06, "loss": 0.1226, "loss_nan_ranks": 0, "loss_rank_avg": 0.10604619234800339, "step": 3575, "valid_targets_mean": 3533.0, "valid_targets_min": 1648 }, { "epoch": 6.08843537414966, "grad_norm": 0.5836072850396373, "learning_rate": 2.0388515025205912e-06, "loss": 0.1111, "loss_nan_ranks": 0, "loss_rank_avg": 0.12037845700979233, "step": 3580, "valid_targets_mean": 3252.4, "valid_targets_min": 690 }, { "epoch": 6.096938775510204, "grad_norm": 0.6153532334687207, "learning_rate": 2.0017043174864257e-06, "loss": 0.1188, "loss_nan_ranks": 0, "loss_rank_avg": 0.11313758790493011, "step": 3585, "valid_targets_mean": 3177.9, "valid_targets_min": 526 }, { "epoch": 6.105442176870748, "grad_norm": 0.6539832007276991, "learning_rate": 1.9648808218909023e-06, "loss": 0.1239, "loss_nan_ranks": 0, "loss_rank_avg": 0.11016803234815598, "step": 3590, "valid_targets_mean": 3561.9, "valid_targets_min": 851 }, { "epoch": 6.113945578231292, "grad_norm": 0.5088070903468043, "learning_rate": 1.928381677984319e-06, "loss": 0.1424, "loss_nan_ranks": 0, "loss_rank_avg": 0.10234713554382324, "step": 3595, "valid_targets_mean": 3746.4, "valid_targets_min": 1318 }, { "epoch": 6.122448979591836, "grad_norm": 0.5727361664596694, "learning_rate": 1.8922075421836729e-06, "loss": 0.1191, "loss_nan_ranks": 0, "loss_rank_avg": 0.1115289181470871, "step": 3600, "valid_targets_mean": 3681.5, "valid_targets_min": 1477 }, { "epoch": 6.130952380952381, "grad_norm": 0.5703340884857128, "learning_rate": 1.8563590650608908e-06, "loss": 0.1085, "loss_nan_ranks": 0, "loss_rank_avg": 0.11293356120586395, "step": 3605, "valid_targets_mean": 3610.5, "valid_targets_min": 1115 }, { "epoch": 6.139455782312925, "grad_norm": 0.5567638013057162, "learning_rate": 1.8208368913310881e-06, "loss": 0.1208, "loss_nan_ranks": 0, "loss_rank_avg": 0.1489240676164627, "step": 3610, "valid_targets_mean": 4215.0, "valid_targets_min": 1364 }, { "epoch": 6.1479591836734695, "grad_norm": 0.5496607355990576, "learning_rate": 1.7856416598410064e-06, "loss": 0.1368, "loss_nan_ranks": 0, "loss_rank_avg": 0.08839699625968933, "step": 3615, "valid_targets_mean": 3228.2, "valid_targets_min": 1349 }, { "epoch": 6.156462585034014, "grad_norm": 0.6666358234359487, "learning_rate": 1.7507740035575049e-06, "loss": 0.1143, "loss_nan_ranks": 0, "loss_rank_avg": 0.12748566269874573, "step": 3620, "valid_targets_mean": 2800.0, "valid_targets_min": 288 }, { "epoch": 6.164965986394558, "grad_norm": 0.5782864339340296, "learning_rate": 1.7162345495561905e-06, "loss": 0.1288, "loss_nan_ranks": 0, "loss_rank_avg": 0.14760619401931763, "step": 3625, "valid_targets_mean": 3669.2, "valid_targets_min": 1239 }, { "epoch": 6.173469387755102, "grad_norm": 0.5618155339533111, "learning_rate": 1.682023919010125e-06, "loss": 0.1312, "loss_nan_ranks": 0, "loss_rank_avg": 0.09852004796266556, "step": 3630, "valid_targets_mean": 3470.2, "valid_targets_min": 1202 }, { "epoch": 6.181972789115647, "grad_norm": 0.598362631078015, "learning_rate": 1.6481427271786588e-06, "loss": 0.1118, "loss_nan_ranks": 0, "loss_rank_avg": 0.10615670680999756, "step": 3635, "valid_targets_mean": 3053.8, "valid_targets_min": 814 }, { "epoch": 6.190476190476191, "grad_norm": 0.5591508889473271, "learning_rate": 1.6145915833963788e-06, "loss": 0.1153, "loss_nan_ranks": 0, "loss_rank_avg": 0.09319960325956345, "step": 3640, "valid_targets_mean": 3101.5, "valid_targets_min": 1543 }, { "epoch": 6.198979591836735, "grad_norm": 0.5882835479569136, "learning_rate": 1.5813710910621293e-06, "loss": 0.1089, "loss_nan_ranks": 0, "loss_rank_avg": 0.11982224881649017, "step": 3645, "valid_targets_mean": 3055.9, "valid_targets_min": 1361 }, { "epoch": 6.207482993197279, "grad_norm": 0.5792923656094919, "learning_rate": 1.548481847628176e-06, "loss": 0.1195, "loss_nan_ranks": 0, "loss_rank_avg": 0.11135858297348022, "step": 3650, "valid_targets_mean": 3600.5, "valid_targets_min": 1127 }, { "epoch": 6.215986394557823, "grad_norm": 0.5892203254512576, "learning_rate": 1.5159244445894605e-06, "loss": 0.1135, "loss_nan_ranks": 0, "loss_rank_avg": 0.11109749972820282, "step": 3655, "valid_targets_mean": 3371.7, "valid_targets_min": 1418 }, { "epoch": 6.224489795918367, "grad_norm": 0.527490492326501, "learning_rate": 1.4836994674729433e-06, "loss": 0.1075, "loss_nan_ranks": 0, "loss_rank_avg": 0.09896763414144516, "step": 3660, "valid_targets_mean": 3538.0, "valid_targets_min": 1383 }, { "epoch": 6.232993197278912, "grad_norm": 0.563826301919356, "learning_rate": 1.4518074958271e-06, "loss": 0.1229, "loss_nan_ranks": 0, "loss_rank_avg": 0.13025017082691193, "step": 3665, "valid_targets_mean": 3828.9, "valid_targets_min": 1612 }, { "epoch": 6.241496598639456, "grad_norm": 0.5606773143753264, "learning_rate": 1.4202491032114797e-06, "loss": 0.1133, "loss_nan_ranks": 0, "loss_rank_avg": 0.10734811425209045, "step": 3670, "valid_targets_mean": 3267.6, "valid_targets_min": 1532 }, { "epoch": 6.25, "grad_norm": 0.5854260290454237, "learning_rate": 1.389024857186403e-06, "loss": 0.0964, "loss_nan_ranks": 0, "loss_rank_avg": 0.09467275440692902, "step": 3675, "valid_targets_mean": 3203.1, "valid_targets_min": 668 }, { "epoch": 6.258503401360544, "grad_norm": 0.49104713182267146, "learning_rate": 1.3581353193027424e-06, "loss": 0.1201, "loss_nan_ranks": 0, "loss_rank_avg": 0.11616228520870209, "step": 3680, "valid_targets_mean": 4475.0, "valid_targets_min": 294 }, { "epoch": 6.267006802721088, "grad_norm": 0.6050149142306898, "learning_rate": 1.3275810450918257e-06, "loss": 0.1149, "loss_nan_ranks": 0, "loss_rank_avg": 0.11099812388420105, "step": 3685, "valid_targets_mean": 3569.8, "valid_targets_min": 1659 }, { "epoch": 6.275510204081632, "grad_norm": 0.562170069430547, "learning_rate": 1.2973625840554593e-06, "loss": 0.1125, "loss_nan_ranks": 0, "loss_rank_avg": 0.10738849639892578, "step": 3690, "valid_targets_mean": 3418.9, "valid_targets_min": 1727 }, { "epoch": 6.284013605442177, "grad_norm": 0.5017474742394269, "learning_rate": 1.2674804796560202e-06, "loss": 0.1078, "loss_nan_ranks": 0, "loss_rank_avg": 0.12143012881278992, "step": 3695, "valid_targets_mean": 4531.0, "valid_targets_min": 534 }, { "epoch": 6.292517006802721, "grad_norm": 0.5391996228968388, "learning_rate": 1.237935269306707e-06, "loss": 0.114, "loss_nan_ranks": 0, "loss_rank_avg": 0.11418686807155609, "step": 3700, "valid_targets_mean": 4400.1, "valid_targets_min": 1657 }, { "epoch": 6.301020408163265, "grad_norm": 0.5104246666127118, "learning_rate": 1.2087274843618668e-06, "loss": 0.1067, "loss_nan_ranks": 0, "loss_rank_avg": 0.09506049752235413, "step": 3705, "valid_targets_mean": 3893.9, "valid_targets_min": 1584 }, { "epoch": 6.309523809523809, "grad_norm": 0.5992141275873888, "learning_rate": 1.1798576501074233e-06, "loss": 0.1194, "loss_nan_ranks": 0, "loss_rank_avg": 0.10688906162977219, "step": 3710, "valid_targets_mean": 2873.1, "valid_targets_min": 1624 }, { "epoch": 6.318027210884353, "grad_norm": 0.6627760286529151, "learning_rate": 1.151326285751455e-06, "loss": 0.1027, "loss_nan_ranks": 0, "loss_rank_avg": 0.10680701583623886, "step": 3715, "valid_targets_mean": 3383.1, "valid_targets_min": 1469 }, { "epoch": 6.326530612244898, "grad_norm": 0.5143956921633834, "learning_rate": 1.1231339044148393e-06, "loss": 0.1114, "loss_nan_ranks": 0, "loss_rank_avg": 0.11333712935447693, "step": 3720, "valid_targets_mean": 4535.8, "valid_targets_min": 1529 }, { "epoch": 6.335034013605442, "grad_norm": 0.5751586207418208, "learning_rate": 1.095281013122036e-06, "loss": 0.1169, "loss_nan_ranks": 0, "loss_rank_avg": 0.09510093927383423, "step": 3725, "valid_targets_mean": 3208.8, "valid_targets_min": 1558 }, { "epoch": 6.343537414965986, "grad_norm": 0.9443328517820183, "learning_rate": 1.0677681127919581e-06, "loss": 0.1122, "loss_nan_ranks": 0, "loss_rank_avg": 0.12241110950708389, "step": 3730, "valid_targets_mean": 3732.4, "valid_targets_min": 1114 }, { "epoch": 6.3520408163265305, "grad_norm": 0.5456126321948206, "learning_rate": 1.04059569822897e-06, "loss": 0.1037, "loss_nan_ranks": 0, "loss_rank_avg": 0.11154021322727203, "step": 3735, "valid_targets_mean": 3789.4, "valid_targets_min": 1474 }, { "epoch": 6.360544217687075, "grad_norm": 0.6107837672044061, "learning_rate": 1.0137642581139895e-06, "loss": 0.1165, "loss_nan_ranks": 0, "loss_rank_avg": 0.11448526382446289, "step": 3740, "valid_targets_mean": 2861.9, "valid_targets_min": 1011 }, { "epoch": 6.369047619047619, "grad_norm": 0.5550637999848018, "learning_rate": 9.87274274995693e-07, "loss": 0.1166, "loss_nan_ranks": 0, "loss_rank_avg": 0.1355058252811432, "step": 3745, "valid_targets_mean": 3923.8, "valid_targets_min": 844 }, { "epoch": 6.377551020408164, "grad_norm": 0.5499184670462272, "learning_rate": 9.61126225281841e-07, "loss": 0.1265, "loss_nan_ranks": 0, "loss_rank_avg": 0.1835326850414276, "step": 3750, "valid_targets_mean": 4376.8, "valid_targets_min": 1386 }, { "epoch": 6.386054421768708, "grad_norm": 0.5598653966572599, "learning_rate": 9.353205792307163e-07, "loss": 0.1168, "loss_nan_ranks": 0, "loss_rank_avg": 0.1339794397354126, "step": 3755, "valid_targets_mean": 3800.2, "valid_targets_min": 1519 }, { "epoch": 6.394557823129252, "grad_norm": 0.6026219846226943, "learning_rate": 9.098578009426484e-07, "loss": 0.1063, "loss_nan_ranks": 0, "loss_rank_avg": 0.10622464120388031, "step": 3760, "valid_targets_mean": 3525.6, "valid_targets_min": 799 }, { "epoch": 6.403061224489796, "grad_norm": 0.5525824324094764, "learning_rate": 8.847383483516903e-07, "loss": 0.1115, "loss_nan_ranks": 0, "loss_rank_avg": 0.11089949309825897, "step": 3765, "valid_targets_mean": 3808.2, "valid_targets_min": 1801 }, { "epoch": 6.41156462585034, "grad_norm": 0.5806460615603857, "learning_rate": 8.599626732173671e-07, "loss": 0.1224, "loss_nan_ranks": 0, "loss_rank_avg": 0.11263792216777802, "step": 3770, "valid_targets_mean": 3948.2, "valid_targets_min": 1166 }, { "epoch": 6.420068027210885, "grad_norm": 0.5218407093507026, "learning_rate": 8.355312211165568e-07, "loss": 0.1148, "loss_nan_ranks": 0, "loss_rank_avg": 0.12748584151268005, "step": 3775, "valid_targets_mean": 3853.9, "valid_targets_min": 1617 }, { "epoch": 6.428571428571429, "grad_norm": 0.5270239739962835, "learning_rate": 8.11444431435473e-07, "loss": 0.1079, "loss_nan_ranks": 0, "loss_rank_avg": 0.1101468950510025, "step": 3780, "valid_targets_mean": 4074.8, "valid_targets_min": 1047 }, { "epoch": 6.437074829931973, "grad_norm": 0.5563024099626601, "learning_rate": 7.87702737361764e-07, "loss": 0.1261, "loss_nan_ranks": 0, "loss_rank_avg": 0.10898242145776749, "step": 3785, "valid_targets_mean": 3889.8, "valid_targets_min": 626 }, { "epoch": 6.445578231292517, "grad_norm": 0.46404697622035623, "learning_rate": 7.643065658767312e-07, "loss": 0.1173, "loss_nan_ranks": 0, "loss_rank_avg": 0.09871433675289154, "step": 3790, "valid_targets_mean": 4953.9, "valid_targets_min": 1568 }, { "epoch": 6.454081632653061, "grad_norm": 0.4990012456904466, "learning_rate": 7.412563377476312e-07, "loss": 0.1138, "loss_nan_ranks": 0, "loss_rank_avg": 0.11271509528160095, "step": 3795, "valid_targets_mean": 4299.8, "valid_targets_min": 1429 }, { "epoch": 6.462585034013605, "grad_norm": 0.5531901069965772, "learning_rate": 7.185524675201328e-07, "loss": 0.1159, "loss_nan_ranks": 0, "loss_rank_avg": 0.12225601822137833, "step": 3800, "valid_targets_mean": 4172.3, "valid_targets_min": 1159 }, { "epoch": 6.47108843537415, "grad_norm": 0.5402043893820961, "learning_rate": 6.961953635108409e-07, "loss": 0.1231, "loss_nan_ranks": 0, "loss_rank_avg": 0.10706687718629837, "step": 3805, "valid_targets_mean": 3612.2, "valid_targets_min": 1306 }, { "epoch": 6.479591836734694, "grad_norm": 0.5789107548087521, "learning_rate": 6.741854277999583e-07, "loss": 0.1016, "loss_nan_ranks": 0, "loss_rank_avg": 0.11366184055805206, "step": 3810, "valid_targets_mean": 3378.6, "valid_targets_min": 1354 }, { "epoch": 6.488095238095238, "grad_norm": 0.4713440181846783, "learning_rate": 6.525230562240636e-07, "loss": 0.1169, "loss_nan_ranks": 0, "loss_rank_avg": 0.10541140288114548, "step": 3815, "valid_targets_mean": 4977.9, "valid_targets_min": 1681 }, { "epoch": 6.496598639455782, "grad_norm": 0.5699975953341101, "learning_rate": 6.312086383689831e-07, "loss": 0.1139, "loss_nan_ranks": 0, "loss_rank_avg": 0.08873768895864487, "step": 3820, "valid_targets_mean": 3275.1, "valid_targets_min": 1437 }, { "epoch": 6.505102040816326, "grad_norm": 0.5571386497340849, "learning_rate": 6.10242557562788e-07, "loss": 0.1008, "loss_nan_ranks": 0, "loss_rank_avg": 0.09184282273054123, "step": 3825, "valid_targets_mean": 3166.5, "valid_targets_min": 429 }, { "epoch": 6.513605442176871, "grad_norm": 0.5624098278712437, "learning_rate": 5.896251908688966e-07, "loss": 0.0949, "loss_nan_ranks": 0, "loss_rank_avg": 0.10643933713436127, "step": 3830, "valid_targets_mean": 3651.6, "valid_targets_min": 1300 }, { "epoch": 6.522108843537415, "grad_norm": 0.63514069662102, "learning_rate": 5.693569090792972e-07, "loss": 0.1091, "loss_nan_ranks": 0, "loss_rank_avg": 0.0915570929646492, "step": 3835, "valid_targets_mean": 2957.2, "valid_targets_min": 1249 }, { "epoch": 6.530612244897959, "grad_norm": 0.5444838195618228, "learning_rate": 5.494380767078822e-07, "loss": 0.1113, "loss_nan_ranks": 0, "loss_rank_avg": 0.10774494707584381, "step": 3840, "valid_targets_mean": 3686.2, "valid_targets_min": 2165 }, { "epoch": 6.539115646258503, "grad_norm": 0.5054912271298077, "learning_rate": 5.298690519838823e-07, "loss": 0.105, "loss_nan_ranks": 0, "loss_rank_avg": 0.0980135053396225, "step": 3845, "valid_targets_mean": 3616.6, "valid_targets_min": 1167 }, { "epoch": 6.5476190476190474, "grad_norm": 0.5753976388948479, "learning_rate": 5.106501868454317e-07, "loss": 0.1032, "loss_nan_ranks": 0, "loss_rank_avg": 0.10707738250494003, "step": 3850, "valid_targets_mean": 3197.4, "valid_targets_min": 1349 }, { "epoch": 6.5561224489795915, "grad_norm": 0.5292969551823501, "learning_rate": 4.917818269332442e-07, "loss": 0.1063, "loss_nan_ranks": 0, "loss_rank_avg": 0.10826131701469421, "step": 3855, "valid_targets_mean": 4322.6, "valid_targets_min": 1402 }, { "epoch": 6.564625850340136, "grad_norm": 0.621615696636191, "learning_rate": 4.7326431158437826e-07, "loss": 0.1068, "loss_nan_ranks": 0, "loss_rank_avg": 0.10695119947195053, "step": 3860, "valid_targets_mean": 3007.0, "valid_targets_min": 1378 }, { "epoch": 6.5731292517006805, "grad_norm": 0.509107661703464, "learning_rate": 4.5509797382615517e-07, "loss": 0.1015, "loss_nan_ranks": 0, "loss_rank_avg": 0.09450152516365051, "step": 3865, "valid_targets_mean": 3882.9, "valid_targets_min": 1878 }, { "epoch": 6.581632653061225, "grad_norm": 0.5313107105149394, "learning_rate": 4.372831403701572e-07, "loss": 0.1039, "loss_nan_ranks": 0, "loss_rank_avg": 0.094798743724823, "step": 3870, "valid_targets_mean": 3878.6, "valid_targets_min": 1342 }, { "epoch": 6.590136054421769, "grad_norm": 0.4871663184954264, "learning_rate": 4.198201316063566e-07, "loss": 0.1107, "loss_nan_ranks": 0, "loss_rank_avg": 0.11148764193058014, "step": 3875, "valid_targets_mean": 4325.2, "valid_targets_min": 1662 }, { "epoch": 6.598639455782313, "grad_norm": 0.579299905341723, "learning_rate": 4.02709261597356e-07, "loss": 0.1124, "loss_nan_ranks": 0, "loss_rank_avg": 0.09807397425174713, "step": 3880, "valid_targets_mean": 3303.0, "valid_targets_min": 1271 }, { "epoch": 6.607142857142857, "grad_norm": 0.5720297842675975, "learning_rate": 3.8595083807272393e-07, "loss": 0.1261, "loss_nan_ranks": 0, "loss_rank_avg": 0.09346231073141098, "step": 3885, "valid_targets_mean": 3077.5, "valid_targets_min": 1364 }, { "epoch": 6.615646258503402, "grad_norm": 0.5158229677829215, "learning_rate": 3.695451624234836e-07, "loss": 0.1048, "loss_nan_ranks": 0, "loss_rank_avg": 0.11520027369260788, "step": 3890, "valid_targets_mean": 4364.4, "valid_targets_min": 1833 }, { "epoch": 6.624149659863946, "grad_norm": 0.5571817676018703, "learning_rate": 3.5349252969667956e-07, "loss": 0.1181, "loss_nan_ranks": 0, "loss_rank_avg": 0.11287274956703186, "step": 3895, "valid_targets_mean": 3659.2, "valid_targets_min": 1374 }, { "epoch": 6.63265306122449, "grad_norm": 0.5405013862537791, "learning_rate": 3.3779322859007536e-07, "loss": 0.1207, "loss_nan_ranks": 0, "loss_rank_avg": 0.13448761403560638, "step": 3900, "valid_targets_mean": 3958.9, "valid_targets_min": 1882 }, { "epoch": 6.641156462585034, "grad_norm": 0.5917561818550695, "learning_rate": 3.224475414469552e-07, "loss": 0.1351, "loss_nan_ranks": 0, "loss_rank_avg": 0.12737716734409332, "step": 3905, "valid_targets_mean": 4113.4, "valid_targets_min": 1245 }, { "epoch": 6.649659863945578, "grad_norm": 0.557946447045777, "learning_rate": 3.0745574425105505e-07, "loss": 0.1207, "loss_nan_ranks": 0, "loss_rank_avg": 0.10673606395721436, "step": 3910, "valid_targets_mean": 4236.9, "valid_targets_min": 1210 }, { "epoch": 6.658163265306122, "grad_norm": 0.5164919683603588, "learning_rate": 2.928181066215929e-07, "loss": 0.1101, "loss_nan_ranks": 0, "loss_rank_avg": 0.11876433342695236, "step": 3915, "valid_targets_mean": 4077.7, "valid_targets_min": 940 }, { "epoch": 6.666666666666667, "grad_norm": 0.5499308726469657, "learning_rate": 2.785348918084241e-07, "loss": 0.132, "loss_nan_ranks": 0, "loss_rank_avg": 0.1489306092262268, "step": 3920, "valid_targets_mean": 3865.4, "valid_targets_min": 1396 }, { "epoch": 6.675170068027211, "grad_norm": 0.5678142167877335, "learning_rate": 2.6460635668730027e-07, "loss": 0.1021, "loss_nan_ranks": 0, "loss_rank_avg": 0.09267286211252213, "step": 3925, "valid_targets_mean": 2827.5, "valid_targets_min": 345 }, { "epoch": 6.683673469387755, "grad_norm": 0.6608311371489237, "learning_rate": 2.5103275175526023e-07, "loss": 0.1155, "loss_nan_ranks": 0, "loss_rank_avg": 0.14703533053398132, "step": 3930, "valid_targets_mean": 3164.3, "valid_targets_min": 1164 }, { "epoch": 6.692176870748299, "grad_norm": 0.5221678778571415, "learning_rate": 2.3781432112611303e-07, "loss": 0.1097, "loss_nan_ranks": 0, "loss_rank_avg": 0.10101592540740967, "step": 3935, "valid_targets_mean": 3994.5, "valid_targets_min": 1762 }, { "epoch": 6.700680272108843, "grad_norm": 0.5651651379644324, "learning_rate": 2.2495130252605746e-07, "loss": 0.1181, "loss_nan_ranks": 0, "loss_rank_avg": 0.11423544585704803, "step": 3940, "valid_targets_mean": 4024.6, "valid_targets_min": 1439 }, { "epoch": 6.709183673469388, "grad_norm": 0.5199949463759391, "learning_rate": 2.1244392728939857e-07, "loss": 0.1187, "loss_nan_ranks": 0, "loss_rank_avg": 0.10502418875694275, "step": 3945, "valid_targets_mean": 3820.6, "valid_targets_min": 1377 }, { "epoch": 6.717687074829932, "grad_norm": 0.583526962887543, "learning_rate": 2.0029242035439768e-07, "loss": 0.1312, "loss_nan_ranks": 0, "loss_rank_avg": 0.14046607911586761, "step": 3950, "valid_targets_mean": 3444.8, "valid_targets_min": 1483 }, { "epoch": 6.726190476190476, "grad_norm": 0.5810830942373014, "learning_rate": 1.8849700025921347e-07, "loss": 0.1007, "loss_nan_ranks": 0, "loss_rank_avg": 0.10181055963039398, "step": 3955, "valid_targets_mean": 3560.2, "valid_targets_min": 1243 }, { "epoch": 6.73469387755102, "grad_norm": 0.5491006914828277, "learning_rate": 1.7705787913798734e-07, "loss": 0.1117, "loss_nan_ranks": 0, "loss_rank_avg": 0.09634849429130554, "step": 3960, "valid_targets_mean": 3517.1, "valid_targets_min": 1240 }, { "epoch": 6.743197278911564, "grad_norm": 0.511896203300437, "learning_rate": 1.659752627170086e-07, "loss": 0.1096, "loss_nan_ranks": 0, "loss_rank_avg": 0.10449256002902985, "step": 3965, "valid_targets_mean": 3527.1, "valid_targets_min": 1141 }, { "epoch": 6.7517006802721085, "grad_norm": 0.5336137499248547, "learning_rate": 1.5524935031103305e-07, "loss": 0.116, "loss_nan_ranks": 0, "loss_rank_avg": 0.12154018133878708, "step": 3970, "valid_targets_mean": 3592.3, "valid_targets_min": 1241 }, { "epoch": 6.760204081632653, "grad_norm": 0.5627708148417632, "learning_rate": 1.4488033481969478e-07, "loss": 0.1055, "loss_nan_ranks": 0, "loss_rank_avg": 0.09863865375518799, "step": 3975, "valid_targets_mean": 3483.6, "valid_targets_min": 826 }, { "epoch": 6.7687074829931975, "grad_norm": 0.5196827469634108, "learning_rate": 1.3486840272402213e-07, "loss": 0.1212, "loss_nan_ranks": 0, "loss_rank_avg": 0.10619688779115677, "step": 3980, "valid_targets_mean": 3646.9, "valid_targets_min": 1196 }, { "epoch": 6.7772108843537415, "grad_norm": 0.5718874037000535, "learning_rate": 1.252137340831072e-07, "loss": 0.1082, "loss_nan_ranks": 0, "loss_rank_avg": 0.1136164665222168, "step": 3985, "valid_targets_mean": 3522.7, "valid_targets_min": 1267 }, { "epoch": 6.785714285714286, "grad_norm": 0.5816806292415059, "learning_rate": 1.1591650253084619e-07, "loss": 0.1044, "loss_nan_ranks": 0, "loss_rank_avg": 0.11231759190559387, "step": 3990, "valid_targets_mean": 3649.8, "valid_targets_min": 1956 }, { "epoch": 6.79421768707483, "grad_norm": 0.5720471677766351, "learning_rate": 1.0697687527283062e-07, "loss": 0.1218, "loss_nan_ranks": 0, "loss_rank_avg": 0.08975514769554138, "step": 3995, "valid_targets_mean": 2904.6, "valid_targets_min": 1441 }, { "epoch": 6.802721088435375, "grad_norm": 0.5465150224292055, "learning_rate": 9.839501308333666e-08, "loss": 0.1239, "loss_nan_ranks": 0, "loss_rank_avg": 0.12105758488178253, "step": 4000, "valid_targets_mean": 3943.8, "valid_targets_min": 1551 }, { "epoch": 6.811224489795919, "grad_norm": 0.5775321617047376, "learning_rate": 9.017107030242944e-08, "loss": 0.1075, "loss_nan_ranks": 0, "loss_rank_avg": 0.10549725592136383, "step": 4005, "valid_targets_mean": 3177.4, "valid_targets_min": 870 }, { "epoch": 6.819727891156463, "grad_norm": 0.5675733876780689, "learning_rate": 8.230519483319211e-08, "loss": 0.1166, "loss_nan_ranks": 0, "loss_rank_avg": 0.10369785130023956, "step": 4010, "valid_targets_mean": 3497.2, "valid_targets_min": 1801 }, { "epoch": 6.828231292517007, "grad_norm": 0.5774913215786752, "learning_rate": 7.479752813906338e-08, "loss": 0.113, "loss_nan_ranks": 0, "loss_rank_avg": 0.12983883917331696, "step": 4015, "valid_targets_mean": 3454.6, "valid_targets_min": 724 }, { "epoch": 6.836734693877551, "grad_norm": 0.5837816943629295, "learning_rate": 6.764820524129745e-08, "loss": 0.1131, "loss_nan_ranks": 0, "loss_rank_avg": 0.11133235692977905, "step": 4020, "valid_targets_mean": 3369.7, "valid_targets_min": 1349 }, { "epoch": 6.845238095238095, "grad_norm": 0.5189943403965727, "learning_rate": 6.085735471653032e-08, "loss": 0.0981, "loss_nan_ranks": 0, "loss_rank_avg": 0.08331690728664398, "step": 4025, "valid_targets_mean": 3523.8, "valid_targets_min": 1276 }, { "epoch": 6.853741496598639, "grad_norm": 0.5419837374263143, "learning_rate": 5.442509869446833e-08, "loss": 0.101, "loss_nan_ranks": 0, "loss_rank_avg": 0.11506151407957077, "step": 4030, "valid_targets_mean": 3857.5, "valid_targets_min": 1666 }, { "epoch": 6.862244897959184, "grad_norm": 0.5684055839237468, "learning_rate": 4.835155285569659e-08, "loss": 0.1164, "loss_nan_ranks": 0, "loss_rank_avg": 0.09615157544612885, "step": 4035, "valid_targets_mean": 3268.4, "valid_targets_min": 1424 }, { "epoch": 6.870748299319728, "grad_norm": 0.5365731291138811, "learning_rate": 4.263682642959177e-08, "loss": 0.1133, "loss_nan_ranks": 0, "loss_rank_avg": 0.10993782430887222, "step": 4040, "valid_targets_mean": 3738.6, "valid_targets_min": 1367 }, { "epoch": 6.879251700680272, "grad_norm": 0.5476111470480821, "learning_rate": 3.72810221923614e-08, "loss": 0.1056, "loss_nan_ranks": 0, "loss_rank_avg": 0.09571518003940582, "step": 4045, "valid_targets_mean": 3979.3, "valid_targets_min": 1498 }, { "epoch": 6.887755102040816, "grad_norm": 0.48869823313324573, "learning_rate": 3.228423646519652e-08, "loss": 0.1055, "loss_nan_ranks": 0, "loss_rank_avg": 0.10207545012235641, "step": 4050, "valid_targets_mean": 4221.0, "valid_targets_min": 1183 }, { "epoch": 6.896258503401361, "grad_norm": 0.5769761101009117, "learning_rate": 2.764655911253744e-08, "loss": 0.1055, "loss_nan_ranks": 0, "loss_rank_avg": 0.10221989452838898, "step": 4055, "valid_targets_mean": 3082.2, "valid_targets_min": 1526 }, { "epoch": 6.904761904761905, "grad_norm": 0.5304203511947876, "learning_rate": 2.3368073540461778e-08, "loss": 0.1093, "loss_nan_ranks": 0, "loss_rank_avg": 0.10058721154928207, "step": 4060, "valid_targets_mean": 3711.4, "valid_targets_min": 1177 }, { "epoch": 6.913265306122449, "grad_norm": 0.5527928596168906, "learning_rate": 1.944885669517005e-08, "loss": 0.1197, "loss_nan_ranks": 0, "loss_rank_avg": 0.13187864422798157, "step": 4065, "valid_targets_mean": 3627.0, "valid_targets_min": 1362 }, { "epoch": 6.921768707482993, "grad_norm": 0.5876230043161286, "learning_rate": 1.5888979061624566e-08, "loss": 0.1124, "loss_nan_ranks": 0, "loss_rank_avg": 0.11860952526330948, "step": 4070, "valid_targets_mean": 2997.6, "valid_targets_min": 626 }, { "epoch": 6.930272108843537, "grad_norm": 0.5180428031623431, "learning_rate": 1.268850466226379e-08, "loss": 0.1041, "loss_nan_ranks": 0, "loss_rank_avg": 0.09902661293745041, "step": 4075, "valid_targets_mean": 3874.1, "valid_targets_min": 1468 }, { "epoch": 6.938775510204081, "grad_norm": 0.5457182235510927, "learning_rate": 9.847491055856583e-09, "loss": 0.1179, "loss_nan_ranks": 0, "loss_rank_avg": 0.11753236502408981, "step": 4080, "valid_targets_mean": 3958.4, "valid_targets_min": 1682 }, { "epoch": 6.947278911564625, "grad_norm": 0.5025326829506257, "learning_rate": 7.365989336469704e-09, "loss": 0.1135, "loss_nan_ranks": 0, "loss_rank_avg": 0.1078265979886055, "step": 4085, "valid_targets_mean": 4657.9, "valid_targets_min": 1975 }, { "epoch": 6.95578231292517, "grad_norm": 0.47189441731529835, "learning_rate": 5.244044132544091e-09, "loss": 0.1099, "loss_nan_ranks": 0, "loss_rank_avg": 0.09616608917713165, "step": 4090, "valid_targets_mean": 4282.3, "valid_targets_min": 2271 }, { "epoch": 6.964285714285714, "grad_norm": 0.5099985972571627, "learning_rate": 3.481693606095515e-09, "loss": 0.1205, "loss_nan_ranks": 0, "loss_rank_avg": 0.11529235541820526, "step": 4095, "valid_targets_mean": 4522.9, "valid_targets_min": 1137 }, { "epoch": 6.9727891156462585, "grad_norm": 0.6013770623754892, "learning_rate": 2.078969452030677e-09, "loss": 0.1054, "loss_nan_ranks": 0, "loss_rank_avg": 0.11263397336006165, "step": 4100, "valid_targets_mean": 3301.1, "valid_targets_min": 305 }, { "epoch": 6.9812925170068025, "grad_norm": 0.5717510938365082, "learning_rate": 1.0358968975676675e-09, "loss": 0.111, "loss_nan_ranks": 0, "loss_rank_avg": 0.10689924657344818, "step": 4105, "valid_targets_mean": 3414.9, "valid_targets_min": 1270 }, { "epoch": 6.989795918367347, "grad_norm": 0.4870239489699717, "learning_rate": 3.524947017941038e-10, "loss": 0.1024, "loss_nan_ranks": 0, "loss_rank_avg": 0.1097535490989685, "step": 4110, "valid_targets_mean": 5220.9, "valid_targets_min": 1480 }, { "epoch": 6.9982993197278915, "grad_norm": 0.638306218851505, "learning_rate": 2.8775155322957604e-11, "loss": 0.1074, "loss_nan_ranks": 0, "loss_rank_avg": 0.12985992431640625, "step": 4115, "valid_targets_mean": 2803.8, "valid_targets_min": 861 }, { "epoch": 7.0, "loss_nan_ranks": 0, "loss_rank_avg": 0.10281726717948914, "step": 4116, "total_flos": 1032895789924352.0, "train_loss": 0.16274532378516346, "train_runtime": 18062.791, "train_samples_per_second": 3.643, "train_steps_per_second": 0.228, "valid_targets_mean": 3705.9, "valid_targets_min": 1332 } ], "logging_steps": 5, "max_steps": 4116, "num_input_tokens_seen": 0, "num_train_epochs": 7, "save_steps": 1500, "stateful_callbacks": { "TrainerControl": { "args": { "should_epoch_stop": false, "should_evaluate": false, "should_log": false, "should_save": true, "should_training_stop": true }, "attributes": {} } }, "total_flos": 1032895789924352.0, "train_batch_size": 1, "trial_name": null, "trial_params": null }