{ "best_global_step": null, "best_metric": null, "best_model_checkpoint": null, "epoch": 7.0, "eval_steps": 500, "global_step": 3577, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.009784735812133072, "grad_norm": 7.664685937206668, "learning_rate": 4.46927374301676e-07, "loss": 0.5047, "loss_nan_ranks": 0, "loss_rank_avg": 0.40290629863739014, "step": 5, "valid_targets_mean": 3617.4, "valid_targets_min": 741 }, { "epoch": 0.019569471624266144, "grad_norm": 8.50433555316219, "learning_rate": 1.005586592178771e-06, "loss": 0.5159, "loss_nan_ranks": 0, "loss_rank_avg": 0.4588755965232849, "step": 10, "valid_targets_mean": 3822.6, "valid_targets_min": 914 }, { "epoch": 0.029354207436399216, "grad_norm": 8.480800377443527, "learning_rate": 1.564245810055866e-06, "loss": 0.5094, "loss_nan_ranks": 0, "loss_rank_avg": 0.5068870782852173, "step": 15, "valid_targets_mean": 3282.5, "valid_targets_min": 854 }, { "epoch": 0.03913894324853229, "grad_norm": 6.389055588909931, "learning_rate": 2.1229050279329612e-06, "loss": 0.4612, "loss_nan_ranks": 0, "loss_rank_avg": 0.47990190982818604, "step": 20, "valid_targets_mean": 2669.2, "valid_targets_min": 696 }, { "epoch": 0.04892367906066536, "grad_norm": 4.830165379278388, "learning_rate": 2.6815642458100562e-06, "loss": 0.4547, "loss_nan_ranks": 0, "loss_rank_avg": 0.47788089513778687, "step": 25, "valid_targets_mean": 2784.6, "valid_targets_min": 700 }, { "epoch": 0.05870841487279843, "grad_norm": 3.079180456646436, "learning_rate": 3.240223463687151e-06, "loss": 0.4163, "loss_nan_ranks": 0, "loss_rank_avg": 0.3710671663284302, "step": 30, "valid_targets_mean": 2843.2, "valid_targets_min": 658 }, { "epoch": 0.0684931506849315, "grad_norm": 2.7785737491972933, "learning_rate": 3.798882681564246e-06, "loss": 0.3624, "loss_nan_ranks": 0, "loss_rank_avg": 0.3115715980529785, "step": 35, "valid_targets_mean": 2966.5, "valid_targets_min": 324 }, { "epoch": 0.07827788649706457, "grad_norm": 1.5502383905218011, "learning_rate": 4.357541899441341e-06, "loss": 0.3232, "loss_nan_ranks": 0, "loss_rank_avg": 0.26140934228897095, "step": 40, "valid_targets_mean": 3349.2, "valid_targets_min": 606 }, { "epoch": 0.08806262230919765, "grad_norm": 1.209196728082173, "learning_rate": 4.916201117318436e-06, "loss": 0.2769, "loss_nan_ranks": 0, "loss_rank_avg": 0.2740545868873596, "step": 45, "valid_targets_mean": 2365.2, "valid_targets_min": 459 }, { "epoch": 0.09784735812133072, "grad_norm": 1.028489362532582, "learning_rate": 5.474860335195531e-06, "loss": 0.3076, "loss_nan_ranks": 0, "loss_rank_avg": 0.2979404330253601, "step": 50, "valid_targets_mean": 2470.4, "valid_targets_min": 794 }, { "epoch": 0.10763209393346379, "grad_norm": 0.9537486210298864, "learning_rate": 6.033519553072626e-06, "loss": 0.2577, "loss_nan_ranks": 0, "loss_rank_avg": 0.2909826934337616, "step": 55, "valid_targets_mean": 2224.9, "valid_targets_min": 596 }, { "epoch": 0.11741682974559686, "grad_norm": 0.8658000347460151, "learning_rate": 6.592178770949721e-06, "loss": 0.2912, "loss_nan_ranks": 0, "loss_rank_avg": 0.291208416223526, "step": 60, "valid_targets_mean": 2375.1, "valid_targets_min": 589 }, { "epoch": 0.12720156555772993, "grad_norm": 0.6647224322577404, "learning_rate": 7.150837988826816e-06, "loss": 0.2473, "loss_nan_ranks": 0, "loss_rank_avg": 0.24509967863559723, "step": 65, "valid_targets_mean": 2958.6, "valid_targets_min": 595 }, { "epoch": 0.136986301369863, "grad_norm": 0.6073269190290562, "learning_rate": 7.709497206703911e-06, "loss": 0.2292, "loss_nan_ranks": 0, "loss_rank_avg": 0.20280693471431732, "step": 70, "valid_targets_mean": 2785.6, "valid_targets_min": 535 }, { "epoch": 0.14677103718199608, "grad_norm": 0.6870346313715996, "learning_rate": 8.268156424581007e-06, "loss": 0.2335, "loss_nan_ranks": 0, "loss_rank_avg": 0.2646217346191406, "step": 75, "valid_targets_mean": 2854.3, "valid_targets_min": 589 }, { "epoch": 0.15655577299412915, "grad_norm": 0.5472437159642437, "learning_rate": 8.826815642458101e-06, "loss": 0.2065, "loss_nan_ranks": 0, "loss_rank_avg": 0.19694247841835022, "step": 80, "valid_targets_mean": 3170.3, "valid_targets_min": 534 }, { "epoch": 0.16634050880626222, "grad_norm": 0.5389183745441031, "learning_rate": 9.385474860335197e-06, "loss": 0.2116, "loss_nan_ranks": 0, "loss_rank_avg": 0.17740264534950256, "step": 85, "valid_targets_mean": 2783.5, "valid_targets_min": 527 }, { "epoch": 0.1761252446183953, "grad_norm": 0.5944677207861985, "learning_rate": 9.944134078212291e-06, "loss": 0.2087, "loss_nan_ranks": 0, "loss_rank_avg": 0.22743840515613556, "step": 90, "valid_targets_mean": 2798.4, "valid_targets_min": 524 }, { "epoch": 0.18590998043052837, "grad_norm": 0.571414117444414, "learning_rate": 1.0502793296089386e-05, "loss": 0.1932, "loss_nan_ranks": 0, "loss_rank_avg": 0.18952876329421997, "step": 95, "valid_targets_mean": 2777.1, "valid_targets_min": 737 }, { "epoch": 0.19569471624266144, "grad_norm": 0.4604883444760045, "learning_rate": 1.1061452513966481e-05, "loss": 0.1856, "loss_nan_ranks": 0, "loss_rank_avg": 0.15866714715957642, "step": 100, "valid_targets_mean": 3476.1, "valid_targets_min": 826 }, { "epoch": 0.2054794520547945, "grad_norm": 0.5755387019398245, "learning_rate": 1.1620111731843577e-05, "loss": 0.1781, "loss_nan_ranks": 0, "loss_rank_avg": 0.17682120203971863, "step": 105, "valid_targets_mean": 2597.6, "valid_targets_min": 569 }, { "epoch": 0.21526418786692758, "grad_norm": 0.6252526071380757, "learning_rate": 1.2178770949720671e-05, "loss": 0.1972, "loss_nan_ranks": 0, "loss_rank_avg": 0.1682274341583252, "step": 110, "valid_targets_mean": 2008.2, "valid_targets_min": 623 }, { "epoch": 0.22504892367906065, "grad_norm": 0.7444119586394704, "learning_rate": 1.2737430167597766e-05, "loss": 0.1906, "loss_nan_ranks": 0, "loss_rank_avg": 0.19016528129577637, "step": 115, "valid_targets_mean": 2239.0, "valid_targets_min": 554 }, { "epoch": 0.23483365949119372, "grad_norm": 0.4890590982481748, "learning_rate": 1.3296089385474861e-05, "loss": 0.1804, "loss_nan_ranks": 0, "loss_rank_avg": 0.1630125641822815, "step": 120, "valid_targets_mean": 3072.8, "valid_targets_min": 659 }, { "epoch": 0.2446183953033268, "grad_norm": 0.465912335927827, "learning_rate": 1.3854748603351957e-05, "loss": 0.1829, "loss_nan_ranks": 0, "loss_rank_avg": 0.15328490734100342, "step": 125, "valid_targets_mean": 3095.4, "valid_targets_min": 447 }, { "epoch": 0.25440313111545987, "grad_norm": 0.6891592359602547, "learning_rate": 1.4413407821229052e-05, "loss": 0.1817, "loss_nan_ranks": 0, "loss_rank_avg": 0.26953524351119995, "step": 130, "valid_targets_mean": 3000.7, "valid_targets_min": 597 }, { "epoch": 0.26418786692759294, "grad_norm": 0.6641646030161167, "learning_rate": 1.4972067039106146e-05, "loss": 0.1953, "loss_nan_ranks": 0, "loss_rank_avg": 0.21545499563217163, "step": 135, "valid_targets_mean": 2525.5, "valid_targets_min": 616 }, { "epoch": 0.273972602739726, "grad_norm": 0.5830725755570016, "learning_rate": 1.553072625698324e-05, "loss": 0.1915, "loss_nan_ranks": 0, "loss_rank_avg": 0.216715008020401, "step": 140, "valid_targets_mean": 2687.6, "valid_targets_min": 893 }, { "epoch": 0.2837573385518591, "grad_norm": 0.5767631139839036, "learning_rate": 1.6089385474860336e-05, "loss": 0.1783, "loss_nan_ranks": 0, "loss_rank_avg": 0.19670595228672028, "step": 145, "valid_targets_mean": 3301.4, "valid_targets_min": 860 }, { "epoch": 0.29354207436399216, "grad_norm": 0.49142360319674744, "learning_rate": 1.664804469273743e-05, "loss": 0.168, "loss_nan_ranks": 0, "loss_rank_avg": 0.14769160747528076, "step": 150, "valid_targets_mean": 3333.7, "valid_targets_min": 582 }, { "epoch": 0.30332681017612523, "grad_norm": 0.5716984289756593, "learning_rate": 1.7206703910614527e-05, "loss": 0.1758, "loss_nan_ranks": 0, "loss_rank_avg": 0.17623479664325714, "step": 155, "valid_targets_mean": 2626.4, "valid_targets_min": 502 }, { "epoch": 0.3131115459882583, "grad_norm": 0.5084369227675787, "learning_rate": 1.776536312849162e-05, "loss": 0.1681, "loss_nan_ranks": 0, "loss_rank_avg": 0.15722373127937317, "step": 160, "valid_targets_mean": 2934.6, "valid_targets_min": 333 }, { "epoch": 0.32289628180039137, "grad_norm": 0.5735742518385566, "learning_rate": 1.8324022346368716e-05, "loss": 0.1832, "loss_nan_ranks": 0, "loss_rank_avg": 0.23492315411567688, "step": 165, "valid_targets_mean": 3038.0, "valid_targets_min": 865 }, { "epoch": 0.33268101761252444, "grad_norm": 0.4693397977357504, "learning_rate": 1.888268156424581e-05, "loss": 0.1614, "loss_nan_ranks": 0, "loss_rank_avg": 0.15091291069984436, "step": 170, "valid_targets_mean": 3301.8, "valid_targets_min": 811 }, { "epoch": 0.3424657534246575, "grad_norm": 0.48675755956862893, "learning_rate": 1.9441340782122907e-05, "loss": 0.1772, "loss_nan_ranks": 0, "loss_rank_avg": 0.15300670266151428, "step": 175, "valid_targets_mean": 3417.9, "valid_targets_min": 715 }, { "epoch": 0.3522504892367906, "grad_norm": 0.5102150154869952, "learning_rate": 2e-05, "loss": 0.17, "loss_nan_ranks": 0, "loss_rank_avg": 0.16056200861930847, "step": 180, "valid_targets_mean": 3057.6, "valid_targets_min": 803 }, { "epoch": 0.36203522504892366, "grad_norm": 0.5515832587824223, "learning_rate": 2.0558659217877096e-05, "loss": 0.1707, "loss_nan_ranks": 0, "loss_rank_avg": 0.14652328193187714, "step": 185, "valid_targets_mean": 2680.7, "valid_targets_min": 464 }, { "epoch": 0.37181996086105673, "grad_norm": 0.5989282020525712, "learning_rate": 2.1117318435754193e-05, "loss": 0.1646, "loss_nan_ranks": 0, "loss_rank_avg": 0.18726202845573425, "step": 190, "valid_targets_mean": 2799.1, "valid_targets_min": 520 }, { "epoch": 0.3816046966731898, "grad_norm": 0.4504168777552236, "learning_rate": 2.1675977653631288e-05, "loss": 0.157, "loss_nan_ranks": 0, "loss_rank_avg": 0.12995876371860504, "step": 195, "valid_targets_mean": 3549.4, "valid_targets_min": 795 }, { "epoch": 0.3913894324853229, "grad_norm": 0.5818242440905317, "learning_rate": 2.2234636871508385e-05, "loss": 0.163, "loss_nan_ranks": 0, "loss_rank_avg": 0.17200620472431183, "step": 200, "valid_targets_mean": 2801.2, "valid_targets_min": 363 }, { "epoch": 0.40117416829745595, "grad_norm": 0.5177140652573206, "learning_rate": 2.2793296089385476e-05, "loss": 0.155, "loss_nan_ranks": 0, "loss_rank_avg": 0.1553056240081787, "step": 205, "valid_targets_mean": 3184.4, "valid_targets_min": 868 }, { "epoch": 0.410958904109589, "grad_norm": 0.490634701023724, "learning_rate": 2.335195530726257e-05, "loss": 0.1699, "loss_nan_ranks": 0, "loss_rank_avg": 0.14875340461730957, "step": 210, "valid_targets_mean": 3164.2, "valid_targets_min": 824 }, { "epoch": 0.4207436399217221, "grad_norm": 0.5871331423256096, "learning_rate": 2.3910614525139668e-05, "loss": 0.1448, "loss_nan_ranks": 0, "loss_rank_avg": 0.20259450376033783, "step": 215, "valid_targets_mean": 2785.0, "valid_targets_min": 693 }, { "epoch": 0.43052837573385516, "grad_norm": 0.5333267414306153, "learning_rate": 2.4469273743016762e-05, "loss": 0.155, "loss_nan_ranks": 0, "loss_rank_avg": 0.16707800328731537, "step": 220, "valid_targets_mean": 3486.7, "valid_targets_min": 702 }, { "epoch": 0.44031311154598823, "grad_norm": 0.45969079039542965, "learning_rate": 2.5027932960893856e-05, "loss": 0.1362, "loss_nan_ranks": 0, "loss_rank_avg": 0.14990051090717316, "step": 225, "valid_targets_mean": 3446.0, "valid_targets_min": 889 }, { "epoch": 0.4500978473581213, "grad_norm": 0.5556944949224483, "learning_rate": 2.5586592178770953e-05, "loss": 0.1595, "loss_nan_ranks": 0, "loss_rank_avg": 0.16094809770584106, "step": 230, "valid_targets_mean": 3048.9, "valid_targets_min": 729 }, { "epoch": 0.4598825831702544, "grad_norm": 0.49961250529766793, "learning_rate": 2.6145251396648048e-05, "loss": 0.1287, "loss_nan_ranks": 0, "loss_rank_avg": 0.1248483955860138, "step": 235, "valid_targets_mean": 2743.2, "valid_targets_min": 459 }, { "epoch": 0.46966731898238745, "grad_norm": 0.5630898453724997, "learning_rate": 2.6703910614525145e-05, "loss": 0.1547, "loss_nan_ranks": 0, "loss_rank_avg": 0.13761404156684875, "step": 240, "valid_targets_mean": 2726.6, "valid_targets_min": 703 }, { "epoch": 0.4794520547945205, "grad_norm": 0.4731743705256023, "learning_rate": 2.7262569832402236e-05, "loss": 0.1741, "loss_nan_ranks": 0, "loss_rank_avg": 0.13565003871917725, "step": 245, "valid_targets_mean": 3192.2, "valid_targets_min": 704 }, { "epoch": 0.4892367906066536, "grad_norm": 0.6416047138090571, "learning_rate": 2.782122905027933e-05, "loss": 0.1481, "loss_nan_ranks": 0, "loss_rank_avg": 0.1502951830625534, "step": 250, "valid_targets_mean": 2625.6, "valid_targets_min": 684 }, { "epoch": 0.49902152641878667, "grad_norm": 0.5557971187389114, "learning_rate": 2.8379888268156424e-05, "loss": 0.1565, "loss_nan_ranks": 0, "loss_rank_avg": 0.15362128615379333, "step": 255, "valid_targets_mean": 2840.2, "valid_targets_min": 693 }, { "epoch": 0.5088062622309197, "grad_norm": 0.4690894971847644, "learning_rate": 2.8938547486033522e-05, "loss": 0.1614, "loss_nan_ranks": 0, "loss_rank_avg": 0.1330149620771408, "step": 260, "valid_targets_mean": 3050.8, "valid_targets_min": 673 }, { "epoch": 0.5185909980430529, "grad_norm": 0.6025829145137604, "learning_rate": 2.9497206703910616e-05, "loss": 0.14, "loss_nan_ranks": 0, "loss_rank_avg": 0.13668930530548096, "step": 265, "valid_targets_mean": 2562.8, "valid_targets_min": 549 }, { "epoch": 0.5283757338551859, "grad_norm": 0.4779769696150171, "learning_rate": 3.0055865921787714e-05, "loss": 0.154, "loss_nan_ranks": 0, "loss_rank_avg": 0.1378680169582367, "step": 270, "valid_targets_mean": 3117.8, "valid_targets_min": 645 }, { "epoch": 0.538160469667319, "grad_norm": 0.5087206893144688, "learning_rate": 3.061452513966481e-05, "loss": 0.1431, "loss_nan_ranks": 0, "loss_rank_avg": 0.15285688638687134, "step": 275, "valid_targets_mean": 3502.2, "valid_targets_min": 773 }, { "epoch": 0.547945205479452, "grad_norm": 0.46853867062532467, "learning_rate": 3.11731843575419e-05, "loss": 0.1481, "loss_nan_ranks": 0, "loss_rank_avg": 0.13073411583900452, "step": 280, "valid_targets_mean": 3103.8, "valid_targets_min": 851 }, { "epoch": 0.5577299412915852, "grad_norm": 0.5244592262420299, "learning_rate": 3.1731843575418996e-05, "loss": 0.1604, "loss_nan_ranks": 0, "loss_rank_avg": 0.16360273957252502, "step": 285, "valid_targets_mean": 2776.2, "valid_targets_min": 563 }, { "epoch": 0.5675146771037182, "grad_norm": 0.6304714586468612, "learning_rate": 3.229050279329609e-05, "loss": 0.1718, "loss_nan_ranks": 0, "loss_rank_avg": 0.2574073374271393, "step": 290, "valid_targets_mean": 2842.6, "valid_targets_min": 531 }, { "epoch": 0.5772994129158513, "grad_norm": 0.5060780163327306, "learning_rate": 3.2849162011173184e-05, "loss": 0.1398, "loss_nan_ranks": 0, "loss_rank_avg": 0.12446580827236176, "step": 295, "valid_targets_mean": 3434.2, "valid_targets_min": 925 }, { "epoch": 0.5870841487279843, "grad_norm": 0.5645619555774959, "learning_rate": 3.340782122905028e-05, "loss": 0.1502, "loss_nan_ranks": 0, "loss_rank_avg": 0.14075535535812378, "step": 300, "valid_targets_mean": 2749.1, "valid_targets_min": 765 }, { "epoch": 0.5968688845401174, "grad_norm": 0.5019563126770876, "learning_rate": 3.396648044692738e-05, "loss": 0.1499, "loss_nan_ranks": 0, "loss_rank_avg": 0.1525002121925354, "step": 305, "valid_targets_mean": 2889.3, "valid_targets_min": 342 }, { "epoch": 0.6066536203522505, "grad_norm": 0.8633134325378282, "learning_rate": 3.4525139664804474e-05, "loss": 0.1455, "loss_nan_ranks": 0, "loss_rank_avg": 0.15216107666492462, "step": 310, "valid_targets_mean": 2542.5, "valid_targets_min": 742 }, { "epoch": 0.6164383561643836, "grad_norm": 0.518661419343394, "learning_rate": 3.508379888268157e-05, "loss": 0.1358, "loss_nan_ranks": 0, "loss_rank_avg": 0.14660073816776276, "step": 315, "valid_targets_mean": 3098.8, "valid_targets_min": 600 }, { "epoch": 0.6262230919765166, "grad_norm": 0.4288729432621478, "learning_rate": 3.564245810055866e-05, "loss": 0.1473, "loss_nan_ranks": 0, "loss_rank_avg": 0.1281621754169464, "step": 320, "valid_targets_mean": 3366.9, "valid_targets_min": 492 }, { "epoch": 0.6360078277886497, "grad_norm": 0.5245999073963563, "learning_rate": 3.6201117318435756e-05, "loss": 0.1587, "loss_nan_ranks": 0, "loss_rank_avg": 0.14279915392398834, "step": 325, "valid_targets_mean": 2867.5, "valid_targets_min": 658 }, { "epoch": 0.6457925636007827, "grad_norm": 0.5409938601242019, "learning_rate": 3.675977653631285e-05, "loss": 0.1354, "loss_nan_ranks": 0, "loss_rank_avg": 0.1241241842508316, "step": 330, "valid_targets_mean": 2814.8, "valid_targets_min": 650 }, { "epoch": 0.6555772994129159, "grad_norm": 0.5367639238304938, "learning_rate": 3.7318435754189944e-05, "loss": 0.1754, "loss_nan_ranks": 0, "loss_rank_avg": 0.13935647904872894, "step": 335, "valid_targets_mean": 2107.4, "valid_targets_min": 598 }, { "epoch": 0.6653620352250489, "grad_norm": 0.5190264673793914, "learning_rate": 3.787709497206704e-05, "loss": 0.1459, "loss_nan_ranks": 0, "loss_rank_avg": 0.13536672294139862, "step": 340, "valid_targets_mean": 3303.1, "valid_targets_min": 805 }, { "epoch": 0.675146771037182, "grad_norm": 0.4810572486523759, "learning_rate": 3.843575418994414e-05, "loss": 0.1498, "loss_nan_ranks": 0, "loss_rank_avg": 0.15841111540794373, "step": 345, "valid_targets_mean": 3270.0, "valid_targets_min": 762 }, { "epoch": 0.684931506849315, "grad_norm": 0.45491328608286835, "learning_rate": 3.8994413407821234e-05, "loss": 0.1367, "loss_nan_ranks": 0, "loss_rank_avg": 0.14639562368392944, "step": 350, "valid_targets_mean": 3250.1, "valid_targets_min": 807 }, { "epoch": 0.6947162426614482, "grad_norm": 0.4672379304521524, "learning_rate": 3.955307262569833e-05, "loss": 0.1415, "loss_nan_ranks": 0, "loss_rank_avg": 0.13699516654014587, "step": 355, "valid_targets_mean": 3220.0, "valid_targets_min": 808 }, { "epoch": 0.7045009784735812, "grad_norm": 0.587847822651443, "learning_rate": 3.99999904751585e-05, "loss": 0.1592, "loss_nan_ranks": 0, "loss_rank_avg": 0.21118012070655823, "step": 360, "valid_targets_mean": 2303.2, "valid_targets_min": 600 }, { "epoch": 0.7142857142857143, "grad_norm": 0.5160918575652919, "learning_rate": 3.999965710665851e-05, "loss": 0.151, "loss_nan_ranks": 0, "loss_rank_avg": 0.14607413113117218, "step": 365, "valid_targets_mean": 2839.4, "valid_targets_min": 494 }, { "epoch": 0.7240704500978473, "grad_norm": 0.4341683819577898, "learning_rate": 3.999884750515563e-05, "loss": 0.1314, "loss_nan_ranks": 0, "loss_rank_avg": 0.13683652877807617, "step": 370, "valid_targets_mean": 3752.6, "valid_targets_min": 550 }, { "epoch": 0.7338551859099804, "grad_norm": 0.5603714103623396, "learning_rate": 3.999756168992814e-05, "loss": 0.1446, "loss_nan_ranks": 0, "loss_rank_avg": 0.17999452352523804, "step": 375, "valid_targets_mean": 2864.7, "valid_targets_min": 482 }, { "epoch": 0.7436399217221135, "grad_norm": 0.4578337150635251, "learning_rate": 3.999579969159395e-05, "loss": 0.1469, "loss_nan_ranks": 0, "loss_rank_avg": 0.1431577503681183, "step": 380, "valid_targets_mean": 3439.2, "valid_targets_min": 852 }, { "epoch": 0.7534246575342466, "grad_norm": 0.48938549638567597, "learning_rate": 3.999356155210986e-05, "loss": 0.1527, "loss_nan_ranks": 0, "loss_rank_avg": 0.19597536325454712, "step": 385, "valid_targets_mean": 3274.6, "valid_targets_min": 553 }, { "epoch": 0.7632093933463796, "grad_norm": 0.5734981062865676, "learning_rate": 3.9990847324770584e-05, "loss": 0.1548, "loss_nan_ranks": 0, "loss_rank_avg": 0.13992062211036682, "step": 390, "valid_targets_mean": 2851.9, "valid_targets_min": 685 }, { "epoch": 0.7729941291585127, "grad_norm": 0.5219177121218723, "learning_rate": 3.998765707420746e-05, "loss": 0.1412, "loss_nan_ranks": 0, "loss_rank_avg": 0.16220493614673615, "step": 395, "valid_targets_mean": 2681.6, "valid_targets_min": 912 }, { "epoch": 0.7827788649706457, "grad_norm": 0.5117389003410739, "learning_rate": 3.998399087638692e-05, "loss": 0.1515, "loss_nan_ranks": 0, "loss_rank_avg": 0.13427501916885376, "step": 400, "valid_targets_mean": 2833.2, "valid_targets_min": 357 }, { "epoch": 0.7925636007827789, "grad_norm": 0.45630749060617215, "learning_rate": 3.997984881860869e-05, "loss": 0.1491, "loss_nan_ranks": 0, "loss_rank_avg": 0.13904061913490295, "step": 405, "valid_targets_mean": 2951.7, "valid_targets_min": 664 }, { "epoch": 0.8023483365949119, "grad_norm": 0.532441802548241, "learning_rate": 3.9975230999503674e-05, "loss": 0.1424, "loss_nan_ranks": 0, "loss_rank_avg": 0.18587175011634827, "step": 410, "valid_targets_mean": 2718.6, "valid_targets_min": 731 }, { "epoch": 0.812133072407045, "grad_norm": 0.5201313018088487, "learning_rate": 3.997013752903166e-05, "loss": 0.1526, "loss_nan_ranks": 0, "loss_rank_avg": 0.17946481704711914, "step": 415, "valid_targets_mean": 2429.7, "valid_targets_min": 602 }, { "epoch": 0.821917808219178, "grad_norm": 0.4733086498760068, "learning_rate": 3.996456852847867e-05, "loss": 0.1361, "loss_nan_ranks": 0, "loss_rank_avg": 0.15358425676822662, "step": 420, "valid_targets_mean": 3413.8, "valid_targets_min": 1009 }, { "epoch": 0.8317025440313112, "grad_norm": 0.43812773082093437, "learning_rate": 3.995852413045406e-05, "loss": 0.145, "loss_nan_ranks": 0, "loss_rank_avg": 0.13964691758155823, "step": 425, "valid_targets_mean": 3069.9, "valid_targets_min": 1049 }, { "epoch": 0.8414872798434442, "grad_norm": 0.41481899566210445, "learning_rate": 3.995200447888739e-05, "loss": 0.1284, "loss_nan_ranks": 0, "loss_rank_avg": 0.11863437294960022, "step": 430, "valid_targets_mean": 3568.8, "valid_targets_min": 821 }, { "epoch": 0.8512720156555773, "grad_norm": 0.4498805859648879, "learning_rate": 3.9945009729024984e-05, "loss": 0.1586, "loss_nan_ranks": 0, "loss_rank_avg": 0.16341759264469147, "step": 435, "valid_targets_mean": 2945.4, "valid_targets_min": 731 }, { "epoch": 0.8610567514677103, "grad_norm": 0.49895994291075085, "learning_rate": 3.993754004742625e-05, "loss": 0.137, "loss_nan_ranks": 0, "loss_rank_avg": 0.13261038064956665, "step": 440, "valid_targets_mean": 2722.4, "valid_targets_min": 766 }, { "epoch": 0.8708414872798435, "grad_norm": 0.47491888903670937, "learning_rate": 3.992959561195965e-05, "loss": 0.1501, "loss_nan_ranks": 0, "loss_rank_avg": 0.20256978273391724, "step": 445, "valid_targets_mean": 3347.3, "valid_targets_min": 837 }, { "epoch": 0.8806262230919765, "grad_norm": 0.4455913646457985, "learning_rate": 3.9921176611798577e-05, "loss": 0.133, "loss_nan_ranks": 0, "loss_rank_avg": 0.11824070662260056, "step": 450, "valid_targets_mean": 3272.7, "valid_targets_min": 1058 }, { "epoch": 0.8904109589041096, "grad_norm": 0.5687543644243216, "learning_rate": 3.9912283247416746e-05, "loss": 0.147, "loss_nan_ranks": 0, "loss_rank_avg": 0.13478372991085052, "step": 455, "valid_targets_mean": 3132.4, "valid_targets_min": 742 }, { "epoch": 0.9001956947162426, "grad_norm": 0.37827545084266456, "learning_rate": 3.990291573058345e-05, "loss": 0.1307, "loss_nan_ranks": 0, "loss_rank_avg": 0.10885334014892578, "step": 460, "valid_targets_mean": 3407.7, "valid_targets_min": 943 }, { "epoch": 0.9099804305283757, "grad_norm": 0.4175485573365561, "learning_rate": 3.989307428435858e-05, "loss": 0.1368, "loss_nan_ranks": 0, "loss_rank_avg": 0.1276848316192627, "step": 465, "valid_targets_mean": 3251.0, "valid_targets_min": 867 }, { "epoch": 0.9197651663405088, "grad_norm": 0.49808980526853586, "learning_rate": 3.9882759143087194e-05, "loss": 0.1332, "loss_nan_ranks": 0, "loss_rank_avg": 0.14108321070671082, "step": 470, "valid_targets_mean": 2904.2, "valid_targets_min": 503 }, { "epoch": 0.9295499021526419, "grad_norm": 0.40177200330690865, "learning_rate": 3.9871970552394066e-05, "loss": 0.1255, "loss_nan_ranks": 0, "loss_rank_avg": 0.13899895548820496, "step": 475, "valid_targets_mean": 3147.8, "valid_targets_min": 795 }, { "epoch": 0.9393346379647749, "grad_norm": 0.42481204661487465, "learning_rate": 3.986070876917773e-05, "loss": 0.1415, "loss_nan_ranks": 0, "loss_rank_avg": 0.16770583391189575, "step": 480, "valid_targets_mean": 3443.7, "valid_targets_min": 691 }, { "epoch": 0.949119373776908, "grad_norm": 0.5444357960985896, "learning_rate": 3.984897406160443e-05, "loss": 0.1336, "loss_nan_ranks": 0, "loss_rank_avg": 0.16325880587100983, "step": 485, "valid_targets_mean": 2540.9, "valid_targets_min": 714 }, { "epoch": 0.958904109589041, "grad_norm": 0.4632384623061562, "learning_rate": 3.9836766709101714e-05, "loss": 0.1496, "loss_nan_ranks": 0, "loss_rank_avg": 0.17608124017715454, "step": 490, "valid_targets_mean": 3103.3, "valid_targets_min": 613 }, { "epoch": 0.9686888454011742, "grad_norm": 0.4187576842004876, "learning_rate": 3.9824087002351765e-05, "loss": 0.1363, "loss_nan_ranks": 0, "loss_rank_avg": 0.1268356442451477, "step": 495, "valid_targets_mean": 3034.8, "valid_targets_min": 873 }, { "epoch": 0.9784735812133072, "grad_norm": 0.48280261413787057, "learning_rate": 3.9810935243284496e-05, "loss": 0.1292, "loss_nan_ranks": 0, "loss_rank_avg": 0.12477391213178635, "step": 500, "valid_targets_mean": 3063.3, "valid_targets_min": 738 }, { "epoch": 0.9882583170254403, "grad_norm": 0.39168001410008785, "learning_rate": 3.979731174507038e-05, "loss": 0.1275, "loss_nan_ranks": 0, "loss_rank_avg": 0.12986153364181519, "step": 505, "valid_targets_mean": 3226.4, "valid_targets_min": 559 }, { "epoch": 0.9980430528375733, "grad_norm": 0.46896658336753394, "learning_rate": 3.978321683211294e-05, "loss": 0.1441, "loss_nan_ranks": 0, "loss_rank_avg": 0.15444520115852356, "step": 510, "valid_targets_mean": 2962.0, "valid_targets_min": 669 }, { "epoch": 1.0078277886497065, "grad_norm": 0.4298181968101464, "learning_rate": 3.976865084004107e-05, "loss": 0.1363, "loss_nan_ranks": 0, "loss_rank_avg": 0.1293889433145523, "step": 515, "valid_targets_mean": 2834.4, "valid_targets_min": 516 }, { "epoch": 1.0176125244618395, "grad_norm": 0.4403428932485871, "learning_rate": 3.975361411570101e-05, "loss": 0.1335, "loss_nan_ranks": 0, "loss_rank_avg": 0.1426129937171936, "step": 520, "valid_targets_mean": 3185.1, "valid_targets_min": 559 }, { "epoch": 1.0273972602739727, "grad_norm": 0.43223418895898846, "learning_rate": 3.9738107017148145e-05, "loss": 0.1305, "loss_nan_ranks": 0, "loss_rank_avg": 0.11700769513845444, "step": 525, "valid_targets_mean": 2929.1, "valid_targets_min": 524 }, { "epoch": 1.0371819960861057, "grad_norm": 0.383816735814963, "learning_rate": 3.972212991363839e-05, "loss": 0.1397, "loss_nan_ranks": 0, "loss_rank_avg": 0.11716213077306747, "step": 530, "valid_targets_mean": 3100.0, "valid_targets_min": 195 }, { "epoch": 1.0469667318982387, "grad_norm": 0.47087470364735173, "learning_rate": 3.970568318561947e-05, "loss": 0.1447, "loss_nan_ranks": 0, "loss_rank_avg": 0.14262157678604126, "step": 535, "valid_targets_mean": 3104.8, "valid_targets_min": 559 }, { "epoch": 1.0567514677103718, "grad_norm": 0.4263249245829921, "learning_rate": 3.9688767224721834e-05, "loss": 0.127, "loss_nan_ranks": 0, "loss_rank_avg": 0.11953842639923096, "step": 540, "valid_targets_mean": 2913.2, "valid_targets_min": 629 }, { "epoch": 1.0665362035225048, "grad_norm": 0.4098653850081825, "learning_rate": 3.9671382433749335e-05, "loss": 0.1199, "loss_nan_ranks": 0, "loss_rank_avg": 0.12505799531936646, "step": 545, "valid_targets_mean": 3437.8, "valid_targets_min": 789 }, { "epoch": 1.076320939334638, "grad_norm": 0.4263174933585311, "learning_rate": 3.965352922666963e-05, "loss": 0.1324, "loss_nan_ranks": 0, "loss_rank_avg": 0.1353525072336197, "step": 550, "valid_targets_mean": 3178.6, "valid_targets_min": 916 }, { "epoch": 1.086105675146771, "grad_norm": 0.34866454920181195, "learning_rate": 3.963520802860433e-05, "loss": 0.1216, "loss_nan_ranks": 0, "loss_rank_avg": 0.11077715456485748, "step": 555, "valid_targets_mean": 3791.6, "valid_targets_min": 1366 }, { "epoch": 1.095890410958904, "grad_norm": 0.4611779341003833, "learning_rate": 3.961641927581886e-05, "loss": 0.1206, "loss_nan_ranks": 0, "loss_rank_avg": 0.1390659213066101, "step": 560, "valid_targets_mean": 3071.4, "valid_targets_min": 805 }, { "epoch": 1.1056751467710373, "grad_norm": 0.4407781207124439, "learning_rate": 3.9597163415712115e-05, "loss": 0.1252, "loss_nan_ranks": 0, "loss_rank_avg": 0.11901605874300003, "step": 565, "valid_targets_mean": 2988.6, "valid_targets_min": 531 }, { "epoch": 1.1154598825831703, "grad_norm": 0.4893014553120929, "learning_rate": 3.957744090680575e-05, "loss": 0.1323, "loss_nan_ranks": 0, "loss_rank_avg": 0.14788511395454407, "step": 570, "valid_targets_mean": 2563.8, "valid_targets_min": 801 }, { "epoch": 1.1252446183953033, "grad_norm": 0.4451966676623463, "learning_rate": 3.9557252218733306e-05, "loss": 0.1434, "loss_nan_ranks": 0, "loss_rank_avg": 0.13166627287864685, "step": 575, "valid_targets_mean": 3022.2, "valid_targets_min": 531 }, { "epoch": 1.1350293542074363, "grad_norm": 0.4128155142273592, "learning_rate": 3.9536597832228995e-05, "loss": 0.1213, "loss_nan_ranks": 0, "loss_rank_avg": 0.13153548538684845, "step": 580, "valid_targets_mean": 3557.9, "valid_targets_min": 856 }, { "epoch": 1.1448140900195694, "grad_norm": 0.52173362133626, "learning_rate": 3.951547823911628e-05, "loss": 0.1324, "loss_nan_ranks": 0, "loss_rank_avg": 0.14766138792037964, "step": 585, "valid_targets_mean": 2381.2, "valid_targets_min": 490 }, { "epoch": 1.1545988258317026, "grad_norm": 0.43298593648168354, "learning_rate": 3.9493893942296146e-05, "loss": 0.1309, "loss_nan_ranks": 0, "loss_rank_avg": 0.12547074258327484, "step": 590, "valid_targets_mean": 3065.9, "valid_targets_min": 748 }, { "epoch": 1.1643835616438356, "grad_norm": 0.5197412292961334, "learning_rate": 3.947184545573513e-05, "loss": 0.1295, "loss_nan_ranks": 0, "loss_rank_avg": 0.12710896134376526, "step": 595, "valid_targets_mean": 2627.9, "valid_targets_min": 492 }, { "epoch": 1.1741682974559686, "grad_norm": 0.4474540656691777, "learning_rate": 3.944933330445307e-05, "loss": 0.1241, "loss_nan_ranks": 0, "loss_rank_avg": 0.12056642025709152, "step": 600, "valid_targets_mean": 2639.8, "valid_targets_min": 663 }, { "epoch": 1.1839530332681019, "grad_norm": 0.40153254889780027, "learning_rate": 3.942635802451064e-05, "loss": 0.1047, "loss_nan_ranks": 0, "loss_rank_avg": 0.104750856757164, "step": 605, "valid_targets_mean": 3113.3, "valid_targets_min": 518 }, { "epoch": 1.1937377690802349, "grad_norm": 0.41024686531210736, "learning_rate": 3.940292016299654e-05, "loss": 0.1432, "loss_nan_ranks": 0, "loss_rank_avg": 0.13328008353710175, "step": 610, "valid_targets_mean": 2628.1, "valid_targets_min": 602 }, { "epoch": 1.203522504892368, "grad_norm": 0.4610646996665633, "learning_rate": 3.93790202780145e-05, "loss": 0.1403, "loss_nan_ranks": 0, "loss_rank_avg": 0.13698866963386536, "step": 615, "valid_targets_mean": 2848.0, "valid_targets_min": 577 }, { "epoch": 1.213307240704501, "grad_norm": 0.38926695397791977, "learning_rate": 3.935465893866998e-05, "loss": 0.1207, "loss_nan_ranks": 0, "loss_rank_avg": 0.10700084269046783, "step": 620, "valid_targets_mean": 3378.0, "valid_targets_min": 681 }, { "epoch": 1.223091976516634, "grad_norm": 0.45388226915219076, "learning_rate": 3.932983672505661e-05, "loss": 0.1223, "loss_nan_ranks": 0, "loss_rank_avg": 0.12499846518039703, "step": 625, "valid_targets_mean": 2968.1, "valid_targets_min": 472 }, { "epoch": 1.2328767123287672, "grad_norm": 0.5155794540649574, "learning_rate": 3.9304554228242396e-05, "loss": 0.1477, "loss_nan_ranks": 0, "loss_rank_avg": 0.16853684186935425, "step": 630, "valid_targets_mean": 2686.6, "valid_targets_min": 613 }, { "epoch": 1.2426614481409002, "grad_norm": 0.4305098652867405, "learning_rate": 3.927881205025562e-05, "loss": 0.1172, "loss_nan_ranks": 0, "loss_rank_avg": 0.1281091570854187, "step": 635, "valid_targets_mean": 2797.1, "valid_targets_min": 689 }, { "epoch": 1.2524461839530332, "grad_norm": 0.3947701639870653, "learning_rate": 3.9252610804070526e-05, "loss": 0.1124, "loss_nan_ranks": 0, "loss_rank_avg": 0.11794069409370422, "step": 640, "valid_targets_mean": 3482.6, "valid_targets_min": 554 }, { "epoch": 1.2622309197651664, "grad_norm": 0.5334016538211457, "learning_rate": 3.9225951113592735e-05, "loss": 0.1316, "loss_nan_ranks": 0, "loss_rank_avg": 0.147422656416893, "step": 645, "valid_targets_mean": 2707.8, "valid_targets_min": 493 }, { "epoch": 1.2720156555772995, "grad_norm": 0.5165896986431493, "learning_rate": 3.9198833613644333e-05, "loss": 0.1227, "loss_nan_ranks": 0, "loss_rank_avg": 0.12175339460372925, "step": 650, "valid_targets_mean": 2479.2, "valid_targets_min": 583 }, { "epoch": 1.2818003913894325, "grad_norm": 0.40502772636845047, "learning_rate": 3.9171258949948827e-05, "loss": 0.1334, "loss_nan_ranks": 0, "loss_rank_avg": 0.11957898736000061, "step": 655, "valid_targets_mean": 3226.8, "valid_targets_min": 891 }, { "epoch": 1.2915851272015655, "grad_norm": 0.48197554939891096, "learning_rate": 3.914322777911571e-05, "loss": 0.1144, "loss_nan_ranks": 0, "loss_rank_avg": 0.112558513879776, "step": 660, "valid_targets_mean": 2785.1, "valid_targets_min": 710 }, { "epoch": 1.3013698630136985, "grad_norm": 0.4295467516080876, "learning_rate": 3.911474076862487e-05, "loss": 0.1263, "loss_nan_ranks": 0, "loss_rank_avg": 0.14773568511009216, "step": 665, "valid_targets_mean": 2864.2, "valid_targets_min": 795 }, { "epoch": 1.3111545988258317, "grad_norm": 0.4615813117659187, "learning_rate": 3.908579859681065e-05, "loss": 0.1185, "loss_nan_ranks": 0, "loss_rank_avg": 0.12034747749567032, "step": 670, "valid_targets_mean": 2775.5, "valid_targets_min": 726 }, { "epoch": 1.3209393346379648, "grad_norm": 0.5034226535478493, "learning_rate": 3.905640195284574e-05, "loss": 0.1457, "loss_nan_ranks": 0, "loss_rank_avg": 0.16286320984363556, "step": 675, "valid_targets_mean": 2521.2, "valid_targets_min": 766 }, { "epoch": 1.3307240704500978, "grad_norm": 0.42231990338171094, "learning_rate": 3.9026551536724754e-05, "loss": 0.1251, "loss_nan_ranks": 0, "loss_rank_avg": 0.13433174788951874, "step": 680, "valid_targets_mean": 3121.4, "valid_targets_min": 721 }, { "epoch": 1.340508806262231, "grad_norm": 0.4038708539406575, "learning_rate": 3.899624805924753e-05, "loss": 0.1289, "loss_nan_ranks": 0, "loss_rank_avg": 0.1403772532939911, "step": 685, "valid_targets_mean": 3254.3, "valid_targets_min": 647 }, { "epoch": 1.350293542074364, "grad_norm": 0.4299434106098187, "learning_rate": 3.896549224200225e-05, "loss": 0.1255, "loss_nan_ranks": 0, "loss_rank_avg": 0.12135376781225204, "step": 690, "valid_targets_mean": 2571.9, "valid_targets_min": 618 }, { "epoch": 1.360078277886497, "grad_norm": 0.4306682083734945, "learning_rate": 3.8934284817348224e-05, "loss": 0.1364, "loss_nan_ranks": 0, "loss_rank_avg": 0.10059612989425659, "step": 695, "valid_targets_mean": 3323.1, "valid_targets_min": 811 }, { "epoch": 1.36986301369863, "grad_norm": 0.5108627017777738, "learning_rate": 3.890262652839847e-05, "loss": 0.1308, "loss_nan_ranks": 0, "loss_rank_avg": 0.14139822125434875, "step": 700, "valid_targets_mean": 3045.6, "valid_targets_min": 633 }, { "epoch": 1.379647749510763, "grad_norm": 0.43419713202620003, "learning_rate": 3.887051812900203e-05, "loss": 0.129, "loss_nan_ranks": 0, "loss_rank_avg": 0.15847548842430115, "step": 705, "valid_targets_mean": 2795.1, "valid_targets_min": 803 }, { "epoch": 1.3894324853228963, "grad_norm": 0.40330836063363107, "learning_rate": 3.883796038372596e-05, "loss": 0.122, "loss_nan_ranks": 0, "loss_rank_avg": 0.1492297649383545, "step": 710, "valid_targets_mean": 3402.1, "valid_targets_min": 636 }, { "epoch": 1.3992172211350293, "grad_norm": 0.4967106304379057, "learning_rate": 3.8804954067837215e-05, "loss": 0.1297, "loss_nan_ranks": 0, "loss_rank_avg": 0.14624662697315216, "step": 715, "valid_targets_mean": 3127.6, "valid_targets_min": 1054 }, { "epoch": 1.4090019569471623, "grad_norm": 0.4217697643614769, "learning_rate": 3.87714999672841e-05, "loss": 0.118, "loss_nan_ranks": 0, "loss_rank_avg": 0.13098879158496857, "step": 720, "valid_targets_mean": 2735.1, "valid_targets_min": 678 }, { "epoch": 1.4187866927592956, "grad_norm": 0.3863038902644223, "learning_rate": 3.873759887867762e-05, "loss": 0.1335, "loss_nan_ranks": 0, "loss_rank_avg": 0.1081153154373169, "step": 725, "valid_targets_mean": 2962.9, "valid_targets_min": 333 }, { "epoch": 1.4285714285714286, "grad_norm": 0.4366298043459826, "learning_rate": 3.8703251609272464e-05, "loss": 0.122, "loss_nan_ranks": 0, "loss_rank_avg": 0.12468526512384415, "step": 730, "valid_targets_mean": 2868.8, "valid_targets_min": 623 }, { "epoch": 1.4383561643835616, "grad_norm": 0.5389918919734983, "learning_rate": 3.8668458976947834e-05, "loss": 0.1295, "loss_nan_ranks": 0, "loss_rank_avg": 0.12536370754241943, "step": 735, "valid_targets_mean": 2728.8, "valid_targets_min": 730 }, { "epoch": 1.4481409001956946, "grad_norm": 0.4209283462484907, "learning_rate": 3.8633221810187914e-05, "loss": 0.1116, "loss_nan_ranks": 0, "loss_rank_avg": 0.14346784353256226, "step": 740, "valid_targets_mean": 2871.4, "valid_targets_min": 523 }, { "epoch": 1.4579256360078277, "grad_norm": 0.3944143889984141, "learning_rate": 3.859754094806217e-05, "loss": 0.1232, "loss_nan_ranks": 0, "loss_rank_avg": 0.11453887820243835, "step": 745, "valid_targets_mean": 3111.7, "valid_targets_min": 779 }, { "epoch": 1.467710371819961, "grad_norm": 0.4509652697403836, "learning_rate": 3.856141724020539e-05, "loss": 0.1282, "loss_nan_ranks": 0, "loss_rank_avg": 0.11700256168842316, "step": 750, "valid_targets_mean": 2824.9, "valid_targets_min": 535 }, { "epoch": 1.477495107632094, "grad_norm": 0.4838886367870153, "learning_rate": 3.85248515467974e-05, "loss": 0.1381, "loss_nan_ranks": 0, "loss_rank_avg": 0.13873013854026794, "step": 755, "valid_targets_mean": 2238.0, "valid_targets_min": 526 }, { "epoch": 1.487279843444227, "grad_norm": 0.5509873326146855, "learning_rate": 3.848784473854264e-05, "loss": 0.1238, "loss_nan_ranks": 0, "loss_rank_avg": 0.14058071374893188, "step": 760, "valid_targets_mean": 2273.0, "valid_targets_min": 634 }, { "epoch": 1.4970645792563602, "grad_norm": 0.39915637445399327, "learning_rate": 3.8450397696649375e-05, "loss": 0.118, "loss_nan_ranks": 0, "loss_rank_avg": 0.0962296724319458, "step": 765, "valid_targets_mean": 2820.8, "valid_targets_min": 799 }, { "epoch": 1.5068493150684932, "grad_norm": 0.4256620360833589, "learning_rate": 3.841251131280877e-05, "loss": 0.1366, "loss_nan_ranks": 0, "loss_rank_avg": 0.13869571685791016, "step": 770, "valid_targets_mean": 2889.6, "valid_targets_min": 572 }, { "epoch": 1.5166340508806262, "grad_norm": 0.4738644474376625, "learning_rate": 3.8374186489173586e-05, "loss": 0.1314, "loss_nan_ranks": 0, "loss_rank_avg": 0.15252867341041565, "step": 775, "valid_targets_mean": 2849.9, "valid_targets_min": 568 }, { "epoch": 1.5264187866927594, "grad_norm": 0.4586682660406289, "learning_rate": 3.833542413833678e-05, "loss": 0.1143, "loss_nan_ranks": 0, "loss_rank_avg": 0.11463161557912827, "step": 780, "valid_targets_mean": 2530.9, "valid_targets_min": 578 }, { "epoch": 1.5362035225048922, "grad_norm": 0.5624104088370981, "learning_rate": 3.8296225183309717e-05, "loss": 0.1188, "loss_nan_ranks": 0, "loss_rank_avg": 0.13047656416893005, "step": 785, "valid_targets_mean": 2341.8, "valid_targets_min": 676 }, { "epoch": 1.5459882583170255, "grad_norm": 0.4198461156087575, "learning_rate": 3.825659055750019e-05, "loss": 0.1191, "loss_nan_ranks": 0, "loss_rank_avg": 0.13537245988845825, "step": 790, "valid_targets_mean": 3042.0, "valid_targets_min": 727 }, { "epoch": 1.5557729941291585, "grad_norm": 0.36831522550408496, "learning_rate": 3.821652120469023e-05, "loss": 0.1264, "loss_nan_ranks": 0, "loss_rank_avg": 0.12275904417037964, "step": 795, "valid_targets_mean": 3540.9, "valid_targets_min": 1425 }, { "epoch": 1.5655577299412915, "grad_norm": 0.5195803523592514, "learning_rate": 3.81760180790136e-05, "loss": 0.1237, "loss_nan_ranks": 0, "loss_rank_avg": 0.17436471581459045, "step": 800, "valid_targets_mean": 2270.1, "valid_targets_min": 497 }, { "epoch": 1.5753424657534247, "grad_norm": 0.3900604756464933, "learning_rate": 3.81350821449331e-05, "loss": 0.1238, "loss_nan_ranks": 0, "loss_rank_avg": 0.12121501564979553, "step": 805, "valid_targets_mean": 3190.0, "valid_targets_min": 634 }, { "epoch": 1.5851272015655578, "grad_norm": 0.40674054952886596, "learning_rate": 3.809371437721758e-05, "loss": 0.117, "loss_nan_ranks": 0, "loss_rank_avg": 0.129991352558136, "step": 810, "valid_targets_mean": 3047.8, "valid_targets_min": 882 }, { "epoch": 1.5949119373776908, "grad_norm": 0.46210844804033524, "learning_rate": 3.805191576091874e-05, "loss": 0.1273, "loss_nan_ranks": 0, "loss_rank_avg": 0.1609773337841034, "step": 815, "valid_targets_mean": 2791.4, "valid_targets_min": 726 }, { "epoch": 1.604696673189824, "grad_norm": 0.44015961841612017, "learning_rate": 3.800968729134767e-05, "loss": 0.1228, "loss_nan_ranks": 0, "loss_rank_avg": 0.11716459691524506, "step": 820, "valid_targets_mean": 2432.6, "valid_targets_min": 503 }, { "epoch": 1.6144814090019568, "grad_norm": 0.3674024934355759, "learning_rate": 3.7967029974051166e-05, "loss": 0.1266, "loss_nan_ranks": 0, "loss_rank_avg": 0.12538853287696838, "step": 825, "valid_targets_mean": 3603.0, "valid_targets_min": 2751 }, { "epoch": 1.62426614481409, "grad_norm": 0.445318152082194, "learning_rate": 3.7923944824787746e-05, "loss": 0.1335, "loss_nan_ranks": 0, "loss_rank_avg": 0.12994927167892456, "step": 830, "valid_targets_mean": 2598.8, "valid_targets_min": 623 }, { "epoch": 1.634050880626223, "grad_norm": 0.3890277594921652, "learning_rate": 3.78804328695035e-05, "loss": 0.1178, "loss_nan_ranks": 0, "loss_rank_avg": 0.1315343677997589, "step": 835, "valid_targets_mean": 3161.4, "valid_targets_min": 960 }, { "epoch": 1.643835616438356, "grad_norm": 0.389914488948936, "learning_rate": 3.7836495144307644e-05, "loss": 0.1307, "loss_nan_ranks": 0, "loss_rank_avg": 0.12948748469352722, "step": 840, "valid_targets_mean": 3036.4, "valid_targets_min": 677 }, { "epoch": 1.6536203522504893, "grad_norm": 0.40333039661437403, "learning_rate": 3.779213269544788e-05, "loss": 0.1352, "loss_nan_ranks": 0, "loss_rank_avg": 0.1190645694732666, "step": 845, "valid_targets_mean": 2843.1, "valid_targets_min": 950 }, { "epoch": 1.6634050880626223, "grad_norm": 0.3781685193021049, "learning_rate": 3.77473465792854e-05, "loss": 0.1069, "loss_nan_ranks": 0, "loss_rank_avg": 0.10028046369552612, "step": 850, "valid_targets_mean": 3250.7, "valid_targets_min": 786 }, { "epoch": 1.6731898238747553, "grad_norm": 0.4260461202222236, "learning_rate": 3.770213786226984e-05, "loss": 0.1195, "loss_nan_ranks": 0, "loss_rank_avg": 0.11517356336116791, "step": 855, "valid_targets_mean": 2516.8, "valid_targets_min": 647 }, { "epoch": 1.6829745596868886, "grad_norm": 0.43990271393461494, "learning_rate": 3.7656507620913796e-05, "loss": 0.1273, "loss_nan_ranks": 0, "loss_rank_avg": 0.14541923999786377, "step": 860, "valid_targets_mean": 2481.6, "valid_targets_min": 652 }, { "epoch": 1.6927592954990214, "grad_norm": 0.44787305256684223, "learning_rate": 3.761045694176725e-05, "loss": 0.1234, "loss_nan_ranks": 0, "loss_rank_avg": 0.1405627429485321, "step": 865, "valid_targets_mean": 2722.5, "valid_targets_min": 837 }, { "epoch": 1.7025440313111546, "grad_norm": 0.4117925127419459, "learning_rate": 3.756398692139165e-05, "loss": 0.1183, "loss_nan_ranks": 0, "loss_rank_avg": 0.1328292191028595, "step": 870, "valid_targets_mean": 3010.8, "valid_targets_min": 333 }, { "epoch": 1.7123287671232876, "grad_norm": 0.35516745903521674, "learning_rate": 3.751709866633384e-05, "loss": 0.1163, "loss_nan_ranks": 0, "loss_rank_avg": 0.11084195226430893, "step": 875, "valid_targets_mean": 3389.6, "valid_targets_min": 758 }, { "epoch": 1.7221135029354206, "grad_norm": 0.38527383980094254, "learning_rate": 3.74697932930997e-05, "loss": 0.135, "loss_nan_ranks": 0, "loss_rank_avg": 0.11033222079277039, "step": 880, "valid_targets_mean": 2953.3, "valid_targets_min": 826 }, { "epoch": 1.7318982387475539, "grad_norm": 0.3706588060490617, "learning_rate": 3.742207192812752e-05, "loss": 0.1379, "loss_nan_ranks": 0, "loss_rank_avg": 0.14947205781936646, "step": 885, "valid_targets_mean": 3483.3, "valid_targets_min": 1061 }, { "epoch": 1.741682974559687, "grad_norm": 0.42813076779856735, "learning_rate": 3.737393570776124e-05, "loss": 0.1388, "loss_nan_ranks": 0, "loss_rank_avg": 0.16240671277046204, "step": 890, "valid_targets_mean": 3113.2, "valid_targets_min": 761 }, { "epoch": 1.75146771037182, "grad_norm": 0.4217288729608291, "learning_rate": 3.732538577822335e-05, "loss": 0.1189, "loss_nan_ranks": 0, "loss_rank_avg": 0.12056794762611389, "step": 895, "valid_targets_mean": 2541.4, "valid_targets_min": 575 }, { "epoch": 1.7612524461839532, "grad_norm": 0.4173165892277017, "learning_rate": 3.7276423295587614e-05, "loss": 0.1337, "loss_nan_ranks": 0, "loss_rank_avg": 0.11108045279979706, "step": 900, "valid_targets_mean": 3487.0, "valid_targets_min": 744 }, { "epoch": 1.771037181996086, "grad_norm": 0.42994312549627534, "learning_rate": 3.722704942575151e-05, "loss": 0.1102, "loss_nan_ranks": 0, "loss_rank_avg": 0.12259448319673538, "step": 905, "valid_targets_mean": 2648.9, "valid_targets_min": 720 }, { "epoch": 1.7808219178082192, "grad_norm": 0.3880527350360599, "learning_rate": 3.717726534440853e-05, "loss": 0.1223, "loss_nan_ranks": 0, "loss_rank_avg": 0.13088837265968323, "step": 910, "valid_targets_mean": 3324.6, "valid_targets_min": 566 }, { "epoch": 1.7906066536203522, "grad_norm": 0.4434184187700376, "learning_rate": 3.71270722370201e-05, "loss": 0.1373, "loss_nan_ranks": 0, "loss_rank_avg": 0.1504274606704712, "step": 915, "valid_targets_mean": 3018.6, "valid_targets_min": 1146 }, { "epoch": 1.8003913894324852, "grad_norm": 0.4292410117909898, "learning_rate": 3.7076471298787454e-05, "loss": 0.1182, "loss_nan_ranks": 0, "loss_rank_avg": 0.12650364637374878, "step": 920, "valid_targets_mean": 2849.6, "valid_targets_min": 635 }, { "epoch": 1.8101761252446185, "grad_norm": 0.4620328865073727, "learning_rate": 3.702546373462307e-05, "loss": 0.1197, "loss_nan_ranks": 0, "loss_rank_avg": 0.14168865978717804, "step": 925, "valid_targets_mean": 2532.8, "valid_targets_min": 458 }, { "epoch": 1.8199608610567515, "grad_norm": 0.39121311292947436, "learning_rate": 3.697405075912204e-05, "loss": 0.1198, "loss_nan_ranks": 0, "loss_rank_avg": 0.1334732323884964, "step": 930, "valid_targets_mean": 2946.3, "valid_targets_min": 763 }, { "epoch": 1.8297455968688845, "grad_norm": 0.4231935245395829, "learning_rate": 3.692223359653316e-05, "loss": 0.1258, "loss_nan_ranks": 0, "loss_rank_avg": 0.12490694969892502, "step": 935, "valid_targets_mean": 2961.6, "valid_targets_min": 875 }, { "epoch": 1.8395303326810177, "grad_norm": 0.3836018694964112, "learning_rate": 3.6870013480729714e-05, "loss": 0.1224, "loss_nan_ranks": 0, "loss_rank_avg": 0.1226375624537468, "step": 940, "valid_targets_mean": 3168.6, "valid_targets_min": 818 }, { "epoch": 1.8493150684931505, "grad_norm": 0.3817306405122374, "learning_rate": 3.681739165518015e-05, "loss": 0.1263, "loss_nan_ranks": 0, "loss_rank_avg": 0.11338752508163452, "step": 945, "valid_targets_mean": 3203.5, "valid_targets_min": 829 }, { "epoch": 1.8590998043052838, "grad_norm": 0.36451803335347466, "learning_rate": 3.676436937291845e-05, "loss": 0.119, "loss_nan_ranks": 0, "loss_rank_avg": 0.10180258750915527, "step": 950, "valid_targets_mean": 3313.1, "valid_targets_min": 540 }, { "epoch": 1.8688845401174168, "grad_norm": 0.4176609159216137, "learning_rate": 3.671094789651431e-05, "loss": 0.1355, "loss_nan_ranks": 0, "loss_rank_avg": 0.13892988860607147, "step": 955, "valid_targets_mean": 2564.2, "valid_targets_min": 622 }, { "epoch": 1.8786692759295498, "grad_norm": 0.34566771786799344, "learning_rate": 3.665712849804303e-05, "loss": 0.1217, "loss_nan_ranks": 0, "loss_rank_avg": 0.10103757679462433, "step": 960, "valid_targets_mean": 2706.9, "valid_targets_min": 545 }, { "epoch": 1.888454011741683, "grad_norm": 0.3774548068273026, "learning_rate": 3.660291245905527e-05, "loss": 0.1148, "loss_nan_ranks": 0, "loss_rank_avg": 0.11747957766056061, "step": 965, "valid_targets_mean": 3305.8, "valid_targets_min": 917 }, { "epoch": 1.898238747553816, "grad_norm": 0.3120169544499443, "learning_rate": 3.654830107054653e-05, "loss": 0.1177, "loss_nan_ranks": 0, "loss_rank_avg": 0.09748544543981552, "step": 970, "valid_targets_mean": 3459.0, "valid_targets_min": 673 }, { "epoch": 1.908023483365949, "grad_norm": 0.33933572630751907, "learning_rate": 3.649329563292636e-05, "loss": 0.1075, "loss_nan_ranks": 0, "loss_rank_avg": 0.09858500957489014, "step": 975, "valid_targets_mean": 3246.3, "valid_targets_min": 675 }, { "epoch": 1.9178082191780823, "grad_norm": 0.40603295725781186, "learning_rate": 3.643789745598747e-05, "loss": 0.1142, "loss_nan_ranks": 0, "loss_rank_avg": 0.1274852752685547, "step": 980, "valid_targets_mean": 2795.3, "valid_targets_min": 682 }, { "epoch": 1.927592954990215, "grad_norm": 0.4191871755564024, "learning_rate": 3.6382107858874486e-05, "loss": 0.126, "loss_nan_ranks": 0, "loss_rank_avg": 0.10585680603981018, "step": 985, "valid_targets_mean": 3008.0, "valid_targets_min": 523 }, { "epoch": 1.9373776908023483, "grad_norm": 0.3377742800232099, "learning_rate": 3.6325928170052544e-05, "loss": 0.1336, "loss_nan_ranks": 0, "loss_rank_avg": 0.12053216248750687, "step": 990, "valid_targets_mean": 3640.9, "valid_targets_min": 579 }, { "epoch": 1.9471624266144814, "grad_norm": 0.36466290074318763, "learning_rate": 3.626935972727568e-05, "loss": 0.1107, "loss_nan_ranks": 0, "loss_rank_avg": 0.1167193278670311, "step": 995, "valid_targets_mean": 3513.2, "valid_targets_min": 387 }, { "epoch": 1.9569471624266144, "grad_norm": 0.40372660130343563, "learning_rate": 3.621240387755494e-05, "loss": 0.1149, "loss_nan_ranks": 0, "loss_rank_avg": 0.11789439618587494, "step": 1000, "valid_targets_mean": 2972.4, "valid_targets_min": 912 }, { "epoch": 1.9667318982387476, "grad_norm": 0.42797189481651093, "learning_rate": 3.615506197712637e-05, "loss": 0.1204, "loss_nan_ranks": 0, "loss_rank_avg": 0.1452379822731018, "step": 1005, "valid_targets_mean": 2670.8, "valid_targets_min": 536 }, { "epoch": 1.9765166340508806, "grad_norm": 0.35936118436803327, "learning_rate": 3.6097335391418634e-05, "loss": 0.1203, "loss_nan_ranks": 0, "loss_rank_avg": 0.10821876674890518, "step": 1010, "valid_targets_mean": 3538.1, "valid_targets_min": 736 }, { "epoch": 1.9863013698630136, "grad_norm": 0.4019939735333693, "learning_rate": 3.603922549502056e-05, "loss": 0.1236, "loss_nan_ranks": 0, "loss_rank_avg": 0.122370645403862, "step": 1015, "valid_targets_mean": 2999.8, "valid_targets_min": 688 }, { "epoch": 1.9960861056751469, "grad_norm": 0.4079341056255008, "learning_rate": 3.59807336716484e-05, "loss": 0.1288, "loss_nan_ranks": 0, "loss_rank_avg": 0.13142286241054535, "step": 1020, "valid_targets_mean": 2939.8, "valid_targets_min": 723 }, { "epoch": 2.0058708414872797, "grad_norm": 0.37927102783719413, "learning_rate": 3.592186131411288e-05, "loss": 0.1179, "loss_nan_ranks": 0, "loss_rank_avg": 0.1184164509177208, "step": 1025, "valid_targets_mean": 3151.8, "valid_targets_min": 549 }, { "epoch": 2.015655577299413, "grad_norm": 0.35567280100676857, "learning_rate": 3.5862609824285995e-05, "loss": 0.11, "loss_nan_ranks": 0, "loss_rank_avg": 0.09433744847774506, "step": 1030, "valid_targets_mean": 3086.3, "valid_targets_min": 689 }, { "epoch": 2.025440313111546, "grad_norm": 0.3202690936990612, "learning_rate": 3.580298061306769e-05, "loss": 0.108, "loss_nan_ranks": 0, "loss_rank_avg": 0.08629706501960754, "step": 1035, "valid_targets_mean": 3638.2, "valid_targets_min": 1517 }, { "epoch": 2.035225048923679, "grad_norm": 0.41815661879008403, "learning_rate": 3.574297510035222e-05, "loss": 0.1104, "loss_nan_ranks": 0, "loss_rank_avg": 0.13752664625644684, "step": 1040, "valid_targets_mean": 2789.5, "valid_targets_min": 712 }, { "epoch": 2.045009784735812, "grad_norm": 0.4285897024481416, "learning_rate": 3.568259471499437e-05, "loss": 0.1166, "loss_nan_ranks": 0, "loss_rank_avg": 0.12494560331106186, "step": 1045, "valid_targets_mean": 2809.8, "valid_targets_min": 542 }, { "epoch": 2.0547945205479454, "grad_norm": 0.42321458686631774, "learning_rate": 3.562184089477539e-05, "loss": 0.1203, "loss_nan_ranks": 0, "loss_rank_avg": 0.11364944279193878, "step": 1050, "valid_targets_mean": 3062.5, "valid_targets_min": 702 }, { "epoch": 2.064579256360078, "grad_norm": 0.39688700303262975, "learning_rate": 3.556071508636879e-05, "loss": 0.1132, "loss_nan_ranks": 0, "loss_rank_avg": 0.10698528587818146, "step": 1055, "valid_targets_mean": 3079.9, "valid_targets_min": 612 }, { "epoch": 2.0743639921722115, "grad_norm": 0.4363705848578071, "learning_rate": 3.5499218745305906e-05, "loss": 0.1163, "loss_nan_ranks": 0, "loss_rank_avg": 0.11804713308811188, "step": 1060, "valid_targets_mean": 2758.2, "valid_targets_min": 650 }, { "epoch": 2.0841487279843443, "grad_norm": 0.33761894592833736, "learning_rate": 3.5437353335941194e-05, "loss": 0.0965, "loss_nan_ranks": 0, "loss_rank_avg": 0.08259192854166031, "step": 1065, "valid_targets_mean": 3166.1, "valid_targets_min": 727 }, { "epoch": 2.0939334637964775, "grad_norm": 0.393251902764125, "learning_rate": 3.537512033141739e-05, "loss": 0.1014, "loss_nan_ranks": 0, "loss_rank_avg": 0.10607272386550903, "step": 1070, "valid_targets_mean": 3049.6, "valid_targets_min": 635 }, { "epoch": 2.1037181996086107, "grad_norm": 0.39166697829631236, "learning_rate": 3.531252121363044e-05, "loss": 0.0938, "loss_nan_ranks": 0, "loss_rank_avg": 0.10185883939266205, "step": 1075, "valid_targets_mean": 2846.7, "valid_targets_min": 577 }, { "epoch": 2.1135029354207435, "grad_norm": 0.5046667169575071, "learning_rate": 3.524955747319419e-05, "loss": 0.1168, "loss_nan_ranks": 0, "loss_rank_avg": 0.11997954547405243, "step": 1080, "valid_targets_mean": 2414.1, "valid_targets_min": 734 }, { "epoch": 2.1232876712328768, "grad_norm": 0.40188627311027003, "learning_rate": 3.5186230609404895e-05, "loss": 0.1091, "loss_nan_ranks": 0, "loss_rank_avg": 0.10753701627254486, "step": 1085, "valid_targets_mean": 3123.8, "valid_targets_min": 933 }, { "epoch": 2.1330724070450096, "grad_norm": 0.42426388964255, "learning_rate": 3.512254213020554e-05, "loss": 0.1073, "loss_nan_ranks": 0, "loss_rank_avg": 0.10298150777816772, "step": 1090, "valid_targets_mean": 3043.2, "valid_targets_min": 350 }, { "epoch": 2.142857142857143, "grad_norm": 0.4492568368515402, "learning_rate": 3.5058493552149917e-05, "loss": 0.1236, "loss_nan_ranks": 0, "loss_rank_avg": 0.13410577178001404, "step": 1095, "valid_targets_mean": 3618.4, "valid_targets_min": 863 }, { "epoch": 2.152641878669276, "grad_norm": 0.417502185720637, "learning_rate": 3.499408640036649e-05, "loss": 0.1194, "loss_nan_ranks": 0, "loss_rank_avg": 0.12203118950128555, "step": 1100, "valid_targets_mean": 3457.2, "valid_targets_min": 329 }, { "epoch": 2.162426614481409, "grad_norm": 0.4353056795928977, "learning_rate": 3.492932220852214e-05, "loss": 0.1222, "loss_nan_ranks": 0, "loss_rank_avg": 0.10841433703899384, "step": 1105, "valid_targets_mean": 2355.2, "valid_targets_min": 605 }, { "epoch": 2.172211350293542, "grad_norm": 0.41782255813374414, "learning_rate": 3.486420251878557e-05, "loss": 0.117, "loss_nan_ranks": 0, "loss_rank_avg": 0.10531320422887802, "step": 1110, "valid_targets_mean": 2684.2, "valid_targets_min": 605 }, { "epoch": 2.1819960861056753, "grad_norm": 0.32549855933739147, "learning_rate": 3.4798728881790645e-05, "loss": 0.1139, "loss_nan_ranks": 0, "loss_rank_avg": 0.11060058325529099, "step": 1115, "valid_targets_mean": 3967.6, "valid_targets_min": 647 }, { "epoch": 2.191780821917808, "grad_norm": 0.41464471586125, "learning_rate": 3.4732902856599425e-05, "loss": 0.113, "loss_nan_ranks": 0, "loss_rank_avg": 0.11559237539768219, "step": 1120, "valid_targets_mean": 2882.2, "valid_targets_min": 609 }, { "epoch": 2.2015655577299413, "grad_norm": 0.42718370156925883, "learning_rate": 3.466672601066506e-05, "loss": 0.1091, "loss_nan_ranks": 0, "loss_rank_avg": 0.12083616107702255, "step": 1125, "valid_targets_mean": 2868.4, "valid_targets_min": 876 }, { "epoch": 2.2113502935420746, "grad_norm": 0.4615524479310674, "learning_rate": 3.460019991979448e-05, "loss": 0.1145, "loss_nan_ranks": 0, "loss_rank_avg": 0.12627968192100525, "step": 1130, "valid_targets_mean": 2956.2, "valid_targets_min": 693 }, { "epoch": 2.2211350293542074, "grad_norm": 0.3793457912875511, "learning_rate": 3.453332616811084e-05, "loss": 0.1103, "loss_nan_ranks": 0, "loss_rank_avg": 0.09939718246459961, "step": 1135, "valid_targets_mean": 3136.5, "valid_targets_min": 554 }, { "epoch": 2.2309197651663406, "grad_norm": 0.3594596351840816, "learning_rate": 3.446610634801583e-05, "loss": 0.108, "loss_nan_ranks": 0, "loss_rank_avg": 0.09593316167593002, "step": 1140, "valid_targets_mean": 3030.4, "valid_targets_min": 474 }, { "epoch": 2.2407045009784734, "grad_norm": 0.4171021162376825, "learning_rate": 3.439854206015172e-05, "loss": 0.1103, "loss_nan_ranks": 0, "loss_rank_avg": 0.1409609317779541, "step": 1145, "valid_targets_mean": 2861.6, "valid_targets_min": 743 }, { "epoch": 2.2504892367906066, "grad_norm": 0.38835562412908814, "learning_rate": 3.4330634913363283e-05, "loss": 0.1112, "loss_nan_ranks": 0, "loss_rank_avg": 0.13764947652816772, "step": 1150, "valid_targets_mean": 3205.4, "valid_targets_min": 1001 }, { "epoch": 2.26027397260274, "grad_norm": 0.33531554597240587, "learning_rate": 3.426238652465945e-05, "loss": 0.1212, "loss_nan_ranks": 0, "loss_rank_avg": 0.10017026215791702, "step": 1155, "valid_targets_mean": 3359.6, "valid_targets_min": 662 }, { "epoch": 2.2700587084148727, "grad_norm": 0.40441508691761036, "learning_rate": 3.4193798519174865e-05, "loss": 0.1094, "loss_nan_ranks": 0, "loss_rank_avg": 0.10481183230876923, "step": 1160, "valid_targets_mean": 2804.2, "valid_targets_min": 512 }, { "epoch": 2.279843444227006, "grad_norm": 0.3538663740998075, "learning_rate": 3.41248725301311e-05, "loss": 0.1102, "loss_nan_ranks": 0, "loss_rank_avg": 0.09048883616924286, "step": 1165, "valid_targets_mean": 3445.9, "valid_targets_min": 635 }, { "epoch": 2.2896281800391387, "grad_norm": 0.3712507430976939, "learning_rate": 3.405561019879784e-05, "loss": 0.1276, "loss_nan_ranks": 0, "loss_rank_avg": 0.09899841248989105, "step": 1170, "valid_targets_mean": 3065.1, "valid_targets_min": 623 }, { "epoch": 2.299412915851272, "grad_norm": 0.3637032799817131, "learning_rate": 3.398601317445375e-05, "loss": 0.1018, "loss_nan_ranks": 0, "loss_rank_avg": 0.08682147413492203, "step": 1175, "valid_targets_mean": 2818.9, "valid_targets_min": 745 }, { "epoch": 2.309197651663405, "grad_norm": 0.3549849338540409, "learning_rate": 3.391608311434726e-05, "loss": 0.1074, "loss_nan_ranks": 0, "loss_rank_avg": 0.11768273264169693, "step": 1180, "valid_targets_mean": 2909.6, "valid_targets_min": 839 }, { "epoch": 2.318982387475538, "grad_norm": 0.4136254318220814, "learning_rate": 3.384582168365703e-05, "loss": 0.1199, "loss_nan_ranks": 0, "loss_rank_avg": 0.13258326053619385, "step": 1185, "valid_targets_mean": 2655.4, "valid_targets_min": 323 }, { "epoch": 2.328767123287671, "grad_norm": 0.4216592344674509, "learning_rate": 3.377523055545235e-05, "loss": 0.1024, "loss_nan_ranks": 0, "loss_rank_avg": 0.10435128957033157, "step": 1190, "valid_targets_mean": 3124.4, "valid_targets_min": 550 }, { "epoch": 2.3385518590998045, "grad_norm": 0.3909841531161173, "learning_rate": 3.370431141065329e-05, "loss": 0.1158, "loss_nan_ranks": 0, "loss_rank_avg": 0.11007117480039597, "step": 1195, "valid_targets_mean": 2939.0, "valid_targets_min": 627 }, { "epoch": 2.3483365949119372, "grad_norm": 0.37065177231009755, "learning_rate": 3.363306593799066e-05, "loss": 0.1044, "loss_nan_ranks": 0, "loss_rank_avg": 0.08931955695152283, "step": 1200, "valid_targets_mean": 2879.9, "valid_targets_min": 720 }, { "epoch": 2.3581213307240705, "grad_norm": 0.4199158543373936, "learning_rate": 3.3561495833965824e-05, "loss": 0.1034, "loss_nan_ranks": 0, "loss_rank_avg": 0.09923933446407318, "step": 1205, "valid_targets_mean": 2743.2, "valid_targets_min": 523 }, { "epoch": 2.3679060665362037, "grad_norm": 0.3746622479896516, "learning_rate": 3.3489602802810276e-05, "loss": 0.1054, "loss_nan_ranks": 0, "loss_rank_avg": 0.10282056033611298, "step": 1210, "valid_targets_mean": 2939.0, "valid_targets_min": 609 }, { "epoch": 2.3776908023483365, "grad_norm": 0.4513364760083478, "learning_rate": 3.3417388556445084e-05, "loss": 0.1156, "loss_nan_ranks": 0, "loss_rank_avg": 0.1419263631105423, "step": 1215, "valid_targets_mean": 2800.4, "valid_targets_min": 730 }, { "epoch": 2.3874755381604698, "grad_norm": 0.40657555459747047, "learning_rate": 3.3344854814440076e-05, "loss": 0.1218, "loss_nan_ranks": 0, "loss_rank_avg": 0.09741845726966858, "step": 1220, "valid_targets_mean": 3114.3, "valid_targets_min": 758 }, { "epoch": 2.3972602739726026, "grad_norm": 0.37832023349019445, "learning_rate": 3.327200330397297e-05, "loss": 0.1112, "loss_nan_ranks": 0, "loss_rank_avg": 0.08784421533346176, "step": 1225, "valid_targets_mean": 2816.4, "valid_targets_min": 690 }, { "epoch": 2.407045009784736, "grad_norm": 0.41506010334022525, "learning_rate": 3.319883575978818e-05, "loss": 0.106, "loss_nan_ranks": 0, "loss_rank_avg": 0.10869326442480087, "step": 1230, "valid_targets_mean": 2765.4, "valid_targets_min": 766 }, { "epoch": 2.416829745596869, "grad_norm": 0.4792475285631822, "learning_rate": 3.312535392415554e-05, "loss": 0.1082, "loss_nan_ranks": 0, "loss_rank_avg": 0.11564777046442032, "step": 1235, "valid_targets_mean": 2251.7, "valid_targets_min": 625 }, { "epoch": 2.426614481409002, "grad_norm": 0.39428259324977244, "learning_rate": 3.305155954682881e-05, "loss": 0.1188, "loss_nan_ranks": 0, "loss_rank_avg": 0.09808069467544556, "step": 1240, "valid_targets_mean": 3245.1, "valid_targets_min": 637 }, { "epoch": 2.436399217221135, "grad_norm": 0.4195848772997183, "learning_rate": 3.297745438500402e-05, "loss": 0.1153, "loss_nan_ranks": 0, "loss_rank_avg": 0.11323357373476028, "step": 1245, "valid_targets_mean": 2847.3, "valid_targets_min": 690 }, { "epoch": 2.446183953033268, "grad_norm": 0.42741752250777426, "learning_rate": 3.290304020327761e-05, "loss": 0.1042, "loss_nan_ranks": 0, "loss_rank_avg": 0.10795131325721741, "step": 1250, "valid_targets_mean": 2699.6, "valid_targets_min": 507 }, { "epoch": 2.455968688845401, "grad_norm": 0.40882254202245477, "learning_rate": 3.282831877360441e-05, "loss": 0.1166, "loss_nan_ranks": 0, "loss_rank_avg": 0.10642804205417633, "step": 1255, "valid_targets_mean": 2908.2, "valid_targets_min": 657 }, { "epoch": 2.4657534246575343, "grad_norm": 0.35084753480045056, "learning_rate": 3.275329187525547e-05, "loss": 0.1109, "loss_nan_ranks": 0, "loss_rank_avg": 0.10106814652681351, "step": 1260, "valid_targets_mean": 3006.5, "valid_targets_min": 513 }, { "epoch": 2.475538160469667, "grad_norm": 0.36699970096352375, "learning_rate": 3.2677961294775686e-05, "loss": 0.1061, "loss_nan_ranks": 0, "loss_rank_avg": 0.09151563793420792, "step": 1265, "valid_targets_mean": 2794.2, "valid_targets_min": 488 }, { "epoch": 2.4853228962818004, "grad_norm": 0.3556386173650718, "learning_rate": 3.2602328825941225e-05, "loss": 0.1155, "loss_nan_ranks": 0, "loss_rank_avg": 0.10737474262714386, "step": 1270, "valid_targets_mean": 3092.9, "valid_targets_min": 673 }, { "epoch": 2.4951076320939336, "grad_norm": 0.3751799706125244, "learning_rate": 3.2526396269716856e-05, "loss": 0.1125, "loss_nan_ranks": 0, "loss_rank_avg": 0.10193692892789841, "step": 1275, "valid_targets_mean": 3543.3, "valid_targets_min": 653 }, { "epoch": 2.5048923679060664, "grad_norm": 0.38573758460528124, "learning_rate": 3.245016543421305e-05, "loss": 0.1042, "loss_nan_ranks": 0, "loss_rank_avg": 0.09200307726860046, "step": 1280, "valid_targets_mean": 2936.6, "valid_targets_min": 560 }, { "epoch": 2.5146771037181996, "grad_norm": 0.42837841993074, "learning_rate": 3.23736381346429e-05, "loss": 0.1024, "loss_nan_ranks": 0, "loss_rank_avg": 0.10868542641401291, "step": 1285, "valid_targets_mean": 2723.4, "valid_targets_min": 605 }, { "epoch": 2.524461839530333, "grad_norm": 0.4050058503579518, "learning_rate": 3.229681619327894e-05, "loss": 0.1089, "loss_nan_ranks": 0, "loss_rank_avg": 0.14006638526916504, "step": 1290, "valid_targets_mean": 3020.4, "valid_targets_min": 564 }, { "epoch": 2.5342465753424657, "grad_norm": 0.4201197105368221, "learning_rate": 3.221970143940973e-05, "loss": 0.1068, "loss_nan_ranks": 0, "loss_rank_avg": 0.10334217548370361, "step": 1295, "valid_targets_mean": 2442.4, "valid_targets_min": 806 }, { "epoch": 2.544031311154599, "grad_norm": 0.41541097510697117, "learning_rate": 3.2142295709296274e-05, "loss": 0.1216, "loss_nan_ranks": 0, "loss_rank_avg": 0.14761820435523987, "step": 1300, "valid_targets_mean": 3183.7, "valid_targets_min": 536 }, { "epoch": 2.553816046966732, "grad_norm": 0.45131929268936527, "learning_rate": 3.206460084612835e-05, "loss": 0.1153, "loss_nan_ranks": 0, "loss_rank_avg": 0.12431158125400543, "step": 1305, "valid_targets_mean": 2544.8, "valid_targets_min": 589 }, { "epoch": 2.563600782778865, "grad_norm": 0.39494238913307517, "learning_rate": 3.1986618699980586e-05, "loss": 0.1021, "loss_nan_ranks": 0, "loss_rank_avg": 0.09494001418352127, "step": 1310, "valid_targets_mean": 2799.4, "valid_targets_min": 518 }, { "epoch": 2.573385518590998, "grad_norm": 0.32517864786117584, "learning_rate": 3.1908351127768374e-05, "loss": 0.1027, "loss_nan_ranks": 0, "loss_rank_avg": 0.07930716872215271, "step": 1315, "valid_targets_mean": 3285.2, "valid_targets_min": 669 }, { "epoch": 2.583170254403131, "grad_norm": 0.4330795967908774, "learning_rate": 3.182979999320373e-05, "loss": 0.1125, "loss_nan_ranks": 0, "loss_rank_avg": 0.11279530823230743, "step": 1320, "valid_targets_mean": 3316.5, "valid_targets_min": 567 }, { "epoch": 2.592954990215264, "grad_norm": 0.3903225044565865, "learning_rate": 3.175096716675087e-05, "loss": 0.1169, "loss_nan_ranks": 0, "loss_rank_avg": 0.14655640721321106, "step": 1325, "valid_targets_mean": 3319.7, "valid_targets_min": 826 }, { "epoch": 2.602739726027397, "grad_norm": 0.3349866071473293, "learning_rate": 3.1671854525581625e-05, "loss": 0.1127, "loss_nan_ranks": 0, "loss_rank_avg": 0.08214075118303299, "step": 1330, "valid_targets_mean": 3446.7, "valid_targets_min": 981 }, { "epoch": 2.6125244618395302, "grad_norm": 0.4197218725607564, "learning_rate": 3.159246395353086e-05, "loss": 0.1064, "loss_nan_ranks": 0, "loss_rank_avg": 0.110893614590168, "step": 1335, "valid_targets_mean": 2602.2, "valid_targets_min": 680 }, { "epoch": 2.6223091976516635, "grad_norm": 0.39357060094694973, "learning_rate": 3.151279734105151e-05, "loss": 0.0993, "loss_nan_ranks": 0, "loss_rank_avg": 0.11349768191576004, "step": 1340, "valid_targets_mean": 2960.3, "valid_targets_min": 647 }, { "epoch": 2.6320939334637963, "grad_norm": 0.3694651983894364, "learning_rate": 3.1432856585169576e-05, "loss": 0.1012, "loss_nan_ranks": 0, "loss_rank_avg": 0.11032050102949142, "step": 1345, "valid_targets_mean": 3003.5, "valid_targets_min": 574 }, { "epoch": 2.6418786692759295, "grad_norm": 0.3480652593011676, "learning_rate": 3.135264358943903e-05, "loss": 0.1096, "loss_nan_ranks": 0, "loss_rank_avg": 0.11561337858438492, "step": 1350, "valid_targets_mean": 3375.7, "valid_targets_min": 535 }, { "epoch": 2.6516634050880628, "grad_norm": 0.42225286123376454, "learning_rate": 3.127216026389641e-05, "loss": 0.107, "loss_nan_ranks": 0, "loss_rank_avg": 0.11898268759250641, "step": 1355, "valid_targets_mean": 2994.9, "valid_targets_min": 585 }, { "epoch": 2.6614481409001955, "grad_norm": 0.3668356779097436, "learning_rate": 3.1191408525015344e-05, "loss": 0.1091, "loss_nan_ranks": 0, "loss_rank_avg": 0.09555927664041519, "step": 1360, "valid_targets_mean": 2917.9, "valid_targets_min": 703 }, { "epoch": 2.671232876712329, "grad_norm": 0.4792096383507245, "learning_rate": 3.1110390295660976e-05, "loss": 0.117, "loss_nan_ranks": 0, "loss_rank_avg": 0.1280497908592224, "step": 1365, "valid_targets_mean": 2813.3, "valid_targets_min": 885 }, { "epoch": 2.681017612524462, "grad_norm": 0.4861908230527638, "learning_rate": 3.10291075050441e-05, "loss": 0.1117, "loss_nan_ranks": 0, "loss_rank_avg": 0.15495100617408752, "step": 1370, "valid_targets_mean": 2758.3, "valid_targets_min": 502 }, { "epoch": 2.690802348336595, "grad_norm": 0.3450995082913833, "learning_rate": 3.094756208867528e-05, "loss": 0.0983, "loss_nan_ranks": 0, "loss_rank_avg": 0.08989180624485016, "step": 1375, "valid_targets_mean": 3410.1, "valid_targets_min": 685 }, { "epoch": 2.700587084148728, "grad_norm": 0.4008397494171553, "learning_rate": 3.086575598831873e-05, "loss": 0.1127, "loss_nan_ranks": 0, "loss_rank_avg": 0.10978572070598602, "step": 1380, "valid_targets_mean": 2615.2, "valid_targets_min": 719 }, { "epoch": 2.7103718199608613, "grad_norm": 0.3503551086666885, "learning_rate": 3.078369115194609e-05, "loss": 0.1055, "loss_nan_ranks": 0, "loss_rank_avg": 0.0917101576924324, "step": 1385, "valid_targets_mean": 3238.8, "valid_targets_min": 788 }, { "epoch": 2.720156555772994, "grad_norm": 0.3879357205588297, "learning_rate": 3.0701369533690035e-05, "loss": 0.0958, "loss_nan_ranks": 0, "loss_rank_avg": 0.09571725130081177, "step": 1390, "valid_targets_mean": 2725.3, "valid_targets_min": 446 }, { "epoch": 2.7299412915851273, "grad_norm": 0.33036722394947055, "learning_rate": 3.061879309379774e-05, "loss": 0.1062, "loss_nan_ranks": 0, "loss_rank_avg": 0.10175631940364838, "step": 1395, "valid_targets_mean": 3565.9, "valid_targets_min": 333 }, { "epoch": 2.73972602739726, "grad_norm": 0.35924320904735907, "learning_rate": 3.053596379858422e-05, "loss": 0.1178, "loss_nan_ranks": 0, "loss_rank_avg": 0.10558217763900757, "step": 1400, "valid_targets_mean": 2973.7, "valid_targets_min": 776 }, { "epoch": 2.7495107632093934, "grad_norm": 0.3803671568191816, "learning_rate": 3.045288362038549e-05, "loss": 0.103, "loss_nan_ranks": 0, "loss_rank_avg": 0.10167603194713593, "step": 1405, "valid_targets_mean": 2803.1, "valid_targets_min": 555 }, { "epoch": 2.759295499021526, "grad_norm": 0.3653145793525553, "learning_rate": 3.0369554537511607e-05, "loss": 0.1024, "loss_nan_ranks": 0, "loss_rank_avg": 0.1083512157201767, "step": 1410, "valid_targets_mean": 3030.9, "valid_targets_min": 906 }, { "epoch": 2.7690802348336594, "grad_norm": 0.3190701118141104, "learning_rate": 3.028597853419955e-05, "loss": 0.1065, "loss_nan_ranks": 0, "loss_rank_avg": 0.09129766374826431, "step": 1415, "valid_targets_mean": 3725.6, "valid_targets_min": 1512 }, { "epoch": 2.7788649706457926, "grad_norm": 0.3889832014166842, "learning_rate": 3.0202157600565997e-05, "loss": 0.1037, "loss_nan_ranks": 0, "loss_rank_avg": 0.1031104102730751, "step": 1420, "valid_targets_mean": 2825.6, "valid_targets_min": 520 }, { "epoch": 2.7886497064579254, "grad_norm": 0.37801201319116307, "learning_rate": 3.0118093732559914e-05, "loss": 0.1018, "loss_nan_ranks": 0, "loss_rank_avg": 0.1037970706820488, "step": 1425, "valid_targets_mean": 2680.2, "valid_targets_min": 726 }, { "epoch": 2.7984344422700587, "grad_norm": 0.3817751239677767, "learning_rate": 3.0033788931915028e-05, "loss": 0.1095, "loss_nan_ranks": 0, "loss_rank_avg": 0.10228165984153748, "step": 1430, "valid_targets_mean": 2815.8, "valid_targets_min": 1005 }, { "epoch": 2.808219178082192, "grad_norm": 0.379648144825907, "learning_rate": 2.9949245206102185e-05, "loss": 0.1231, "loss_nan_ranks": 0, "loss_rank_avg": 0.10076449811458588, "step": 1435, "valid_targets_mean": 3059.8, "valid_targets_min": 960 }, { "epoch": 2.8180039138943247, "grad_norm": 0.4402766625587281, "learning_rate": 2.986446456828151e-05, "loss": 0.1181, "loss_nan_ranks": 0, "loss_rank_avg": 0.11402945220470428, "step": 1440, "valid_targets_mean": 2989.2, "valid_targets_min": 797 }, { "epoch": 2.827788649706458, "grad_norm": 0.37883497798659016, "learning_rate": 2.977944903725451e-05, "loss": 0.1045, "loss_nan_ranks": 0, "loss_rank_avg": 0.09855394065380096, "step": 1445, "valid_targets_mean": 2883.6, "valid_targets_min": 566 }, { "epoch": 2.837573385518591, "grad_norm": 0.36148811298502337, "learning_rate": 2.9694200637415967e-05, "loss": 0.1158, "loss_nan_ranks": 0, "loss_rank_avg": 0.09221038967370987, "step": 1450, "valid_targets_mean": 2968.4, "valid_targets_min": 357 }, { "epoch": 2.847358121330724, "grad_norm": 0.3566538664567121, "learning_rate": 2.9608721398705768e-05, "loss": 0.1028, "loss_nan_ranks": 0, "loss_rank_avg": 0.08568309247493744, "step": 1455, "valid_targets_mean": 3442.5, "valid_targets_min": 920 }, { "epoch": 2.857142857142857, "grad_norm": 0.37633017266925395, "learning_rate": 2.952301335656053e-05, "loss": 0.1122, "loss_nan_ranks": 0, "loss_rank_avg": 0.09396082907915115, "step": 1460, "valid_targets_mean": 2965.3, "valid_targets_min": 536 }, { "epoch": 2.8669275929549904, "grad_norm": 0.35848214949952517, "learning_rate": 2.943707855186515e-05, "loss": 0.1089, "loss_nan_ranks": 0, "loss_rank_avg": 0.08908859640359879, "step": 1465, "valid_targets_mean": 3153.4, "valid_targets_min": 540 }, { "epoch": 2.8767123287671232, "grad_norm": 0.3822152685430384, "learning_rate": 2.9350919030904227e-05, "loss": 0.1186, "loss_nan_ranks": 0, "loss_rank_avg": 0.14029645919799805, "step": 1470, "valid_targets_mean": 3109.6, "valid_targets_min": 852 }, { "epoch": 2.8864970645792565, "grad_norm": 0.3413018378399703, "learning_rate": 2.926453684531329e-05, "loss": 0.0974, "loss_nan_ranks": 0, "loss_rank_avg": 0.08753784000873566, "step": 1475, "valid_targets_mean": 3042.3, "valid_targets_min": 820 }, { "epoch": 2.8962818003913893, "grad_norm": 0.4631072227207729, "learning_rate": 2.917793405203001e-05, "loss": 0.1037, "loss_nan_ranks": 0, "loss_rank_avg": 0.12335332483053207, "step": 1480, "valid_targets_mean": 2351.6, "valid_targets_min": 700 }, { "epoch": 2.9060665362035225, "grad_norm": 0.41434492251896626, "learning_rate": 2.9091112713245136e-05, "loss": 0.1054, "loss_nan_ranks": 0, "loss_rank_avg": 0.12784239649772644, "step": 1485, "valid_targets_mean": 2976.8, "valid_targets_min": 540 }, { "epoch": 2.9158512720156553, "grad_norm": 0.4359166147369341, "learning_rate": 2.9004074896353468e-05, "loss": 0.1106, "loss_nan_ranks": 0, "loss_rank_avg": 0.15002021193504333, "step": 1490, "valid_targets_mean": 2503.5, "valid_targets_min": 840 }, { "epoch": 2.9256360078277885, "grad_norm": 0.3997076491880868, "learning_rate": 2.8916822673904584e-05, "loss": 0.1035, "loss_nan_ranks": 0, "loss_rank_avg": 0.11894476413726807, "step": 1495, "valid_targets_mean": 3113.6, "valid_targets_min": 654 }, { "epoch": 2.935420743639922, "grad_norm": 0.4175582010143018, "learning_rate": 2.882935812355349e-05, "loss": 0.1205, "loss_nan_ranks": 0, "loss_rank_avg": 0.17195875942707062, "step": 1500, "valid_targets_mean": 2791.0, "valid_targets_min": 492 }, { "epoch": 2.9452054794520546, "grad_norm": 0.3307412019430931, "learning_rate": 2.8741683328011184e-05, "loss": 0.102, "loss_nan_ranks": 0, "loss_rank_avg": 0.09898516535758972, "step": 1505, "valid_targets_mean": 3485.9, "valid_targets_min": 1008 }, { "epoch": 2.954990215264188, "grad_norm": 0.3459910596152458, "learning_rate": 2.8653800374995008e-05, "loss": 0.0963, "loss_nan_ranks": 0, "loss_rank_avg": 0.09195069968700409, "step": 1510, "valid_targets_mean": 2914.2, "valid_targets_min": 817 }, { "epoch": 2.964774951076321, "grad_norm": 0.35273324567641856, "learning_rate": 2.8565711357178964e-05, "loss": 0.0977, "loss_nan_ranks": 0, "loss_rank_avg": 0.08810217678546906, "step": 1515, "valid_targets_mean": 3367.4, "valid_targets_min": 848 }, { "epoch": 2.974559686888454, "grad_norm": 0.36045123569179105, "learning_rate": 2.8477418372143897e-05, "loss": 0.1007, "loss_nan_ranks": 0, "loss_rank_avg": 0.10645238310098648, "step": 1520, "valid_targets_mean": 3010.5, "valid_targets_min": 834 }, { "epoch": 2.984344422700587, "grad_norm": 0.36580872832620526, "learning_rate": 2.838892352232752e-05, "loss": 0.1126, "loss_nan_ranks": 0, "loss_rank_avg": 0.09797756373882294, "step": 1525, "valid_targets_mean": 3353.2, "valid_targets_min": 799 }, { "epoch": 2.9941291585127203, "grad_norm": 0.3909700612235282, "learning_rate": 2.8300228914974365e-05, "loss": 0.1079, "loss_nan_ranks": 0, "loss_rank_avg": 0.097335085272789, "step": 1530, "valid_targets_mean": 2301.2, "valid_targets_min": 387 }, { "epoch": 3.003913894324853, "grad_norm": 0.39960294073850516, "learning_rate": 2.82113366620856e-05, "loss": 0.1194, "loss_nan_ranks": 0, "loss_rank_avg": 0.098995640873909, "step": 1535, "valid_targets_mean": 2721.5, "valid_targets_min": 751 }, { "epoch": 3.0136986301369864, "grad_norm": 0.4780867112307395, "learning_rate": 2.812224888036875e-05, "loss": 0.1031, "loss_nan_ranks": 0, "loss_rank_avg": 0.13829249143600464, "step": 1540, "valid_targets_mean": 2505.8, "valid_targets_min": 549 }, { "epoch": 3.0234833659491196, "grad_norm": 0.3986599206779102, "learning_rate": 2.8032967691187258e-05, "loss": 0.1106, "loss_nan_ranks": 0, "loss_rank_avg": 0.10849355161190033, "step": 1545, "valid_targets_mean": 3316.6, "valid_targets_min": 1185 }, { "epoch": 3.0332681017612524, "grad_norm": 0.4161663796512601, "learning_rate": 2.794349522051003e-05, "loss": 0.0901, "loss_nan_ranks": 0, "loss_rank_avg": 0.09069333970546722, "step": 1550, "valid_targets_mean": 2789.6, "valid_targets_min": 840 }, { "epoch": 3.0430528375733856, "grad_norm": 0.4410690914740329, "learning_rate": 2.785383359886075e-05, "loss": 0.0989, "loss_nan_ranks": 0, "loss_rank_avg": 0.09545639902353287, "step": 1555, "valid_targets_mean": 2650.6, "valid_targets_min": 574 }, { "epoch": 3.0528375733855184, "grad_norm": 0.5575943198695258, "learning_rate": 2.7763984961267202e-05, "loss": 0.0959, "loss_nan_ranks": 0, "loss_rank_avg": 0.09871990978717804, "step": 1560, "valid_targets_mean": 2915.4, "valid_targets_min": 468 }, { "epoch": 3.0626223091976517, "grad_norm": 0.3917830696660751, "learning_rate": 2.767395144721038e-05, "loss": 0.0952, "loss_nan_ranks": 0, "loss_rank_avg": 0.08617722988128662, "step": 1565, "valid_targets_mean": 2731.6, "valid_targets_min": 665 }, { "epoch": 3.072407045009785, "grad_norm": 0.5227822005219008, "learning_rate": 2.758373520057359e-05, "loss": 0.1067, "loss_nan_ranks": 0, "loss_rank_avg": 0.16681335866451263, "step": 1570, "valid_targets_mean": 2202.9, "valid_targets_min": 622 }, { "epoch": 3.0821917808219177, "grad_norm": 0.4481983579473897, "learning_rate": 2.7493338369591355e-05, "loss": 0.1025, "loss_nan_ranks": 0, "loss_rank_avg": 0.10602610558271408, "step": 1575, "valid_targets_mean": 2457.4, "valid_targets_min": 658 }, { "epoch": 3.091976516634051, "grad_norm": 0.41182336536618824, "learning_rate": 2.7402763106798295e-05, "loss": 0.097, "loss_nan_ranks": 0, "loss_rank_avg": 0.09512235224246979, "step": 1580, "valid_targets_mean": 2693.2, "valid_targets_min": 323 }, { "epoch": 3.1017612524461837, "grad_norm": 0.4111689440731356, "learning_rate": 2.731201156897785e-05, "loss": 0.088, "loss_nan_ranks": 0, "loss_rank_avg": 0.08959066867828369, "step": 1585, "valid_targets_mean": 2895.9, "valid_targets_min": 614 }, { "epoch": 3.111545988258317, "grad_norm": 0.45106807085617473, "learning_rate": 2.722108591711095e-05, "loss": 0.1028, "loss_nan_ranks": 0, "loss_rank_avg": 0.10399621725082397, "step": 1590, "valid_targets_mean": 2582.5, "valid_targets_min": 526 }, { "epoch": 3.12133072407045, "grad_norm": 0.40429829012168483, "learning_rate": 2.7129988316324522e-05, "loss": 0.1017, "loss_nan_ranks": 0, "loss_rank_avg": 0.12241924554109573, "step": 1595, "valid_targets_mean": 2891.0, "valid_targets_min": 424 }, { "epoch": 3.131115459882583, "grad_norm": 0.41002787703696647, "learning_rate": 2.7038720935839955e-05, "loss": 0.1067, "loss_nan_ranks": 0, "loss_rank_avg": 0.10877316445112228, "step": 1600, "valid_targets_mean": 2865.1, "valid_targets_min": 324 }, { "epoch": 3.1409001956947162, "grad_norm": 0.46037341512154545, "learning_rate": 2.6947285948921447e-05, "loss": 0.1013, "loss_nan_ranks": 0, "loss_rank_avg": 0.10007884353399277, "step": 1605, "valid_targets_mean": 2481.1, "valid_targets_min": 688 }, { "epoch": 3.1506849315068495, "grad_norm": 5.110272464423244, "learning_rate": 2.6855685532824236e-05, "loss": 0.093, "loss_nan_ranks": 0, "loss_rank_avg": 0.11062052845954895, "step": 1610, "valid_targets_mean": 2889.8, "valid_targets_min": 965 }, { "epoch": 3.1604696673189823, "grad_norm": 0.4114215687770999, "learning_rate": 2.676392186874279e-05, "loss": 0.0877, "loss_nan_ranks": 0, "loss_rank_avg": 0.09809882938861847, "step": 1615, "valid_targets_mean": 2879.0, "valid_targets_min": 650 }, { "epoch": 3.1702544031311155, "grad_norm": 0.3996926275976193, "learning_rate": 2.6671997141758827e-05, "loss": 0.0927, "loss_nan_ranks": 0, "loss_rank_avg": 0.12717470526695251, "step": 1620, "valid_targets_mean": 2880.8, "valid_targets_min": 676 }, { "epoch": 3.1800391389432487, "grad_norm": 0.3639885387428381, "learning_rate": 2.6579913540789322e-05, "loss": 0.0887, "loss_nan_ranks": 0, "loss_rank_avg": 0.07497823983430862, "step": 1625, "valid_targets_mean": 2640.9, "valid_targets_min": 515 }, { "epoch": 3.1898238747553815, "grad_norm": 0.3703997916696169, "learning_rate": 2.6487673258534354e-05, "loss": 0.0885, "loss_nan_ranks": 0, "loss_rank_avg": 0.0767689049243927, "step": 1630, "valid_targets_mean": 3069.6, "valid_targets_min": 636 }, { "epoch": 3.1996086105675148, "grad_norm": 0.4413852282140088, "learning_rate": 2.639527849142491e-05, "loss": 0.1015, "loss_nan_ranks": 0, "loss_rank_avg": 0.10007453709840775, "step": 1635, "valid_targets_mean": 2802.6, "valid_targets_min": 924 }, { "epoch": 3.2093933463796476, "grad_norm": 0.44437000715097036, "learning_rate": 2.630273143957058e-05, "loss": 0.0977, "loss_nan_ranks": 0, "loss_rank_avg": 0.09787821769714355, "step": 1640, "valid_targets_mean": 2599.1, "valid_targets_min": 516 }, { "epoch": 3.219178082191781, "grad_norm": 0.4598260445599975, "learning_rate": 2.6210034306707165e-05, "loss": 0.0938, "loss_nan_ranks": 0, "loss_rank_avg": 0.09357476234436035, "step": 1645, "valid_targets_mean": 2352.2, "valid_targets_min": 659 }, { "epoch": 3.228962818003914, "grad_norm": 0.42650769322905097, "learning_rate": 2.6117189300144212e-05, "loss": 0.1012, "loss_nan_ranks": 0, "loss_rank_avg": 0.13607531785964966, "step": 1650, "valid_targets_mean": 2959.1, "valid_targets_min": 684 }, { "epoch": 3.238747553816047, "grad_norm": 0.3954567699571377, "learning_rate": 2.6024198630712444e-05, "loss": 0.0951, "loss_nan_ranks": 0, "loss_rank_avg": 0.08541727066040039, "step": 1655, "valid_targets_mean": 2900.4, "valid_targets_min": 538 }, { "epoch": 3.24853228962818, "grad_norm": 0.3799054478005135, "learning_rate": 2.5931064512711094e-05, "loss": 0.0974, "loss_nan_ranks": 0, "loss_rank_avg": 0.1218566820025444, "step": 1660, "valid_targets_mean": 3502.8, "valid_targets_min": 774 }, { "epoch": 3.258317025440313, "grad_norm": 0.39283413314321314, "learning_rate": 2.583778916385522e-05, "loss": 0.0908, "loss_nan_ranks": 0, "loss_rank_avg": 0.08874887228012085, "step": 1665, "valid_targets_mean": 2809.4, "valid_targets_min": 663 }, { "epoch": 3.268101761252446, "grad_norm": 0.4381850178027912, "learning_rate": 2.5744374805222892e-05, "loss": 0.0993, "loss_nan_ranks": 0, "loss_rank_avg": 0.11543179303407669, "step": 1670, "valid_targets_mean": 3048.3, "valid_targets_min": 591 }, { "epoch": 3.2778864970645794, "grad_norm": 0.36917810068552503, "learning_rate": 2.565082366120226e-05, "loss": 0.0929, "loss_nan_ranks": 0, "loss_rank_avg": 0.08536778390407562, "step": 1675, "valid_targets_mean": 3376.4, "valid_targets_min": 1004 }, { "epoch": 3.287671232876712, "grad_norm": 0.4385678853719193, "learning_rate": 2.555713795943864e-05, "loss": 0.1045, "loss_nan_ranks": 0, "loss_rank_avg": 0.11536893248558044, "step": 1680, "valid_targets_mean": 2739.6, "valid_targets_min": 824 }, { "epoch": 3.2974559686888454, "grad_norm": 0.393601306502803, "learning_rate": 2.5463319930781415e-05, "loss": 0.089, "loss_nan_ranks": 0, "loss_rank_avg": 0.09885405004024506, "step": 1685, "valid_targets_mean": 3358.1, "valid_targets_min": 699 }, { "epoch": 3.3072407045009786, "grad_norm": 0.36006488816751797, "learning_rate": 2.5369371809230977e-05, "loss": 0.0903, "loss_nan_ranks": 0, "loss_rank_avg": 0.08712077885866165, "step": 1690, "valid_targets_mean": 3766.2, "valid_targets_min": 720 }, { "epoch": 3.3170254403131114, "grad_norm": 0.37713092406723087, "learning_rate": 2.527529583188548e-05, "loss": 0.0961, "loss_nan_ranks": 0, "loss_rank_avg": 0.09263085573911667, "step": 1695, "valid_targets_mean": 2927.4, "valid_targets_min": 766 }, { "epoch": 3.3268101761252447, "grad_norm": 0.414881476450131, "learning_rate": 2.518109423888758e-05, "loss": 0.09, "loss_nan_ranks": 0, "loss_rank_avg": 0.09965046495199203, "step": 1700, "valid_targets_mean": 2728.1, "valid_targets_min": 805 }, { "epoch": 3.336594911937378, "grad_norm": 0.3276882930558519, "learning_rate": 2.5086769273371122e-05, "loss": 0.0902, "loss_nan_ranks": 0, "loss_rank_avg": 0.07712644338607788, "step": 1705, "valid_targets_mean": 3432.0, "valid_targets_min": 1229 }, { "epoch": 3.3463796477495107, "grad_norm": 0.41120960483108754, "learning_rate": 2.499232318140769e-05, "loss": 0.0963, "loss_nan_ranks": 0, "loss_rank_avg": 0.09201785922050476, "step": 1710, "valid_targets_mean": 2984.1, "valid_targets_min": 720 }, { "epoch": 3.356164383561644, "grad_norm": 0.4114515415368508, "learning_rate": 2.4897758211953135e-05, "loss": 0.0887, "loss_nan_ranks": 0, "loss_rank_avg": 0.09025739133358002, "step": 1715, "valid_targets_mean": 2741.2, "valid_targets_min": 707 }, { "epoch": 3.3659491193737767, "grad_norm": 0.3677616557466712, "learning_rate": 2.4803076616794038e-05, "loss": 0.0957, "loss_nan_ranks": 0, "loss_rank_avg": 0.08147165179252625, "step": 1720, "valid_targets_mean": 3088.6, "valid_targets_min": 350 }, { "epoch": 3.37573385518591, "grad_norm": 0.44042021167276707, "learning_rate": 2.4708280650494067e-05, "loss": 0.0895, "loss_nan_ranks": 0, "loss_rank_avg": 0.09253993630409241, "step": 1725, "valid_targets_mean": 2585.8, "valid_targets_min": 716 }, { "epoch": 3.385518590998043, "grad_norm": 0.4215992681842096, "learning_rate": 2.461337257034031e-05, "loss": 0.0982, "loss_nan_ranks": 0, "loss_rank_avg": 0.09265173971652985, "step": 1730, "valid_targets_mean": 2482.9, "valid_targets_min": 652 }, { "epoch": 3.395303326810176, "grad_norm": 0.4142825675183947, "learning_rate": 2.4518354636289523e-05, "loss": 0.0877, "loss_nan_ranks": 0, "loss_rank_avg": 0.09479625523090363, "step": 1735, "valid_targets_mean": 2704.0, "valid_targets_min": 593 }, { "epoch": 3.4050880626223092, "grad_norm": 0.4359979529870605, "learning_rate": 2.442322911091428e-05, "loss": 0.0986, "loss_nan_ranks": 0, "loss_rank_avg": 0.0992426872253418, "step": 1740, "valid_targets_mean": 2675.4, "valid_targets_min": 794 }, { "epoch": 3.414872798434442, "grad_norm": 0.37594536492115166, "learning_rate": 2.4327998259349165e-05, "loss": 0.0952, "loss_nan_ranks": 0, "loss_rank_avg": 0.09966818988323212, "step": 1745, "valid_targets_mean": 3095.5, "valid_targets_min": 759 }, { "epoch": 3.4246575342465753, "grad_norm": 0.40001334846317066, "learning_rate": 2.4232664349236757e-05, "loss": 0.0887, "loss_nan_ranks": 0, "loss_rank_avg": 0.0902199074625969, "step": 1750, "valid_targets_mean": 2817.9, "valid_targets_min": 635 }, { "epoch": 3.4344422700587085, "grad_norm": 0.4006625889271972, "learning_rate": 2.413722965067371e-05, "loss": 0.0974, "loss_nan_ranks": 0, "loss_rank_avg": 0.09919355064630508, "step": 1755, "valid_targets_mean": 2923.6, "valid_targets_min": 636 }, { "epoch": 3.4442270058708413, "grad_norm": 0.3812585798186099, "learning_rate": 2.404169643615663e-05, "loss": 0.0899, "loss_nan_ranks": 0, "loss_rank_avg": 0.09447631239891052, "step": 1760, "valid_targets_mean": 3224.1, "valid_targets_min": 782 }, { "epoch": 3.4540117416829745, "grad_norm": 0.393226956942131, "learning_rate": 2.3946066980528e-05, "loss": 0.0977, "loss_nan_ranks": 0, "loss_rank_avg": 0.08800017833709717, "step": 1765, "valid_targets_mean": 2783.4, "valid_targets_min": 588 }, { "epoch": 3.4637964774951078, "grad_norm": 0.4130522975010669, "learning_rate": 2.3850343560922008e-05, "loss": 0.0951, "loss_nan_ranks": 0, "loss_rank_avg": 0.09055754542350769, "step": 1770, "valid_targets_mean": 2447.2, "valid_targets_min": 647 }, { "epoch": 3.4735812133072406, "grad_norm": 0.37842294460082415, "learning_rate": 2.37545284567103e-05, "loss": 0.0948, "loss_nan_ranks": 0, "loss_rank_avg": 0.0931730717420578, "step": 1775, "valid_targets_mean": 3382.8, "valid_targets_min": 697 }, { "epoch": 3.483365949119374, "grad_norm": 0.39858769418626966, "learning_rate": 2.3658623949447735e-05, "loss": 0.0901, "loss_nan_ranks": 0, "loss_rank_avg": 0.09716151654720306, "step": 1780, "valid_targets_mean": 2783.8, "valid_targets_min": 699 }, { "epoch": 3.493150684931507, "grad_norm": 0.3587757194116961, "learning_rate": 2.3562632322818047e-05, "loss": 0.0864, "loss_nan_ranks": 0, "loss_rank_avg": 0.08153725415468216, "step": 1785, "valid_targets_mean": 3316.6, "valid_targets_min": 784 }, { "epoch": 3.50293542074364, "grad_norm": 0.5073856878677895, "learning_rate": 2.346655586257945e-05, "loss": 0.0975, "loss_nan_ranks": 0, "loss_rank_avg": 0.12582001090049744, "step": 1790, "valid_targets_mean": 2520.9, "valid_targets_min": 922 }, { "epoch": 3.512720156555773, "grad_norm": 0.3824304763924219, "learning_rate": 2.3370396856510228e-05, "loss": 0.0915, "loss_nan_ranks": 0, "loss_rank_avg": 0.09068600833415985, "step": 1795, "valid_targets_mean": 3130.3, "valid_targets_min": 1082 }, { "epoch": 3.5225048923679063, "grad_norm": 0.33517308415172126, "learning_rate": 2.3274157594354244e-05, "loss": 0.1002, "loss_nan_ranks": 0, "loss_rank_avg": 0.07240046560764313, "step": 1800, "valid_targets_mean": 3421.6, "valid_targets_min": 1003 }, { "epoch": 3.532289628180039, "grad_norm": 0.4151492239970627, "learning_rate": 2.317784036776643e-05, "loss": 0.095, "loss_nan_ranks": 0, "loss_rank_avg": 0.10990441590547562, "step": 1805, "valid_targets_mean": 2744.4, "valid_targets_min": 693 }, { "epoch": 3.5420743639921723, "grad_norm": 0.3897935534208523, "learning_rate": 2.308144747025822e-05, "loss": 0.1068, "loss_nan_ranks": 0, "loss_rank_avg": 0.09307827055454254, "step": 1810, "valid_targets_mean": 3265.9, "valid_targets_min": 756 }, { "epoch": 3.551859099804305, "grad_norm": 0.43581519464806656, "learning_rate": 2.2984981197142903e-05, "loss": 0.0993, "loss_nan_ranks": 0, "loss_rank_avg": 0.1167551726102829, "step": 1815, "valid_targets_mean": 2591.2, "valid_targets_min": 836 }, { "epoch": 3.5616438356164384, "grad_norm": 0.386659833532582, "learning_rate": 2.2888443845481014e-05, "loss": 0.0933, "loss_nan_ranks": 0, "loss_rank_avg": 0.09008432179689407, "step": 1820, "valid_targets_mean": 3245.9, "valid_targets_min": 856 }, { "epoch": 3.571428571428571, "grad_norm": 0.3543818030871814, "learning_rate": 2.2791837714025605e-05, "loss": 0.0932, "loss_nan_ranks": 0, "loss_rank_avg": 0.09043369442224503, "step": 1825, "valid_targets_mean": 3304.0, "valid_targets_min": 800 }, { "epoch": 3.5812133072407044, "grad_norm": 0.438729662155011, "learning_rate": 2.269516510316753e-05, "loss": 0.1043, "loss_nan_ranks": 0, "loss_rank_avg": 0.09659003466367722, "step": 1830, "valid_targets_mean": 2356.2, "valid_targets_min": 665 }, { "epoch": 3.5909980430528377, "grad_norm": 0.4367444363023162, "learning_rate": 2.2598428314880626e-05, "loss": 0.1196, "loss_nan_ranks": 0, "loss_rank_avg": 0.1389397382736206, "step": 1835, "valid_targets_mean": 2930.7, "valid_targets_min": 729 }, { "epoch": 3.6007827788649704, "grad_norm": 0.3533335852440453, "learning_rate": 2.250162965266696e-05, "loss": 0.0959, "loss_nan_ranks": 0, "loss_rank_avg": 0.08077824115753174, "step": 1840, "valid_targets_mean": 3471.1, "valid_targets_min": 712 }, { "epoch": 3.6105675146771037, "grad_norm": 0.412577131838221, "learning_rate": 2.2404771421501924e-05, "loss": 0.1041, "loss_nan_ranks": 0, "loss_rank_avg": 0.12000207602977753, "step": 1845, "valid_targets_mean": 3292.5, "valid_targets_min": 774 }, { "epoch": 3.620352250489237, "grad_norm": 0.34314515066987156, "learning_rate": 2.230785592777938e-05, "loss": 0.1096, "loss_nan_ranks": 0, "loss_rank_avg": 0.0764012485742569, "step": 1850, "valid_targets_mean": 3464.9, "valid_targets_min": 664 }, { "epoch": 3.6301369863013697, "grad_norm": 0.5021484175858066, "learning_rate": 2.2210885479256713e-05, "loss": 0.101, "loss_nan_ranks": 0, "loss_rank_avg": 0.0931086540222168, "step": 1855, "valid_targets_mean": 2372.5, "valid_targets_min": 767 }, { "epoch": 3.639921722113503, "grad_norm": 0.418925470817628, "learning_rate": 2.2113862384999908e-05, "loss": 0.0962, "loss_nan_ranks": 0, "loss_rank_avg": 0.09805671125650406, "step": 1860, "valid_targets_mean": 2864.6, "valid_targets_min": 575 }, { "epoch": 3.649706457925636, "grad_norm": 0.40788258413865075, "learning_rate": 2.2016788955328555e-05, "loss": 0.0938, "loss_nan_ranks": 0, "loss_rank_avg": 0.08214108645915985, "step": 1865, "valid_targets_mean": 3143.8, "valid_targets_min": 680 }, { "epoch": 3.659491193737769, "grad_norm": 0.39469198310409365, "learning_rate": 2.191966750176083e-05, "loss": 0.0949, "loss_nan_ranks": 0, "loss_rank_avg": 0.09547490626573563, "step": 1870, "valid_targets_mean": 3034.0, "valid_targets_min": 333 }, { "epoch": 3.6692759295499022, "grad_norm": 0.45914037172512734, "learning_rate": 2.182250033695846e-05, "loss": 0.1033, "loss_nan_ranks": 0, "loss_rank_avg": 0.11296926438808441, "step": 1875, "valid_targets_mean": 2711.8, "valid_targets_min": 569 }, { "epoch": 3.6790606653620355, "grad_norm": 0.3475562297830893, "learning_rate": 2.1725289774671638e-05, "loss": 0.0995, "loss_nan_ranks": 0, "loss_rank_avg": 0.07544345408678055, "step": 1880, "valid_targets_mean": 3378.5, "valid_targets_min": 538 }, { "epoch": 3.6888454011741683, "grad_norm": 0.3326326001204827, "learning_rate": 2.1628038129683957e-05, "loss": 0.0934, "loss_nan_ranks": 0, "loss_rank_avg": 0.0732976496219635, "step": 1885, "valid_targets_mean": 3177.5, "valid_targets_min": 605 }, { "epoch": 3.6986301369863015, "grad_norm": 0.4293275842467327, "learning_rate": 2.1530747717757263e-05, "loss": 0.1007, "loss_nan_ranks": 0, "loss_rank_avg": 0.1031743511557579, "step": 1890, "valid_targets_mean": 3229.9, "valid_targets_min": 802 }, { "epoch": 3.7084148727984343, "grad_norm": 0.4391241516655618, "learning_rate": 2.1433420855576527e-05, "loss": 0.1078, "loss_nan_ranks": 0, "loss_rank_avg": 0.11853335797786713, "step": 1895, "valid_targets_mean": 2822.1, "valid_targets_min": 502 }, { "epoch": 3.7181996086105675, "grad_norm": 0.33615772425302315, "learning_rate": 2.1336059860694672e-05, "loss": 0.0838, "loss_nan_ranks": 0, "loss_rank_avg": 0.07403817027807236, "step": 1900, "valid_targets_mean": 3502.2, "valid_targets_min": 715 }, { "epoch": 3.7279843444227003, "grad_norm": 0.4432964958725013, "learning_rate": 2.12386670514774e-05, "loss": 0.1045, "loss_nan_ranks": 0, "loss_rank_avg": 0.12059329450130463, "step": 1905, "valid_targets_mean": 2732.8, "valid_targets_min": 1022 }, { "epoch": 3.7377690802348336, "grad_norm": 0.4070557595034096, "learning_rate": 2.1141244747047966e-05, "loss": 0.0951, "loss_nan_ranks": 0, "loss_rank_avg": 0.1020825058221817, "step": 1910, "valid_targets_mean": 2716.7, "valid_targets_min": 727 }, { "epoch": 3.747553816046967, "grad_norm": 0.457268061002794, "learning_rate": 2.1043795267231966e-05, "loss": 0.0961, "loss_nan_ranks": 0, "loss_rank_avg": 0.11039022356271744, "step": 1915, "valid_targets_mean": 2666.3, "valid_targets_min": 503 }, { "epoch": 3.7573385518590996, "grad_norm": 0.4136493991453706, "learning_rate": 2.094632093250212e-05, "loss": 0.091, "loss_nan_ranks": 0, "loss_rank_avg": 0.08572959899902344, "step": 1920, "valid_targets_mean": 3254.5, "valid_targets_min": 583 }, { "epoch": 3.767123287671233, "grad_norm": 0.32806235850432924, "learning_rate": 2.084882406392297e-05, "loss": 0.0888, "loss_nan_ranks": 0, "loss_rank_avg": 0.07594846934080124, "step": 1925, "valid_targets_mean": 3780.8, "valid_targets_min": 702 }, { "epoch": 3.776908023483366, "grad_norm": 0.45759987074773256, "learning_rate": 2.0751306983095643e-05, "loss": 0.0906, "loss_nan_ranks": 0, "loss_rank_avg": 0.12067622691392899, "step": 1930, "valid_targets_mean": 2477.0, "valid_targets_min": 665 }, { "epoch": 3.786692759295499, "grad_norm": 0.3576601656361029, "learning_rate": 2.065377201210256e-05, "loss": 0.0958, "loss_nan_ranks": 0, "loss_rank_avg": 0.08292445540428162, "step": 1935, "valid_targets_mean": 3148.9, "valid_targets_min": 776 }, { "epoch": 3.796477495107632, "grad_norm": 0.3888288020581319, "learning_rate": 2.0556221473452148e-05, "loss": 0.097, "loss_nan_ranks": 0, "loss_rank_avg": 0.0956001952290535, "step": 1940, "valid_targets_mean": 3289.1, "valid_targets_min": 791 }, { "epoch": 3.8062622309197653, "grad_norm": 0.3536271628449205, "learning_rate": 2.0458657690023525e-05, "loss": 0.1016, "loss_nan_ranks": 0, "loss_rank_avg": 0.08662386238574982, "step": 1945, "valid_targets_mean": 3108.9, "valid_targets_min": 696 }, { "epoch": 3.816046966731898, "grad_norm": 0.4445545144675986, "learning_rate": 2.036108298501121e-05, "loss": 0.0974, "loss_nan_ranks": 0, "loss_rank_avg": 0.10066284239292145, "step": 1950, "valid_targets_mean": 2228.6, "valid_targets_min": 525 }, { "epoch": 3.8258317025440314, "grad_norm": 0.3486495806571903, "learning_rate": 2.026349968186977e-05, "loss": 0.0796, "loss_nan_ranks": 0, "loss_rank_avg": 0.08311164379119873, "step": 1955, "valid_targets_mean": 2806.6, "valid_targets_min": 652 }, { "epoch": 3.8356164383561646, "grad_norm": 0.41762766327312373, "learning_rate": 2.0165910104258518e-05, "loss": 0.0952, "loss_nan_ranks": 0, "loss_rank_avg": 0.09838832169771194, "step": 1960, "valid_targets_mean": 2575.5, "valid_targets_min": 652 }, { "epoch": 3.8454011741682974, "grad_norm": 0.4116450919445935, "learning_rate": 2.0068316575986185e-05, "loss": 0.0977, "loss_nan_ranks": 0, "loss_rank_avg": 0.09968436509370804, "step": 1965, "valid_targets_mean": 2753.2, "valid_targets_min": 520 }, { "epoch": 3.8551859099804306, "grad_norm": 0.44362431242875416, "learning_rate": 1.997072142095554e-05, "loss": 0.0975, "loss_nan_ranks": 0, "loss_rank_avg": 0.10917310416698456, "step": 1970, "valid_targets_mean": 2599.4, "valid_targets_min": 567 }, { "epoch": 3.8649706457925634, "grad_norm": 0.36533007507160525, "learning_rate": 1.9873126963108136e-05, "loss": 0.0909, "loss_nan_ranks": 0, "loss_rank_avg": 0.08436676114797592, "step": 1975, "valid_targets_mean": 2983.3, "valid_targets_min": 697 }, { "epoch": 3.8747553816046967, "grad_norm": 0.3873930571500393, "learning_rate": 1.9775535526368896e-05, "loss": 0.1085, "loss_nan_ranks": 0, "loss_rank_avg": 0.12226013839244843, "step": 1980, "valid_targets_mean": 3220.3, "valid_targets_min": 757 }, { "epoch": 3.8845401174168295, "grad_norm": 0.3982111947251814, "learning_rate": 1.9677949434590807e-05, "loss": 0.0888, "loss_nan_ranks": 0, "loss_rank_avg": 0.09624812752008438, "step": 1985, "valid_targets_mean": 3241.6, "valid_targets_min": 759 }, { "epoch": 3.8943248532289627, "grad_norm": 0.4262008952175965, "learning_rate": 1.9580371011499587e-05, "loss": 0.099, "loss_nan_ranks": 0, "loss_rank_avg": 0.0822620540857315, "step": 1990, "valid_targets_mean": 2368.4, "valid_targets_min": 718 }, { "epoch": 3.904109589041096, "grad_norm": 0.4735174382000528, "learning_rate": 1.9482802580638346e-05, "loss": 0.0986, "loss_nan_ranks": 0, "loss_rank_avg": 0.11047929525375366, "step": 1995, "valid_targets_mean": 2749.8, "valid_targets_min": 745 }, { "epoch": 3.9138943248532287, "grad_norm": 0.44187199238337815, "learning_rate": 1.9385246465312252e-05, "loss": 0.1061, "loss_nan_ranks": 0, "loss_rank_avg": 0.10588258504867554, "step": 2000, "valid_targets_mean": 2721.5, "valid_targets_min": 711 }, { "epoch": 3.923679060665362, "grad_norm": 0.44168863210644604, "learning_rate": 1.928770498853323e-05, "loss": 0.0954, "loss_nan_ranks": 0, "loss_rank_avg": 0.09524992108345032, "step": 2005, "valid_targets_mean": 3425.9, "valid_targets_min": 939 }, { "epoch": 3.9334637964774952, "grad_norm": 0.37881242527643244, "learning_rate": 1.9190180472964614e-05, "loss": 0.0957, "loss_nan_ranks": 0, "loss_rank_avg": 0.09194761514663696, "step": 2010, "valid_targets_mean": 2941.8, "valid_targets_min": 585 }, { "epoch": 3.943248532289628, "grad_norm": 0.443444952622372, "learning_rate": 1.9092675240865863e-05, "loss": 0.0992, "loss_nan_ranks": 0, "loss_rank_avg": 0.1167190670967102, "step": 2015, "valid_targets_mean": 2865.1, "valid_targets_min": 763 }, { "epoch": 3.9530332681017613, "grad_norm": 0.40398307970988073, "learning_rate": 1.899519161403726e-05, "loss": 0.1158, "loss_nan_ranks": 0, "loss_rank_avg": 0.11057884991168976, "step": 2020, "valid_targets_mean": 2692.5, "valid_targets_min": 540 }, { "epoch": 3.9628180039138945, "grad_norm": 0.35462175087471715, "learning_rate": 1.8897731913764624e-05, "loss": 0.0921, "loss_nan_ranks": 0, "loss_rank_avg": 0.08501636981964111, "step": 2025, "valid_targets_mean": 3447.5, "valid_targets_min": 623 }, { "epoch": 3.9726027397260273, "grad_norm": 0.40113304138042305, "learning_rate": 1.880029846076402e-05, "loss": 0.0969, "loss_nan_ranks": 0, "loss_rank_avg": 0.0958636999130249, "step": 2030, "valid_targets_mean": 2927.4, "valid_targets_min": 682 }, { "epoch": 3.9823874755381605, "grad_norm": 0.3499095157228217, "learning_rate": 1.8702893575126522e-05, "loss": 0.0903, "loss_nan_ranks": 0, "loss_rank_avg": 0.08162295818328857, "step": 2035, "valid_targets_mean": 3658.2, "valid_targets_min": 579 }, { "epoch": 3.9921722113502938, "grad_norm": 0.389382700380517, "learning_rate": 1.8605519576262957e-05, "loss": 0.0915, "loss_nan_ranks": 0, "loss_rank_avg": 0.09373045712709427, "step": 2040, "valid_targets_mean": 3264.7, "valid_targets_min": 771 }, { "epoch": 4.001956947162427, "grad_norm": 0.33347090417729486, "learning_rate": 1.850817878284867e-05, "loss": 0.0901, "loss_nan_ranks": 0, "loss_rank_avg": 0.07215394079685211, "step": 2045, "valid_targets_mean": 3224.1, "valid_targets_min": 739 }, { "epoch": 4.011741682974559, "grad_norm": 0.4279822957204113, "learning_rate": 1.8410873512768318e-05, "loss": 0.0842, "loss_nan_ranks": 0, "loss_rank_avg": 0.10365812480449677, "step": 2050, "valid_targets_mean": 2869.9, "valid_targets_min": 486 }, { "epoch": 4.021526418786693, "grad_norm": 0.5174724407207372, "learning_rate": 1.831360608306068e-05, "loss": 0.0794, "loss_nan_ranks": 0, "loss_rank_avg": 0.09613613039255142, "step": 2055, "valid_targets_mean": 2579.1, "valid_targets_min": 530 }, { "epoch": 4.031311154598826, "grad_norm": 0.4758726038547127, "learning_rate": 1.8216378809863465e-05, "loss": 0.0751, "loss_nan_ranks": 0, "loss_rank_avg": 0.08645018935203552, "step": 2060, "valid_targets_mean": 2447.8, "valid_targets_min": 644 }, { "epoch": 4.041095890410959, "grad_norm": 0.4569397341530332, "learning_rate": 1.8119194008358187e-05, "loss": 0.0847, "loss_nan_ranks": 0, "loss_rank_avg": 0.1112334281206131, "step": 2065, "valid_targets_mean": 3251.8, "valid_targets_min": 876 }, { "epoch": 4.050880626223092, "grad_norm": 0.40211824561355514, "learning_rate": 1.8022053992715007e-05, "loss": 0.0798, "loss_nan_ranks": 0, "loss_rank_avg": 0.08205370604991913, "step": 2070, "valid_targets_mean": 3019.1, "valid_targets_min": 588 }, { "epoch": 4.060665362035225, "grad_norm": 0.43322593298423395, "learning_rate": 1.7924961076037655e-05, "loss": 0.0825, "loss_nan_ranks": 0, "loss_rank_avg": 0.07359033077955246, "step": 2075, "valid_targets_mean": 2844.8, "valid_targets_min": 546 }, { "epoch": 4.070450097847358, "grad_norm": 0.4406952972720065, "learning_rate": 1.782791757030833e-05, "loss": 0.0892, "loss_nan_ranks": 0, "loss_rank_avg": 0.08964337408542633, "step": 2080, "valid_targets_mean": 2993.1, "valid_targets_min": 704 }, { "epoch": 4.080234833659492, "grad_norm": 0.41185891067535985, "learning_rate": 1.773092578633265e-05, "loss": 0.0948, "loss_nan_ranks": 0, "loss_rank_avg": 0.10361534357070923, "step": 2085, "valid_targets_mean": 3335.3, "valid_targets_min": 804 }, { "epoch": 4.090019569471624, "grad_norm": 0.45078174424393247, "learning_rate": 1.763398803368466e-05, "loss": 0.1072, "loss_nan_ranks": 0, "loss_rank_avg": 0.10514619201421738, "step": 2090, "valid_targets_mean": 2871.2, "valid_targets_min": 720 }, { "epoch": 4.099804305283757, "grad_norm": 0.6106485028695341, "learning_rate": 1.7537106620651766e-05, "loss": 0.0962, "loss_nan_ranks": 0, "loss_rank_avg": 0.10618409514427185, "step": 2095, "valid_targets_mean": 1862.8, "valid_targets_min": 714 }, { "epoch": 4.109589041095891, "grad_norm": 0.33022730463004335, "learning_rate": 1.7440283854179842e-05, "loss": 0.0849, "loss_nan_ranks": 0, "loss_rank_avg": 0.06401461362838745, "step": 2100, "valid_targets_mean": 3686.1, "valid_targets_min": 920 }, { "epoch": 4.119373776908024, "grad_norm": 0.4126400761141411, "learning_rate": 1.7343522039818258e-05, "loss": 0.0827, "loss_nan_ranks": 0, "loss_rank_avg": 0.07285851240158081, "step": 2105, "valid_targets_mean": 2948.2, "valid_targets_min": 549 }, { "epoch": 4.129158512720156, "grad_norm": 0.4086389799740897, "learning_rate": 1.724682348166498e-05, "loss": 0.0901, "loss_nan_ranks": 0, "loss_rank_avg": 0.07260704785585403, "step": 2110, "valid_targets_mean": 2825.8, "valid_targets_min": 721 }, { "epoch": 4.138943248532289, "grad_norm": 0.46286261572756504, "learning_rate": 1.7150190482311727e-05, "loss": 0.0788, "loss_nan_ranks": 0, "loss_rank_avg": 0.07903758436441422, "step": 2115, "valid_targets_mean": 2571.9, "valid_targets_min": 628 }, { "epoch": 4.148727984344423, "grad_norm": 0.4020407338776383, "learning_rate": 1.705362534278912e-05, "loss": 0.0769, "loss_nan_ranks": 0, "loss_rank_avg": 0.08354012668132782, "step": 2120, "valid_targets_mean": 3056.5, "valid_targets_min": 540 }, { "epoch": 4.158512720156556, "grad_norm": 0.39781399587220173, "learning_rate": 1.6957130362511907e-05, "loss": 0.0833, "loss_nan_ranks": 0, "loss_rank_avg": 0.07108549028635025, "step": 2125, "valid_targets_mean": 2955.3, "valid_targets_min": 696 }, { "epoch": 4.1682974559686885, "grad_norm": 0.41645999440413334, "learning_rate": 1.6860707839224183e-05, "loss": 0.0888, "loss_nan_ranks": 0, "loss_rank_avg": 0.08625232428312302, "step": 2130, "valid_targets_mean": 2813.1, "valid_targets_min": 697 }, { "epoch": 4.178082191780822, "grad_norm": 0.4644596872947445, "learning_rate": 1.6764360068944706e-05, "loss": 0.0758, "loss_nan_ranks": 0, "loss_rank_avg": 0.09085105359554291, "step": 2135, "valid_targets_mean": 2999.6, "valid_targets_min": 669 }, { "epoch": 4.187866927592955, "grad_norm": 0.3706643100998044, "learning_rate": 1.6668089345912217e-05, "loss": 0.0955, "loss_nan_ranks": 0, "loss_rank_avg": 0.07670444250106812, "step": 2140, "valid_targets_mean": 2918.2, "valid_targets_min": 724 }, { "epoch": 4.197651663405088, "grad_norm": 0.47220192026093816, "learning_rate": 1.6571897962530784e-05, "loss": 0.0855, "loss_nan_ranks": 0, "loss_rank_avg": 0.08821834623813629, "step": 2145, "valid_targets_mean": 2610.6, "valid_targets_min": 647 }, { "epoch": 4.2074363992172215, "grad_norm": 0.405018454979078, "learning_rate": 1.6475788209315248e-05, "loss": 0.0825, "loss_nan_ranks": 0, "loss_rank_avg": 0.09472696483135223, "step": 2150, "valid_targets_mean": 3579.1, "valid_targets_min": 912 }, { "epoch": 4.217221135029354, "grad_norm": 0.44603853536731675, "learning_rate": 1.6379762374836665e-05, "loss": 0.075, "loss_nan_ranks": 0, "loss_rank_avg": 0.08254195749759674, "step": 2155, "valid_targets_mean": 3158.2, "valid_targets_min": 246 }, { "epoch": 4.227005870841487, "grad_norm": 0.470220253122075, "learning_rate": 1.6283822745667818e-05, "loss": 0.0921, "loss_nan_ranks": 0, "loss_rank_avg": 0.1383131593465805, "step": 2160, "valid_targets_mean": 2484.4, "valid_targets_min": 889 }, { "epoch": 4.236790606653621, "grad_norm": 0.41664049920215673, "learning_rate": 1.6187971606328744e-05, "loss": 0.0843, "loss_nan_ranks": 0, "loss_rank_avg": 0.08246999979019165, "step": 2165, "valid_targets_mean": 3189.9, "valid_targets_min": 509 }, { "epoch": 4.2465753424657535, "grad_norm": 0.4177172165571193, "learning_rate": 1.609221123923239e-05, "loss": 0.0805, "loss_nan_ranks": 0, "loss_rank_avg": 0.07430468499660492, "step": 2170, "valid_targets_mean": 2448.2, "valid_targets_min": 796 }, { "epoch": 4.256360078277886, "grad_norm": 0.3659569689790677, "learning_rate": 1.5996543924630197e-05, "loss": 0.0763, "loss_nan_ranks": 0, "loss_rank_avg": 0.06855691969394684, "step": 2175, "valid_targets_mean": 3914.1, "valid_targets_min": 800 }, { "epoch": 4.266144814090019, "grad_norm": 0.3928665815103277, "learning_rate": 1.590097194055786e-05, "loss": 0.078, "loss_nan_ranks": 0, "loss_rank_avg": 0.07608282566070557, "step": 2180, "valid_targets_mean": 3281.5, "valid_targets_min": 818 }, { "epoch": 4.275929549902153, "grad_norm": 0.38118551530157957, "learning_rate": 1.5805497562781018e-05, "loss": 0.0835, "loss_nan_ranks": 0, "loss_rank_avg": 0.08345082402229309, "step": 2185, "valid_targets_mean": 3308.7, "valid_targets_min": 680 }, { "epoch": 4.285714285714286, "grad_norm": 0.3140135252262881, "learning_rate": 1.571012306474115e-05, "loss": 0.0825, "loss_nan_ranks": 0, "loss_rank_avg": 0.0600694976747036, "step": 2190, "valid_targets_mean": 4122.0, "valid_targets_min": 1031 }, { "epoch": 4.295499021526418, "grad_norm": 0.36985203539245803, "learning_rate": 1.5614850717501374e-05, "loss": 0.0762, "loss_nan_ranks": 0, "loss_rank_avg": 0.06799148768186569, "step": 2195, "valid_targets_mean": 3213.6, "valid_targets_min": 447 }, { "epoch": 4.305283757338552, "grad_norm": 0.49624335733136077, "learning_rate": 1.5519682789692375e-05, "loss": 0.0819, "loss_nan_ranks": 0, "loss_rank_avg": 0.0989300012588501, "step": 2200, "valid_targets_mean": 2505.1, "valid_targets_min": 776 }, { "epoch": 4.315068493150685, "grad_norm": 0.5817276658624355, "learning_rate": 1.5424621547458416e-05, "loss": 0.0882, "loss_nan_ranks": 0, "loss_rank_avg": 0.08102203160524368, "step": 2205, "valid_targets_mean": 2599.9, "valid_targets_min": 716 }, { "epoch": 4.324853228962818, "grad_norm": 0.40804741152655644, "learning_rate": 1.5329669254403342e-05, "loss": 0.0822, "loss_nan_ranks": 0, "loss_rank_avg": 0.09205059707164764, "step": 2210, "valid_targets_mean": 3102.4, "valid_targets_min": 712 }, { "epoch": 4.334637964774951, "grad_norm": 0.3994952601025495, "learning_rate": 1.5234828171536705e-05, "loss": 0.079, "loss_nan_ranks": 0, "loss_rank_avg": 0.06924515962600708, "step": 2215, "valid_targets_mean": 2688.7, "valid_targets_min": 730 }, { "epoch": 4.344422700587084, "grad_norm": 0.43795940048070464, "learning_rate": 1.5140100557219902e-05, "loss": 0.0885, "loss_nan_ranks": 0, "loss_rank_avg": 0.08188264071941376, "step": 2220, "valid_targets_mean": 3017.8, "valid_targets_min": 542 }, { "epoch": 4.354207436399217, "grad_norm": 0.39285934151052326, "learning_rate": 1.5045488667112421e-05, "loss": 0.083, "loss_nan_ranks": 0, "loss_rank_avg": 0.08715667575597763, "step": 2225, "valid_targets_mean": 3435.9, "valid_targets_min": 810 }, { "epoch": 4.363992172211351, "grad_norm": 0.3927584507586724, "learning_rate": 1.4950994754118115e-05, "loss": 0.0818, "loss_nan_ranks": 0, "loss_rank_avg": 0.07635986059904099, "step": 2230, "valid_targets_mean": 3151.9, "valid_targets_min": 904 }, { "epoch": 4.373776908023483, "grad_norm": 0.40139400189745017, "learning_rate": 1.4856621068331557e-05, "loss": 0.0857, "loss_nan_ranks": 0, "loss_rank_avg": 0.07851336896419525, "step": 2235, "valid_targets_mean": 3499.4, "valid_targets_min": 703 }, { "epoch": 4.383561643835616, "grad_norm": 0.5472252641844141, "learning_rate": 1.4762369856984466e-05, "loss": 0.0893, "loss_nan_ranks": 0, "loss_rank_avg": 0.11168396472930908, "step": 2240, "valid_targets_mean": 2343.6, "valid_targets_min": 541 }, { "epoch": 4.39334637964775, "grad_norm": 0.44988499850357433, "learning_rate": 1.4668243364392187e-05, "loss": 0.0853, "loss_nan_ranks": 0, "loss_rank_avg": 0.08482237160205841, "step": 2245, "valid_targets_mean": 2604.9, "valid_targets_min": 541 }, { "epoch": 4.403131115459883, "grad_norm": 0.40278145909096286, "learning_rate": 1.4574243831900252e-05, "loss": 0.0832, "loss_nan_ranks": 0, "loss_rank_avg": 0.08804011344909668, "step": 2250, "valid_targets_mean": 2919.4, "valid_targets_min": 623 }, { "epoch": 4.4129158512720155, "grad_norm": 0.4283698076896282, "learning_rate": 1.4480373497831034e-05, "loss": 0.0846, "loss_nan_ranks": 0, "loss_rank_avg": 0.08546335250139236, "step": 2255, "valid_targets_mean": 3130.6, "valid_targets_min": 598 }, { "epoch": 4.422700587084149, "grad_norm": 0.42452807333687326, "learning_rate": 1.4386634597430402e-05, "loss": 0.0862, "loss_nan_ranks": 0, "loss_rank_avg": 0.0829804390668869, "step": 2260, "valid_targets_mean": 3186.8, "valid_targets_min": 758 }, { "epoch": 4.432485322896282, "grad_norm": 0.5080896782394324, "learning_rate": 1.4293029362814521e-05, "loss": 0.087, "loss_nan_ranks": 0, "loss_rank_avg": 0.08919325470924377, "step": 2265, "valid_targets_mean": 3136.6, "valid_targets_min": 608 }, { "epoch": 4.442270058708415, "grad_norm": 0.3654051449018453, "learning_rate": 1.4199560022916701e-05, "loss": 0.0802, "loss_nan_ranks": 0, "loss_rank_avg": 0.061577536165714264, "step": 2270, "valid_targets_mean": 3570.6, "valid_targets_min": 1093 }, { "epoch": 4.4520547945205475, "grad_norm": 0.4071984690405413, "learning_rate": 1.4106228803434329e-05, "loss": 0.0911, "loss_nan_ranks": 0, "loss_rank_avg": 0.08632341772317886, "step": 2275, "valid_targets_mean": 3279.2, "valid_targets_min": 784 }, { "epoch": 4.461839530332681, "grad_norm": 0.5465175072506565, "learning_rate": 1.4013037926775857e-05, "loss": 0.0942, "loss_nan_ranks": 0, "loss_rank_avg": 0.11121866852045059, "step": 2280, "valid_targets_mean": 2290.5, "valid_targets_min": 759 }, { "epoch": 4.471624266144814, "grad_norm": 0.4545421717381925, "learning_rate": 1.3919989612007873e-05, "loss": 0.0863, "loss_nan_ranks": 0, "loss_rank_avg": 0.09390892088413239, "step": 2285, "valid_targets_mean": 2565.9, "valid_targets_min": 357 }, { "epoch": 4.481409001956947, "grad_norm": 0.4744600265214128, "learning_rate": 1.3827086074802288e-05, "loss": 0.0904, "loss_nan_ranks": 0, "loss_rank_avg": 0.09152168780565262, "step": 2290, "valid_targets_mean": 3018.2, "valid_targets_min": 840 }, { "epoch": 4.4911937377690805, "grad_norm": 0.37848480874679646, "learning_rate": 1.373432952738355e-05, "loss": 0.0887, "loss_nan_ranks": 0, "loss_rank_avg": 0.07510063052177429, "step": 2295, "valid_targets_mean": 3468.9, "valid_targets_min": 947 }, { "epoch": 4.500978473581213, "grad_norm": 0.41100746477510236, "learning_rate": 1.3641722178475982e-05, "loss": 0.0882, "loss_nan_ranks": 0, "loss_rank_avg": 0.07598906755447388, "step": 2300, "valid_targets_mean": 3540.9, "valid_targets_min": 743 }, { "epoch": 4.510763209393346, "grad_norm": 0.4031977134950344, "learning_rate": 1.354926623325119e-05, "loss": 0.0816, "loss_nan_ranks": 0, "loss_rank_avg": 0.08031619340181351, "step": 2305, "valid_targets_mean": 3444.3, "valid_targets_min": 763 }, { "epoch": 4.52054794520548, "grad_norm": 0.3907727106261878, "learning_rate": 1.3456963893275541e-05, "loss": 0.0894, "loss_nan_ranks": 0, "loss_rank_avg": 0.0799025148153305, "step": 2310, "valid_targets_mean": 3235.8, "valid_targets_min": 785 }, { "epoch": 4.5303326810176126, "grad_norm": 0.41542931620683693, "learning_rate": 1.3364817356457739e-05, "loss": 0.0838, "loss_nan_ranks": 0, "loss_rank_avg": 0.0947611927986145, "step": 2315, "valid_targets_mean": 3364.6, "valid_targets_min": 929 }, { "epoch": 4.540117416829745, "grad_norm": 0.47481824122948996, "learning_rate": 1.3272828816996498e-05, "loss": 0.0908, "loss_nan_ranks": 0, "loss_rank_avg": 0.11458331346511841, "step": 2320, "valid_targets_mean": 2688.8, "valid_targets_min": 730 }, { "epoch": 4.549902152641879, "grad_norm": 0.4169815831506829, "learning_rate": 1.3181000465328298e-05, "loss": 0.0877, "loss_nan_ranks": 0, "loss_rank_avg": 0.07972556352615356, "step": 2325, "valid_targets_mean": 2968.4, "valid_targets_min": 549 }, { "epoch": 4.559686888454012, "grad_norm": 0.42758434189152333, "learning_rate": 1.3089334488075207e-05, "loss": 0.1022, "loss_nan_ranks": 0, "loss_rank_avg": 0.09930993616580963, "step": 2330, "valid_targets_mean": 2937.4, "valid_targets_min": 515 }, { "epoch": 4.569471624266145, "grad_norm": 0.4036679246953518, "learning_rate": 1.2997833067992827e-05, "loss": 0.0821, "loss_nan_ranks": 0, "loss_rank_avg": 0.08978946506977081, "step": 2335, "valid_targets_mean": 3032.6, "valid_targets_min": 612 }, { "epoch": 4.579256360078277, "grad_norm": 0.42899233045163393, "learning_rate": 1.2906498383918327e-05, "loss": 0.0847, "loss_nan_ranks": 0, "loss_rank_avg": 0.09562341123819351, "step": 2340, "valid_targets_mean": 2699.2, "valid_targets_min": 509 }, { "epoch": 4.589041095890411, "grad_norm": 0.527541585974065, "learning_rate": 1.2815332610718522e-05, "loss": 0.087, "loss_nan_ranks": 0, "loss_rank_avg": 0.12526696920394897, "step": 2345, "valid_targets_mean": 2469.9, "valid_targets_min": 726 }, { "epoch": 4.598825831702544, "grad_norm": 0.46389236440630605, "learning_rate": 1.2724337919238133e-05, "loss": 0.0892, "loss_nan_ranks": 0, "loss_rank_avg": 0.09370893239974976, "step": 2350, "valid_targets_mean": 2425.7, "valid_targets_min": 538 }, { "epoch": 4.608610567514678, "grad_norm": 0.4627174077448799, "learning_rate": 1.2633516476248067e-05, "loss": 0.0863, "loss_nan_ranks": 0, "loss_rank_avg": 0.08172088861465454, "step": 2355, "valid_targets_mean": 2239.6, "valid_targets_min": 534 }, { "epoch": 4.61839530332681, "grad_norm": 0.4273871422554128, "learning_rate": 1.2542870444393831e-05, "loss": 0.0879, "loss_nan_ranks": 0, "loss_rank_avg": 0.07641121745109558, "step": 2360, "valid_targets_mean": 2943.8, "valid_targets_min": 705 }, { "epoch": 4.628180039138943, "grad_norm": 0.45482968385454625, "learning_rate": 1.2452401982144027e-05, "loss": 0.0848, "loss_nan_ranks": 0, "loss_rank_avg": 0.07942764461040497, "step": 2365, "valid_targets_mean": 2497.5, "valid_targets_min": 591 }, { "epoch": 4.637964774951076, "grad_norm": 0.3831987122114139, "learning_rate": 1.2362113243738957e-05, "loss": 0.0849, "loss_nan_ranks": 0, "loss_rank_avg": 0.06884678453207016, "step": 2370, "valid_targets_mean": 3136.9, "valid_targets_min": 652 }, { "epoch": 4.64774951076321, "grad_norm": 0.3426993876504314, "learning_rate": 1.227200637913934e-05, "loss": 0.0775, "loss_nan_ranks": 0, "loss_rank_avg": 0.06089651957154274, "step": 2375, "valid_targets_mean": 3657.6, "valid_targets_min": 1169 }, { "epoch": 4.657534246575342, "grad_norm": 0.36555463416806805, "learning_rate": 1.2182083533975093e-05, "loss": 0.0741, "loss_nan_ranks": 0, "loss_rank_avg": 0.07065147161483765, "step": 2380, "valid_targets_mean": 3312.8, "valid_targets_min": 939 }, { "epoch": 4.667318982387475, "grad_norm": 0.49916195706518923, "learning_rate": 1.2092346849494249e-05, "loss": 0.0932, "loss_nan_ranks": 0, "loss_rank_avg": 0.1260618418455124, "step": 2385, "valid_targets_mean": 2458.0, "valid_targets_min": 819 }, { "epoch": 4.677103718199609, "grad_norm": 0.4401026984347728, "learning_rate": 1.2002798462511991e-05, "loss": 0.0948, "loss_nan_ranks": 0, "loss_rank_avg": 0.08726265281438828, "step": 2390, "valid_targets_mean": 2878.9, "valid_targets_min": 699 }, { "epoch": 4.686888454011742, "grad_norm": 0.41329131996894747, "learning_rate": 1.1913440505359737e-05, "loss": 0.0888, "loss_nan_ranks": 0, "loss_rank_avg": 0.09846547991037369, "step": 2395, "valid_targets_mean": 2795.2, "valid_targets_min": 580 }, { "epoch": 4.6966731898238745, "grad_norm": 0.40015455540562234, "learning_rate": 1.1824275105834376e-05, "loss": 0.0955, "loss_nan_ranks": 0, "loss_rank_avg": 0.09469325095415115, "step": 2400, "valid_targets_mean": 2817.9, "valid_targets_min": 760 }, { "epoch": 4.706457925636008, "grad_norm": 0.3638478848724825, "learning_rate": 1.173530438714761e-05, "loss": 0.0854, "loss_nan_ranks": 0, "loss_rank_avg": 0.0795590728521347, "step": 2405, "valid_targets_mean": 3600.8, "valid_targets_min": 792 }, { "epoch": 4.716242661448141, "grad_norm": 0.3610144363902236, "learning_rate": 1.1646530467875384e-05, "loss": 0.0795, "loss_nan_ranks": 0, "loss_rank_avg": 0.06894271075725555, "step": 2410, "valid_targets_mean": 2944.6, "valid_targets_min": 708 }, { "epoch": 4.726027397260274, "grad_norm": 0.4720220662855206, "learning_rate": 1.1557955461907468e-05, "loss": 0.0813, "loss_nan_ranks": 0, "loss_rank_avg": 0.09234504401683807, "step": 2415, "valid_targets_mean": 2605.2, "valid_targets_min": 839 }, { "epoch": 4.7358121330724074, "grad_norm": 0.4231419000389196, "learning_rate": 1.1469581478397044e-05, "loss": 0.0793, "loss_nan_ranks": 0, "loss_rank_avg": 0.07564327120780945, "step": 2420, "valid_targets_mean": 3238.0, "valid_targets_min": 531 }, { "epoch": 4.74559686888454, "grad_norm": 0.5160752220286023, "learning_rate": 1.1381410621710582e-05, "loss": 0.0891, "loss_nan_ranks": 0, "loss_rank_avg": 0.10082191228866577, "step": 2425, "valid_targets_mean": 2365.6, "valid_targets_min": 507 }, { "epoch": 4.755381604696673, "grad_norm": 0.41958078295292695, "learning_rate": 1.1293444991377683e-05, "loss": 0.0874, "loss_nan_ranks": 0, "loss_rank_avg": 0.07534124702215195, "step": 2430, "valid_targets_mean": 2718.6, "valid_targets_min": 676 }, { "epoch": 4.765166340508806, "grad_norm": 0.3993376985467739, "learning_rate": 1.120568668204105e-05, "loss": 0.0833, "loss_nan_ranks": 0, "loss_rank_avg": 0.07338666170835495, "step": 2435, "valid_targets_mean": 3466.2, "valid_targets_min": 995 }, { "epoch": 4.7749510763209395, "grad_norm": 0.40708648042993384, "learning_rate": 1.1118137783406691e-05, "loss": 0.0801, "loss_nan_ranks": 0, "loss_rank_avg": 0.07422689348459244, "step": 2440, "valid_targets_mean": 2852.9, "valid_targets_min": 613 }, { "epoch": 4.784735812133072, "grad_norm": 0.32933199228045734, "learning_rate": 1.1030800380194075e-05, "loss": 0.0824, "loss_nan_ranks": 0, "loss_rank_avg": 0.05903619900345802, "step": 2445, "valid_targets_mean": 3809.5, "valid_targets_min": 981 }, { "epoch": 4.794520547945205, "grad_norm": 0.45145938340577096, "learning_rate": 1.0943676552086555e-05, "loss": 0.0823, "loss_nan_ranks": 0, "loss_rank_avg": 0.09547198563814163, "step": 2450, "valid_targets_mean": 3029.9, "valid_targets_min": 493 }, { "epoch": 4.804305283757339, "grad_norm": 0.39536994402553677, "learning_rate": 1.0856768373681824e-05, "loss": 0.0897, "loss_nan_ranks": 0, "loss_rank_avg": 0.06591817736625671, "step": 2455, "valid_targets_mean": 3374.6, "valid_targets_min": 523 }, { "epoch": 4.814090019569472, "grad_norm": 0.43737528144487636, "learning_rate": 1.0770077914442481e-05, "loss": 0.0972, "loss_nan_ranks": 0, "loss_rank_avg": 0.08177588880062103, "step": 2460, "valid_targets_mean": 2486.7, "valid_targets_min": 721 }, { "epoch": 4.823874755381604, "grad_norm": 0.4029529691750347, "learning_rate": 1.0683607238646823e-05, "loss": 0.0861, "loss_nan_ranks": 0, "loss_rank_avg": 0.07464135438203812, "step": 2465, "valid_targets_mean": 2826.1, "valid_targets_min": 540 }, { "epoch": 4.833659491193738, "grad_norm": 0.40915386401021575, "learning_rate": 1.0597358405339612e-05, "loss": 0.078, "loss_nan_ranks": 0, "loss_rank_avg": 0.083827443420887, "step": 2470, "valid_targets_mean": 3118.3, "valid_targets_min": 672 }, { "epoch": 4.843444227005871, "grad_norm": 0.4673013862594274, "learning_rate": 1.0511333468283123e-05, "loss": 0.0876, "loss_nan_ranks": 0, "loss_rank_avg": 0.09946395456790924, "step": 2475, "valid_targets_mean": 2776.6, "valid_targets_min": 802 }, { "epoch": 4.853228962818004, "grad_norm": 0.4147413930838571, "learning_rate": 1.0425534475908162e-05, "loss": 0.0815, "loss_nan_ranks": 0, "loss_rank_avg": 0.07261813431978226, "step": 2480, "valid_targets_mean": 3035.1, "valid_targets_min": 530 }, { "epoch": 4.863013698630137, "grad_norm": 0.39749212592351296, "learning_rate": 1.0339963471265354e-05, "loss": 0.0886, "loss_nan_ranks": 0, "loss_rank_avg": 0.06496164202690125, "step": 2485, "valid_targets_mean": 3029.6, "valid_targets_min": 459 }, { "epoch": 4.87279843444227, "grad_norm": 0.44617161341849004, "learning_rate": 1.0254622491976467e-05, "loss": 0.0877, "loss_nan_ranks": 0, "loss_rank_avg": 0.08341960608959198, "step": 2490, "valid_targets_mean": 2654.7, "valid_targets_min": 753 }, { "epoch": 4.882583170254403, "grad_norm": 0.44433835158297286, "learning_rate": 1.0169513570185873e-05, "loss": 0.0774, "loss_nan_ranks": 0, "loss_rank_avg": 0.09123141318559647, "step": 2495, "valid_targets_mean": 2940.3, "valid_targets_min": 786 }, { "epoch": 4.892367906066536, "grad_norm": 0.43946592148289093, "learning_rate": 1.0084638732512193e-05, "loss": 0.0885, "loss_nan_ranks": 0, "loss_rank_avg": 0.09572343528270721, "step": 2500, "valid_targets_mean": 2890.5, "valid_targets_min": 667 }, { "epoch": 4.902152641878669, "grad_norm": 0.37271846213586, "learning_rate": 1.0000000000000006e-05, "loss": 0.0777, "loss_nan_ranks": 0, "loss_rank_avg": 0.07236606627702713, "step": 2505, "valid_targets_mean": 3438.8, "valid_targets_min": 871 }, { "epoch": 4.911937377690802, "grad_norm": 0.4134697517013373, "learning_rate": 9.91559938807176e-06, "loss": 0.0888, "loss_nan_ranks": 0, "loss_rank_avg": 0.0818052664399147, "step": 2510, "valid_targets_mean": 3295.9, "valid_targets_min": 847 }, { "epoch": 4.921722113502936, "grad_norm": 0.5292638132574928, "learning_rate": 9.831438906479764e-06, "loss": 0.0857, "loss_nan_ranks": 0, "loss_rank_avg": 0.09691952913999557, "step": 2515, "valid_targets_mean": 2324.8, "valid_targets_min": 538 }, { "epoch": 4.931506849315069, "grad_norm": 0.4261666106299731, "learning_rate": 9.747520559258304e-06, "loss": 0.0794, "loss_nan_ranks": 0, "loss_rank_avg": 0.07897660881280899, "step": 2520, "valid_targets_mean": 2536.9, "valid_targets_min": 702 }, { "epoch": 4.9412915851272015, "grad_norm": 0.36788850762651626, "learning_rate": 9.663846344675982e-06, "loss": 0.0847, "loss_nan_ranks": 0, "loss_rank_avg": 0.08979177474975586, "step": 2525, "valid_targets_mean": 3350.4, "valid_targets_min": 622 }, { "epoch": 4.951076320939334, "grad_norm": 0.5905666803453788, "learning_rate": 9.580418255188064e-06, "loss": 0.0864, "loss_nan_ranks": 0, "loss_rank_avg": 0.08794091641902924, "step": 2530, "valid_targets_mean": 2570.4, "valid_targets_min": 716 }, { "epoch": 4.960861056751468, "grad_norm": 0.455660084440653, "learning_rate": 9.497238277389096e-06, "loss": 0.0863, "loss_nan_ranks": 0, "loss_rank_avg": 0.09039708971977234, "step": 2535, "valid_targets_mean": 2890.1, "valid_targets_min": 890 }, { "epoch": 4.970645792563601, "grad_norm": 0.43123529859668797, "learning_rate": 9.414308391965576e-06, "loss": 0.0738, "loss_nan_ranks": 0, "loss_rank_avg": 0.08583714812994003, "step": 2540, "valid_targets_mean": 3090.9, "valid_targets_min": 804 }, { "epoch": 4.9804305283757335, "grad_norm": 0.38267209615286657, "learning_rate": 9.331630573648762e-06, "loss": 0.0877, "loss_nan_ranks": 0, "loss_rank_avg": 0.0717456191778183, "step": 2545, "valid_targets_mean": 3247.4, "valid_targets_min": 700 }, { "epoch": 4.990215264187867, "grad_norm": 0.4869270630648989, "learning_rate": 9.249206791167708e-06, "loss": 0.0925, "loss_nan_ranks": 0, "loss_rank_avg": 0.1435987800359726, "step": 2550, "valid_targets_mean": 2629.9, "valid_targets_min": 623 }, { "epoch": 5.0, "grad_norm": 0.37216419041648807, "learning_rate": 9.167039007202318e-06, "loss": 0.0869, "loss_nan_ranks": 0, "loss_rank_avg": 0.0866527259349823, "step": 2555, "valid_targets_mean": 3667.2, "valid_targets_min": 673 }, { "epoch": 5.009784735812133, "grad_norm": 0.3846448015454443, "learning_rate": 9.08512917833668e-06, "loss": 0.08, "loss_nan_ranks": 0, "loss_rank_avg": 0.07525740563869476, "step": 2560, "valid_targets_mean": 3151.8, "valid_targets_min": 446 }, { "epoch": 5.0195694716242665, "grad_norm": 0.4566927718008459, "learning_rate": 9.003479255012407e-06, "loss": 0.0819, "loss_nan_ranks": 0, "loss_rank_avg": 0.07278042286634445, "step": 2565, "valid_targets_mean": 2763.4, "valid_targets_min": 645 }, { "epoch": 5.029354207436399, "grad_norm": 0.44155540925429854, "learning_rate": 8.922091181482244e-06, "loss": 0.0723, "loss_nan_ranks": 0, "loss_rank_avg": 0.07004959881305695, "step": 2570, "valid_targets_mean": 3266.8, "valid_targets_min": 605 }, { "epoch": 5.039138943248532, "grad_norm": 0.41575306410926377, "learning_rate": 8.84096689576377e-06, "loss": 0.0775, "loss_nan_ranks": 0, "loss_rank_avg": 0.07973407208919525, "step": 2575, "valid_targets_mean": 3170.4, "valid_targets_min": 739 }, { "epoch": 5.048923679060666, "grad_norm": 0.40927473295170586, "learning_rate": 8.760108329593182e-06, "loss": 0.076, "loss_nan_ranks": 0, "loss_rank_avg": 0.06959472596645355, "step": 2580, "valid_targets_mean": 3163.4, "valid_targets_min": 622 }, { "epoch": 5.0587084148727985, "grad_norm": 0.4647202504030572, "learning_rate": 8.679517408379397e-06, "loss": 0.0678, "loss_nan_ranks": 0, "loss_rank_avg": 0.06403348594903946, "step": 2585, "valid_targets_mean": 3153.7, "valid_targets_min": 644 }, { "epoch": 5.068493150684931, "grad_norm": 0.4472345809309543, "learning_rate": 8.599196051158138e-06, "loss": 0.0801, "loss_nan_ranks": 0, "loss_rank_avg": 0.07315093278884888, "step": 2590, "valid_targets_mean": 3103.4, "valid_targets_min": 623 }, { "epoch": 5.078277886497064, "grad_norm": 0.4327382824717028, "learning_rate": 8.519146170546244e-06, "loss": 0.0748, "loss_nan_ranks": 0, "loss_rank_avg": 0.06694217026233673, "step": 2595, "valid_targets_mean": 3028.6, "valid_targets_min": 621 }, { "epoch": 5.088062622309198, "grad_norm": 0.48093617379902154, "learning_rate": 8.439369672696163e-06, "loss": 0.0814, "loss_nan_ranks": 0, "loss_rank_avg": 0.11695721000432968, "step": 2600, "valid_targets_mean": 2941.0, "valid_targets_min": 593 }, { "epoch": 5.097847358121331, "grad_norm": 0.4947290913856816, "learning_rate": 8.3598684572505e-06, "loss": 0.0749, "loss_nan_ranks": 0, "loss_rank_avg": 0.06659847497940063, "step": 2605, "valid_targets_mean": 3053.4, "valid_targets_min": 645 }, { "epoch": 5.107632093933463, "grad_norm": 0.425722662758008, "learning_rate": 8.280644417296857e-06, "loss": 0.0746, "loss_nan_ranks": 0, "loss_rank_avg": 0.05943864956498146, "step": 2610, "valid_targets_mean": 3356.5, "valid_targets_min": 841 }, { "epoch": 5.117416829745597, "grad_norm": 0.7010546552125257, "learning_rate": 8.201699439322683e-06, "loss": 0.0743, "loss_nan_ranks": 0, "loss_rank_avg": 0.08390269428491592, "step": 2615, "valid_targets_mean": 2372.9, "valid_targets_min": 654 }, { "epoch": 5.12720156555773, "grad_norm": 0.4707701192161638, "learning_rate": 8.123035403170416e-06, "loss": 0.0782, "loss_nan_ranks": 0, "loss_rank_avg": 0.09458690881729126, "step": 2620, "valid_targets_mean": 3179.9, "valid_targets_min": 740 }, { "epoch": 5.136986301369863, "grad_norm": 0.3733882899924583, "learning_rate": 8.044654181992681e-06, "loss": 0.0829, "loss_nan_ranks": 0, "loss_rank_avg": 0.06267109513282776, "step": 2625, "valid_targets_mean": 3535.1, "valid_targets_min": 736 }, { "epoch": 5.146771037181996, "grad_norm": 0.5670266134338218, "learning_rate": 7.96655764220768e-06, "loss": 0.083, "loss_nan_ranks": 0, "loss_rank_avg": 0.10448236763477325, "step": 2630, "valid_targets_mean": 2141.2, "valid_targets_min": 534 }, { "epoch": 5.156555772994129, "grad_norm": 0.4579181411339998, "learning_rate": 7.888747643454795e-06, "loss": 0.0738, "loss_nan_ranks": 0, "loss_rank_avg": 0.07108033448457718, "step": 2635, "valid_targets_mean": 3233.6, "valid_targets_min": 898 }, { "epoch": 5.166340508806262, "grad_norm": 0.4796639740717722, "learning_rate": 7.811226038550243e-06, "loss": 0.0833, "loss_nan_ranks": 0, "loss_rank_avg": 0.08697977662086487, "step": 2640, "valid_targets_mean": 2687.1, "valid_targets_min": 579 }, { "epoch": 5.176125244618396, "grad_norm": 0.4281783389607264, "learning_rate": 7.733994673443022e-06, "loss": 0.0747, "loss_nan_ranks": 0, "loss_rank_avg": 0.0809246152639389, "step": 2645, "valid_targets_mean": 3109.3, "valid_targets_min": 826 }, { "epoch": 5.185909980430528, "grad_norm": 0.4700576121724099, "learning_rate": 7.657055387170902e-06, "loss": 0.0695, "loss_nan_ranks": 0, "loss_rank_avg": 0.075184665620327, "step": 2650, "valid_targets_mean": 2657.9, "valid_targets_min": 575 }, { "epoch": 5.195694716242661, "grad_norm": 0.46934057298939746, "learning_rate": 7.580410011816653e-06, "loss": 0.0701, "loss_nan_ranks": 0, "loss_rank_avg": 0.074135422706604, "step": 2655, "valid_targets_mean": 2797.4, "valid_targets_min": 779 }, { "epoch": 5.205479452054795, "grad_norm": 0.4586698081794364, "learning_rate": 7.504060372464441e-06, "loss": 0.0747, "loss_nan_ranks": 0, "loss_rank_avg": 0.0656193196773529, "step": 2660, "valid_targets_mean": 2879.9, "valid_targets_min": 591 }, { "epoch": 5.215264187866928, "grad_norm": 0.42532010620654703, "learning_rate": 7.428008287156323e-06, "loss": 0.0675, "loss_nan_ranks": 0, "loss_rank_avg": 0.06322677433490753, "step": 2665, "valid_targets_mean": 3072.4, "valid_targets_min": 664 }, { "epoch": 5.2250489236790605, "grad_norm": 0.4546147009432678, "learning_rate": 7.352255566849005e-06, "loss": 0.0707, "loss_nan_ranks": 0, "loss_rank_avg": 0.07324878871440887, "step": 2670, "valid_targets_mean": 3465.8, "valid_targets_min": 919 }, { "epoch": 5.234833659491194, "grad_norm": 0.4004826507870159, "learning_rate": 7.276804015370691e-06, "loss": 0.0735, "loss_nan_ranks": 0, "loss_rank_avg": 0.06853301078081131, "step": 2675, "valid_targets_mean": 3300.2, "valid_targets_min": 761 }, { "epoch": 5.244618395303327, "grad_norm": 0.522264738532023, "learning_rate": 7.201655429378118e-06, "loss": 0.0897, "loss_nan_ranks": 0, "loss_rank_avg": 0.11054161190986633, "step": 2680, "valid_targets_mean": 2592.6, "valid_targets_min": 647 }, { "epoch": 5.25440313111546, "grad_norm": 0.5331610897574944, "learning_rate": 7.1268115983138164e-06, "loss": 0.0763, "loss_nan_ranks": 0, "loss_rank_avg": 0.1116286963224411, "step": 2685, "valid_targets_mean": 2340.2, "valid_targets_min": 819 }, { "epoch": 5.2641878669275926, "grad_norm": 0.49689270254400725, "learning_rate": 7.052274304363449e-06, "loss": 0.0759, "loss_nan_ranks": 0, "loss_rank_avg": 0.083046555519104, "step": 2690, "valid_targets_mean": 2871.1, "valid_targets_min": 572 }, { "epoch": 5.273972602739726, "grad_norm": 0.4064264879916974, "learning_rate": 6.978045322413425e-06, "loss": 0.0867, "loss_nan_ranks": 0, "loss_rank_avg": 0.07062041759490967, "step": 2695, "valid_targets_mean": 3404.1, "valid_targets_min": 582 }, { "epoch": 5.283757338551859, "grad_norm": 0.43874521235403546, "learning_rate": 6.904126420008583e-06, "loss": 0.0786, "loss_nan_ranks": 0, "loss_rank_avg": 0.07893872261047363, "step": 2700, "valid_targets_mean": 3099.3, "valid_targets_min": 743 }, { "epoch": 5.293542074363992, "grad_norm": 0.42947030250371915, "learning_rate": 6.830519357310153e-06, "loss": 0.0763, "loss_nan_ranks": 0, "loss_rank_avg": 0.07591693103313446, "step": 2705, "valid_targets_mean": 3025.2, "valid_targets_min": 700 }, { "epoch": 5.3033268101761255, "grad_norm": 0.41983088407002433, "learning_rate": 6.757225887053815e-06, "loss": 0.0765, "loss_nan_ranks": 0, "loss_rank_avg": 0.06995223462581635, "step": 2710, "valid_targets_mean": 3067.0, "valid_targets_min": 844 }, { "epoch": 5.313111545988258, "grad_norm": 0.5065180079964318, "learning_rate": 6.684247754507951e-06, "loss": 0.0747, "loss_nan_ranks": 0, "loss_rank_avg": 0.08915503323078156, "step": 2715, "valid_targets_mean": 2829.2, "valid_targets_min": 663 }, { "epoch": 5.322896281800391, "grad_norm": 0.3514651583143728, "learning_rate": 6.611586697432124e-06, "loss": 0.0678, "loss_nan_ranks": 0, "loss_rank_avg": 0.056846678256988525, "step": 2720, "valid_targets_mean": 3205.9, "valid_targets_min": 726 }, { "epoch": 5.332681017612525, "grad_norm": 0.46576323988464474, "learning_rate": 6.539244446035657e-06, "loss": 0.0823, "loss_nan_ranks": 0, "loss_rank_avg": 0.0915067046880722, "step": 2725, "valid_targets_mean": 3027.2, "valid_targets_min": 885 }, { "epoch": 5.342465753424658, "grad_norm": 0.38295613031553155, "learning_rate": 6.467222722936481e-06, "loss": 0.0765, "loss_nan_ranks": 0, "loss_rank_avg": 0.08527641743421555, "step": 2730, "valid_targets_mean": 3871.1, "valid_targets_min": 1785 }, { "epoch": 5.35225048923679, "grad_norm": 0.48047512841445, "learning_rate": 6.395523243120061e-06, "loss": 0.0743, "loss_nan_ranks": 0, "loss_rank_avg": 0.07413574308156967, "step": 2735, "valid_targets_mean": 2652.9, "valid_targets_min": 559 }, { "epoch": 5.362035225048924, "grad_norm": 0.40613604935428527, "learning_rate": 6.324147713898592e-06, "loss": 0.067, "loss_nan_ranks": 0, "loss_rank_avg": 0.06498594582080841, "step": 2740, "valid_targets_mean": 3446.8, "valid_targets_min": 816 }, { "epoch": 5.371819960861057, "grad_norm": 0.4421159325694742, "learning_rate": 6.253097834870358e-06, "loss": 0.0732, "loss_nan_ranks": 0, "loss_rank_avg": 0.06856618821620941, "step": 2745, "valid_targets_mean": 2949.9, "valid_targets_min": 681 }, { "epoch": 5.38160469667319, "grad_norm": 0.5016463840499853, "learning_rate": 6.1823752978792125e-06, "loss": 0.0754, "loss_nan_ranks": 0, "loss_rank_avg": 0.08905217051506042, "step": 2750, "valid_targets_mean": 2479.9, "valid_targets_min": 342 }, { "epoch": 5.391389432485322, "grad_norm": 0.4924121530285662, "learning_rate": 6.111981786974346e-06, "loss": 0.0808, "loss_nan_ranks": 0, "loss_rank_avg": 0.09011845290660858, "step": 2755, "valid_targets_mean": 2914.0, "valid_targets_min": 744 }, { "epoch": 5.401174168297456, "grad_norm": 0.5061843867577648, "learning_rate": 6.0419189783701514e-06, "loss": 0.0749, "loss_nan_ranks": 0, "loss_rank_avg": 0.08524833619594574, "step": 2760, "valid_targets_mean": 2597.8, "valid_targets_min": 782 }, { "epoch": 5.410958904109589, "grad_norm": 0.48279546078078917, "learning_rate": 5.972188540406312e-06, "loss": 0.0893, "loss_nan_ranks": 0, "loss_rank_avg": 0.09057684987783432, "step": 2765, "valid_targets_mean": 2810.7, "valid_targets_min": 337 }, { "epoch": 5.420743639921722, "grad_norm": 0.4277493595292542, "learning_rate": 5.902792133508095e-06, "loss": 0.0788, "loss_nan_ranks": 0, "loss_rank_avg": 0.06424663215875626, "step": 2770, "valid_targets_mean": 3190.0, "valid_targets_min": 676 }, { "epoch": 5.430528375733855, "grad_norm": 0.5086478426477666, "learning_rate": 5.833731410146786e-06, "loss": 0.078, "loss_nan_ranks": 0, "loss_rank_avg": 0.07968039065599442, "step": 2775, "valid_targets_mean": 2663.5, "valid_targets_min": 652 }, { "epoch": 5.440313111545988, "grad_norm": 0.5557090459869544, "learning_rate": 5.765008014800375e-06, "loss": 0.0702, "loss_nan_ranks": 0, "loss_rank_avg": 0.08440135419368744, "step": 2780, "valid_targets_mean": 2660.8, "valid_targets_min": 324 }, { "epoch": 5.450097847358121, "grad_norm": 0.3792929646660218, "learning_rate": 5.6966235839143495e-06, "loss": 0.0738, "loss_nan_ranks": 0, "loss_rank_avg": 0.08909265697002411, "step": 2785, "valid_targets_mean": 3611.2, "valid_targets_min": 1122 }, { "epoch": 5.459882583170255, "grad_norm": 0.45468140912134825, "learning_rate": 5.628579745862777e-06, "loss": 0.0758, "loss_nan_ranks": 0, "loss_rank_avg": 0.07230260968208313, "step": 2790, "valid_targets_mean": 2914.3, "valid_targets_min": 323 }, { "epoch": 5.4696673189823874, "grad_norm": 0.4473717214046915, "learning_rate": 5.560878120909512e-06, "loss": 0.0739, "loss_nan_ranks": 0, "loss_rank_avg": 0.0659240335226059, "step": 2795, "valid_targets_mean": 3016.2, "valid_targets_min": 716 }, { "epoch": 5.47945205479452, "grad_norm": 0.3767059140003713, "learning_rate": 5.493520321169587e-06, "loss": 0.0815, "loss_nan_ranks": 0, "loss_rank_avg": 0.06713557243347168, "step": 2800, "valid_targets_mean": 3682.9, "valid_targets_min": 1875 }, { "epoch": 5.489236790606654, "grad_norm": 0.4532874827402321, "learning_rate": 5.426507950570874e-06, "loss": 0.0796, "loss_nan_ranks": 0, "loss_rank_avg": 0.08205291628837585, "step": 2805, "valid_targets_mean": 3044.5, "valid_targets_min": 714 }, { "epoch": 5.499021526418787, "grad_norm": 0.5602610792291699, "learning_rate": 5.359842604815853e-06, "loss": 0.0781, "loss_nan_ranks": 0, "loss_rank_avg": 0.0752958208322525, "step": 2810, "valid_targets_mean": 2457.2, "valid_targets_min": 801 }, { "epoch": 5.5088062622309195, "grad_norm": 0.40646962416999005, "learning_rate": 5.293525871343619e-06, "loss": 0.0772, "loss_nan_ranks": 0, "loss_rank_avg": 0.06652592867612839, "step": 2815, "valid_targets_mean": 3495.7, "valid_targets_min": 761 }, { "epoch": 5.518590998043053, "grad_norm": 0.45587818448470707, "learning_rate": 5.227559329292115e-06, "loss": 0.0886, "loss_nan_ranks": 0, "loss_rank_avg": 0.07505495846271515, "step": 2820, "valid_targets_mean": 2507.4, "valid_targets_min": 665 }, { "epoch": 5.528375733855186, "grad_norm": 0.5332414159903734, "learning_rate": 5.161944549460483e-06, "loss": 0.0791, "loss_nan_ranks": 0, "loss_rank_avg": 0.08048176765441895, "step": 2825, "valid_targets_mean": 2633.4, "valid_targets_min": 622 }, { "epoch": 5.538160469667319, "grad_norm": 0.5913396187384118, "learning_rate": 5.096683094271702e-06, "loss": 0.0823, "loss_nan_ranks": 0, "loss_rank_avg": 0.09726202487945557, "step": 2830, "valid_targets_mean": 2740.9, "valid_targets_min": 531 }, { "epoch": 5.5479452054794525, "grad_norm": 0.39863791888320843, "learning_rate": 5.031776517735341e-06, "loss": 0.0654, "loss_nan_ranks": 0, "loss_rank_avg": 0.05999351665377617, "step": 2835, "valid_targets_mean": 3267.8, "valid_targets_min": 732 }, { "epoch": 5.557729941291585, "grad_norm": 0.4516136822713863, "learning_rate": 4.967226365410598e-06, "loss": 0.0805, "loss_nan_ranks": 0, "loss_rank_avg": 0.07914609462022781, "step": 2840, "valid_targets_mean": 2839.3, "valid_targets_min": 945 }, { "epoch": 5.567514677103718, "grad_norm": 0.42885281973077843, "learning_rate": 4.903034174369477e-06, "loss": 0.0741, "loss_nan_ranks": 0, "loss_rank_avg": 0.08505196124315262, "step": 2845, "valid_targets_mean": 3390.4, "valid_targets_min": 807 }, { "epoch": 5.577299412915851, "grad_norm": 0.40360506605925617, "learning_rate": 4.839201473160162e-06, "loss": 0.0652, "loss_nan_ranks": 0, "loss_rank_avg": 0.05721169710159302, "step": 2850, "valid_targets_mean": 2749.6, "valid_targets_min": 583 }, { "epoch": 5.5870841487279845, "grad_norm": 0.4655567417756694, "learning_rate": 4.775729781770682e-06, "loss": 0.0837, "loss_nan_ranks": 0, "loss_rank_avg": 0.0737919956445694, "step": 2855, "valid_targets_mean": 3181.2, "valid_targets_min": 831 }, { "epoch": 5.596868884540117, "grad_norm": 0.45830977254087935, "learning_rate": 4.7126206115926375e-06, "loss": 0.0648, "loss_nan_ranks": 0, "loss_rank_avg": 0.06951932609081268, "step": 2860, "valid_targets_mean": 2819.4, "valid_targets_min": 474 }, { "epoch": 5.60665362035225, "grad_norm": 0.4894743876633723, "learning_rate": 4.649875465385294e-06, "loss": 0.0834, "loss_nan_ranks": 0, "loss_rank_avg": 0.08948928862810135, "step": 2865, "valid_targets_mean": 2493.1, "valid_targets_min": 693 }, { "epoch": 5.616438356164384, "grad_norm": 0.4244925832158591, "learning_rate": 4.587495837239722e-06, "loss": 0.083, "loss_nan_ranks": 0, "loss_rank_avg": 0.06952004879713058, "step": 2870, "valid_targets_mean": 3181.3, "valid_targets_min": 719 }, { "epoch": 5.626223091976517, "grad_norm": 0.40823168515859165, "learning_rate": 4.525483212543273e-06, "loss": 0.0797, "loss_nan_ranks": 0, "loss_rank_avg": 0.06525617837905884, "step": 2875, "valid_targets_mean": 3030.6, "valid_targets_min": 908 }, { "epoch": 5.636007827788649, "grad_norm": 0.4223584270445933, "learning_rate": 4.463839067944196e-06, "loss": 0.0744, "loss_nan_ranks": 0, "loss_rank_avg": 0.07718521356582642, "step": 2880, "valid_targets_mean": 3210.1, "valid_targets_min": 516 }, { "epoch": 5.645792563600783, "grad_norm": 0.4102616492959249, "learning_rate": 4.402564871316455e-06, "loss": 0.0777, "loss_nan_ranks": 0, "loss_rank_avg": 0.05997679382562637, "step": 2885, "valid_targets_mean": 3926.1, "valid_targets_min": 329 }, { "epoch": 5.655577299412916, "grad_norm": 0.4603342285016962, "learning_rate": 4.341662081724794e-06, "loss": 0.0739, "loss_nan_ranks": 0, "loss_rank_avg": 0.07202913612127304, "step": 2890, "valid_targets_mean": 2729.5, "valid_targets_min": 536 }, { "epoch": 5.665362035225049, "grad_norm": 0.6329113399161261, "learning_rate": 4.281132149390004e-06, "loss": 0.073, "loss_nan_ranks": 0, "loss_rank_avg": 0.08393596112728119, "step": 2895, "valid_targets_mean": 2008.6, "valid_targets_min": 567 }, { "epoch": 5.675146771037182, "grad_norm": 0.4694934388592357, "learning_rate": 4.220976515654358e-06, "loss": 0.0769, "loss_nan_ranks": 0, "loss_rank_avg": 0.08040758222341537, "step": 2900, "valid_targets_mean": 2670.1, "valid_targets_min": 613 }, { "epoch": 5.684931506849315, "grad_norm": 0.3448575873042548, "learning_rate": 4.1611966129473336e-06, "loss": 0.0702, "loss_nan_ranks": 0, "loss_rank_avg": 0.051838748157024384, "step": 2905, "valid_targets_mean": 3567.4, "valid_targets_min": 1293 }, { "epoch": 5.694716242661448, "grad_norm": 0.45465205799302394, "learning_rate": 4.101793864751449e-06, "loss": 0.0817, "loss_nan_ranks": 0, "loss_rank_avg": 0.09528183937072754, "step": 2910, "valid_targets_mean": 2994.5, "valid_targets_min": 848 }, { "epoch": 5.704500978473581, "grad_norm": 0.4707601342793054, "learning_rate": 4.0427696855684266e-06, "loss": 0.0745, "loss_nan_ranks": 0, "loss_rank_avg": 0.07119297236204147, "step": 2915, "valid_targets_mean": 2591.8, "valid_targets_min": 393 }, { "epoch": 5.714285714285714, "grad_norm": 0.4030225676073155, "learning_rate": 3.984125480885455e-06, "loss": 0.0702, "loss_nan_ranks": 0, "loss_rank_avg": 0.06661651283502579, "step": 2920, "valid_targets_mean": 3427.6, "valid_targets_min": 1524 }, { "epoch": 5.724070450097847, "grad_norm": 0.5059078539553407, "learning_rate": 3.925862647141769e-06, "loss": 0.0779, "loss_nan_ranks": 0, "loss_rank_avg": 0.07960377633571625, "step": 2925, "valid_targets_mean": 2849.5, "valid_targets_min": 784 }, { "epoch": 5.733855185909981, "grad_norm": 0.44174550198775075, "learning_rate": 3.867982571695372e-06, "loss": 0.0753, "loss_nan_ranks": 0, "loss_rank_avg": 0.0717354342341423, "step": 2930, "valid_targets_mean": 3005.4, "valid_targets_min": 799 }, { "epoch": 5.743639921722114, "grad_norm": 0.4890108032015441, "learning_rate": 3.810486632789987e-06, "loss": 0.0774, "loss_nan_ranks": 0, "loss_rank_avg": 0.09158261865377426, "step": 2935, "valid_targets_mean": 3100.3, "valid_targets_min": 790 }, { "epoch": 5.7534246575342465, "grad_norm": 0.4451920276397767, "learning_rate": 3.753376199522285e-06, "loss": 0.0747, "loss_nan_ranks": 0, "loss_rank_avg": 0.06903664767742157, "step": 2940, "valid_targets_mean": 2797.9, "valid_targets_min": 599 }, { "epoch": 5.763209393346379, "grad_norm": 0.5124581684682721, "learning_rate": 3.696652631809221e-06, "loss": 0.0719, "loss_nan_ranks": 0, "loss_rank_avg": 0.07900827378034592, "step": 2945, "valid_targets_mean": 2342.2, "valid_targets_min": 619 }, { "epoch": 5.772994129158513, "grad_norm": 0.4517907195455391, "learning_rate": 3.640317280355712e-06, "loss": 0.074, "loss_nan_ranks": 0, "loss_rank_avg": 0.06947002559900284, "step": 2950, "valid_targets_mean": 2831.8, "valid_targets_min": 961 }, { "epoch": 5.782778864970646, "grad_norm": 0.40988865690038767, "learning_rate": 3.5843714866224376e-06, "loss": 0.0801, "loss_nan_ranks": 0, "loss_rank_avg": 0.07078046351671219, "step": 2955, "valid_targets_mean": 3242.0, "valid_targets_min": 1131 }, { "epoch": 5.7925636007827785, "grad_norm": 0.3907386140442345, "learning_rate": 3.528816582793899e-06, "loss": 0.067, "loss_nan_ranks": 0, "loss_rank_avg": 0.060267020016908646, "step": 2960, "valid_targets_mean": 3141.2, "valid_targets_min": 702 }, { "epoch": 5.802348336594912, "grad_norm": 0.4028211436491414, "learning_rate": 3.4736538917467222e-06, "loss": 0.0749, "loss_nan_ranks": 0, "loss_rank_avg": 0.07580472528934479, "step": 2965, "valid_targets_mean": 3886.1, "valid_targets_min": 990 }, { "epoch": 5.812133072407045, "grad_norm": 0.41123716912616415, "learning_rate": 3.418884727018108e-06, "loss": 0.071, "loss_nan_ranks": 0, "loss_rank_avg": 0.06308360397815704, "step": 2970, "valid_targets_mean": 2827.6, "valid_targets_min": 719 }, { "epoch": 5.821917808219178, "grad_norm": 0.4472389010099648, "learning_rate": 3.364510392774616e-06, "loss": 0.0832, "loss_nan_ranks": 0, "loss_rank_avg": 0.07658056914806366, "step": 2975, "valid_targets_mean": 2843.1, "valid_targets_min": 604 }, { "epoch": 5.8317025440313115, "grad_norm": 0.4451983511580819, "learning_rate": 3.3105321837810722e-06, "loss": 0.0748, "loss_nan_ranks": 0, "loss_rank_avg": 0.07372932881116867, "step": 2980, "valid_targets_mean": 3195.2, "valid_targets_min": 759 }, { "epoch": 5.841487279843444, "grad_norm": 0.46011692123417103, "learning_rate": 3.2569513853697333e-06, "loss": 0.0755, "loss_nan_ranks": 0, "loss_rank_avg": 0.07479192316532135, "step": 2985, "valid_targets_mean": 3105.9, "valid_targets_min": 736 }, { "epoch": 5.851272015655577, "grad_norm": 0.6002060396100081, "learning_rate": 3.203769273409707e-06, "loss": 0.0788, "loss_nan_ranks": 0, "loss_rank_avg": 0.11194086074829102, "step": 2990, "valid_targets_mean": 2463.3, "valid_targets_min": 614 }, { "epoch": 5.861056751467711, "grad_norm": 0.4753432159430569, "learning_rate": 3.1509871142765423e-06, "loss": 0.0807, "loss_nan_ranks": 0, "loss_rank_avg": 0.09354139864444733, "step": 2995, "valid_targets_mean": 2870.1, "valid_targets_min": 472 }, { "epoch": 5.870841487279844, "grad_norm": 0.48413719078598255, "learning_rate": 3.0986061648221e-06, "loss": 0.072, "loss_nan_ranks": 0, "loss_rank_avg": 0.08323981612920761, "step": 3000, "valid_targets_mean": 2966.8, "valid_targets_min": 953 }, { "epoch": 5.880626223091976, "grad_norm": 0.4569897092743185, "learning_rate": 3.046627672344602e-06, "loss": 0.0817, "loss_nan_ranks": 0, "loss_rank_avg": 0.07903550565242767, "step": 3005, "valid_targets_mean": 2830.2, "valid_targets_min": 747 }, { "epoch": 5.890410958904109, "grad_norm": 0.462909444059214, "learning_rate": 2.99505287455895e-06, "loss": 0.076, "loss_nan_ranks": 0, "loss_rank_avg": 0.06472785770893097, "step": 3010, "valid_targets_mean": 2494.8, "valid_targets_min": 715 }, { "epoch": 5.900195694716243, "grad_norm": 0.4807548754280305, "learning_rate": 2.9438829995672446e-06, "loss": 0.0846, "loss_nan_ranks": 0, "loss_rank_avg": 0.09636728465557098, "step": 3015, "valid_targets_mean": 3200.9, "valid_targets_min": 823 }, { "epoch": 5.909980430528376, "grad_norm": 0.4374839076350857, "learning_rate": 2.893119265829527e-06, "loss": 0.0754, "loss_nan_ranks": 0, "loss_rank_avg": 0.07287952303886414, "step": 3020, "valid_targets_mean": 2857.5, "valid_targets_min": 697 }, { "epoch": 5.919765166340508, "grad_norm": 0.5220099840364439, "learning_rate": 2.8427628821347997e-06, "loss": 0.0725, "loss_nan_ranks": 0, "loss_rank_avg": 0.09079423546791077, "step": 3025, "valid_targets_mean": 2285.8, "valid_targets_min": 518 }, { "epoch": 5.929549902152642, "grad_norm": 0.5213731033603919, "learning_rate": 2.7928150475722015e-06, "loss": 0.0676, "loss_nan_ranks": 0, "loss_rank_avg": 0.07722978293895721, "step": 3030, "valid_targets_mean": 2516.9, "valid_targets_min": 525 }, { "epoch": 5.939334637964775, "grad_norm": 0.5552580974539469, "learning_rate": 2.7432769515024917e-06, "loss": 0.0745, "loss_nan_ranks": 0, "loss_rank_avg": 0.0762719139456749, "step": 3035, "valid_targets_mean": 2393.5, "valid_targets_min": 559 }, { "epoch": 5.949119373776908, "grad_norm": 0.5116590588913543, "learning_rate": 2.694149773529715e-06, "loss": 0.0836, "loss_nan_ranks": 0, "loss_rank_avg": 0.06904571503400803, "step": 3040, "valid_targets_mean": 3790.9, "valid_targets_min": 1400 }, { "epoch": 5.958904109589041, "grad_norm": 0.4453120019573562, "learning_rate": 2.6454346834730826e-06, "loss": 0.0916, "loss_nan_ranks": 0, "loss_rank_avg": 0.07235158234834671, "step": 3045, "valid_targets_mean": 2963.2, "valid_targets_min": 756 }, { "epoch": 5.968688845401174, "grad_norm": 0.5147122188137311, "learning_rate": 2.5971328413391805e-06, "loss": 0.0825, "loss_nan_ranks": 0, "loss_rank_avg": 0.07566611468791962, "step": 3050, "valid_targets_mean": 2326.0, "valid_targets_min": 569 }, { "epoch": 5.978473581213307, "grad_norm": 0.40827862937111237, "learning_rate": 2.549245397294282e-06, "loss": 0.0725, "loss_nan_ranks": 0, "loss_rank_avg": 0.06662864983081818, "step": 3055, "valid_targets_mean": 3237.1, "valid_targets_min": 471 }, { "epoch": 5.988258317025441, "grad_norm": 0.5107580927974414, "learning_rate": 2.5017734916370073e-06, "loss": 0.0724, "loss_nan_ranks": 0, "loss_rank_avg": 0.0984416976571083, "step": 3060, "valid_targets_mean": 3002.3, "valid_targets_min": 701 }, { "epoch": 5.998043052837573, "grad_norm": 0.501114134610983, "learning_rate": 2.454718254771149e-06, "loss": 0.084, "loss_nan_ranks": 0, "loss_rank_avg": 0.08588661998510361, "step": 3065, "valid_targets_mean": 2286.1, "valid_targets_min": 526 }, { "epoch": 6.007827788649706, "grad_norm": 0.44192958420733774, "learning_rate": 2.4080808071787475e-06, "loss": 0.0665, "loss_nan_ranks": 0, "loss_rank_avg": 0.07303124666213989, "step": 3070, "valid_targets_mean": 2771.9, "valid_targets_min": 482 }, { "epoch": 6.01761252446184, "grad_norm": 0.43635614879975476, "learning_rate": 2.361862259393437e-06, "loss": 0.0757, "loss_nan_ranks": 0, "loss_rank_avg": 0.0739935114979744, "step": 3075, "valid_targets_mean": 3080.9, "valid_targets_min": 687 }, { "epoch": 6.027397260273973, "grad_norm": 0.43422797068567826, "learning_rate": 2.316063711973966e-06, "loss": 0.0676, "loss_nan_ranks": 0, "loss_rank_avg": 0.0661170482635498, "step": 3080, "valid_targets_mean": 3041.1, "valid_targets_min": 599 }, { "epoch": 6.0371819960861055, "grad_norm": 0.4754450126513109, "learning_rate": 2.270686255478025e-06, "loss": 0.0637, "loss_nan_ranks": 0, "loss_rank_avg": 0.07159139215946198, "step": 3085, "valid_targets_mean": 2441.1, "valid_targets_min": 592 }, { "epoch": 6.046966731898239, "grad_norm": 0.4981193042856778, "learning_rate": 2.225730970436264e-06, "loss": 0.062, "loss_nan_ranks": 0, "loss_rank_avg": 0.07770034670829773, "step": 3090, "valid_targets_mean": 2525.2, "valid_targets_min": 689 }, { "epoch": 6.056751467710372, "grad_norm": 0.49360571619910937, "learning_rate": 2.1811989273265464e-06, "loss": 0.07, "loss_nan_ranks": 0, "loss_rank_avg": 0.07154182344675064, "step": 3095, "valid_targets_mean": 2613.0, "valid_targets_min": 752 }, { "epoch": 6.066536203522505, "grad_norm": 0.4828277732842118, "learning_rate": 2.13709118654849e-06, "loss": 0.0838, "loss_nan_ranks": 0, "loss_rank_avg": 0.07128246128559113, "step": 3100, "valid_targets_mean": 2490.1, "valid_targets_min": 621 }, { "epoch": 6.076320939334638, "grad_norm": 0.41670521030012386, "learning_rate": 2.0934087983981865e-06, "loss": 0.0698, "loss_nan_ranks": 0, "loss_rank_avg": 0.060906365513801575, "step": 3105, "valid_targets_mean": 2875.4, "valid_targets_min": 583 }, { "epoch": 6.086105675146771, "grad_norm": 0.6321266492958042, "learning_rate": 2.0501528030432193e-06, "loss": 0.0718, "loss_nan_ranks": 0, "loss_rank_avg": 0.0788595974445343, "step": 3110, "valid_targets_mean": 2716.3, "valid_targets_min": 683 }, { "epoch": 6.095890410958904, "grad_norm": 0.42036326945027286, "learning_rate": 2.0073242304978714e-06, "loss": 0.0695, "loss_nan_ranks": 0, "loss_rank_avg": 0.058495331555604935, "step": 3115, "valid_targets_mean": 3160.2, "valid_targets_min": 915 }, { "epoch": 6.105675146771037, "grad_norm": 0.4576932419686335, "learning_rate": 1.9649241005986196e-06, "loss": 0.0683, "loss_nan_ranks": 0, "loss_rank_avg": 0.07226675748825073, "step": 3120, "valid_targets_mean": 2632.1, "valid_targets_min": 717 }, { "epoch": 6.1154598825831705, "grad_norm": 0.4238466831137611, "learning_rate": 1.92295342297983e-06, "loss": 0.0609, "loss_nan_ranks": 0, "loss_rank_avg": 0.05905325710773468, "step": 3125, "valid_targets_mean": 3000.3, "valid_targets_min": 523 }, { "epoch": 6.125244618395303, "grad_norm": 0.45936995523354823, "learning_rate": 1.881413197049722e-06, "loss": 0.09, "loss_nan_ranks": 0, "loss_rank_avg": 0.08321767300367355, "step": 3130, "valid_targets_mean": 3155.2, "valid_targets_min": 764 }, { "epoch": 6.135029354207436, "grad_norm": 0.40115814381067516, "learning_rate": 1.840304411966587e-06, "loss": 0.0684, "loss_nan_ranks": 0, "loss_rank_avg": 0.058111824095249176, "step": 3135, "valid_targets_mean": 3388.8, "valid_targets_min": 542 }, { "epoch": 6.14481409001957, "grad_norm": 0.40435655215447924, "learning_rate": 1.7996280466152206e-06, "loss": 0.0642, "loss_nan_ranks": 0, "loss_rank_avg": 0.06856388598680496, "step": 3140, "valid_targets_mean": 3130.8, "valid_targets_min": 474 }, { "epoch": 6.154598825831703, "grad_norm": 0.4650210024055785, "learning_rate": 1.7593850695836012e-06, "loss": 0.073, "loss_nan_ranks": 0, "loss_rank_avg": 0.08073366433382034, "step": 3145, "valid_targets_mean": 2809.2, "valid_targets_min": 518 }, { "epoch": 6.164383561643835, "grad_norm": 0.47086624358290463, "learning_rate": 1.719576439139854e-06, "loss": 0.0638, "loss_nan_ranks": 0, "loss_rank_avg": 0.06494764238595963, "step": 3150, "valid_targets_mean": 2855.2, "valid_targets_min": 529 }, { "epoch": 6.174168297455969, "grad_norm": 0.44044476778002606, "learning_rate": 1.6802031032094079e-06, "loss": 0.0715, "loss_nan_ranks": 0, "loss_rank_avg": 0.062370240688323975, "step": 3155, "valid_targets_mean": 2845.0, "valid_targets_min": 526 }, { "epoch": 6.183953033268102, "grad_norm": 0.5499889346906841, "learning_rate": 1.6412659993524416e-06, "loss": 0.0759, "loss_nan_ranks": 0, "loss_rank_avg": 0.10551338642835617, "step": 3160, "valid_targets_mean": 2796.4, "valid_targets_min": 647 }, { "epoch": 6.193737769080235, "grad_norm": 0.3840436421973751, "learning_rate": 1.602766054741538e-06, "loss": 0.0707, "loss_nan_ranks": 0, "loss_rank_avg": 0.06305300444364548, "step": 3165, "valid_targets_mean": 3447.1, "valid_targets_min": 985 }, { "epoch": 6.2035225048923675, "grad_norm": 0.46815680240348373, "learning_rate": 1.564704186139634e-06, "loss": 0.0692, "loss_nan_ranks": 0, "loss_rank_avg": 0.07610894739627838, "step": 3170, "valid_targets_mean": 3054.6, "valid_targets_min": 766 }, { "epoch": 6.213307240704501, "grad_norm": 0.47070496004221424, "learning_rate": 1.5270812998781658e-06, "loss": 0.0747, "loss_nan_ranks": 0, "loss_rank_avg": 0.07871316373348236, "step": 3175, "valid_targets_mean": 3014.9, "valid_targets_min": 753 }, { "epoch": 6.223091976516634, "grad_norm": 0.40290413823371585, "learning_rate": 1.4898982918354942e-06, "loss": 0.0662, "loss_nan_ranks": 0, "loss_rank_avg": 0.05782357230782509, "step": 3180, "valid_targets_mean": 3368.4, "valid_targets_min": 457 }, { "epoch": 6.232876712328767, "grad_norm": 0.41283880434326553, "learning_rate": 1.4531560474155849e-06, "loss": 0.0771, "loss_nan_ranks": 0, "loss_rank_avg": 0.061546504497528076, "step": 3185, "valid_targets_mean": 3097.3, "valid_targets_min": 669 }, { "epoch": 6.2426614481409, "grad_norm": 0.4529313049393873, "learning_rate": 1.4168554415268987e-06, "loss": 0.0849, "loss_nan_ranks": 0, "loss_rank_avg": 0.10040386766195297, "step": 3190, "valid_targets_mean": 3039.8, "valid_targets_min": 337 }, { "epoch": 6.252446183953033, "grad_norm": 0.5206840406534334, "learning_rate": 1.3809973385615916e-06, "loss": 0.0696, "loss_nan_ranks": 0, "loss_rank_avg": 0.07968272268772125, "step": 3195, "valid_targets_mean": 2537.8, "valid_targets_min": 647 }, { "epoch": 6.262230919765166, "grad_norm": 0.4212637058908629, "learning_rate": 1.345582592374901e-06, "loss": 0.0622, "loss_nan_ranks": 0, "loss_rank_avg": 0.056147150695323944, "step": 3200, "valid_targets_mean": 2918.4, "valid_targets_min": 745 }, { "epoch": 6.2720156555773, "grad_norm": 0.42506169113076164, "learning_rate": 1.3106120462648275e-06, "loss": 0.0728, "loss_nan_ranks": 0, "loss_rank_avg": 0.06854747235774994, "step": 3205, "valid_targets_mean": 3473.9, "valid_targets_min": 767 }, { "epoch": 6.2818003913894325, "grad_norm": 0.4367962042686225, "learning_rate": 1.2760865329520655e-06, "loss": 0.0719, "loss_nan_ranks": 0, "loss_rank_avg": 0.06835062801837921, "step": 3210, "valid_targets_mean": 3223.1, "valid_targets_min": 847 }, { "epoch": 6.291585127201565, "grad_norm": 0.5787526761733716, "learning_rate": 1.2420068745601466e-06, "loss": 0.077, "loss_nan_ranks": 0, "loss_rank_avg": 0.08949454128742218, "step": 3215, "valid_targets_mean": 2135.1, "valid_targets_min": 614 }, { "epoch": 6.301369863013699, "grad_norm": 0.4526991495398931, "learning_rate": 1.208373882595888e-06, "loss": 0.0816, "loss_nan_ranks": 0, "loss_rank_avg": 0.06896747648715973, "step": 3220, "valid_targets_mean": 3314.7, "valid_targets_min": 533 }, { "epoch": 6.311154598825832, "grad_norm": 0.45990264333851216, "learning_rate": 1.1751883579300638e-06, "loss": 0.0665, "loss_nan_ranks": 0, "loss_rank_avg": 0.06581242382526398, "step": 3225, "valid_targets_mean": 2982.8, "valid_targets_min": 580 }, { "epoch": 6.3209393346379645, "grad_norm": 0.4957572419180614, "learning_rate": 1.142451090778316e-06, "loss": 0.0694, "loss_nan_ranks": 0, "loss_rank_avg": 0.0708361566066742, "step": 3230, "valid_targets_mean": 2542.9, "valid_targets_min": 458 }, { "epoch": 6.330724070450098, "grad_norm": 0.4311209078972947, "learning_rate": 1.1101628606823712e-06, "loss": 0.0691, "loss_nan_ranks": 0, "loss_rank_avg": 0.07917267084121704, "step": 3235, "valid_targets_mean": 3413.6, "valid_targets_min": 1167 }, { "epoch": 6.340508806262231, "grad_norm": 0.5037246170434637, "learning_rate": 1.0783244364914424e-06, "loss": 0.0698, "loss_nan_ranks": 0, "loss_rank_avg": 0.07734787464141846, "step": 3240, "valid_targets_mean": 2585.9, "valid_targets_min": 544 }, { "epoch": 6.350293542074364, "grad_norm": 0.4115960837292546, "learning_rate": 1.0469365763439532e-06, "loss": 0.0716, "loss_nan_ranks": 0, "loss_rank_avg": 0.05661565810441971, "step": 3245, "valid_targets_mean": 2866.4, "valid_targets_min": 609 }, { "epoch": 6.3600782778864975, "grad_norm": 0.453432086965716, "learning_rate": 1.016000027649453e-06, "loss": 0.0676, "loss_nan_ranks": 0, "loss_rank_avg": 0.06349624693393707, "step": 3250, "valid_targets_mean": 2563.8, "valid_targets_min": 818 }, { "epoch": 6.36986301369863, "grad_norm": 0.4503359296980998, "learning_rate": 9.855155270708505e-07, "loss": 0.0635, "loss_nan_ranks": 0, "loss_rank_avg": 0.06908641755580902, "step": 3255, "valid_targets_mean": 3333.1, "valid_targets_min": 884 }, { "epoch": 6.379647749510763, "grad_norm": 0.4427969727086593, "learning_rate": 9.554838005068578e-07, "loss": 0.0728, "loss_nan_ranks": 0, "loss_rank_avg": 0.06669929623603821, "step": 3260, "valid_targets_mean": 2871.0, "valid_targets_min": 754 }, { "epoch": 6.389432485322896, "grad_norm": 0.382983514257635, "learning_rate": 9.259055630746939e-07, "loss": 0.0689, "loss_nan_ranks": 0, "loss_rank_avg": 0.061314281076192856, "step": 3265, "valid_targets_mean": 3473.1, "valid_targets_min": 798 }, { "epoch": 6.3992172211350296, "grad_norm": 0.4697420687550243, "learning_rate": 8.96781519093084e-07, "loss": 0.0676, "loss_nan_ranks": 0, "loss_rank_avg": 0.06169832870364189, "step": 3270, "valid_targets_mean": 2443.7, "valid_targets_min": 582 }, { "epoch": 6.409001956947162, "grad_norm": 0.4143290111512886, "learning_rate": 8.681123620654563e-07, "loss": 0.0825, "loss_nan_ranks": 0, "loss_rank_avg": 0.06625143438577652, "step": 3275, "valid_targets_mean": 3436.2, "valid_targets_min": 970 }, { "epoch": 6.418786692759295, "grad_norm": 0.484009641221671, "learning_rate": 8.398987746634546e-07, "loss": 0.0782, "loss_nan_ranks": 0, "loss_rank_avg": 0.06878200173377991, "step": 3280, "valid_targets_mean": 3051.4, "valid_targets_min": 497 }, { "epoch": 6.428571428571429, "grad_norm": 0.4403520522409024, "learning_rate": 8.121414287106711e-07, "loss": 0.07, "loss_nan_ranks": 0, "loss_rank_avg": 0.06902438402175903, "step": 3285, "valid_targets_mean": 3071.1, "valid_targets_min": 526 }, { "epoch": 6.438356164383562, "grad_norm": 0.4799058710132896, "learning_rate": 7.848409851666461e-07, "loss": 0.0759, "loss_nan_ranks": 0, "loss_rank_avg": 0.0697348341345787, "step": 3290, "valid_targets_mean": 3066.8, "valid_targets_min": 1083 }, { "epoch": 6.448140900195694, "grad_norm": 0.5018899520017504, "learning_rate": 7.579980941111387e-07, "loss": 0.0678, "loss_nan_ranks": 0, "loss_rank_avg": 0.08869493752717972, "step": 3295, "valid_targets_mean": 2888.8, "valid_targets_min": 716 }, { "epoch": 6.457925636007828, "grad_norm": 0.5397448470834869, "learning_rate": 7.316133947286342e-07, "loss": 0.0706, "loss_nan_ranks": 0, "loss_rank_avg": 0.09075383841991425, "step": 3300, "valid_targets_mean": 2435.1, "valid_targets_min": 459 }, { "epoch": 6.467710371819961, "grad_norm": 0.4343565829140892, "learning_rate": 7.056875152931386e-07, "loss": 0.0701, "loss_nan_ranks": 0, "loss_rank_avg": 0.06514838337898254, "step": 3305, "valid_targets_mean": 3577.0, "valid_targets_min": 884 }, { "epoch": 6.477495107632094, "grad_norm": 0.437505635101395, "learning_rate": 6.802210731532066e-07, "loss": 0.0703, "loss_nan_ranks": 0, "loss_rank_avg": 0.0722024068236351, "step": 3310, "valid_targets_mean": 3294.1, "valid_targets_min": 540 }, { "epoch": 6.487279843444227, "grad_norm": 0.43250932688840876, "learning_rate": 6.552146747172416e-07, "loss": 0.0669, "loss_nan_ranks": 0, "loss_rank_avg": 0.06441313028335571, "step": 3315, "valid_targets_mean": 3179.9, "valid_targets_min": 665 }, { "epoch": 6.49706457925636, "grad_norm": 0.5306303137510542, "learning_rate": 6.3066891543907e-07, "loss": 0.069, "loss_nan_ranks": 0, "loss_rank_avg": 0.08177472651004791, "step": 3320, "valid_targets_mean": 2607.1, "valid_targets_min": 376 }, { "epoch": 6.506849315068493, "grad_norm": 0.4645763344346858, "learning_rate": 6.065843798037362e-07, "loss": 0.0766, "loss_nan_ranks": 0, "loss_rank_avg": 0.07787041366100311, "step": 3325, "valid_targets_mean": 3014.7, "valid_targets_min": 507 }, { "epoch": 6.516634050880626, "grad_norm": 0.46590886033192663, "learning_rate": 5.829616413136196e-07, "loss": 0.0686, "loss_nan_ranks": 0, "loss_rank_avg": 0.0689203292131424, "step": 3330, "valid_targets_mean": 2799.1, "valid_targets_min": 516 }, { "epoch": 6.526418786692759, "grad_norm": 0.5280078983823107, "learning_rate": 5.598012624747396e-07, "loss": 0.0718, "loss_nan_ranks": 0, "loss_rank_avg": 0.08582378178834915, "step": 3335, "valid_targets_mean": 2405.5, "valid_targets_min": 580 }, { "epoch": 6.536203522504892, "grad_norm": 0.4094668239027261, "learning_rate": 5.371037947833935e-07, "loss": 0.0608, "loss_nan_ranks": 0, "loss_rank_avg": 0.05724884569644928, "step": 3340, "valid_targets_mean": 3165.3, "valid_targets_min": 673 }, { "epoch": 6.545988258317026, "grad_norm": 0.3927725451944761, "learning_rate": 5.148697787130097e-07, "loss": 0.0707, "loss_nan_ranks": 0, "loss_rank_avg": 0.06178641691803932, "step": 3345, "valid_targets_mean": 3628.3, "valid_targets_min": 641 }, { "epoch": 6.555772994129159, "grad_norm": 0.4402791629455773, "learning_rate": 4.930997437012708e-07, "loss": 0.073, "loss_nan_ranks": 0, "loss_rank_avg": 0.0625002384185791, "step": 3350, "valid_targets_mean": 2967.3, "valid_targets_min": 623 }, { "epoch": 6.5655577299412915, "grad_norm": 0.44037028426323266, "learning_rate": 4.7179420813752817e-07, "loss": 0.0787, "loss_nan_ranks": 0, "loss_rank_avg": 0.08126027137041092, "step": 3355, "valid_targets_mean": 3116.8, "valid_targets_min": 756 }, { "epoch": 6.575342465753424, "grad_norm": 0.43892558836696705, "learning_rate": 4.5095367935043654e-07, "loss": 0.0671, "loss_nan_ranks": 0, "loss_rank_avg": 0.07232559472322464, "step": 3360, "valid_targets_mean": 3449.4, "valid_targets_min": 856 }, { "epoch": 6.585127201565558, "grad_norm": 0.4451158102887051, "learning_rate": 4.3057865359588336e-07, "loss": 0.0815, "loss_nan_ranks": 0, "loss_rank_avg": 0.06538708508014679, "step": 3365, "valid_targets_mean": 2891.5, "valid_targets_min": 593 }, { "epoch": 6.594911937377691, "grad_norm": 0.5049095904166596, "learning_rate": 4.1066961604517173e-07, "loss": 0.0727, "loss_nan_ranks": 0, "loss_rank_avg": 0.07348017394542694, "step": 3370, "valid_targets_mean": 2615.9, "valid_targets_min": 424 }, { "epoch": 6.604696673189824, "grad_norm": 0.4665931012172164, "learning_rate": 3.912270407734653e-07, "loss": 0.0709, "loss_nan_ranks": 0, "loss_rank_avg": 0.07094801217317581, "step": 3375, "valid_targets_mean": 2681.4, "valid_targets_min": 714 }, { "epoch": 6.614481409001957, "grad_norm": 0.43757819898632666, "learning_rate": 3.722513907485059e-07, "loss": 0.069, "loss_nan_ranks": 0, "loss_rank_avg": 0.05991899222135544, "step": 3380, "valid_targets_mean": 3376.2, "valid_targets_min": 663 }, { "epoch": 6.62426614481409, "grad_norm": 0.4827208072192271, "learning_rate": 3.53743117819576e-07, "loss": 0.0691, "loss_nan_ranks": 0, "loss_rank_avg": 0.07711789011955261, "step": 3385, "valid_targets_mean": 2911.2, "valid_targets_min": 900 }, { "epoch": 6.634050880626223, "grad_norm": 0.4603145031106069, "learning_rate": 3.357026627067517e-07, "loss": 0.0693, "loss_nan_ranks": 0, "loss_rank_avg": 0.0726405456662178, "step": 3390, "valid_targets_mean": 3347.3, "valid_targets_min": 718 }, { "epoch": 6.6438356164383565, "grad_norm": 0.4512525039794043, "learning_rate": 3.1813045499040853e-07, "loss": 0.0729, "loss_nan_ranks": 0, "loss_rank_avg": 0.06396128982305527, "step": 3395, "valid_targets_mean": 2948.3, "valid_targets_min": 488 }, { "epoch": 6.653620352250489, "grad_norm": 0.5590748700269601, "learning_rate": 3.0102691310097465e-07, "loss": 0.0664, "loss_nan_ranks": 0, "loss_rank_avg": 0.09083080291748047, "step": 3400, "valid_targets_mean": 2479.1, "valid_targets_min": 502 }, { "epoch": 6.663405088062622, "grad_norm": 0.4601230840272086, "learning_rate": 2.843924443089963e-07, "loss": 0.0698, "loss_nan_ranks": 0, "loss_rank_avg": 0.08319628238677979, "step": 3405, "valid_targets_mean": 3018.4, "valid_targets_min": 855 }, { "epoch": 6.673189823874756, "grad_norm": 0.45005808469478187, "learning_rate": 2.6822744471540986e-07, "loss": 0.0701, "loss_nan_ranks": 0, "loss_rank_avg": 0.08596012741327286, "step": 3410, "valid_targets_mean": 2817.6, "valid_targets_min": 720 }, { "epoch": 6.682974559686889, "grad_norm": 0.3919190742162424, "learning_rate": 2.5253229924213197e-07, "loss": 0.0691, "loss_nan_ranks": 0, "loss_rank_avg": 0.05439390987157822, "step": 3415, "valid_targets_mean": 3104.9, "valid_targets_min": 861 }, { "epoch": 6.692759295499021, "grad_norm": 0.42935587377345263, "learning_rate": 2.3730738162288214e-07, "loss": 0.079, "loss_nan_ranks": 0, "loss_rank_avg": 0.06405270844697952, "step": 3420, "valid_targets_mean": 3171.0, "valid_targets_min": 797 }, { "epoch": 6.702544031311154, "grad_norm": 0.4050572131233319, "learning_rate": 2.2255305439428775e-07, "loss": 0.0735, "loss_nan_ranks": 0, "loss_rank_avg": 0.0682176873087883, "step": 3425, "valid_targets_mean": 3082.6, "valid_targets_min": 844 }, { "epoch": 6.712328767123288, "grad_norm": 0.5112504640863977, "learning_rate": 2.082696688872554e-07, "loss": 0.0744, "loss_nan_ranks": 0, "loss_rank_avg": 0.07272009551525116, "step": 3430, "valid_targets_mean": 2604.7, "valid_targets_min": 585 }, { "epoch": 6.722113502935421, "grad_norm": 0.4520469516904392, "learning_rate": 1.944575652185865e-07, "loss": 0.0632, "loss_nan_ranks": 0, "loss_rank_avg": 0.0747576355934143, "step": 3435, "valid_targets_mean": 3447.1, "valid_targets_min": 778 }, { "epoch": 6.731898238747553, "grad_norm": 0.4959728539370891, "learning_rate": 1.8111707228290587e-07, "loss": 0.0803, "loss_nan_ranks": 0, "loss_rank_avg": 0.10230695456266403, "step": 3440, "valid_targets_mean": 2490.7, "valid_targets_min": 680 }, { "epoch": 6.741682974559687, "grad_norm": 0.564687612939018, "learning_rate": 1.6824850774480817e-07, "loss": 0.075, "loss_nan_ranks": 0, "loss_rank_avg": 0.10522986948490143, "step": 3445, "valid_targets_mean": 2524.9, "valid_targets_min": 831 }, { "epoch": 6.75146771037182, "grad_norm": 0.4564262808981618, "learning_rate": 1.5585217803130382e-07, "loss": 0.0693, "loss_nan_ranks": 0, "loss_rank_avg": 0.06908312439918518, "step": 3450, "valid_targets_mean": 3246.7, "valid_targets_min": 816 }, { "epoch": 6.761252446183953, "grad_norm": 0.3685097171137825, "learning_rate": 1.4392837832452044e-07, "loss": 0.0624, "loss_nan_ranks": 0, "loss_rank_avg": 0.04976704716682434, "step": 3455, "valid_targets_mean": 3558.4, "valid_targets_min": 524 }, { "epoch": 6.771037181996086, "grad_norm": 0.44998166826049446, "learning_rate": 1.3247739255467073e-07, "loss": 0.0683, "loss_nan_ranks": 0, "loss_rank_avg": 0.06746148318052292, "step": 3460, "valid_targets_mean": 3382.1, "valid_targets_min": 800 }, { "epoch": 6.780821917808219, "grad_norm": 0.412114167098292, "learning_rate": 1.2149949339330224e-07, "loss": 0.072, "loss_nan_ranks": 0, "loss_rank_avg": 0.06159614771604538, "step": 3465, "valid_targets_mean": 3328.3, "valid_targets_min": 924 }, { "epoch": 6.790606653620352, "grad_norm": 0.5001898542531955, "learning_rate": 1.1099494224678265e-07, "loss": 0.0756, "loss_nan_ranks": 0, "loss_rank_avg": 0.07178150862455368, "step": 3470, "valid_targets_mean": 2874.9, "valid_targets_min": 717 }, { "epoch": 6.800391389432486, "grad_norm": 0.45394214339484407, "learning_rate": 1.0096398925010464e-07, "loss": 0.0782, "loss_nan_ranks": 0, "loss_rank_avg": 0.06360410153865814, "step": 3475, "valid_targets_mean": 3023.1, "valid_targets_min": 758 }, { "epoch": 6.8101761252446185, "grad_norm": 0.4031908330874765, "learning_rate": 9.140687326090192e-08, "loss": 0.075, "loss_nan_ranks": 0, "loss_rank_avg": 0.06069003790616989, "step": 3480, "valid_targets_mean": 3315.9, "valid_targets_min": 799 }, { "epoch": 6.819960861056751, "grad_norm": 0.5352073918425082, "learning_rate": 8.232382185378252e-08, "loss": 0.0726, "loss_nan_ranks": 0, "loss_rank_avg": 0.09013031423091888, "step": 3485, "valid_targets_mean": 2478.2, "valid_targets_min": 591 }, { "epoch": 6.829745596868884, "grad_norm": 0.4742305907566785, "learning_rate": 7.37150513148932e-08, "loss": 0.0762, "loss_nan_ranks": 0, "loss_rank_avg": 0.06776893138885498, "step": 3490, "valid_targets_mean": 2488.6, "valid_targets_min": 542 }, { "epoch": 6.839530332681018, "grad_norm": 0.5029427253629741, "learning_rate": 6.558076663678137e-08, "loss": 0.0731, "loss_nan_ranks": 0, "loss_rank_avg": 0.07862377166748047, "step": 3495, "valid_targets_mean": 2839.6, "valid_targets_min": 656 }, { "epoch": 6.8493150684931505, "grad_norm": 0.42216015174860255, "learning_rate": 5.7921161513512237e-08, "loss": 0.0763, "loss_nan_ranks": 0, "loss_rank_avg": 0.05871112644672394, "step": 3500, "valid_targets_mean": 2906.5, "valid_targets_min": 629 }, { "epoch": 6.859099804305284, "grad_norm": 0.4509016571919049, "learning_rate": 5.0736418336043705e-08, "loss": 0.0674, "loss_nan_ranks": 0, "loss_rank_avg": 0.060274116694927216, "step": 3505, "valid_targets_mean": 2768.0, "valid_targets_min": 549 }, { "epoch": 6.868884540117417, "grad_norm": 0.4267381143120202, "learning_rate": 4.402670818790755e-08, "loss": 0.0665, "loss_nan_ranks": 0, "loss_rank_avg": 0.05474133789539337, "step": 3510, "valid_targets_mean": 3061.9, "valid_targets_min": 471 }, { "epoch": 6.87866927592955, "grad_norm": 0.4342700484129526, "learning_rate": 3.77921908411083e-08, "loss": 0.0732, "loss_nan_ranks": 0, "loss_rank_avg": 0.06307805329561234, "step": 3515, "valid_targets_mean": 3074.4, "valid_targets_min": 933 }, { "epoch": 6.888454011741683, "grad_norm": 0.5326321563392985, "learning_rate": 3.203301475233955e-08, "loss": 0.0806, "loss_nan_ranks": 0, "loss_rank_avg": 0.09981432557106018, "step": 3520, "valid_targets_mean": 2756.1, "valid_targets_min": 801 }, { "epoch": 6.898238747553816, "grad_norm": 0.45488358604153306, "learning_rate": 2.674931705943573e-08, "loss": 0.069, "loss_nan_ranks": 0, "loss_rank_avg": 0.06855349242687225, "step": 3525, "valid_targets_mean": 3244.5, "valid_targets_min": 827 }, { "epoch": 6.908023483365949, "grad_norm": 0.4535624735503632, "learning_rate": 2.194122357811912e-08, "loss": 0.0897, "loss_nan_ranks": 0, "loss_rank_avg": 0.08300478011369705, "step": 3530, "valid_targets_mean": 2724.9, "valid_targets_min": 634 }, { "epoch": 6.917808219178082, "grad_norm": 0.5408105625931828, "learning_rate": 1.760884879898894e-08, "loss": 0.078, "loss_nan_ranks": 0, "loss_rank_avg": 0.07406459748744965, "step": 3535, "valid_targets_mean": 2703.8, "valid_targets_min": 519 }, { "epoch": 6.9275929549902155, "grad_norm": 0.4034744719739111, "learning_rate": 1.3752295884807976e-08, "loss": 0.0719, "loss_nan_ranks": 0, "loss_rank_avg": 0.06537080556154251, "step": 3540, "valid_targets_mean": 3100.1, "valid_targets_min": 1032 }, { "epoch": 6.937377690802348, "grad_norm": 0.4841177004223412, "learning_rate": 1.0371656668037855e-08, "loss": 0.0814, "loss_nan_ranks": 0, "loss_rank_avg": 0.10481493175029755, "step": 3545, "valid_targets_mean": 3090.2, "valid_targets_min": 722 }, { "epoch": 6.947162426614481, "grad_norm": 0.4857124568122188, "learning_rate": 7.467011648660816e-09, "loss": 0.0817, "loss_nan_ranks": 0, "loss_rank_avg": 0.09597225487232208, "step": 3550, "valid_targets_mean": 3196.7, "valid_targets_min": 811 }, { "epoch": 6.956947162426615, "grad_norm": 0.4388488828589182, "learning_rate": 5.0384299922501266e-09, "loss": 0.0663, "loss_nan_ranks": 0, "loss_rank_avg": 0.07025769352912903, "step": 3555, "valid_targets_mean": 3822.1, "valid_targets_min": 954 }, { "epoch": 6.966731898238748, "grad_norm": 0.4993622905131659, "learning_rate": 3.085969528333621e-09, "loss": 0.069, "loss_nan_ranks": 0, "loss_rank_avg": 0.0812491849064827, "step": 3560, "valid_targets_mean": 2753.4, "valid_targets_min": 595 }, { "epoch": 6.97651663405088, "grad_norm": 0.4550823355534768, "learning_rate": 1.6096767490170195e-09, "loss": 0.0686, "loss_nan_ranks": 0, "loss_rank_avg": 0.06270751357078552, "step": 3565, "valid_targets_mean": 3089.9, "valid_targets_min": 864 }, { "epoch": 6.986301369863014, "grad_norm": 0.5623088551886786, "learning_rate": 6.095868078670464e-10, "loss": 0.0687, "loss_nan_ranks": 0, "loss_rank_avg": 0.08164788782596588, "step": 3570, "valid_targets_mean": 2565.1, "valid_targets_min": 536 }, { "epoch": 6.996086105675147, "grad_norm": 0.4922155503670224, "learning_rate": 8.572351908542331e-11, "loss": 0.082, "loss_nan_ranks": 0, "loss_rank_avg": 0.08383533358573914, "step": 3575, "valid_targets_mean": 2658.2, "valid_targets_min": 559 }, { "epoch": 7.0, "loss_nan_ranks": 0, "loss_rank_avg": 0.06287752836942673, "step": 3577, "total_flos": 1086238443962368.0, "train_loss": 0.10740660232207214, "train_runtime": 20738.2442, "train_samples_per_second": 2.758, "train_steps_per_second": 0.172, "valid_targets_mean": 3093.3, "valid_targets_min": 804 } ], "logging_steps": 5, "max_steps": 3577, "num_input_tokens_seen": 0, "num_train_epochs": 7, "save_steps": 200, "stateful_callbacks": { "TrainerControl": { "args": { "should_epoch_stop": false, "should_evaluate": false, "should_log": false, "should_save": true, "should_training_stop": true }, "attributes": {} } }, "total_flos": 1086238443962368.0, "train_batch_size": 1, "trial_name": null, "trial_params": null }