{ "best_global_step": null, "best_metric": null, "best_model_checkpoint": null, "epoch": 7.0, "eval_steps": 500, "global_step": 3913, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.008952551477170993, "grad_norm": 16.49591257441783, "learning_rate": 4.0816326530612243e-07, "loss": 0.8686, "loss_nan_ranks": 0, "loss_rank_avg": 0.4666103720664978, "step": 5, "valid_targets_mean": 4519.9, "valid_targets_min": 1559 }, { "epoch": 0.017905102954341987, "grad_norm": 17.298933206431972, "learning_rate": 9.183673469387756e-07, "loss": 0.8909, "loss_nan_ranks": 0, "loss_rank_avg": 0.43466073274612427, "step": 10, "valid_targets_mean": 2747.4, "valid_targets_min": 1250 }, { "epoch": 0.02685765443151298, "grad_norm": 16.827321924247315, "learning_rate": 1.4285714285714286e-06, "loss": 0.8744, "loss_nan_ranks": 0, "loss_rank_avg": 0.3920298218727112, "step": 15, "valid_targets_mean": 3581.1, "valid_targets_min": 1067 }, { "epoch": 0.03581020590868397, "grad_norm": 12.478016288643031, "learning_rate": 1.938775510204082e-06, "loss": 0.8919, "loss_nan_ranks": 0, "loss_rank_avg": 0.46270671486854553, "step": 20, "valid_targets_mean": 2438.8, "valid_targets_min": 1372 }, { "epoch": 0.044762757385854966, "grad_norm": 7.6946355193316345, "learning_rate": 2.4489795918367347e-06, "loss": 0.8118, "loss_nan_ranks": 0, "loss_rank_avg": 0.36239463090896606, "step": 25, "valid_targets_mean": 2902.6, "valid_targets_min": 1355 }, { "epoch": 0.05371530886302596, "grad_norm": 4.232599090692266, "learning_rate": 2.959183673469388e-06, "loss": 0.7486, "loss_nan_ranks": 0, "loss_rank_avg": 0.33849599957466125, "step": 30, "valid_targets_mean": 3254.2, "valid_targets_min": 1473 }, { "epoch": 0.06266786034019696, "grad_norm": 2.8884711311766234, "learning_rate": 3.469387755102041e-06, "loss": 0.7087, "loss_nan_ranks": 0, "loss_rank_avg": 0.35638314485549927, "step": 35, "valid_targets_mean": 2818.5, "valid_targets_min": 607 }, { "epoch": 0.07162041181736795, "grad_norm": 1.8606253940579665, "learning_rate": 3.979591836734694e-06, "loss": 0.6355, "loss_nan_ranks": 0, "loss_rank_avg": 0.2763682007789612, "step": 40, "valid_targets_mean": 2783.8, "valid_targets_min": 1126 }, { "epoch": 0.08057296329453895, "grad_norm": 1.5458228348682868, "learning_rate": 4.489795918367348e-06, "loss": 0.648, "loss_nan_ranks": 0, "loss_rank_avg": 0.3491474986076355, "step": 45, "valid_targets_mean": 3077.9, "valid_targets_min": 1310 }, { "epoch": 0.08952551477170993, "grad_norm": 1.2608980315826672, "learning_rate": 5e-06, "loss": 0.6069, "loss_nan_ranks": 0, "loss_rank_avg": 0.3331415057182312, "step": 50, "valid_targets_mean": 3091.8, "valid_targets_min": 1474 }, { "epoch": 0.09847806624888093, "grad_norm": 0.942020827015156, "learning_rate": 5.510204081632653e-06, "loss": 0.6139, "loss_nan_ranks": 0, "loss_rank_avg": 0.3337685167789459, "step": 55, "valid_targets_mean": 3797.2, "valid_targets_min": 2898 }, { "epoch": 0.10743061772605192, "grad_norm": 0.949804363038843, "learning_rate": 6.020408163265307e-06, "loss": 0.5488, "loss_nan_ranks": 0, "loss_rank_avg": 0.3087773025035858, "step": 60, "valid_targets_mean": 4610.4, "valid_targets_min": 1564 }, { "epoch": 0.11638316920322292, "grad_norm": 0.7193398126181899, "learning_rate": 6.530612244897959e-06, "loss": 0.6095, "loss_nan_ranks": 0, "loss_rank_avg": 0.22723770141601562, "step": 65, "valid_targets_mean": 3857.2, "valid_targets_min": 968 }, { "epoch": 0.12533572068039392, "grad_norm": 0.7588167962315939, "learning_rate": 7.0408163265306125e-06, "loss": 0.5624, "loss_nan_ranks": 0, "loss_rank_avg": 0.29583364725112915, "step": 70, "valid_targets_mean": 3903.6, "valid_targets_min": 1367 }, { "epoch": 0.13428827215756492, "grad_norm": 0.7317870592280868, "learning_rate": 7.551020408163265e-06, "loss": 0.5739, "loss_nan_ranks": 0, "loss_rank_avg": 0.213375985622406, "step": 75, "valid_targets_mean": 3182.4, "valid_targets_min": 1621 }, { "epoch": 0.1432408236347359, "grad_norm": 0.758736502420054, "learning_rate": 8.06122448979592e-06, "loss": 0.5921, "loss_nan_ranks": 0, "loss_rank_avg": 0.251443475484848, "step": 80, "valid_targets_mean": 3973.0, "valid_targets_min": 1283 }, { "epoch": 0.1521933751119069, "grad_norm": 0.8048639714424809, "learning_rate": 8.571428571428571e-06, "loss": 0.5738, "loss_nan_ranks": 0, "loss_rank_avg": 0.2732312083244324, "step": 85, "valid_targets_mean": 2992.2, "valid_targets_min": 1093 }, { "epoch": 0.1611459265890779, "grad_norm": 0.7340125250194033, "learning_rate": 9.081632653061225e-06, "loss": 0.5579, "loss_nan_ranks": 0, "loss_rank_avg": 0.25547561049461365, "step": 90, "valid_targets_mean": 2874.4, "valid_targets_min": 1616 }, { "epoch": 0.1700984780662489, "grad_norm": 0.6621673773996177, "learning_rate": 9.591836734693878e-06, "loss": 0.5464, "loss_nan_ranks": 0, "loss_rank_avg": 0.2635806202888489, "step": 95, "valid_targets_mean": 4164.6, "valid_targets_min": 1091 }, { "epoch": 0.17905102954341987, "grad_norm": 0.5908341411665475, "learning_rate": 1.0102040816326531e-05, "loss": 0.5235, "loss_nan_ranks": 0, "loss_rank_avg": 0.3442309498786926, "step": 100, "valid_targets_mean": 6593.6, "valid_targets_min": 2032 }, { "epoch": 0.18800358102059087, "grad_norm": 0.6686214031508748, "learning_rate": 1.0612244897959186e-05, "loss": 0.5113, "loss_nan_ranks": 0, "loss_rank_avg": 0.31256240606307983, "step": 105, "valid_targets_mean": 5066.4, "valid_targets_min": 1405 }, { "epoch": 0.19695613249776187, "grad_norm": 0.6681187078608829, "learning_rate": 1.1122448979591838e-05, "loss": 0.5178, "loss_nan_ranks": 0, "loss_rank_avg": 0.2890857458114624, "step": 110, "valid_targets_mean": 4381.5, "valid_targets_min": 1342 }, { "epoch": 0.20590868397493287, "grad_norm": 0.7026152513616436, "learning_rate": 1.1632653061224491e-05, "loss": 0.5156, "loss_nan_ranks": 0, "loss_rank_avg": 0.23764872550964355, "step": 115, "valid_targets_mean": 3407.8, "valid_targets_min": 976 }, { "epoch": 0.21486123545210384, "grad_norm": 0.705302694688467, "learning_rate": 1.2142857142857142e-05, "loss": 0.5083, "loss_nan_ranks": 0, "loss_rank_avg": 0.2273426502943039, "step": 120, "valid_targets_mean": 3928.0, "valid_targets_min": 1690 }, { "epoch": 0.22381378692927484, "grad_norm": 0.7484839660312749, "learning_rate": 1.2653061224489798e-05, "loss": 0.5391, "loss_nan_ranks": 0, "loss_rank_avg": 0.18557226657867432, "step": 125, "valid_targets_mean": 2330.8, "valid_targets_min": 1250 }, { "epoch": 0.23276633840644584, "grad_norm": 0.7160792181517066, "learning_rate": 1.316326530612245e-05, "loss": 0.5299, "loss_nan_ranks": 0, "loss_rank_avg": 0.3373291790485382, "step": 130, "valid_targets_mean": 3965.8, "valid_targets_min": 1350 }, { "epoch": 0.24171888988361684, "grad_norm": 0.6476324474732508, "learning_rate": 1.3673469387755102e-05, "loss": 0.5149, "loss_nan_ranks": 0, "loss_rank_avg": 0.2963748574256897, "step": 135, "valid_targets_mean": 5056.6, "valid_targets_min": 1288 }, { "epoch": 0.25067144136078784, "grad_norm": 0.5706629071327133, "learning_rate": 1.4183673469387755e-05, "loss": 0.5034, "loss_nan_ranks": 0, "loss_rank_avg": 0.23031815886497498, "step": 140, "valid_targets_mean": 5887.0, "valid_targets_min": 1510 }, { "epoch": 0.25962399283795884, "grad_norm": 0.6087657636188725, "learning_rate": 1.469387755102041e-05, "loss": 0.4746, "loss_nan_ranks": 0, "loss_rank_avg": 0.3000361919403076, "step": 145, "valid_targets_mean": 5092.6, "valid_targets_min": 1163 }, { "epoch": 0.26857654431512984, "grad_norm": 0.7437663805138169, "learning_rate": 1.5204081632653063e-05, "loss": 0.4949, "loss_nan_ranks": 0, "loss_rank_avg": 0.2728891968727112, "step": 150, "valid_targets_mean": 3300.6, "valid_targets_min": 738 }, { "epoch": 0.2775290957923008, "grad_norm": 0.7018877269558821, "learning_rate": 1.5714285714285715e-05, "loss": 0.5209, "loss_nan_ranks": 0, "loss_rank_avg": 0.2847294509410858, "step": 155, "valid_targets_mean": 3328.4, "valid_targets_min": 1380 }, { "epoch": 0.2864816472694718, "grad_norm": 0.674193694437514, "learning_rate": 1.6224489795918368e-05, "loss": 0.5125, "loss_nan_ranks": 0, "loss_rank_avg": 0.37893906235694885, "step": 160, "valid_targets_mean": 5591.1, "valid_targets_min": 2806 }, { "epoch": 0.2954341987466428, "grad_norm": 0.6383105740666587, "learning_rate": 1.673469387755102e-05, "loss": 0.5008, "loss_nan_ranks": 0, "loss_rank_avg": 0.30907806754112244, "step": 165, "valid_targets_mean": 5553.2, "valid_targets_min": 1773 }, { "epoch": 0.3043867502238138, "grad_norm": 0.635478910064303, "learning_rate": 1.7244897959183674e-05, "loss": 0.4626, "loss_nan_ranks": 0, "loss_rank_avg": 0.16394081711769104, "step": 170, "valid_targets_mean": 2659.8, "valid_targets_min": 1578 }, { "epoch": 0.3133393017009848, "grad_norm": 0.6408016364792337, "learning_rate": 1.7755102040816327e-05, "loss": 0.501, "loss_nan_ranks": 0, "loss_rank_avg": 0.26969802379608154, "step": 175, "valid_targets_mean": 4537.2, "valid_targets_min": 1860 }, { "epoch": 0.3222918531781558, "grad_norm": 0.7532590420669183, "learning_rate": 1.826530612244898e-05, "loss": 0.4535, "loss_nan_ranks": 0, "loss_rank_avg": 0.22142918407917023, "step": 180, "valid_targets_mean": 3185.2, "valid_targets_min": 810 }, { "epoch": 0.3312444046553268, "grad_norm": 0.682281377108529, "learning_rate": 1.8775510204081636e-05, "loss": 0.474, "loss_nan_ranks": 0, "loss_rank_avg": 0.26704490184783936, "step": 185, "valid_targets_mean": 5240.8, "valid_targets_min": 1677 }, { "epoch": 0.3401969561324978, "grad_norm": 0.7548919483126133, "learning_rate": 1.928571428571429e-05, "loss": 0.5005, "loss_nan_ranks": 0, "loss_rank_avg": 0.2760850787162781, "step": 190, "valid_targets_mean": 2447.2, "valid_targets_min": 648 }, { "epoch": 0.34914950760966873, "grad_norm": 0.5571129919492352, "learning_rate": 1.979591836734694e-05, "loss": 0.4893, "loss_nan_ranks": 0, "loss_rank_avg": 0.20134209096431732, "step": 195, "valid_targets_mean": 4296.0, "valid_targets_min": 1469 }, { "epoch": 0.35810205908683973, "grad_norm": 0.7295265109368269, "learning_rate": 2.0306122448979594e-05, "loss": 0.4687, "loss_nan_ranks": 0, "loss_rank_avg": 0.209572434425354, "step": 200, "valid_targets_mean": 3726.4, "valid_targets_min": 1347 }, { "epoch": 0.36705461056401073, "grad_norm": 0.6965350987539844, "learning_rate": 2.0816326530612247e-05, "loss": 0.4337, "loss_nan_ranks": 0, "loss_rank_avg": 0.25286203622817993, "step": 205, "valid_targets_mean": 4697.0, "valid_targets_min": 1313 }, { "epoch": 0.37600716204118173, "grad_norm": 0.6480471167428298, "learning_rate": 2.13265306122449e-05, "loss": 0.4741, "loss_nan_ranks": 0, "loss_rank_avg": 0.2200263887643814, "step": 210, "valid_targets_mean": 3665.0, "valid_targets_min": 1142 }, { "epoch": 0.38495971351835273, "grad_norm": 0.8564301909823199, "learning_rate": 2.1836734693877552e-05, "loss": 0.4655, "loss_nan_ranks": 0, "loss_rank_avg": 0.18472859263420105, "step": 215, "valid_targets_mean": 2090.5, "valid_targets_min": 438 }, { "epoch": 0.39391226499552373, "grad_norm": 0.6354279960876454, "learning_rate": 2.2346938775510205e-05, "loss": 0.4649, "loss_nan_ranks": 0, "loss_rank_avg": 0.23229990899562836, "step": 220, "valid_targets_mean": 4387.4, "valid_targets_min": 1532 }, { "epoch": 0.40286481647269473, "grad_norm": 0.6789177721083521, "learning_rate": 2.2857142857142858e-05, "loss": 0.4429, "loss_nan_ranks": 0, "loss_rank_avg": 0.22782085835933685, "step": 225, "valid_targets_mean": 3793.0, "valid_targets_min": 2323 }, { "epoch": 0.41181736794986573, "grad_norm": 0.6516095638644306, "learning_rate": 2.336734693877551e-05, "loss": 0.4971, "loss_nan_ranks": 0, "loss_rank_avg": 0.30450618267059326, "step": 230, "valid_targets_mean": 4820.1, "valid_targets_min": 1458 }, { "epoch": 0.42076991942703673, "grad_norm": 0.693576705410677, "learning_rate": 2.3877551020408167e-05, "loss": 0.4478, "loss_nan_ranks": 0, "loss_rank_avg": 0.25775548815727234, "step": 235, "valid_targets_mean": 4522.9, "valid_targets_min": 1256 }, { "epoch": 0.4297224709042077, "grad_norm": 0.5947860501405103, "learning_rate": 2.438775510204082e-05, "loss": 0.4666, "loss_nan_ranks": 0, "loss_rank_avg": 0.2969934642314911, "step": 240, "valid_targets_mean": 6070.8, "valid_targets_min": 2159 }, { "epoch": 0.4386750223813787, "grad_norm": 0.7892029600583624, "learning_rate": 2.4897959183673473e-05, "loss": 0.4616, "loss_nan_ranks": 0, "loss_rank_avg": 0.2159813940525055, "step": 245, "valid_targets_mean": 3087.0, "valid_targets_min": 1141 }, { "epoch": 0.4476275738585497, "grad_norm": 0.6788801249806748, "learning_rate": 2.5408163265306125e-05, "loss": 0.4693, "loss_nan_ranks": 0, "loss_rank_avg": 0.2609705924987793, "step": 250, "valid_targets_mean": 4786.5, "valid_targets_min": 1562 }, { "epoch": 0.4565801253357207, "grad_norm": 0.7361627557491236, "learning_rate": 2.5918367346938778e-05, "loss": 0.4342, "loss_nan_ranks": 0, "loss_rank_avg": 0.2108224332332611, "step": 255, "valid_targets_mean": 3732.5, "valid_targets_min": 1577 }, { "epoch": 0.4655326768128917, "grad_norm": 0.7565470090146987, "learning_rate": 2.642857142857143e-05, "loss": 0.4244, "loss_nan_ranks": 0, "loss_rank_avg": 0.2238048017024994, "step": 260, "valid_targets_mean": 3423.0, "valid_targets_min": 1153 }, { "epoch": 0.4744852282900627, "grad_norm": 0.6303638496536128, "learning_rate": 2.6938775510204084e-05, "loss": 0.4441, "loss_nan_ranks": 0, "loss_rank_avg": 0.1890367716550827, "step": 265, "valid_targets_mean": 4411.1, "valid_targets_min": 1263 }, { "epoch": 0.4834377797672337, "grad_norm": 0.7302565591847386, "learning_rate": 2.7448979591836737e-05, "loss": 0.4208, "loss_nan_ranks": 0, "loss_rank_avg": 0.19841700792312622, "step": 270, "valid_targets_mean": 2944.1, "valid_targets_min": 1350 }, { "epoch": 0.4923903312444047, "grad_norm": 0.5863910054331536, "learning_rate": 2.7959183673469393e-05, "loss": 0.4246, "loss_nan_ranks": 0, "loss_rank_avg": 0.18440236151218414, "step": 275, "valid_targets_mean": 4238.5, "valid_targets_min": 1273 }, { "epoch": 0.5013428827215757, "grad_norm": 0.6774434443668762, "learning_rate": 2.8469387755102046e-05, "loss": 0.4048, "loss_nan_ranks": 0, "loss_rank_avg": 0.1615563929080963, "step": 280, "valid_targets_mean": 2832.2, "valid_targets_min": 1141 }, { "epoch": 0.5102954341987467, "grad_norm": 0.6644483687290574, "learning_rate": 2.89795918367347e-05, "loss": 0.4356, "loss_nan_ranks": 0, "loss_rank_avg": 0.12459085136651993, "step": 285, "valid_targets_mean": 2369.5, "valid_targets_min": 896 }, { "epoch": 0.5192479856759177, "grad_norm": 0.7685920251159404, "learning_rate": 2.948979591836735e-05, "loss": 0.4356, "loss_nan_ranks": 0, "loss_rank_avg": 0.18276526033878326, "step": 290, "valid_targets_mean": 2990.8, "valid_targets_min": 1289 }, { "epoch": 0.5282005371530887, "grad_norm": 0.6355310059485909, "learning_rate": 3.0000000000000004e-05, "loss": 0.4321, "loss_nan_ranks": 0, "loss_rank_avg": 0.1871587336063385, "step": 295, "valid_targets_mean": 5225.5, "valid_targets_min": 1319 }, { "epoch": 0.5371530886302597, "grad_norm": 1.018574390466646, "learning_rate": 3.0510204081632654e-05, "loss": 0.4465, "loss_nan_ranks": 0, "loss_rank_avg": 0.2808264195919037, "step": 300, "valid_targets_mean": 4023.5, "valid_targets_min": 1624 }, { "epoch": 0.5461056401074306, "grad_norm": 0.6281786892326823, "learning_rate": 3.102040816326531e-05, "loss": 0.4131, "loss_nan_ranks": 0, "loss_rank_avg": 0.20266380906105042, "step": 305, "valid_targets_mean": 4063.4, "valid_targets_min": 1769 }, { "epoch": 0.5550581915846016, "grad_norm": 0.7808363483204404, "learning_rate": 3.153061224489796e-05, "loss": 0.4336, "loss_nan_ranks": 0, "loss_rank_avg": 0.23263785243034363, "step": 310, "valid_targets_mean": 6843.8, "valid_targets_min": 1471 }, { "epoch": 0.5640107430617726, "grad_norm": 0.831519619870683, "learning_rate": 3.2040816326530615e-05, "loss": 0.4348, "loss_nan_ranks": 0, "loss_rank_avg": 0.19032128155231476, "step": 315, "valid_targets_mean": 3595.5, "valid_targets_min": 1225 }, { "epoch": 0.5729632945389436, "grad_norm": 1.073552738434753, "learning_rate": 3.255102040816327e-05, "loss": 0.4172, "loss_nan_ranks": 0, "loss_rank_avg": 0.1755063533782959, "step": 320, "valid_targets_mean": 3981.4, "valid_targets_min": 1390 }, { "epoch": 0.5819158460161146, "grad_norm": 0.69129535171428, "learning_rate": 3.306122448979592e-05, "loss": 0.4478, "loss_nan_ranks": 0, "loss_rank_avg": 0.20842593908309937, "step": 325, "valid_targets_mean": 3756.1, "valid_targets_min": 867 }, { "epoch": 0.5908683974932856, "grad_norm": 0.6287282438450149, "learning_rate": 3.357142857142858e-05, "loss": 0.4415, "loss_nan_ranks": 0, "loss_rank_avg": 0.12963131070137024, "step": 330, "valid_targets_mean": 2827.4, "valid_targets_min": 829 }, { "epoch": 0.5998209489704566, "grad_norm": 0.5643853229439663, "learning_rate": 3.408163265306123e-05, "loss": 0.4135, "loss_nan_ranks": 0, "loss_rank_avg": 0.18341860175132751, "step": 335, "valid_targets_mean": 4425.6, "valid_targets_min": 1437 }, { "epoch": 0.6087735004476276, "grad_norm": 0.7125901635629522, "learning_rate": 3.459183673469388e-05, "loss": 0.4423, "loss_nan_ranks": 0, "loss_rank_avg": 0.3656802773475647, "step": 340, "valid_targets_mean": 5335.0, "valid_targets_min": 1545 }, { "epoch": 0.6177260519247986, "grad_norm": 0.620910199580982, "learning_rate": 3.510204081632653e-05, "loss": 0.428, "loss_nan_ranks": 0, "loss_rank_avg": 0.22268570959568024, "step": 345, "valid_targets_mean": 5409.2, "valid_targets_min": 1050 }, { "epoch": 0.6266786034019696, "grad_norm": 0.7650139202001973, "learning_rate": 3.561224489795918e-05, "loss": 0.4633, "loss_nan_ranks": 0, "loss_rank_avg": 0.23281125724315643, "step": 350, "valid_targets_mean": 4042.8, "valid_targets_min": 1140 }, { "epoch": 0.6356311548791406, "grad_norm": 0.9201532516782224, "learning_rate": 3.612244897959184e-05, "loss": 0.4281, "loss_nan_ranks": 0, "loss_rank_avg": 0.25236573815345764, "step": 355, "valid_targets_mean": 3224.9, "valid_targets_min": 1933 }, { "epoch": 0.6445837063563116, "grad_norm": 0.7183411085392811, "learning_rate": 3.6632653061224494e-05, "loss": 0.4701, "loss_nan_ranks": 0, "loss_rank_avg": 0.17252346873283386, "step": 360, "valid_targets_mean": 2688.4, "valid_targets_min": 1418 }, { "epoch": 0.6535362578334826, "grad_norm": 0.582680287280911, "learning_rate": 3.714285714285715e-05, "loss": 0.4149, "loss_nan_ranks": 0, "loss_rank_avg": 0.19246900081634521, "step": 365, "valid_targets_mean": 5347.9, "valid_targets_min": 1211 }, { "epoch": 0.6624888093106536, "grad_norm": 0.9129377165838232, "learning_rate": 3.76530612244898e-05, "loss": 0.4551, "loss_nan_ranks": 0, "loss_rank_avg": 0.27284592390060425, "step": 370, "valid_targets_mean": 4036.4, "valid_targets_min": 1053 }, { "epoch": 0.6714413607878246, "grad_norm": 0.6678131909597557, "learning_rate": 3.816326530612245e-05, "loss": 0.4152, "loss_nan_ranks": 0, "loss_rank_avg": 0.20466414093971252, "step": 375, "valid_targets_mean": 3872.2, "valid_targets_min": 1191 }, { "epoch": 0.6803939122649956, "grad_norm": 0.8045668374112488, "learning_rate": 3.8673469387755105e-05, "loss": 0.4116, "loss_nan_ranks": 0, "loss_rank_avg": 0.22858558595180511, "step": 380, "valid_targets_mean": 3204.1, "valid_targets_min": 1715 }, { "epoch": 0.6893464637421666, "grad_norm": 0.666520730258989, "learning_rate": 3.9183673469387755e-05, "loss": 0.4161, "loss_nan_ranks": 0, "loss_rank_avg": 0.17605772614479065, "step": 385, "valid_targets_mean": 4473.6, "valid_targets_min": 1557 }, { "epoch": 0.6982990152193375, "grad_norm": 0.6247290424770604, "learning_rate": 3.969387755102041e-05, "loss": 0.4045, "loss_nan_ranks": 0, "loss_rank_avg": 0.25795891880989075, "step": 390, "valid_targets_mean": 4912.9, "valid_targets_min": 1158 }, { "epoch": 0.7072515666965085, "grad_norm": 0.779100748971421, "learning_rate": 3.9999968156003224e-05, "loss": 0.4716, "loss_nan_ranks": 0, "loss_rank_avg": 0.44641977548599243, "step": 395, "valid_targets_mean": 5953.0, "valid_targets_min": 599 }, { "epoch": 0.7162041181736795, "grad_norm": 0.6495151157923535, "learning_rate": 3.999960991220401e-05, "loss": 0.3952, "loss_nan_ranks": 0, "loss_rank_avg": 0.20517157018184662, "step": 400, "valid_targets_mean": 3357.4, "valid_targets_min": 1749 }, { "epoch": 0.7251566696508505, "grad_norm": 0.7150419841254799, "learning_rate": 3.9998853626763316e-05, "loss": 0.4102, "loss_nan_ranks": 0, "loss_rank_avg": 0.18629693984985352, "step": 405, "valid_targets_mean": 3205.6, "valid_targets_min": 1522 }, { "epoch": 0.7341092211280215, "grad_norm": 0.7390419158141074, "learning_rate": 3.999769931473309e-05, "loss": 0.4018, "loss_nan_ranks": 0, "loss_rank_avg": 0.14274990558624268, "step": 410, "valid_targets_mean": 2136.0, "valid_targets_min": 994 }, { "epoch": 0.7430617726051925, "grad_norm": 1.259396937429778, "learning_rate": 3.999614699908698e-05, "loss": 0.438, "loss_nan_ranks": 0, "loss_rank_avg": 0.26997411251068115, "step": 415, "valid_targets_mean": 4593.8, "valid_targets_min": 1766 }, { "epoch": 0.7520143240823635, "grad_norm": 0.6154121664436549, "learning_rate": 3.999419671071993e-05, "loss": 0.4231, "loss_nan_ranks": 0, "loss_rank_avg": 0.20233558118343353, "step": 420, "valid_targets_mean": 4364.0, "valid_targets_min": 1588 }, { "epoch": 0.7609668755595345, "grad_norm": 0.6423223707679937, "learning_rate": 3.999184848844746e-05, "loss": 0.3865, "loss_nan_ranks": 0, "loss_rank_avg": 0.1704905480146408, "step": 425, "valid_targets_mean": 3104.9, "valid_targets_min": 1439 }, { "epoch": 0.7699194270367055, "grad_norm": 0.729810705804325, "learning_rate": 3.9989102379005026e-05, "loss": 0.4225, "loss_nan_ranks": 0, "loss_rank_avg": 0.1957702934741974, "step": 430, "valid_targets_mean": 3646.9, "valid_targets_min": 1005 }, { "epoch": 0.7788719785138765, "grad_norm": 0.7345669763856479, "learning_rate": 3.9985958437046976e-05, "loss": 0.453, "loss_nan_ranks": 0, "loss_rank_avg": 0.23787890374660492, "step": 435, "valid_targets_mean": 3216.0, "valid_targets_min": 568 }, { "epoch": 0.7878245299910475, "grad_norm": 0.781247168859166, "learning_rate": 3.998241672514551e-05, "loss": 0.4173, "loss_nan_ranks": 0, "loss_rank_avg": 0.17754238843917847, "step": 440, "valid_targets_mean": 2567.8, "valid_targets_min": 1113 }, { "epoch": 0.7967770814682185, "grad_norm": 0.5671255551819204, "learning_rate": 3.997847731378946e-05, "loss": 0.4087, "loss_nan_ranks": 0, "loss_rank_avg": 0.26526498794555664, "step": 445, "valid_targets_mean": 6251.0, "valid_targets_min": 1697 }, { "epoch": 0.8057296329453895, "grad_norm": 0.6272203363976995, "learning_rate": 3.9974140281382844e-05, "loss": 0.4155, "loss_nan_ranks": 0, "loss_rank_avg": 0.22401854395866394, "step": 450, "valid_targets_mean": 4900.2, "valid_targets_min": 1566 }, { "epoch": 0.8146821844225605, "grad_norm": 0.6084346283327203, "learning_rate": 3.996940571424331e-05, "loss": 0.3975, "loss_nan_ranks": 0, "loss_rank_avg": 0.2205761969089508, "step": 455, "valid_targets_mean": 5000.9, "valid_targets_min": 1425 }, { "epoch": 0.8236347358997315, "grad_norm": 0.6541164392281177, "learning_rate": 3.996427370660045e-05, "loss": 0.4075, "loss_nan_ranks": 0, "loss_rank_avg": 0.18832074105739594, "step": 460, "valid_targets_mean": 4095.9, "valid_targets_min": 821 }, { "epoch": 0.8325872873769025, "grad_norm": 0.6460255342842145, "learning_rate": 3.995874436059389e-05, "loss": 0.4071, "loss_nan_ranks": 0, "loss_rank_avg": 0.18600459396839142, "step": 465, "valid_targets_mean": 3793.5, "valid_targets_min": 2096 }, { "epoch": 0.8415398388540735, "grad_norm": 0.6200976937245356, "learning_rate": 3.9952817786271264e-05, "loss": 0.416, "loss_nan_ranks": 0, "loss_rank_avg": 0.13933804631233215, "step": 470, "valid_targets_mean": 3723.6, "valid_targets_min": 1207 }, { "epoch": 0.8504923903312444, "grad_norm": 0.6168712556601921, "learning_rate": 3.994649410158605e-05, "loss": 0.4072, "loss_nan_ranks": 0, "loss_rank_avg": 0.22264635562896729, "step": 475, "valid_targets_mean": 4751.8, "valid_targets_min": 2191 }, { "epoch": 0.8594449418084154, "grad_norm": 0.6514273070342461, "learning_rate": 3.99397734323952e-05, "loss": 0.4224, "loss_nan_ranks": 0, "loss_rank_avg": 0.20883207023143768, "step": 480, "valid_targets_mean": 4464.0, "valid_targets_min": 1847 }, { "epoch": 0.8683974932855864, "grad_norm": 0.800906223272931, "learning_rate": 3.993265591245662e-05, "loss": 0.4075, "loss_nan_ranks": 0, "loss_rank_avg": 0.1863759309053421, "step": 485, "valid_targets_mean": 2938.4, "valid_targets_min": 871 }, { "epoch": 0.8773500447627574, "grad_norm": 0.83277145829148, "learning_rate": 3.992514168342655e-05, "loss": 0.4067, "loss_nan_ranks": 0, "loss_rank_avg": 0.17269662022590637, "step": 490, "valid_targets_mean": 2428.8, "valid_targets_min": 1668 }, { "epoch": 0.8863025962399284, "grad_norm": 0.7304828801141144, "learning_rate": 3.9917230894856705e-05, "loss": 0.4063, "loss_nan_ranks": 0, "loss_rank_avg": 0.2120320200920105, "step": 495, "valid_targets_mean": 3160.0, "valid_targets_min": 1270 }, { "epoch": 0.8952551477170994, "grad_norm": 0.7572826126724849, "learning_rate": 3.990892370419132e-05, "loss": 0.4093, "loss_nan_ranks": 0, "loss_rank_avg": 0.20016592741012573, "step": 500, "valid_targets_mean": 3175.8, "valid_targets_min": 799 }, { "epoch": 0.9042076991942704, "grad_norm": 0.5919370272102532, "learning_rate": 3.9900220276764013e-05, "loss": 0.4074, "loss_nan_ranks": 0, "loss_rank_avg": 0.16611447930335999, "step": 505, "valid_targets_mean": 3963.9, "valid_targets_min": 743 }, { "epoch": 0.9131602506714414, "grad_norm": 0.6819403148937269, "learning_rate": 3.989112078579449e-05, "loss": 0.418, "loss_nan_ranks": 0, "loss_rank_avg": 0.2877485752105713, "step": 510, "valid_targets_mean": 5093.2, "valid_targets_min": 1691 }, { "epoch": 0.9221128021486124, "grad_norm": 0.6769829439772228, "learning_rate": 3.988162541238509e-05, "loss": 0.4057, "loss_nan_ranks": 0, "loss_rank_avg": 0.3087572157382965, "step": 515, "valid_targets_mean": 4994.5, "valid_targets_min": 1352 }, { "epoch": 0.9310653536257834, "grad_norm": 0.7318964239583158, "learning_rate": 3.98717343455172e-05, "loss": 0.3829, "loss_nan_ranks": 0, "loss_rank_avg": 0.178988978266716, "step": 520, "valid_targets_mean": 3043.4, "valid_targets_min": 1840 }, { "epoch": 0.9400179051029544, "grad_norm": 0.736170364782059, "learning_rate": 3.9861447782047495e-05, "loss": 0.426, "loss_nan_ranks": 0, "loss_rank_avg": 0.2085171490907669, "step": 525, "valid_targets_mean": 3353.6, "valid_targets_min": 1939 }, { "epoch": 0.9489704565801254, "grad_norm": 0.6775094297571437, "learning_rate": 3.9850765926704e-05, "loss": 0.4128, "loss_nan_ranks": 0, "loss_rank_avg": 0.21749690175056458, "step": 530, "valid_targets_mean": 4364.0, "valid_targets_min": 1464 }, { "epoch": 0.9579230080572964, "grad_norm": 0.7321608884861143, "learning_rate": 3.9839688992082004e-05, "loss": 0.3747, "loss_nan_ranks": 0, "loss_rank_avg": 0.20859259366989136, "step": 535, "valid_targets_mean": 3524.5, "valid_targets_min": 1556 }, { "epoch": 0.9668755595344674, "grad_norm": 0.6153393187558923, "learning_rate": 3.9828217198639884e-05, "loss": 0.4165, "loss_nan_ranks": 0, "loss_rank_avg": 0.21272610127925873, "step": 540, "valid_targets_mean": 4658.5, "valid_targets_min": 1706 }, { "epoch": 0.9758281110116384, "grad_norm": 0.798525150352497, "learning_rate": 3.981635077469468e-05, "loss": 0.4188, "loss_nan_ranks": 0, "loss_rank_avg": 0.15253381431102753, "step": 545, "valid_targets_mean": 1837.2, "valid_targets_min": 883 }, { "epoch": 0.9847806624888094, "grad_norm": 0.7395653489663312, "learning_rate": 3.980408995641751e-05, "loss": 0.4116, "loss_nan_ranks": 0, "loss_rank_avg": 0.2817031741142273, "step": 550, "valid_targets_mean": 3830.6, "valid_targets_min": 1066 }, { "epoch": 0.9937332139659804, "grad_norm": 0.7202520372221168, "learning_rate": 3.979143498782898e-05, "loss": 0.4252, "loss_nan_ranks": 0, "loss_rank_avg": 0.20223543047904968, "step": 555, "valid_targets_mean": 3306.4, "valid_targets_min": 1423 }, { "epoch": 1.001790510295434, "grad_norm": 0.579798364095407, "learning_rate": 3.977838612079419e-05, "loss": 0.372, "loss_nan_ranks": 0, "loss_rank_avg": 0.14297722280025482, "step": 560, "valid_targets_mean": 3010.2, "valid_targets_min": 1194 }, { "epoch": 1.0107430617726052, "grad_norm": 0.7410636986612479, "learning_rate": 3.976494361501786e-05, "loss": 0.4051, "loss_nan_ranks": 0, "loss_rank_avg": 0.15187795460224152, "step": 565, "valid_targets_mean": 2236.6, "valid_targets_min": 1057 }, { "epoch": 1.019695613249776, "grad_norm": 0.692386761584416, "learning_rate": 3.975110773803904e-05, "loss": 0.373, "loss_nan_ranks": 0, "loss_rank_avg": 0.2205927073955536, "step": 570, "valid_targets_mean": 4001.6, "valid_targets_min": 1337 }, { "epoch": 1.0286481647269472, "grad_norm": 0.760062922065256, "learning_rate": 3.973687876522587e-05, "loss": 0.4077, "loss_nan_ranks": 0, "loss_rank_avg": 0.1433718055486679, "step": 575, "valid_targets_mean": 2319.2, "valid_targets_min": 1285 }, { "epoch": 1.037600716204118, "grad_norm": 0.6231058381003745, "learning_rate": 3.9722256979770054e-05, "loss": 0.377, "loss_nan_ranks": 0, "loss_rank_avg": 0.25835368037223816, "step": 580, "valid_targets_mean": 5127.9, "valid_targets_min": 1433 }, { "epoch": 1.0465532676812892, "grad_norm": 0.7798383704851466, "learning_rate": 3.970724267268125e-05, "loss": 0.4182, "loss_nan_ranks": 0, "loss_rank_avg": 0.18632589280605316, "step": 585, "valid_targets_mean": 2504.1, "valid_targets_min": 1374 }, { "epoch": 1.05550581915846, "grad_norm": 0.6724122975388895, "learning_rate": 3.969183614278125e-05, "loss": 0.3795, "loss_nan_ranks": 0, "loss_rank_avg": 0.16075168550014496, "step": 590, "valid_targets_mean": 2468.0, "valid_targets_min": 1272 }, { "epoch": 1.0644583706356312, "grad_norm": 0.6216207940286806, "learning_rate": 3.9676037696698056e-05, "loss": 0.3942, "loss_nan_ranks": 0, "loss_rank_avg": 0.1869785636663437, "step": 595, "valid_targets_mean": 3637.8, "valid_targets_min": 1239 }, { "epoch": 1.073410922112802, "grad_norm": 0.6038132355180709, "learning_rate": 3.9659847648859775e-05, "loss": 0.3771, "loss_nan_ranks": 0, "loss_rank_avg": 0.19958503544330597, "step": 600, "valid_targets_mean": 5002.8, "valid_targets_min": 2207 }, { "epoch": 1.0823634735899732, "grad_norm": 0.6547559144298567, "learning_rate": 3.9643266321488354e-05, "loss": 0.3635, "loss_nan_ranks": 0, "loss_rank_avg": 0.1961314082145691, "step": 605, "valid_targets_mean": 3541.4, "valid_targets_min": 1259 }, { "epoch": 1.091316025067144, "grad_norm": 0.6283731669036798, "learning_rate": 3.962629404459317e-05, "loss": 0.368, "loss_nan_ranks": 0, "loss_rank_avg": 0.20619988441467285, "step": 610, "valid_targets_mean": 4151.5, "valid_targets_min": 1027 }, { "epoch": 1.1002685765443152, "grad_norm": 0.733013694119783, "learning_rate": 3.960893115596445e-05, "loss": 0.3824, "loss_nan_ranks": 0, "loss_rank_avg": 0.19611495733261108, "step": 615, "valid_targets_mean": 3181.6, "valid_targets_min": 1191 }, { "epoch": 1.109221128021486, "grad_norm": 0.7451977959813969, "learning_rate": 3.959117800116658e-05, "loss": 0.3859, "loss_nan_ranks": 0, "loss_rank_avg": 0.2177126407623291, "step": 620, "valid_targets_mean": 3460.2, "valid_targets_min": 1551 }, { "epoch": 1.1181736794986572, "grad_norm": 0.6425600662981381, "learning_rate": 3.9573034933531195e-05, "loss": 0.3747, "loss_nan_ranks": 0, "loss_rank_avg": 0.1971556693315506, "step": 625, "valid_targets_mean": 5205.9, "valid_targets_min": 1687 }, { "epoch": 1.127126230975828, "grad_norm": 0.7396238738527312, "learning_rate": 3.955450231415014e-05, "loss": 0.3657, "loss_nan_ranks": 0, "loss_rank_avg": 0.18451285362243652, "step": 630, "valid_targets_mean": 3393.9, "valid_targets_min": 1696 }, { "epoch": 1.1360787824529992, "grad_norm": 0.6577118059689598, "learning_rate": 3.953558051186834e-05, "loss": 0.3687, "loss_nan_ranks": 0, "loss_rank_avg": 0.15830595791339874, "step": 635, "valid_targets_mean": 2799.0, "valid_targets_min": 1209 }, { "epoch": 1.14503133393017, "grad_norm": 0.5395992030023509, "learning_rate": 3.95162699032764e-05, "loss": 0.3835, "loss_nan_ranks": 0, "loss_rank_avg": 0.20836785435676575, "step": 640, "valid_targets_mean": 5411.8, "valid_targets_min": 1545 }, { "epoch": 1.153983885407341, "grad_norm": 0.7044513534849349, "learning_rate": 3.949657087270313e-05, "loss": 0.3472, "loss_nan_ranks": 0, "loss_rank_avg": 0.1730477213859558, "step": 645, "valid_targets_mean": 2762.4, "valid_targets_min": 1430 }, { "epoch": 1.162936436884512, "grad_norm": 0.7783993520311729, "learning_rate": 3.947648381220789e-05, "loss": 0.3658, "loss_nan_ranks": 0, "loss_rank_avg": 0.1869765818119049, "step": 650, "valid_targets_mean": 2660.5, "valid_targets_min": 1459 }, { "epoch": 1.1718889883616832, "grad_norm": 0.7192368699302448, "learning_rate": 3.9456009121572824e-05, "loss": 0.3592, "loss_nan_ranks": 0, "loss_rank_avg": 0.1545119732618332, "step": 655, "valid_targets_mean": 2477.6, "valid_targets_min": 1394 }, { "epoch": 1.180841539838854, "grad_norm": 0.592724596003384, "learning_rate": 3.943514720829485e-05, "loss": 0.3654, "loss_nan_ranks": 0, "loss_rank_avg": 0.15250423550605774, "step": 660, "valid_targets_mean": 3685.5, "valid_targets_min": 1099 }, { "epoch": 1.189794091316025, "grad_norm": 0.8159242881243397, "learning_rate": 3.941389848757756e-05, "loss": 0.3938, "loss_nan_ranks": 0, "loss_rank_avg": 0.18470154702663422, "step": 665, "valid_targets_mean": 2337.1, "valid_targets_min": 1237 }, { "epoch": 1.198746642793196, "grad_norm": 0.7782799836744587, "learning_rate": 3.9392263382323e-05, "loss": 0.3885, "loss_nan_ranks": 0, "loss_rank_avg": 0.20358330011367798, "step": 670, "valid_targets_mean": 5639.0, "valid_targets_min": 2708 }, { "epoch": 1.207699194270367, "grad_norm": 0.8082493752911124, "learning_rate": 3.93702423231232e-05, "loss": 0.4009, "loss_nan_ranks": 0, "loss_rank_avg": 0.17506203055381775, "step": 675, "valid_targets_mean": 2361.5, "valid_targets_min": 1256 }, { "epoch": 1.216651745747538, "grad_norm": 0.5418104763492934, "learning_rate": 3.9347835748251645e-05, "loss": 0.3607, "loss_nan_ranks": 0, "loss_rank_avg": 0.18025299906730652, "step": 680, "valid_targets_mean": 5253.0, "valid_targets_min": 1219 }, { "epoch": 1.225604297224709, "grad_norm": 0.6442211318310618, "learning_rate": 3.9325044103654526e-05, "loss": 0.3393, "loss_nan_ranks": 0, "loss_rank_avg": 0.20891106128692627, "step": 685, "valid_targets_mean": 4414.8, "valid_targets_min": 1615 }, { "epoch": 1.23455684870188, "grad_norm": 0.6451467432686171, "learning_rate": 3.9301867842941867e-05, "loss": 0.3718, "loss_nan_ranks": 0, "loss_rank_avg": 0.19293522834777832, "step": 690, "valid_targets_mean": 3735.8, "valid_targets_min": 1013 }, { "epoch": 1.243509400179051, "grad_norm": 0.5339050160402266, "learning_rate": 3.9278307427378495e-05, "loss": 0.3661, "loss_nan_ranks": 0, "loss_rank_avg": 0.18412509560585022, "step": 695, "valid_targets_mean": 6164.5, "valid_targets_min": 1894 }, { "epoch": 1.252461951656222, "grad_norm": 0.62297846690471, "learning_rate": 3.92543633258749e-05, "loss": 0.3706, "loss_nan_ranks": 0, "loss_rank_avg": 0.13548460602760315, "step": 700, "valid_targets_mean": 2993.4, "valid_targets_min": 1667 }, { "epoch": 1.261414503133393, "grad_norm": 0.6745712113247786, "learning_rate": 3.923003601497785e-05, "loss": 0.3885, "loss_nan_ranks": 0, "loss_rank_avg": 0.21251079440116882, "step": 705, "valid_targets_mean": 3604.5, "valid_targets_min": 1443 }, { "epoch": 1.2703670546105639, "grad_norm": 0.6186655781741142, "learning_rate": 3.920532597886091e-05, "loss": 0.3796, "loss_nan_ranks": 0, "loss_rank_avg": 0.1852312535047531, "step": 710, "valid_targets_mean": 5199.1, "valid_targets_min": 1838 }, { "epoch": 1.279319606087735, "grad_norm": 0.6476873687407971, "learning_rate": 3.918023370931485e-05, "loss": 0.3554, "loss_nan_ranks": 0, "loss_rank_avg": 0.16326086223125458, "step": 715, "valid_targets_mean": 3766.6, "valid_targets_min": 1334 }, { "epoch": 1.288272157564906, "grad_norm": 0.7346554234208614, "learning_rate": 3.915475970573782e-05, "loss": 0.365, "loss_nan_ranks": 0, "loss_rank_avg": 0.16769498586654663, "step": 720, "valid_targets_mean": 2661.0, "valid_targets_min": 1397 }, { "epoch": 1.297224709042077, "grad_norm": 0.5311121017298314, "learning_rate": 3.9128904475125414e-05, "loss": 0.3647, "loss_nan_ranks": 0, "loss_rank_avg": 0.2087760865688324, "step": 725, "valid_targets_mean": 5643.4, "valid_targets_min": 1375 }, { "epoch": 1.3061772605192479, "grad_norm": 0.7108382046067068, "learning_rate": 3.910266853206058e-05, "loss": 0.3929, "loss_nan_ranks": 0, "loss_rank_avg": 0.326129674911499, "step": 730, "valid_targets_mean": 3954.4, "valid_targets_min": 883 }, { "epoch": 1.315129811996419, "grad_norm": 0.739273369261475, "learning_rate": 3.907605239870342e-05, "loss": 0.3799, "loss_nan_ranks": 0, "loss_rank_avg": 0.20131108164787292, "step": 735, "valid_targets_mean": 2797.8, "valid_targets_min": 1263 }, { "epoch": 1.32408236347359, "grad_norm": 0.6341507161751151, "learning_rate": 3.904905660478072e-05, "loss": 0.3627, "loss_nan_ranks": 0, "loss_rank_avg": 0.19136598706245422, "step": 740, "valid_targets_mean": 3837.9, "valid_targets_min": 1419 }, { "epoch": 1.333034914950761, "grad_norm": 0.5325044817359841, "learning_rate": 3.9021681687575465e-05, "loss": 0.3511, "loss_nan_ranks": 0, "loss_rank_avg": 0.09225505590438843, "step": 745, "valid_targets_mean": 2742.8, "valid_targets_min": 1209 }, { "epoch": 1.3419874664279319, "grad_norm": 0.6544505821705787, "learning_rate": 3.8993928191916134e-05, "loss": 0.347, "loss_nan_ranks": 0, "loss_rank_avg": 0.2583926320075989, "step": 750, "valid_targets_mean": 4458.0, "valid_targets_min": 1105 }, { "epoch": 1.350940017905103, "grad_norm": 0.7669301555471535, "learning_rate": 3.8965796670165856e-05, "loss": 0.3814, "loss_nan_ranks": 0, "loss_rank_avg": 0.12664443254470825, "step": 755, "valid_targets_mean": 2020.8, "valid_targets_min": 1072 }, { "epoch": 1.3598925693822739, "grad_norm": 0.7129506043666346, "learning_rate": 3.893728768221139e-05, "loss": 0.3773, "loss_nan_ranks": 0, "loss_rank_avg": 0.25370943546295166, "step": 760, "valid_targets_mean": 3605.6, "valid_targets_min": 1012 }, { "epoch": 1.368845120859445, "grad_norm": 0.6334981286822261, "learning_rate": 3.8908401795452033e-05, "loss": 0.3679, "loss_nan_ranks": 0, "loss_rank_avg": 0.24940751492977142, "step": 765, "valid_targets_mean": 4710.8, "valid_targets_min": 1575 }, { "epoch": 1.3777976723366159, "grad_norm": 0.6085268704857869, "learning_rate": 3.8879139584788286e-05, "loss": 0.3591, "loss_nan_ranks": 0, "loss_rank_avg": 0.16782809793949127, "step": 770, "valid_targets_mean": 3777.8, "valid_targets_min": 1416 }, { "epoch": 1.386750223813787, "grad_norm": 0.7858602694978715, "learning_rate": 3.884950163261042e-05, "loss": 0.373, "loss_nan_ranks": 0, "loss_rank_avg": 0.13924919068813324, "step": 775, "valid_targets_mean": 2685.4, "valid_targets_min": 1551 }, { "epoch": 1.3957027752909579, "grad_norm": 0.6289344762472306, "learning_rate": 3.8819488528786904e-05, "loss": 0.3881, "loss_nan_ranks": 0, "loss_rank_avg": 0.18281199038028717, "step": 780, "valid_targets_mean": 4110.0, "valid_targets_min": 1287 }, { "epoch": 1.404655326768129, "grad_norm": 0.6406051764111861, "learning_rate": 3.878910087065264e-05, "loss": 0.3444, "loss_nan_ranks": 0, "loss_rank_avg": 0.16362640261650085, "step": 785, "valid_targets_mean": 2657.2, "valid_targets_min": 1445 }, { "epoch": 1.4136078782452999, "grad_norm": 0.6648737360349115, "learning_rate": 3.8758339262997094e-05, "loss": 0.3706, "loss_nan_ranks": 0, "loss_rank_avg": 0.13713306188583374, "step": 790, "valid_targets_mean": 2693.4, "valid_targets_min": 959 }, { "epoch": 1.422560429722471, "grad_norm": 0.4917049041944973, "learning_rate": 3.872720431805224e-05, "loss": 0.3745, "loss_nan_ranks": 0, "loss_rank_avg": 0.11397358775138855, "step": 795, "valid_targets_mean": 3676.1, "valid_targets_min": 1163 }, { "epoch": 1.4315129811996419, "grad_norm": 0.646876600165104, "learning_rate": 3.86956966554804e-05, "loss": 0.371, "loss_nan_ranks": 0, "loss_rank_avg": 0.11982043087482452, "step": 800, "valid_targets_mean": 2264.4, "valid_targets_min": 1625 }, { "epoch": 1.440465532676813, "grad_norm": 0.5032837505063902, "learning_rate": 3.8663816902361896e-05, "loss": 0.374, "loss_nan_ranks": 0, "loss_rank_avg": 0.17598767578601837, "step": 805, "valid_targets_mean": 5998.6, "valid_targets_min": 926 }, { "epoch": 1.4494180841539839, "grad_norm": 0.7075325188332748, "learning_rate": 3.863156569318256e-05, "loss": 0.3306, "loss_nan_ranks": 0, "loss_rank_avg": 0.22245752811431885, "step": 810, "valid_targets_mean": 4238.8, "valid_targets_min": 1245 }, { "epoch": 1.4583706356311548, "grad_norm": 0.7140064280888134, "learning_rate": 3.8598943669821124e-05, "loss": 0.3672, "loss_nan_ranks": 0, "loss_rank_avg": 0.21389253437519073, "step": 815, "valid_targets_mean": 2880.5, "valid_targets_min": 1271 }, { "epoch": 1.4673231871083259, "grad_norm": 0.644094370810947, "learning_rate": 3.856595148153643e-05, "loss": 0.3645, "loss_nan_ranks": 0, "loss_rank_avg": 0.11374405771493912, "step": 820, "valid_targets_mean": 2398.5, "valid_targets_min": 380 }, { "epoch": 1.476275738585497, "grad_norm": 0.6911180314953034, "learning_rate": 3.853258978495454e-05, "loss": 0.3937, "loss_nan_ranks": 0, "loss_rank_avg": 0.20857420563697815, "step": 825, "valid_targets_mean": 3739.2, "valid_targets_min": 1153 }, { "epoch": 1.4852282900626679, "grad_norm": 0.6730820644303149, "learning_rate": 3.8498859244055616e-05, "loss": 0.3506, "loss_nan_ranks": 0, "loss_rank_avg": 0.16855305433273315, "step": 830, "valid_targets_mean": 2936.1, "valid_targets_min": 1202 }, { "epoch": 1.4941808415398388, "grad_norm": 0.6485920300501455, "learning_rate": 3.8464760530160756e-05, "loss": 0.3849, "loss_nan_ranks": 0, "loss_rank_avg": 0.21470798552036285, "step": 835, "valid_targets_mean": 3659.1, "valid_targets_min": 1797 }, { "epoch": 1.5031333930170099, "grad_norm": 0.6962762200783088, "learning_rate": 3.843029432191858e-05, "loss": 0.364, "loss_nan_ranks": 0, "loss_rank_avg": 0.18541723489761353, "step": 840, "valid_targets_mean": 3259.0, "valid_targets_min": 1029 }, { "epoch": 1.512085944494181, "grad_norm": 0.6094253072530402, "learning_rate": 3.839546130529179e-05, "loss": 0.328, "loss_nan_ranks": 0, "loss_rank_avg": 0.13300365209579468, "step": 845, "valid_targets_mean": 3356.0, "valid_targets_min": 1277 }, { "epoch": 1.5210384959713519, "grad_norm": 0.541921565334437, "learning_rate": 3.8360262173543467e-05, "loss": 0.3565, "loss_nan_ranks": 0, "loss_rank_avg": 0.11396744847297668, "step": 850, "valid_targets_mean": 3406.4, "valid_targets_min": 1086 }, { "epoch": 1.5299910474485228, "grad_norm": 0.7195629206207933, "learning_rate": 3.8324697627223263e-05, "loss": 0.363, "loss_nan_ranks": 0, "loss_rank_avg": 0.14234784245491028, "step": 855, "valid_targets_mean": 3167.8, "valid_targets_min": 1432 }, { "epoch": 1.5389435989256937, "grad_norm": 1.1044858797443737, "learning_rate": 3.828876837415352e-05, "loss": 0.3762, "loss_nan_ranks": 0, "loss_rank_avg": 0.2260916531085968, "step": 860, "valid_targets_mean": 3686.5, "valid_targets_min": 1234 }, { "epoch": 1.5478961504028648, "grad_norm": 0.6173627572346159, "learning_rate": 3.8252475129415127e-05, "loss": 0.3492, "loss_nan_ranks": 0, "loss_rank_avg": 0.11603335291147232, "step": 865, "valid_targets_mean": 2601.2, "valid_targets_min": 1231 }, { "epoch": 1.5568487018800359, "grad_norm": 0.612868623270254, "learning_rate": 3.82158186153333e-05, "loss": 0.3695, "loss_nan_ranks": 0, "loss_rank_avg": 0.1899331510066986, "step": 870, "valid_targets_mean": 3989.4, "valid_targets_min": 668 }, { "epoch": 1.5658012533572068, "grad_norm": 0.8308887319226448, "learning_rate": 3.817879956146323e-05, "loss": 0.3751, "loss_nan_ranks": 0, "loss_rank_avg": 0.23491792380809784, "step": 875, "valid_targets_mean": 2837.4, "valid_targets_min": 1314 }, { "epoch": 1.5747538048343777, "grad_norm": 0.5706204421068442, "learning_rate": 3.814141870457553e-05, "loss": 0.3548, "loss_nan_ranks": 0, "loss_rank_avg": 0.21271702647209167, "step": 880, "valid_targets_mean": 3921.5, "valid_targets_min": 1627 }, { "epoch": 1.5837063563115488, "grad_norm": 0.5905492028618122, "learning_rate": 3.810367678864159e-05, "loss": 0.347, "loss_nan_ranks": 0, "loss_rank_avg": 0.1883733570575714, "step": 885, "valid_targets_mean": 4394.5, "valid_targets_min": 1679 }, { "epoch": 1.5926589077887199, "grad_norm": 0.7269147011558954, "learning_rate": 3.806557456481878e-05, "loss": 0.3491, "loss_nan_ranks": 0, "loss_rank_avg": 0.1721513271331787, "step": 890, "valid_targets_mean": 2881.2, "valid_targets_min": 319 }, { "epoch": 1.6016114592658908, "grad_norm": 0.6068211615448192, "learning_rate": 3.8027112791435466e-05, "loss": 0.3932, "loss_nan_ranks": 0, "loss_rank_avg": 0.1983214020729065, "step": 895, "valid_targets_mean": 5167.1, "valid_targets_min": 1281 }, { "epoch": 1.6105640107430617, "grad_norm": 0.6812461385143791, "learning_rate": 3.7988292233975947e-05, "loss": 0.3481, "loss_nan_ranks": 0, "loss_rank_avg": 0.13996651768684387, "step": 900, "valid_targets_mean": 2514.6, "valid_targets_min": 1322 }, { "epoch": 1.6195165622202328, "grad_norm": 0.5697069170093747, "learning_rate": 3.7949113665065226e-05, "loss": 0.3647, "loss_nan_ranks": 0, "loss_rank_avg": 0.11300276964902878, "step": 905, "valid_targets_mean": 2734.5, "valid_targets_min": 954 }, { "epoch": 1.6284691136974039, "grad_norm": 0.7967680943849905, "learning_rate": 3.7909577864453593e-05, "loss": 0.3654, "loss_nan_ranks": 0, "loss_rank_avg": 0.19516390562057495, "step": 910, "valid_targets_mean": 2512.0, "valid_targets_min": 1348 }, { "epoch": 1.6374216651745748, "grad_norm": 0.6714153332367297, "learning_rate": 3.786968561900116e-05, "loss": 0.3911, "loss_nan_ranks": 0, "loss_rank_avg": 0.1842774748802185, "step": 915, "valid_targets_mean": 3405.9, "valid_targets_min": 1271 }, { "epoch": 1.6463742166517457, "grad_norm": 0.6561038510002812, "learning_rate": 3.782943772266213e-05, "loss": 0.3851, "loss_nan_ranks": 0, "loss_rank_avg": 0.23451654613018036, "step": 920, "valid_targets_mean": 4284.4, "valid_targets_min": 530 }, { "epoch": 1.6553267681289168, "grad_norm": 0.6142681543103801, "learning_rate": 3.7788834976469095e-05, "loss": 0.3575, "loss_nan_ranks": 0, "loss_rank_avg": 0.20726540684700012, "step": 925, "valid_targets_mean": 4569.1, "valid_targets_min": 2473 }, { "epoch": 1.6642793196060879, "grad_norm": 0.6213721879990686, "learning_rate": 3.7747878188516965e-05, "loss": 0.3717, "loss_nan_ranks": 0, "loss_rank_avg": 0.21202799677848816, "step": 930, "valid_targets_mean": 4032.8, "valid_targets_min": 2941 }, { "epoch": 1.6732318710832588, "grad_norm": 0.5774124752627617, "learning_rate": 3.770656817394703e-05, "loss": 0.3759, "loss_nan_ranks": 0, "loss_rank_avg": 0.09195344150066376, "step": 935, "valid_targets_mean": 2147.5, "valid_targets_min": 1288 }, { "epoch": 1.6821844225604297, "grad_norm": 0.5792812289191612, "learning_rate": 3.7664905754930616e-05, "loss": 0.3811, "loss_nan_ranks": 0, "loss_rank_avg": 0.2350800782442093, "step": 940, "valid_targets_mean": 5344.9, "valid_targets_min": 2115 }, { "epoch": 1.6911369740376008, "grad_norm": 0.5250025119182727, "learning_rate": 3.762289176065276e-05, "loss": 0.3378, "loss_nan_ranks": 0, "loss_rank_avg": 0.19462850689888, "step": 945, "valid_targets_mean": 6841.0, "valid_targets_min": 2135 }, { "epoch": 1.7000895255147717, "grad_norm": 0.649613775475992, "learning_rate": 3.758052702729576e-05, "loss": 0.3504, "loss_nan_ranks": 0, "loss_rank_avg": 0.17525091767311096, "step": 950, "valid_targets_mean": 3303.4, "valid_targets_min": 1450 }, { "epoch": 1.7090420769919428, "grad_norm": 0.6480009935206632, "learning_rate": 3.753781239802245e-05, "loss": 0.3371, "loss_nan_ranks": 0, "loss_rank_avg": 0.17123568058013916, "step": 955, "valid_targets_mean": 3213.5, "valid_targets_min": 1432 }, { "epoch": 1.7179946284691137, "grad_norm": 0.5665419742760008, "learning_rate": 3.749474872295946e-05, "loss": 0.3598, "loss_nan_ranks": 0, "loss_rank_avg": 0.17659839987754822, "step": 960, "valid_targets_mean": 4176.4, "valid_targets_min": 1155 }, { "epoch": 1.7269471799462845, "grad_norm": 0.4711008135049166, "learning_rate": 3.745133685918032e-05, "loss": 0.358, "loss_nan_ranks": 0, "loss_rank_avg": 0.13374367356300354, "step": 965, "valid_targets_mean": 4934.9, "valid_targets_min": 1677 }, { "epoch": 1.7358997314234557, "grad_norm": 0.5941103023388754, "learning_rate": 3.740757767068834e-05, "loss": 0.353, "loss_nan_ranks": 0, "loss_rank_avg": 0.18420416116714478, "step": 970, "valid_targets_mean": 4014.4, "valid_targets_min": 1444 }, { "epoch": 1.7448522829006268, "grad_norm": 0.6018670288242158, "learning_rate": 3.7363472028399476e-05, "loss": 0.3582, "loss_nan_ranks": 0, "loss_rank_avg": 0.20882412791252136, "step": 975, "valid_targets_mean": 4805.8, "valid_targets_min": 1521 }, { "epoch": 1.7538048343777977, "grad_norm": 0.5684940241609523, "learning_rate": 3.7319020810124965e-05, "loss": 0.3466, "loss_nan_ranks": 0, "loss_rank_avg": 0.13425326347351074, "step": 980, "valid_targets_mean": 2943.4, "valid_targets_min": 1368 }, { "epoch": 1.7627573858549686, "grad_norm": 0.578302453704476, "learning_rate": 3.727422490055386e-05, "loss": 0.3591, "loss_nan_ranks": 0, "loss_rank_avg": 0.16196070611476898, "step": 985, "valid_targets_mean": 4246.9, "valid_targets_min": 1018 }, { "epoch": 1.7717099373321397, "grad_norm": 0.5126381116701886, "learning_rate": 3.72290851912354e-05, "loss": 0.3493, "loss_nan_ranks": 0, "loss_rank_avg": 0.1364893913269043, "step": 990, "valid_targets_mean": 4596.4, "valid_targets_min": 1367 }, { "epoch": 1.7806624888093108, "grad_norm": 0.6689103493428239, "learning_rate": 3.718360258056133e-05, "loss": 0.3603, "loss_nan_ranks": 0, "loss_rank_avg": 0.17874747514724731, "step": 995, "valid_targets_mean": 3822.0, "valid_targets_min": 1367 }, { "epoch": 1.7896150402864817, "grad_norm": 0.5733552205006976, "learning_rate": 3.713777797374794e-05, "loss": 0.342, "loss_nan_ranks": 0, "loss_rank_avg": 0.1342494636774063, "step": 1000, "valid_targets_mean": 3976.6, "valid_targets_min": 1779 }, { "epoch": 1.7985675917636526, "grad_norm": 0.615956841130552, "learning_rate": 3.709161228281811e-05, "loss": 0.3577, "loss_nan_ranks": 0, "loss_rank_avg": 0.1488458812236786, "step": 1005, "valid_targets_mean": 3553.6, "valid_targets_min": 1921 }, { "epoch": 1.8075201432408237, "grad_norm": 0.6675507908636208, "learning_rate": 3.704510642658314e-05, "loss": 0.3541, "loss_nan_ranks": 0, "loss_rank_avg": 0.10533076524734497, "step": 1010, "valid_targets_mean": 2549.6, "valid_targets_min": 1152 }, { "epoch": 1.8164726947179948, "grad_norm": 0.5622567774770557, "learning_rate": 3.699826133062443e-05, "loss": 0.3486, "loss_nan_ranks": 0, "loss_rank_avg": 0.16377931833267212, "step": 1015, "valid_targets_mean": 4790.0, "valid_targets_min": 1564 }, { "epoch": 1.8254252461951657, "grad_norm": 0.7045205939224921, "learning_rate": 3.6951077927275126e-05, "loss": 0.3626, "loss_nan_ranks": 0, "loss_rank_avg": 0.17814645171165466, "step": 1020, "valid_targets_mean": 3490.4, "valid_targets_min": 1701 }, { "epoch": 1.8343777976723366, "grad_norm": 0.5623018666792298, "learning_rate": 3.6903557155601503e-05, "loss": 0.3467, "loss_nan_ranks": 0, "loss_rank_avg": 0.15948252379894257, "step": 1025, "valid_targets_mean": 4541.9, "valid_targets_min": 1733 }, { "epoch": 1.8433303491495077, "grad_norm": 0.6793583770529867, "learning_rate": 3.685569996138431e-05, "loss": 0.3511, "loss_nan_ranks": 0, "loss_rank_avg": 0.18709158897399902, "step": 1030, "valid_targets_mean": 3235.8, "valid_targets_min": 1280 }, { "epoch": 1.8522829006266786, "grad_norm": 0.6230901893070521, "learning_rate": 3.680750729709993e-05, "loss": 0.3584, "loss_nan_ranks": 0, "loss_rank_avg": 0.20924879610538483, "step": 1035, "valid_targets_mean": 3889.1, "valid_targets_min": 1246 }, { "epoch": 1.8612354521038497, "grad_norm": 0.6213562591140741, "learning_rate": 3.675898012190143e-05, "loss": 0.3459, "loss_nan_ranks": 0, "loss_rank_avg": 0.17583440244197845, "step": 1040, "valid_targets_mean": 3936.8, "valid_targets_min": 1664 }, { "epoch": 1.8701880035810206, "grad_norm": 0.6347145618018462, "learning_rate": 3.6710119401599474e-05, "loss": 0.3631, "loss_nan_ranks": 0, "loss_rank_avg": 0.1309717744588852, "step": 1045, "valid_targets_mean": 2106.9, "valid_targets_min": 857 }, { "epoch": 1.8791405550581914, "grad_norm": 0.58973298577871, "learning_rate": 3.6660926108643086e-05, "loss": 0.3545, "loss_nan_ranks": 0, "loss_rank_avg": 0.19553452730178833, "step": 1050, "valid_targets_mean": 3828.2, "valid_targets_min": 1020 }, { "epoch": 1.8880931065353626, "grad_norm": 0.6896943990427881, "learning_rate": 3.661140122210032e-05, "loss": 0.3628, "loss_nan_ranks": 0, "loss_rank_avg": 0.12913288176059723, "step": 1055, "valid_targets_mean": 2498.1, "valid_targets_min": 1305 }, { "epoch": 1.8970456580125337, "grad_norm": 0.623411962311995, "learning_rate": 3.656154572763877e-05, "loss": 0.3239, "loss_nan_ranks": 0, "loss_rank_avg": 0.14518050849437714, "step": 1060, "valid_targets_mean": 4387.0, "valid_targets_min": 1385 }, { "epoch": 1.9059982094897046, "grad_norm": 0.6976422673738203, "learning_rate": 3.651136061750592e-05, "loss": 0.3605, "loss_nan_ranks": 0, "loss_rank_avg": 0.1363721787929535, "step": 1065, "valid_targets_mean": 2462.8, "valid_targets_min": 1088 }, { "epoch": 1.9149507609668754, "grad_norm": 0.5544024419127411, "learning_rate": 3.646084689050942e-05, "loss": 0.3551, "loss_nan_ranks": 0, "loss_rank_avg": 0.23097077012062073, "step": 1070, "valid_targets_mean": 5681.8, "valid_targets_min": 777 }, { "epoch": 1.9239033124440466, "grad_norm": 0.5989450206693978, "learning_rate": 3.641000555199725e-05, "loss": 0.3672, "loss_nan_ranks": 0, "loss_rank_avg": 0.3325088322162628, "step": 1075, "valid_targets_mean": 6761.1, "valid_targets_min": 1202 }, { "epoch": 1.9328558639212177, "grad_norm": 0.5099408282063519, "learning_rate": 3.6358837613837604e-05, "loss": 0.3281, "loss_nan_ranks": 0, "loss_rank_avg": 0.1250154674053192, "step": 1080, "valid_targets_mean": 3475.6, "valid_targets_min": 1433 }, { "epoch": 1.9418084153983886, "grad_norm": 0.6114130466606059, "learning_rate": 3.630734409439887e-05, "loss": 0.3657, "loss_nan_ranks": 0, "loss_rank_avg": 0.18339493870735168, "step": 1085, "valid_targets_mean": 4119.0, "valid_targets_min": 1102 }, { "epoch": 1.9507609668755594, "grad_norm": 0.7222349042904347, "learning_rate": 3.625552601852928e-05, "loss": 0.3591, "loss_nan_ranks": 0, "loss_rank_avg": 0.1875397115945816, "step": 1090, "valid_targets_mean": 2863.2, "valid_targets_min": 940 }, { "epoch": 1.9597135183527306, "grad_norm": 0.6804750208910717, "learning_rate": 3.6203384417536566e-05, "loss": 0.3557, "loss_nan_ranks": 0, "loss_rank_avg": 0.18265077471733093, "step": 1095, "valid_targets_mean": 3868.4, "valid_targets_min": 1400 }, { "epoch": 1.9686660698299017, "grad_norm": 0.6657262397912295, "learning_rate": 3.615092032916736e-05, "loss": 0.3675, "loss_nan_ranks": 0, "loss_rank_avg": 0.16759824752807617, "step": 1100, "valid_targets_mean": 3627.8, "valid_targets_min": 810 }, { "epoch": 1.9776186213070726, "grad_norm": 0.6073636882366005, "learning_rate": 3.6098134797586646e-05, "loss": 0.3568, "loss_nan_ranks": 0, "loss_rank_avg": 0.12195791304111481, "step": 1105, "valid_targets_mean": 2877.5, "valid_targets_min": 1204 }, { "epoch": 1.9865711727842434, "grad_norm": 0.8596770463224701, "learning_rate": 3.604502887335688e-05, "loss": 0.3513, "loss_nan_ranks": 0, "loss_rank_avg": 0.19915196299552917, "step": 1110, "valid_targets_mean": 5150.5, "valid_targets_min": 2758 }, { "epoch": 1.9955237242614146, "grad_norm": 0.5642215443988173, "learning_rate": 3.599160361341715e-05, "loss": 0.3378, "loss_nan_ranks": 0, "loss_rank_avg": 0.16652005910873413, "step": 1115, "valid_targets_mean": 4599.1, "valid_targets_min": 742 }, { "epoch": 2.003581020590868, "grad_norm": 0.6052219331868266, "learning_rate": 3.59378600810621e-05, "loss": 0.3411, "loss_nan_ranks": 0, "loss_rank_avg": 0.20534177124500275, "step": 1120, "valid_targets_mean": 5202.9, "valid_targets_min": 2496 }, { "epoch": 2.0125335720680395, "grad_norm": 0.6372134090351926, "learning_rate": 3.588379934592078e-05, "loss": 0.322, "loss_nan_ranks": 0, "loss_rank_avg": 0.12786754965782166, "step": 1125, "valid_targets_mean": 2973.5, "valid_targets_min": 1293 }, { "epoch": 2.0214861235452104, "grad_norm": 0.6723864873622751, "learning_rate": 3.5829422483935374e-05, "loss": 0.3583, "loss_nan_ranks": 0, "loss_rank_avg": 0.15999622642993927, "step": 1130, "valid_targets_mean": 3738.4, "valid_targets_min": 1399 }, { "epoch": 2.0304386750223813, "grad_norm": 0.6401323119556832, "learning_rate": 3.577473057733975e-05, "loss": 0.3392, "loss_nan_ranks": 0, "loss_rank_avg": 0.12839260697364807, "step": 1135, "valid_targets_mean": 3227.8, "valid_targets_min": 684 }, { "epoch": 2.039391226499552, "grad_norm": 0.5527559741075448, "learning_rate": 3.571972471463795e-05, "loss": 0.3239, "loss_nan_ranks": 0, "loss_rank_avg": 0.17527739703655243, "step": 1140, "valid_targets_mean": 5061.2, "valid_targets_min": 1219 }, { "epoch": 2.0483437779767235, "grad_norm": 0.453223635680156, "learning_rate": 3.566440599058253e-05, "loss": 0.3252, "loss_nan_ranks": 0, "loss_rank_avg": 0.0904235690832138, "step": 1145, "valid_targets_mean": 3904.6, "valid_targets_min": 1378 }, { "epoch": 2.0572963294538944, "grad_norm": 0.7061541670317182, "learning_rate": 3.560877550615275e-05, "loss": 0.3318, "loss_nan_ranks": 0, "loss_rank_avg": 0.17458279430866241, "step": 1150, "valid_targets_mean": 3816.8, "valid_targets_min": 1423 }, { "epoch": 2.0662488809310653, "grad_norm": 0.5763514441348033, "learning_rate": 3.555283436853267e-05, "loss": 0.3163, "loss_nan_ranks": 0, "loss_rank_avg": 0.10202936828136444, "step": 1155, "valid_targets_mean": 2085.8, "valid_targets_min": 348 }, { "epoch": 2.075201432408236, "grad_norm": 0.6128115206461063, "learning_rate": 3.549658369108911e-05, "loss": 0.3059, "loss_nan_ranks": 0, "loss_rank_avg": 0.07467757165431976, "step": 1160, "valid_targets_mean": 1714.5, "valid_targets_min": 854 }, { "epoch": 2.0841539838854075, "grad_norm": 0.6446047657894652, "learning_rate": 3.544002459334952e-05, "loss": 0.3237, "loss_nan_ranks": 0, "loss_rank_avg": 0.20798584818840027, "step": 1165, "valid_targets_mean": 5297.9, "valid_targets_min": 2317 }, { "epoch": 2.0931065353625784, "grad_norm": 0.7059351630467845, "learning_rate": 3.5383158200979636e-05, "loss": 0.3004, "loss_nan_ranks": 0, "loss_rank_avg": 0.17275607585906982, "step": 1170, "valid_targets_mean": 2938.5, "valid_targets_min": 1575 }, { "epoch": 2.1020590868397493, "grad_norm": 0.5826650464806887, "learning_rate": 3.532598564576117e-05, "loss": 0.329, "loss_nan_ranks": 0, "loss_rank_avg": 0.14418719708919525, "step": 1175, "valid_targets_mean": 4263.2, "valid_targets_min": 1440 }, { "epoch": 2.11101163831692, "grad_norm": 0.6875978539339866, "learning_rate": 3.526850806556919e-05, "loss": 0.3385, "loss_nan_ranks": 0, "loss_rank_avg": 0.17782482504844666, "step": 1180, "valid_targets_mean": 3434.2, "valid_targets_min": 2377 }, { "epoch": 2.1199641897940915, "grad_norm": 0.5535655704379627, "learning_rate": 3.521072660434952e-05, "loss": 0.3388, "loss_nan_ranks": 0, "loss_rank_avg": 0.19075921177864075, "step": 1185, "valid_targets_mean": 4385.1, "valid_targets_min": 1440 }, { "epoch": 2.1289167412712624, "grad_norm": 0.5373177167125995, "learning_rate": 3.5152642412095984e-05, "loss": 0.333, "loss_nan_ranks": 0, "loss_rank_avg": 0.1952834129333496, "step": 1190, "valid_targets_mean": 4648.5, "valid_targets_min": 1982 }, { "epoch": 2.1378692927484333, "grad_norm": 0.6179979971643651, "learning_rate": 3.5094256644827474e-05, "loss": 0.3193, "loss_nan_ranks": 0, "loss_rank_avg": 0.12283094227313995, "step": 1195, "valid_targets_mean": 3926.1, "valid_targets_min": 1374 }, { "epoch": 2.146821844225604, "grad_norm": 0.6783117172187012, "learning_rate": 3.503557046456501e-05, "loss": 0.3227, "loss_nan_ranks": 0, "loss_rank_avg": 0.17674294114112854, "step": 1200, "valid_targets_mean": 3098.4, "valid_targets_min": 1504 }, { "epoch": 2.1557743957027755, "grad_norm": 0.5363304730541903, "learning_rate": 3.4976585039308535e-05, "loss": 0.3409, "loss_nan_ranks": 0, "loss_rank_avg": 0.18800324201583862, "step": 1205, "valid_targets_mean": 5661.8, "valid_targets_min": 592 }, { "epoch": 2.1647269471799464, "grad_norm": 0.6647851175758868, "learning_rate": 3.491730154301372e-05, "loss": 0.3397, "loss_nan_ranks": 0, "loss_rank_avg": 0.14593389630317688, "step": 1210, "valid_targets_mean": 3087.5, "valid_targets_min": 1108 }, { "epoch": 2.1736794986571173, "grad_norm": 0.6195332060911277, "learning_rate": 3.485772115556859e-05, "loss": 0.3178, "loss_nan_ranks": 0, "loss_rank_avg": 0.20628832280635834, "step": 1215, "valid_targets_mean": 5044.6, "valid_targets_min": 1387 }, { "epoch": 2.182632050134288, "grad_norm": 0.6787497059916711, "learning_rate": 3.4797845062770045e-05, "loss": 0.3337, "loss_nan_ranks": 0, "loss_rank_avg": 0.11903105676174164, "step": 1220, "valid_targets_mean": 2183.8, "valid_targets_min": 1277 }, { "epoch": 2.191584601611459, "grad_norm": 0.6282562749240457, "learning_rate": 3.473767445630022e-05, "loss": 0.3268, "loss_nan_ranks": 0, "loss_rank_avg": 0.142918199300766, "step": 1225, "valid_targets_mean": 3534.5, "valid_targets_min": 1357 }, { "epoch": 2.2005371530886304, "grad_norm": 0.7211672197526297, "learning_rate": 3.467721053370284e-05, "loss": 0.3097, "loss_nan_ranks": 0, "loss_rank_avg": 0.16219381988048553, "step": 1230, "valid_targets_mean": 2918.1, "valid_targets_min": 1453 }, { "epoch": 2.2094897045658013, "grad_norm": 0.5816702367464138, "learning_rate": 3.4616454498359306e-05, "loss": 0.308, "loss_nan_ranks": 0, "loss_rank_avg": 0.13409647345542908, "step": 1235, "valid_targets_mean": 3830.8, "valid_targets_min": 1249 }, { "epoch": 2.218442256042972, "grad_norm": 0.5734139252571135, "learning_rate": 3.4555407559464825e-05, "loss": 0.3242, "loss_nan_ranks": 0, "loss_rank_avg": 0.18026067316532135, "step": 1240, "valid_targets_mean": 5342.8, "valid_targets_min": 1652 }, { "epoch": 2.227394807520143, "grad_norm": 0.771243368082431, "learning_rate": 3.4494070932004274e-05, "loss": 0.3111, "loss_nan_ranks": 0, "loss_rank_avg": 0.1591377556324005, "step": 1245, "valid_targets_mean": 2311.4, "valid_targets_min": 1421 }, { "epoch": 2.2363473589973144, "grad_norm": 0.5336435857271173, "learning_rate": 3.4432445836728055e-05, "loss": 0.3079, "loss_nan_ranks": 0, "loss_rank_avg": 0.08339603245258331, "step": 1250, "valid_targets_mean": 2657.4, "valid_targets_min": 1575 }, { "epoch": 2.2452999104744853, "grad_norm": 0.6603765461133814, "learning_rate": 3.4370533500127794e-05, "loss": 0.3127, "loss_nan_ranks": 0, "loss_rank_avg": 0.1445946991443634, "step": 1255, "valid_targets_mean": 2847.9, "valid_targets_min": 1215 }, { "epoch": 2.254252461951656, "grad_norm": 0.562964584770617, "learning_rate": 3.430833515441193e-05, "loss": 0.3146, "loss_nan_ranks": 0, "loss_rank_avg": 0.1468866467475891, "step": 1260, "valid_targets_mean": 4139.5, "valid_targets_min": 1707 }, { "epoch": 2.263205013428827, "grad_norm": 0.5539438164656543, "learning_rate": 3.424585203748119e-05, "loss": 0.3575, "loss_nan_ranks": 0, "loss_rank_avg": 0.2521764039993286, "step": 1265, "valid_targets_mean": 6956.5, "valid_targets_min": 1362 }, { "epoch": 2.2721575649059984, "grad_norm": 0.525859014560588, "learning_rate": 3.4183085392903965e-05, "loss": 0.3346, "loss_nan_ranks": 0, "loss_rank_avg": 0.13610875606536865, "step": 1270, "valid_targets_mean": 4491.5, "valid_targets_min": 1387 }, { "epoch": 2.2811101163831693, "grad_norm": 0.5713317851483184, "learning_rate": 3.41200364698915e-05, "loss": 0.3171, "loss_nan_ranks": 0, "loss_rank_avg": 0.16015830636024475, "step": 1275, "valid_targets_mean": 4629.2, "valid_targets_min": 1121 }, { "epoch": 2.29006266786034, "grad_norm": 0.6197825601277361, "learning_rate": 3.405670652327313e-05, "loss": 0.324, "loss_nan_ranks": 0, "loss_rank_avg": 0.12453843653202057, "step": 1280, "valid_targets_mean": 2702.1, "valid_targets_min": 1198 }, { "epoch": 2.299015219337511, "grad_norm": 0.6081138136553563, "learning_rate": 3.399309681347123e-05, "loss": 0.352, "loss_nan_ranks": 0, "loss_rank_avg": 0.24878063797950745, "step": 1285, "valid_targets_mean": 5480.4, "valid_targets_min": 1878 }, { "epoch": 2.307967770814682, "grad_norm": 0.5662395930780025, "learning_rate": 3.392920860647617e-05, "loss": 0.3291, "loss_nan_ranks": 0, "loss_rank_avg": 0.20692947506904602, "step": 1290, "valid_targets_mean": 5727.5, "valid_targets_min": 1652 }, { "epoch": 2.3169203222918533, "grad_norm": 0.6357833331434369, "learning_rate": 3.3865043173821074e-05, "loss": 0.3363, "loss_nan_ranks": 0, "loss_rank_avg": 0.16444212198257446, "step": 1295, "valid_targets_mean": 3905.9, "valid_targets_min": 1131 }, { "epoch": 2.325872873769024, "grad_norm": 0.6131522307396422, "learning_rate": 3.380060179255656e-05, "loss": 0.3392, "loss_nan_ranks": 0, "loss_rank_avg": 0.1174757182598114, "step": 1300, "valid_targets_mean": 3201.8, "valid_targets_min": 1403 }, { "epoch": 2.334825425246195, "grad_norm": 0.6863608314070286, "learning_rate": 3.37358857452253e-05, "loss": 0.3427, "loss_nan_ranks": 0, "loss_rank_avg": 0.14921192824840546, "step": 1305, "valid_targets_mean": 3493.2, "valid_targets_min": 1655 }, { "epoch": 2.3437779767233664, "grad_norm": 0.5237704728272313, "learning_rate": 3.367089631983651e-05, "loss": 0.3363, "loss_nan_ranks": 0, "loss_rank_avg": 0.16521351039409637, "step": 1310, "valid_targets_mean": 5021.4, "valid_targets_min": 2158 }, { "epoch": 2.3527305282005373, "grad_norm": 0.6996060481011926, "learning_rate": 3.360563480984029e-05, "loss": 0.3055, "loss_nan_ranks": 0, "loss_rank_avg": 0.1772424280643463, "step": 1315, "valid_targets_mean": 3603.8, "valid_targets_min": 568 }, { "epoch": 2.361683079677708, "grad_norm": 0.7294480018686996, "learning_rate": 3.3540102514101904e-05, "loss": 0.3376, "loss_nan_ranks": 0, "loss_rank_avg": 0.20145997405052185, "step": 1320, "valid_targets_mean": 2952.6, "valid_targets_min": 957 }, { "epoch": 2.370635631154879, "grad_norm": 0.6581096747139857, "learning_rate": 3.347430073687592e-05, "loss": 0.3387, "loss_nan_ranks": 0, "loss_rank_avg": 0.19283172488212585, "step": 1325, "valid_targets_mean": 4159.8, "valid_targets_min": 1204 }, { "epoch": 2.37958818263205, "grad_norm": 0.7560342075752016, "learning_rate": 3.340823078778024e-05, "loss": 0.3084, "loss_nan_ranks": 0, "loss_rank_avg": 0.13571259379386902, "step": 1330, "valid_targets_mean": 3687.5, "valid_targets_min": 1318 }, { "epoch": 2.3885407341092213, "grad_norm": 0.6492264139164943, "learning_rate": 3.3341893981770086e-05, "loss": 0.3373, "loss_nan_ranks": 0, "loss_rank_avg": 0.17319390177726746, "step": 1335, "valid_targets_mean": 4212.1, "valid_targets_min": 1287 }, { "epoch": 2.397493285586392, "grad_norm": 0.7608633793249342, "learning_rate": 3.327529163911174e-05, "loss": 0.3399, "loss_nan_ranks": 0, "loss_rank_avg": 0.180658221244812, "step": 1340, "valid_targets_mean": 3035.4, "valid_targets_min": 1567 }, { "epoch": 2.406445837063563, "grad_norm": 0.6040569218759534, "learning_rate": 3.320842508535636e-05, "loss": 0.3418, "loss_nan_ranks": 0, "loss_rank_avg": 0.09077704697847366, "step": 1345, "valid_targets_mean": 2779.8, "valid_targets_min": 1270 }, { "epoch": 2.415398388540734, "grad_norm": 0.5775762445982943, "learning_rate": 3.314129565131355e-05, "loss": 0.3059, "loss_nan_ranks": 0, "loss_rank_avg": 0.17546844482421875, "step": 1350, "valid_targets_mean": 4502.0, "valid_targets_min": 1548 }, { "epoch": 2.424350940017905, "grad_norm": 0.6769552471767344, "learning_rate": 3.3073904673024854e-05, "loss": 0.3349, "loss_nan_ranks": 0, "loss_rank_avg": 0.15670402348041534, "step": 1355, "valid_targets_mean": 3034.5, "valid_targets_min": 999 }, { "epoch": 2.433303491495076, "grad_norm": 0.6316224464390162, "learning_rate": 3.300625349173723e-05, "loss": 0.3222, "loss_nan_ranks": 0, "loss_rank_avg": 0.16486474871635437, "step": 1360, "valid_targets_mean": 3398.2, "valid_targets_min": 1208 }, { "epoch": 2.442256042972247, "grad_norm": 0.5840973689561537, "learning_rate": 3.29383434538763e-05, "loss": 0.3246, "loss_nan_ranks": 0, "loss_rank_avg": 0.24210324883460999, "step": 1365, "valid_targets_mean": 4687.2, "valid_targets_min": 1368 }, { "epoch": 2.451208594449418, "grad_norm": 0.7500647888106254, "learning_rate": 3.287017591101957e-05, "loss": 0.3285, "loss_nan_ranks": 0, "loss_rank_avg": 0.13718849420547485, "step": 1370, "valid_targets_mean": 1851.1, "valid_targets_min": 742 }, { "epoch": 2.4601611459265893, "grad_norm": 0.5428272494700659, "learning_rate": 3.2801752219869536e-05, "loss": 0.324, "loss_nan_ranks": 0, "loss_rank_avg": 0.12291097640991211, "step": 1375, "valid_targets_mean": 3957.2, "valid_targets_min": 1438 }, { "epoch": 2.46911369740376, "grad_norm": 0.7959123302263251, "learning_rate": 3.273307374222667e-05, "loss": 0.3425, "loss_nan_ranks": 0, "loss_rank_avg": 0.13849949836730957, "step": 1380, "valid_targets_mean": 2558.8, "valid_targets_min": 972 }, { "epoch": 2.478066248880931, "grad_norm": 0.7062680019503911, "learning_rate": 3.266414184496233e-05, "loss": 0.3342, "loss_nan_ranks": 0, "loss_rank_avg": 0.1923518180847168, "step": 1385, "valid_targets_mean": 4609.4, "valid_targets_min": 1581 }, { "epoch": 2.487018800358102, "grad_norm": 0.6406251692788578, "learning_rate": 3.2594957899991566e-05, "loss": 0.3448, "loss_nan_ranks": 0, "loss_rank_avg": 0.11892961710691452, "step": 1390, "valid_targets_mean": 2757.5, "valid_targets_min": 980 }, { "epoch": 2.495971351835273, "grad_norm": 1.2275726101592588, "learning_rate": 3.2525523284245766e-05, "loss": 0.31, "loss_nan_ranks": 0, "loss_rank_avg": 0.11468460410833359, "step": 1395, "valid_targets_mean": 3384.9, "valid_targets_min": 1793 }, { "epoch": 2.504923903312444, "grad_norm": 0.6884681320356183, "learning_rate": 3.245583937964532e-05, "loss": 0.3223, "loss_nan_ranks": 0, "loss_rank_avg": 0.134379580616951, "step": 1400, "valid_targets_mean": 2567.1, "valid_targets_min": 1334 }, { "epoch": 2.513876454789615, "grad_norm": 0.7779458297473585, "learning_rate": 3.238590757307206e-05, "loss": 0.3203, "loss_nan_ranks": 0, "loss_rank_avg": 0.15265807509422302, "step": 1405, "valid_targets_mean": 2609.0, "valid_targets_min": 756 }, { "epoch": 2.522829006266786, "grad_norm": 0.6640063486633304, "learning_rate": 3.2315729256341686e-05, "loss": 0.3235, "loss_nan_ranks": 0, "loss_rank_avg": 0.1987053006887436, "step": 1410, "valid_targets_mean": 3837.5, "valid_targets_min": 1001 }, { "epoch": 2.5317815577439573, "grad_norm": 0.5553044657523085, "learning_rate": 3.2245305826176063e-05, "loss": 0.3326, "loss_nan_ranks": 0, "loss_rank_avg": 0.19759173691272736, "step": 1415, "valid_targets_mean": 6199.4, "valid_targets_min": 2226 }, { "epoch": 2.5407341092211277, "grad_norm": 0.709939055780021, "learning_rate": 3.217463868417541e-05, "loss": 0.3079, "loss_nan_ranks": 0, "loss_rank_avg": 0.1832863688468933, "step": 1420, "valid_targets_mean": 5806.5, "valid_targets_min": 1427 }, { "epoch": 2.549686660698299, "grad_norm": 0.6357425947737642, "learning_rate": 3.2103729236790434e-05, "loss": 0.3533, "loss_nan_ranks": 0, "loss_rank_avg": 0.195903941988945, "step": 1425, "valid_targets_mean": 3483.8, "valid_targets_min": 810 }, { "epoch": 2.55863921217547, "grad_norm": 0.636197345665908, "learning_rate": 3.203257889529428e-05, "loss": 0.3258, "loss_nan_ranks": 0, "loss_rank_avg": 0.11567019671201706, "step": 1430, "valid_targets_mean": 2667.1, "valid_targets_min": 1435 }, { "epoch": 2.567591763652641, "grad_norm": 0.7235618047532826, "learning_rate": 3.196118907575452e-05, "loss": 0.3383, "loss_nan_ranks": 0, "loss_rank_avg": 0.1823103278875351, "step": 1435, "valid_targets_mean": 3246.8, "valid_targets_min": 1396 }, { "epoch": 2.576544315129812, "grad_norm": 0.7047547532105115, "learning_rate": 3.188956119900491e-05, "loss": 0.3224, "loss_nan_ranks": 0, "loss_rank_avg": 0.16611355543136597, "step": 1440, "valid_targets_mean": 3224.5, "valid_targets_min": 1763 }, { "epoch": 2.585496866606983, "grad_norm": 0.6653266014374837, "learning_rate": 3.181769669061713e-05, "loss": 0.2964, "loss_nan_ranks": 0, "loss_rank_avg": 0.1501968652009964, "step": 1445, "valid_targets_mean": 3479.5, "valid_targets_min": 1221 }, { "epoch": 2.594449418084154, "grad_norm": 0.6844620037691017, "learning_rate": 3.174559698087244e-05, "loss": 0.3123, "loss_nan_ranks": 0, "loss_rank_avg": 0.1589304506778717, "step": 1450, "valid_targets_mean": 2945.6, "valid_targets_min": 297 }, { "epoch": 2.603401969561325, "grad_norm": 0.7613153397840512, "learning_rate": 3.1673263504733136e-05, "loss": 0.3334, "loss_nan_ranks": 0, "loss_rank_avg": 0.18859216570854187, "step": 1455, "valid_targets_mean": 2624.0, "valid_targets_min": 639 }, { "epoch": 2.6123545210384957, "grad_norm": 0.5871776640120691, "learning_rate": 3.160069770181411e-05, "loss": 0.31, "loss_nan_ranks": 0, "loss_rank_avg": 0.11848124116659164, "step": 1460, "valid_targets_mean": 3289.4, "valid_targets_min": 943 }, { "epoch": 2.621307072515667, "grad_norm": 0.605999766136029, "learning_rate": 3.152790101635408e-05, "loss": 0.3255, "loss_nan_ranks": 0, "loss_rank_avg": 0.13618788123130798, "step": 1465, "valid_targets_mean": 2836.8, "valid_targets_min": 770 }, { "epoch": 2.630259623992838, "grad_norm": 0.5726662176186619, "learning_rate": 3.145487489718692e-05, "loss": 0.3194, "loss_nan_ranks": 0, "loss_rank_avg": 0.15494957566261292, "step": 1470, "valid_targets_mean": 3869.1, "valid_targets_min": 1322 }, { "epoch": 2.639212175470009, "grad_norm": 0.5365989748453186, "learning_rate": 3.138162079771278e-05, "loss": 0.3115, "loss_nan_ranks": 0, "loss_rank_avg": 0.15874773263931274, "step": 1475, "valid_targets_mean": 4577.9, "valid_targets_min": 1279 }, { "epoch": 2.64816472694718, "grad_norm": 0.5551684662320231, "learning_rate": 3.1308140175869216e-05, "loss": 0.3184, "loss_nan_ranks": 0, "loss_rank_avg": 0.14446908235549927, "step": 1480, "valid_targets_mean": 4658.5, "valid_targets_min": 1400 }, { "epoch": 2.657117278424351, "grad_norm": 0.6388833788450519, "learning_rate": 3.123443449410211e-05, "loss": 0.3168, "loss_nan_ranks": 0, "loss_rank_avg": 0.1660110056400299, "step": 1485, "valid_targets_mean": 3828.0, "valid_targets_min": 1524 }, { "epoch": 2.666069829901522, "grad_norm": 0.7296008634040168, "learning_rate": 3.1160505219336594e-05, "loss": 0.3215, "loss_nan_ranks": 0, "loss_rank_avg": 0.19480803608894348, "step": 1490, "valid_targets_mean": 3797.8, "valid_targets_min": 1757 }, { "epoch": 2.675022381378693, "grad_norm": 0.5872767622862354, "learning_rate": 3.108635382294787e-05, "loss": 0.3317, "loss_nan_ranks": 0, "loss_rank_avg": 0.18170863389968872, "step": 1495, "valid_targets_mean": 4497.4, "valid_targets_min": 1429 }, { "epoch": 2.6839749328558637, "grad_norm": 0.6001385480022825, "learning_rate": 3.101198178073189e-05, "loss": 0.3295, "loss_nan_ranks": 0, "loss_rank_avg": 0.15100830793380737, "step": 1500, "valid_targets_mean": 3492.2, "valid_targets_min": 1173 }, { "epoch": 2.692927484333035, "grad_norm": 0.5942570457251561, "learning_rate": 3.093739057287603e-05, "loss": 0.3549, "loss_nan_ranks": 0, "loss_rank_avg": 0.2285933643579483, "step": 1505, "valid_targets_mean": 5245.6, "valid_targets_min": 1920 }, { "epoch": 2.701880035810206, "grad_norm": 0.5518275448844328, "learning_rate": 3.086258168392957e-05, "loss": 0.3334, "loss_nan_ranks": 0, "loss_rank_avg": 0.13938848674297333, "step": 1510, "valid_targets_mean": 3998.1, "valid_targets_min": 2193 }, { "epoch": 2.710832587287377, "grad_norm": 0.5695709347856279, "learning_rate": 3.0787556602774195e-05, "loss": 0.31, "loss_nan_ranks": 0, "loss_rank_avg": 0.11261847615242004, "step": 1515, "valid_targets_mean": 3775.1, "valid_targets_min": 1405 }, { "epoch": 2.7197851387645477, "grad_norm": 0.6491649502754991, "learning_rate": 3.071231682259437e-05, "loss": 0.3165, "loss_nan_ranks": 0, "loss_rank_avg": 0.0938911885023117, "step": 1520, "valid_targets_mean": 2205.0, "valid_targets_min": 1617 }, { "epoch": 2.7287376902417186, "grad_norm": 0.7019210724410154, "learning_rate": 3.063686384084756e-05, "loss": 0.3346, "loss_nan_ranks": 0, "loss_rank_avg": 0.19694435596466064, "step": 1525, "valid_targets_mean": 3414.0, "valid_targets_min": 1186 }, { "epoch": 2.73769024171889, "grad_norm": 0.6690446047856118, "learning_rate": 3.05611991592345e-05, "loss": 0.3368, "loss_nan_ranks": 0, "loss_rank_avg": 0.1392868608236313, "step": 1530, "valid_targets_mean": 2480.8, "valid_targets_min": 323 }, { "epoch": 2.746642793196061, "grad_norm": 0.522232064697356, "learning_rate": 3.0485324283669288e-05, "loss": 0.3168, "loss_nan_ranks": 0, "loss_rank_avg": 0.13069400191307068, "step": 1535, "valid_targets_mean": 4926.6, "valid_targets_min": 762 }, { "epoch": 2.7555953446732318, "grad_norm": 0.6183033586621423, "learning_rate": 3.0409240724249334e-05, "loss": 0.3265, "loss_nan_ranks": 0, "loss_rank_avg": 0.1853337287902832, "step": 1540, "valid_targets_mean": 4915.0, "valid_targets_min": 1817 }, { "epoch": 2.764547896150403, "grad_norm": 0.4868431778426567, "learning_rate": 3.033294999522545e-05, "loss": 0.3172, "loss_nan_ranks": 0, "loss_rank_avg": 0.15458467602729797, "step": 1545, "valid_targets_mean": 4923.0, "valid_targets_min": 1974 }, { "epoch": 2.773500447627574, "grad_norm": 0.7871239617122384, "learning_rate": 3.0256453614971594e-05, "loss": 0.3226, "loss_nan_ranks": 0, "loss_rank_avg": 0.17956718802452087, "step": 1550, "valid_targets_mean": 2356.8, "valid_targets_min": 1062 }, { "epoch": 2.782452999104745, "grad_norm": 0.6070057091754848, "learning_rate": 3.017975310595469e-05, "loss": 0.3107, "loss_nan_ranks": 0, "loss_rank_avg": 0.1523509919643402, "step": 1555, "valid_targets_mean": 3920.9, "valid_targets_min": 1789 }, { "epoch": 2.7914055505819158, "grad_norm": 0.5835084934822887, "learning_rate": 3.0102849994704343e-05, "loss": 0.3137, "loss_nan_ranks": 0, "loss_rank_avg": 0.24419042468070984, "step": 1560, "valid_targets_mean": 6938.5, "valid_targets_min": 1161 }, { "epoch": 2.8003581020590866, "grad_norm": 0.5723181812585326, "learning_rate": 3.0025745811782444e-05, "loss": 0.3184, "loss_nan_ranks": 0, "loss_rank_avg": 0.16458186507225037, "step": 1565, "valid_targets_mean": 6416.8, "valid_targets_min": 954 }, { "epoch": 2.809310653536258, "grad_norm": 0.8168745210965721, "learning_rate": 2.994844209175269e-05, "loss": 0.3298, "loss_nan_ranks": 0, "loss_rank_avg": 0.2504898011684418, "step": 1570, "valid_targets_mean": 6881.8, "valid_targets_min": 2422 }, { "epoch": 2.818263205013429, "grad_norm": 0.6134084352950554, "learning_rate": 2.987094037315008e-05, "loss": 0.3277, "loss_nan_ranks": 0, "loss_rank_avg": 0.10477450489997864, "step": 1575, "valid_targets_mean": 2753.1, "valid_targets_min": 1248 }, { "epoch": 2.8272157564905998, "grad_norm": 0.6017942096883853, "learning_rate": 2.9793242198450258e-05, "loss": 0.329, "loss_nan_ranks": 0, "loss_rank_avg": 0.22128619253635406, "step": 1580, "valid_targets_mean": 4756.5, "valid_targets_min": 1344 }, { "epoch": 2.836168307967771, "grad_norm": 0.6881016094467826, "learning_rate": 2.9715349114038825e-05, "loss": 0.3471, "loss_nan_ranks": 0, "loss_rank_avg": 0.2594001293182373, "step": 1585, "valid_targets_mean": 4732.9, "valid_targets_min": 1482 }, { "epoch": 2.845120859444942, "grad_norm": 0.6892520214493385, "learning_rate": 2.9637262670180597e-05, "loss": 0.3321, "loss_nan_ranks": 0, "loss_rank_avg": 0.15683342516422272, "step": 1590, "valid_targets_mean": 4689.9, "valid_targets_min": 1435 }, { "epoch": 2.854073410922113, "grad_norm": 0.5987162236177794, "learning_rate": 2.955898442098869e-05, "loss": 0.3264, "loss_nan_ranks": 0, "loss_rank_avg": 0.131935715675354, "step": 1595, "valid_targets_mean": 3541.9, "valid_targets_min": 2303 }, { "epoch": 2.8630259623992838, "grad_norm": 0.6058561074570699, "learning_rate": 2.948051592439363e-05, "loss": 0.3157, "loss_nan_ranks": 0, "loss_rank_avg": 0.15223629772663116, "step": 1600, "valid_targets_mean": 4136.6, "valid_targets_min": 923 }, { "epoch": 2.8719785138764546, "grad_norm": 0.643496513498291, "learning_rate": 2.9401858742112334e-05, "loss": 0.3344, "loss_nan_ranks": 0, "loss_rank_avg": 0.1517014503479004, "step": 1605, "valid_targets_mean": 3460.1, "valid_targets_min": 752 }, { "epoch": 2.880931065353626, "grad_norm": 0.6081337292995073, "learning_rate": 2.9323014439617044e-05, "loss": 0.3244, "loss_nan_ranks": 0, "loss_rank_avg": 0.1477939486503601, "step": 1610, "valid_targets_mean": 3606.8, "valid_targets_min": 1532 }, { "epoch": 2.889883616830797, "grad_norm": 0.7519232605972647, "learning_rate": 2.924398458610414e-05, "loss": 0.3522, "loss_nan_ranks": 0, "loss_rank_avg": 0.16121116280555725, "step": 1615, "valid_targets_mean": 2771.6, "valid_targets_min": 1246 }, { "epoch": 2.8988361683079678, "grad_norm": 0.7600425688063651, "learning_rate": 2.9164770754462926e-05, "loss": 0.33, "loss_nan_ranks": 0, "loss_rank_avg": 0.11213885247707367, "step": 1620, "valid_targets_mean": 1783.6, "valid_targets_min": 1319 }, { "epoch": 2.9077887197851386, "grad_norm": 0.7521189124061843, "learning_rate": 2.9085374521244333e-05, "loss": 0.3579, "loss_nan_ranks": 0, "loss_rank_avg": 0.12697280943393707, "step": 1625, "valid_targets_mean": 2481.1, "valid_targets_min": 1211 }, { "epoch": 2.9167412712623095, "grad_norm": 0.6453096854133333, "learning_rate": 2.900579746662954e-05, "loss": 0.3219, "loss_nan_ranks": 0, "loss_rank_avg": 0.2347714602947235, "step": 1630, "valid_targets_mean": 4646.9, "valid_targets_min": 1423 }, { "epoch": 2.925693822739481, "grad_norm": 0.6077027161283227, "learning_rate": 2.8926041174398496e-05, "loss": 0.3281, "loss_nan_ranks": 0, "loss_rank_avg": 0.14254099130630493, "step": 1635, "valid_targets_mean": 2738.0, "valid_targets_min": 1211 }, { "epoch": 2.9346463742166518, "grad_norm": 0.6255429232553751, "learning_rate": 2.8846107231898445e-05, "loss": 0.3075, "loss_nan_ranks": 0, "loss_rank_avg": 0.11949039995670319, "step": 1640, "valid_targets_mean": 2887.8, "valid_targets_min": 1159 }, { "epoch": 2.9435989256938226, "grad_norm": 0.5375741825450264, "learning_rate": 2.8765997230012295e-05, "loss": 0.3161, "loss_nan_ranks": 0, "loss_rank_avg": 0.16180676221847534, "step": 1645, "valid_targets_mean": 4740.6, "valid_targets_min": 1853 }, { "epoch": 2.952551477170994, "grad_norm": 0.5606317759146799, "learning_rate": 2.868571276312698e-05, "loss": 0.3313, "loss_nan_ranks": 0, "loss_rank_avg": 0.09235462546348572, "step": 1650, "valid_targets_mean": 2538.4, "valid_targets_min": 940 }, { "epoch": 2.961504028648165, "grad_norm": 0.495487570027274, "learning_rate": 2.860525542910171e-05, "loss": 0.3625, "loss_nan_ranks": 0, "loss_rank_avg": 0.15310625731945038, "step": 1655, "valid_targets_mean": 6490.4, "valid_targets_min": 1336 }, { "epoch": 2.9704565801253358, "grad_norm": 0.6035435039933449, "learning_rate": 2.852462682923619e-05, "loss": 0.3151, "loss_nan_ranks": 0, "loss_rank_avg": 0.11764907091856003, "step": 1660, "valid_targets_mean": 3602.6, "valid_targets_min": 1870 }, { "epoch": 2.9794091316025066, "grad_norm": 0.5800177987722784, "learning_rate": 2.844382856823872e-05, "loss": 0.315, "loss_nan_ranks": 0, "loss_rank_avg": 0.17618133127689362, "step": 1665, "valid_targets_mean": 4074.4, "valid_targets_min": 1877 }, { "epoch": 2.9883616830796775, "grad_norm": 0.5646098547959599, "learning_rate": 2.8362862254194298e-05, "loss": 0.3428, "loss_nan_ranks": 0, "loss_rank_avg": 0.1157437115907669, "step": 1670, "valid_targets_mean": 4417.1, "valid_targets_min": 1411 }, { "epoch": 2.997314234556849, "grad_norm": 0.5842366355959351, "learning_rate": 2.8281729498532574e-05, "loss": 0.3067, "loss_nan_ranks": 0, "loss_rank_avg": 0.11269823461771011, "step": 1675, "valid_targets_mean": 2794.1, "valid_targets_min": 1527 }, { "epoch": 3.0053715308863027, "grad_norm": 0.7896580577617582, "learning_rate": 2.8200431915995805e-05, "loss": 0.3189, "loss_nan_ranks": 0, "loss_rank_avg": 0.18021970987319946, "step": 1680, "valid_targets_mean": 2496.4, "valid_targets_min": 1147 }, { "epoch": 3.0143240823634736, "grad_norm": 0.6135743160512117, "learning_rate": 2.8118971124606712e-05, "loss": 0.2863, "loss_nan_ranks": 0, "loss_rank_avg": 0.11502575874328613, "step": 1685, "valid_targets_mean": 3006.2, "valid_targets_min": 546 }, { "epoch": 3.0232766338406445, "grad_norm": 0.778235505268862, "learning_rate": 2.8037348745636274e-05, "loss": 0.3078, "loss_nan_ranks": 0, "loss_rank_avg": 0.16493195295333862, "step": 1690, "valid_targets_mean": 3107.1, "valid_targets_min": 1264 }, { "epoch": 3.0322291853178154, "grad_norm": 0.6754797455330058, "learning_rate": 2.7955566403571464e-05, "loss": 0.2957, "loss_nan_ranks": 0, "loss_rank_avg": 0.10485086590051651, "step": 1695, "valid_targets_mean": 2169.6, "valid_targets_min": 997 }, { "epoch": 3.0411817367949867, "grad_norm": 0.6283660091763017, "learning_rate": 2.78736257260829e-05, "loss": 0.2894, "loss_nan_ranks": 0, "loss_rank_avg": 0.18023446202278137, "step": 1700, "valid_targets_mean": 4900.4, "valid_targets_min": 1553 }, { "epoch": 3.0501342882721576, "grad_norm": 0.613476158397626, "learning_rate": 2.7791528343992494e-05, "loss": 0.2878, "loss_nan_ranks": 0, "loss_rank_avg": 0.14587222039699554, "step": 1705, "valid_targets_mean": 4158.8, "valid_targets_min": 2135 }, { "epoch": 3.0590868397493285, "grad_norm": 0.7294903187312021, "learning_rate": 2.7709275891240936e-05, "loss": 0.3128, "loss_nan_ranks": 0, "loss_rank_avg": 0.1322895586490631, "step": 1710, "valid_targets_mean": 2585.0, "valid_targets_min": 1878 }, { "epoch": 3.0680393912264994, "grad_norm": 0.6572500474612717, "learning_rate": 2.7626870004855236e-05, "loss": 0.2841, "loss_nan_ranks": 0, "loss_rank_avg": 0.15101733803749084, "step": 1715, "valid_targets_mean": 4297.8, "valid_targets_min": 1439 }, { "epoch": 3.0769919427036707, "grad_norm": 0.6803417140783832, "learning_rate": 2.7544312324916088e-05, "loss": 0.2985, "loss_nan_ranks": 0, "loss_rank_avg": 0.14546285569667816, "step": 1720, "valid_targets_mean": 3869.4, "valid_targets_min": 1324 }, { "epoch": 3.0859444941808416, "grad_norm": 0.6317442286776777, "learning_rate": 2.7461604494525257e-05, "loss": 0.3139, "loss_nan_ranks": 0, "loss_rank_avg": 0.1800333857536316, "step": 1725, "valid_targets_mean": 4861.0, "valid_targets_min": 1163 }, { "epoch": 3.0948970456580125, "grad_norm": 0.7419679306586767, "learning_rate": 2.7378748159772888e-05, "loss": 0.2832, "loss_nan_ranks": 0, "loss_rank_avg": 0.15141788125038147, "step": 1730, "valid_targets_mean": 2425.8, "valid_targets_min": 1532 }, { "epoch": 3.1038495971351834, "grad_norm": 0.7184181395352648, "learning_rate": 2.7295744969704725e-05, "loss": 0.2963, "loss_nan_ranks": 0, "loss_rank_avg": 0.19635578989982605, "step": 1735, "valid_targets_mean": 3549.2, "valid_targets_min": 1355 }, { "epoch": 3.1128021486123547, "grad_norm": 0.5637059424050045, "learning_rate": 2.7212596576289264e-05, "loss": 0.3024, "loss_nan_ranks": 0, "loss_rank_avg": 0.0870228111743927, "step": 1740, "valid_targets_mean": 2423.9, "valid_targets_min": 872 }, { "epoch": 3.1217547000895256, "grad_norm": 0.6187756682224378, "learning_rate": 2.712930463438496e-05, "loss": 0.3054, "loss_nan_ranks": 0, "loss_rank_avg": 0.1919945776462555, "step": 1745, "valid_targets_mean": 4811.8, "valid_targets_min": 955 }, { "epoch": 3.1307072515666965, "grad_norm": 0.59176036605801, "learning_rate": 2.7045870801707194e-05, "loss": 0.3001, "loss_nan_ranks": 0, "loss_rank_avg": 0.11655890196561813, "step": 1750, "valid_targets_mean": 2882.5, "valid_targets_min": 1410 }, { "epoch": 3.1396598030438674, "grad_norm": 0.6273416731577955, "learning_rate": 2.6962296738795344e-05, "loss": 0.2834, "loss_nan_ranks": 0, "loss_rank_avg": 0.1495613157749176, "step": 1755, "valid_targets_mean": 5002.0, "valid_targets_min": 1440 }, { "epoch": 3.1486123545210383, "grad_norm": 0.645728944689026, "learning_rate": 2.687858410897971e-05, "loss": 0.3095, "loss_nan_ranks": 0, "loss_rank_avg": 0.1856779158115387, "step": 1760, "valid_targets_mean": 3773.8, "valid_targets_min": 1118 }, { "epoch": 3.1575649059982096, "grad_norm": 0.7516562586294452, "learning_rate": 2.679473457834842e-05, "loss": 0.3043, "loss_nan_ranks": 0, "loss_rank_avg": 0.14939184486865997, "step": 1765, "valid_targets_mean": 2931.6, "valid_targets_min": 1250 }, { "epoch": 3.1665174574753805, "grad_norm": 0.6046394108437115, "learning_rate": 2.6710749815714262e-05, "loss": 0.2895, "loss_nan_ranks": 0, "loss_rank_avg": 0.13386991620063782, "step": 1770, "valid_targets_mean": 3748.0, "valid_targets_min": 1578 }, { "epoch": 3.1754700089525514, "grad_norm": 0.7118151612384511, "learning_rate": 2.6626631492581475e-05, "loss": 0.3022, "loss_nan_ranks": 0, "loss_rank_avg": 0.16341659426689148, "step": 1775, "valid_targets_mean": 2723.5, "valid_targets_min": 601 }, { "epoch": 3.1844225604297223, "grad_norm": 0.6155300408382743, "learning_rate": 2.654238128311249e-05, "loss": 0.2781, "loss_nan_ranks": 0, "loss_rank_avg": 0.15156874060630798, "step": 1780, "valid_targets_mean": 3313.4, "valid_targets_min": 1402 }, { "epoch": 3.1933751119068936, "grad_norm": 0.8067424596360118, "learning_rate": 2.645800086409458e-05, "loss": 0.3205, "loss_nan_ranks": 0, "loss_rank_avg": 0.20328623056411743, "step": 1785, "valid_targets_mean": 3177.9, "valid_targets_min": 1310 }, { "epoch": 3.2023276633840645, "grad_norm": 0.641857203118475, "learning_rate": 2.637349191490654e-05, "loss": 0.2971, "loss_nan_ranks": 0, "loss_rank_avg": 0.2052251100540161, "step": 1790, "valid_targets_mean": 4034.6, "valid_targets_min": 668 }, { "epoch": 3.2112802148612354, "grad_norm": 0.6368261308999402, "learning_rate": 2.6288856117485216e-05, "loss": 0.2986, "loss_nan_ranks": 0, "loss_rank_avg": 0.17902475595474243, "step": 1795, "valid_targets_mean": 4138.2, "valid_targets_min": 1206 }, { "epoch": 3.2202327663384063, "grad_norm": 0.5548069381687681, "learning_rate": 2.6204095156292048e-05, "loss": 0.3007, "loss_nan_ranks": 0, "loss_rank_avg": 0.14810031652450562, "step": 1800, "valid_targets_mean": 5104.6, "valid_targets_min": 1210 }, { "epoch": 3.2291853178155776, "grad_norm": 0.753660257908115, "learning_rate": 2.6119210718279538e-05, "loss": 0.2975, "loss_nan_ranks": 0, "loss_rank_avg": 0.11428888142108917, "step": 1805, "valid_targets_mean": 2015.9, "valid_targets_min": 1291 }, { "epoch": 3.2381378692927485, "grad_norm": 0.5660494935503344, "learning_rate": 2.60342044928577e-05, "loss": 0.2941, "loss_nan_ranks": 0, "loss_rank_avg": 0.13116174936294556, "step": 1810, "valid_targets_mean": 4031.4, "valid_targets_min": 1595 }, { "epoch": 3.2470904207699194, "grad_norm": 0.533929651082135, "learning_rate": 2.5949078171860395e-05, "loss": 0.3124, "loss_nan_ranks": 0, "loss_rank_avg": 0.12700650095939636, "step": 1815, "valid_targets_mean": 5214.2, "valid_targets_min": 1254 }, { "epoch": 3.2560429722470903, "grad_norm": 0.5416322919386064, "learning_rate": 2.5863833449511706e-05, "loss": 0.2854, "loss_nan_ranks": 0, "loss_rank_avg": 0.17714446783065796, "step": 1820, "valid_targets_mean": 6259.0, "valid_targets_min": 1927 }, { "epoch": 3.2649955237242616, "grad_norm": 0.43344116835180807, "learning_rate": 2.5778472022392184e-05, "loss": 0.2884, "loss_nan_ranks": 0, "loss_rank_avg": 0.21672791242599487, "step": 1825, "valid_targets_mean": 10914.1, "valid_targets_min": 1495 }, { "epoch": 3.2739480752014325, "grad_norm": 0.5802891194562758, "learning_rate": 2.5692995589405087e-05, "loss": 0.3197, "loss_nan_ranks": 0, "loss_rank_avg": 0.127014622092247, "step": 1830, "valid_targets_mean": 3817.8, "valid_targets_min": 1465 }, { "epoch": 3.2829006266786034, "grad_norm": 0.64587786194205, "learning_rate": 2.5607405851742578e-05, "loss": 0.2982, "loss_nan_ranks": 0, "loss_rank_avg": 0.1963973343372345, "step": 1835, "valid_targets_mean": 4352.9, "valid_targets_min": 1256 }, { "epoch": 3.2918531781557743, "grad_norm": 0.5684432148710743, "learning_rate": 2.5521704512851884e-05, "loss": 0.2806, "loss_nan_ranks": 0, "loss_rank_avg": 0.15847089886665344, "step": 1840, "valid_targets_mean": 4296.1, "valid_targets_min": 979 }, { "epoch": 3.3008057296329456, "grad_norm": 0.6666687517731704, "learning_rate": 2.5435893278401328e-05, "loss": 0.2888, "loss_nan_ranks": 0, "loss_rank_avg": 0.1337079405784607, "step": 1845, "valid_targets_mean": 3256.2, "valid_targets_min": 1158 }, { "epoch": 3.3097582811101165, "grad_norm": 0.7717906084958367, "learning_rate": 2.534997385624647e-05, "loss": 0.2996, "loss_nan_ranks": 0, "loss_rank_avg": 0.12368161976337433, "step": 1850, "valid_targets_mean": 2424.4, "valid_targets_min": 890 }, { "epoch": 3.3187108325872874, "grad_norm": 0.735202247533644, "learning_rate": 2.5263947956396043e-05, "loss": 0.2875, "loss_nan_ranks": 0, "loss_rank_avg": 0.112772636115551, "step": 1855, "valid_targets_mean": 2231.6, "valid_targets_min": 1053 }, { "epoch": 3.3276633840644583, "grad_norm": 0.7702737075049189, "learning_rate": 2.5177817290977967e-05, "loss": 0.2646, "loss_nan_ranks": 0, "loss_rank_avg": 0.14182201027870178, "step": 1860, "valid_targets_mean": 2349.6, "valid_targets_min": 1470 }, { "epoch": 3.336615935541629, "grad_norm": 0.6119811350195906, "learning_rate": 2.5091583574205247e-05, "loss": 0.2932, "loss_nan_ranks": 0, "loss_rank_avg": 0.14366689324378967, "step": 1865, "valid_targets_mean": 4402.0, "valid_targets_min": 1261 }, { "epoch": 3.3455684870188005, "grad_norm": 0.6505709086023806, "learning_rate": 2.5005248522341868e-05, "loss": 0.3175, "loss_nan_ranks": 0, "loss_rank_avg": 0.13018080592155457, "step": 1870, "valid_targets_mean": 2860.2, "valid_targets_min": 1648 }, { "epoch": 3.3545210384959714, "grad_norm": 0.7074105189549208, "learning_rate": 2.4918813853668632e-05, "loss": 0.2738, "loss_nan_ranks": 0, "loss_rank_avg": 0.19293466210365295, "step": 1875, "valid_targets_mean": 4045.8, "valid_targets_min": 1493 }, { "epoch": 3.3634735899731423, "grad_norm": 0.5807379486607306, "learning_rate": 2.483228128844896e-05, "loss": 0.3031, "loss_nan_ranks": 0, "loss_rank_avg": 0.1795765608549118, "step": 1880, "valid_targets_mean": 5007.6, "valid_targets_min": 693 }, { "epoch": 3.372426141450313, "grad_norm": 0.6968229011978457, "learning_rate": 2.4745652548894654e-05, "loss": 0.2943, "loss_nan_ranks": 0, "loss_rank_avg": 0.14516671001911163, "step": 1885, "valid_targets_mean": 2635.5, "valid_targets_min": 627 }, { "epoch": 3.3813786929274845, "grad_norm": 0.5800079788765263, "learning_rate": 2.4658929359131634e-05, "loss": 0.2961, "loss_nan_ranks": 0, "loss_rank_avg": 0.09096183627843857, "step": 1890, "valid_targets_mean": 2528.5, "valid_targets_min": 1193 }, { "epoch": 3.3903312444046554, "grad_norm": 0.6408890861943591, "learning_rate": 2.4572113445165603e-05, "loss": 0.2975, "loss_nan_ranks": 0, "loss_rank_avg": 0.13080674409866333, "step": 1895, "valid_targets_mean": 3830.5, "valid_targets_min": 1113 }, { "epoch": 3.3992837958818263, "grad_norm": 0.5575769883321318, "learning_rate": 2.4485206534847706e-05, "loss": 0.2928, "loss_nan_ranks": 0, "loss_rank_avg": 0.18095198273658752, "step": 1900, "valid_targets_mean": 5400.2, "valid_targets_min": 1789 }, { "epoch": 3.408236347358997, "grad_norm": 0.6243600107033797, "learning_rate": 2.439821035784014e-05, "loss": 0.3077, "loss_nan_ranks": 0, "loss_rank_avg": 0.12245135009288788, "step": 1905, "valid_targets_mean": 3295.4, "valid_targets_min": 1052 }, { "epoch": 3.4171888988361685, "grad_norm": 0.7984110210507213, "learning_rate": 2.431112664558173e-05, "loss": 0.32, "loss_nan_ranks": 0, "loss_rank_avg": 0.12867091596126556, "step": 1910, "valid_targets_mean": 2177.6, "valid_targets_min": 1007 }, { "epoch": 3.4261414503133394, "grad_norm": 0.7626136272645896, "learning_rate": 2.4223957131253467e-05, "loss": 0.2966, "loss_nan_ranks": 0, "loss_rank_avg": 0.16945910453796387, "step": 1915, "valid_targets_mean": 4280.2, "valid_targets_min": 954 }, { "epoch": 3.4350940017905103, "grad_norm": 0.879960636032773, "learning_rate": 2.4136703549744028e-05, "loss": 0.3266, "loss_nan_ranks": 0, "loss_rank_avg": 0.17531342804431915, "step": 1920, "valid_targets_mean": 2265.9, "valid_targets_min": 1111 }, { "epoch": 3.444046553267681, "grad_norm": 0.6069014751890103, "learning_rate": 2.4049367637615215e-05, "loss": 0.3254, "loss_nan_ranks": 0, "loss_rank_avg": 0.15128836035728455, "step": 1925, "valid_targets_mean": 3898.9, "valid_targets_min": 1362 }, { "epoch": 3.452999104744852, "grad_norm": 0.6683394762004051, "learning_rate": 2.396195113306742e-05, "loss": 0.2926, "loss_nan_ranks": 0, "loss_rank_avg": 0.11693670600652695, "step": 1930, "valid_targets_mean": 2843.2, "valid_targets_min": 1079 }, { "epoch": 3.4619516562220234, "grad_norm": 0.5527522960821272, "learning_rate": 2.3874455775905036e-05, "loss": 0.3042, "loss_nan_ranks": 0, "loss_rank_avg": 0.10419487953186035, "step": 1935, "valid_targets_mean": 2983.6, "valid_targets_min": 854 }, { "epoch": 3.4709042076991943, "grad_norm": 0.5252735073672182, "learning_rate": 2.3786883307501794e-05, "loss": 0.2839, "loss_nan_ranks": 0, "loss_rank_avg": 0.10443928092718124, "step": 1940, "valid_targets_mean": 3916.2, "valid_targets_min": 1351 }, { "epoch": 3.479856759176365, "grad_norm": 0.635207514509153, "learning_rate": 2.3699235470766147e-05, "loss": 0.3259, "loss_nan_ranks": 0, "loss_rank_avg": 0.1575881689786911, "step": 1945, "valid_targets_mean": 4008.0, "valid_targets_min": 1165 }, { "epoch": 3.4888093106535365, "grad_norm": 0.6106698152368751, "learning_rate": 2.3611514010106564e-05, "loss": 0.3025, "loss_nan_ranks": 0, "loss_rank_avg": 0.09959106892347336, "step": 1950, "valid_targets_mean": 2759.2, "valid_targets_min": 1435 }, { "epoch": 3.4977618621307074, "grad_norm": 0.673225130627237, "learning_rate": 2.35237206713968e-05, "loss": 0.3329, "loss_nan_ranks": 0, "loss_rank_avg": 0.14371871948242188, "step": 1955, "valid_targets_mean": 3085.5, "valid_targets_min": 1152 }, { "epoch": 3.5067144136078783, "grad_norm": 0.6968504081569306, "learning_rate": 2.3435857201941172e-05, "loss": 0.3298, "loss_nan_ranks": 0, "loss_rank_avg": 0.17559152841567993, "step": 1960, "valid_targets_mean": 3212.4, "valid_targets_min": 1197 }, { "epoch": 3.515666965085049, "grad_norm": 0.819564689611184, "learning_rate": 2.3347925350439765e-05, "loss": 0.2835, "loss_nan_ranks": 0, "loss_rank_avg": 0.08735944330692291, "step": 1965, "valid_targets_mean": 2583.0, "valid_targets_min": 1021 }, { "epoch": 3.52461951656222, "grad_norm": 0.6468820188123998, "learning_rate": 2.3259926866953636e-05, "loss": 0.3245, "loss_nan_ranks": 0, "loss_rank_avg": 0.1301145851612091, "step": 1970, "valid_targets_mean": 2990.2, "valid_targets_min": 1568 }, { "epoch": 3.5335720680393914, "grad_norm": 0.6244370600947371, "learning_rate": 2.3171863502869993e-05, "loss": 0.2956, "loss_nan_ranks": 0, "loss_rank_avg": 0.1787623018026352, "step": 1975, "valid_targets_mean": 4180.9, "valid_targets_min": 1222 }, { "epoch": 3.5425246195165623, "grad_norm": 0.5967752262455601, "learning_rate": 2.3083737010867316e-05, "loss": 0.2792, "loss_nan_ranks": 0, "loss_rank_avg": 0.1309892237186432, "step": 1980, "valid_targets_mean": 4325.4, "valid_targets_min": 2600 }, { "epoch": 3.551477170993733, "grad_norm": 0.6563237980167774, "learning_rate": 2.2995549144880487e-05, "loss": 0.3024, "loss_nan_ranks": 0, "loss_rank_avg": 0.21774521470069885, "step": 1985, "valid_targets_mean": 5259.1, "valid_targets_min": 500 }, { "epoch": 3.560429722470904, "grad_norm": 0.7265770510021908, "learning_rate": 2.290730166006589e-05, "loss": 0.2966, "loss_nan_ranks": 0, "loss_rank_avg": 0.1371801793575287, "step": 1990, "valid_targets_mean": 2824.9, "valid_targets_min": 1326 }, { "epoch": 3.569382273948075, "grad_norm": 0.5905568901366419, "learning_rate": 2.2818996312766474e-05, "loss": 0.3078, "loss_nan_ranks": 0, "loss_rank_avg": 0.12975779175758362, "step": 1995, "valid_targets_mean": 3795.4, "valid_targets_min": 1783 }, { "epoch": 3.5783348254252463, "grad_norm": 0.9382745533338204, "learning_rate": 2.2730634860476778e-05, "loss": 0.303, "loss_nan_ranks": 0, "loss_rank_avg": 0.15109074115753174, "step": 2000, "valid_targets_mean": 2627.1, "valid_targets_min": 1023 }, { "epoch": 3.587287376902417, "grad_norm": 0.6451958349593174, "learning_rate": 2.264221906180798e-05, "loss": 0.3049, "loss_nan_ranks": 0, "loss_rank_avg": 0.13331124186515808, "step": 2005, "valid_targets_mean": 4238.4, "valid_targets_min": 648 }, { "epoch": 3.596239928379588, "grad_norm": 0.5218084865899012, "learning_rate": 2.255375067645289e-05, "loss": 0.2895, "loss_nan_ranks": 0, "loss_rank_avg": 0.12357210367918015, "step": 2010, "valid_targets_mean": 4533.5, "valid_targets_min": 1235 }, { "epoch": 3.6051924798567594, "grad_norm": 0.6280492068387579, "learning_rate": 2.2465231465150902e-05, "loss": 0.2742, "loss_nan_ranks": 0, "loss_rank_avg": 0.15180960297584534, "step": 2015, "valid_targets_mean": 4229.2, "valid_targets_min": 1155 }, { "epoch": 3.6141450313339303, "grad_norm": 0.5459403625133381, "learning_rate": 2.2376663189653002e-05, "loss": 0.3012, "loss_nan_ranks": 0, "loss_rank_avg": 0.14584055542945862, "step": 2020, "valid_targets_mean": 4946.4, "valid_targets_min": 939 }, { "epoch": 3.623097582811101, "grad_norm": 0.9835261973194854, "learning_rate": 2.2288047612686655e-05, "loss": 0.316, "loss_nan_ranks": 0, "loss_rank_avg": 0.17734041810035706, "step": 2025, "valid_targets_mean": 2308.6, "valid_targets_min": 762 }, { "epoch": 3.632050134288272, "grad_norm": 0.6974222571881543, "learning_rate": 2.219938649792074e-05, "loss": 0.2864, "loss_nan_ranks": 0, "loss_rank_avg": 0.1139960065484047, "step": 2030, "valid_targets_mean": 2714.5, "valid_targets_min": 1142 }, { "epoch": 3.641002685765443, "grad_norm": 0.7573070540679137, "learning_rate": 2.2110681609930458e-05, "loss": 0.2925, "loss_nan_ranks": 0, "loss_rank_avg": 0.10645341873168945, "step": 2035, "valid_targets_mean": 2737.5, "valid_targets_min": 1408 }, { "epoch": 3.6499552372426143, "grad_norm": 0.5556169607261522, "learning_rate": 2.2021934714162212e-05, "loss": 0.2987, "loss_nan_ranks": 0, "loss_rank_avg": 0.12965692579746246, "step": 2040, "valid_targets_mean": 5005.0, "valid_targets_min": 1399 }, { "epoch": 3.658907788719785, "grad_norm": 0.5206042195827867, "learning_rate": 2.1933147576898447e-05, "loss": 0.3091, "loss_nan_ranks": 0, "loss_rank_avg": 0.11286148428916931, "step": 2045, "valid_targets_mean": 3836.8, "valid_targets_min": 1443 }, { "epoch": 3.667860340196956, "grad_norm": 0.7793043605399187, "learning_rate": 2.1844321965222525e-05, "loss": 0.3053, "loss_nan_ranks": 0, "loss_rank_avg": 0.22073161602020264, "step": 2050, "valid_targets_mean": 3054.5, "valid_targets_min": 994 }, { "epoch": 3.6768128916741274, "grad_norm": 0.5769817589721981, "learning_rate": 2.1755459646983545e-05, "loss": 0.2876, "loss_nan_ranks": 0, "loss_rank_avg": 0.10495971888303757, "step": 2055, "valid_targets_mean": 3625.0, "valid_targets_min": 1958 }, { "epoch": 3.6857654431512983, "grad_norm": 0.6481517125690924, "learning_rate": 2.1666562390761147e-05, "loss": 0.3158, "loss_nan_ranks": 0, "loss_rank_avg": 0.18431368470191956, "step": 2060, "valid_targets_mean": 5741.5, "valid_targets_min": 1239 }, { "epoch": 3.694717994628469, "grad_norm": 0.7275087755723013, "learning_rate": 2.1577631965830324e-05, "loss": 0.2813, "loss_nan_ranks": 0, "loss_rank_avg": 0.12168044596910477, "step": 2065, "valid_targets_mean": 2084.9, "valid_targets_min": 1283 }, { "epoch": 3.70367054610564, "grad_norm": 0.6423090431771338, "learning_rate": 2.1488670142126234e-05, "loss": 0.3113, "loss_nan_ranks": 0, "loss_rank_avg": 0.1942213922739029, "step": 2070, "valid_targets_mean": 4032.9, "valid_targets_min": 1211 }, { "epoch": 3.712623097582811, "grad_norm": 0.5518641128616621, "learning_rate": 2.13996786902089e-05, "loss": 0.2999, "loss_nan_ranks": 0, "loss_rank_avg": 0.1275741159915924, "step": 2075, "valid_targets_mean": 3884.5, "valid_targets_min": 1262 }, { "epoch": 3.7215756490599823, "grad_norm": 0.8036840000440701, "learning_rate": 2.1310659381228066e-05, "loss": 0.3017, "loss_nan_ranks": 0, "loss_rank_avg": 0.11641264706850052, "step": 2080, "valid_targets_mean": 1787.6, "valid_targets_min": 482 }, { "epoch": 3.730528200537153, "grad_norm": 0.6250950737248954, "learning_rate": 2.122161398688788e-05, "loss": 0.294, "loss_nan_ranks": 0, "loss_rank_avg": 0.16850410401821136, "step": 2085, "valid_targets_mean": 5024.2, "valid_targets_min": 1243 }, { "epoch": 3.739480752014324, "grad_norm": 0.7620593924231298, "learning_rate": 2.1132544279411655e-05, "loss": 0.3078, "loss_nan_ranks": 0, "loss_rank_avg": 0.15078432857990265, "step": 2090, "valid_targets_mean": 2521.5, "valid_targets_min": 1417 }, { "epoch": 3.748433303491495, "grad_norm": 0.6376558624151332, "learning_rate": 2.1043452031506578e-05, "loss": 0.3013, "loss_nan_ranks": 0, "loss_rank_avg": 0.18131475150585175, "step": 2095, "valid_targets_mean": 4089.2, "valid_targets_min": 1127 }, { "epoch": 3.757385854968666, "grad_norm": 0.6510696932710319, "learning_rate": 2.0954339016328485e-05, "loss": 0.2851, "loss_nan_ranks": 0, "loss_rank_avg": 0.15922397375106812, "step": 2100, "valid_targets_mean": 4445.5, "valid_targets_min": 2170 }, { "epoch": 3.766338406445837, "grad_norm": 0.577097450206775, "learning_rate": 2.08652070074465e-05, "loss": 0.3004, "loss_nan_ranks": 0, "loss_rank_avg": 0.09382876753807068, "step": 2105, "valid_targets_mean": 3492.4, "valid_targets_min": 1608 }, { "epoch": 3.775290957923008, "grad_norm": 0.5921188375445776, "learning_rate": 2.077605777880778e-05, "loss": 0.3021, "loss_nan_ranks": 0, "loss_rank_avg": 0.10202471911907196, "step": 2110, "valid_targets_mean": 2826.9, "valid_targets_min": 1268 }, { "epoch": 3.784243509400179, "grad_norm": 0.5115559628016806, "learning_rate": 2.0686893104702198e-05, "loss": 0.2949, "loss_nan_ranks": 0, "loss_rank_avg": 0.10683996230363846, "step": 2115, "valid_targets_mean": 5196.5, "valid_targets_min": 1911 }, { "epoch": 3.7931960608773503, "grad_norm": 0.7148038157802632, "learning_rate": 2.0597714759727028e-05, "loss": 0.3003, "loss_nan_ranks": 0, "loss_rank_avg": 0.17320764064788818, "step": 2120, "valid_targets_mean": 3600.4, "valid_targets_min": 1208 }, { "epoch": 3.802148612354521, "grad_norm": 0.568336718540444, "learning_rate": 2.050852451875163e-05, "loss": 0.2686, "loss_nan_ranks": 0, "loss_rank_avg": 0.10769255459308624, "step": 2125, "valid_targets_mean": 3134.1, "valid_targets_min": 724 }, { "epoch": 3.811101163831692, "grad_norm": 2.2889402597376063, "learning_rate": 2.041932415688212e-05, "loss": 0.3295, "loss_nan_ranks": 0, "loss_rank_avg": 0.24901776015758514, "step": 2130, "valid_targets_mean": 5238.8, "valid_targets_min": 1279 }, { "epoch": 3.820053715308863, "grad_norm": 0.7498566172955531, "learning_rate": 2.0330115449426054e-05, "loss": 0.2988, "loss_nan_ranks": 0, "loss_rank_avg": 0.17251518368721008, "step": 2135, "valid_targets_mean": 3523.2, "valid_targets_min": 1317 }, { "epoch": 3.829006266786034, "grad_norm": 0.6454834290568767, "learning_rate": 2.0240900171857064e-05, "loss": 0.3042, "loss_nan_ranks": 0, "loss_rank_avg": 0.13242211937904358, "step": 2140, "valid_targets_mean": 2924.2, "valid_targets_min": 1211 }, { "epoch": 3.837958818263205, "grad_norm": 0.7545116802419165, "learning_rate": 2.0151680099779574e-05, "loss": 0.2945, "loss_nan_ranks": 0, "loss_rank_avg": 0.14533577859401703, "step": 2145, "valid_targets_mean": 2128.8, "valid_targets_min": 923 }, { "epoch": 3.846911369740376, "grad_norm": 0.5716602619910933, "learning_rate": 2.0062457008893408e-05, "loss": 0.3153, "loss_nan_ranks": 0, "loss_rank_avg": 0.13911041617393494, "step": 2150, "valid_targets_mean": 5648.6, "valid_targets_min": 686 }, { "epoch": 3.855863921217547, "grad_norm": 0.719492062343642, "learning_rate": 1.9973232674958487e-05, "loss": 0.305, "loss_nan_ranks": 0, "loss_rank_avg": 0.18894167244434357, "step": 2155, "valid_targets_mean": 2912.6, "valid_targets_min": 1167 }, { "epoch": 3.864816472694718, "grad_norm": 0.6512482583559067, "learning_rate": 1.9884008873759446e-05, "loss": 0.3, "loss_nan_ranks": 0, "loss_rank_avg": 0.13799162209033966, "step": 2160, "valid_targets_mean": 3115.5, "valid_targets_min": 1117 }, { "epoch": 3.8737690241718887, "grad_norm": 0.5445724516346668, "learning_rate": 1.979478738107035e-05, "loss": 0.33, "loss_nan_ranks": 0, "loss_rank_avg": 0.20787352323532104, "step": 2165, "valid_targets_mean": 6374.6, "valid_targets_min": 1262 }, { "epoch": 3.88272157564906, "grad_norm": 0.5513455230236962, "learning_rate": 1.9705569972619295e-05, "loss": 0.3131, "loss_nan_ranks": 0, "loss_rank_avg": 0.14444196224212646, "step": 2170, "valid_targets_mean": 5843.2, "valid_targets_min": 1690 }, { "epoch": 3.891674127126231, "grad_norm": 1.1283522903092538, "learning_rate": 1.961635842405311e-05, "loss": 0.2905, "loss_nan_ranks": 0, "loss_rank_avg": 0.14688581228256226, "step": 2175, "valid_targets_mean": 4568.0, "valid_targets_min": 1533 }, { "epoch": 3.900626678603402, "grad_norm": 0.46615888239311576, "learning_rate": 1.9527154510901972e-05, "loss": 0.2936, "loss_nan_ranks": 0, "loss_rank_avg": 0.12086974084377289, "step": 2180, "valid_targets_mean": 5431.4, "valid_targets_min": 852 }, { "epoch": 3.909579230080573, "grad_norm": 0.6815721768826772, "learning_rate": 1.9437960008544126e-05, "loss": 0.291, "loss_nan_ranks": 0, "loss_rank_avg": 0.11174547672271729, "step": 2185, "valid_targets_mean": 2458.1, "valid_targets_min": 857 }, { "epoch": 3.918531781557744, "grad_norm": 0.6300320312371228, "learning_rate": 1.9348776692170494e-05, "loss": 0.2948, "loss_nan_ranks": 0, "loss_rank_avg": 0.1311410665512085, "step": 2190, "valid_targets_mean": 3613.5, "valid_targets_min": 1647 }, { "epoch": 3.927484333034915, "grad_norm": 0.6036465789016668, "learning_rate": 1.9259606336749374e-05, "loss": 0.2958, "loss_nan_ranks": 0, "loss_rank_avg": 0.13302668929100037, "step": 2195, "valid_targets_mean": 3842.6, "valid_targets_min": 1443 }, { "epoch": 3.936436884512086, "grad_norm": 0.5896110554577646, "learning_rate": 1.9170450716991122e-05, "loss": 0.3009, "loss_nan_ranks": 0, "loss_rank_avg": 0.12744395434856415, "step": 2200, "valid_targets_mean": 2985.9, "valid_targets_min": 1156 }, { "epoch": 3.9453894359892567, "grad_norm": 0.6582203423205444, "learning_rate": 1.90813116073128e-05, "loss": 0.2944, "loss_nan_ranks": 0, "loss_rank_avg": 0.17242342233657837, "step": 2205, "valid_targets_mean": 4057.6, "valid_targets_min": 1444 }, { "epoch": 3.954341987466428, "grad_norm": 0.6421456714075086, "learning_rate": 1.899219078180289e-05, "loss": 0.3032, "loss_nan_ranks": 0, "loss_rank_avg": 0.14306621253490448, "step": 2210, "valid_targets_mean": 3036.6, "valid_targets_min": 1355 }, { "epoch": 3.963294538943599, "grad_norm": 0.6036407507169996, "learning_rate": 1.8903090014185984e-05, "loss": 0.3139, "loss_nan_ranks": 0, "loss_rank_avg": 0.13021019101142883, "step": 2215, "valid_targets_mean": 3490.6, "valid_targets_min": 1559 }, { "epoch": 3.97224709042077, "grad_norm": 0.6312426539317694, "learning_rate": 1.881401107778744e-05, "loss": 0.307, "loss_nan_ranks": 0, "loss_rank_avg": 0.14264509081840515, "step": 2220, "valid_targets_mean": 3784.1, "valid_targets_min": 1696 }, { "epoch": 3.981199641897941, "grad_norm": 0.7232138636484131, "learning_rate": 1.8724955745498147e-05, "loss": 0.2896, "loss_nan_ranks": 0, "loss_rank_avg": 0.1296793520450592, "step": 2225, "valid_targets_mean": 2648.1, "valid_targets_min": 1959 }, { "epoch": 3.990152193375112, "grad_norm": 0.7135232139570937, "learning_rate": 1.863592578973921e-05, "loss": 0.2891, "loss_nan_ranks": 0, "loss_rank_avg": 0.1762787401676178, "step": 2230, "valid_targets_mean": 2832.0, "valid_targets_min": 1144 }, { "epoch": 3.999104744852283, "grad_norm": 0.6524854149615098, "learning_rate": 1.854692298242667e-05, "loss": 0.2938, "loss_nan_ranks": 0, "loss_rank_avg": 0.08761607855558395, "step": 2235, "valid_targets_mean": 2061.9, "valid_targets_min": 1150 }, { "epoch": 4.007162041181736, "grad_norm": 0.652689916111008, "learning_rate": 1.8457949094936265e-05, "loss": 0.2998, "loss_nan_ranks": 0, "loss_rank_avg": 0.1780852973461151, "step": 2240, "valid_targets_mean": 3954.2, "valid_targets_min": 1405 }, { "epoch": 4.016114592658908, "grad_norm": 0.6939405565326737, "learning_rate": 1.8369005898068136e-05, "loss": 0.2707, "loss_nan_ranks": 0, "loss_rank_avg": 0.13696125149726868, "step": 2245, "valid_targets_mean": 3110.2, "valid_targets_min": 1338 }, { "epoch": 4.025067144136079, "grad_norm": 0.6378249349993657, "learning_rate": 1.8280095162011617e-05, "loss": 0.2519, "loss_nan_ranks": 0, "loss_rank_avg": 0.13300368189811707, "step": 2250, "valid_targets_mean": 4896.8, "valid_targets_min": 592 }, { "epoch": 4.0340196956132495, "grad_norm": 0.7368942381013488, "learning_rate": 1.819121865630998e-05, "loss": 0.2842, "loss_nan_ranks": 0, "loss_rank_avg": 0.15255354344844818, "step": 2255, "valid_targets_mean": 3039.0, "valid_targets_min": 1374 }, { "epoch": 4.042972247090421, "grad_norm": 0.7766928914583657, "learning_rate": 1.8102378149825242e-05, "loss": 0.2697, "loss_nan_ranks": 0, "loss_rank_avg": 0.13009774684906006, "step": 2260, "valid_targets_mean": 2237.8, "valid_targets_min": 1130 }, { "epoch": 4.051924798567592, "grad_norm": 0.7000134703860864, "learning_rate": 1.801357541070294e-05, "loss": 0.2663, "loss_nan_ranks": 0, "loss_rank_avg": 0.1389508992433548, "step": 2265, "valid_targets_mean": 3212.9, "valid_targets_min": 1664 }, { "epoch": 4.060877350044763, "grad_norm": 0.63986533138509, "learning_rate": 1.7924812206336956e-05, "loss": 0.2903, "loss_nan_ranks": 0, "loss_rank_avg": 0.1371454894542694, "step": 2270, "valid_targets_mean": 3442.1, "valid_targets_min": 1547 }, { "epoch": 4.069829901521934, "grad_norm": 0.7149119111892002, "learning_rate": 1.7836090303334312e-05, "loss": 0.2856, "loss_nan_ranks": 0, "loss_rank_avg": 0.14737096428871155, "step": 2275, "valid_targets_mean": 3364.8, "valid_targets_min": 1102 }, { "epoch": 4.078782452999104, "grad_norm": 0.7621996479130542, "learning_rate": 1.7747411467480058e-05, "loss": 0.2726, "loss_nan_ranks": 0, "loss_rank_avg": 0.07246645539999008, "step": 2280, "valid_targets_mean": 2137.5, "valid_targets_min": 297 }, { "epoch": 4.087735004476276, "grad_norm": 0.6927270599507354, "learning_rate": 1.7658777463702076e-05, "loss": 0.2907, "loss_nan_ranks": 0, "loss_rank_avg": 0.13911257684230804, "step": 2285, "valid_targets_mean": 3724.5, "valid_targets_min": 1392 }, { "epoch": 4.096687555953447, "grad_norm": 0.6592900626100703, "learning_rate": 1.7570190056035996e-05, "loss": 0.275, "loss_nan_ranks": 0, "loss_rank_avg": 0.12096744775772095, "step": 2290, "valid_targets_mean": 3600.1, "valid_targets_min": 629 }, { "epoch": 4.1056401074306175, "grad_norm": 0.5529767948719162, "learning_rate": 1.7481651007590054e-05, "loss": 0.2932, "loss_nan_ranks": 0, "loss_rank_avg": 0.08802123367786407, "step": 2295, "valid_targets_mean": 3757.2, "valid_targets_min": 943 }, { "epoch": 4.114592658907789, "grad_norm": 0.7168183953666155, "learning_rate": 1.7393162080510045e-05, "loss": 0.2813, "loss_nan_ranks": 0, "loss_rank_avg": 0.11998733878135681, "step": 2300, "valid_targets_mean": 3039.2, "valid_targets_min": 1347 }, { "epoch": 4.12354521038496, "grad_norm": 0.6658442031434119, "learning_rate": 1.7304725035944194e-05, "loss": 0.2847, "loss_nan_ranks": 0, "loss_rank_avg": 0.18848788738250732, "step": 2305, "valid_targets_mean": 4259.6, "valid_targets_min": 1697 }, { "epoch": 4.132497761862131, "grad_norm": 0.6199747775481698, "learning_rate": 1.7216341634008168e-05, "loss": 0.2881, "loss_nan_ranks": 0, "loss_rank_avg": 0.13999530673027039, "step": 2310, "valid_targets_mean": 4771.9, "valid_targets_min": 1507 }, { "epoch": 4.141450313339302, "grad_norm": 0.6147583167095588, "learning_rate": 1.7128013633749978e-05, "loss": 0.2712, "loss_nan_ranks": 0, "loss_rank_avg": 0.09678598493337631, "step": 2315, "valid_targets_mean": 3455.9, "valid_targets_min": 1205 }, { "epoch": 4.150402864816472, "grad_norm": 0.6828990726624986, "learning_rate": 1.7039742793115025e-05, "loss": 0.2925, "loss_nan_ranks": 0, "loss_rank_avg": 0.21309149265289307, "step": 2320, "valid_targets_mean": 4329.9, "valid_targets_min": 1531 }, { "epoch": 4.159355416293644, "grad_norm": 0.6398092008512408, "learning_rate": 1.6951530868911097e-05, "loss": 0.2774, "loss_nan_ranks": 0, "loss_rank_avg": 0.13850344717502594, "step": 2325, "valid_targets_mean": 4057.2, "valid_targets_min": 1079 }, { "epoch": 4.168307967770815, "grad_norm": 0.5902243331399586, "learning_rate": 1.6863379616773388e-05, "loss": 0.2889, "loss_nan_ranks": 0, "loss_rank_avg": 0.13679037988185883, "step": 2330, "valid_targets_mean": 5202.8, "valid_targets_min": 1586 }, { "epoch": 4.1772605192479855, "grad_norm": 0.7060895769409575, "learning_rate": 1.6775290791129567e-05, "loss": 0.2823, "loss_nan_ranks": 0, "loss_rank_avg": 0.1696832776069641, "step": 2335, "valid_targets_mean": 3682.5, "valid_targets_min": 686 }, { "epoch": 4.186213070725157, "grad_norm": 0.7160039942556854, "learning_rate": 1.668726614516488e-05, "loss": 0.2933, "loss_nan_ranks": 0, "loss_rank_avg": 0.14439858496189117, "step": 2340, "valid_targets_mean": 3356.0, "valid_targets_min": 1383 }, { "epoch": 4.195165622202327, "grad_norm": 0.5775126603858747, "learning_rate": 1.6599307430787216e-05, "loss": 0.2946, "loss_nan_ranks": 0, "loss_rank_avg": 0.15367811918258667, "step": 2345, "valid_targets_mean": 4872.6, "valid_targets_min": 1973 }, { "epoch": 4.204118173679499, "grad_norm": 0.5871347654839713, "learning_rate": 1.6511416398592264e-05, "loss": 0.2655, "loss_nan_ranks": 0, "loss_rank_avg": 0.1796134114265442, "step": 2350, "valid_targets_mean": 4855.1, "valid_targets_min": 1235 }, { "epoch": 4.21307072515667, "grad_norm": 0.6986302940453207, "learning_rate": 1.64235947978287e-05, "loss": 0.2681, "loss_nan_ranks": 0, "loss_rank_avg": 0.14644259214401245, "step": 2355, "valid_targets_mean": 3897.0, "valid_targets_min": 1721 }, { "epoch": 4.22202327663384, "grad_norm": 0.6254039148831865, "learning_rate": 1.6335844376363295e-05, "loss": 0.2742, "loss_nan_ranks": 0, "loss_rank_avg": 0.13061976432800293, "step": 2360, "valid_targets_mean": 4755.5, "valid_targets_min": 1734 }, { "epoch": 4.230975828111012, "grad_norm": 0.7819861990910386, "learning_rate": 1.6248166880646225e-05, "loss": 0.2887, "loss_nan_ranks": 0, "loss_rank_avg": 0.1424158662557602, "step": 2365, "valid_targets_mean": 2361.4, "valid_targets_min": 1039 }, { "epoch": 4.239928379588183, "grad_norm": 0.6227715778784336, "learning_rate": 1.6160564055676235e-05, "loss": 0.2796, "loss_nan_ranks": 0, "loss_rank_avg": 0.14585551619529724, "step": 2370, "valid_targets_mean": 3901.1, "valid_targets_min": 1765 }, { "epoch": 4.2488809310653535, "grad_norm": 0.6909008649845587, "learning_rate": 1.6073037644965938e-05, "loss": 0.2892, "loss_nan_ranks": 0, "loss_rank_avg": 0.14594003558158875, "step": 2375, "valid_targets_mean": 4022.0, "valid_targets_min": 1773 }, { "epoch": 4.257833482542525, "grad_norm": 0.46912244899919914, "learning_rate": 1.5985589390507117e-05, "loss": 0.2758, "loss_nan_ranks": 0, "loss_rank_avg": 0.06319141387939453, "step": 2380, "valid_targets_mean": 2577.6, "valid_targets_min": 1459 }, { "epoch": 4.266786034019695, "grad_norm": 0.7369101921583909, "learning_rate": 1.589822103273607e-05, "loss": 0.2775, "loss_nan_ranks": 0, "loss_rank_avg": 0.14047077298164368, "step": 2385, "valid_targets_mean": 2833.1, "valid_targets_min": 1702 }, { "epoch": 4.275738585496867, "grad_norm": 0.7399346097155552, "learning_rate": 1.5810934310498922e-05, "loss": 0.2716, "loss_nan_ranks": 0, "loss_rank_avg": 0.1556873321533203, "step": 2390, "valid_targets_mean": 3457.5, "valid_targets_min": 1405 }, { "epoch": 4.284691136974038, "grad_norm": 0.5486188212174534, "learning_rate": 1.5723730961017082e-05, "loss": 0.2573, "loss_nan_ranks": 0, "loss_rank_avg": 0.14268964529037476, "step": 2395, "valid_targets_mean": 5756.1, "valid_targets_min": 1075 }, { "epoch": 4.293643688451208, "grad_norm": 0.5690671174903594, "learning_rate": 1.5636612719852615e-05, "loss": 0.2747, "loss_nan_ranks": 0, "loss_rank_avg": 0.12536361813545227, "step": 2400, "valid_targets_mean": 3819.0, "valid_targets_min": 762 }, { "epoch": 4.30259623992838, "grad_norm": 0.8433999368027125, "learning_rate": 1.5549581320873715e-05, "loss": 0.2776, "loss_nan_ranks": 0, "loss_rank_avg": 0.2086883932352066, "step": 2405, "valid_targets_mean": 4699.0, "valid_targets_min": 1064 }, { "epoch": 4.311548791405551, "grad_norm": 0.5776608739956453, "learning_rate": 1.5462638496220223e-05, "loss": 0.2836, "loss_nan_ranks": 0, "loss_rank_avg": 0.1258239895105362, "step": 2410, "valid_targets_mean": 5195.8, "valid_targets_min": 1653 }, { "epoch": 4.3205013428827215, "grad_norm": 0.6302947068102072, "learning_rate": 1.537578597626912e-05, "loss": 0.2668, "loss_nan_ranks": 0, "loss_rank_avg": 0.172328382730484, "step": 2415, "valid_targets_mean": 4611.9, "valid_targets_min": 1465 }, { "epoch": 4.329453894359893, "grad_norm": 0.5973858707112296, "learning_rate": 1.528902548960009e-05, "loss": 0.2727, "loss_nan_ranks": 0, "loss_rank_avg": 0.11022946983575821, "step": 2420, "valid_targets_mean": 2726.6, "valid_targets_min": 767 }, { "epoch": 4.338406445837063, "grad_norm": 0.7250095814311094, "learning_rate": 1.5202358762961155e-05, "loss": 0.2986, "loss_nan_ranks": 0, "loss_rank_avg": 0.1334499567747116, "step": 2425, "valid_targets_mean": 2546.6, "valid_targets_min": 607 }, { "epoch": 4.347358997314235, "grad_norm": 0.5687437987785104, "learning_rate": 1.511578752123426e-05, "loss": 0.268, "loss_nan_ranks": 0, "loss_rank_avg": 0.1087578758597374, "step": 2430, "valid_targets_mean": 3391.1, "valid_targets_min": 1508 }, { "epoch": 4.356311548791406, "grad_norm": 0.6236160085767933, "learning_rate": 1.5029313487400958e-05, "loss": 0.2813, "loss_nan_ranks": 0, "loss_rank_avg": 0.15010881423950195, "step": 2435, "valid_targets_mean": 4927.9, "valid_targets_min": 974 }, { "epoch": 4.365264100268576, "grad_norm": 0.6108000626099473, "learning_rate": 1.4942938382508147e-05, "loss": 0.2711, "loss_nan_ranks": 0, "loss_rank_avg": 0.14772196114063263, "step": 2440, "valid_targets_mean": 4286.6, "valid_targets_min": 2408 }, { "epoch": 4.374216651745748, "grad_norm": 0.5794759583267514, "learning_rate": 1.4856663925633776e-05, "loss": 0.2743, "loss_nan_ranks": 0, "loss_rank_avg": 0.18810175359249115, "step": 2445, "valid_targets_mean": 6704.9, "valid_targets_min": 1239 }, { "epoch": 4.383169203222918, "grad_norm": 0.5144877574661774, "learning_rate": 1.4770491833852663e-05, "loss": 0.2768, "loss_nan_ranks": 0, "loss_rank_avg": 0.10823938250541687, "step": 2450, "valid_targets_mean": 4218.6, "valid_targets_min": 1567 }, { "epoch": 4.3921217547000895, "grad_norm": 0.6115457695521388, "learning_rate": 1.4684423822202297e-05, "loss": 0.2798, "loss_nan_ranks": 0, "loss_rank_avg": 0.1742391586303711, "step": 2455, "valid_targets_mean": 4900.4, "valid_targets_min": 1170 }, { "epoch": 4.401074306177261, "grad_norm": 0.6603355387772237, "learning_rate": 1.4598461603648736e-05, "loss": 0.2697, "loss_nan_ranks": 0, "loss_rank_avg": 0.1439456045627594, "step": 2460, "valid_targets_mean": 4160.2, "valid_targets_min": 1588 }, { "epoch": 4.410026857654431, "grad_norm": 0.5592975604579535, "learning_rate": 1.451260688905245e-05, "loss": 0.2856, "loss_nan_ranks": 0, "loss_rank_avg": 0.12507349252700806, "step": 2465, "valid_targets_mean": 4971.6, "valid_targets_min": 1627 }, { "epoch": 4.418979409131603, "grad_norm": 0.5425052312698014, "learning_rate": 1.4426861387134361e-05, "loss": 0.2563, "loss_nan_ranks": 0, "loss_rank_avg": 0.11168238520622253, "step": 2470, "valid_targets_mean": 4877.9, "valid_targets_min": 1707 }, { "epoch": 4.427931960608774, "grad_norm": 0.5221747063544983, "learning_rate": 1.4341226804441766e-05, "loss": 0.2707, "loss_nan_ranks": 0, "loss_rank_avg": 0.12132534384727478, "step": 2475, "valid_targets_mean": 5736.0, "valid_targets_min": 1785 }, { "epoch": 4.436884512085944, "grad_norm": 0.6687015942354837, "learning_rate": 1.4255704845314406e-05, "loss": 0.2593, "loss_nan_ranks": 0, "loss_rank_avg": 0.08877840638160706, "step": 2480, "valid_targets_mean": 3548.1, "valid_targets_min": 1012 }, { "epoch": 4.445837063563116, "grad_norm": 0.6764095401280212, "learning_rate": 1.4170297211850522e-05, "loss": 0.2752, "loss_nan_ranks": 0, "loss_rank_avg": 0.1928788721561432, "step": 2485, "valid_targets_mean": 4394.4, "valid_targets_min": 2121 }, { "epoch": 4.454789615040286, "grad_norm": 0.6534942221563793, "learning_rate": 1.4085005603873004e-05, "loss": 0.2799, "loss_nan_ranks": 0, "loss_rank_avg": 0.1439860314130783, "step": 2490, "valid_targets_mean": 4347.1, "valid_targets_min": 1227 }, { "epoch": 4.4637421665174575, "grad_norm": 0.6576143650799924, "learning_rate": 1.3999831718895545e-05, "loss": 0.274, "loss_nan_ranks": 0, "loss_rank_avg": 0.14860865473747253, "step": 2495, "valid_targets_mean": 4357.6, "valid_targets_min": 1706 }, { "epoch": 4.472694717994629, "grad_norm": 0.6216399384728338, "learning_rate": 1.3914777252088851e-05, "loss": 0.2809, "loss_nan_ranks": 0, "loss_rank_avg": 0.0829973816871643, "step": 2500, "valid_targets_mean": 2239.1, "valid_targets_min": 1102 }, { "epoch": 4.481647269471799, "grad_norm": 0.677746287070446, "learning_rate": 1.3829843896246917e-05, "loss": 0.2695, "loss_nan_ranks": 0, "loss_rank_avg": 0.10659922659397125, "step": 2505, "valid_targets_mean": 3080.5, "valid_targets_min": 1430 }, { "epoch": 4.490599820948971, "grad_norm": 0.6894645564542359, "learning_rate": 1.3745033341753337e-05, "loss": 0.2888, "loss_nan_ranks": 0, "loss_rank_avg": 0.14530538022518158, "step": 2510, "valid_targets_mean": 3823.0, "valid_targets_min": 713 }, { "epoch": 4.499552372426141, "grad_norm": 0.6848821237514404, "learning_rate": 1.3660347276547645e-05, "loss": 0.2802, "loss_nan_ranks": 0, "loss_rank_avg": 0.1529255509376526, "step": 2515, "valid_targets_mean": 3820.8, "valid_targets_min": 1396 }, { "epoch": 4.508504923903312, "grad_norm": 0.6641129507383274, "learning_rate": 1.3575787386091745e-05, "loss": 0.2949, "loss_nan_ranks": 0, "loss_rank_avg": 0.14307177066802979, "step": 2520, "valid_targets_mean": 3578.8, "valid_targets_min": 1528 }, { "epoch": 4.517457475380484, "grad_norm": 0.536151610151765, "learning_rate": 1.3491355353336338e-05, "loss": 0.279, "loss_nan_ranks": 0, "loss_rank_avg": 0.12758341431617737, "step": 2525, "valid_targets_mean": 4726.1, "valid_targets_min": 1227 }, { "epoch": 4.526410026857654, "grad_norm": 0.7168460298420432, "learning_rate": 1.3407052858687432e-05, "loss": 0.2813, "loss_nan_ranks": 0, "loss_rank_avg": 0.16223827004432678, "step": 2530, "valid_targets_mean": 4002.4, "valid_targets_min": 799 }, { "epoch": 4.5353625783348255, "grad_norm": 0.5770371894689392, "learning_rate": 1.3322881579972934e-05, "loss": 0.2863, "loss_nan_ranks": 0, "loss_rank_avg": 0.19758792221546173, "step": 2535, "valid_targets_mean": 6236.2, "valid_targets_min": 1662 }, { "epoch": 4.544315129811997, "grad_norm": 0.635407424302777, "learning_rate": 1.323884319240921e-05, "loss": 0.29, "loss_nan_ranks": 0, "loss_rank_avg": 0.14273598790168762, "step": 2540, "valid_targets_mean": 3251.4, "valid_targets_min": 566 }, { "epoch": 4.553267681289167, "grad_norm": 0.6247115660878144, "learning_rate": 1.3154939368567771e-05, "loss": 0.2786, "loss_nan_ranks": 0, "loss_rank_avg": 0.11011286079883575, "step": 2545, "valid_targets_mean": 3317.2, "valid_targets_min": 1259 }, { "epoch": 4.562220232766339, "grad_norm": 0.7097429777926196, "learning_rate": 1.3071171778341975e-05, "loss": 0.2733, "loss_nan_ranks": 0, "loss_rank_avg": 0.11763446033000946, "step": 2550, "valid_targets_mean": 2547.4, "valid_targets_min": 1533 }, { "epoch": 4.571172784243509, "grad_norm": 0.7507832272507481, "learning_rate": 1.2987542088913801e-05, "loss": 0.3048, "loss_nan_ranks": 0, "loss_rank_avg": 0.15912875533103943, "step": 2555, "valid_targets_mean": 3061.6, "valid_targets_min": 1198 }, { "epoch": 4.58012533572068, "grad_norm": 0.688816376455702, "learning_rate": 1.290405196472064e-05, "loss": 0.2936, "loss_nan_ranks": 0, "loss_rank_avg": 0.14911401271820068, "step": 2560, "valid_targets_mean": 3128.0, "valid_targets_min": 795 }, { "epoch": 4.589077887197852, "grad_norm": 0.661762219202973, "learning_rate": 1.282070306742222e-05, "loss": 0.3011, "loss_nan_ranks": 0, "loss_rank_avg": 0.12021621316671371, "step": 2565, "valid_targets_mean": 2507.5, "valid_targets_min": 1491 }, { "epoch": 4.598030438675022, "grad_norm": 0.9591904980428351, "learning_rate": 1.2737497055867482e-05, "loss": 0.274, "loss_nan_ranks": 0, "loss_rank_avg": 0.11839226633310318, "step": 2570, "valid_targets_mean": 1713.8, "valid_targets_min": 1207 }, { "epoch": 4.6069829901521935, "grad_norm": 0.6924345045587993, "learning_rate": 1.2654435586061604e-05, "loss": 0.2834, "loss_nan_ranks": 0, "loss_rank_avg": 0.16126775741577148, "step": 2575, "valid_targets_mean": 3368.1, "valid_targets_min": 1571 }, { "epoch": 4.615935541629364, "grad_norm": 0.6083972711681029, "learning_rate": 1.2571520311133012e-05, "loss": 0.292, "loss_nan_ranks": 0, "loss_rank_avg": 0.23135092854499817, "step": 2580, "valid_targets_mean": 5297.0, "valid_targets_min": 940 }, { "epoch": 4.624888093106535, "grad_norm": 0.6780051708511852, "learning_rate": 1.2488752881300514e-05, "loss": 0.2801, "loss_nan_ranks": 0, "loss_rank_avg": 0.10475669801235199, "step": 2585, "valid_targets_mean": 2886.1, "valid_targets_min": 1939 }, { "epoch": 4.633840644583707, "grad_norm": 0.5687322217353462, "learning_rate": 1.2406134943840398e-05, "loss": 0.2707, "loss_nan_ranks": 0, "loss_rank_avg": 0.14360423386096954, "step": 2590, "valid_targets_mean": 4537.2, "valid_targets_min": 1153 }, { "epoch": 4.642793196060877, "grad_norm": 0.6473869261700407, "learning_rate": 1.232366814305372e-05, "loss": 0.2602, "loss_nan_ranks": 0, "loss_rank_avg": 0.11344386637210846, "step": 2595, "valid_targets_mean": 3455.0, "valid_targets_min": 935 }, { "epoch": 4.651745747538048, "grad_norm": 0.6749099477987037, "learning_rate": 1.2241354120233527e-05, "loss": 0.3105, "loss_nan_ranks": 0, "loss_rank_avg": 0.15856057405471802, "step": 2600, "valid_targets_mean": 4211.4, "valid_targets_min": 913 }, { "epoch": 4.66069829901522, "grad_norm": 0.7881154419641004, "learning_rate": 1.2159194513632213e-05, "loss": 0.2963, "loss_nan_ranks": 0, "loss_rank_avg": 0.1507546603679657, "step": 2605, "valid_targets_mean": 2755.9, "valid_targets_min": 1225 }, { "epoch": 4.66965085049239, "grad_norm": 0.7379646376101288, "learning_rate": 1.20771909584289e-05, "loss": 0.2742, "loss_nan_ranks": 0, "loss_rank_avg": 0.09531432390213013, "step": 2610, "valid_targets_mean": 2293.4, "valid_targets_min": 863 }, { "epoch": 4.6786034019695615, "grad_norm": 0.6830443105031209, "learning_rate": 1.1995345086696919e-05, "loss": 0.2893, "loss_nan_ranks": 0, "loss_rank_avg": 0.1766771525144577, "step": 2615, "valid_targets_mean": 3217.0, "valid_targets_min": 1326 }, { "epoch": 4.687555953446733, "grad_norm": 0.5962665890821673, "learning_rate": 1.1913658527371284e-05, "loss": 0.2672, "loss_nan_ranks": 0, "loss_rank_avg": 0.14932385087013245, "step": 2620, "valid_targets_mean": 5058.2, "valid_targets_min": 1528 }, { "epoch": 4.696508504923903, "grad_norm": 0.47356874610934896, "learning_rate": 1.1832132906216314e-05, "loss": 0.2873, "loss_nan_ranks": 0, "loss_rank_avg": 0.18485575914382935, "step": 2625, "valid_targets_mean": 8106.5, "valid_targets_min": 1666 }, { "epoch": 4.705461056401075, "grad_norm": 0.56409332554102, "learning_rate": 1.1750769845793268e-05, "loss": 0.2845, "loss_nan_ranks": 0, "loss_rank_avg": 0.16708049178123474, "step": 2630, "valid_targets_mean": 5391.1, "valid_targets_min": 1698 }, { "epoch": 4.714413607878245, "grad_norm": 0.601411143213395, "learning_rate": 1.1669570965428028e-05, "loss": 0.2795, "loss_nan_ranks": 0, "loss_rank_avg": 0.1906755566596985, "step": 2635, "valid_targets_mean": 5690.4, "valid_targets_min": 1583 }, { "epoch": 4.723366159355416, "grad_norm": 0.6789549439651793, "learning_rate": 1.1588537881178902e-05, "loss": 0.2693, "loss_nan_ranks": 0, "loss_rank_avg": 0.11652162671089172, "step": 2640, "valid_targets_mean": 2992.8, "valid_targets_min": 1505 }, { "epoch": 4.732318710832587, "grad_norm": 0.6723833109915706, "learning_rate": 1.150767220580444e-05, "loss": 0.2652, "loss_nan_ranks": 0, "loss_rank_avg": 0.11995535343885422, "step": 2645, "valid_targets_mean": 3536.5, "valid_targets_min": 1642 }, { "epoch": 4.741271262309758, "grad_norm": 0.6575823926090214, "learning_rate": 1.1426975548731329e-05, "loss": 0.2759, "loss_nan_ranks": 0, "loss_rank_avg": 0.10528416931629181, "step": 2650, "valid_targets_mean": 3233.6, "valid_targets_min": 1417 }, { "epoch": 4.7502238137869295, "grad_norm": 0.8973962588630344, "learning_rate": 1.1346449516022395e-05, "loss": 0.2694, "loss_nan_ranks": 0, "loss_rank_avg": 0.13312417268753052, "step": 2655, "valid_targets_mean": 2539.0, "valid_targets_min": 1387 }, { "epoch": 4.7591763652641, "grad_norm": 0.7406132454253875, "learning_rate": 1.1266095710344611e-05, "loss": 0.277, "loss_nan_ranks": 0, "loss_rank_avg": 0.11993972957134247, "step": 2660, "valid_targets_mean": 2144.9, "valid_targets_min": 1320 }, { "epoch": 4.768128916741271, "grad_norm": 0.6553369560744424, "learning_rate": 1.1185915730937209e-05, "loss": 0.2665, "loss_nan_ranks": 0, "loss_rank_avg": 0.2034987509250641, "step": 2665, "valid_targets_mean": 4664.8, "valid_targets_min": 2213 }, { "epoch": 4.777081468218443, "grad_norm": 0.6504080770189988, "learning_rate": 1.1105911173579831e-05, "loss": 0.2553, "loss_nan_ranks": 0, "loss_rank_avg": 0.13247156143188477, "step": 2670, "valid_targets_mean": 3853.6, "valid_targets_min": 1582 }, { "epoch": 4.786034019695613, "grad_norm": 0.5396966396231404, "learning_rate": 1.1026083630560814e-05, "loss": 0.2622, "loss_nan_ranks": 0, "loss_rank_avg": 0.13336597383022308, "step": 2675, "valid_targets_mean": 4759.8, "valid_targets_min": 1589 }, { "epoch": 4.794986571172784, "grad_norm": 0.7028031847571087, "learning_rate": 1.0946434690645446e-05, "loss": 0.2942, "loss_nan_ranks": 0, "loss_rank_avg": 0.11444665491580963, "step": 2680, "valid_targets_mean": 2722.8, "valid_targets_min": 957 }, { "epoch": 4.803939122649956, "grad_norm": 0.7611209196171498, "learning_rate": 1.08669659390444e-05, "loss": 0.2674, "loss_nan_ranks": 0, "loss_rank_avg": 0.15461182594299316, "step": 2685, "valid_targets_mean": 2940.1, "valid_targets_min": 1102 }, { "epoch": 4.812891674127126, "grad_norm": 0.4826017225952945, "learning_rate": 1.0787678957382124e-05, "loss": 0.2717, "loss_nan_ranks": 0, "loss_rank_avg": 0.14187920093536377, "step": 2690, "valid_targets_mean": 7101.1, "valid_targets_min": 2404 }, { "epoch": 4.8218442256042975, "grad_norm": 0.6866006226835454, "learning_rate": 1.0708575323665422e-05, "loss": 0.2911, "loss_nan_ranks": 0, "loss_rank_avg": 0.22017309069633484, "step": 2695, "valid_targets_mean": 4468.1, "valid_targets_min": 945 }, { "epoch": 4.830796777081468, "grad_norm": 0.5309211399639769, "learning_rate": 1.062965661225201e-05, "loss": 0.287, "loss_nan_ranks": 0, "loss_rank_avg": 0.2241315245628357, "step": 2700, "valid_targets_mean": 7465.5, "valid_targets_min": 2375 }, { "epoch": 4.839749328558639, "grad_norm": 0.4591025984323562, "learning_rate": 1.0550924393819204e-05, "loss": 0.2628, "loss_nan_ranks": 0, "loss_rank_avg": 0.11950083076953888, "step": 2705, "valid_targets_mean": 7293.9, "valid_targets_min": 1849 }, { "epoch": 4.84870188003581, "grad_norm": 0.6619076366623318, "learning_rate": 1.0472380235332631e-05, "loss": 0.286, "loss_nan_ranks": 0, "loss_rank_avg": 0.22019797563552856, "step": 2710, "valid_targets_mean": 4832.2, "valid_targets_min": 1383 }, { "epoch": 4.857654431512981, "grad_norm": 0.5843763984853266, "learning_rate": 1.0394025700015064e-05, "loss": 0.2837, "loss_nan_ranks": 0, "loss_rank_avg": 0.13572683930397034, "step": 2715, "valid_targets_mean": 5376.1, "valid_targets_min": 603 }, { "epoch": 4.866606982990152, "grad_norm": 0.7344743693867272, "learning_rate": 1.0315862347315314e-05, "loss": 0.2768, "loss_nan_ranks": 0, "loss_rank_avg": 0.16285094618797302, "step": 2720, "valid_targets_mean": 2709.2, "valid_targets_min": 715 }, { "epoch": 4.875559534467323, "grad_norm": 0.6503799281847995, "learning_rate": 1.0237891732877202e-05, "loss": 0.2572, "loss_nan_ranks": 0, "loss_rank_avg": 0.07052436470985413, "step": 2725, "valid_targets_mean": 2046.9, "valid_targets_min": 984 }, { "epoch": 4.884512085944494, "grad_norm": 0.617330707981824, "learning_rate": 1.0160115408508533e-05, "loss": 0.2828, "loss_nan_ranks": 0, "loss_rank_avg": 0.12248671799898148, "step": 2730, "valid_targets_mean": 4232.9, "valid_targets_min": 1337 }, { "epoch": 4.8934646374216655, "grad_norm": 0.7526164512433189, "learning_rate": 1.008253492215031e-05, "loss": 0.2639, "loss_nan_ranks": 0, "loss_rank_avg": 0.12305112183094025, "step": 2735, "valid_targets_mean": 2726.4, "valid_targets_min": 1245 }, { "epoch": 4.902417188898836, "grad_norm": 0.7644756910958415, "learning_rate": 1.0005151817845853e-05, "loss": 0.2853, "loss_nan_ranks": 0, "loss_rank_avg": 0.1255050152540207, "step": 2740, "valid_targets_mean": 3517.9, "valid_targets_min": 1480 }, { "epoch": 4.911369740376007, "grad_norm": 0.697384124011533, "learning_rate": 9.927967635710087e-06, "loss": 0.2894, "loss_nan_ranks": 0, "loss_rank_avg": 0.198576420545578, "step": 2745, "valid_targets_mean": 3570.9, "valid_targets_min": 1700 }, { "epoch": 4.920322291853179, "grad_norm": 0.6518775685954262, "learning_rate": 9.850983911898913e-06, "loss": 0.2784, "loss_nan_ranks": 0, "loss_rank_avg": 0.13477128744125366, "step": 2750, "valid_targets_mean": 3412.9, "valid_targets_min": 1245 }, { "epoch": 4.929274843330349, "grad_norm": 0.5702427451034175, "learning_rate": 9.774202178578592e-06, "loss": 0.2736, "loss_nan_ranks": 0, "loss_rank_avg": 0.13000229001045227, "step": 2755, "valid_targets_mean": 5218.1, "valid_targets_min": 867 }, { "epoch": 4.93822739480752, "grad_norm": 0.5856656942790103, "learning_rate": 9.69762396389529e-06, "loss": 0.2932, "loss_nan_ranks": 0, "loss_rank_avg": 0.17482590675354004, "step": 2760, "valid_targets_mean": 6087.2, "valid_targets_min": 309 }, { "epoch": 4.947179946284691, "grad_norm": 0.5588495480516651, "learning_rate": 9.621250791944659e-06, "loss": 0.279, "loss_nan_ranks": 0, "loss_rank_avg": 0.14949437975883484, "step": 2765, "valid_targets_mean": 6034.0, "valid_targets_min": 2237 }, { "epoch": 4.956132497761862, "grad_norm": 0.6552422528340169, "learning_rate": 9.545084182741476e-06, "loss": 0.2758, "loss_nan_ranks": 0, "loss_rank_avg": 0.13703200221061707, "step": 2770, "valid_targets_mean": 4118.9, "valid_targets_min": 1240 }, { "epoch": 4.9650850492390335, "grad_norm": 0.6357647022187265, "learning_rate": 9.469125652189403e-06, "loss": 0.2812, "loss_nan_ranks": 0, "loss_rank_avg": 0.16705867648124695, "step": 2775, "valid_targets_mean": 4768.6, "valid_targets_min": 1812 }, { "epoch": 4.974037600716204, "grad_norm": 0.6226941191762654, "learning_rate": 9.393376712050847e-06, "loss": 0.28, "loss_nan_ranks": 0, "loss_rank_avg": 0.10897770524024963, "step": 2780, "valid_targets_mean": 3234.6, "valid_targets_min": 1360 }, { "epoch": 4.982990152193375, "grad_norm": 0.6967866479605265, "learning_rate": 9.317838869916835e-06, "loss": 0.2968, "loss_nan_ranks": 0, "loss_rank_avg": 0.13590985536575317, "step": 2785, "valid_targets_mean": 3151.5, "valid_targets_min": 1099 }, { "epoch": 4.991942703670546, "grad_norm": 0.7032441654198661, "learning_rate": 9.242513629177033e-06, "loss": 0.2618, "loss_nan_ranks": 0, "loss_rank_avg": 0.09712253510951996, "step": 2790, "valid_targets_mean": 2091.2, "valid_targets_min": 1157 }, { "epoch": 5.0, "grad_norm": 0.8998685532132251, "learning_rate": 9.167402488989784e-06, "loss": 0.2633, "loss_nan_ranks": 0, "loss_rank_avg": 0.21871262788772583, "step": 2795, "valid_targets_mean": 3141.6, "valid_targets_min": 1243 }, { "epoch": 5.008952551477171, "grad_norm": 0.5672203119629013, "learning_rate": 9.092506944252344e-06, "loss": 0.2481, "loss_nan_ranks": 0, "loss_rank_avg": 0.09469739347696304, "step": 2800, "valid_targets_mean": 3623.1, "valid_targets_min": 1407 }, { "epoch": 5.017905102954342, "grad_norm": 0.655519497598404, "learning_rate": 9.017828485571044e-06, "loss": 0.2587, "loss_nan_ranks": 0, "loss_rank_avg": 0.17740251123905182, "step": 2805, "valid_targets_mean": 4623.1, "valid_targets_min": 2129 }, { "epoch": 5.026857654431513, "grad_norm": 0.7020677912715662, "learning_rate": 8.943368599231706e-06, "loss": 0.2697, "loss_nan_ranks": 0, "loss_rank_avg": 0.13922971487045288, "step": 2810, "valid_targets_mean": 3362.6, "valid_targets_min": 479 }, { "epoch": 5.035810205908684, "grad_norm": 0.825644641170174, "learning_rate": 8.869128767169986e-06, "loss": 0.2573, "loss_nan_ranks": 0, "loss_rank_avg": 0.1696254163980484, "step": 2815, "valid_targets_mean": 3811.8, "valid_targets_min": 1768 }, { "epoch": 5.044762757385855, "grad_norm": 0.8818205726342686, "learning_rate": 8.79511046694194e-06, "loss": 0.2848, "loss_nan_ranks": 0, "loss_rank_avg": 0.13734868168830872, "step": 2820, "valid_targets_mean": 2140.6, "valid_targets_min": 1360 }, { "epoch": 5.053715308863026, "grad_norm": 0.702209345246406, "learning_rate": 8.721315171694591e-06, "loss": 0.2796, "loss_nan_ranks": 0, "loss_rank_avg": 0.18483301997184753, "step": 2825, "valid_targets_mean": 6754.9, "valid_targets_min": 1059 }, { "epoch": 5.062667860340197, "grad_norm": 0.6393303273760027, "learning_rate": 8.647744350136612e-06, "loss": 0.2655, "loss_nan_ranks": 0, "loss_rank_avg": 0.11104267835617065, "step": 2830, "valid_targets_mean": 3685.9, "valid_targets_min": 1589 }, { "epoch": 5.071620411817368, "grad_norm": 0.5255206558374389, "learning_rate": 8.574399466509085e-06, "loss": 0.2881, "loss_nan_ranks": 0, "loss_rank_avg": 0.10467648506164551, "step": 2835, "valid_targets_mean": 5690.4, "valid_targets_min": 2675 }, { "epoch": 5.080572963294539, "grad_norm": 0.7143778521850589, "learning_rate": 8.501281980556369e-06, "loss": 0.266, "loss_nan_ranks": 0, "loss_rank_avg": 0.10567007958889008, "step": 2840, "valid_targets_mean": 2356.2, "valid_targets_min": 650 }, { "epoch": 5.08952551477171, "grad_norm": 0.716682380290392, "learning_rate": 8.428393347497057e-06, "loss": 0.3047, "loss_nan_ranks": 0, "loss_rank_avg": 0.16459281742572784, "step": 2845, "valid_targets_mean": 3752.9, "valid_targets_min": 943 }, { "epoch": 5.098478066248881, "grad_norm": 0.5273948530519541, "learning_rate": 8.355735017995011e-06, "loss": 0.2467, "loss_nan_ranks": 0, "loss_rank_avg": 0.13910041749477386, "step": 2850, "valid_targets_mean": 6443.0, "valid_targets_min": 1560 }, { "epoch": 5.107430617726052, "grad_norm": 0.6510951941881681, "learning_rate": 8.283308438130458e-06, "loss": 0.2723, "loss_nan_ranks": 0, "loss_rank_avg": 0.1511838138103485, "step": 2855, "valid_targets_mean": 4896.4, "valid_targets_min": 1342 }, { "epoch": 5.116383169203223, "grad_norm": 0.6858690794166993, "learning_rate": 8.211115049371266e-06, "loss": 0.2588, "loss_nan_ranks": 0, "loss_rank_avg": 0.12362384796142578, "step": 2860, "valid_targets_mean": 2373.6, "valid_targets_min": 957 }, { "epoch": 5.125335720680394, "grad_norm": 0.5535898753458209, "learning_rate": 8.13915628854419e-06, "loss": 0.2864, "loss_nan_ranks": 0, "loss_rank_avg": 0.07326360791921616, "step": 2865, "valid_targets_mean": 3076.2, "valid_targets_min": 634 }, { "epoch": 5.134288272157565, "grad_norm": 0.7396227483650418, "learning_rate": 8.067433587806336e-06, "loss": 0.2736, "loss_nan_ranks": 0, "loss_rank_avg": 0.11240927875041962, "step": 2870, "valid_targets_mean": 2971.2, "valid_targets_min": 1502 }, { "epoch": 5.143240823634736, "grad_norm": 0.7846909642291244, "learning_rate": 7.995948374616628e-06, "loss": 0.2662, "loss_nan_ranks": 0, "loss_rank_avg": 0.20373129844665527, "step": 2875, "valid_targets_mean": 3556.4, "valid_targets_min": 1123 }, { "epoch": 5.1521933751119064, "grad_norm": 0.6285062997656536, "learning_rate": 7.924702071707386e-06, "loss": 0.2546, "loss_nan_ranks": 0, "loss_rank_avg": 0.14518675208091736, "step": 2880, "valid_targets_mean": 4632.1, "valid_targets_min": 1531 }, { "epoch": 5.161145926589078, "grad_norm": 0.6039304591242447, "learning_rate": 7.853696097056037e-06, "loss": 0.2948, "loss_nan_ranks": 0, "loss_rank_avg": 0.11315350234508514, "step": 2885, "valid_targets_mean": 4218.2, "valid_targets_min": 2653 }, { "epoch": 5.170098478066249, "grad_norm": 0.8183337860784501, "learning_rate": 7.782931863856888e-06, "loss": 0.2621, "loss_nan_ranks": 0, "loss_rank_avg": 0.12211750447750092, "step": 2890, "valid_targets_mean": 2672.9, "valid_targets_min": 1298 }, { "epoch": 5.17905102954342, "grad_norm": 0.7130275214913603, "learning_rate": 7.71241078049298e-06, "loss": 0.2751, "loss_nan_ranks": 0, "loss_rank_avg": 0.09092959016561508, "step": 2895, "valid_targets_mean": 2564.5, "valid_targets_min": 1837 }, { "epoch": 5.188003581020591, "grad_norm": 0.5935134877912135, "learning_rate": 7.642134250508069e-06, "loss": 0.24, "loss_nan_ranks": 0, "loss_rank_avg": 0.15817828476428986, "step": 2900, "valid_targets_mean": 5829.6, "valid_targets_min": 1443 }, { "epoch": 5.196956132497762, "grad_norm": 0.8005018784062845, "learning_rate": 7.57210367257871e-06, "loss": 0.2573, "loss_nan_ranks": 0, "loss_rank_avg": 0.10520976781845093, "step": 2905, "valid_targets_mean": 1867.4, "valid_targets_min": 1007 }, { "epoch": 5.205908683974933, "grad_norm": 0.798936430838001, "learning_rate": 7.502320440486399e-06, "loss": 0.2439, "loss_nan_ranks": 0, "loss_rank_avg": 0.1396452784538269, "step": 2910, "valid_targets_mean": 3387.9, "valid_targets_min": 1281 }, { "epoch": 5.214861235452104, "grad_norm": 0.6016086885660464, "learning_rate": 7.4327859430898445e-06, "loss": 0.2552, "loss_nan_ranks": 0, "loss_rank_avg": 0.11716702580451965, "step": 2915, "valid_targets_mean": 4086.6, "valid_targets_min": 2135 }, { "epoch": 5.2238137869292744, "grad_norm": 0.6393638894017067, "learning_rate": 7.363501564297302e-06, "loss": 0.2665, "loss_nan_ranks": 0, "loss_rank_avg": 0.13421833515167236, "step": 2920, "valid_targets_mean": 3354.6, "valid_targets_min": 1245 }, { "epoch": 5.232766338406446, "grad_norm": 0.8074938423836445, "learning_rate": 7.294468683039058e-06, "loss": 0.2741, "loss_nan_ranks": 0, "loss_rank_avg": 0.1262279748916626, "step": 2925, "valid_targets_mean": 2581.8, "valid_targets_min": 1215 }, { "epoch": 5.241718889883617, "grad_norm": 0.8329732110149718, "learning_rate": 7.225688673239981e-06, "loss": 0.2614, "loss_nan_ranks": 0, "loss_rank_avg": 0.16714711487293243, "step": 2930, "valid_targets_mean": 2932.5, "valid_targets_min": 1553 }, { "epoch": 5.250671441360788, "grad_norm": 0.7395911133371526, "learning_rate": 7.1571629037921804e-06, "loss": 0.2699, "loss_nan_ranks": 0, "loss_rank_avg": 0.13582395017147064, "step": 2935, "valid_targets_mean": 3136.4, "valid_targets_min": 1113 }, { "epoch": 5.259623992837959, "grad_norm": 0.614797462595206, "learning_rate": 7.088892738527731e-06, "loss": 0.2588, "loss_nan_ranks": 0, "loss_rank_avg": 0.16834554076194763, "step": 2940, "valid_targets_mean": 4725.5, "valid_targets_min": 1186 }, { "epoch": 5.26857654431513, "grad_norm": 0.7133096956091478, "learning_rate": 7.020879536191571e-06, "loss": 0.262, "loss_nan_ranks": 0, "loss_rank_avg": 0.159225195646286, "step": 2945, "valid_targets_mean": 4072.2, "valid_targets_min": 1758 }, { "epoch": 5.277529095792301, "grad_norm": 0.7046101552726547, "learning_rate": 6.953124650414447e-06, "loss": 0.256, "loss_nan_ranks": 0, "loss_rank_avg": 0.22066622972488403, "step": 2950, "valid_targets_mean": 4210.6, "valid_targets_min": 1025 }, { "epoch": 5.286481647269472, "grad_norm": 0.669736961464681, "learning_rate": 6.885629429685943e-06, "loss": 0.2647, "loss_nan_ranks": 0, "loss_rank_avg": 0.1097680926322937, "step": 2955, "valid_targets_mean": 3142.9, "valid_targets_min": 1246 }, { "epoch": 5.2954341987466425, "grad_norm": 0.8029811043618871, "learning_rate": 6.818395217327696e-06, "loss": 0.2474, "loss_nan_ranks": 0, "loss_rank_avg": 0.14252065122127533, "step": 2960, "valid_targets_mean": 2978.2, "valid_targets_min": 1504 }, { "epoch": 5.304386750223814, "grad_norm": 0.7781260969246138, "learning_rate": 6.751423351466604e-06, "loss": 0.2716, "loss_nan_ranks": 0, "loss_rank_avg": 0.10851228982210159, "step": 2965, "valid_targets_mean": 2605.2, "valid_targets_min": 1713 }, { "epoch": 5.313339301700985, "grad_norm": 0.6460543913806297, "learning_rate": 6.684715165008242e-06, "loss": 0.2795, "loss_nan_ranks": 0, "loss_rank_avg": 0.17115241289138794, "step": 2970, "valid_targets_mean": 4524.1, "valid_targets_min": 1583 }, { "epoch": 5.322291853178156, "grad_norm": 0.7163531771180065, "learning_rate": 6.618271985610316e-06, "loss": 0.2527, "loss_nan_ranks": 0, "loss_rank_avg": 0.08804437518119812, "step": 2975, "valid_targets_mean": 2492.9, "valid_targets_min": 1156 }, { "epoch": 5.331244404655327, "grad_norm": 0.6507792520937868, "learning_rate": 6.552095135656211e-06, "loss": 0.2641, "loss_nan_ranks": 0, "loss_rank_avg": 0.17436163127422333, "step": 2980, "valid_targets_mean": 4282.0, "valid_targets_min": 1098 }, { "epoch": 5.340196956132498, "grad_norm": 0.6625767763231452, "learning_rate": 6.486185932228732e-06, "loss": 0.2788, "loss_nan_ranks": 0, "loss_rank_avg": 0.1317645013332367, "step": 2985, "valid_targets_mean": 3719.6, "valid_targets_min": 1221 }, { "epoch": 5.349149507609669, "grad_norm": 0.8136256888520679, "learning_rate": 6.420545687083823e-06, "loss": 0.2634, "loss_nan_ranks": 0, "loss_rank_avg": 0.14313414692878723, "step": 2990, "valid_targets_mean": 2730.9, "valid_targets_min": 1379 }, { "epoch": 5.35810205908684, "grad_norm": 0.704770853254314, "learning_rate": 6.355175706624521e-06, "loss": 0.2547, "loss_nan_ranks": 0, "loss_rank_avg": 0.12149710953235626, "step": 2995, "valid_targets_mean": 3353.9, "valid_targets_min": 1524 }, { "epoch": 5.3670546105640105, "grad_norm": 0.7794678826905497, "learning_rate": 6.290077291874923e-06, "loss": 0.281, "loss_nan_ranks": 0, "loss_rank_avg": 0.20259982347488403, "step": 3000, "valid_targets_mean": 3896.9, "valid_targets_min": 380 }, { "epoch": 5.376007162041182, "grad_norm": 0.5949025014278967, "learning_rate": 6.225251738454281e-06, "loss": 0.2535, "loss_nan_ranks": 0, "loss_rank_avg": 0.09551064670085907, "step": 3005, "valid_targets_mean": 2741.0, "valid_targets_min": 1655 }, { "epoch": 5.384959713518353, "grad_norm": 0.6274746645978216, "learning_rate": 6.160700336551246e-06, "loss": 0.2566, "loss_nan_ranks": 0, "loss_rank_avg": 0.12926769256591797, "step": 3010, "valid_targets_mean": 3956.5, "valid_targets_min": 1077 }, { "epoch": 5.393912264995524, "grad_norm": 0.5995098175946255, "learning_rate": 6.096424370898186e-06, "loss": 0.2635, "loss_nan_ranks": 0, "loss_rank_avg": 0.13776710629463196, "step": 3015, "valid_targets_mean": 5238.2, "valid_targets_min": 1205 }, { "epoch": 5.402864816472695, "grad_norm": 0.8693786800154273, "learning_rate": 6.032425120745586e-06, "loss": 0.2632, "loss_nan_ranks": 0, "loss_rank_avg": 0.11495324224233627, "step": 3020, "valid_targets_mean": 2983.0, "valid_targets_min": 1227 }, { "epoch": 5.411817367949865, "grad_norm": 0.4417681435455645, "learning_rate": 5.968703859836615e-06, "loss": 0.2571, "loss_nan_ranks": 0, "loss_rank_avg": 0.08964274823665619, "step": 3025, "valid_targets_mean": 6241.9, "valid_targets_min": 1478 }, { "epoch": 5.420769919427037, "grad_norm": 0.6451109995686765, "learning_rate": 5.905261856381779e-06, "loss": 0.2792, "loss_nan_ranks": 0, "loss_rank_avg": 0.1320190727710724, "step": 3030, "valid_targets_mean": 3444.6, "valid_targets_min": 1422 }, { "epoch": 5.429722470904208, "grad_norm": 0.5982446796929841, "learning_rate": 5.8421003730336635e-06, "loss": 0.2664, "loss_nan_ranks": 0, "loss_rank_avg": 0.19169670343399048, "step": 3035, "valid_targets_mean": 4772.6, "valid_targets_min": 1219 }, { "epoch": 5.4386750223813785, "grad_norm": 1.0526800510164407, "learning_rate": 5.77922066686182e-06, "loss": 0.2649, "loss_nan_ranks": 0, "loss_rank_avg": 0.129215806722641, "step": 3040, "valid_targets_mean": 3020.8, "valid_targets_min": 1197 }, { "epoch": 5.44762757385855, "grad_norm": 0.710300937036674, "learning_rate": 5.716623989327723e-06, "loss": 0.2453, "loss_nan_ranks": 0, "loss_rank_avg": 0.1642998456954956, "step": 3045, "valid_targets_mean": 4067.4, "valid_targets_min": 854 }, { "epoch": 5.456580125335721, "grad_norm": 0.6236049531620286, "learning_rate": 5.654311586259882e-06, "loss": 0.2696, "loss_nan_ranks": 0, "loss_rank_avg": 0.14742004871368408, "step": 3050, "valid_targets_mean": 4697.9, "valid_targets_min": 1989 }, { "epoch": 5.465532676812892, "grad_norm": 0.9100445506977155, "learning_rate": 5.592284697829049e-06, "loss": 0.262, "loss_nan_ranks": 0, "loss_rank_avg": 0.12023288756608963, "step": 3055, "valid_targets_mean": 2732.1, "valid_targets_min": 629 }, { "epoch": 5.474485228290063, "grad_norm": 0.7130523821840068, "learning_rate": 5.5305445585235315e-06, "loss": 0.2702, "loss_nan_ranks": 0, "loss_rank_avg": 0.11885958164930344, "step": 3060, "valid_targets_mean": 2787.4, "valid_targets_min": 1352 }, { "epoch": 5.483437779767233, "grad_norm": 0.6155452380583275, "learning_rate": 5.469092397124609e-06, "loss": 0.2556, "loss_nan_ranks": 0, "loss_rank_avg": 0.14290834963321686, "step": 3065, "valid_targets_mean": 5837.5, "valid_targets_min": 1530 }, { "epoch": 5.492390331244405, "grad_norm": 0.6357781709172484, "learning_rate": 5.407929436682098e-06, "loss": 0.2854, "loss_nan_ranks": 0, "loss_rank_avg": 0.10490871220827103, "step": 3070, "valid_targets_mean": 3321.1, "valid_targets_min": 1508 }, { "epoch": 5.501342882721576, "grad_norm": 0.8268851686010698, "learning_rate": 5.347056894490006e-06, "loss": 0.2545, "loss_nan_ranks": 0, "loss_rank_avg": 0.14326724410057068, "step": 3075, "valid_targets_mean": 3260.1, "valid_targets_min": 1403 }, { "epoch": 5.5102954341987465, "grad_norm": 0.5411962844748759, "learning_rate": 5.286475982062283e-06, "loss": 0.2506, "loss_nan_ranks": 0, "loss_rank_avg": 0.12881606817245483, "step": 3080, "valid_targets_mean": 6029.1, "valid_targets_min": 1722 }, { "epoch": 5.519247985675918, "grad_norm": 0.6334671165729598, "learning_rate": 5.226187905108746e-06, "loss": 0.2562, "loss_nan_ranks": 0, "loss_rank_avg": 0.12549631297588348, "step": 3085, "valid_targets_mean": 4009.8, "valid_targets_min": 2518 }, { "epoch": 5.528200537153088, "grad_norm": 0.6692364678732721, "learning_rate": 5.166193863511046e-06, "loss": 0.2607, "loss_nan_ranks": 0, "loss_rank_avg": 0.15974244475364685, "step": 3090, "valid_targets_mean": 4663.0, "valid_targets_min": 1498 }, { "epoch": 5.53715308863026, "grad_norm": 0.6288056109133601, "learning_rate": 5.106495051298815e-06, "loss": 0.2453, "loss_nan_ranks": 0, "loss_rank_avg": 0.16460061073303223, "step": 3095, "valid_targets_mean": 5248.2, "valid_targets_min": 1210 }, { "epoch": 5.546105640107431, "grad_norm": 0.6708522131884734, "learning_rate": 5.047092656625887e-06, "loss": 0.2741, "loss_nan_ranks": 0, "loss_rank_avg": 0.1474558711051941, "step": 3100, "valid_targets_mean": 3772.6, "valid_targets_min": 1412 }, { "epoch": 5.555058191584601, "grad_norm": 0.6267068759154054, "learning_rate": 4.98798786174667e-06, "loss": 0.2546, "loss_nan_ranks": 0, "loss_rank_avg": 0.10332757234573364, "step": 3105, "valid_targets_mean": 3453.0, "valid_targets_min": 1433 }, { "epoch": 5.564010743061773, "grad_norm": 0.6319201392464182, "learning_rate": 4.9291818429925585e-06, "loss": 0.2739, "loss_nan_ranks": 0, "loss_rank_avg": 0.10445370525121689, "step": 3110, "valid_targets_mean": 3067.1, "valid_targets_min": 1353 }, { "epoch": 5.572963294538944, "grad_norm": 0.5676958670427478, "learning_rate": 4.8706757707486075e-06, "loss": 0.2728, "loss_nan_ranks": 0, "loss_rank_avg": 0.09762459993362427, "step": 3115, "valid_targets_mean": 4044.8, "valid_targets_min": 1640 }, { "epoch": 5.5819158460161145, "grad_norm": 0.6600426946715785, "learning_rate": 4.812470809430179e-06, "loss": 0.2641, "loss_nan_ranks": 0, "loss_rank_avg": 0.17617090046405792, "step": 3120, "valid_targets_mean": 5532.6, "valid_targets_min": 1143 }, { "epoch": 5.590868397493286, "grad_norm": 0.72512681265544, "learning_rate": 4.754568117459788e-06, "loss": 0.2521, "loss_nan_ranks": 0, "loss_rank_avg": 0.13752184808254242, "step": 3125, "valid_targets_mean": 3298.5, "valid_targets_min": 1072 }, { "epoch": 5.599820948970456, "grad_norm": 0.7546139947956615, "learning_rate": 4.69696884724403e-06, "loss": 0.2624, "loss_nan_ranks": 0, "loss_rank_avg": 0.13179543614387512, "step": 3130, "valid_targets_mean": 2606.4, "valid_targets_min": 954 }, { "epoch": 5.608773500447628, "grad_norm": 0.6414231679701241, "learning_rate": 4.639674145150679e-06, "loss": 0.2689, "loss_nan_ranks": 0, "loss_rank_avg": 0.13612650334835052, "step": 3135, "valid_targets_mean": 4690.4, "valid_targets_min": 1975 }, { "epoch": 5.617726051924799, "grad_norm": 0.7849198197821255, "learning_rate": 4.582685151485826e-06, "loss": 0.2479, "loss_nan_ranks": 0, "loss_rank_avg": 0.12271968275308609, "step": 3140, "valid_targets_mean": 2440.4, "valid_targets_min": 1279 }, { "epoch": 5.626678603401969, "grad_norm": 0.7190190450522136, "learning_rate": 4.526003000471238e-06, "loss": 0.2751, "loss_nan_ranks": 0, "loss_rank_avg": 0.10943076759576797, "step": 3145, "valid_targets_mean": 3442.4, "valid_targets_min": 1326 }, { "epoch": 5.635631154879141, "grad_norm": 0.6723105509161403, "learning_rate": 4.469628820221723e-06, "loss": 0.2407, "loss_nan_ranks": 0, "loss_rank_avg": 0.09454697370529175, "step": 3150, "valid_targets_mean": 2455.6, "valid_targets_min": 1625 }, { "epoch": 5.644583706356311, "grad_norm": 0.6951817724940638, "learning_rate": 4.4135637327227365e-06, "loss": 0.2548, "loss_nan_ranks": 0, "loss_rank_avg": 0.13040387630462646, "step": 3155, "valid_targets_mean": 3532.4, "valid_targets_min": 1533 }, { "epoch": 5.6535362578334825, "grad_norm": 0.7380519857603212, "learning_rate": 4.357808853808014e-06, "loss": 0.2695, "loss_nan_ranks": 0, "loss_rank_avg": 0.2020113617181778, "step": 3160, "valid_targets_mean": 4735.9, "valid_targets_min": 2317 }, { "epoch": 5.662488809310654, "grad_norm": 0.6194983497856827, "learning_rate": 4.302365293137383e-06, "loss": 0.2823, "loss_nan_ranks": 0, "loss_rank_avg": 0.09762684255838394, "step": 3165, "valid_targets_mean": 4547.6, "valid_targets_min": 592 }, { "epoch": 5.671441360787824, "grad_norm": 0.6052656519002572, "learning_rate": 4.247234154174649e-06, "loss": 0.2613, "loss_nan_ranks": 0, "loss_rank_avg": 0.10471494495868683, "step": 3170, "valid_targets_mean": 4168.4, "valid_targets_min": 1212 }, { "epoch": 5.680393912264996, "grad_norm": 0.6514165243579992, "learning_rate": 4.192416534165666e-06, "loss": 0.2783, "loss_nan_ranks": 0, "loss_rank_avg": 0.12467285245656967, "step": 3175, "valid_targets_mean": 4404.5, "valid_targets_min": 2024 }, { "epoch": 5.689346463742167, "grad_norm": 0.5202351850880886, "learning_rate": 4.137913524116488e-06, "loss": 0.2734, "loss_nan_ranks": 0, "loss_rank_avg": 0.11434194445610046, "step": 3180, "valid_targets_mean": 4798.5, "valid_targets_min": 734 }, { "epoch": 5.698299015219337, "grad_norm": 0.5713811257106961, "learning_rate": 4.083726208771653e-06, "loss": 0.2755, "loss_nan_ranks": 0, "loss_rank_avg": 0.13401255011558533, "step": 3185, "valid_targets_mean": 5045.8, "valid_targets_min": 2507 }, { "epoch": 5.707251566696509, "grad_norm": 0.6411090621867449, "learning_rate": 4.0298556665925996e-06, "loss": 0.2768, "loss_nan_ranks": 0, "loss_rank_avg": 0.14346866309642792, "step": 3190, "valid_targets_mean": 3961.9, "valid_targets_min": 2058 }, { "epoch": 5.716204118173679, "grad_norm": 0.7831831361437512, "learning_rate": 3.976302969736183e-06, "loss": 0.2535, "loss_nan_ranks": 0, "loss_rank_avg": 0.09419474005699158, "step": 3195, "valid_targets_mean": 2366.5, "valid_targets_min": 1530 }, { "epoch": 5.7251566696508505, "grad_norm": 0.5953201952601799, "learning_rate": 3.923069184033357e-06, "loss": 0.2622, "loss_nan_ranks": 0, "loss_rank_avg": 0.14828859269618988, "step": 3200, "valid_targets_mean": 5864.6, "valid_targets_min": 1024 }, { "epoch": 5.734109221128022, "grad_norm": 0.6184407471177551, "learning_rate": 3.870155368967963e-06, "loss": 0.2494, "loss_nan_ranks": 0, "loss_rank_avg": 0.13603097200393677, "step": 3205, "valid_targets_mean": 4392.2, "valid_targets_min": 1660 }, { "epoch": 5.743061772605192, "grad_norm": 0.7344526439829354, "learning_rate": 3.8175625776556354e-06, "loss": 0.2678, "loss_nan_ranks": 0, "loss_rank_avg": 0.14963099360466003, "step": 3210, "valid_targets_mean": 3856.8, "valid_targets_min": 1296 }, { "epoch": 5.752014324082364, "grad_norm": 0.6323484235013329, "learning_rate": 3.76529185682283e-06, "loss": 0.2642, "loss_nan_ranks": 0, "loss_rank_avg": 0.13975292444229126, "step": 3215, "valid_targets_mean": 4587.0, "valid_targets_min": 2248 }, { "epoch": 5.760966875559534, "grad_norm": 0.7162533875016649, "learning_rate": 3.7133442467860215e-06, "loss": 0.271, "loss_nan_ranks": 0, "loss_rank_avg": 0.15536366403102875, "step": 3220, "valid_targets_mean": 4356.5, "valid_targets_min": 1482 }, { "epoch": 5.769919427036705, "grad_norm": 0.6697775409439238, "learning_rate": 3.6617207814309686e-06, "loss": 0.266, "loss_nan_ranks": 0, "loss_rank_avg": 0.09813784062862396, "step": 3225, "valid_targets_mean": 2768.2, "valid_targets_min": 1433 }, { "epoch": 5.778871978513877, "grad_norm": 0.724357058918503, "learning_rate": 3.610422488192169e-06, "loss": 0.2633, "loss_nan_ranks": 0, "loss_rank_avg": 0.11302490532398224, "step": 3230, "valid_targets_mean": 3345.9, "valid_targets_min": 1072 }, { "epoch": 5.787824529991047, "grad_norm": 0.8637753559487381, "learning_rate": 3.559450388032355e-06, "loss": 0.2775, "loss_nan_ranks": 0, "loss_rank_avg": 0.09676891565322876, "step": 3235, "valid_targets_mean": 2141.9, "valid_targets_min": 1626 }, { "epoch": 5.7967770814682185, "grad_norm": 0.5678361887713559, "learning_rate": 3.508805495422247e-06, "loss": 0.2635, "loss_nan_ranks": 0, "loss_rank_avg": 0.14245836436748505, "step": 3240, "valid_targets_mean": 4776.8, "valid_targets_min": 1125 }, { "epoch": 5.80572963294539, "grad_norm": 0.8697062311998607, "learning_rate": 3.4584888183203134e-06, "loss": 0.2431, "loss_nan_ranks": 0, "loss_rank_avg": 0.11090271174907684, "step": 3245, "valid_targets_mean": 2297.5, "valid_targets_min": 1552 }, { "epoch": 5.81468218442256, "grad_norm": 0.7206579145760911, "learning_rate": 3.4085013581527295e-06, "loss": 0.2904, "loss_nan_ranks": 0, "loss_rank_avg": 0.08114241808652878, "step": 3250, "valid_targets_mean": 2197.1, "valid_targets_min": 867 }, { "epoch": 5.823634735899732, "grad_norm": 0.962494971346814, "learning_rate": 3.3588441097934223e-06, "loss": 0.262, "loss_nan_ranks": 0, "loss_rank_avg": 0.15923663973808289, "step": 3255, "valid_targets_mean": 2391.8, "valid_targets_min": 1293 }, { "epoch": 5.832587287376903, "grad_norm": 0.6003561256453428, "learning_rate": 3.30951806154431e-06, "loss": 0.2414, "loss_nan_ranks": 0, "loss_rank_avg": 0.11105726659297943, "step": 3260, "valid_targets_mean": 4796.4, "valid_targets_min": 762 }, { "epoch": 5.841539838854073, "grad_norm": 0.6864067176009239, "learning_rate": 3.260524195115595e-06, "loss": 0.2636, "loss_nan_ranks": 0, "loss_rank_avg": 0.10556810349225998, "step": 3265, "valid_targets_mean": 3109.9, "valid_targets_min": 1578 }, { "epoch": 5.850492390331245, "grad_norm": 0.7633968434678636, "learning_rate": 3.2118634856062546e-06, "loss": 0.2734, "loss_nan_ranks": 0, "loss_rank_avg": 0.1667451560497284, "step": 3270, "valid_targets_mean": 3742.0, "valid_targets_min": 2079 }, { "epoch": 5.859444941808415, "grad_norm": 0.901362913650791, "learning_rate": 3.163536901484601e-06, "loss": 0.2657, "loss_nan_ranks": 0, "loss_rank_avg": 0.09401094168424606, "step": 3275, "valid_targets_mean": 2745.1, "valid_targets_min": 406 }, { "epoch": 5.8683974932855865, "grad_norm": 0.5798302684786609, "learning_rate": 3.115545404569045e-06, "loss": 0.2667, "loss_nan_ranks": 0, "loss_rank_avg": 0.1682177037000656, "step": 3280, "valid_targets_mean": 5518.4, "valid_targets_min": 1412 }, { "epoch": 5.877350044762757, "grad_norm": 0.5757168480468727, "learning_rate": 3.0678899500089244e-06, "loss": 0.2489, "loss_nan_ranks": 0, "loss_rank_avg": 0.1087426021695137, "step": 3285, "valid_targets_mean": 4423.0, "valid_targets_min": 2758 }, { "epoch": 5.886302596239928, "grad_norm": 0.6310116283037832, "learning_rate": 3.0205714862655135e-06, "loss": 0.2691, "loss_nan_ranks": 0, "loss_rank_avg": 0.06991326808929443, "step": 3290, "valid_targets_mean": 2434.1, "valid_targets_min": 1352 }, { "epoch": 5.8952551477171, "grad_norm": 0.6840482387720046, "learning_rate": 2.973590955093124e-06, "loss": 0.2523, "loss_nan_ranks": 0, "loss_rank_avg": 0.17993587255477905, "step": 3295, "valid_targets_mean": 4772.0, "valid_targets_min": 1583 }, { "epoch": 5.90420769919427, "grad_norm": 0.6503479570111461, "learning_rate": 2.9269492915203735e-06, "loss": 0.2646, "loss_nan_ranks": 0, "loss_rank_avg": 0.20532022416591644, "step": 3300, "valid_targets_mean": 4907.6, "valid_targets_min": 759 }, { "epoch": 5.913160250671441, "grad_norm": 0.803170965499726, "learning_rate": 2.880647423831591e-06, "loss": 0.2813, "loss_nan_ranks": 0, "loss_rank_avg": 0.09620766341686249, "step": 3305, "valid_targets_mean": 1729.2, "valid_targets_min": 309 }, { "epoch": 5.922112802148613, "grad_norm": 0.6442650027465544, "learning_rate": 2.8346862735483215e-06, "loss": 0.2581, "loss_nan_ranks": 0, "loss_rank_avg": 0.16743940114974976, "step": 3310, "valid_targets_mean": 5283.6, "valid_targets_min": 1357 }, { "epoch": 5.931065353625783, "grad_norm": 0.6545274581161713, "learning_rate": 2.789066755410994e-06, "loss": 0.2544, "loss_nan_ranks": 0, "loss_rank_avg": 0.13862073421478271, "step": 3315, "valid_targets_mean": 4231.5, "valid_targets_min": 1748 }, { "epoch": 5.9400179051029545, "grad_norm": 0.6389435663416849, "learning_rate": 2.7437897773607102e-06, "loss": 0.273, "loss_nan_ranks": 0, "loss_rank_avg": 0.09975261241197586, "step": 3320, "valid_targets_mean": 3778.2, "valid_targets_min": 1710 }, { "epoch": 5.948970456580126, "grad_norm": 0.5835511788435559, "learning_rate": 2.698856240521173e-06, "loss": 0.251, "loss_nan_ranks": 0, "loss_rank_avg": 0.14617975056171417, "step": 3325, "valid_targets_mean": 5683.6, "valid_targets_min": 1113 }, { "epoch": 5.957923008057296, "grad_norm": 0.5665404863664787, "learning_rate": 2.6542670391807667e-06, "loss": 0.2549, "loss_nan_ranks": 0, "loss_rank_avg": 0.1269206702709198, "step": 3330, "valid_targets_mean": 5419.6, "valid_targets_min": 1200 }, { "epoch": 5.966875559534468, "grad_norm": 0.7472897852320771, "learning_rate": 2.610023060774749e-06, "loss": 0.2622, "loss_nan_ranks": 0, "loss_rank_avg": 0.15214401483535767, "step": 3335, "valid_targets_mean": 3904.2, "valid_targets_min": 1457 }, { "epoch": 5.975828111011638, "grad_norm": 0.7742003305228212, "learning_rate": 2.566125185867576e-06, "loss": 0.265, "loss_nan_ranks": 0, "loss_rank_avg": 0.17470315098762512, "step": 3340, "valid_targets_mean": 3845.4, "valid_targets_min": 1932 }, { "epoch": 5.984780662488809, "grad_norm": 0.7491756904261838, "learning_rate": 2.5225742881354043e-06, "loss": 0.2704, "loss_nan_ranks": 0, "loss_rank_avg": 0.12955431640148163, "step": 3345, "valid_targets_mean": 3063.2, "valid_targets_min": 1256 }, { "epoch": 5.993733213965981, "grad_norm": 0.6987549042529995, "learning_rate": 2.479371234348682e-06, "loss": 0.2827, "loss_nan_ranks": 0, "loss_rank_avg": 0.10832779109477997, "step": 3350, "valid_targets_mean": 3335.0, "valid_targets_min": 1000 }, { "epoch": 6.001790510295434, "grad_norm": 0.7069990185531398, "learning_rate": 2.4365168843549e-06, "loss": 0.2712, "loss_nan_ranks": 0, "loss_rank_avg": 0.08464382588863373, "step": 3355, "valid_targets_mean": 3527.0, "valid_targets_min": 1385 }, { "epoch": 6.010743061772605, "grad_norm": 0.6685974475107747, "learning_rate": 2.3940120910614774e-06, "loss": 0.2424, "loss_nan_ranks": 0, "loss_rank_avg": 0.14645615220069885, "step": 3360, "valid_targets_mean": 4492.4, "valid_targets_min": 2039 }, { "epoch": 6.019695613249776, "grad_norm": 0.6914934325979221, "learning_rate": 2.351857700418807e-06, "loss": 0.2627, "loss_nan_ranks": 0, "loss_rank_avg": 0.11661306023597717, "step": 3365, "valid_targets_mean": 3499.0, "valid_targets_min": 1563 }, { "epoch": 6.028648164726947, "grad_norm": 0.621813437866408, "learning_rate": 2.310054551403391e-06, "loss": 0.2594, "loss_nan_ranks": 0, "loss_rank_avg": 0.08839264512062073, "step": 3370, "valid_targets_mean": 2995.2, "valid_targets_min": 747 }, { "epoch": 6.0376007162041185, "grad_norm": 0.7788394346376253, "learning_rate": 2.2686034760011656e-06, "loss": 0.2563, "loss_nan_ranks": 0, "loss_rank_avg": 0.12395849823951721, "step": 3375, "valid_targets_mean": 2545.0, "valid_targets_min": 1173 }, { "epoch": 6.046553267681289, "grad_norm": 0.8526120857062531, "learning_rate": 2.2275052991909218e-06, "loss": 0.2508, "loss_nan_ranks": 0, "loss_rank_avg": 0.13557417690753937, "step": 3380, "valid_targets_mean": 2442.6, "valid_targets_min": 1236 }, { "epoch": 6.05550581915846, "grad_norm": 0.6879366966499265, "learning_rate": 2.186760838927897e-06, "loss": 0.2464, "loss_nan_ranks": 0, "loss_rank_avg": 0.12125202268362045, "step": 3385, "valid_targets_mean": 3931.8, "valid_targets_min": 1224 }, { "epoch": 6.064458370635631, "grad_norm": 0.5909197508211376, "learning_rate": 2.146370906127506e-06, "loss": 0.2528, "loss_nan_ranks": 0, "loss_rank_avg": 0.13690954446792603, "step": 3390, "valid_targets_mean": 3945.5, "valid_targets_min": 1216 }, { "epoch": 6.073410922112802, "grad_norm": 0.669659070570112, "learning_rate": 2.1063363046491813e-06, "loss": 0.2429, "loss_nan_ranks": 0, "loss_rank_avg": 0.11727896332740784, "step": 3395, "valid_targets_mean": 3985.1, "valid_targets_min": 1442 }, { "epoch": 6.082363473589973, "grad_norm": 0.7079044777647083, "learning_rate": 2.0666578312803942e-06, "loss": 0.2502, "loss_nan_ranks": 0, "loss_rank_avg": 0.11680565029382706, "step": 3400, "valid_targets_mean": 3181.2, "valid_targets_min": 1560 }, { "epoch": 6.091316025067144, "grad_norm": 0.7267778237592878, "learning_rate": 2.0273362757207726e-06, "loss": 0.2538, "loss_nan_ranks": 0, "loss_rank_avg": 0.1440717875957489, "step": 3405, "valid_targets_mean": 3801.5, "valid_targets_min": 788 }, { "epoch": 6.100268576544315, "grad_norm": 0.6851230389909834, "learning_rate": 1.988372420566416e-06, "loss": 0.2486, "loss_nan_ranks": 0, "loss_rank_avg": 0.10894258320331573, "step": 3410, "valid_targets_mean": 3692.6, "valid_targets_min": 2252 }, { "epoch": 6.1092211280214865, "grad_norm": 0.723418442049336, "learning_rate": 1.9497670412942835e-06, "loss": 0.2573, "loss_nan_ranks": 0, "loss_rank_avg": 0.12403066456317902, "step": 3415, "valid_targets_mean": 2928.9, "valid_targets_min": 1355 }, { "epoch": 6.118173679498657, "grad_norm": 0.7207144614470365, "learning_rate": 1.9115209062467954e-06, "loss": 0.2526, "loss_nan_ranks": 0, "loss_rank_avg": 0.10563968867063522, "step": 3420, "valid_targets_mean": 3282.1, "valid_targets_min": 1383 }, { "epoch": 6.127126230975828, "grad_norm": 0.8346687848959415, "learning_rate": 1.8736347766165086e-06, "loss": 0.2662, "loss_nan_ranks": 0, "loss_rank_avg": 0.11731438338756561, "step": 3425, "valid_targets_mean": 2362.8, "valid_targets_min": 1038 }, { "epoch": 6.136078782452999, "grad_norm": 0.636727979042535, "learning_rate": 1.8361094064309993e-06, "loss": 0.2438, "loss_nan_ranks": 0, "loss_rank_avg": 0.14710702002048492, "step": 3430, "valid_targets_mean": 4899.9, "valid_targets_min": 2263 }, { "epoch": 6.14503133393017, "grad_norm": 0.7467477214038792, "learning_rate": 1.7989455425378266e-06, "loss": 0.274, "loss_nan_ranks": 0, "loss_rank_avg": 0.1593431681394577, "step": 3435, "valid_targets_mean": 4329.8, "valid_targets_min": 1444 }, { "epoch": 6.153983885407341, "grad_norm": 0.6264376858160309, "learning_rate": 1.7621439245896943e-06, "loss": 0.262, "loss_nan_ranks": 0, "loss_rank_avg": 0.18382921814918518, "step": 3440, "valid_targets_mean": 7472.1, "valid_targets_min": 1363 }, { "epoch": 6.162936436884512, "grad_norm": 0.7282562384461457, "learning_rate": 1.7257052850296996e-06, "loss": 0.2436, "loss_nan_ranks": 0, "loss_rank_avg": 0.14502188563346863, "step": 3445, "valid_targets_mean": 3724.5, "valid_targets_min": 1729 }, { "epoch": 6.171888988361683, "grad_norm": 0.7815809174043036, "learning_rate": 1.6896303490767829e-06, "loss": 0.2808, "loss_nan_ranks": 0, "loss_rank_avg": 0.11601326614618301, "step": 3450, "valid_targets_mean": 2493.1, "valid_targets_min": 1297 }, { "epoch": 6.180841539838854, "grad_norm": 0.6086355952564768, "learning_rate": 1.6539198347112884e-06, "loss": 0.2514, "loss_nan_ranks": 0, "loss_rank_avg": 0.11718467622995377, "step": 3455, "valid_targets_mean": 4018.1, "valid_targets_min": 1443 }, { "epoch": 6.189794091316025, "grad_norm": 0.9504972739313073, "learning_rate": 1.6185744526606706e-06, "loss": 0.2624, "loss_nan_ranks": 0, "loss_rank_avg": 0.09783005714416504, "step": 3460, "valid_targets_mean": 3889.9, "valid_targets_min": 1889 }, { "epoch": 6.198746642793196, "grad_norm": 0.724465952354465, "learning_rate": 1.583594906385335e-06, "loss": 0.2535, "loss_nan_ranks": 0, "loss_rank_avg": 0.1024479940533638, "step": 3465, "valid_targets_mean": 2325.9, "valid_targets_min": 1076 }, { "epoch": 6.207699194270367, "grad_norm": 0.6451374857999173, "learning_rate": 1.548981892064665e-06, "loss": 0.262, "loss_nan_ranks": 0, "loss_rank_avg": 0.07624150067567825, "step": 3470, "valid_targets_mean": 2470.6, "valid_targets_min": 1121 }, { "epoch": 6.216651745747538, "grad_norm": 0.5455560588187984, "learning_rate": 1.5147360985831516e-06, "loss": 0.2606, "loss_nan_ranks": 0, "loss_rank_avg": 0.09515611827373505, "step": 3475, "valid_targets_mean": 4178.1, "valid_targets_min": 1288 }, { "epoch": 6.225604297224709, "grad_norm": 0.816357841000134, "learning_rate": 1.4808582075166778e-06, "loss": 0.2658, "loss_nan_ranks": 0, "loss_rank_avg": 0.09542781114578247, "step": 3480, "valid_targets_mean": 2079.2, "valid_targets_min": 1162 }, { "epoch": 6.23455684870188, "grad_norm": 0.81830346676513, "learning_rate": 1.447348893118965e-06, "loss": 0.2536, "loss_nan_ranks": 0, "loss_rank_avg": 0.12241758406162262, "step": 3485, "valid_targets_mean": 2740.4, "valid_targets_min": 1158 }, { "epoch": 6.243509400179051, "grad_norm": 0.762453707084996, "learning_rate": 1.4142088223081408e-06, "loss": 0.2588, "loss_nan_ranks": 0, "loss_rank_avg": 0.10295930504798889, "step": 3490, "valid_targets_mean": 2399.1, "valid_targets_min": 1530 }, { "epoch": 6.252461951656222, "grad_norm": 0.7034908425844338, "learning_rate": 1.3814386546534864e-06, "loss": 0.2926, "loss_nan_ranks": 0, "loss_rank_avg": 0.15138891339302063, "step": 3495, "valid_targets_mean": 3894.6, "valid_targets_min": 876 }, { "epoch": 6.261414503133393, "grad_norm": 0.4626175053772806, "learning_rate": 1.3490390423622856e-06, "loss": 0.2617, "loss_nan_ranks": 0, "loss_rank_avg": 0.0836140513420105, "step": 3500, "valid_targets_mean": 3548.6, "valid_targets_min": 1162 }, { "epoch": 6.270367054610564, "grad_norm": 0.7895264365296455, "learning_rate": 1.3170106302668616e-06, "loss": 0.2594, "loss_nan_ranks": 0, "loss_rank_avg": 0.11527480185031891, "step": 3505, "valid_targets_mean": 3602.1, "valid_targets_min": 1366 }, { "epoch": 6.279319606087735, "grad_norm": 0.8147171086824726, "learning_rate": 1.2853540558117272e-06, "loss": 0.2762, "loss_nan_ranks": 0, "loss_rank_avg": 0.15035514533519745, "step": 3510, "valid_targets_mean": 5440.1, "valid_targets_min": 1958 }, { "epoch": 6.288272157564906, "grad_norm": 0.7116251172852573, "learning_rate": 1.254069949040917e-06, "loss": 0.2752, "loss_nan_ranks": 0, "loss_rank_avg": 0.11078624427318573, "step": 3515, "valid_targets_mean": 3214.0, "valid_targets_min": 854 }, { "epoch": 6.2972247090420765, "grad_norm": 0.7297254614713066, "learning_rate": 1.2231589325854354e-06, "loss": 0.2498, "loss_nan_ranks": 0, "loss_rank_avg": 0.11363118886947632, "step": 3520, "valid_targets_mean": 2799.8, "valid_targets_min": 939 }, { "epoch": 6.306177260519248, "grad_norm": 0.6596134416441236, "learning_rate": 1.1926216216508735e-06, "loss": 0.258, "loss_nan_ranks": 0, "loss_rank_avg": 0.08517421782016754, "step": 3525, "valid_targets_mean": 2873.4, "valid_targets_min": 1744 }, { "epoch": 6.315129811996419, "grad_norm": 0.69883908604293, "learning_rate": 1.162458624005145e-06, "loss": 0.2499, "loss_nan_ranks": 0, "loss_rank_avg": 0.12335070222616196, "step": 3530, "valid_targets_mean": 3635.4, "valid_targets_min": 1704 }, { "epoch": 6.32408236347359, "grad_norm": 0.6847726574413945, "learning_rate": 1.1326705399664207e-06, "loss": 0.2588, "loss_nan_ranks": 0, "loss_rank_avg": 0.09604361653327942, "step": 3535, "valid_targets_mean": 2974.9, "valid_targets_min": 1474 }, { "epoch": 6.333034914950761, "grad_norm": 0.6519594989356231, "learning_rate": 1.103257962391151e-06, "loss": 0.2329, "loss_nan_ranks": 0, "loss_rank_avg": 0.12078134715557098, "step": 3540, "valid_targets_mean": 4011.9, "valid_targets_min": 1443 }, { "epoch": 6.341987466427932, "grad_norm": 0.5937147175773294, "learning_rate": 1.0742214766622938e-06, "loss": 0.2651, "loss_nan_ranks": 0, "loss_rank_avg": 0.08249370008707047, "step": 3545, "valid_targets_mean": 3290.8, "valid_targets_min": 935 }, { "epoch": 6.350940017905103, "grad_norm": 0.7381445050429146, "learning_rate": 1.0455616606776363e-06, "loss": 0.2779, "loss_nan_ranks": 0, "loss_rank_avg": 0.13618944585323334, "step": 3550, "valid_targets_mean": 3257.4, "valid_targets_min": 1219 }, { "epoch": 6.359892569382274, "grad_norm": 0.700522577996905, "learning_rate": 1.0172790848383141e-06, "loss": 0.266, "loss_nan_ranks": 0, "loss_rank_avg": 0.1201668530702591, "step": 3555, "valid_targets_mean": 4017.9, "valid_targets_min": 1709 }, { "epoch": 6.3688451208594445, "grad_norm": 0.8464430462952892, "learning_rate": 9.893743120374543e-07, "loss": 0.2676, "loss_nan_ranks": 0, "loss_rank_avg": 0.13719336688518524, "step": 3560, "valid_targets_mean": 2657.0, "valid_targets_min": 1553 }, { "epoch": 6.377797672336616, "grad_norm": 0.6417224127363806, "learning_rate": 9.618478976489709e-07, "loss": 0.2467, "loss_nan_ranks": 0, "loss_rank_avg": 0.10005088150501251, "step": 3565, "valid_targets_mean": 3522.0, "valid_targets_min": 1346 }, { "epoch": 6.386750223813787, "grad_norm": 0.8450055799005987, "learning_rate": 9.347003895165052e-07, "loss": 0.2432, "loss_nan_ranks": 0, "loss_rank_avg": 0.12907400727272034, "step": 3570, "valid_targets_mean": 2274.2, "valid_targets_min": 871 }, { "epoch": 6.395702775290958, "grad_norm": 0.718865189721249, "learning_rate": 9.079323279425245e-07, "loss": 0.2729, "loss_nan_ranks": 0, "loss_rank_avg": 0.15633174777030945, "step": 3575, "valid_targets_mean": 3628.4, "valid_targets_min": 1727 }, { "epoch": 6.404655326768129, "grad_norm": 0.6318602168953558, "learning_rate": 8.815442456775835e-07, "loss": 0.2485, "loss_nan_ranks": 0, "loss_rank_avg": 0.0951131284236908, "step": 3580, "valid_targets_mean": 3976.5, "valid_targets_min": 1513 }, { "epoch": 6.4136078782453, "grad_norm": 0.6896320314558233, "learning_rate": 8.555366679097043e-07, "loss": 0.2468, "loss_nan_ranks": 0, "loss_rank_avg": 0.10344749689102173, "step": 3585, "valid_targets_mean": 2882.4, "valid_targets_min": 1102 }, { "epoch": 6.422560429722471, "grad_norm": 0.5944068667542841, "learning_rate": 8.29910112253931e-07, "loss": 0.2509, "loss_nan_ranks": 0, "loss_rank_avg": 0.12075631320476532, "step": 3590, "valid_targets_mean": 5318.9, "valid_targets_min": 1346 }, { "epoch": 6.431512981199642, "grad_norm": 0.7009103872992966, "learning_rate": 8.046650887420227e-07, "loss": 0.2539, "loss_nan_ranks": 0, "loss_rank_avg": 0.16663353145122528, "step": 3595, "valid_targets_mean": 4816.9, "valid_targets_min": 1604 }, { "epoch": 6.4404655326768125, "grad_norm": 0.6102090137908595, "learning_rate": 7.798020998123101e-07, "loss": 0.2287, "loss_nan_ranks": 0, "loss_rank_avg": 0.09184370934963226, "step": 3600, "valid_targets_mean": 3440.4, "valid_targets_min": 1266 }, { "epoch": 6.449418084153984, "grad_norm": 0.7312966151837536, "learning_rate": 7.55321640299691e-07, "loss": 0.2707, "loss_nan_ranks": 0, "loss_rank_avg": 0.1317036747932434, "step": 3605, "valid_targets_mean": 3115.0, "valid_targets_min": 955 }, { "epoch": 6.458370635631155, "grad_norm": 0.6431639047809755, "learning_rate": 7.312241974257861e-07, "loss": 0.258, "loss_nan_ranks": 0, "loss_rank_avg": 0.11406281590461731, "step": 3610, "valid_targets_mean": 4320.2, "valid_targets_min": 1317 }, { "epoch": 6.467323187108326, "grad_norm": 0.7636759815012041, "learning_rate": 7.075102507892295e-07, "loss": 0.2344, "loss_nan_ranks": 0, "loss_rank_avg": 0.10190820693969727, "step": 3615, "valid_targets_mean": 2279.1, "valid_targets_min": 1466 }, { "epoch": 6.476275738585497, "grad_norm": 0.8129538828808625, "learning_rate": 6.841802723561408e-07, "loss": 0.2441, "loss_nan_ranks": 0, "loss_rank_avg": 0.11288426071405411, "step": 3620, "valid_targets_mean": 2167.2, "valid_targets_min": 1163 }, { "epoch": 6.485228290062668, "grad_norm": 0.5596904145823007, "learning_rate": 6.612347264507257e-07, "loss": 0.2435, "loss_nan_ranks": 0, "loss_rank_avg": 0.10565987974405289, "step": 3625, "valid_targets_mean": 5062.5, "valid_targets_min": 1552 }, { "epoch": 6.494180841539839, "grad_norm": 0.5924035256383883, "learning_rate": 6.386740697460281e-07, "loss": 0.2756, "loss_nan_ranks": 0, "loss_rank_avg": 0.1311139017343521, "step": 3630, "valid_targets_mean": 5557.9, "valid_targets_min": 295 }, { "epoch": 6.50313339301701, "grad_norm": 0.7289701592713733, "learning_rate": 6.164987512548415e-07, "loss": 0.2647, "loss_nan_ranks": 0, "loss_rank_avg": 0.15614090859889984, "step": 3635, "valid_targets_mean": 3911.8, "valid_targets_min": 1792 }, { "epoch": 6.5120859444941805, "grad_norm": 0.5887989220028383, "learning_rate": 5.947092123207854e-07, "loss": 0.237, "loss_nan_ranks": 0, "loss_rank_avg": 0.12084167450666428, "step": 3640, "valid_targets_mean": 4592.4, "valid_targets_min": 2004 }, { "epoch": 6.521038495971352, "grad_norm": 0.866493744978262, "learning_rate": 5.733058866095143e-07, "loss": 0.2459, "loss_nan_ranks": 0, "loss_rank_avg": 0.15592843294143677, "step": 3645, "valid_targets_mean": 2719.5, "valid_targets_min": 832 }, { "epoch": 6.529991047448523, "grad_norm": 0.6686036394371799, "learning_rate": 5.522892001000801e-07, "loss": 0.2405, "loss_nan_ranks": 0, "loss_rank_avg": 0.1646374613046646, "step": 3650, "valid_targets_mean": 4997.0, "valid_targets_min": 1410 }, { "epoch": 6.538943598925694, "grad_norm": 0.5839134082394074, "learning_rate": 5.316595710764594e-07, "loss": 0.2834, "loss_nan_ranks": 0, "loss_rank_avg": 0.193353071808815, "step": 3655, "valid_targets_mean": 6390.2, "valid_targets_min": 728 }, { "epoch": 6.547896150402865, "grad_norm": 0.5616135043250162, "learning_rate": 5.114174101192282e-07, "loss": 0.27, "loss_nan_ranks": 0, "loss_rank_avg": 0.14416781067848206, "step": 3660, "valid_targets_mean": 6041.5, "valid_targets_min": 1649 }, { "epoch": 6.556848701880035, "grad_norm": 0.7640989189195657, "learning_rate": 4.915631200973958e-07, "loss": 0.2373, "loss_nan_ranks": 0, "loss_rank_avg": 0.13019560277462006, "step": 3665, "valid_targets_mean": 3621.5, "valid_targets_min": 1080 }, { "epoch": 6.565801253357207, "grad_norm": 0.6726753158457589, "learning_rate": 4.7209709616038214e-07, "loss": 0.2545, "loss_nan_ranks": 0, "loss_rank_avg": 0.15556487441062927, "step": 3670, "valid_targets_mean": 4878.2, "valid_targets_min": 1111 }, { "epoch": 6.574753804834378, "grad_norm": 0.7209662902786135, "learning_rate": 4.5301972573014163e-07, "loss": 0.2411, "loss_nan_ranks": 0, "loss_rank_avg": 0.11224491894245148, "step": 3675, "valid_targets_mean": 2792.8, "valid_targets_min": 1572 }, { "epoch": 6.5837063563115485, "grad_norm": 0.7821872619160591, "learning_rate": 4.3433138849347854e-07, "loss": 0.2571, "loss_nan_ranks": 0, "loss_rank_avg": 0.091234490275383, "step": 3680, "valid_targets_mean": 1755.8, "valid_targets_min": 1107 }, { "epoch": 6.59265890778872, "grad_norm": 0.7028208056439585, "learning_rate": 4.1603245639446845e-07, "loss": 0.2597, "loss_nan_ranks": 0, "loss_rank_avg": 0.13173747062683105, "step": 3685, "valid_targets_mean": 4195.1, "valid_targets_min": 1660 }, { "epoch": 6.601611459265891, "grad_norm": 0.6866687362574865, "learning_rate": 3.981232936270596e-07, "loss": 0.2561, "loss_nan_ranks": 0, "loss_rank_avg": 0.14300760626792908, "step": 3690, "valid_targets_mean": 4124.4, "valid_targets_min": 1608 }, { "epoch": 6.610564010743062, "grad_norm": 0.7201161780473606, "learning_rate": 3.806042566278345e-07, "loss": 0.2454, "loss_nan_ranks": 0, "loss_rank_avg": 0.09710663557052612, "step": 3695, "valid_targets_mean": 2816.4, "valid_targets_min": 1473 }, { "epoch": 6.619516562220233, "grad_norm": 0.7227544704360982, "learning_rate": 3.6347569406890213e-07, "loss": 0.2606, "loss_nan_ranks": 0, "loss_rank_avg": 0.13512368500232697, "step": 3700, "valid_targets_mean": 3177.6, "valid_targets_min": 1742 }, { "epoch": 6.628469113697403, "grad_norm": 0.7298426483697191, "learning_rate": 3.467379468509746e-07, "loss": 0.2636, "loss_nan_ranks": 0, "loss_rank_avg": 0.16440506279468536, "step": 3705, "valid_targets_mean": 3989.5, "valid_targets_min": 482 }, { "epoch": 6.637421665174575, "grad_norm": 0.6520707507301194, "learning_rate": 3.3039134809656594e-07, "loss": 0.2387, "loss_nan_ranks": 0, "loss_rank_avg": 0.09945560991764069, "step": 3710, "valid_targets_mean": 3097.5, "valid_targets_min": 1278 }, { "epoch": 6.646374216651746, "grad_norm": 0.7574937610571322, "learning_rate": 3.144362231433706e-07, "loss": 0.2687, "loss_nan_ranks": 0, "loss_rank_avg": 0.15985745191574097, "step": 3715, "valid_targets_mean": 4052.4, "valid_targets_min": 1452 }, { "epoch": 6.6553267681289165, "grad_norm": 0.6807781785735898, "learning_rate": 2.9887288953778903e-07, "loss": 0.2498, "loss_nan_ranks": 0, "loss_rank_avg": 0.12004221230745316, "step": 3720, "valid_targets_mean": 3874.6, "valid_targets_min": 1429 }, { "epoch": 6.664279319606088, "grad_norm": 0.7422840275979297, "learning_rate": 2.8370165702860553e-07, "loss": 0.2733, "loss_nan_ranks": 0, "loss_rank_avg": 0.16807028651237488, "step": 3725, "valid_targets_mean": 3694.1, "valid_targets_min": 1465 }, { "epoch": 6.673231871083258, "grad_norm": 0.7450098153423828, "learning_rate": 2.6892282756082246e-07, "loss": 0.2559, "loss_nan_ranks": 0, "loss_rank_avg": 0.11174918711185455, "step": 3730, "valid_targets_mean": 3676.8, "valid_targets_min": 1557 }, { "epoch": 6.68218442256043, "grad_norm": 0.7111965111121455, "learning_rate": 2.545366952696582e-07, "loss": 0.2437, "loss_nan_ranks": 0, "loss_rank_avg": 0.10589167475700378, "step": 3735, "valid_targets_mean": 3334.2, "valid_targets_min": 1023 }, { "epoch": 6.691136974037601, "grad_norm": 0.6293266970949545, "learning_rate": 2.405435464746786e-07, "loss": 0.2496, "loss_nan_ranks": 0, "loss_rank_avg": 0.14255636930465698, "step": 3740, "valid_targets_mean": 4811.6, "valid_targets_min": 1805 }, { "epoch": 6.700089525514771, "grad_norm": 0.6652721706334741, "learning_rate": 2.2694365967411258e-07, "loss": 0.2536, "loss_nan_ranks": 0, "loss_rank_avg": 0.14178217947483063, "step": 3745, "valid_targets_mean": 4991.2, "valid_targets_min": 1887 }, { "epoch": 6.709042076991943, "grad_norm": 0.7681480091833459, "learning_rate": 2.137373055393055e-07, "loss": 0.2557, "loss_nan_ranks": 0, "loss_rank_avg": 0.1362355649471283, "step": 3750, "valid_targets_mean": 3588.9, "valid_targets_min": 1403 }, { "epoch": 6.717994628469114, "grad_norm": 0.7191832014484213, "learning_rate": 2.009247469093234e-07, "loss": 0.2476, "loss_nan_ranks": 0, "loss_rank_avg": 0.16261494159698486, "step": 3755, "valid_targets_mean": 4700.6, "valid_targets_min": 1921 }, { "epoch": 6.7269471799462845, "grad_norm": 0.6889617601852991, "learning_rate": 1.8850623878573505e-07, "loss": 0.2528, "loss_nan_ranks": 0, "loss_rank_avg": 0.19672788679599762, "step": 3760, "valid_targets_mean": 4380.6, "valid_targets_min": 1376 }, { "epoch": 6.735899731423456, "grad_norm": 0.5481225860807925, "learning_rate": 1.7648202832752924e-07, "loss": 0.2842, "loss_nan_ranks": 0, "loss_rank_avg": 0.30157795548439026, "step": 3765, "valid_targets_mean": 7732.9, "valid_targets_min": 1137 }, { "epoch": 6.744852282900626, "grad_norm": 0.710685504394315, "learning_rate": 1.6485235484619665e-07, "loss": 0.2569, "loss_nan_ranks": 0, "loss_rank_avg": 0.12485798448324203, "step": 3770, "valid_targets_mean": 2765.8, "valid_targets_min": 1182 }, { "epoch": 6.753804834377798, "grad_norm": 0.689831853046377, "learning_rate": 1.5361744980096905e-07, "loss": 0.2755, "loss_nan_ranks": 0, "loss_rank_avg": 0.10303008556365967, "step": 3775, "valid_targets_mean": 3598.8, "valid_targets_min": 1571 }, { "epoch": 6.762757385854969, "grad_norm": 0.7124881086751207, "learning_rate": 1.427775367942097e-07, "loss": 0.2682, "loss_nan_ranks": 0, "loss_rank_avg": 0.1335175335407257, "step": 3780, "valid_targets_mean": 3160.1, "valid_targets_min": 1357 }, { "epoch": 6.771709937332139, "grad_norm": 0.6559820335978044, "learning_rate": 1.3233283156696142e-07, "loss": 0.2566, "loss_nan_ranks": 0, "loss_rank_avg": 0.1501990109682083, "step": 3785, "valid_targets_mean": 4496.8, "valid_targets_min": 1821 }, { "epoch": 6.780662488809311, "grad_norm": 0.5956093434224163, "learning_rate": 1.222835419946633e-07, "loss": 0.2617, "loss_nan_ranks": 0, "loss_rank_avg": 0.09017609059810638, "step": 3790, "valid_targets_mean": 3518.2, "valid_targets_min": 858 }, { "epoch": 6.789615040286481, "grad_norm": 0.5830036783313224, "learning_rate": 1.1262986808300291e-07, "loss": 0.2376, "loss_nan_ranks": 0, "loss_rank_avg": 0.10115193575620651, "step": 3795, "valid_targets_mean": 5107.1, "valid_targets_min": 1177 }, { "epoch": 6.7985675917636526, "grad_norm": 0.7584116947768964, "learning_rate": 1.0337200196393505e-07, "loss": 0.2609, "loss_nan_ranks": 0, "loss_rank_avg": 0.1397339403629303, "step": 3800, "valid_targets_mean": 3640.5, "valid_targets_min": 1659 }, { "epoch": 6.807520143240824, "grad_norm": 0.6528866226497931, "learning_rate": 9.451012789186476e-08, "loss": 0.2583, "loss_nan_ranks": 0, "loss_rank_avg": 0.10747568309307098, "step": 3805, "valid_targets_mean": 3717.6, "valid_targets_min": 1563 }, { "epoch": 6.816472694717994, "grad_norm": 0.790754630686848, "learning_rate": 8.604442223998144e-08, "loss": 0.2556, "loss_nan_ranks": 0, "loss_rank_avg": 0.1327494978904724, "step": 3810, "valid_targets_mean": 3487.0, "valid_targets_min": 1412 }, { "epoch": 6.825425246195166, "grad_norm": 0.6658217086863656, "learning_rate": 7.797505349673496e-08, "loss": 0.2525, "loss_nan_ranks": 0, "loss_rank_avg": 0.11113050580024719, "step": 3815, "valid_targets_mean": 3609.1, "valid_targets_min": 1262 }, { "epoch": 6.834377797672337, "grad_norm": 0.7049353307220068, "learning_rate": 7.030218226250051e-08, "loss": 0.2599, "loss_nan_ranks": 0, "loss_rank_avg": 0.10403628647327423, "step": 3820, "valid_targets_mean": 3243.0, "valid_targets_min": 1126 }, { "epoch": 6.843330349149507, "grad_norm": 0.5860588029996026, "learning_rate": 6.302596124636573e-08, "loss": 0.268, "loss_nan_ranks": 0, "loss_rank_avg": 0.1433483511209488, "step": 3825, "valid_targets_mean": 4925.4, "valid_targets_min": 2027 }, { "epoch": 6.852282900626679, "grad_norm": 0.7879325522414711, "learning_rate": 5.6146535263106314e-08, "loss": 0.2523, "loss_nan_ranks": 0, "loss_rank_avg": 0.1332634687423706, "step": 3830, "valid_targets_mean": 2959.4, "valid_targets_min": 1468 }, { "epoch": 6.861235452103849, "grad_norm": 0.8092109840762858, "learning_rate": 4.966404123029289e-08, "loss": 0.2761, "loss_nan_ranks": 0, "loss_rank_avg": 0.11193729937076569, "step": 3835, "valid_targets_mean": 2531.8, "valid_targets_min": 1080 }, { "epoch": 6.8701880035810206, "grad_norm": 0.5253238898739874, "learning_rate": 4.357860816557091e-08, "loss": 0.2474, "loss_nan_ranks": 0, "loss_rank_avg": 0.09079030156135559, "step": 3840, "valid_targets_mean": 5008.1, "valid_targets_min": 1724 }, { "epoch": 6.879140555058192, "grad_norm": 0.6837265207779236, "learning_rate": 3.789035718408718e-08, "loss": 0.2376, "loss_nan_ranks": 0, "loss_rank_avg": 0.1591939926147461, "step": 3845, "valid_targets_mean": 4355.1, "valid_targets_min": 1326 }, { "epoch": 6.888093106535362, "grad_norm": 0.6377651911445792, "learning_rate": 3.259940149609175e-08, "loss": 0.2596, "loss_nan_ranks": 0, "loss_rank_avg": 0.1554187387228012, "step": 3850, "valid_targets_mean": 4470.0, "valid_targets_min": 1377 }, { "epoch": 6.897045658012534, "grad_norm": 0.6876946100735892, "learning_rate": 2.7705846404670888e-08, "loss": 0.2511, "loss_nan_ranks": 0, "loss_rank_avg": 0.10332445800304413, "step": 3855, "valid_targets_mean": 2918.2, "valid_targets_min": 1389 }, { "epoch": 6.905998209489704, "grad_norm": 0.6433560412596225, "learning_rate": 2.3209789303657582e-08, "loss": 0.2769, "loss_nan_ranks": 0, "loss_rank_avg": 0.1013648509979248, "step": 3860, "valid_targets_mean": 3309.1, "valid_targets_min": 1396 }, { "epoch": 6.914950760966875, "grad_norm": 0.6004214021548672, "learning_rate": 1.9111319675699792e-08, "loss": 0.2485, "loss_nan_ranks": 0, "loss_rank_avg": 0.10128806531429291, "step": 3865, "valid_targets_mean": 3911.9, "valid_targets_min": 1753 }, { "epoch": 6.923903312444047, "grad_norm": 0.6818541228429529, "learning_rate": 1.5410519090461872e-08, "loss": 0.2567, "loss_nan_ranks": 0, "loss_rank_avg": 0.10375615209341049, "step": 3870, "valid_targets_mean": 2862.6, "valid_targets_min": 1050 }, { "epoch": 6.932855863921217, "grad_norm": 0.9019330979790738, "learning_rate": 1.210746120302142e-08, "loss": 0.2735, "loss_nan_ranks": 0, "loss_rank_avg": 0.14588722586631775, "step": 3875, "valid_targets_mean": 3001.8, "valid_targets_min": 710 }, { "epoch": 6.9418084153983886, "grad_norm": 0.6213345710457211, "learning_rate": 9.202211752386003e-09, "loss": 0.244, "loss_nan_ranks": 0, "loss_rank_avg": 0.10529154539108276, "step": 3880, "valid_targets_mean": 3572.5, "valid_targets_min": 1550 }, { "epoch": 6.95076096687556, "grad_norm": 0.8144722091986042, "learning_rate": 6.694828560200872e-09, "loss": 0.2721, "loss_nan_ranks": 0, "loss_rank_avg": 0.12102942913770676, "step": 3885, "valid_targets_mean": 2542.0, "valid_targets_min": 977 }, { "epoch": 6.95971351835273, "grad_norm": 0.6060836910004495, "learning_rate": 4.585361529581001e-09, "loss": 0.2725, "loss_nan_ranks": 0, "loss_rank_avg": 0.10048162937164307, "step": 3890, "valid_targets_mean": 3793.5, "valid_targets_min": 1837 }, { "epoch": 6.968666069829902, "grad_norm": 0.6612027073540584, "learning_rate": 2.87385264413631e-09, "loss": 0.2799, "loss_nan_ranks": 0, "loss_rank_avg": 0.09530146420001984, "step": 3895, "valid_targets_mean": 3492.0, "valid_targets_min": 1252 }, { "epoch": 6.977618621307073, "grad_norm": 0.6346262077642075, "learning_rate": 1.560335967114579e-09, "loss": 0.2443, "loss_nan_ranks": 0, "loss_rank_avg": 0.10467442870140076, "step": 3900, "valid_targets_mean": 3068.6, "valid_targets_min": 1651 }, { "epoch": 6.9865711727842434, "grad_norm": 0.7723757881455082, "learning_rate": 6.4483764074863e-10, "loss": 0.2471, "loss_nan_ranks": 0, "loss_rank_avg": 0.08849972486495972, "step": 3905, "valid_targets_mean": 2084.8, "valid_targets_min": 829 }, { "epoch": 6.995523724261415, "grad_norm": 0.5277717756862081, "learning_rate": 1.273758857145424e-10, "loss": 0.2542, "loss_nan_ranks": 0, "loss_rank_avg": 0.13350322842597961, "step": 3910, "valid_targets_mean": 4850.9, "valid_targets_min": 863 }, { "epoch": 7.0, "loss_nan_ranks": 0, "loss_rank_avg": 0.25713130831718445, "step": 3913, "total_flos": 1.082631006881579e+18, "train_loss": 0.32484868789553917, "train_runtime": 42725.2777, "train_samples_per_second": 1.463, "train_steps_per_second": 0.092, "valid_targets_mean": 3542.5, "valid_targets_min": 1547 } ], "logging_steps": 5, "max_steps": 3913, "num_input_tokens_seen": 0, "num_train_epochs": 7, "save_steps": 1500, "stateful_callbacks": { "TrainerControl": { "args": { "should_epoch_stop": false, "should_evaluate": false, "should_log": false, "should_save": true, "should_training_stop": true }, "attributes": {} } }, "total_flos": 1.082631006881579e+18, "train_batch_size": 1, "trial_name": null, "trial_params": null }