{ "best_global_step": null, "best_metric": null, "best_model_checkpoint": null, "epoch": 7.0, "eval_steps": 500, "global_step": 4417, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.00792393026941363, "grad_norm": 18.30795544148065, "learning_rate": 3.619909502262444e-07, "loss": 0.9909, "loss_nan_ranks": 0, "loss_rank_avg": 1.0027930736541748, "step": 5, "valid_targets_mean": 3096.8, "valid_targets_min": 1275 }, { "epoch": 0.01584786053882726, "grad_norm": 17.799072817552403, "learning_rate": 8.144796380090498e-07, "loss": 0.9684, "loss_nan_ranks": 0, "loss_rank_avg": 1.0059874057769775, "step": 10, "valid_targets_mean": 2921.6, "valid_targets_min": 959 }, { "epoch": 0.02377179080824089, "grad_norm": 18.446857759452225, "learning_rate": 1.2669683257918552e-06, "loss": 0.928, "loss_nan_ranks": 0, "loss_rank_avg": 0.9721807241439819, "step": 15, "valid_targets_mean": 3334.1, "valid_targets_min": 1196 }, { "epoch": 0.03169572107765452, "grad_norm": 13.528514126701259, "learning_rate": 1.7194570135746609e-06, "loss": 0.9344, "loss_nan_ranks": 0, "loss_rank_avg": 0.8746083974838257, "step": 20, "valid_targets_mean": 3560.9, "valid_targets_min": 1101 }, { "epoch": 0.039619651347068144, "grad_norm": 9.31391677104, "learning_rate": 2.171945701357466e-06, "loss": 0.896, "loss_nan_ranks": 0, "loss_rank_avg": 0.8563970327377319, "step": 25, "valid_targets_mean": 3255.4, "valid_targets_min": 1420 }, { "epoch": 0.04754358161648178, "grad_norm": 5.740949384443614, "learning_rate": 2.624434389140272e-06, "loss": 0.8017, "loss_nan_ranks": 0, "loss_rank_avg": 0.7667723894119263, "step": 30, "valid_targets_mean": 3685.8, "valid_targets_min": 1106 }, { "epoch": 0.0554675118858954, "grad_norm": 2.8043645950548908, "learning_rate": 3.0769230769230774e-06, "loss": 0.7712, "loss_nan_ranks": 0, "loss_rank_avg": 0.6531684994697571, "step": 35, "valid_targets_mean": 4291.8, "valid_targets_min": 1303 }, { "epoch": 0.06339144215530904, "grad_norm": 2.1470577969090754, "learning_rate": 3.529411764705883e-06, "loss": 0.7427, "loss_nan_ranks": 0, "loss_rank_avg": 0.7266800403594971, "step": 40, "valid_targets_mean": 2956.1, "valid_targets_min": 999 }, { "epoch": 0.07131537242472266, "grad_norm": 1.8591952619735816, "learning_rate": 3.9819004524886875e-06, "loss": 0.7016, "loss_nan_ranks": 0, "loss_rank_avg": 0.7177771329879761, "step": 45, "valid_targets_mean": 2703.8, "valid_targets_min": 1178 }, { "epoch": 0.07923930269413629, "grad_norm": 1.5113516568275136, "learning_rate": 4.434389140271493e-06, "loss": 0.697, "loss_nan_ranks": 0, "loss_rank_avg": 0.7023115158081055, "step": 50, "valid_targets_mean": 2789.7, "valid_targets_min": 1292 }, { "epoch": 0.08716323296354993, "grad_norm": 1.0994842020421405, "learning_rate": 4.886877828054299e-06, "loss": 0.6765, "loss_nan_ranks": 0, "loss_rank_avg": 0.6585033535957336, "step": 55, "valid_targets_mean": 3465.1, "valid_targets_min": 1032 }, { "epoch": 0.09508716323296355, "grad_norm": 1.9537311330380602, "learning_rate": 5.339366515837105e-06, "loss": 0.6928, "loss_nan_ranks": 0, "loss_rank_avg": 0.7655017375946045, "step": 60, "valid_targets_mean": 2952.2, "valid_targets_min": 932 }, { "epoch": 0.10301109350237718, "grad_norm": 0.9347844302177003, "learning_rate": 5.79185520361991e-06, "loss": 0.6466, "loss_nan_ranks": 0, "loss_rank_avg": 0.6798193454742432, "step": 65, "valid_targets_mean": 3296.2, "valid_targets_min": 558 }, { "epoch": 0.1109350237717908, "grad_norm": 0.820064187537382, "learning_rate": 6.244343891402716e-06, "loss": 0.6493, "loss_nan_ranks": 0, "loss_rank_avg": 0.6339085102081299, "step": 70, "valid_targets_mean": 3473.1, "valid_targets_min": 974 }, { "epoch": 0.11885895404120443, "grad_norm": 0.84149786444046, "learning_rate": 6.69683257918552e-06, "loss": 0.6203, "loss_nan_ranks": 0, "loss_rank_avg": 0.5971336960792542, "step": 75, "valid_targets_mean": 3043.6, "valid_targets_min": 1040 }, { "epoch": 0.12678288431061807, "grad_norm": 0.819875440430727, "learning_rate": 7.1493212669683265e-06, "loss": 0.6207, "loss_nan_ranks": 0, "loss_rank_avg": 0.5473138093948364, "step": 80, "valid_targets_mean": 3087.9, "valid_targets_min": 1250 }, { "epoch": 0.1347068145800317, "grad_norm": 0.937345203637578, "learning_rate": 7.601809954751131e-06, "loss": 0.6579, "loss_nan_ranks": 0, "loss_rank_avg": 0.7002801895141602, "step": 85, "valid_targets_mean": 2635.6, "valid_targets_min": 574 }, { "epoch": 0.14263074484944532, "grad_norm": 0.9146174502773798, "learning_rate": 8.054298642533938e-06, "loss": 0.62, "loss_nan_ranks": 0, "loss_rank_avg": 0.6000384092330933, "step": 90, "valid_targets_mean": 2494.1, "valid_targets_min": 737 }, { "epoch": 0.15055467511885895, "grad_norm": 0.9169686189770018, "learning_rate": 8.506787330316743e-06, "loss": 0.6039, "loss_nan_ranks": 0, "loss_rank_avg": 0.6068024039268494, "step": 95, "valid_targets_mean": 2555.5, "valid_targets_min": 1085 }, { "epoch": 0.15847860538827258, "grad_norm": 0.9320852712314595, "learning_rate": 8.95927601809955e-06, "loss": 0.6062, "loss_nan_ranks": 0, "loss_rank_avg": 0.614492654800415, "step": 100, "valid_targets_mean": 2322.4, "valid_targets_min": 923 }, { "epoch": 0.1664025356576862, "grad_norm": 0.7979632405521523, "learning_rate": 9.411764705882354e-06, "loss": 0.5937, "loss_nan_ranks": 0, "loss_rank_avg": 0.562329888343811, "step": 105, "valid_targets_mean": 3538.2, "valid_targets_min": 511 }, { "epoch": 0.17432646592709986, "grad_norm": 0.7797014261938441, "learning_rate": 9.86425339366516e-06, "loss": 0.5676, "loss_nan_ranks": 0, "loss_rank_avg": 0.5618658065795898, "step": 110, "valid_targets_mean": 3149.2, "valid_targets_min": 813 }, { "epoch": 0.18225039619651348, "grad_norm": 0.7701673082038006, "learning_rate": 1.0316742081447966e-05, "loss": 0.5769, "loss_nan_ranks": 0, "loss_rank_avg": 0.561303436756134, "step": 115, "valid_targets_mean": 2988.9, "valid_targets_min": 1007 }, { "epoch": 0.1901743264659271, "grad_norm": 0.7301022610624124, "learning_rate": 1.076923076923077e-05, "loss": 0.585, "loss_nan_ranks": 0, "loss_rank_avg": 0.5721402764320374, "step": 120, "valid_targets_mean": 3576.1, "valid_targets_min": 1733 }, { "epoch": 0.19809825673534073, "grad_norm": 0.8464639593444047, "learning_rate": 1.1221719457013576e-05, "loss": 0.5752, "loss_nan_ranks": 0, "loss_rank_avg": 0.6512378454208374, "step": 125, "valid_targets_mean": 3244.2, "valid_targets_min": 1307 }, { "epoch": 0.20602218700475436, "grad_norm": 0.7861472935507103, "learning_rate": 1.1674208144796382e-05, "loss": 0.5427, "loss_nan_ranks": 0, "loss_rank_avg": 0.5997300148010254, "step": 130, "valid_targets_mean": 3249.4, "valid_targets_min": 1552 }, { "epoch": 0.21394611727416799, "grad_norm": 0.6975163539631399, "learning_rate": 1.2126696832579185e-05, "loss": 0.5473, "loss_nan_ranks": 0, "loss_rank_avg": 0.5397928953170776, "step": 135, "valid_targets_mean": 3848.9, "valid_targets_min": 613 }, { "epoch": 0.2218700475435816, "grad_norm": 0.8396368977750472, "learning_rate": 1.2579185520361991e-05, "loss": 0.5497, "loss_nan_ranks": 0, "loss_rank_avg": 0.5377547740936279, "step": 140, "valid_targets_mean": 2616.2, "valid_targets_min": 1135 }, { "epoch": 0.22979397781299524, "grad_norm": 0.734689091691239, "learning_rate": 1.3031674208144797e-05, "loss": 0.5247, "loss_nan_ranks": 0, "loss_rank_avg": 0.5179744958877563, "step": 145, "valid_targets_mean": 3031.5, "valid_targets_min": 806 }, { "epoch": 0.23771790808240886, "grad_norm": 0.810545526512668, "learning_rate": 1.3484162895927604e-05, "loss": 0.5628, "loss_nan_ranks": 0, "loss_rank_avg": 0.5749671459197998, "step": 150, "valid_targets_mean": 2848.2, "valid_targets_min": 1117 }, { "epoch": 0.24564183835182252, "grad_norm": 0.7252435536596383, "learning_rate": 1.3936651583710408e-05, "loss": 0.5325, "loss_nan_ranks": 0, "loss_rank_avg": 0.4927237033843994, "step": 155, "valid_targets_mean": 3464.4, "valid_targets_min": 804 }, { "epoch": 0.25356576862123614, "grad_norm": 0.7835612232571453, "learning_rate": 1.4389140271493213e-05, "loss": 0.5614, "loss_nan_ranks": 0, "loss_rank_avg": 0.5875840783119202, "step": 160, "valid_targets_mean": 3134.0, "valid_targets_min": 1040 }, { "epoch": 0.26148969889064977, "grad_norm": 0.8037709330769847, "learning_rate": 1.484162895927602e-05, "loss": 0.555, "loss_nan_ranks": 0, "loss_rank_avg": 0.5322756171226501, "step": 165, "valid_targets_mean": 2802.3, "valid_targets_min": 1217 }, { "epoch": 0.2694136291600634, "grad_norm": 0.8508977275858737, "learning_rate": 1.5294117647058822e-05, "loss": 0.55, "loss_nan_ranks": 0, "loss_rank_avg": 0.5077811479568481, "step": 170, "valid_targets_mean": 3118.4, "valid_targets_min": 643 }, { "epoch": 0.277337559429477, "grad_norm": 0.7172097062555428, "learning_rate": 1.574660633484163e-05, "loss": 0.5179, "loss_nan_ranks": 0, "loss_rank_avg": 0.48911088705062866, "step": 175, "valid_targets_mean": 3719.6, "valid_targets_min": 1500 }, { "epoch": 0.28526148969889065, "grad_norm": 0.753428022374828, "learning_rate": 1.6199095022624435e-05, "loss": 0.4977, "loss_nan_ranks": 0, "loss_rank_avg": 0.5100698471069336, "step": 180, "valid_targets_mean": 3200.1, "valid_targets_min": 795 }, { "epoch": 0.2931854199683043, "grad_norm": 0.7186918449674007, "learning_rate": 1.6651583710407243e-05, "loss": 0.5391, "loss_nan_ranks": 0, "loss_rank_avg": 0.5387634038925171, "step": 185, "valid_targets_mean": 3925.0, "valid_targets_min": 1582 }, { "epoch": 0.3011093502377179, "grad_norm": 0.8467273342860667, "learning_rate": 1.7104072398190047e-05, "loss": 0.5302, "loss_nan_ranks": 0, "loss_rank_avg": 0.5354914665222168, "step": 190, "valid_targets_mean": 2833.6, "valid_targets_min": 976 }, { "epoch": 0.3090332805071315, "grad_norm": 0.8821480809910013, "learning_rate": 1.7556561085972852e-05, "loss": 0.5174, "loss_nan_ranks": 0, "loss_rank_avg": 0.5056538581848145, "step": 195, "valid_targets_mean": 2422.6, "valid_targets_min": 1091 }, { "epoch": 0.31695721077654515, "grad_norm": 0.7440887923285217, "learning_rate": 1.8009049773755657e-05, "loss": 0.5504, "loss_nan_ranks": 0, "loss_rank_avg": 0.5461665391921997, "step": 200, "valid_targets_mean": 3475.5, "valid_targets_min": 953 }, { "epoch": 0.3248811410459588, "grad_norm": 0.8495808389526411, "learning_rate": 1.8461538461538465e-05, "loss": 0.5109, "loss_nan_ranks": 0, "loss_rank_avg": 0.4988098740577698, "step": 205, "valid_targets_mean": 2842.1, "valid_targets_min": 948 }, { "epoch": 0.3328050713153724, "grad_norm": 0.8073270397360635, "learning_rate": 1.891402714932127e-05, "loss": 0.5039, "loss_nan_ranks": 0, "loss_rank_avg": 0.5106959342956543, "step": 210, "valid_targets_mean": 3173.0, "valid_targets_min": 1091 }, { "epoch": 0.34072900158478603, "grad_norm": 0.8240792568108604, "learning_rate": 1.9366515837104074e-05, "loss": 0.504, "loss_nan_ranks": 0, "loss_rank_avg": 0.5431502461433411, "step": 215, "valid_targets_mean": 2898.2, "valid_targets_min": 605 }, { "epoch": 0.3486529318541997, "grad_norm": 0.8295014877374133, "learning_rate": 1.981900452488688e-05, "loss": 0.5304, "loss_nan_ranks": 0, "loss_rank_avg": 0.5582056045532227, "step": 220, "valid_targets_mean": 2875.2, "valid_targets_min": 1271 }, { "epoch": 0.35657686212361334, "grad_norm": 2.271995482651572, "learning_rate": 2.0271493212669683e-05, "loss": 0.5235, "loss_nan_ranks": 0, "loss_rank_avg": 0.538544774055481, "step": 225, "valid_targets_mean": 2641.7, "valid_targets_min": 959 }, { "epoch": 0.36450079239302696, "grad_norm": 0.8237389594967636, "learning_rate": 2.072398190045249e-05, "loss": 0.5407, "loss_nan_ranks": 0, "loss_rank_avg": 0.5350701808929443, "step": 230, "valid_targets_mean": 3219.0, "valid_targets_min": 1486 }, { "epoch": 0.3724247226624406, "grad_norm": 0.7959671331295798, "learning_rate": 2.1176470588235296e-05, "loss": 0.5032, "loss_nan_ranks": 0, "loss_rank_avg": 0.5149205923080444, "step": 235, "valid_targets_mean": 2917.6, "valid_targets_min": 1040 }, { "epoch": 0.3803486529318542, "grad_norm": 0.7671263696227919, "learning_rate": 2.16289592760181e-05, "loss": 0.5213, "loss_nan_ranks": 0, "loss_rank_avg": 0.541510283946991, "step": 240, "valid_targets_mean": 3337.9, "valid_targets_min": 1126 }, { "epoch": 0.38827258320126784, "grad_norm": 0.8241086669277788, "learning_rate": 2.2081447963800908e-05, "loss": 0.5073, "loss_nan_ranks": 0, "loss_rank_avg": 0.49820655584335327, "step": 245, "valid_targets_mean": 3259.1, "valid_targets_min": 1129 }, { "epoch": 0.39619651347068147, "grad_norm": 0.8184305981195854, "learning_rate": 2.2533936651583713e-05, "loss": 0.5124, "loss_nan_ranks": 0, "loss_rank_avg": 0.5349119901657104, "step": 250, "valid_targets_mean": 3188.1, "valid_targets_min": 1113 }, { "epoch": 0.4041204437400951, "grad_norm": 0.7932024628401, "learning_rate": 2.2986425339366517e-05, "loss": 0.4913, "loss_nan_ranks": 0, "loss_rank_avg": 0.5034860372543335, "step": 255, "valid_targets_mean": 2739.3, "valid_targets_min": 1349 }, { "epoch": 0.4120443740095087, "grad_norm": 0.7551847650496477, "learning_rate": 2.3438914027149325e-05, "loss": 0.5018, "loss_nan_ranks": 0, "loss_rank_avg": 0.4922025203704834, "step": 260, "valid_targets_mean": 3856.2, "valid_targets_min": 1112 }, { "epoch": 0.41996830427892234, "grad_norm": 0.8505689875054292, "learning_rate": 2.3891402714932127e-05, "loss": 0.4818, "loss_nan_ranks": 0, "loss_rank_avg": 0.48634108901023865, "step": 265, "valid_targets_mean": 3152.6, "valid_targets_min": 984 }, { "epoch": 0.42789223454833597, "grad_norm": 0.772976426564909, "learning_rate": 2.434389140271493e-05, "loss": 0.4938, "loss_nan_ranks": 0, "loss_rank_avg": 0.5387519001960754, "step": 270, "valid_targets_mean": 3622.1, "valid_targets_min": 987 }, { "epoch": 0.4358161648177496, "grad_norm": 0.728717890666478, "learning_rate": 2.479638009049774e-05, "loss": 0.4837, "loss_nan_ranks": 0, "loss_rank_avg": 0.4416227638721466, "step": 275, "valid_targets_mean": 3568.1, "valid_targets_min": 870 }, { "epoch": 0.4437400950871632, "grad_norm": 0.7440381524213614, "learning_rate": 2.5248868778280544e-05, "loss": 0.4725, "loss_nan_ranks": 0, "loss_rank_avg": 0.4643154740333557, "step": 280, "valid_targets_mean": 3414.1, "valid_targets_min": 1170 }, { "epoch": 0.45166402535657685, "grad_norm": 0.8310009993608024, "learning_rate": 2.5701357466063352e-05, "loss": 0.508, "loss_nan_ranks": 0, "loss_rank_avg": 0.5839574933052063, "step": 285, "valid_targets_mean": 3222.6, "valid_targets_min": 1309 }, { "epoch": 0.4595879556259905, "grad_norm": 1.0056080573653239, "learning_rate": 2.6153846153846157e-05, "loss": 0.503, "loss_nan_ranks": 0, "loss_rank_avg": 0.5559020042419434, "step": 290, "valid_targets_mean": 2088.1, "valid_targets_min": 904 }, { "epoch": 0.4675118858954041, "grad_norm": 0.7408460822295689, "learning_rate": 2.660633484162896e-05, "loss": 0.4563, "loss_nan_ranks": 0, "loss_rank_avg": 0.485029399394989, "step": 295, "valid_targets_mean": 3781.1, "valid_targets_min": 1262 }, { "epoch": 0.4754358161648177, "grad_norm": 0.8762884446062088, "learning_rate": 2.705882352941177e-05, "loss": 0.4595, "loss_nan_ranks": 0, "loss_rank_avg": 0.4712425470352173, "step": 300, "valid_targets_mean": 2533.3, "valid_targets_min": 1219 }, { "epoch": 0.48335974643423135, "grad_norm": 0.848146038346364, "learning_rate": 2.7511312217194574e-05, "loss": 0.4776, "loss_nan_ranks": 0, "loss_rank_avg": 0.40771573781967163, "step": 305, "valid_targets_mean": 3576.4, "valid_targets_min": 1520 }, { "epoch": 0.49128367670364503, "grad_norm": 0.9694638564949015, "learning_rate": 2.7963800904977375e-05, "loss": 0.4906, "loss_nan_ranks": 0, "loss_rank_avg": 0.4891023337841034, "step": 310, "valid_targets_mean": 2688.9, "valid_targets_min": 1303 }, { "epoch": 0.49920760697305866, "grad_norm": 1.0834078584446678, "learning_rate": 2.8416289592760183e-05, "loss": 0.4946, "loss_nan_ranks": 0, "loss_rank_avg": 0.4841890335083008, "step": 315, "valid_targets_mean": 3407.0, "valid_targets_min": 809 }, { "epoch": 0.5071315372424723, "grad_norm": 0.9122194804424244, "learning_rate": 2.8868778280542988e-05, "loss": 0.4741, "loss_nan_ranks": 0, "loss_rank_avg": 0.47857069969177246, "step": 320, "valid_targets_mean": 2495.8, "valid_targets_min": 1338 }, { "epoch": 0.5150554675118859, "grad_norm": 0.9343811207818954, "learning_rate": 2.9321266968325792e-05, "loss": 0.482, "loss_nan_ranks": 0, "loss_rank_avg": 0.4668818712234497, "step": 325, "valid_targets_mean": 2979.8, "valid_targets_min": 1365 }, { "epoch": 0.5229793977812995, "grad_norm": 0.9068833355782842, "learning_rate": 2.97737556561086e-05, "loss": 0.4667, "loss_nan_ranks": 0, "loss_rank_avg": 0.4718451499938965, "step": 330, "valid_targets_mean": 2903.4, "valid_targets_min": 1354 }, { "epoch": 0.5309033280507132, "grad_norm": 0.7990682092269628, "learning_rate": 3.0226244343891405e-05, "loss": 0.5061, "loss_nan_ranks": 0, "loss_rank_avg": 0.5103294849395752, "step": 335, "valid_targets_mean": 2843.9, "valid_targets_min": 323 }, { "epoch": 0.5388272583201268, "grad_norm": 0.8690173421542774, "learning_rate": 3.067873303167421e-05, "loss": 0.4835, "loss_nan_ranks": 0, "loss_rank_avg": 0.5316380262374878, "step": 340, "valid_targets_mean": 2980.1, "valid_targets_min": 926 }, { "epoch": 0.5467511885895404, "grad_norm": 0.9164824781790208, "learning_rate": 3.1131221719457014e-05, "loss": 0.5017, "loss_nan_ranks": 0, "loss_rank_avg": 0.4985496699810028, "step": 345, "valid_targets_mean": 2905.6, "valid_targets_min": 1131 }, { "epoch": 0.554675118858954, "grad_norm": 0.953530103945049, "learning_rate": 3.158371040723982e-05, "loss": 0.5038, "loss_nan_ranks": 0, "loss_rank_avg": 0.506258487701416, "step": 350, "valid_targets_mean": 2239.8, "valid_targets_min": 968 }, { "epoch": 0.5625990491283677, "grad_norm": 0.831534497185613, "learning_rate": 3.203619909502263e-05, "loss": 0.4813, "loss_nan_ranks": 0, "loss_rank_avg": 0.4679664373397827, "step": 355, "valid_targets_mean": 2892.7, "valid_targets_min": 742 }, { "epoch": 0.5705229793977813, "grad_norm": 0.9297214655733225, "learning_rate": 3.248868778280543e-05, "loss": 0.4977, "loss_nan_ranks": 0, "loss_rank_avg": 0.5199379920959473, "step": 360, "valid_targets_mean": 2508.0, "valid_targets_min": 944 }, { "epoch": 0.5784469096671949, "grad_norm": 0.7980105320092034, "learning_rate": 3.294117647058824e-05, "loss": 0.4842, "loss_nan_ranks": 0, "loss_rank_avg": 0.4856064021587372, "step": 365, "valid_targets_mean": 3416.5, "valid_targets_min": 1289 }, { "epoch": 0.5863708399366085, "grad_norm": 0.7614084262261346, "learning_rate": 3.339366515837105e-05, "loss": 0.4761, "loss_nan_ranks": 0, "loss_rank_avg": 0.4349548816680908, "step": 370, "valid_targets_mean": 3276.8, "valid_targets_min": 994 }, { "epoch": 0.5942947702060222, "grad_norm": 0.750217913881111, "learning_rate": 3.384615384615385e-05, "loss": 0.4981, "loss_nan_ranks": 0, "loss_rank_avg": 0.5112859606742859, "step": 375, "valid_targets_mean": 3364.1, "valid_targets_min": 949 }, { "epoch": 0.6022187004754358, "grad_norm": 0.9079283778370618, "learning_rate": 3.429864253393665e-05, "loss": 0.4827, "loss_nan_ranks": 0, "loss_rank_avg": 0.5121220946311951, "step": 380, "valid_targets_mean": 2648.1, "valid_targets_min": 1194 }, { "epoch": 0.6101426307448494, "grad_norm": 0.8438307201472272, "learning_rate": 3.475113122171946e-05, "loss": 0.474, "loss_nan_ranks": 0, "loss_rank_avg": 0.47371935844421387, "step": 385, "valid_targets_mean": 3062.8, "valid_targets_min": 1584 }, { "epoch": 0.618066561014263, "grad_norm": 0.7638788394514087, "learning_rate": 3.5203619909502266e-05, "loss": 0.4903, "loss_nan_ranks": 0, "loss_rank_avg": 0.46218085289001465, "step": 390, "valid_targets_mean": 3355.6, "valid_targets_min": 1171 }, { "epoch": 0.6259904912836767, "grad_norm": 0.8057208518874918, "learning_rate": 3.5656108597285074e-05, "loss": 0.4516, "loss_nan_ranks": 0, "loss_rank_avg": 0.4557874798774719, "step": 395, "valid_targets_mean": 2975.8, "valid_targets_min": 1180 }, { "epoch": 0.6339144215530903, "grad_norm": 0.8047504969731512, "learning_rate": 3.6108597285067875e-05, "loss": 0.506, "loss_nan_ranks": 0, "loss_rank_avg": 0.5088905096054077, "step": 400, "valid_targets_mean": 3338.4, "valid_targets_min": 1134 }, { "epoch": 0.6418383518225039, "grad_norm": 0.7333017715853949, "learning_rate": 3.656108597285068e-05, "loss": 0.438, "loss_nan_ranks": 0, "loss_rank_avg": 0.40402841567993164, "step": 405, "valid_targets_mean": 3842.2, "valid_targets_min": 1351 }, { "epoch": 0.6497622820919176, "grad_norm": 0.8399572940800708, "learning_rate": 3.701357466063349e-05, "loss": 0.5022, "loss_nan_ranks": 0, "loss_rank_avg": 0.48715096712112427, "step": 410, "valid_targets_mean": 3547.1, "valid_targets_min": 1158 }, { "epoch": 0.6576862123613312, "grad_norm": 0.6829367274200412, "learning_rate": 3.746606334841629e-05, "loss": 0.4701, "loss_nan_ranks": 0, "loss_rank_avg": 0.4927830994129181, "step": 415, "valid_targets_mean": 4532.0, "valid_targets_min": 1815 }, { "epoch": 0.6656101426307448, "grad_norm": 0.7331801766359471, "learning_rate": 3.791855203619909e-05, "loss": 0.4813, "loss_nan_ranks": 0, "loss_rank_avg": 0.4546471834182739, "step": 420, "valid_targets_mean": 3296.0, "valid_targets_min": 1238 }, { "epoch": 0.6735340729001584, "grad_norm": 0.6517565900289717, "learning_rate": 3.837104072398191e-05, "loss": 0.4519, "loss_nan_ranks": 0, "loss_rank_avg": 0.3863980174064636, "step": 425, "valid_targets_mean": 3856.7, "valid_targets_min": 1241 }, { "epoch": 0.6814580031695721, "grad_norm": 0.7230595741095671, "learning_rate": 3.882352941176471e-05, "loss": 0.4603, "loss_nan_ranks": 0, "loss_rank_avg": 0.4377797544002533, "step": 430, "valid_targets_mean": 3500.8, "valid_targets_min": 1413 }, { "epoch": 0.6893819334389857, "grad_norm": 0.8116424062683696, "learning_rate": 3.927601809954751e-05, "loss": 0.478, "loss_nan_ranks": 0, "loss_rank_avg": 0.48108479380607605, "step": 435, "valid_targets_mean": 2934.9, "valid_targets_min": 1263 }, { "epoch": 0.6973058637083994, "grad_norm": 0.7795795329155563, "learning_rate": 3.972850678733032e-05, "loss": 0.4656, "loss_nan_ranks": 0, "loss_rank_avg": 0.4403081238269806, "step": 440, "valid_targets_mean": 2962.6, "valid_targets_min": 973 }, { "epoch": 0.705229793977813, "grad_norm": 0.7200947601229617, "learning_rate": 3.99999750146533e-05, "loss": 0.4536, "loss_nan_ranks": 0, "loss_rank_avg": 0.4119512438774109, "step": 445, "valid_targets_mean": 3470.1, "valid_targets_min": 666 }, { "epoch": 0.7131537242472267, "grad_norm": 0.7628047573152018, "learning_rate": 3.999969393021975e-05, "loss": 0.4598, "loss_nan_ranks": 0, "loss_rank_avg": 0.4884294271469116, "step": 450, "valid_targets_mean": 3419.0, "valid_targets_min": 933 }, { "epoch": 0.7210776545166403, "grad_norm": 0.7380251751146455, "learning_rate": 3.999910053407327e-05, "loss": 0.4637, "loss_nan_ranks": 0, "loss_rank_avg": 0.48761463165283203, "step": 455, "valid_targets_mean": 4100.1, "valid_targets_min": 1287 }, { "epoch": 0.7290015847860539, "grad_norm": 0.9308179330317129, "learning_rate": 3.999819483548022e-05, "loss": 0.4695, "loss_nan_ranks": 0, "loss_rank_avg": 0.4577655792236328, "step": 460, "valid_targets_mean": 2391.7, "valid_targets_min": 1138 }, { "epoch": 0.7369255150554676, "grad_norm": 0.7825831726322529, "learning_rate": 3.999697684858384e-05, "loss": 0.4776, "loss_nan_ranks": 0, "loss_rank_avg": 0.48154550790786743, "step": 465, "valid_targets_mean": 3380.8, "valid_targets_min": 1034 }, { "epoch": 0.7448494453248812, "grad_norm": 0.6672464690362646, "learning_rate": 3.9995446592403994e-05, "loss": 0.462, "loss_nan_ranks": 0, "loss_rank_avg": 0.43639689683914185, "step": 470, "valid_targets_mean": 3831.9, "valid_targets_min": 995 }, { "epoch": 0.7527733755942948, "grad_norm": 0.8243105277532876, "learning_rate": 3.9993604090836905e-05, "loss": 0.4321, "loss_nan_ranks": 0, "loss_rank_avg": 0.47002795338630676, "step": 475, "valid_targets_mean": 3040.6, "valid_targets_min": 917 }, { "epoch": 0.7606973058637084, "grad_norm": 0.761930542283936, "learning_rate": 3.999144937265473e-05, "loss": 0.4752, "loss_nan_ranks": 0, "loss_rank_avg": 0.46109023690223694, "step": 480, "valid_targets_mean": 3145.6, "valid_targets_min": 1514 }, { "epoch": 0.768621236133122, "grad_norm": 0.8060589330068717, "learning_rate": 3.998898247150519e-05, "loss": 0.4463, "loss_nan_ranks": 0, "loss_rank_avg": 0.4293675720691681, "step": 485, "valid_targets_mean": 2624.5, "valid_targets_min": 875 }, { "epoch": 0.7765451664025357, "grad_norm": 0.7239375292351515, "learning_rate": 3.9986203425910976e-05, "loss": 0.4541, "loss_nan_ranks": 0, "loss_rank_avg": 0.49284249544143677, "step": 490, "valid_targets_mean": 3257.3, "valid_targets_min": 1477 }, { "epoch": 0.7844690966719493, "grad_norm": 0.661893236239374, "learning_rate": 3.998311227926918e-05, "loss": 0.4455, "loss_nan_ranks": 0, "loss_rank_avg": 0.4618075489997864, "step": 495, "valid_targets_mean": 3975.6, "valid_targets_min": 1167 }, { "epoch": 0.7923930269413629, "grad_norm": 0.7934924986420486, "learning_rate": 3.997970907985059e-05, "loss": 0.5113, "loss_nan_ranks": 0, "loss_rank_avg": 0.5001330375671387, "step": 500, "valid_targets_mean": 2784.4, "valid_targets_min": 1326 }, { "epoch": 0.8003169572107766, "grad_norm": 0.8975772569125601, "learning_rate": 3.9975993880799e-05, "loss": 0.4497, "loss_nan_ranks": 0, "loss_rank_avg": 0.42663824558258057, "step": 505, "valid_targets_mean": 2079.9, "valid_targets_min": 918 }, { "epoch": 0.8082408874801902, "grad_norm": 0.6568781194669023, "learning_rate": 3.9971966740130284e-05, "loss": 0.4495, "loss_nan_ranks": 0, "loss_rank_avg": 0.46053969860076904, "step": 510, "valid_targets_mean": 3603.1, "valid_targets_min": 1018 }, { "epoch": 0.8161648177496038, "grad_norm": 0.6658645533938224, "learning_rate": 3.996762772073156e-05, "loss": 0.4417, "loss_nan_ranks": 0, "loss_rank_avg": 0.4799339771270752, "step": 515, "valid_targets_mean": 4443.3, "valid_targets_min": 1201 }, { "epoch": 0.8240887480190174, "grad_norm": 0.8120691967226177, "learning_rate": 3.996297689036022e-05, "loss": 0.4691, "loss_nan_ranks": 0, "loss_rank_avg": 0.5048344731330872, "step": 520, "valid_targets_mean": 2798.8, "valid_targets_min": 982 }, { "epoch": 0.8320126782884311, "grad_norm": 0.7585539749107885, "learning_rate": 3.995801432164279e-05, "loss": 0.4741, "loss_nan_ranks": 0, "loss_rank_avg": 0.42256441712379456, "step": 525, "valid_targets_mean": 2953.5, "valid_targets_min": 1244 }, { "epoch": 0.8399366085578447, "grad_norm": 0.7627360477522009, "learning_rate": 3.9952740092073895e-05, "loss": 0.4474, "loss_nan_ranks": 0, "loss_rank_avg": 0.45900869369506836, "step": 530, "valid_targets_mean": 2668.1, "valid_targets_min": 1356 }, { "epoch": 0.8478605388272583, "grad_norm": 0.7233384200007872, "learning_rate": 3.9947154284014955e-05, "loss": 0.472, "loss_nan_ranks": 0, "loss_rank_avg": 0.46540921926498413, "step": 535, "valid_targets_mean": 3327.3, "valid_targets_min": 956 }, { "epoch": 0.8557844690966719, "grad_norm": 0.8462825976473535, "learning_rate": 3.994125698469298e-05, "loss": 0.4679, "loss_nan_ranks": 0, "loss_rank_avg": 0.44462665915489197, "step": 540, "valid_targets_mean": 2309.5, "valid_targets_min": 839 }, { "epoch": 0.8637083993660856, "grad_norm": 0.7523146524714103, "learning_rate": 3.9935048286199166e-05, "loss": 0.4354, "loss_nan_ranks": 0, "loss_rank_avg": 0.4704914391040802, "step": 545, "valid_targets_mean": 3301.1, "valid_targets_min": 896 }, { "epoch": 0.8716323296354992, "grad_norm": 0.7323342838512769, "learning_rate": 3.992852828548745e-05, "loss": 0.4391, "loss_nan_ranks": 0, "loss_rank_avg": 0.43246427178382874, "step": 550, "valid_targets_mean": 3083.8, "valid_targets_min": 592 }, { "epoch": 0.8795562599049128, "grad_norm": 0.7835802807257946, "learning_rate": 3.992169708437304e-05, "loss": 0.4496, "loss_nan_ranks": 0, "loss_rank_avg": 0.42524343729019165, "step": 555, "valid_targets_mean": 2537.8, "valid_targets_min": 805 }, { "epoch": 0.8874801901743264, "grad_norm": 0.8164094838303196, "learning_rate": 3.9914554789530753e-05, "loss": 0.4494, "loss_nan_ranks": 0, "loss_rank_avg": 0.4827771782875061, "step": 560, "valid_targets_mean": 3152.2, "valid_targets_min": 1026 }, { "epoch": 0.8954041204437401, "grad_norm": 0.6690559963612506, "learning_rate": 3.990710151249342e-05, "loss": 0.4493, "loss_nan_ranks": 0, "loss_rank_avg": 0.4192623496055603, "step": 565, "valid_targets_mean": 3655.5, "valid_targets_min": 1219 }, { "epoch": 0.9033280507131537, "grad_norm": 0.6580359416743707, "learning_rate": 3.989933736965011e-05, "loss": 0.4577, "loss_nan_ranks": 0, "loss_rank_avg": 0.4300585389137268, "step": 570, "valid_targets_mean": 4057.7, "valid_targets_min": 762 }, { "epoch": 0.9112519809825673, "grad_norm": 0.8064570151818262, "learning_rate": 3.9891262482244315e-05, "loss": 0.4571, "loss_nan_ranks": 0, "loss_rank_avg": 0.49867746233940125, "step": 575, "valid_targets_mean": 2577.3, "valid_targets_min": 917 }, { "epoch": 0.919175911251981, "grad_norm": 0.7851899897385263, "learning_rate": 3.988287697637206e-05, "loss": 0.4444, "loss_nan_ranks": 0, "loss_rank_avg": 0.5172279477119446, "step": 580, "valid_targets_mean": 3265.5, "valid_targets_min": 929 }, { "epoch": 0.9270998415213946, "grad_norm": 0.7641647370399206, "learning_rate": 3.987418098297993e-05, "loss": 0.423, "loss_nan_ranks": 0, "loss_rank_avg": 0.4322676360607147, "step": 585, "valid_targets_mean": 2695.2, "valid_targets_min": 1420 }, { "epoch": 0.9350237717908082, "grad_norm": 0.7323141223552216, "learning_rate": 3.986517463786304e-05, "loss": 0.4142, "loss_nan_ranks": 0, "loss_rank_avg": 0.4049820899963379, "step": 590, "valid_targets_mean": 2684.9, "valid_targets_min": 1028 }, { "epoch": 0.9429477020602218, "grad_norm": 0.7633256320545897, "learning_rate": 3.985585808166289e-05, "loss": 0.4453, "loss_nan_ranks": 0, "loss_rank_avg": 0.4967576563358307, "step": 595, "valid_targets_mean": 2754.4, "valid_targets_min": 1337 }, { "epoch": 0.9508716323296355, "grad_norm": 0.7629796008373017, "learning_rate": 3.9846231459865195e-05, "loss": 0.4256, "loss_nan_ranks": 0, "loss_rank_avg": 0.43822014331817627, "step": 600, "valid_targets_mean": 2671.6, "valid_targets_min": 1143 }, { "epoch": 0.9587955625990491, "grad_norm": 0.8958552133877844, "learning_rate": 3.983629492279759e-05, "loss": 0.4518, "loss_nan_ranks": 0, "loss_rank_avg": 0.48023688793182373, "step": 605, "valid_targets_mean": 2614.1, "valid_targets_min": 1174 }, { "epoch": 0.9667194928684627, "grad_norm": 0.6996692976043973, "learning_rate": 3.982604862562729e-05, "loss": 0.4385, "loss_nan_ranks": 0, "loss_rank_avg": 0.44010189175605774, "step": 610, "valid_targets_mean": 3366.1, "valid_targets_min": 1220 }, { "epoch": 0.9746434231378764, "grad_norm": 0.6660341248169072, "learning_rate": 3.9815492728358674e-05, "loss": 0.4333, "loss_nan_ranks": 0, "loss_rank_avg": 0.4266677498817444, "step": 615, "valid_targets_mean": 3921.9, "valid_targets_min": 878 }, { "epoch": 0.9825673534072901, "grad_norm": 0.9292017152796667, "learning_rate": 3.980462739583079e-05, "loss": 0.4216, "loss_nan_ranks": 0, "loss_rank_avg": 0.40375131368637085, "step": 620, "valid_targets_mean": 2191.8, "valid_targets_min": 941 }, { "epoch": 0.9904912836767037, "grad_norm": 0.7664309991122322, "learning_rate": 3.9793452797714765e-05, "loss": 0.4152, "loss_nan_ranks": 0, "loss_rank_avg": 0.4360402524471283, "step": 625, "valid_targets_mean": 3167.6, "valid_targets_min": 883 }, { "epoch": 0.9984152139461173, "grad_norm": 0.762176105418411, "learning_rate": 3.9781969108511156e-05, "loss": 0.4323, "loss_nan_ranks": 0, "loss_rank_avg": 0.4275134801864624, "step": 630, "valid_targets_mean": 2764.2, "valid_targets_min": 832 }, { "epoch": 1.006339144215531, "grad_norm": 0.704479878187583, "learning_rate": 3.9770176507547246e-05, "loss": 0.4287, "loss_nan_ranks": 0, "loss_rank_avg": 0.41019442677497864, "step": 635, "valid_targets_mean": 4324.3, "valid_targets_min": 1450 }, { "epoch": 1.0142630744849446, "grad_norm": 0.9019061125405019, "learning_rate": 3.975807517897422e-05, "loss": 0.4257, "loss_nan_ranks": 0, "loss_rank_avg": 0.3917194604873657, "step": 640, "valid_targets_mean": 2455.1, "valid_targets_min": 1134 }, { "epoch": 1.0221870047543582, "grad_norm": 0.8978043885613115, "learning_rate": 3.9745665311764305e-05, "loss": 0.4053, "loss_nan_ranks": 0, "loss_rank_avg": 0.4289025664329529, "step": 645, "valid_targets_mean": 2416.1, "valid_targets_min": 891 }, { "epoch": 1.0301109350237718, "grad_norm": 0.7816645884156189, "learning_rate": 3.973294709970781e-05, "loss": 0.424, "loss_nan_ranks": 0, "loss_rank_avg": 0.4417671263217926, "step": 650, "valid_targets_mean": 2768.1, "valid_targets_min": 932 }, { "epoch": 1.0380348652931854, "grad_norm": 0.718601192352368, "learning_rate": 3.97199207414101e-05, "loss": 0.4231, "loss_nan_ranks": 0, "loss_rank_avg": 0.40946125984191895, "step": 655, "valid_targets_mean": 3722.6, "valid_targets_min": 926 }, { "epoch": 1.045958795562599, "grad_norm": 0.84427108743179, "learning_rate": 3.970658644028851e-05, "loss": 0.4549, "loss_nan_ranks": 0, "loss_rank_avg": 0.46118617057800293, "step": 660, "valid_targets_mean": 2638.7, "valid_targets_min": 832 }, { "epoch": 1.0538827258320127, "grad_norm": 0.860139409056787, "learning_rate": 3.969294440456915e-05, "loss": 0.4158, "loss_nan_ranks": 0, "loss_rank_avg": 0.43523386120796204, "step": 665, "valid_targets_mean": 2739.1, "valid_targets_min": 1231 }, { "epoch": 1.0618066561014263, "grad_norm": 0.7097427943901892, "learning_rate": 3.9678994847283636e-05, "loss": 0.4183, "loss_nan_ranks": 0, "loss_rank_avg": 0.3999113142490387, "step": 670, "valid_targets_mean": 3927.4, "valid_targets_min": 1556 }, { "epoch": 1.06973058637084, "grad_norm": 0.7042143614988474, "learning_rate": 3.9664737986265825e-05, "loss": 0.4003, "loss_nan_ranks": 0, "loss_rank_avg": 0.3503003418445587, "step": 675, "valid_targets_mean": 3451.0, "valid_targets_min": 1132 }, { "epoch": 1.0776545166402536, "grad_norm": 0.797726052806819, "learning_rate": 3.9650174044148364e-05, "loss": 0.4136, "loss_nan_ranks": 0, "loss_rank_avg": 0.4306812882423401, "step": 680, "valid_targets_mean": 2851.7, "valid_targets_min": 972 }, { "epoch": 1.0855784469096672, "grad_norm": 0.7997403365127854, "learning_rate": 3.9635303248359206e-05, "loss": 0.4343, "loss_nan_ranks": 0, "loss_rank_avg": 0.4064903259277344, "step": 685, "valid_targets_mean": 3858.1, "valid_targets_min": 828 }, { "epoch": 1.0935023771790808, "grad_norm": 0.741920647282534, "learning_rate": 3.9620125831118105e-05, "loss": 0.4148, "loss_nan_ranks": 0, "loss_rank_avg": 0.42814987897872925, "step": 690, "valid_targets_mean": 3245.4, "valid_targets_min": 1067 }, { "epoch": 1.1014263074484945, "grad_norm": 0.8105775677772558, "learning_rate": 3.960464202943293e-05, "loss": 0.4221, "loss_nan_ranks": 0, "loss_rank_avg": 0.42513906955718994, "step": 695, "valid_targets_mean": 2785.9, "valid_targets_min": 1048 }, { "epoch": 1.109350237717908, "grad_norm": 0.7115809927579022, "learning_rate": 3.958885208509601e-05, "loss": 0.4217, "loss_nan_ranks": 0, "loss_rank_avg": 0.41410183906555176, "step": 700, "valid_targets_mean": 3303.6, "valid_targets_min": 1311 }, { "epoch": 1.1172741679873217, "grad_norm": 0.6566885854355542, "learning_rate": 3.957275624468037e-05, "loss": 0.3903, "loss_nan_ranks": 0, "loss_rank_avg": 0.3849619925022125, "step": 705, "valid_targets_mean": 3675.2, "valid_targets_min": 1298 }, { "epoch": 1.1251980982567353, "grad_norm": 0.7159393546972551, "learning_rate": 3.9556354759535806e-05, "loss": 0.3989, "loss_nan_ranks": 0, "loss_rank_avg": 0.3957841694355011, "step": 710, "valid_targets_mean": 3910.0, "valid_targets_min": 1085 }, { "epoch": 1.133122028526149, "grad_norm": 0.654787326318881, "learning_rate": 3.9539647885785056e-05, "loss": 0.4271, "loss_nan_ranks": 0, "loss_rank_avg": 0.42849165201187134, "step": 715, "valid_targets_mean": 4003.0, "valid_targets_min": 1117 }, { "epoch": 1.1410459587955626, "grad_norm": 0.692869210178711, "learning_rate": 3.952263588431971e-05, "loss": 0.4155, "loss_nan_ranks": 0, "loss_rank_avg": 0.3946205675601959, "step": 720, "valid_targets_mean": 3680.2, "valid_targets_min": 734 }, { "epoch": 1.1489698890649762, "grad_norm": 0.8061172018614384, "learning_rate": 3.950531902079622e-05, "loss": 0.3988, "loss_nan_ranks": 0, "loss_rank_avg": 0.40015098452568054, "step": 725, "valid_targets_mean": 3444.4, "valid_targets_min": 1252 }, { "epoch": 1.1568938193343898, "grad_norm": 0.7318031830672799, "learning_rate": 3.948769756563167e-05, "loss": 0.4215, "loss_nan_ranks": 0, "loss_rank_avg": 0.3930429220199585, "step": 730, "valid_targets_mean": 3201.9, "valid_targets_min": 666 }, { "epoch": 1.1648177496038035, "grad_norm": 0.612779900383534, "learning_rate": 3.9469771793999625e-05, "loss": 0.4347, "loss_nan_ranks": 0, "loss_rank_avg": 0.4050843119621277, "step": 735, "valid_targets_mean": 4257.2, "valid_targets_min": 1484 }, { "epoch": 1.172741679873217, "grad_norm": 0.7408822062660686, "learning_rate": 3.9451541985825786e-05, "loss": 0.4364, "loss_nan_ranks": 0, "loss_rank_avg": 0.3889385163784027, "step": 740, "valid_targets_mean": 3084.0, "valid_targets_min": 925 }, { "epoch": 1.1806656101426307, "grad_norm": 0.8417691654111226, "learning_rate": 3.9433008425783644e-05, "loss": 0.4036, "loss_nan_ranks": 0, "loss_rank_avg": 0.39221471548080444, "step": 745, "valid_targets_mean": 2542.4, "valid_targets_min": 824 }, { "epoch": 1.1885895404120443, "grad_norm": 0.8455649038780431, "learning_rate": 3.941417140329002e-05, "loss": 0.4236, "loss_nan_ranks": 0, "loss_rank_avg": 0.41412001848220825, "step": 750, "valid_targets_mean": 2310.1, "valid_targets_min": 692 }, { "epoch": 1.196513470681458, "grad_norm": 0.8023487927804567, "learning_rate": 3.939503121250055e-05, "loss": 0.4444, "loss_nan_ranks": 0, "loss_rank_avg": 0.4537830054759979, "step": 755, "valid_targets_mean": 2984.4, "valid_targets_min": 1263 }, { "epoch": 1.2044374009508716, "grad_norm": 0.836410102281734, "learning_rate": 3.937558815230511e-05, "loss": 0.4309, "loss_nan_ranks": 0, "loss_rank_avg": 0.41315758228302, "step": 760, "valid_targets_mean": 2404.2, "valid_targets_min": 1275 }, { "epoch": 1.2123613312202852, "grad_norm": 0.7687019899235902, "learning_rate": 3.935584252632311e-05, "loss": 0.3922, "loss_nan_ranks": 0, "loss_rank_avg": 0.4471081495285034, "step": 765, "valid_targets_mean": 3286.8, "valid_targets_min": 881 }, { "epoch": 1.2202852614896988, "grad_norm": 0.8076276401226896, "learning_rate": 3.933579464289877e-05, "loss": 0.4229, "loss_nan_ranks": 0, "loss_rank_avg": 0.44439810514450073, "step": 770, "valid_targets_mean": 2975.2, "valid_targets_min": 605 }, { "epoch": 1.2282091917591125, "grad_norm": 0.6761174721765739, "learning_rate": 3.931544481509634e-05, "loss": 0.4123, "loss_nan_ranks": 0, "loss_rank_avg": 0.3570912480354309, "step": 775, "valid_targets_mean": 3133.5, "valid_targets_min": 1202 }, { "epoch": 1.236133122028526, "grad_norm": 0.6540995614498064, "learning_rate": 3.929479336069515e-05, "loss": 0.4087, "loss_nan_ranks": 0, "loss_rank_avg": 0.4113902449607849, "step": 780, "valid_targets_mean": 3971.6, "valid_targets_min": 1882 }, { "epoch": 1.2440570522979397, "grad_norm": 0.7555222122842105, "learning_rate": 3.9273840602184704e-05, "loss": 0.4283, "loss_nan_ranks": 0, "loss_rank_avg": 0.415526807308197, "step": 785, "valid_targets_mean": 2650.9, "valid_targets_min": 1373 }, { "epoch": 1.2519809825673534, "grad_norm": 0.7338778533435747, "learning_rate": 3.925258686675959e-05, "loss": 0.4202, "loss_nan_ranks": 0, "loss_rank_avg": 0.4193318486213684, "step": 790, "valid_targets_mean": 3284.5, "valid_targets_min": 729 }, { "epoch": 1.259904912836767, "grad_norm": 0.6821772996833774, "learning_rate": 3.9231032486314424e-05, "loss": 0.424, "loss_nan_ranks": 0, "loss_rank_avg": 0.4240224063396454, "step": 795, "valid_targets_mean": 3689.0, "valid_targets_min": 767 }, { "epoch": 1.2678288431061806, "grad_norm": 0.6846368831579128, "learning_rate": 3.920917779743863e-05, "loss": 0.4251, "loss_nan_ranks": 0, "loss_rank_avg": 0.3829592764377594, "step": 800, "valid_targets_mean": 3325.4, "valid_targets_min": 1102 }, { "epoch": 1.2757527733755942, "grad_norm": 0.6659668031255094, "learning_rate": 3.9187023141411174e-05, "loss": 0.4236, "loss_nan_ranks": 0, "loss_rank_avg": 0.38867223262786865, "step": 805, "valid_targets_mean": 3416.3, "valid_targets_min": 1262 }, { "epoch": 1.2836767036450079, "grad_norm": 0.7285809624299453, "learning_rate": 3.916456886419531e-05, "loss": 0.4231, "loss_nan_ranks": 0, "loss_rank_avg": 0.3913799822330475, "step": 810, "valid_targets_mean": 3115.3, "valid_targets_min": 1613 }, { "epoch": 1.2916006339144215, "grad_norm": 0.6294190021912572, "learning_rate": 3.914181531643308e-05, "loss": 0.4208, "loss_nan_ranks": 0, "loss_rank_avg": 0.40710440278053284, "step": 815, "valid_targets_mean": 4045.3, "valid_targets_min": 1010 }, { "epoch": 1.299524564183835, "grad_norm": 0.6395002952830273, "learning_rate": 3.9118762853439896e-05, "loss": 0.4159, "loss_nan_ranks": 0, "loss_rank_avg": 0.38787251710891724, "step": 820, "valid_targets_mean": 3804.1, "valid_targets_min": 1352 }, { "epoch": 1.3074484944532487, "grad_norm": 0.8584841420313233, "learning_rate": 3.909541183519897e-05, "loss": 0.3973, "loss_nan_ranks": 0, "loss_rank_avg": 0.44322896003723145, "step": 825, "valid_targets_mean": 2552.2, "valid_targets_min": 1167 }, { "epoch": 1.3153724247226624, "grad_norm": 0.8556648774974849, "learning_rate": 3.907176262635573e-05, "loss": 0.4347, "loss_nan_ranks": 0, "loss_rank_avg": 0.4341663718223572, "step": 830, "valid_targets_mean": 2628.5, "valid_targets_min": 1103 }, { "epoch": 1.3232963549920762, "grad_norm": 0.7234909908437245, "learning_rate": 3.904781559621205e-05, "loss": 0.3865, "loss_nan_ranks": 0, "loss_rank_avg": 0.39154618978500366, "step": 835, "valid_targets_mean": 3121.8, "valid_targets_min": 1013 }, { "epoch": 1.3312202852614896, "grad_norm": 0.8559159891089542, "learning_rate": 3.9023571118720556e-05, "loss": 0.4387, "loss_nan_ranks": 0, "loss_rank_avg": 0.451394259929657, "step": 840, "valid_targets_mean": 3243.3, "valid_targets_min": 1096 }, { "epoch": 1.3391442155309035, "grad_norm": 0.6960908027565411, "learning_rate": 3.899902957247876e-05, "loss": 0.4319, "loss_nan_ranks": 0, "loss_rank_avg": 0.4584362208843231, "step": 845, "valid_targets_mean": 3875.6, "valid_targets_min": 790 }, { "epoch": 1.3470681458003169, "grad_norm": 0.7088383534291515, "learning_rate": 3.8974191340723156e-05, "loss": 0.4269, "loss_nan_ranks": 0, "loss_rank_avg": 0.4132707118988037, "step": 850, "valid_targets_mean": 3384.2, "valid_targets_min": 820 }, { "epoch": 1.3549920760697307, "grad_norm": 0.9002448432474283, "learning_rate": 3.89490568113232e-05, "loss": 0.4319, "loss_nan_ranks": 0, "loss_rank_avg": 0.4581453502178192, "step": 855, "valid_targets_mean": 2567.9, "valid_targets_min": 907 }, { "epoch": 1.3629160063391441, "grad_norm": 0.8733397713665929, "learning_rate": 3.8923626376775304e-05, "loss": 0.4174, "loss_nan_ranks": 0, "loss_rank_avg": 0.38375404477119446, "step": 860, "valid_targets_mean": 2163.6, "valid_targets_min": 1028 }, { "epoch": 1.370839936608558, "grad_norm": 0.7437113903348465, "learning_rate": 3.889790043419667e-05, "loss": 0.3846, "loss_nan_ranks": 0, "loss_rank_avg": 0.39502203464508057, "step": 865, "valid_targets_mean": 2958.6, "valid_targets_min": 928 }, { "epoch": 1.3787638668779714, "grad_norm": 0.8343548930808327, "learning_rate": 3.88718793853191e-05, "loss": 0.3955, "loss_nan_ranks": 0, "loss_rank_avg": 0.3916308283805847, "step": 870, "valid_targets_mean": 2949.1, "valid_targets_min": 1143 }, { "epoch": 1.3866877971473852, "grad_norm": 0.7516211189853197, "learning_rate": 3.884556363648274e-05, "loss": 0.4079, "loss_nan_ranks": 0, "loss_rank_avg": 0.39778488874435425, "step": 875, "valid_targets_mean": 3050.1, "valid_targets_min": 1425 }, { "epoch": 1.3946117274167986, "grad_norm": 1.9122478361363395, "learning_rate": 3.881895359862971e-05, "loss": 0.3955, "loss_nan_ranks": 0, "loss_rank_avg": 0.3751554489135742, "step": 880, "valid_targets_mean": 3727.2, "valid_targets_min": 1411 }, { "epoch": 1.4025356576862125, "grad_norm": 0.8283328429349839, "learning_rate": 3.8792049687297676e-05, "loss": 0.429, "loss_nan_ranks": 0, "loss_rank_avg": 0.4410147964954376, "step": 885, "valid_targets_mean": 2555.6, "valid_targets_min": 1352 }, { "epoch": 1.4104595879556259, "grad_norm": 0.7964713017148128, "learning_rate": 3.8764852322613424e-05, "loss": 0.3962, "loss_nan_ranks": 0, "loss_rank_avg": 0.4192018508911133, "step": 890, "valid_targets_mean": 2898.3, "valid_targets_min": 1409 }, { "epoch": 1.4183835182250397, "grad_norm": 0.9240073279538392, "learning_rate": 3.873736192928621e-05, "loss": 0.4215, "loss_nan_ranks": 0, "loss_rank_avg": 0.4372017979621887, "step": 895, "valid_targets_mean": 2696.7, "valid_targets_min": 756 }, { "epoch": 1.4263074484944531, "grad_norm": 0.83039785426173, "learning_rate": 3.870957893660121e-05, "loss": 0.3843, "loss_nan_ranks": 0, "loss_rank_avg": 0.41866040229797363, "step": 900, "valid_targets_mean": 2210.3, "valid_targets_min": 805 }, { "epoch": 1.434231378763867, "grad_norm": 0.80445295919421, "learning_rate": 3.8681503778412755e-05, "loss": 0.3896, "loss_nan_ranks": 0, "loss_rank_avg": 0.4015462398529053, "step": 905, "valid_targets_mean": 2993.2, "valid_targets_min": 1028 }, { "epoch": 1.4421553090332804, "grad_norm": 0.7688696814096964, "learning_rate": 3.86531368931376e-05, "loss": 0.4115, "loss_nan_ranks": 0, "loss_rank_avg": 0.4431518018245697, "step": 910, "valid_targets_mean": 2941.3, "valid_targets_min": 1125 }, { "epoch": 1.4500792393026942, "grad_norm": 0.6998329358267783, "learning_rate": 3.862447872374804e-05, "loss": 0.4143, "loss_nan_ranks": 0, "loss_rank_avg": 0.3961395025253296, "step": 915, "valid_targets_mean": 3132.4, "valid_targets_min": 1155 }, { "epoch": 1.4580031695721076, "grad_norm": 0.7100699865804003, "learning_rate": 3.859552971776503e-05, "loss": 0.4, "loss_nan_ranks": 0, "loss_rank_avg": 0.4128316044807434, "step": 920, "valid_targets_mean": 3220.7, "valid_targets_min": 1136 }, { "epoch": 1.4659270998415215, "grad_norm": 0.724096649438488, "learning_rate": 3.856629032725117e-05, "loss": 0.4019, "loss_nan_ranks": 0, "loss_rank_avg": 0.413987398147583, "step": 925, "valid_targets_mean": 3048.2, "valid_targets_min": 1512 }, { "epoch": 1.473851030110935, "grad_norm": 0.9087616628326457, "learning_rate": 3.853676100880366e-05, "loss": 0.4225, "loss_nan_ranks": 0, "loss_rank_avg": 0.4310683012008667, "step": 930, "valid_targets_mean": 2377.6, "valid_targets_min": 764 }, { "epoch": 1.4817749603803487, "grad_norm": 0.696626378789911, "learning_rate": 3.8506942223547144e-05, "loss": 0.4151, "loss_nan_ranks": 0, "loss_rank_avg": 0.41933345794677734, "step": 935, "valid_targets_mean": 3630.8, "valid_targets_min": 890 }, { "epoch": 1.4896988906497624, "grad_norm": 0.8254765290702623, "learning_rate": 3.847683443712655e-05, "loss": 0.4054, "loss_nan_ranks": 0, "loss_rank_avg": 0.4006253480911255, "step": 940, "valid_targets_mean": 2531.5, "valid_targets_min": 613 }, { "epoch": 1.497622820919176, "grad_norm": 0.6563699014476309, "learning_rate": 3.844643811969979e-05, "loss": 0.3964, "loss_nan_ranks": 0, "loss_rank_avg": 0.3917093873023987, "step": 945, "valid_targets_mean": 3745.3, "valid_targets_min": 1636 }, { "epoch": 1.5055467511885894, "grad_norm": 0.7034200261801405, "learning_rate": 3.8415753745930434e-05, "loss": 0.3836, "loss_nan_ranks": 0, "loss_rank_avg": 0.37366852164268494, "step": 950, "valid_targets_mean": 3708.8, "valid_targets_min": 1277 }, { "epoch": 1.5134706814580032, "grad_norm": 0.7068374328594914, "learning_rate": 3.8384781794980266e-05, "loss": 0.3985, "loss_nan_ranks": 0, "loss_rank_avg": 0.3869531750679016, "step": 955, "valid_targets_mean": 3328.4, "valid_targets_min": 1074 }, { "epoch": 1.5213946117274166, "grad_norm": 0.7395241815584156, "learning_rate": 3.835352275050186e-05, "loss": 0.4003, "loss_nan_ranks": 0, "loss_rank_avg": 0.41180118918418884, "step": 960, "valid_targets_mean": 2738.5, "valid_targets_min": 1475 }, { "epoch": 1.5293185419968305, "grad_norm": 0.8711264116280388, "learning_rate": 3.832197710063095e-05, "loss": 0.4093, "loss_nan_ranks": 0, "loss_rank_avg": 0.45476359128952026, "step": 965, "valid_targets_mean": 2199.7, "valid_targets_min": 933 }, { "epoch": 1.537242472266244, "grad_norm": 0.6703294555536304, "learning_rate": 3.829014533797889e-05, "loss": 0.4049, "loss_nan_ranks": 0, "loss_rank_avg": 0.37091028690338135, "step": 970, "valid_targets_mean": 3504.9, "valid_targets_min": 1036 }, { "epoch": 1.5451664025356577, "grad_norm": 0.686830221903586, "learning_rate": 3.8258027959624896e-05, "loss": 0.3891, "loss_nan_ranks": 0, "loss_rank_avg": 0.41083040833473206, "step": 975, "valid_targets_mean": 3011.7, "valid_targets_min": 1312 }, { "epoch": 1.5530903328050714, "grad_norm": 0.7408376847260882, "learning_rate": 3.822562546710831e-05, "loss": 0.4002, "loss_nan_ranks": 0, "loss_rank_avg": 0.4086455702781677, "step": 980, "valid_targets_mean": 2653.7, "valid_targets_min": 882 }, { "epoch": 1.561014263074485, "grad_norm": 0.636239559181727, "learning_rate": 3.8192938366420783e-05, "loss": 0.4058, "loss_nan_ranks": 0, "loss_rank_avg": 0.3559831380844116, "step": 985, "valid_targets_mean": 3844.6, "valid_targets_min": 1435 }, { "epoch": 1.5689381933438986, "grad_norm": 0.7144101319476477, "learning_rate": 3.815996716799834e-05, "loss": 0.4376, "loss_nan_ranks": 0, "loss_rank_avg": 0.4442058801651001, "step": 990, "valid_targets_mean": 3304.9, "valid_targets_min": 1338 }, { "epoch": 1.5768621236133122, "grad_norm": 1.1225511402749522, "learning_rate": 3.812671238671344e-05, "loss": 0.4297, "loss_nan_ranks": 0, "loss_rank_avg": 0.5221154093742371, "step": 995, "valid_targets_mean": 1934.2, "valid_targets_min": 1198 }, { "epoch": 1.5847860538827259, "grad_norm": 0.649928936381306, "learning_rate": 3.809317454186691e-05, "loss": 0.3877, "loss_nan_ranks": 0, "loss_rank_avg": 0.3804464042186737, "step": 1000, "valid_targets_mean": 3448.9, "valid_targets_min": 1223 }, { "epoch": 1.5927099841521395, "grad_norm": 0.6846783313137514, "learning_rate": 3.8059354157179856e-05, "loss": 0.403, "loss_nan_ranks": 0, "loss_rank_avg": 0.37651345133781433, "step": 1005, "valid_targets_mean": 3401.1, "valid_targets_min": 797 }, { "epoch": 1.6006339144215531, "grad_norm": 0.7693670022399335, "learning_rate": 3.802525176078547e-05, "loss": 0.4051, "loss_nan_ranks": 0, "loss_rank_avg": 0.44831791520118713, "step": 1010, "valid_targets_mean": 2622.1, "valid_targets_min": 965 }, { "epoch": 1.6085578446909667, "grad_norm": 0.6930287612571057, "learning_rate": 3.7990867885220796e-05, "loss": 0.3903, "loss_nan_ranks": 0, "loss_rank_avg": 0.35027647018432617, "step": 1015, "valid_targets_mean": 3623.8, "valid_targets_min": 1302 }, { "epoch": 1.6164817749603804, "grad_norm": 0.687012918482246, "learning_rate": 3.7956203067418404e-05, "loss": 0.4078, "loss_nan_ranks": 0, "loss_rank_avg": 0.3655385673046112, "step": 1020, "valid_targets_mean": 3311.2, "valid_targets_min": 1444 }, { "epoch": 1.624405705229794, "grad_norm": 0.7482238561024599, "learning_rate": 3.792125784869801e-05, "loss": 0.3946, "loss_nan_ranks": 0, "loss_rank_avg": 0.4137212634086609, "step": 1025, "valid_targets_mean": 3026.4, "valid_targets_min": 1491 }, { "epoch": 1.6323296354992076, "grad_norm": 0.66746545382943, "learning_rate": 3.788603277475802e-05, "loss": 0.4134, "loss_nan_ranks": 0, "loss_rank_avg": 0.41697245836257935, "step": 1030, "valid_targets_mean": 4302.0, "valid_targets_min": 1413 }, { "epoch": 1.6402535657686212, "grad_norm": 0.753161569313501, "learning_rate": 3.785052839566701e-05, "loss": 0.3994, "loss_nan_ranks": 0, "loss_rank_avg": 0.4113873243331909, "step": 1035, "valid_targets_mean": 2856.5, "valid_targets_min": 1125 }, { "epoch": 1.6481774960380349, "grad_norm": 0.6546256771695564, "learning_rate": 3.781474526585515e-05, "loss": 0.4115, "loss_nan_ranks": 0, "loss_rank_avg": 0.394817054271698, "step": 1040, "valid_targets_mean": 3403.2, "valid_targets_min": 1422 }, { "epoch": 1.6561014263074485, "grad_norm": 0.7277585250229833, "learning_rate": 3.777868394410549e-05, "loss": 0.4284, "loss_nan_ranks": 0, "loss_rank_avg": 0.47451382875442505, "step": 1045, "valid_targets_mean": 3198.6, "valid_targets_min": 1517 }, { "epoch": 1.6640253565768621, "grad_norm": 0.7015006171574263, "learning_rate": 3.774234499354534e-05, "loss": 0.4044, "loss_nan_ranks": 0, "loss_rank_avg": 0.39788326621055603, "step": 1050, "valid_targets_mean": 3490.7, "valid_targets_min": 1153 }, { "epoch": 1.6719492868462758, "grad_norm": 0.8474760122796657, "learning_rate": 3.7705728981637356e-05, "loss": 0.4203, "loss_nan_ranks": 0, "loss_rank_avg": 0.4005127549171448, "step": 1055, "valid_targets_mean": 2430.2, "valid_targets_min": 1168 }, { "epoch": 1.6798732171156894, "grad_norm": 0.7000912329433476, "learning_rate": 3.7668836480170766e-05, "loss": 0.3809, "loss_nan_ranks": 0, "loss_rank_avg": 0.37566471099853516, "step": 1060, "valid_targets_mean": 3148.2, "valid_targets_min": 742 }, { "epoch": 1.687797147385103, "grad_norm": 0.7518484582066471, "learning_rate": 3.763166806525241e-05, "loss": 0.411, "loss_nan_ranks": 0, "loss_rank_avg": 0.4494781494140625, "step": 1065, "valid_targets_mean": 2883.8, "valid_targets_min": 949 }, { "epoch": 1.6957210776545166, "grad_norm": 0.7045093699139731, "learning_rate": 3.759422431729772e-05, "loss": 0.4124, "loss_nan_ranks": 0, "loss_rank_avg": 0.360650897026062, "step": 1070, "valid_targets_mean": 2946.6, "valid_targets_min": 1392 }, { "epoch": 1.7036450079239303, "grad_norm": 0.7676628810172328, "learning_rate": 3.7556505821021716e-05, "loss": 0.4324, "loss_nan_ranks": 0, "loss_rank_avg": 0.4218803942203522, "step": 1075, "valid_targets_mean": 2905.9, "valid_targets_min": 1305 }, { "epoch": 1.7115689381933439, "grad_norm": 0.8253811089122368, "learning_rate": 3.751851316542981e-05, "loss": 0.4057, "loss_nan_ranks": 0, "loss_rank_avg": 0.3761538863182068, "step": 1080, "valid_targets_mean": 3308.4, "valid_targets_min": 683 }, { "epoch": 1.7194928684627575, "grad_norm": 0.6654441883446629, "learning_rate": 3.748024694380864e-05, "loss": 0.4001, "loss_nan_ranks": 0, "loss_rank_avg": 0.3409106135368347, "step": 1085, "valid_targets_mean": 3397.1, "valid_targets_min": 980 }, { "epoch": 1.7274167987321711, "grad_norm": 0.6484360369162916, "learning_rate": 3.744170775371683e-05, "loss": 0.3975, "loss_nan_ranks": 0, "loss_rank_avg": 0.3883214294910431, "step": 1090, "valid_targets_mean": 3733.1, "valid_targets_min": 1168 }, { "epoch": 1.7353407290015848, "grad_norm": 0.7031281814385612, "learning_rate": 3.740289619697561e-05, "loss": 0.4089, "loss_nan_ranks": 0, "loss_rank_avg": 0.3461092710494995, "step": 1095, "valid_targets_mean": 3039.8, "valid_targets_min": 511 }, { "epoch": 1.7432646592709984, "grad_norm": 0.8032936865207325, "learning_rate": 3.736381287965943e-05, "loss": 0.4128, "loss_nan_ranks": 0, "loss_rank_avg": 0.41207650303840637, "step": 1100, "valid_targets_mean": 2640.8, "valid_targets_min": 1094 }, { "epoch": 1.751188589540412, "grad_norm": 0.7024977935027796, "learning_rate": 3.7324458412086547e-05, "loss": 0.3996, "loss_nan_ranks": 0, "loss_rank_avg": 0.4368237853050232, "step": 1105, "valid_targets_mean": 3143.6, "valid_targets_min": 1047 }, { "epoch": 1.7591125198098256, "grad_norm": 0.7123522087918879, "learning_rate": 3.728483340880939e-05, "loss": 0.3909, "loss_nan_ranks": 0, "loss_rank_avg": 0.42601120471954346, "step": 1110, "valid_targets_mean": 3299.2, "valid_targets_min": 1364 }, { "epoch": 1.7670364500792393, "grad_norm": 0.7419859314602727, "learning_rate": 3.7244938488605084e-05, "loss": 0.3934, "loss_nan_ranks": 0, "loss_rank_avg": 0.37845379114151, "step": 1115, "valid_targets_mean": 3138.9, "valid_targets_min": 956 }, { "epoch": 1.7749603803486529, "grad_norm": 0.8181546771338208, "learning_rate": 3.7204774274465694e-05, "loss": 0.382, "loss_nan_ranks": 0, "loss_rank_avg": 0.43097904324531555, "step": 1120, "valid_targets_mean": 2586.9, "valid_targets_min": 1087 }, { "epoch": 1.7828843106180665, "grad_norm": 0.6818665315017823, "learning_rate": 3.716434139358855e-05, "loss": 0.4197, "loss_nan_ranks": 0, "loss_rank_avg": 0.40882283449172974, "step": 1125, "valid_targets_mean": 3429.4, "valid_targets_min": 1192 }, { "epoch": 1.7908082408874801, "grad_norm": 0.8821106883318396, "learning_rate": 3.712364047736643e-05, "loss": 0.4063, "loss_nan_ranks": 0, "loss_rank_avg": 0.38789087533950806, "step": 1130, "valid_targets_mean": 2882.9, "valid_targets_min": 1102 }, { "epoch": 1.7987321711568938, "grad_norm": 0.6396888823145678, "learning_rate": 3.7082672161377706e-05, "loss": 0.4018, "loss_nan_ranks": 0, "loss_rank_avg": 0.375009685754776, "step": 1135, "valid_targets_mean": 3623.6, "valid_targets_min": 1434 }, { "epoch": 1.8066561014263076, "grad_norm": 0.6985921775082531, "learning_rate": 3.70414370853764e-05, "loss": 0.3961, "loss_nan_ranks": 0, "loss_rank_avg": 0.4500548243522644, "step": 1140, "valid_targets_mean": 3521.9, "valid_targets_min": 1123 }, { "epoch": 1.814580031695721, "grad_norm": 0.6528447006130813, "learning_rate": 3.6999935893282254e-05, "loss": 0.3882, "loss_nan_ranks": 0, "loss_rank_avg": 0.3747301697731018, "step": 1145, "valid_targets_mean": 3697.4, "valid_targets_min": 1239 }, { "epoch": 1.8225039619651349, "grad_norm": 0.777122366373374, "learning_rate": 3.695816923317058e-05, "loss": 0.4189, "loss_nan_ranks": 0, "loss_rank_avg": 0.3883894085884094, "step": 1150, "valid_targets_mean": 2929.1, "valid_targets_min": 1149 }, { "epoch": 1.8304278922345483, "grad_norm": 0.7469966383617292, "learning_rate": 3.691613775726223e-05, "loss": 0.3863, "loss_nan_ranks": 0, "loss_rank_avg": 0.4305916726589203, "step": 1155, "valid_targets_mean": 2614.3, "valid_targets_min": 1168 }, { "epoch": 1.8383518225039621, "grad_norm": 0.6111573888862004, "learning_rate": 3.687384212191336e-05, "loss": 0.3952, "loss_nan_ranks": 0, "loss_rank_avg": 0.3437587022781372, "step": 1160, "valid_targets_mean": 4098.4, "valid_targets_min": 926 }, { "epoch": 1.8462757527733755, "grad_norm": 0.7266326774607562, "learning_rate": 3.6831282987605185e-05, "loss": 0.4203, "loss_nan_ranks": 0, "loss_rank_avg": 0.39362356066703796, "step": 1165, "valid_targets_mean": 2666.9, "valid_targets_min": 772 }, { "epoch": 1.8541996830427894, "grad_norm": 0.8846404507919211, "learning_rate": 3.6788461018933695e-05, "loss": 0.3953, "loss_nan_ranks": 0, "loss_rank_avg": 0.37495893239974976, "step": 1170, "valid_targets_mean": 3182.8, "valid_targets_min": 1724 }, { "epoch": 1.8621236133122028, "grad_norm": 0.7579090022128943, "learning_rate": 3.674537688459924e-05, "loss": 0.3982, "loss_nan_ranks": 0, "loss_rank_avg": 0.41980457305908203, "step": 1175, "valid_targets_mean": 2550.7, "valid_targets_min": 1142 }, { "epoch": 1.8700475435816166, "grad_norm": 0.8055268692496189, "learning_rate": 3.67020312573961e-05, "loss": 0.4301, "loss_nan_ranks": 0, "loss_rank_avg": 0.4746722877025604, "step": 1180, "valid_targets_mean": 2543.4, "valid_targets_min": 1425 }, { "epoch": 1.87797147385103, "grad_norm": 0.7072175582291216, "learning_rate": 3.665842481420199e-05, "loss": 0.4094, "loss_nan_ranks": 0, "loss_rank_avg": 0.4191814064979553, "step": 1185, "valid_targets_mean": 3546.8, "valid_targets_min": 1471 }, { "epoch": 1.8858954041204439, "grad_norm": 0.755666919283838, "learning_rate": 3.661455823596749e-05, "loss": 0.4235, "loss_nan_ranks": 0, "loss_rank_avg": 0.41528838872909546, "step": 1190, "valid_targets_mean": 2681.6, "valid_targets_min": 868 }, { "epoch": 1.8938193343898573, "grad_norm": 0.6908769369919235, "learning_rate": 3.6570432207705366e-05, "loss": 0.3828, "loss_nan_ranks": 0, "loss_rank_avg": 0.39453238248825073, "step": 1195, "valid_targets_mean": 3171.2, "valid_targets_min": 807 }, { "epoch": 1.9017432646592711, "grad_norm": 0.6611245364364247, "learning_rate": 3.652604741847996e-05, "loss": 0.3746, "loss_nan_ranks": 0, "loss_rank_avg": 0.3662848472595215, "step": 1200, "valid_targets_mean": 3316.7, "valid_targets_min": 1167 }, { "epoch": 1.9096671949286845, "grad_norm": 0.5929280738291254, "learning_rate": 3.648140456139635e-05, "loss": 0.3828, "loss_nan_ranks": 0, "loss_rank_avg": 0.3568131625652313, "step": 1205, "valid_targets_mean": 3974.2, "valid_targets_min": 1544 }, { "epoch": 1.9175911251980984, "grad_norm": 0.6945487108386357, "learning_rate": 3.643650433358956e-05, "loss": 0.3976, "loss_nan_ranks": 0, "loss_rank_avg": 0.376843124628067, "step": 1210, "valid_targets_mean": 2674.7, "valid_targets_min": 1367 }, { "epoch": 1.9255150554675118, "grad_norm": 0.6712784164628189, "learning_rate": 3.639134743621368e-05, "loss": 0.4015, "loss_nan_ranks": 0, "loss_rank_avg": 0.41648247838020325, "step": 1215, "valid_targets_mean": 3261.2, "valid_targets_min": 1073 }, { "epoch": 1.9334389857369256, "grad_norm": 0.656538586479345, "learning_rate": 3.63459345744309e-05, "loss": 0.3785, "loss_nan_ranks": 0, "loss_rank_avg": 0.3585965633392334, "step": 1220, "valid_targets_mean": 3355.2, "valid_targets_min": 1300 }, { "epoch": 1.941362916006339, "grad_norm": 0.6904029377773084, "learning_rate": 3.630026645740049e-05, "loss": 0.4263, "loss_nan_ranks": 0, "loss_rank_avg": 0.4165318012237549, "step": 1225, "valid_targets_mean": 2927.4, "valid_targets_min": 1580 }, { "epoch": 1.9492868462757529, "grad_norm": 0.6679269706627182, "learning_rate": 3.625434379826777e-05, "loss": 0.4054, "loss_nan_ranks": 0, "loss_rank_avg": 0.42261233925819397, "step": 1230, "valid_targets_mean": 3125.9, "valid_targets_min": 1152 }, { "epoch": 1.9572107765451663, "grad_norm": 0.7041857593125621, "learning_rate": 3.620816731415293e-05, "loss": 0.4009, "loss_nan_ranks": 0, "loss_rank_avg": 0.4373818039894104, "step": 1235, "valid_targets_mean": 3272.8, "valid_targets_min": 852 }, { "epoch": 1.9651347068145801, "grad_norm": 0.7101332039778864, "learning_rate": 3.616173772613985e-05, "loss": 0.392, "loss_nan_ranks": 0, "loss_rank_avg": 0.35600316524505615, "step": 1240, "valid_targets_mean": 2676.8, "valid_targets_min": 1040 }, { "epoch": 1.9730586370839935, "grad_norm": 0.6634520936002515, "learning_rate": 3.611505575926482e-05, "loss": 0.4069, "loss_nan_ranks": 0, "loss_rank_avg": 0.39966195821762085, "step": 1245, "valid_targets_mean": 3331.6, "valid_targets_min": 951 }, { "epoch": 1.9809825673534074, "grad_norm": 0.6785145786730344, "learning_rate": 3.6068122142505265e-05, "loss": 0.3868, "loss_nan_ranks": 0, "loss_rank_avg": 0.38170456886291504, "step": 1250, "valid_targets_mean": 2993.2, "valid_targets_min": 1445 }, { "epoch": 1.9889064976228208, "grad_norm": 0.6316749595759299, "learning_rate": 3.602093760876831e-05, "loss": 0.3925, "loss_nan_ranks": 0, "loss_rank_avg": 0.41541820764541626, "step": 1255, "valid_targets_mean": 4683.4, "valid_targets_min": 1904 }, { "epoch": 1.9968304278922346, "grad_norm": 0.6421496174511931, "learning_rate": 3.597350289487935e-05, "loss": 0.3847, "loss_nan_ranks": 0, "loss_rank_avg": 0.3562106490135193, "step": 1260, "valid_targets_mean": 3179.0, "valid_targets_min": 804 }, { "epoch": 2.004754358161648, "grad_norm": 0.6676059687606999, "learning_rate": 3.5925818741570566e-05, "loss": 0.3712, "loss_nan_ranks": 0, "loss_rank_avg": 0.2841273546218872, "step": 1265, "valid_targets_mean": 3497.7, "valid_targets_min": 1563 }, { "epoch": 2.012678288431062, "grad_norm": 0.7062366601502383, "learning_rate": 3.587788589346932e-05, "loss": 0.3875, "loss_nan_ranks": 0, "loss_rank_avg": 0.3702091574668884, "step": 1270, "valid_targets_mean": 3476.4, "valid_targets_min": 904 }, { "epoch": 2.0206022187004753, "grad_norm": 0.7515066065460074, "learning_rate": 3.5829705099086586e-05, "loss": 0.355, "loss_nan_ranks": 0, "loss_rank_avg": 0.3285125494003296, "step": 1275, "valid_targets_mean": 3045.9, "valid_targets_min": 967 }, { "epoch": 2.028526148969889, "grad_norm": 0.6511406045365554, "learning_rate": 3.578127711080517e-05, "loss": 0.3331, "loss_nan_ranks": 0, "loss_rank_avg": 0.32423993945121765, "step": 1280, "valid_targets_mean": 3313.9, "valid_targets_min": 1218 }, { "epoch": 2.0364500792393025, "grad_norm": 0.6629925563372985, "learning_rate": 3.5732602684868065e-05, "loss": 0.3337, "loss_nan_ranks": 0, "loss_rank_avg": 0.35224616527557373, "step": 1285, "valid_targets_mean": 3352.9, "valid_targets_min": 945 }, { "epoch": 2.0443740095087164, "grad_norm": 0.6852450135475233, "learning_rate": 3.568368258136657e-05, "loss": 0.3384, "loss_nan_ranks": 0, "loss_rank_avg": 0.35313695669174194, "step": 1290, "valid_targets_mean": 3369.9, "valid_targets_min": 778 }, { "epoch": 2.05229793977813, "grad_norm": 0.6804763117304029, "learning_rate": 3.563451756422843e-05, "loss": 0.3536, "loss_nan_ranks": 0, "loss_rank_avg": 0.3494824171066284, "step": 1295, "valid_targets_mean": 3336.2, "valid_targets_min": 1403 }, { "epoch": 2.0602218700475436, "grad_norm": 0.7451628554485628, "learning_rate": 3.558510840120594e-05, "loss": 0.3825, "loss_nan_ranks": 0, "loss_rank_avg": 0.4016644358634949, "step": 1300, "valid_targets_mean": 3308.9, "valid_targets_min": 1237 }, { "epoch": 2.068145800316957, "grad_norm": 0.7479732131470967, "learning_rate": 3.553545586386392e-05, "loss": 0.3744, "loss_nan_ranks": 0, "loss_rank_avg": 0.3414376974105835, "step": 1305, "valid_targets_mean": 3150.8, "valid_targets_min": 929 }, { "epoch": 2.076069730586371, "grad_norm": 0.6039441228458018, "learning_rate": 3.5485560727567686e-05, "loss": 0.365, "loss_nan_ranks": 0, "loss_rank_avg": 0.3465012311935425, "step": 1310, "valid_targets_mean": 3960.5, "valid_targets_min": 1781 }, { "epoch": 2.0839936608557843, "grad_norm": 0.7773497361755427, "learning_rate": 3.543542377147093e-05, "loss": 0.3727, "loss_nan_ranks": 0, "loss_rank_avg": 0.37093955278396606, "step": 1315, "valid_targets_mean": 2705.9, "valid_targets_min": 1477 }, { "epoch": 2.091917591125198, "grad_norm": 0.7862507036909796, "learning_rate": 3.5385045778503574e-05, "loss": 0.3685, "loss_nan_ranks": 0, "loss_rank_avg": 0.4063432216644287, "step": 1320, "valid_targets_mean": 2707.6, "valid_targets_min": 1327 }, { "epoch": 2.0998415213946116, "grad_norm": 0.9375539482705244, "learning_rate": 3.533442753535952e-05, "loss": 0.3756, "loss_nan_ranks": 0, "loss_rank_avg": 0.35002627968788147, "step": 1325, "valid_targets_mean": 3312.0, "valid_targets_min": 1131 }, { "epoch": 2.1077654516640254, "grad_norm": 0.7318154628229018, "learning_rate": 3.528356983248438e-05, "loss": 0.3599, "loss_nan_ranks": 0, "loss_rank_avg": 0.35978320240974426, "step": 1330, "valid_targets_mean": 2899.5, "valid_targets_min": 1433 }, { "epoch": 2.115689381933439, "grad_norm": 0.696363310675273, "learning_rate": 3.523247346406311e-05, "loss": 0.3605, "loss_nan_ranks": 0, "loss_rank_avg": 0.32494083046913147, "step": 1335, "valid_targets_mean": 3550.9, "valid_targets_min": 1021 }, { "epoch": 2.1236133122028527, "grad_norm": 0.8237973354896262, "learning_rate": 3.518113922800765e-05, "loss": 0.3506, "loss_nan_ranks": 0, "loss_rank_avg": 0.35818031430244446, "step": 1340, "valid_targets_mean": 3031.8, "valid_targets_min": 673 }, { "epoch": 2.131537242472266, "grad_norm": 0.66311971156985, "learning_rate": 3.512956792594442e-05, "loss": 0.3584, "loss_nan_ranks": 0, "loss_rank_avg": 0.36689960956573486, "step": 1345, "valid_targets_mean": 3550.8, "valid_targets_min": 950 }, { "epoch": 2.13946117274168, "grad_norm": 0.8721689360378009, "learning_rate": 3.5077760363201835e-05, "loss": 0.3464, "loss_nan_ranks": 0, "loss_rank_avg": 0.385911762714386, "step": 1350, "valid_targets_mean": 2141.8, "valid_targets_min": 953 }, { "epoch": 2.1473851030110933, "grad_norm": 0.6726564862719653, "learning_rate": 3.50257173487977e-05, "loss": 0.3566, "loss_nan_ranks": 0, "loss_rank_avg": 0.3518974184989929, "step": 1355, "valid_targets_mean": 3165.7, "valid_targets_min": 1298 }, { "epoch": 2.155309033280507, "grad_norm": 0.8591285613969092, "learning_rate": 3.4973439695426606e-05, "loss": 0.366, "loss_nan_ranks": 0, "loss_rank_avg": 0.4314518868923187, "step": 1360, "valid_targets_mean": 2363.4, "valid_targets_min": 1010 }, { "epoch": 2.1632329635499206, "grad_norm": 0.6640118779055022, "learning_rate": 3.492092821944722e-05, "loss": 0.3556, "loss_nan_ranks": 0, "loss_rank_avg": 0.3326745629310608, "step": 1365, "valid_targets_mean": 3621.4, "valid_targets_min": 1238 }, { "epoch": 2.1711568938193344, "grad_norm": 0.7418113772849524, "learning_rate": 3.4868183740869544e-05, "loss": 0.3692, "loss_nan_ranks": 0, "loss_rank_avg": 0.3442697525024414, "step": 1370, "valid_targets_mean": 2723.8, "valid_targets_min": 1171 }, { "epoch": 2.179080824088748, "grad_norm": 0.7504301461052274, "learning_rate": 3.48152070833421e-05, "loss": 0.3793, "loss_nan_ranks": 0, "loss_rank_avg": 0.36825960874557495, "step": 1375, "valid_targets_mean": 2962.6, "valid_targets_min": 1328 }, { "epoch": 2.1870047543581617, "grad_norm": 0.8957004442452282, "learning_rate": 3.476199907413909e-05, "loss": 0.3878, "loss_nan_ranks": 0, "loss_rank_avg": 0.412288099527359, "step": 1380, "valid_targets_mean": 2568.7, "valid_targets_min": 1206 }, { "epoch": 2.194928684627575, "grad_norm": 0.7694928144436127, "learning_rate": 3.4708560544147435e-05, "loss": 0.3805, "loss_nan_ranks": 0, "loss_rank_avg": 0.4149361252784729, "step": 1385, "valid_targets_mean": 2675.1, "valid_targets_min": 1219 }, { "epoch": 2.202852614896989, "grad_norm": 0.7389166507314462, "learning_rate": 3.465489232785388e-05, "loss": 0.3659, "loss_nan_ranks": 0, "loss_rank_avg": 0.32906919717788696, "step": 1390, "valid_targets_mean": 2730.8, "valid_targets_min": 1188 }, { "epoch": 2.2107765451664028, "grad_norm": 0.79731266620094, "learning_rate": 3.460099526333184e-05, "loss": 0.3801, "loss_nan_ranks": 0, "loss_rank_avg": 0.34242305159568787, "step": 1395, "valid_targets_mean": 2235.1, "valid_targets_min": 982 }, { "epoch": 2.218700475435816, "grad_norm": 0.7176220862553758, "learning_rate": 3.4546870192228446e-05, "loss": 0.3528, "loss_nan_ranks": 0, "loss_rank_avg": 0.36401069164276123, "step": 1400, "valid_targets_mean": 3310.4, "valid_targets_min": 1168 }, { "epoch": 2.2266244057052296, "grad_norm": 0.6300501071926575, "learning_rate": 3.449251795975132e-05, "loss": 0.4117, "loss_nan_ranks": 0, "loss_rank_avg": 0.3608476519584656, "step": 1405, "valid_targets_mean": 3842.1, "valid_targets_min": 1080 }, { "epoch": 2.2345483359746434, "grad_norm": 0.6586933639077392, "learning_rate": 3.4437939414655375e-05, "loss": 0.3457, "loss_nan_ranks": 0, "loss_rank_avg": 0.29544296860694885, "step": 1410, "valid_targets_mean": 2897.9, "valid_targets_min": 992 }, { "epoch": 2.2424722662440573, "grad_norm": 0.747007744021972, "learning_rate": 3.438313540922961e-05, "loss": 0.3768, "loss_nan_ranks": 0, "loss_rank_avg": 0.378732293844223, "step": 1415, "valid_targets_mean": 2782.6, "valid_targets_min": 1405 }, { "epoch": 2.2503961965134707, "grad_norm": 0.8127811072244645, "learning_rate": 3.432810679928376e-05, "loss": 0.3929, "loss_nan_ranks": 0, "loss_rank_avg": 0.4382305145263672, "step": 1420, "valid_targets_mean": 2800.4, "valid_targets_min": 1318 }, { "epoch": 2.258320126782884, "grad_norm": 0.7157439338354276, "learning_rate": 3.427285444413495e-05, "loss": 0.3528, "loss_nan_ranks": 0, "loss_rank_avg": 0.3332955241203308, "step": 1425, "valid_targets_mean": 3116.9, "valid_targets_min": 1673 }, { "epoch": 2.266244057052298, "grad_norm": 0.6962204553743823, "learning_rate": 3.421737920659427e-05, "loss": 0.349, "loss_nan_ranks": 0, "loss_rank_avg": 0.32148024439811707, "step": 1430, "valid_targets_mean": 2878.9, "valid_targets_min": 871 }, { "epoch": 2.2741679873217118, "grad_norm": 0.713354512987655, "learning_rate": 3.416168195295329e-05, "loss": 0.3591, "loss_nan_ranks": 0, "loss_rank_avg": 0.3718951940536499, "step": 1435, "valid_targets_mean": 3088.2, "valid_targets_min": 1342 }, { "epoch": 2.282091917591125, "grad_norm": 0.7008120501571135, "learning_rate": 3.410576355297056e-05, "loss": 0.3556, "loss_nan_ranks": 0, "loss_rank_avg": 0.33514919877052307, "step": 1440, "valid_targets_mean": 2861.1, "valid_targets_min": 1199 }, { "epoch": 2.2900158478605386, "grad_norm": 0.806299441185959, "learning_rate": 3.404962487985801e-05, "loss": 0.3668, "loss_nan_ranks": 0, "loss_rank_avg": 0.3846312463283539, "step": 1445, "valid_targets_mean": 2405.8, "valid_targets_min": 831 }, { "epoch": 2.2979397781299524, "grad_norm": 0.761461112866616, "learning_rate": 3.399326681026731e-05, "loss": 0.3669, "loss_nan_ranks": 0, "loss_rank_avg": 0.38813963532447815, "step": 1450, "valid_targets_mean": 2826.6, "valid_targets_min": 1430 }, { "epoch": 2.3058637083993663, "grad_norm": 0.9191487962494499, "learning_rate": 3.3936690224276194e-05, "loss": 0.3761, "loss_nan_ranks": 0, "loss_rank_avg": 0.4349742531776428, "step": 1455, "valid_targets_mean": 2471.1, "valid_targets_min": 809 }, { "epoch": 2.3137876386687797, "grad_norm": 0.6867460029163497, "learning_rate": 3.3879896005374705e-05, "loss": 0.3772, "loss_nan_ranks": 0, "loss_rank_avg": 0.3719336986541748, "step": 1460, "valid_targets_mean": 3600.1, "valid_targets_min": 640 }, { "epoch": 2.3217115689381935, "grad_norm": 0.7140439142369251, "learning_rate": 3.382288504045141e-05, "loss": 0.355, "loss_nan_ranks": 0, "loss_rank_avg": 0.3862805962562561, "step": 1465, "valid_targets_mean": 3404.2, "valid_targets_min": 434 }, { "epoch": 2.329635499207607, "grad_norm": 0.845295556326319, "learning_rate": 3.3765658219779537e-05, "loss": 0.3683, "loss_nan_ranks": 0, "loss_rank_avg": 0.39049577713012695, "step": 1470, "valid_targets_mean": 2238.2, "valid_targets_min": 767 }, { "epoch": 2.337559429477021, "grad_norm": 0.6210399121619489, "learning_rate": 3.370821643700307e-05, "loss": 0.3559, "loss_nan_ranks": 0, "loss_rank_avg": 0.34238991141319275, "step": 1475, "valid_targets_mean": 3526.3, "valid_targets_min": 1052 }, { "epoch": 2.345483359746434, "grad_norm": 0.670480766135351, "learning_rate": 3.365056058912282e-05, "loss": 0.383, "loss_nan_ranks": 0, "loss_rank_avg": 0.33082759380340576, "step": 1480, "valid_targets_mean": 3321.8, "valid_targets_min": 1409 }, { "epoch": 2.353407290015848, "grad_norm": 0.6766348332163563, "learning_rate": 3.3592691576482414e-05, "loss": 0.3559, "loss_nan_ranks": 0, "loss_rank_avg": 0.3270394206047058, "step": 1485, "valid_targets_mean": 3748.6, "valid_targets_min": 1485 }, { "epoch": 2.3613312202852614, "grad_norm": 0.7949053191718662, "learning_rate": 3.353461030275418e-05, "loss": 0.3774, "loss_nan_ranks": 0, "loss_rank_avg": 0.3639070391654968, "step": 1490, "valid_targets_mean": 3388.0, "valid_targets_min": 623 }, { "epoch": 2.3692551505546753, "grad_norm": 0.7129315145411875, "learning_rate": 3.3476317674925126e-05, "loss": 0.3551, "loss_nan_ranks": 0, "loss_rank_avg": 0.3307371735572815, "step": 1495, "valid_targets_mean": 3125.2, "valid_targets_min": 1123 }, { "epoch": 2.3771790808240887, "grad_norm": 0.7319999465255304, "learning_rate": 3.341781460328267e-05, "loss": 0.3705, "loss_nan_ranks": 0, "loss_rank_avg": 0.3839896619319916, "step": 1500, "valid_targets_mean": 2962.8, "valid_targets_min": 1040 }, { "epoch": 2.3851030110935025, "grad_norm": 0.7492489121406776, "learning_rate": 3.3359102001400555e-05, "loss": 0.3741, "loss_nan_ranks": 0, "loss_rank_avg": 0.3603183627128601, "step": 1505, "valid_targets_mean": 2949.4, "valid_targets_min": 605 }, { "epoch": 2.393026941362916, "grad_norm": 0.7950258446330948, "learning_rate": 3.330018078612446e-05, "loss": 0.3737, "loss_nan_ranks": 0, "loss_rank_avg": 0.37683820724487305, "step": 1510, "valid_targets_mean": 2834.4, "valid_targets_min": 916 }, { "epoch": 2.40095087163233, "grad_norm": 0.8185064986671969, "learning_rate": 3.324105187755775e-05, "loss": 0.3676, "loss_nan_ranks": 0, "loss_rank_avg": 0.38336193561553955, "step": 1515, "valid_targets_mean": 2173.2, "valid_targets_min": 1103 }, { "epoch": 2.408874801901743, "grad_norm": 0.6460844220432804, "learning_rate": 3.318171619904709e-05, "loss": 0.3755, "loss_nan_ranks": 0, "loss_rank_avg": 0.34656602144241333, "step": 1520, "valid_targets_mean": 3330.8, "valid_targets_min": 1132 }, { "epoch": 2.416798732171157, "grad_norm": 0.6942145163373754, "learning_rate": 3.3122174677168027e-05, "loss": 0.3627, "loss_nan_ranks": 0, "loss_rank_avg": 0.392851322889328, "step": 1525, "valid_targets_mean": 3246.0, "valid_targets_min": 305 }, { "epoch": 2.4247226624405704, "grad_norm": 0.6507292400611256, "learning_rate": 3.306242824171053e-05, "loss": 0.3824, "loss_nan_ranks": 0, "loss_rank_avg": 0.38254374265670776, "step": 1530, "valid_targets_mean": 3621.5, "valid_targets_min": 1123 }, { "epoch": 2.4326465927099843, "grad_norm": 0.7278179160659652, "learning_rate": 3.300247782566445e-05, "loss": 0.3678, "loss_nan_ranks": 0, "loss_rank_avg": 0.3891586661338806, "step": 1535, "valid_targets_mean": 3476.8, "valid_targets_min": 1357 }, { "epoch": 2.4405705229793977, "grad_norm": 0.6983942948833125, "learning_rate": 3.294232436520499e-05, "loss": 0.3463, "loss_nan_ranks": 0, "loss_rank_avg": 0.33123183250427246, "step": 1540, "valid_targets_mean": 3465.1, "valid_targets_min": 1288 }, { "epoch": 2.4484944532488115, "grad_norm": 0.6594224791344621, "learning_rate": 3.288196879967801e-05, "loss": 0.3684, "loss_nan_ranks": 0, "loss_rank_avg": 0.38076046109199524, "step": 1545, "valid_targets_mean": 3734.8, "valid_targets_min": 1161 }, { "epoch": 2.456418383518225, "grad_norm": 0.7471632828891966, "learning_rate": 3.282141207158546e-05, "loss": 0.3683, "loss_nan_ranks": 0, "loss_rank_avg": 0.3740571141242981, "step": 1550, "valid_targets_mean": 3052.6, "valid_targets_min": 1220 }, { "epoch": 2.464342313787639, "grad_norm": 0.7075053052011875, "learning_rate": 3.276065512657058e-05, "loss": 0.3705, "loss_nan_ranks": 0, "loss_rank_avg": 0.3714832663536072, "step": 1555, "valid_targets_mean": 3095.8, "valid_targets_min": 1603 }, { "epoch": 2.472266244057052, "grad_norm": 0.7245176872705255, "learning_rate": 3.269969891340315e-05, "loss": 0.3577, "loss_nan_ranks": 0, "loss_rank_avg": 0.3616369664669037, "step": 1560, "valid_targets_mean": 3465.4, "valid_targets_min": 911 }, { "epoch": 2.480190174326466, "grad_norm": 0.707650235922073, "learning_rate": 3.263854438396473e-05, "loss": 0.3522, "loss_nan_ranks": 0, "loss_rank_avg": 0.3539058268070221, "step": 1565, "valid_targets_mean": 3309.2, "valid_targets_min": 1521 }, { "epoch": 2.4881141045958794, "grad_norm": 0.7349689198868826, "learning_rate": 3.257719249323371e-05, "loss": 0.3602, "loss_nan_ranks": 0, "loss_rank_avg": 0.37612348794937134, "step": 1570, "valid_targets_mean": 2882.0, "valid_targets_min": 1184 }, { "epoch": 2.4960380348652933, "grad_norm": 0.9170986597030537, "learning_rate": 3.251564419927046e-05, "loss": 0.3602, "loss_nan_ranks": 0, "loss_rank_avg": 0.39871150255203247, "step": 1575, "valid_targets_mean": 2766.1, "valid_targets_min": 1338 }, { "epoch": 2.5039619651347067, "grad_norm": 0.6961153396437054, "learning_rate": 3.245390046320234e-05, "loss": 0.3558, "loss_nan_ranks": 0, "loss_rank_avg": 0.3306850492954254, "step": 1580, "valid_targets_mean": 3363.3, "valid_targets_min": 1641 }, { "epoch": 2.5118858954041206, "grad_norm": 0.695789931766822, "learning_rate": 3.239196224920873e-05, "loss": 0.3481, "loss_nan_ranks": 0, "loss_rank_avg": 0.37488996982574463, "step": 1585, "valid_targets_mean": 3035.2, "valid_targets_min": 969 }, { "epoch": 2.519809825673534, "grad_norm": 0.7571853645906732, "learning_rate": 3.232983052450588e-05, "loss": 0.3649, "loss_nan_ranks": 0, "loss_rank_avg": 0.3629456162452698, "step": 1590, "valid_targets_mean": 2581.4, "valid_targets_min": 1175 }, { "epoch": 2.527733755942948, "grad_norm": 0.7703230366613334, "learning_rate": 3.2267506259331936e-05, "loss": 0.398, "loss_nan_ranks": 0, "loss_rank_avg": 0.4350147843360901, "step": 1595, "valid_targets_mean": 2874.7, "valid_targets_min": 1122 }, { "epoch": 2.535657686212361, "grad_norm": 0.6346611462613172, "learning_rate": 3.220499042693167e-05, "loss": 0.3724, "loss_nan_ranks": 0, "loss_rank_avg": 0.34332937002182007, "step": 1600, "valid_targets_mean": 3585.5, "valid_targets_min": 1364 }, { "epoch": 2.543581616481775, "grad_norm": 0.8006448514494869, "learning_rate": 3.214228400354137e-05, "loss": 0.3751, "loss_nan_ranks": 0, "loss_rank_avg": 0.40395885705947876, "step": 1605, "valid_targets_mean": 3247.1, "valid_targets_min": 1270 }, { "epoch": 2.5515055467511885, "grad_norm": 0.7559604723688351, "learning_rate": 3.207938796837354e-05, "loss": 0.3904, "loss_nan_ranks": 0, "loss_rank_avg": 0.37246257066726685, "step": 1610, "valid_targets_mean": 2641.6, "valid_targets_min": 1071 }, { "epoch": 2.5594294770206023, "grad_norm": 0.7353157217889033, "learning_rate": 3.201630330360165e-05, "loss": 0.3588, "loss_nan_ranks": 0, "loss_rank_avg": 0.3442043662071228, "step": 1615, "valid_targets_mean": 2777.2, "valid_targets_min": 1471 }, { "epoch": 2.5673534072900157, "grad_norm": 0.720107392698628, "learning_rate": 3.195303099434474e-05, "loss": 0.3699, "loss_nan_ranks": 0, "loss_rank_avg": 0.41481178998947144, "step": 1620, "valid_targets_mean": 3245.4, "valid_targets_min": 954 }, { "epoch": 2.5752773375594296, "grad_norm": 0.776231256992938, "learning_rate": 3.1889572028652106e-05, "loss": 0.368, "loss_nan_ranks": 0, "loss_rank_avg": 0.36978304386138916, "step": 1625, "valid_targets_mean": 2458.1, "valid_targets_min": 1103 }, { "epoch": 2.583201267828843, "grad_norm": 0.6657358034169792, "learning_rate": 3.182592739748783e-05, "loss": 0.3534, "loss_nan_ranks": 0, "loss_rank_avg": 0.37111061811447144, "step": 1630, "valid_targets_mean": 3370.6, "valid_targets_min": 1365 }, { "epoch": 2.591125198098257, "grad_norm": 0.6712733739184077, "learning_rate": 3.17620980947153e-05, "loss": 0.3615, "loss_nan_ranks": 0, "loss_rank_avg": 0.34165388345718384, "step": 1635, "valid_targets_mean": 3146.2, "valid_targets_min": 1259 }, { "epoch": 2.59904912836767, "grad_norm": 0.8228340893308538, "learning_rate": 3.1698085117081725e-05, "loss": 0.3741, "loss_nan_ranks": 0, "loss_rank_avg": 0.4077662229537964, "step": 1640, "valid_targets_mean": 2459.1, "valid_targets_min": 719 }, { "epoch": 2.606973058637084, "grad_norm": 0.7144944121446368, "learning_rate": 3.163388946420253e-05, "loss": 0.3697, "loss_nan_ranks": 0, "loss_rank_avg": 0.37951573729515076, "step": 1645, "valid_targets_mean": 2752.9, "valid_targets_min": 1282 }, { "epoch": 2.6148969889064975, "grad_norm": 0.8614676246761742, "learning_rate": 3.156951213854578e-05, "loss": 0.3758, "loss_nan_ranks": 0, "loss_rank_avg": 0.3518531024456024, "step": 1650, "valid_targets_mean": 3622.9, "valid_targets_min": 1274 }, { "epoch": 2.6228209191759113, "grad_norm": 0.6797007118760665, "learning_rate": 3.1504954145416494e-05, "loss": 0.3624, "loss_nan_ranks": 0, "loss_rank_avg": 0.354215145111084, "step": 1655, "valid_targets_mean": 3218.9, "valid_targets_min": 1131 }, { "epoch": 2.6307448494453247, "grad_norm": 0.6901202480893878, "learning_rate": 3.144021649294096e-05, "loss": 0.3741, "loss_nan_ranks": 0, "loss_rank_avg": 0.36378616094589233, "step": 1660, "valid_targets_mean": 3135.1, "valid_targets_min": 1197 }, { "epoch": 2.6386687797147386, "grad_norm": 0.72642791007056, "learning_rate": 3.137530019205104e-05, "loss": 0.3402, "loss_nan_ranks": 0, "loss_rank_avg": 0.3361148238182068, "step": 1665, "valid_targets_mean": 3140.4, "valid_targets_min": 1078 }, { "epoch": 2.6465927099841524, "grad_norm": 0.736512606598198, "learning_rate": 3.131020625646827e-05, "loss": 0.3533, "loss_nan_ranks": 0, "loss_rank_avg": 0.36432206630706787, "step": 1670, "valid_targets_mean": 2840.2, "valid_targets_min": 1376 }, { "epoch": 2.654516640253566, "grad_norm": 0.7161092212114627, "learning_rate": 3.124493570268815e-05, "loss": 0.3697, "loss_nan_ranks": 0, "loss_rank_avg": 0.384030282497406, "step": 1675, "valid_targets_mean": 3557.6, "valid_targets_min": 1364 }, { "epoch": 2.662440570522979, "grad_norm": 0.6866773135599233, "learning_rate": 3.117948954996419e-05, "loss": 0.3485, "loss_nan_ranks": 0, "loss_rank_avg": 0.3353482186794281, "step": 1680, "valid_targets_mean": 3323.8, "valid_targets_min": 1241 }, { "epoch": 2.670364500792393, "grad_norm": 0.7214323381715583, "learning_rate": 3.111386882029205e-05, "loss": 0.3557, "loss_nan_ranks": 0, "loss_rank_avg": 0.3556535243988037, "step": 1685, "valid_targets_mean": 2939.8, "valid_targets_min": 465 }, { "epoch": 2.678288431061807, "grad_norm": 0.7532775358119311, "learning_rate": 3.1048074538393515e-05, "loss": 0.3705, "loss_nan_ranks": 0, "loss_rank_avg": 0.3484819531440735, "step": 1690, "valid_targets_mean": 2753.2, "valid_targets_min": 926 }, { "epoch": 2.6862123613312203, "grad_norm": 0.7196890582839597, "learning_rate": 3.098210773170057e-05, "loss": 0.3674, "loss_nan_ranks": 0, "loss_rank_avg": 0.39478743076324463, "step": 1695, "valid_targets_mean": 3182.8, "valid_targets_min": 1825 }, { "epoch": 2.6941362916006337, "grad_norm": 0.6412851439845717, "learning_rate": 3.0915969430339285e-05, "loss": 0.3788, "loss_nan_ranks": 0, "loss_rank_avg": 0.4072532057762146, "step": 1700, "valid_targets_mean": 3858.4, "valid_targets_min": 1152 }, { "epoch": 2.7020602218700476, "grad_norm": 0.8200510450598304, "learning_rate": 3.0849660667113785e-05, "loss": 0.3806, "loss_nan_ranks": 0, "loss_rank_avg": 0.4585651159286499, "step": 1705, "valid_targets_mean": 2658.2, "valid_targets_min": 949 }, { "epoch": 2.7099841521394614, "grad_norm": 0.8199512586359826, "learning_rate": 3.078318247749009e-05, "loss": 0.3819, "loss_nan_ranks": 0, "loss_rank_avg": 0.43864548206329346, "step": 1710, "valid_targets_mean": 2758.8, "valid_targets_min": 805 }, { "epoch": 2.717908082408875, "grad_norm": 0.7912495090847645, "learning_rate": 3.0716535899579936e-05, "loss": 0.3429, "loss_nan_ranks": 0, "loss_rank_avg": 0.3498538136482239, "step": 1715, "valid_targets_mean": 2157.8, "valid_targets_min": 926 }, { "epoch": 2.7258320126782882, "grad_norm": 0.5876938155418893, "learning_rate": 3.0649721974124606e-05, "loss": 0.3544, "loss_nan_ranks": 0, "loss_rank_avg": 0.32150182127952576, "step": 1720, "valid_targets_mean": 3719.1, "valid_targets_min": 883 }, { "epoch": 2.733755942947702, "grad_norm": 0.877583762546389, "learning_rate": 3.058274174447864e-05, "loss": 0.3744, "loss_nan_ranks": 0, "loss_rank_avg": 0.39479172229766846, "step": 1725, "valid_targets_mean": 2071.7, "valid_targets_min": 994 }, { "epoch": 2.741679873217116, "grad_norm": 0.6592647942561869, "learning_rate": 3.0515596256593566e-05, "loss": 0.335, "loss_nan_ranks": 0, "loss_rank_avg": 0.32501962780952454, "step": 1730, "valid_targets_mean": 3369.1, "valid_targets_min": 1144 }, { "epoch": 2.7496038034865293, "grad_norm": 0.7657355885140038, "learning_rate": 3.044828655900153e-05, "loss": 0.3834, "loss_nan_ranks": 0, "loss_rank_avg": 0.3660418391227722, "step": 1735, "valid_targets_mean": 2924.8, "valid_targets_min": 1083 }, { "epoch": 2.7575277337559427, "grad_norm": 0.7593994147389292, "learning_rate": 3.0380813702798975e-05, "loss": 0.3765, "loss_nan_ranks": 0, "loss_rank_avg": 0.38318681716918945, "step": 1740, "valid_targets_mean": 2862.4, "valid_targets_min": 923 }, { "epoch": 2.7654516640253566, "grad_norm": 0.8032261353715695, "learning_rate": 3.0313178741630193e-05, "loss": 0.3775, "loss_nan_ranks": 0, "loss_rank_avg": 0.4111163914203644, "step": 1745, "valid_targets_mean": 2419.5, "valid_targets_min": 845 }, { "epoch": 2.7733755942947704, "grad_norm": 0.7917662706861506, "learning_rate": 3.0245382731670872e-05, "loss": 0.3603, "loss_nan_ranks": 0, "loss_rank_avg": 0.40242886543273926, "step": 1750, "valid_targets_mean": 2851.2, "valid_targets_min": 824 }, { "epoch": 2.781299524564184, "grad_norm": 0.6994549455580847, "learning_rate": 3.017742673161161e-05, "loss": 0.3694, "loss_nan_ranks": 0, "loss_rank_avg": 0.36322033405303955, "step": 1755, "valid_targets_mean": 3588.1, "valid_targets_min": 680 }, { "epoch": 2.7892234548335972, "grad_norm": 0.6902449352365942, "learning_rate": 3.0109311802641394e-05, "loss": 0.3745, "loss_nan_ranks": 0, "loss_rank_avg": 0.3887173533439636, "step": 1760, "valid_targets_mean": 3538.9, "valid_targets_min": 1645 }, { "epoch": 2.797147385103011, "grad_norm": 0.6572463116289267, "learning_rate": 3.0041039008431006e-05, "loss": 0.3456, "loss_nan_ranks": 0, "loss_rank_avg": 0.3245548605918884, "step": 1765, "valid_targets_mean": 3434.0, "valid_targets_min": 1483 }, { "epoch": 2.805071315372425, "grad_norm": 0.7520916361470656, "learning_rate": 2.9972609415116424e-05, "loss": 0.3595, "loss_nan_ranks": 0, "loss_rank_avg": 0.36480066180229187, "step": 1770, "valid_targets_mean": 2674.7, "valid_targets_min": 1341 }, { "epoch": 2.8129952456418383, "grad_norm": 0.7013146155031664, "learning_rate": 2.990402409128218e-05, "loss": 0.3546, "loss_nan_ranks": 0, "loss_rank_avg": 0.3468988239765167, "step": 1775, "valid_targets_mean": 3095.1, "valid_targets_min": 1131 }, { "epoch": 2.8209191759112517, "grad_norm": 0.8604280966015914, "learning_rate": 2.983528410794466e-05, "loss": 0.3695, "loss_nan_ranks": 0, "loss_rank_avg": 0.36563342809677124, "step": 1780, "valid_targets_mean": 2494.7, "valid_targets_min": 875 }, { "epoch": 2.8288431061806656, "grad_norm": 0.8186766988561371, "learning_rate": 2.9766390538535382e-05, "loss": 0.3649, "loss_nan_ranks": 0, "loss_rank_avg": 0.3959285318851471, "step": 1785, "valid_targets_mean": 2253.1, "valid_targets_min": 907 }, { "epoch": 2.8367670364500794, "grad_norm": 0.9075815131643683, "learning_rate": 2.9697344458884265e-05, "loss": 0.3545, "loss_nan_ranks": 0, "loss_rank_avg": 0.34358176589012146, "step": 1790, "valid_targets_mean": 2338.9, "valid_targets_min": 1106 }, { "epoch": 2.844690966719493, "grad_norm": 0.7043856446767114, "learning_rate": 2.9628146947202756e-05, "loss": 0.365, "loss_nan_ranks": 0, "loss_rank_avg": 0.354300856590271, "step": 1795, "valid_targets_mean": 3277.2, "valid_targets_min": 1262 }, { "epoch": 2.8526148969889062, "grad_norm": 0.7370078841642661, "learning_rate": 2.9558799084067074e-05, "loss": 0.3718, "loss_nan_ranks": 0, "loss_rank_avg": 0.38159167766571045, "step": 1800, "valid_targets_mean": 2703.7, "valid_targets_min": 1027 }, { "epoch": 2.86053882725832, "grad_norm": 0.6990022019648595, "learning_rate": 2.9489301952401286e-05, "loss": 0.3522, "loss_nan_ranks": 0, "loss_rank_avg": 0.3276500403881073, "step": 1805, "valid_targets_mean": 3995.8, "valid_targets_min": 675 }, { "epoch": 2.868462757527734, "grad_norm": 0.6638533677079017, "learning_rate": 2.9419656637460413e-05, "loss": 0.3624, "loss_nan_ranks": 0, "loss_rank_avg": 0.3156994581222534, "step": 1810, "valid_targets_mean": 3012.8, "valid_targets_min": 699 }, { "epoch": 2.8763866877971473, "grad_norm": 0.650719515262378, "learning_rate": 2.9349864226813475e-05, "loss": 0.3402, "loss_nan_ranks": 0, "loss_rank_avg": 0.3329174518585205, "step": 1815, "valid_targets_mean": 3597.6, "valid_targets_min": 1418 }, { "epoch": 2.8843106180665607, "grad_norm": 0.7687174401357069, "learning_rate": 2.9279925810326516e-05, "loss": 0.343, "loss_nan_ranks": 0, "loss_rank_avg": 0.37216711044311523, "step": 1820, "valid_targets_mean": 3317.2, "valid_targets_min": 1141 }, { "epoch": 2.8922345483359746, "grad_norm": 0.6216599334752763, "learning_rate": 2.9209842480145587e-05, "loss": 0.359, "loss_nan_ranks": 0, "loss_rank_avg": 0.3306935429573059, "step": 1825, "valid_targets_mean": 3728.8, "valid_targets_min": 1048 }, { "epoch": 2.9001584786053884, "grad_norm": 0.7206089378146915, "learning_rate": 2.913961533067968e-05, "loss": 0.362, "loss_nan_ranks": 0, "loss_rank_avg": 0.34333550930023193, "step": 1830, "valid_targets_mean": 3466.3, "valid_targets_min": 1167 }, { "epoch": 2.908082408874802, "grad_norm": 0.7578107255518666, "learning_rate": 2.906924545858364e-05, "loss": 0.371, "loss_nan_ranks": 0, "loss_rank_avg": 0.3424595296382904, "step": 1835, "valid_targets_mean": 2490.8, "valid_targets_min": 805 }, { "epoch": 2.9160063391442153, "grad_norm": 0.7453104444181963, "learning_rate": 2.8998733962741057e-05, "loss": 0.3613, "loss_nan_ranks": 0, "loss_rank_avg": 0.3626144528388977, "step": 1840, "valid_targets_mean": 2894.9, "valid_targets_min": 1095 }, { "epoch": 2.923930269413629, "grad_norm": 0.7718015723542487, "learning_rate": 2.8928081944247088e-05, "loss": 0.3627, "loss_nan_ranks": 0, "loss_rank_avg": 0.3860081732273102, "step": 1845, "valid_targets_mean": 3889.6, "valid_targets_min": 823 }, { "epoch": 2.931854199683043, "grad_norm": 0.7045879397030554, "learning_rate": 2.8857290506391243e-05, "loss": 0.3724, "loss_nan_ranks": 0, "loss_rank_avg": 0.36101579666137695, "step": 1850, "valid_targets_mean": 2874.3, "valid_targets_min": 1195 }, { "epoch": 2.9397781299524564, "grad_norm": 0.717984417244567, "learning_rate": 2.8786360754640213e-05, "loss": 0.3374, "loss_nan_ranks": 0, "loss_rank_avg": 0.34760263562202454, "step": 1855, "valid_targets_mean": 2920.6, "valid_targets_min": 1236 }, { "epoch": 2.94770206022187, "grad_norm": 0.6640139889083639, "learning_rate": 2.8715293796620565e-05, "loss": 0.3623, "loss_nan_ranks": 0, "loss_rank_avg": 0.4223308265209198, "step": 1860, "valid_targets_mean": 3860.2, "valid_targets_min": 1403 }, { "epoch": 2.9556259904912836, "grad_norm": 0.6392198399783302, "learning_rate": 2.8644090742101444e-05, "loss": 0.3495, "loss_nan_ranks": 0, "loss_rank_avg": 0.32980644702911377, "step": 1865, "valid_targets_mean": 3921.6, "valid_targets_min": 1156 }, { "epoch": 2.9635499207606975, "grad_norm": 0.6870381101356648, "learning_rate": 2.8572752702977265e-05, "loss": 0.3692, "loss_nan_ranks": 0, "loss_rank_avg": 0.3842689096927643, "step": 1870, "valid_targets_mean": 3652.7, "valid_targets_min": 1219 }, { "epoch": 2.971473851030111, "grad_norm": 0.8762796489016127, "learning_rate": 2.8501280793250343e-05, "loss": 0.3851, "loss_nan_ranks": 0, "loss_rank_avg": 0.41141873598098755, "step": 1875, "valid_targets_mean": 2225.3, "valid_targets_min": 1208 }, { "epoch": 2.9793977812995247, "grad_norm": 0.8115620338836479, "learning_rate": 2.8429676129013476e-05, "loss": 0.3629, "loss_nan_ranks": 0, "loss_rank_avg": 0.3620631694793701, "step": 1880, "valid_targets_mean": 2161.6, "valid_targets_min": 850 }, { "epoch": 2.987321711568938, "grad_norm": 0.7750980053703787, "learning_rate": 2.835793982843255e-05, "loss": 0.3818, "loss_nan_ranks": 0, "loss_rank_avg": 0.373153418302536, "step": 1885, "valid_targets_mean": 2862.1, "valid_targets_min": 967 }, { "epoch": 2.995245641838352, "grad_norm": 0.7322316673204433, "learning_rate": 2.8286073011729044e-05, "loss": 0.3654, "loss_nan_ranks": 0, "loss_rank_avg": 0.3833129405975342, "step": 1890, "valid_targets_mean": 3081.8, "valid_targets_min": 1661 }, { "epoch": 3.0031695721077654, "grad_norm": 0.6065227488494328, "learning_rate": 2.8214076801162575e-05, "loss": 0.3712, "loss_nan_ranks": 0, "loss_rank_avg": 0.34482842683792114, "step": 1895, "valid_targets_mean": 3981.5, "valid_targets_min": 1418 }, { "epoch": 3.011093502377179, "grad_norm": 0.6901979613206464, "learning_rate": 2.814195232101334e-05, "loss": 0.3455, "loss_nan_ranks": 0, "loss_rank_avg": 0.35832148790359497, "step": 1900, "valid_targets_mean": 3975.4, "valid_targets_min": 1122 }, { "epoch": 3.0190174326465926, "grad_norm": 0.7186510353720049, "learning_rate": 2.806970069756456e-05, "loss": 0.3123, "loss_nan_ranks": 0, "loss_rank_avg": 0.30415624380111694, "step": 1905, "valid_targets_mean": 3198.1, "valid_targets_min": 957 }, { "epoch": 3.0269413629160065, "grad_norm": 0.6882830013798815, "learning_rate": 2.7997323059084926e-05, "loss": 0.331, "loss_nan_ranks": 0, "loss_rank_avg": 0.30928438901901245, "step": 1910, "valid_targets_mean": 3419.6, "valid_targets_min": 1590 }, { "epoch": 3.03486529318542, "grad_norm": 0.7774880183981414, "learning_rate": 2.7924820535810947e-05, "loss": 0.3444, "loss_nan_ranks": 0, "loss_rank_avg": 0.3439940810203552, "step": 1915, "valid_targets_mean": 2875.5, "valid_targets_min": 742 }, { "epoch": 3.0427892234548337, "grad_norm": 0.7838015454420495, "learning_rate": 2.7852194259929306e-05, "loss": 0.3104, "loss_nan_ranks": 0, "loss_rank_avg": 0.3384024500846863, "step": 1920, "valid_targets_mean": 3003.9, "valid_targets_min": 988 }, { "epoch": 3.050713153724247, "grad_norm": 0.7416290199481121, "learning_rate": 2.7779445365559196e-05, "loss": 0.3243, "loss_nan_ranks": 0, "loss_rank_avg": 0.35700756311416626, "step": 1925, "valid_targets_mean": 3207.6, "valid_targets_min": 987 }, { "epoch": 3.058637083993661, "grad_norm": 0.7414194431448803, "learning_rate": 2.7706574988734596e-05, "loss": 0.3458, "loss_nan_ranks": 0, "loss_rank_avg": 0.35844355821609497, "step": 1930, "valid_targets_mean": 3496.2, "valid_targets_min": 1326 }, { "epoch": 3.0665610142630744, "grad_norm": 0.7113811917186736, "learning_rate": 2.7633584267386518e-05, "loss": 0.3272, "loss_nan_ranks": 0, "loss_rank_avg": 0.29518628120422363, "step": 1935, "valid_targets_mean": 3124.2, "valid_targets_min": 680 }, { "epoch": 3.074484944532488, "grad_norm": 0.8314704271197847, "learning_rate": 2.7560474341325276e-05, "loss": 0.3374, "loss_nan_ranks": 0, "loss_rank_avg": 0.3693086504936218, "step": 1940, "valid_targets_mean": 2553.4, "valid_targets_min": 956 }, { "epoch": 3.0824088748019016, "grad_norm": 0.7863210609659544, "learning_rate": 2.7487246352222648e-05, "loss": 0.3264, "loss_nan_ranks": 0, "loss_rank_avg": 0.29878532886505127, "step": 1945, "valid_targets_mean": 2444.7, "valid_targets_min": 672 }, { "epoch": 3.0903328050713155, "grad_norm": 0.7257330134496905, "learning_rate": 2.7413901443594073e-05, "loss": 0.3155, "loss_nan_ranks": 0, "loss_rank_avg": 0.30191296339035034, "step": 1950, "valid_targets_mean": 3476.1, "valid_targets_min": 1206 }, { "epoch": 3.098256735340729, "grad_norm": 0.8065297599365323, "learning_rate": 2.7340440760780778e-05, "loss": 0.3474, "loss_nan_ranks": 0, "loss_rank_avg": 0.32383155822753906, "step": 1955, "valid_targets_mean": 2889.2, "valid_targets_min": 929 }, { "epoch": 3.1061806656101427, "grad_norm": 0.712007666432261, "learning_rate": 2.7266865450931907e-05, "loss": 0.3263, "loss_nan_ranks": 0, "loss_rank_avg": 0.3361831307411194, "step": 1960, "valid_targets_mean": 3199.6, "valid_targets_min": 1270 }, { "epoch": 3.114104595879556, "grad_norm": 0.7794712083869874, "learning_rate": 2.7193176662986593e-05, "loss": 0.333, "loss_nan_ranks": 0, "loss_rank_avg": 0.3365066647529602, "step": 1965, "valid_targets_mean": 2549.4, "valid_targets_min": 989 }, { "epoch": 3.12202852614897, "grad_norm": 0.8498632060188069, "learning_rate": 2.7119375547656025e-05, "loss": 0.3367, "loss_nan_ranks": 0, "loss_rank_avg": 0.34931614995002747, "step": 1970, "valid_targets_mean": 2771.6, "valid_targets_min": 1096 }, { "epoch": 3.1299524564183834, "grad_norm": 0.7075486291042362, "learning_rate": 2.704546325740548e-05, "loss": 0.3357, "loss_nan_ranks": 0, "loss_rank_avg": 0.31514453887939453, "step": 1975, "valid_targets_mean": 3283.4, "valid_targets_min": 904 }, { "epoch": 3.1378763866877972, "grad_norm": 0.8262903637467062, "learning_rate": 2.6971440946436306e-05, "loss": 0.333, "loss_nan_ranks": 0, "loss_rank_avg": 0.3372984528541565, "step": 1980, "valid_targets_mean": 2639.2, "valid_targets_min": 1053 }, { "epoch": 3.1458003169572106, "grad_norm": 0.6978216538446294, "learning_rate": 2.689730977066795e-05, "loss": 0.3226, "loss_nan_ranks": 0, "loss_rank_avg": 0.3109763264656067, "step": 1985, "valid_targets_mean": 3200.6, "valid_targets_min": 860 }, { "epoch": 3.1537242472266245, "grad_norm": 0.740783802930712, "learning_rate": 2.682307088771984e-05, "loss": 0.3259, "loss_nan_ranks": 0, "loss_rank_avg": 0.35412776470184326, "step": 1990, "valid_targets_mean": 3045.1, "valid_targets_min": 998 }, { "epoch": 3.161648177496038, "grad_norm": 0.8656214600333869, "learning_rate": 2.6748725456893355e-05, "loss": 0.3307, "loss_nan_ranks": 0, "loss_rank_avg": 0.32956281304359436, "step": 1995, "valid_targets_mean": 2030.4, "valid_targets_min": 968 }, { "epoch": 3.1695721077654517, "grad_norm": 0.7377230964997741, "learning_rate": 2.66742746391537e-05, "loss": 0.3513, "loss_nan_ranks": 0, "loss_rank_avg": 0.3444298505783081, "step": 2000, "valid_targets_mean": 3455.4, "valid_targets_min": 1280 }, { "epoch": 3.177496038034865, "grad_norm": 0.7541796485264278, "learning_rate": 2.6599719597111794e-05, "loss": 0.3545, "loss_nan_ranks": 0, "loss_rank_avg": 0.3887772560119629, "step": 2005, "valid_targets_mean": 3408.1, "valid_targets_min": 1341 }, { "epoch": 3.185419968304279, "grad_norm": 0.7815456449009791, "learning_rate": 2.6525061495006103e-05, "loss": 0.3181, "loss_nan_ranks": 0, "loss_rank_avg": 0.3660275936126709, "step": 2010, "valid_targets_mean": 3231.4, "valid_targets_min": 1124 }, { "epoch": 3.1933438985736924, "grad_norm": 0.6900245267272553, "learning_rate": 2.6450301498684443e-05, "loss": 0.3291, "loss_nan_ranks": 0, "loss_rank_avg": 0.34687238931655884, "step": 2015, "valid_targets_mean": 3574.1, "valid_targets_min": 1302 }, { "epoch": 3.2012678288431062, "grad_norm": 0.7549001056433992, "learning_rate": 2.637544077558581e-05, "loss": 0.332, "loss_nan_ranks": 0, "loss_rank_avg": 0.3526916205883026, "step": 2020, "valid_targets_mean": 3198.1, "valid_targets_min": 1741 }, { "epoch": 3.2091917591125196, "grad_norm": 0.7851430991597503, "learning_rate": 2.630048049472213e-05, "loss": 0.3377, "loss_nan_ranks": 0, "loss_rank_avg": 0.3379470705986023, "step": 2025, "valid_targets_mean": 2515.5, "valid_targets_min": 323 }, { "epoch": 3.2171156893819335, "grad_norm": 0.7004928403794375, "learning_rate": 2.622542182666e-05, "loss": 0.3213, "loss_nan_ranks": 0, "loss_rank_avg": 0.32637515664100647, "step": 2030, "valid_targets_mean": 3517.1, "valid_targets_min": 1042 }, { "epoch": 3.225039619651347, "grad_norm": 0.7764554104098883, "learning_rate": 2.6150265943502424e-05, "loss": 0.3364, "loss_nan_ranks": 0, "loss_rank_avg": 0.3583545684814453, "step": 2035, "valid_targets_mean": 2765.4, "valid_targets_min": 881 }, { "epoch": 3.2329635499207607, "grad_norm": 0.6465157812209109, "learning_rate": 2.6075014018870483e-05, "loss": 0.3167, "loss_nan_ranks": 0, "loss_rank_avg": 0.3526315689086914, "step": 2040, "valid_targets_mean": 4235.4, "valid_targets_min": 1086 }, { "epoch": 3.240887480190174, "grad_norm": 0.706625007326448, "learning_rate": 2.599966722788504e-05, "loss": 0.3069, "loss_nan_ranks": 0, "loss_rank_avg": 0.2997731566429138, "step": 2045, "valid_targets_mean": 3172.4, "valid_targets_min": 1201 }, { "epoch": 3.248811410459588, "grad_norm": 0.7850578365104528, "learning_rate": 2.5924226747148372e-05, "loss": 0.3402, "loss_nan_ranks": 0, "loss_rank_avg": 0.30590397119522095, "step": 2050, "valid_targets_mean": 2757.9, "valid_targets_min": 1061 }, { "epoch": 3.2567353407290014, "grad_norm": 0.6518087609710441, "learning_rate": 2.584869375472579e-05, "loss": 0.3183, "loss_nan_ranks": 0, "loss_rank_avg": 0.29854464530944824, "step": 2055, "valid_targets_mean": 3279.2, "valid_targets_min": 1107 }, { "epoch": 3.2646592709984152, "grad_norm": 0.822500398616075, "learning_rate": 2.577306943012725e-05, "loss": 0.3181, "loss_nan_ranks": 0, "loss_rank_avg": 0.34053948521614075, "step": 2060, "valid_targets_mean": 2633.9, "valid_targets_min": 1317 }, { "epoch": 3.272583201267829, "grad_norm": 0.8125115262492077, "learning_rate": 2.569735495428896e-05, "loss": 0.3259, "loss_nan_ranks": 0, "loss_rank_avg": 0.32668331265449524, "step": 2065, "valid_targets_mean": 2618.7, "valid_targets_min": 786 }, { "epoch": 3.2805071315372425, "grad_norm": 1.4959208602319205, "learning_rate": 2.562155150955488e-05, "loss": 0.3161, "loss_nan_ranks": 0, "loss_rank_avg": 0.3204629421234131, "step": 2070, "valid_targets_mean": 2665.9, "valid_targets_min": 1262 }, { "epoch": 3.288431061806656, "grad_norm": 0.611048992859609, "learning_rate": 2.554566027965832e-05, "loss": 0.3336, "loss_nan_ranks": 0, "loss_rank_avg": 0.2836368680000305, "step": 2075, "valid_targets_mean": 4082.5, "valid_targets_min": 1157 }, { "epoch": 3.2963549920760697, "grad_norm": 0.7774858963866713, "learning_rate": 2.5469682449703414e-05, "loss": 0.3378, "loss_nan_ranks": 0, "loss_rank_avg": 0.3361954689025879, "step": 2080, "valid_targets_mean": 2990.8, "valid_targets_min": 644 }, { "epoch": 3.3042789223454836, "grad_norm": 0.8182618562206451, "learning_rate": 2.539361920614662e-05, "loss": 0.3471, "loss_nan_ranks": 0, "loss_rank_avg": 0.3528863191604614, "step": 2085, "valid_targets_mean": 2776.4, "valid_targets_min": 1167 }, { "epoch": 3.312202852614897, "grad_norm": 0.7286378347810851, "learning_rate": 2.5317471736778226e-05, "loss": 0.3348, "loss_nan_ranks": 0, "loss_rank_avg": 0.3281998038291931, "step": 2090, "valid_targets_mean": 3044.1, "valid_targets_min": 592 }, { "epoch": 3.3201267828843104, "grad_norm": 0.5916476860001847, "learning_rate": 2.524124123070375e-05, "loss": 0.318, "loss_nan_ranks": 0, "loss_rank_avg": 0.27134382724761963, "step": 2095, "valid_targets_mean": 4022.4, "valid_targets_min": 836 }, { "epoch": 3.3280507131537242, "grad_norm": 0.8344841361605951, "learning_rate": 2.5164928878325404e-05, "loss": 0.3251, "loss_nan_ranks": 0, "loss_rank_avg": 0.33823129534721375, "step": 2100, "valid_targets_mean": 2500.5, "valid_targets_min": 1030 }, { "epoch": 3.335974643423138, "grad_norm": 0.7080563566881553, "learning_rate": 2.5088535871323502e-05, "loss": 0.3245, "loss_nan_ranks": 0, "loss_rank_avg": 0.3264184594154358, "step": 2105, "valid_targets_mean": 3250.5, "valid_targets_min": 1023 }, { "epoch": 3.3438985736925515, "grad_norm": 0.7908723696589502, "learning_rate": 2.5012063402637843e-05, "loss": 0.3421, "loss_nan_ranks": 0, "loss_rank_avg": 0.35519134998321533, "step": 2110, "valid_targets_mean": 2987.3, "valid_targets_min": 1241 }, { "epoch": 3.351822503961965, "grad_norm": 0.70839207204405, "learning_rate": 2.4935512666449085e-05, "loss": 0.3188, "loss_nan_ranks": 0, "loss_rank_avg": 0.31166577339172363, "step": 2115, "valid_targets_mean": 3060.3, "valid_targets_min": 746 }, { "epoch": 3.3597464342313788, "grad_norm": 0.7933084485897915, "learning_rate": 2.4858884858160107e-05, "loss": 0.3242, "loss_nan_ranks": 0, "loss_rank_avg": 0.3538547158241272, "step": 2120, "valid_targets_mean": 3038.3, "valid_targets_min": 1106 }, { "epoch": 3.3676703645007926, "grad_norm": 0.7663074843622576, "learning_rate": 2.4782181174377314e-05, "loss": 0.3354, "loss_nan_ranks": 0, "loss_rank_avg": 0.352549284696579, "step": 2125, "valid_targets_mean": 3099.4, "valid_targets_min": 1095 }, { "epoch": 3.375594294770206, "grad_norm": 0.7138476967374972, "learning_rate": 2.470540281289199e-05, "loss": 0.3422, "loss_nan_ranks": 0, "loss_rank_avg": 0.33138760924339294, "step": 2130, "valid_targets_mean": 2867.1, "valid_targets_min": 1311 }, { "epoch": 3.3835182250396194, "grad_norm": 0.6633701832610104, "learning_rate": 2.4628550972661557e-05, "loss": 0.324, "loss_nan_ranks": 0, "loss_rank_avg": 0.30286821722984314, "step": 2135, "valid_targets_mean": 3736.6, "valid_targets_min": 1535 }, { "epoch": 3.3914421553090333, "grad_norm": 0.7181119752621806, "learning_rate": 2.455162685379087e-05, "loss": 0.3212, "loss_nan_ranks": 0, "loss_rank_avg": 0.3247692286968231, "step": 2140, "valid_targets_mean": 3933.5, "valid_targets_min": 1455 }, { "epoch": 3.399366085578447, "grad_norm": 0.58939690424488, "learning_rate": 2.447463165751349e-05, "loss": 0.3236, "loss_nan_ranks": 0, "loss_rank_avg": 0.28043270111083984, "step": 2145, "valid_targets_mean": 4510.4, "valid_targets_min": 1619 }, { "epoch": 3.4072900158478605, "grad_norm": 0.6905860534611378, "learning_rate": 2.4397566586172883e-05, "loss": 0.3479, "loss_nan_ranks": 0, "loss_rank_avg": 0.31197258830070496, "step": 2150, "valid_targets_mean": 3251.9, "valid_targets_min": 1084 }, { "epoch": 3.4152139461172744, "grad_norm": 0.7543811037179319, "learning_rate": 2.4320432843203704e-05, "loss": 0.3337, "loss_nan_ranks": 0, "loss_rank_avg": 0.33104807138442993, "step": 2155, "valid_targets_mean": 2821.9, "valid_targets_min": 1396 }, { "epoch": 3.4231378763866878, "grad_norm": 0.7618177630066788, "learning_rate": 2.4243231633112943e-05, "loss": 0.3461, "loss_nan_ranks": 0, "loss_rank_avg": 0.33463001251220703, "step": 2160, "valid_targets_mean": 3083.6, "valid_targets_min": 1252 }, { "epoch": 3.4310618066561016, "grad_norm": 0.7273682305306333, "learning_rate": 2.4165964161461167e-05, "loss": 0.3177, "loss_nan_ranks": 0, "loss_rank_avg": 0.34640154242515564, "step": 2165, "valid_targets_mean": 3702.2, "valid_targets_min": 1381 }, { "epoch": 3.438985736925515, "grad_norm": 0.6923581076598425, "learning_rate": 2.408863163484366e-05, "loss": 0.332, "loss_nan_ranks": 0, "loss_rank_avg": 0.33265140652656555, "step": 2170, "valid_targets_mean": 3575.5, "valid_targets_min": 605 }, { "epoch": 3.446909667194929, "grad_norm": 0.7329934998169874, "learning_rate": 2.401123526087159e-05, "loss": 0.319, "loss_nan_ranks": 0, "loss_rank_avg": 0.3211047947406769, "step": 2175, "valid_targets_mean": 3020.9, "valid_targets_min": 1398 }, { "epoch": 3.4548335974643423, "grad_norm": 0.6822054946764609, "learning_rate": 2.3933776248153168e-05, "loss": 0.3332, "loss_nan_ranks": 0, "loss_rank_avg": 0.3279761075973511, "step": 2180, "valid_targets_mean": 3455.0, "valid_targets_min": 1277 }, { "epoch": 3.462757527733756, "grad_norm": 0.6616693352625908, "learning_rate": 2.385625580627474e-05, "loss": 0.3282, "loss_nan_ranks": 0, "loss_rank_avg": 0.3381684124469757, "step": 2185, "valid_targets_mean": 3872.2, "valid_targets_min": 1192 }, { "epoch": 3.4706814580031695, "grad_norm": 0.7741372802839244, "learning_rate": 2.377867514578194e-05, "loss": 0.3361, "loss_nan_ranks": 0, "loss_rank_avg": 0.3979116678237915, "step": 2190, "valid_targets_mean": 3336.3, "valid_targets_min": 997 }, { "epoch": 3.4786053882725834, "grad_norm": 0.7070236701033044, "learning_rate": 2.3701035478160763e-05, "loss": 0.349, "loss_nan_ranks": 0, "loss_rank_avg": 0.35837632417678833, "step": 2195, "valid_targets_mean": 3782.2, "valid_targets_min": 1485 }, { "epoch": 3.4865293185419968, "grad_norm": 0.7494594936521863, "learning_rate": 2.3623338015818623e-05, "loss": 0.3357, "loss_nan_ranks": 0, "loss_rank_avg": 0.3438400626182556, "step": 2200, "valid_targets_mean": 2959.6, "valid_targets_min": 663 }, { "epoch": 3.4944532488114106, "grad_norm": 0.6937608768005562, "learning_rate": 2.3545583972065484e-05, "loss": 0.3342, "loss_nan_ranks": 0, "loss_rank_avg": 0.3017534911632538, "step": 2205, "valid_targets_mean": 3185.6, "valid_targets_min": 900 }, { "epoch": 3.502377179080824, "grad_norm": 0.6888295505753116, "learning_rate": 2.346777456109485e-05, "loss": 0.3277, "loss_nan_ranks": 0, "loss_rank_avg": 0.26715266704559326, "step": 2210, "valid_targets_mean": 2821.8, "valid_targets_min": 944 }, { "epoch": 3.510301109350238, "grad_norm": 0.7118241028505115, "learning_rate": 2.3389910997964832e-05, "loss": 0.3335, "loss_nan_ranks": 0, "loss_rank_avg": 0.3349294066429138, "step": 2215, "valid_targets_mean": 3142.1, "valid_targets_min": 1146 }, { "epoch": 3.5182250396196513, "grad_norm": 0.7278682132311887, "learning_rate": 2.3311994498579185e-05, "loss": 0.331, "loss_nan_ranks": 0, "loss_rank_avg": 0.29668980836868286, "step": 2220, "valid_targets_mean": 3287.6, "valid_targets_min": 1218 }, { "epoch": 3.526148969889065, "grad_norm": 0.6941142765146813, "learning_rate": 2.3234026279668296e-05, "loss": 0.3326, "loss_nan_ranks": 0, "loss_rank_avg": 0.3018149733543396, "step": 2225, "valid_targets_mean": 3132.2, "valid_targets_min": 852 }, { "epoch": 3.5340729001584785, "grad_norm": 0.740242823338274, "learning_rate": 2.3156007558770192e-05, "loss": 0.3254, "loss_nan_ranks": 0, "loss_rank_avg": 0.31529009342193604, "step": 2230, "valid_targets_mean": 2922.2, "valid_targets_min": 1057 }, { "epoch": 3.5419968304278924, "grad_norm": 0.8523972449816457, "learning_rate": 2.307793955421154e-05, "loss": 0.3331, "loss_nan_ranks": 0, "loss_rank_avg": 0.3462240397930145, "step": 2235, "valid_targets_mean": 2572.6, "valid_targets_min": 951 }, { "epoch": 3.5499207606973058, "grad_norm": 0.7990562745382495, "learning_rate": 2.299982348508861e-05, "loss": 0.3536, "loss_nan_ranks": 0, "loss_rank_avg": 0.3121604025363922, "step": 2240, "valid_targets_mean": 2908.9, "valid_targets_min": 1118 }, { "epoch": 3.5578446909667196, "grad_norm": 0.6945315665088014, "learning_rate": 2.2921660571248237e-05, "loss": 0.3353, "loss_nan_ranks": 0, "loss_rank_avg": 0.33167335391044617, "step": 2245, "valid_targets_mean": 3621.6, "valid_targets_min": 881 }, { "epoch": 3.565768621236133, "grad_norm": 0.6731796035427767, "learning_rate": 2.2843452033268775e-05, "loss": 0.3364, "loss_nan_ranks": 0, "loss_rank_avg": 0.30071955919265747, "step": 2250, "valid_targets_mean": 3450.9, "valid_targets_min": 1051 }, { "epoch": 3.573692551505547, "grad_norm": 0.8546792122499989, "learning_rate": 2.2765199092441033e-05, "loss": 0.3335, "loss_nan_ranks": 0, "loss_rank_avg": 0.39534080028533936, "step": 2255, "valid_targets_mean": 2804.2, "valid_targets_min": 1371 }, { "epoch": 3.5816164817749603, "grad_norm": 0.8037548712670296, "learning_rate": 2.2686902970749218e-05, "loss": 0.3326, "loss_nan_ranks": 0, "loss_rank_avg": 0.354625940322876, "step": 2260, "valid_targets_mean": 2839.2, "valid_targets_min": 1273 }, { "epoch": 3.589540412044374, "grad_norm": 0.7463842550414609, "learning_rate": 2.260856489085183e-05, "loss": 0.3363, "loss_nan_ranks": 0, "loss_rank_avg": 0.3454499840736389, "step": 2265, "valid_targets_mean": 2875.6, "valid_targets_min": 1522 }, { "epoch": 3.5974643423137875, "grad_norm": 0.7214338181235017, "learning_rate": 2.2530186076062588e-05, "loss": 0.3408, "loss_nan_ranks": 0, "loss_rank_avg": 0.32981571555137634, "step": 2270, "valid_targets_mean": 3369.8, "valid_targets_min": 1324 }, { "epoch": 3.6053882725832014, "grad_norm": 0.7266954380266903, "learning_rate": 2.2451767750331316e-05, "loss": 0.3105, "loss_nan_ranks": 0, "loss_rank_avg": 0.3404169976711273, "step": 2275, "valid_targets_mean": 3491.8, "valid_targets_min": 1001 }, { "epoch": 3.613312202852615, "grad_norm": 0.7418997208137097, "learning_rate": 2.2373311138224838e-05, "loss": 0.3089, "loss_nan_ranks": 0, "loss_rank_avg": 0.31640252470970154, "step": 2280, "valid_targets_mean": 2498.8, "valid_targets_min": 901 }, { "epoch": 3.6212361331220286, "grad_norm": 0.7680111061901961, "learning_rate": 2.2294817464907852e-05, "loss": 0.3274, "loss_nan_ranks": 0, "loss_rank_avg": 0.3239263594150543, "step": 2285, "valid_targets_mean": 2514.9, "valid_targets_min": 1517 }, { "epoch": 3.629160063391442, "grad_norm": 0.6982918820606155, "learning_rate": 2.221628795612379e-05, "loss": 0.3313, "loss_nan_ranks": 0, "loss_rank_avg": 0.32979482412338257, "step": 2290, "valid_targets_mean": 3441.3, "valid_targets_min": 1224 }, { "epoch": 3.637083993660856, "grad_norm": 0.7261379689885271, "learning_rate": 2.2137723838175693e-05, "loss": 0.319, "loss_nan_ranks": 0, "loss_rank_avg": 0.3410705327987671, "step": 2295, "valid_targets_mean": 2833.8, "valid_targets_min": 1138 }, { "epoch": 3.6450079239302693, "grad_norm": 0.7535963960315106, "learning_rate": 2.205912633790704e-05, "loss": 0.3461, "loss_nan_ranks": 0, "loss_rank_avg": 0.323788583278656, "step": 2300, "valid_targets_mean": 2891.2, "valid_targets_min": 1241 }, { "epoch": 3.652931854199683, "grad_norm": 0.6969204879397259, "learning_rate": 2.198049668268262e-05, "loss": 0.3284, "loss_nan_ranks": 0, "loss_rank_avg": 0.3207600712776184, "step": 2305, "valid_targets_mean": 3219.8, "valid_targets_min": 1444 }, { "epoch": 3.6608557844690965, "grad_norm": 0.887306839014218, "learning_rate": 2.1901836100369335e-05, "loss": 0.3317, "loss_nan_ranks": 0, "loss_rank_avg": 0.33578261733055115, "step": 2310, "valid_targets_mean": 2205.1, "valid_targets_min": 906 }, { "epoch": 3.6687797147385104, "grad_norm": 0.9750572459180453, "learning_rate": 2.1823145819317048e-05, "loss": 0.3365, "loss_nan_ranks": 0, "loss_rank_avg": 0.35123610496520996, "step": 2315, "valid_targets_mean": 2695.4, "valid_targets_min": 1084 }, { "epoch": 3.676703645007924, "grad_norm": 0.7780709496343529, "learning_rate": 2.174442706833938e-05, "loss": 0.3361, "loss_nan_ranks": 0, "loss_rank_avg": 0.3519875109195709, "step": 2320, "valid_targets_mean": 2882.0, "valid_targets_min": 807 }, { "epoch": 3.6846275752773376, "grad_norm": 0.7243496238272615, "learning_rate": 2.1665681076694544e-05, "loss": 0.3247, "loss_nan_ranks": 0, "loss_rank_avg": 0.31398969888687134, "step": 2325, "valid_targets_mean": 2690.4, "valid_targets_min": 732 }, { "epoch": 3.692551505546751, "grad_norm": 0.7526736641692691, "learning_rate": 2.1586909074066136e-05, "loss": 0.3462, "loss_nan_ranks": 0, "loss_rank_avg": 0.34414851665496826, "step": 2330, "valid_targets_mean": 3210.9, "valid_targets_min": 1143 }, { "epoch": 3.700475435816165, "grad_norm": 0.7452110101075897, "learning_rate": 2.1508112290543933e-05, "loss": 0.3447, "loss_nan_ranks": 0, "loss_rank_avg": 0.3227662742137909, "step": 2335, "valid_targets_mean": 3213.6, "valid_targets_min": 1032 }, { "epoch": 3.7083993660855783, "grad_norm": 0.7854460633468776, "learning_rate": 2.142929195660469e-05, "loss": 0.3344, "loss_nan_ranks": 0, "loss_rank_avg": 0.34010860323905945, "step": 2340, "valid_targets_mean": 2676.4, "valid_targets_min": 933 }, { "epoch": 3.716323296354992, "grad_norm": 0.6656721032192763, "learning_rate": 2.1350449303092917e-05, "loss": 0.3187, "loss_nan_ranks": 0, "loss_rank_avg": 0.29363691806793213, "step": 2345, "valid_targets_mean": 3574.9, "valid_targets_min": 1262 }, { "epoch": 3.7242472266244055, "grad_norm": 0.7337377728820911, "learning_rate": 2.1271585561201666e-05, "loss": 0.3281, "loss_nan_ranks": 0, "loss_rank_avg": 0.4165416359901428, "step": 2350, "valid_targets_mean": 3303.0, "valid_targets_min": 1199 }, { "epoch": 3.7321711568938194, "grad_norm": 0.6641092113281405, "learning_rate": 2.1192701962453296e-05, "loss": 0.3324, "loss_nan_ranks": 0, "loss_rank_avg": 0.30195552110671997, "step": 2355, "valid_targets_mean": 3354.2, "valid_targets_min": 916 }, { "epoch": 3.740095087163233, "grad_norm": 0.5875766220259515, "learning_rate": 2.1113799738680254e-05, "loss": 0.3162, "loss_nan_ranks": 0, "loss_rank_avg": 0.31163403391838074, "step": 2360, "valid_targets_mean": 4143.1, "valid_targets_min": 1838 }, { "epoch": 3.7480190174326466, "grad_norm": 0.717473872317517, "learning_rate": 2.103488012200583e-05, "loss": 0.3333, "loss_nan_ranks": 0, "loss_rank_avg": 0.35403263568878174, "step": 2365, "valid_targets_mean": 3673.4, "valid_targets_min": 1188 }, { "epoch": 3.75594294770206, "grad_norm": 0.7708312139810358, "learning_rate": 2.095594434482491e-05, "loss": 0.3194, "loss_nan_ranks": 0, "loss_rank_avg": 0.33274000883102417, "step": 2370, "valid_targets_mean": 3095.4, "valid_targets_min": 1461 }, { "epoch": 3.763866877971474, "grad_norm": 0.6215656666692516, "learning_rate": 2.0876993639784752e-05, "loss": 0.3578, "loss_nan_ranks": 0, "loss_rank_avg": 0.3734382092952728, "step": 2375, "valid_targets_mean": 4395.7, "valid_targets_min": 1069 }, { "epoch": 3.7717908082408877, "grad_norm": 0.696852480633942, "learning_rate": 2.0798029239765722e-05, "loss": 0.3409, "loss_nan_ranks": 0, "loss_rank_avg": 0.31851282715797424, "step": 2380, "valid_targets_mean": 3874.2, "valid_targets_min": 1802 }, { "epoch": 3.779714738510301, "grad_norm": 0.6951396595704138, "learning_rate": 2.0719052377862033e-05, "loss": 0.3278, "loss_nan_ranks": 0, "loss_rank_avg": 0.32077187299728394, "step": 2385, "valid_targets_mean": 3521.0, "valid_targets_min": 1390 }, { "epoch": 3.7876386687797146, "grad_norm": 0.7195020532275461, "learning_rate": 2.0640064287362525e-05, "loss": 0.326, "loss_nan_ranks": 0, "loss_rank_avg": 0.3314870297908783, "step": 2390, "valid_targets_mean": 3229.4, "valid_targets_min": 1289 }, { "epoch": 3.7955625990491284, "grad_norm": 0.8180751679396766, "learning_rate": 2.056106620173135e-05, "loss": 0.3336, "loss_nan_ranks": 0, "loss_rank_avg": 0.3853730857372284, "step": 2395, "valid_targets_mean": 2613.6, "valid_targets_min": 1336 }, { "epoch": 3.8034865293185423, "grad_norm": 0.733730511080735, "learning_rate": 2.048205935458877e-05, "loss": 0.326, "loss_nan_ranks": 0, "loss_rank_avg": 0.32132023572921753, "step": 2400, "valid_targets_mean": 3179.6, "valid_targets_min": 1221 }, { "epoch": 3.8114104595879557, "grad_norm": 0.6134570576672795, "learning_rate": 2.0403044979691854e-05, "loss": 0.3082, "loss_nan_ranks": 0, "loss_rank_avg": 0.28578662872314453, "step": 2405, "valid_targets_mean": 3837.6, "valid_targets_min": 1304 }, { "epoch": 3.819334389857369, "grad_norm": 0.7635018637295181, "learning_rate": 2.032402431091522e-05, "loss": 0.3451, "loss_nan_ranks": 0, "loss_rank_avg": 0.31944137811660767, "step": 2410, "valid_targets_mean": 2599.2, "valid_targets_min": 1296 }, { "epoch": 3.827258320126783, "grad_norm": 0.7372264488783937, "learning_rate": 2.0244998582231767e-05, "loss": 0.3408, "loss_nan_ranks": 0, "loss_rank_avg": 0.3162527084350586, "step": 2415, "valid_targets_mean": 2805.4, "valid_targets_min": 1464 }, { "epoch": 3.8351822503961968, "grad_norm": 0.6531551753056782, "learning_rate": 2.0165969027693425e-05, "loss": 0.3353, "loss_nan_ranks": 0, "loss_rank_avg": 0.3599008321762085, "step": 2420, "valid_targets_mean": 4002.8, "valid_targets_min": 1494 }, { "epoch": 3.84310618066561, "grad_norm": 0.8353501525186963, "learning_rate": 2.008693688141185e-05, "loss": 0.3313, "loss_nan_ranks": 0, "loss_rank_avg": 0.3477362394332886, "step": 2425, "valid_targets_mean": 2357.6, "valid_targets_min": 919 }, { "epoch": 3.8510301109350236, "grad_norm": 0.7088029576862485, "learning_rate": 2.0007903377539187e-05, "loss": 0.3171, "loss_nan_ranks": 0, "loss_rank_avg": 0.28312909603118896, "step": 2430, "valid_targets_mean": 3164.1, "valid_targets_min": 1362 }, { "epoch": 3.8589540412044374, "grad_norm": 0.7274010885836312, "learning_rate": 1.992886975024876e-05, "loss": 0.337, "loss_nan_ranks": 0, "loss_rank_avg": 0.31846240162849426, "step": 2435, "valid_targets_mean": 3024.1, "valid_targets_min": 889 }, { "epoch": 3.8668779714738513, "grad_norm": 0.7833894784900323, "learning_rate": 1.984983723371584e-05, "loss": 0.3328, "loss_nan_ranks": 0, "loss_rank_avg": 0.3632742762565613, "step": 2440, "valid_targets_mean": 2629.2, "valid_targets_min": 558 }, { "epoch": 3.8748019017432647, "grad_norm": 0.6668796876085389, "learning_rate": 1.977080706209835e-05, "loss": 0.3311, "loss_nan_ranks": 0, "loss_rank_avg": 0.34540417790412903, "step": 2445, "valid_targets_mean": 3503.6, "valid_targets_min": 1173 }, { "epoch": 3.882725832012678, "grad_norm": 0.7198481169885637, "learning_rate": 1.9691780469517578e-05, "loss": 0.3263, "loss_nan_ranks": 0, "loss_rank_avg": 0.3147124648094177, "step": 2450, "valid_targets_mean": 3361.3, "valid_targets_min": 1502 }, { "epoch": 3.890649762282092, "grad_norm": 0.6225664648803466, "learning_rate": 1.961275869003894e-05, "loss": 0.3189, "loss_nan_ranks": 0, "loss_rank_avg": 0.299946129322052, "step": 2455, "valid_targets_mean": 4080.0, "valid_targets_min": 1743 }, { "epoch": 3.8985736925515058, "grad_norm": 0.586811491312213, "learning_rate": 1.9533742957652683e-05, "loss": 0.3253, "loss_nan_ranks": 0, "loss_rank_avg": 0.30612677335739136, "step": 2460, "valid_targets_mean": 3907.0, "valid_targets_min": 1502 }, { "epoch": 3.906497622820919, "grad_norm": 0.8015375291847339, "learning_rate": 1.945473450625463e-05, "loss": 0.3296, "loss_nan_ranks": 0, "loss_rank_avg": 0.3285152316093445, "step": 2465, "valid_targets_mean": 2799.4, "valid_targets_min": 1124 }, { "epoch": 3.9144215530903326, "grad_norm": 0.7768068569253016, "learning_rate": 1.9375734569626904e-05, "loss": 0.3243, "loss_nan_ranks": 0, "loss_rank_avg": 0.32465943694114685, "step": 2470, "valid_targets_mean": 2695.1, "valid_targets_min": 1188 }, { "epoch": 3.9223454833597464, "grad_norm": 0.6903149189834576, "learning_rate": 1.9296744381418653e-05, "loss": 0.3309, "loss_nan_ranks": 0, "loss_rank_avg": 0.3335050344467163, "step": 2475, "valid_targets_mean": 3702.8, "valid_targets_min": 1403 }, { "epoch": 3.9302694136291603, "grad_norm": 0.674427230152727, "learning_rate": 1.9217765175126808e-05, "loss": 0.3336, "loss_nan_ranks": 0, "loss_rank_avg": 0.34546995162963867, "step": 2480, "valid_targets_mean": 3681.2, "valid_targets_min": 1344 }, { "epoch": 3.9381933438985737, "grad_norm": 0.7615168910152336, "learning_rate": 1.9138798184076805e-05, "loss": 0.3389, "loss_nan_ranks": 0, "loss_rank_avg": 0.3379887342453003, "step": 2485, "valid_targets_mean": 2786.8, "valid_targets_min": 665 }, { "epoch": 3.946117274167987, "grad_norm": 0.739627311408071, "learning_rate": 1.9059844641403323e-05, "loss": 0.3386, "loss_nan_ranks": 0, "loss_rank_avg": 0.337485134601593, "step": 2490, "valid_targets_mean": 2974.0, "valid_targets_min": 1066 }, { "epoch": 3.954041204437401, "grad_norm": 0.7540616165257731, "learning_rate": 1.898090578003104e-05, "loss": 0.3316, "loss_nan_ranks": 0, "loss_rank_avg": 0.3072323203086853, "step": 2495, "valid_targets_mean": 2595.8, "valid_targets_min": 1021 }, { "epoch": 3.9619651347068148, "grad_norm": 0.849781819038183, "learning_rate": 1.890198283265537e-05, "loss": 0.3479, "loss_nan_ranks": 0, "loss_rank_avg": 0.33093464374542236, "step": 2500, "valid_targets_mean": 2223.1, "valid_targets_min": 1112 }, { "epoch": 3.969889064976228, "grad_norm": 0.6623254756540252, "learning_rate": 1.8823077031723217e-05, "loss": 0.328, "loss_nan_ranks": 0, "loss_rank_avg": 0.32428649067878723, "step": 2505, "valid_targets_mean": 3929.8, "valid_targets_min": 1152 }, { "epoch": 3.9778129952456416, "grad_norm": 0.9088875770456144, "learning_rate": 1.8744189609413733e-05, "loss": 0.3363, "loss_nan_ranks": 0, "loss_rank_avg": 0.3459881544113159, "step": 2510, "valid_targets_mean": 2497.1, "valid_targets_min": 1041 }, { "epoch": 3.9857369255150554, "grad_norm": 0.7118244141970165, "learning_rate": 1.8665321797619068e-05, "loss": 0.3601, "loss_nan_ranks": 0, "loss_rank_avg": 0.3549520969390869, "step": 2515, "valid_targets_mean": 3036.4, "valid_targets_min": 1036 }, { "epoch": 3.9936608557844693, "grad_norm": 0.7872431081558173, "learning_rate": 1.8586474827925142e-05, "loss": 0.3399, "loss_nan_ranks": 0, "loss_rank_avg": 0.343522310256958, "step": 2520, "valid_targets_mean": 3111.9, "valid_targets_min": 934 }, { "epoch": 4.001584786053883, "grad_norm": 0.6333163189857594, "learning_rate": 1.8507649931592405e-05, "loss": 0.3189, "loss_nan_ranks": 0, "loss_rank_avg": 0.30445295572280884, "step": 2525, "valid_targets_mean": 3531.7, "valid_targets_min": 1013 }, { "epoch": 4.009508716323296, "grad_norm": 0.6185313213820511, "learning_rate": 1.8428848339536613e-05, "loss": 0.301, "loss_nan_ranks": 0, "loss_rank_avg": 0.28447040915489197, "step": 2530, "valid_targets_mean": 3920.8, "valid_targets_min": 965 }, { "epoch": 4.01743264659271, "grad_norm": 1.632827555786203, "learning_rate": 1.8350071282309606e-05, "loss": 0.306, "loss_nan_ranks": 0, "loss_rank_avg": 0.2971077561378479, "step": 2535, "valid_targets_mean": 3930.5, "valid_targets_min": 1379 }, { "epoch": 4.025356576862124, "grad_norm": 0.7394593200985027, "learning_rate": 1.8271319990080093e-05, "loss": 0.318, "loss_nan_ranks": 0, "loss_rank_avg": 0.2914736270904541, "step": 2540, "valid_targets_mean": 3326.8, "valid_targets_min": 1293 }, { "epoch": 4.033280507131537, "grad_norm": 0.6319798264181055, "learning_rate": 1.8192595692614445e-05, "loss": 0.3013, "loss_nan_ranks": 0, "loss_rank_avg": 0.2948256731033325, "step": 2545, "valid_targets_mean": 4935.4, "valid_targets_min": 1569 }, { "epoch": 4.041204437400951, "grad_norm": 0.6195429750205664, "learning_rate": 1.8113899619257487e-05, "loss": 0.2955, "loss_nan_ranks": 0, "loss_rank_avg": 0.259757399559021, "step": 2550, "valid_targets_mean": 3946.8, "valid_targets_min": 1514 }, { "epoch": 4.049128367670365, "grad_norm": 0.8136555394477911, "learning_rate": 1.8035232998913294e-05, "loss": 0.316, "loss_nan_ranks": 0, "loss_rank_avg": 0.3359217345714569, "step": 2555, "valid_targets_mean": 2811.3, "valid_targets_min": 1053 }, { "epoch": 4.057052297939778, "grad_norm": 0.658978371503885, "learning_rate": 1.795659706002602e-05, "loss": 0.2825, "loss_nan_ranks": 0, "loss_rank_avg": 0.27853959798812866, "step": 2560, "valid_targets_mean": 3751.6, "valid_targets_min": 1163 }, { "epoch": 4.064976228209192, "grad_norm": 0.7024991019538495, "learning_rate": 1.7877993030560693e-05, "loss": 0.3171, "loss_nan_ranks": 0, "loss_rank_avg": 0.3008027970790863, "step": 2565, "valid_targets_mean": 3564.5, "valid_targets_min": 732 }, { "epoch": 4.072900158478605, "grad_norm": 0.9509196576152328, "learning_rate": 1.7799422137984047e-05, "loss": 0.3017, "loss_nan_ranks": 0, "loss_rank_avg": 0.3372243642807007, "step": 2570, "valid_targets_mean": 2080.0, "valid_targets_min": 1092 }, { "epoch": 4.080824088748019, "grad_norm": 0.8259571384452493, "learning_rate": 1.772088560924536e-05, "loss": 0.3075, "loss_nan_ranks": 0, "loss_rank_avg": 0.28471559286117554, "step": 2575, "valid_targets_mean": 2408.6, "valid_targets_min": 1083 }, { "epoch": 4.088748019017433, "grad_norm": 0.8306440223043661, "learning_rate": 1.76423846707573e-05, "loss": 0.2984, "loss_nan_ranks": 0, "loss_rank_avg": 0.30105167627334595, "step": 2580, "valid_targets_mean": 2728.8, "valid_targets_min": 1359 }, { "epoch": 4.096671949286846, "grad_norm": 0.7821004468315431, "learning_rate": 1.756392054837675e-05, "loss": 0.3321, "loss_nan_ranks": 0, "loss_rank_avg": 0.35259807109832764, "step": 2585, "valid_targets_mean": 3060.4, "valid_targets_min": 1256 }, { "epoch": 4.10459587955626, "grad_norm": 0.837278260105263, "learning_rate": 1.7485494467385686e-05, "loss": 0.296, "loss_nan_ranks": 0, "loss_rank_avg": 0.2958485782146454, "step": 2590, "valid_targets_mean": 2570.9, "valid_targets_min": 1177 }, { "epoch": 4.112519809825674, "grad_norm": 0.7450702161875221, "learning_rate": 1.7407107652472034e-05, "loss": 0.2949, "loss_nan_ranks": 0, "loss_rank_avg": 0.2652340531349182, "step": 2595, "valid_targets_mean": 2721.6, "valid_targets_min": 988 }, { "epoch": 4.120443740095087, "grad_norm": 0.8272401230749654, "learning_rate": 1.7328761327710545e-05, "loss": 0.3044, "loss_nan_ranks": 0, "loss_rank_avg": 0.2961358428001404, "step": 2600, "valid_targets_mean": 2593.1, "valid_targets_min": 1360 }, { "epoch": 4.128367670364501, "grad_norm": 1.2748656480073979, "learning_rate": 1.7250456716543693e-05, "loss": 0.3267, "loss_nan_ranks": 0, "loss_rank_avg": 0.31461167335510254, "step": 2605, "valid_targets_mean": 4279.6, "valid_targets_min": 1170 }, { "epoch": 4.136291600633914, "grad_norm": 0.8167474006377758, "learning_rate": 1.717219504176255e-05, "loss": 0.3178, "loss_nan_ranks": 0, "loss_rank_avg": 0.3002293109893799, "step": 2610, "valid_targets_mean": 2615.6, "valid_targets_min": 694 }, { "epoch": 4.144215530903328, "grad_norm": 0.7453906065684714, "learning_rate": 1.7093977525487704e-05, "loss": 0.3187, "loss_nan_ranks": 0, "loss_rank_avg": 0.31392133235931396, "step": 2615, "valid_targets_mean": 3305.8, "valid_targets_min": 824 }, { "epoch": 4.152139461172742, "grad_norm": 0.70102708908017, "learning_rate": 1.701580538915017e-05, "loss": 0.3076, "loss_nan_ranks": 0, "loss_rank_avg": 0.3022012412548065, "step": 2620, "valid_targets_mean": 3455.0, "valid_targets_min": 1731 }, { "epoch": 4.160063391442155, "grad_norm": 0.7192692867446561, "learning_rate": 1.693767985347232e-05, "loss": 0.3016, "loss_nan_ranks": 0, "loss_rank_avg": 0.26913607120513916, "step": 2625, "valid_targets_mean": 3015.6, "valid_targets_min": 968 }, { "epoch": 4.167987321711569, "grad_norm": 0.7640141605128163, "learning_rate": 1.6859602138448822e-05, "loss": 0.3103, "loss_nan_ranks": 0, "loss_rank_avg": 0.3088947534561157, "step": 2630, "valid_targets_mean": 3482.1, "valid_targets_min": 814 }, { "epoch": 4.175911251980983, "grad_norm": 0.8117508775782821, "learning_rate": 1.6781573463327573e-05, "loss": 0.297, "loss_nan_ranks": 0, "loss_rank_avg": 0.31718161702156067, "step": 2635, "valid_targets_mean": 2880.6, "valid_targets_min": 1500 }, { "epoch": 4.183835182250396, "grad_norm": 0.7420422079275537, "learning_rate": 1.6703595046590685e-05, "loss": 0.3006, "loss_nan_ranks": 0, "loss_rank_avg": 0.3003275394439697, "step": 2640, "valid_targets_mean": 3582.3, "valid_targets_min": 1096 }, { "epoch": 4.19175911251981, "grad_norm": 0.7642707778816153, "learning_rate": 1.662566810593544e-05, "loss": 0.3119, "loss_nan_ranks": 0, "loss_rank_avg": 0.2956918478012085, "step": 2645, "valid_targets_mean": 3331.7, "valid_targets_min": 1139 }, { "epoch": 4.199683042789223, "grad_norm": 0.9108013010532445, "learning_rate": 1.6547793858255275e-05, "loss": 0.2901, "loss_nan_ranks": 0, "loss_rank_avg": 0.3331553041934967, "step": 2650, "valid_targets_mean": 2406.9, "valid_targets_min": 737 }, { "epoch": 4.207606973058637, "grad_norm": 0.6958301147034044, "learning_rate": 1.646997351962078e-05, "loss": 0.3056, "loss_nan_ranks": 0, "loss_rank_avg": 0.2943539023399353, "step": 2655, "valid_targets_mean": 3598.9, "valid_targets_min": 1080 }, { "epoch": 4.215530903328051, "grad_norm": 0.8106867092367795, "learning_rate": 1.639220830526072e-05, "loss": 0.3064, "loss_nan_ranks": 0, "loss_rank_avg": 0.31939899921417236, "step": 2660, "valid_targets_mean": 2794.2, "valid_targets_min": 826 }, { "epoch": 4.223454833597464, "grad_norm": 0.7722347258533244, "learning_rate": 1.631449942954304e-05, "loss": 0.2877, "loss_nan_ranks": 0, "loss_rank_avg": 0.2992505133152008, "step": 2665, "valid_targets_mean": 3432.8, "valid_targets_min": 791 }, { "epoch": 4.231378763866878, "grad_norm": 0.6605244498088375, "learning_rate": 1.623684810595592e-05, "loss": 0.2897, "loss_nan_ranks": 0, "loss_rank_avg": 0.26709267497062683, "step": 2670, "valid_targets_mean": 3478.2, "valid_targets_min": 1440 }, { "epoch": 4.239302694136292, "grad_norm": 0.7294542403387982, "learning_rate": 1.6159255547088806e-05, "loss": 0.2988, "loss_nan_ranks": 0, "loss_rank_avg": 0.3037455081939697, "step": 2675, "valid_targets_mean": 3395.0, "valid_targets_min": 908 }, { "epoch": 4.247226624405705, "grad_norm": 0.7747203263130421, "learning_rate": 1.608172296461349e-05, "loss": 0.3128, "loss_nan_ranks": 0, "loss_rank_avg": 0.3067532777786255, "step": 2680, "valid_targets_mean": 3267.0, "valid_targets_min": 1247 }, { "epoch": 4.255150554675119, "grad_norm": 0.7171739409331684, "learning_rate": 1.6004251569265187e-05, "loss": 0.3077, "loss_nan_ranks": 0, "loss_rank_avg": 0.30375757813453674, "step": 2685, "valid_targets_mean": 3726.8, "valid_targets_min": 1447 }, { "epoch": 4.263074484944532, "grad_norm": 0.6834444351988356, "learning_rate": 1.5926842570823624e-05, "loss": 0.2935, "loss_nan_ranks": 0, "loss_rank_avg": 0.29319584369659424, "step": 2690, "valid_targets_mean": 3729.8, "valid_targets_min": 965 }, { "epoch": 4.270998415213946, "grad_norm": 0.8517435436774768, "learning_rate": 1.5849497178094132e-05, "loss": 0.3179, "loss_nan_ranks": 0, "loss_rank_avg": 0.3134300410747528, "step": 2695, "valid_targets_mean": 2532.6, "valid_targets_min": 987 }, { "epoch": 4.27892234548336, "grad_norm": 0.7775253010328972, "learning_rate": 1.5772216598888802e-05, "loss": 0.3086, "loss_nan_ranks": 0, "loss_rank_avg": 0.30423301458358765, "step": 2700, "valid_targets_mean": 2795.2, "valid_targets_min": 742 }, { "epoch": 4.286846275752773, "grad_norm": 0.7218371372885936, "learning_rate": 1.5695002040007613e-05, "loss": 0.3147, "loss_nan_ranks": 0, "loss_rank_avg": 0.3007104992866516, "step": 2705, "valid_targets_mean": 3370.9, "valid_targets_min": 944 }, { "epoch": 4.294770206022187, "grad_norm": 0.743546396207078, "learning_rate": 1.5617854707219574e-05, "loss": 0.2983, "loss_nan_ranks": 0, "loss_rank_avg": 0.31770211458206177, "step": 2710, "valid_targets_mean": 3224.2, "valid_targets_min": 1224 }, { "epoch": 4.302694136291601, "grad_norm": 0.7458055587700105, "learning_rate": 1.5540775805243896e-05, "loss": 0.3072, "loss_nan_ranks": 0, "loss_rank_avg": 0.2979353368282318, "step": 2715, "valid_targets_mean": 2920.5, "valid_targets_min": 1073 }, { "epoch": 4.310618066561014, "grad_norm": 0.7824000519774981, "learning_rate": 1.5463766537731202e-05, "loss": 0.3073, "loss_nan_ranks": 0, "loss_rank_avg": 0.33337557315826416, "step": 2720, "valid_targets_mean": 3077.6, "valid_targets_min": 1114 }, { "epoch": 4.318541996830428, "grad_norm": 0.7518246296874621, "learning_rate": 1.5386828107244705e-05, "loss": 0.3089, "loss_nan_ranks": 0, "loss_rank_avg": 0.2896403670310974, "step": 2725, "valid_targets_mean": 3393.7, "valid_targets_min": 1552 }, { "epoch": 4.326465927099841, "grad_norm": 0.648023364162129, "learning_rate": 1.530996171524145e-05, "loss": 0.2982, "loss_nan_ranks": 0, "loss_rank_avg": 0.30871593952178955, "step": 2730, "valid_targets_mean": 4109.9, "valid_targets_min": 1139 }, { "epoch": 4.334389857369255, "grad_norm": 0.769692357957425, "learning_rate": 1.5233168562053517e-05, "loss": 0.2959, "loss_nan_ranks": 0, "loss_rank_avg": 0.2859308123588562, "step": 2735, "valid_targets_mean": 2917.9, "valid_targets_min": 1157 }, { "epoch": 4.342313787638669, "grad_norm": 0.7237354504090463, "learning_rate": 1.515644984686933e-05, "loss": 0.3012, "loss_nan_ranks": 0, "loss_rank_avg": 0.3038594424724579, "step": 2740, "valid_targets_mean": 3344.9, "valid_targets_min": 820 }, { "epoch": 4.350237717908082, "grad_norm": 0.7945130184832356, "learning_rate": 1.507980676771489e-05, "loss": 0.2995, "loss_nan_ranks": 0, "loss_rank_avg": 0.2981492877006531, "step": 2745, "valid_targets_mean": 2807.6, "valid_targets_min": 906 }, { "epoch": 4.358161648177496, "grad_norm": 0.7902636448758641, "learning_rate": 1.5003240521435076e-05, "loss": 0.3068, "loss_nan_ranks": 0, "loss_rank_avg": 0.31415724754333496, "step": 2750, "valid_targets_mean": 2672.6, "valid_targets_min": 746 }, { "epoch": 4.36608557844691, "grad_norm": 0.8020499365789604, "learning_rate": 1.4926752303674967e-05, "loss": 0.3323, "loss_nan_ranks": 0, "loss_rank_avg": 0.36749058961868286, "step": 2755, "valid_targets_mean": 2934.5, "valid_targets_min": 1510 }, { "epoch": 4.374009508716323, "grad_norm": 0.6976026655059031, "learning_rate": 1.4850343308861152e-05, "loss": 0.3097, "loss_nan_ranks": 0, "loss_rank_avg": 0.2690892815589905, "step": 2760, "valid_targets_mean": 3675.6, "valid_targets_min": 1576 }, { "epoch": 4.381933438985737, "grad_norm": 0.8273604681356571, "learning_rate": 1.47740147301831e-05, "loss": 0.3174, "loss_nan_ranks": 0, "loss_rank_avg": 0.30167335271835327, "step": 2765, "valid_targets_mean": 2629.6, "valid_targets_min": 989 }, { "epoch": 4.38985736925515, "grad_norm": 0.6544057381783281, "learning_rate": 1.4697767759574508e-05, "loss": 0.289, "loss_nan_ranks": 0, "loss_rank_avg": 0.2769451141357422, "step": 2770, "valid_targets_mean": 4037.2, "valid_targets_min": 1005 }, { "epoch": 4.397781299524564, "grad_norm": 0.8243154638778755, "learning_rate": 1.4621603587694688e-05, "loss": 0.3059, "loss_nan_ranks": 0, "loss_rank_avg": 0.313541978597641, "step": 2775, "valid_targets_mean": 2701.2, "valid_targets_min": 1603 }, { "epoch": 4.405705229793978, "grad_norm": 0.915560332977614, "learning_rate": 1.454552340391e-05, "loss": 0.2988, "loss_nan_ranks": 0, "loss_rank_avg": 0.3276725709438324, "step": 2780, "valid_targets_mean": 3331.5, "valid_targets_min": 1087 }, { "epoch": 4.413629160063391, "grad_norm": 0.6485103596763808, "learning_rate": 1.446952839627525e-05, "loss": 0.3172, "loss_nan_ranks": 0, "loss_rank_avg": 0.3232860565185547, "step": 2785, "valid_targets_mean": 4013.6, "valid_targets_min": 1047 }, { "epoch": 4.4215530903328055, "grad_norm": 1.172378270754862, "learning_rate": 1.4393619751515147e-05, "loss": 0.3113, "loss_nan_ranks": 0, "loss_rank_avg": 0.308063268661499, "step": 2790, "valid_targets_mean": 2999.6, "valid_targets_min": 1269 }, { "epoch": 4.429477020602219, "grad_norm": 0.768155820928126, "learning_rate": 1.4317798655005777e-05, "loss": 0.3035, "loss_nan_ranks": 0, "loss_rank_avg": 0.28411513566970825, "step": 2795, "valid_targets_mean": 3562.4, "valid_targets_min": 323 }, { "epoch": 4.437400950871632, "grad_norm": 0.7875527455561598, "learning_rate": 1.4242066290756084e-05, "loss": 0.3336, "loss_nan_ranks": 0, "loss_rank_avg": 0.3191964328289032, "step": 2800, "valid_targets_mean": 3007.8, "valid_targets_min": 1102 }, { "epoch": 4.445324881141046, "grad_norm": 0.7458242607802088, "learning_rate": 1.4166423841389387e-05, "loss": 0.3054, "loss_nan_ranks": 0, "loss_rank_avg": 0.2911447286605835, "step": 2805, "valid_targets_mean": 2887.9, "valid_targets_min": 1028 }, { "epoch": 4.453248811410459, "grad_norm": 0.822647246509666, "learning_rate": 1.4090872488124916e-05, "loss": 0.3136, "loss_nan_ranks": 0, "loss_rank_avg": 0.307691752910614, "step": 2810, "valid_targets_mean": 2768.2, "valid_targets_min": 536 }, { "epoch": 4.461172741679873, "grad_norm": 0.7771496896525412, "learning_rate": 1.4015413410759343e-05, "loss": 0.3249, "loss_nan_ranks": 0, "loss_rank_avg": 0.3093550205230713, "step": 2815, "valid_targets_mean": 2895.3, "valid_targets_min": 1313 }, { "epoch": 4.469096671949287, "grad_norm": 0.7655768531728774, "learning_rate": 1.3940047787648388e-05, "loss": 0.294, "loss_nan_ranks": 0, "loss_rank_avg": 0.3004239797592163, "step": 2820, "valid_targets_mean": 2810.7, "valid_targets_min": 913 }, { "epoch": 4.4770206022187, "grad_norm": 0.936481404258253, "learning_rate": 1.3864776795688408e-05, "loss": 0.3309, "loss_nan_ranks": 0, "loss_rank_avg": 0.3504589796066284, "step": 2825, "valid_targets_mean": 3516.6, "valid_targets_min": 1193 }, { "epoch": 4.4849445324881145, "grad_norm": 0.816980590525859, "learning_rate": 1.3789601610298013e-05, "loss": 0.3051, "loss_nan_ranks": 0, "loss_rank_avg": 0.287618488073349, "step": 2830, "valid_targets_mean": 2968.8, "valid_targets_min": 1097 }, { "epoch": 4.492868462757528, "grad_norm": 0.778268098745374, "learning_rate": 1.3714523405399711e-05, "loss": 0.3021, "loss_nan_ranks": 0, "loss_rank_avg": 0.3074689507484436, "step": 2835, "valid_targets_mean": 2911.4, "valid_targets_min": 1061 }, { "epoch": 4.500792393026941, "grad_norm": 0.6573666416474037, "learning_rate": 1.3639543353401588e-05, "loss": 0.3278, "loss_nan_ranks": 0, "loss_rank_avg": 0.2881685495376587, "step": 2840, "valid_targets_mean": 3663.2, "valid_targets_min": 1408 }, { "epoch": 4.508716323296355, "grad_norm": 0.6941710441249608, "learning_rate": 1.3564662625178979e-05, "loss": 0.3059, "loss_nan_ranks": 0, "loss_rank_avg": 0.33653414249420166, "step": 2845, "valid_targets_mean": 3397.4, "valid_targets_min": 681 }, { "epoch": 4.516640253565768, "grad_norm": 0.7863043325335887, "learning_rate": 1.3489882390056214e-05, "loss": 0.3075, "loss_nan_ranks": 0, "loss_rank_avg": 0.29496651887893677, "step": 2850, "valid_targets_mean": 2781.9, "valid_targets_min": 1277 }, { "epoch": 4.524564183835182, "grad_norm": 0.8634068488077267, "learning_rate": 1.3415203815788317e-05, "loss": 0.3022, "loss_nan_ranks": 0, "loss_rank_avg": 0.2938062250614166, "step": 2855, "valid_targets_mean": 3095.8, "valid_targets_min": 954 }, { "epoch": 4.532488114104596, "grad_norm": 0.7939512722364277, "learning_rate": 1.3340628068542816e-05, "loss": 0.3162, "loss_nan_ranks": 0, "loss_rank_avg": 0.2892675995826721, "step": 2860, "valid_targets_mean": 2929.0, "valid_targets_min": 698 }, { "epoch": 4.540412044374009, "grad_norm": 0.8239988059278375, "learning_rate": 1.3266156312881497e-05, "loss": 0.3041, "loss_nan_ranks": 0, "loss_rank_avg": 0.29567891359329224, "step": 2865, "valid_targets_mean": 2818.6, "valid_targets_min": 1250 }, { "epoch": 4.5483359746434235, "grad_norm": 0.8011210887144335, "learning_rate": 1.3191789711742237e-05, "loss": 0.3105, "loss_nan_ranks": 0, "loss_rank_avg": 0.2970122694969177, "step": 2870, "valid_targets_mean": 2888.4, "valid_targets_min": 1206 }, { "epoch": 4.556259904912837, "grad_norm": 0.6220168440568122, "learning_rate": 1.3117529426420838e-05, "loss": 0.2968, "loss_nan_ranks": 0, "loss_rank_avg": 0.3001657724380493, "step": 2875, "valid_targets_mean": 4320.4, "valid_targets_min": 1126 }, { "epoch": 4.56418383518225, "grad_norm": 0.7549078864914368, "learning_rate": 1.3043376616552889e-05, "loss": 0.3152, "loss_nan_ranks": 0, "loss_rank_avg": 0.27980339527130127, "step": 2880, "valid_targets_mean": 3092.2, "valid_targets_min": 942 }, { "epoch": 4.572107765451664, "grad_norm": 0.7620019128280029, "learning_rate": 1.296933244009567e-05, "loss": 0.2968, "loss_nan_ranks": 0, "loss_rank_avg": 0.31075483560562134, "step": 2885, "valid_targets_mean": 3096.1, "valid_targets_min": 1150 }, { "epoch": 4.580031695721077, "grad_norm": 0.7628895287961468, "learning_rate": 1.2895398053310053e-05, "loss": 0.2862, "loss_nan_ranks": 0, "loss_rank_avg": 0.2894461154937744, "step": 2890, "valid_targets_mean": 3295.6, "valid_targets_min": 636 }, { "epoch": 4.5879556259904914, "grad_norm": 0.9803486983305757, "learning_rate": 1.2821574610742453e-05, "loss": 0.2937, "loss_nan_ranks": 0, "loss_rank_avg": 0.31783849000930786, "step": 2895, "valid_targets_mean": 2410.8, "valid_targets_min": 845 }, { "epoch": 4.595879556259905, "grad_norm": 0.672927388574443, "learning_rate": 1.2747863265206801e-05, "loss": 0.3126, "loss_nan_ranks": 0, "loss_rank_avg": 0.308796763420105, "step": 2900, "valid_targets_mean": 3501.9, "valid_targets_min": 868 }, { "epoch": 4.603803486529318, "grad_norm": 0.7279777785970651, "learning_rate": 1.2674265167766545e-05, "loss": 0.3101, "loss_nan_ranks": 0, "loss_rank_avg": 0.28767889738082886, "step": 2905, "valid_targets_mean": 3142.7, "valid_targets_min": 797 }, { "epoch": 4.6117274167987325, "grad_norm": 0.810766208206082, "learning_rate": 1.2600781467716665e-05, "loss": 0.3193, "loss_nan_ranks": 0, "loss_rank_avg": 0.3437730073928833, "step": 2910, "valid_targets_mean": 2790.1, "valid_targets_min": 1091 }, { "epoch": 4.619651347068146, "grad_norm": 0.806232766113042, "learning_rate": 1.2527413312565737e-05, "loss": 0.3169, "loss_nan_ranks": 0, "loss_rank_avg": 0.30441755056381226, "step": 2915, "valid_targets_mean": 2803.9, "valid_targets_min": 1041 }, { "epoch": 4.627575277337559, "grad_norm": 0.771054199386212, "learning_rate": 1.2454161848018003e-05, "loss": 0.2974, "loss_nan_ranks": 0, "loss_rank_avg": 0.31878095865249634, "step": 2920, "valid_targets_mean": 3022.9, "valid_targets_min": 1210 }, { "epoch": 4.635499207606973, "grad_norm": 0.7455086622171665, "learning_rate": 1.2381028217955486e-05, "loss": 0.3239, "loss_nan_ranks": 0, "loss_rank_avg": 0.29189303517341614, "step": 2925, "valid_targets_mean": 3102.1, "valid_targets_min": 832 }, { "epoch": 4.643423137876387, "grad_norm": 0.6813592554934786, "learning_rate": 1.2308013564420132e-05, "loss": 0.299, "loss_nan_ranks": 0, "loss_rank_avg": 0.2672593295574188, "step": 2930, "valid_targets_mean": 3894.0, "valid_targets_min": 1700 }, { "epoch": 4.6513470681458005, "grad_norm": 0.7204804043327222, "learning_rate": 1.2235119027595957e-05, "loss": 0.3069, "loss_nan_ranks": 0, "loss_rank_avg": 0.32479286193847656, "step": 2935, "valid_targets_mean": 3971.2, "valid_targets_min": 1352 }, { "epoch": 4.659270998415214, "grad_norm": 0.7638356280818674, "learning_rate": 1.2162345745791268e-05, "loss": 0.3033, "loss_nan_ranks": 0, "loss_rank_avg": 0.31609421968460083, "step": 2940, "valid_targets_mean": 3019.4, "valid_targets_min": 977 }, { "epoch": 4.667194928684627, "grad_norm": 0.7039388185448092, "learning_rate": 1.2089694855420873e-05, "loss": 0.2991, "loss_nan_ranks": 0, "loss_rank_avg": 0.287856787443161, "step": 2945, "valid_targets_mean": 3415.1, "valid_targets_min": 1312 }, { "epoch": 4.675118858954042, "grad_norm": 0.7151331805533307, "learning_rate": 1.201716749098833e-05, "loss": 0.2926, "loss_nan_ranks": 0, "loss_rank_avg": 0.2898104190826416, "step": 2950, "valid_targets_mean": 3416.0, "valid_targets_min": 1124 }, { "epoch": 4.683042789223455, "grad_norm": 1.9704639419589094, "learning_rate": 1.1944764785068248e-05, "loss": 0.3303, "loss_nan_ranks": 0, "loss_rank_avg": 0.3315780758857727, "step": 2955, "valid_targets_mean": 2883.4, "valid_targets_min": 1348 }, { "epoch": 4.690966719492868, "grad_norm": 0.8156790243383886, "learning_rate": 1.187248786828858e-05, "loss": 0.2963, "loss_nan_ranks": 0, "loss_rank_avg": 0.3219088912010193, "step": 2960, "valid_targets_mean": 2594.6, "valid_targets_min": 1422 }, { "epoch": 4.698890649762282, "grad_norm": 0.8039682183624894, "learning_rate": 1.1800337869312988e-05, "loss": 0.305, "loss_nan_ranks": 0, "loss_rank_avg": 0.29908105731010437, "step": 2965, "valid_targets_mean": 2810.3, "valid_targets_min": 1371 }, { "epoch": 4.706814580031696, "grad_norm": 0.8068691479781692, "learning_rate": 1.17283159148232e-05, "loss": 0.3156, "loss_nan_ranks": 0, "loss_rank_avg": 0.33075129985809326, "step": 2970, "valid_targets_mean": 2863.6, "valid_targets_min": 1015 }, { "epoch": 4.7147385103011095, "grad_norm": 0.689486051910562, "learning_rate": 1.165642312950142e-05, "loss": 0.2903, "loss_nan_ranks": 0, "loss_rank_avg": 0.2692754864692688, "step": 2975, "valid_targets_mean": 3604.5, "valid_targets_min": 1605 }, { "epoch": 4.722662440570523, "grad_norm": 0.8268105603028824, "learning_rate": 1.1584660636012788e-05, "loss": 0.3051, "loss_nan_ranks": 0, "loss_rank_avg": 0.33773764967918396, "step": 2980, "valid_targets_mean": 3095.1, "valid_targets_min": 947 }, { "epoch": 4.730586370839936, "grad_norm": 0.6575919589133923, "learning_rate": 1.1513029554987804e-05, "loss": 0.2888, "loss_nan_ranks": 0, "loss_rank_avg": 0.2386166751384735, "step": 2985, "valid_targets_mean": 4465.2, "valid_targets_min": 1680 }, { "epoch": 4.738510301109351, "grad_norm": 0.6371132125962272, "learning_rate": 1.144153100500488e-05, "loss": 0.3123, "loss_nan_ranks": 0, "loss_rank_avg": 0.2862992286682129, "step": 2990, "valid_targets_mean": 3861.9, "valid_targets_min": 1972 }, { "epoch": 4.746434231378764, "grad_norm": 0.7441439350640655, "learning_rate": 1.1370166102572826e-05, "loss": 0.3057, "loss_nan_ranks": 0, "loss_rank_avg": 0.36143922805786133, "step": 2995, "valid_targets_mean": 3635.9, "valid_targets_min": 1142 }, { "epoch": 4.754358161648177, "grad_norm": 0.6737445792645919, "learning_rate": 1.1298935962113436e-05, "loss": 0.2829, "loss_nan_ranks": 0, "loss_rank_avg": 0.2750626802444458, "step": 3000, "valid_targets_mean": 3542.1, "valid_targets_min": 1289 }, { "epoch": 4.762282091917591, "grad_norm": 0.7212930569332857, "learning_rate": 1.1227841695944104e-05, "loss": 0.2957, "loss_nan_ranks": 0, "loss_rank_avg": 0.3105536699295044, "step": 3005, "valid_targets_mean": 3204.9, "valid_targets_min": 1114 }, { "epoch": 4.770206022187005, "grad_norm": 0.6111875624664306, "learning_rate": 1.1156884414260412e-05, "loss": 0.3123, "loss_nan_ranks": 0, "loss_rank_avg": 0.29388630390167236, "step": 3010, "valid_targets_mean": 3729.1, "valid_targets_min": 1208 }, { "epoch": 4.7781299524564185, "grad_norm": 0.764650461989785, "learning_rate": 1.1086065225118836e-05, "loss": 0.299, "loss_nan_ranks": 0, "loss_rank_avg": 0.2933449447154999, "step": 3015, "valid_targets_mean": 3383.9, "valid_targets_min": 984 }, { "epoch": 4.786053882725832, "grad_norm": 0.7224666416313265, "learning_rate": 1.1015385234419402e-05, "loss": 0.3033, "loss_nan_ranks": 0, "loss_rank_avg": 0.29492539167404175, "step": 3020, "valid_targets_mean": 3344.1, "valid_targets_min": 906 }, { "epoch": 4.793977812995245, "grad_norm": 0.7948708382462361, "learning_rate": 1.0944845545888462e-05, "loss": 0.3019, "loss_nan_ranks": 0, "loss_rank_avg": 0.2928083539009094, "step": 3025, "valid_targets_mean": 2741.6, "valid_targets_min": 1171 }, { "epoch": 4.80190174326466, "grad_norm": 0.7388242674514477, "learning_rate": 1.0874447261061406e-05, "loss": 0.3058, "loss_nan_ranks": 0, "loss_rank_avg": 0.3079679608345032, "step": 3030, "valid_targets_mean": 3113.4, "valid_targets_min": 1405 }, { "epoch": 4.809825673534073, "grad_norm": 0.702881645128125, "learning_rate": 1.0804191479265525e-05, "loss": 0.3127, "loss_nan_ranks": 0, "loss_rank_avg": 0.2963460087776184, "step": 3035, "valid_targets_mean": 3467.6, "valid_targets_min": 1365 }, { "epoch": 4.817749603803486, "grad_norm": 0.893930060872408, "learning_rate": 1.0734079297602772e-05, "loss": 0.3342, "loss_nan_ranks": 0, "loss_rank_avg": 0.3658490777015686, "step": 3040, "valid_targets_mean": 2750.2, "valid_targets_min": 1131 }, { "epoch": 4.8256735340729, "grad_norm": 0.6855561554316635, "learning_rate": 1.0664111810932671e-05, "loss": 0.2946, "loss_nan_ranks": 0, "loss_rank_avg": 0.28777241706848145, "step": 3045, "valid_targets_mean": 3720.5, "valid_targets_min": 605 }, { "epoch": 4.833597464342314, "grad_norm": 0.7116370163557326, "learning_rate": 1.0594290111855245e-05, "loss": 0.305, "loss_nan_ranks": 0, "loss_rank_avg": 0.32314878702163696, "step": 3050, "valid_targets_mean": 3834.8, "valid_targets_min": 1553 }, { "epoch": 4.8415213946117275, "grad_norm": 0.8748328547962919, "learning_rate": 1.0524615290693881e-05, "loss": 0.3086, "loss_nan_ranks": 0, "loss_rank_avg": 0.3117261826992035, "step": 3055, "valid_targets_mean": 2272.6, "valid_targets_min": 795 }, { "epoch": 4.849445324881141, "grad_norm": 0.7163896836836389, "learning_rate": 1.0455088435478384e-05, "loss": 0.29, "loss_nan_ranks": 0, "loss_rank_avg": 0.3054528832435608, "step": 3060, "valid_targets_mean": 3340.7, "valid_targets_min": 685 }, { "epoch": 4.857369255150554, "grad_norm": 0.7990504060097595, "learning_rate": 1.0385710631927917e-05, "loss": 0.2906, "loss_nan_ranks": 0, "loss_rank_avg": 0.28801190853118896, "step": 3065, "valid_targets_mean": 2581.8, "valid_targets_min": 852 }, { "epoch": 4.865293185419969, "grad_norm": 0.7858386332238347, "learning_rate": 1.031648296343411e-05, "loss": 0.3175, "loss_nan_ranks": 0, "loss_rank_avg": 0.30044302344322205, "step": 3070, "valid_targets_mean": 3524.5, "valid_targets_min": 699 }, { "epoch": 4.873217115689382, "grad_norm": 0.7573279065310472, "learning_rate": 1.0247406511044079e-05, "loss": 0.2896, "loss_nan_ranks": 0, "loss_rank_avg": 0.34992167353630066, "step": 3075, "valid_targets_mean": 3097.5, "valid_targets_min": 1330 }, { "epoch": 4.881141045958795, "grad_norm": 0.7999207340654183, "learning_rate": 1.0178482353443588e-05, "loss": 0.3078, "loss_nan_ranks": 0, "loss_rank_avg": 0.32113009691238403, "step": 3080, "valid_targets_mean": 2807.9, "valid_targets_min": 1241 }, { "epoch": 4.889064976228209, "grad_norm": 0.849335113475438, "learning_rate": 1.010971156694021e-05, "loss": 0.3011, "loss_nan_ranks": 0, "loss_rank_avg": 0.3222789168357849, "step": 3085, "valid_targets_mean": 2970.4, "valid_targets_min": 1106 }, { "epoch": 4.896988906497623, "grad_norm": 0.6823190767279323, "learning_rate": 1.004109522544647e-05, "loss": 0.3023, "loss_nan_ranks": 0, "loss_rank_avg": 0.27712273597717285, "step": 3090, "valid_targets_mean": 3440.9, "valid_targets_min": 1461 }, { "epoch": 4.9049128367670365, "grad_norm": 0.7200895601882453, "learning_rate": 9.972634400463135e-06, "loss": 0.3108, "loss_nan_ranks": 0, "loss_rank_avg": 0.2947770953178406, "step": 3095, "valid_targets_mean": 3490.6, "valid_targets_min": 980 }, { "epoch": 4.91283676703645, "grad_norm": 0.6645038831235541, "learning_rate": 9.90433016106243e-06, "loss": 0.3156, "loss_nan_ranks": 0, "loss_rank_avg": 0.31558895111083984, "step": 3100, "valid_targets_mean": 3618.5, "valid_targets_min": 1104 }, { "epoch": 4.920760697305864, "grad_norm": 0.8119936304510853, "learning_rate": 9.836183573871394e-06, "loss": 0.2904, "loss_nan_ranks": 0, "loss_rank_avg": 0.2948872447013855, "step": 3105, "valid_targets_mean": 2676.7, "valid_targets_min": 1118 }, { "epoch": 4.928684627575278, "grad_norm": 0.8117809416258112, "learning_rate": 9.768195703055163e-06, "loss": 0.3035, "loss_nan_ranks": 0, "loss_rank_avg": 0.30462121963500977, "step": 3110, "valid_targets_mean": 2633.5, "valid_targets_min": 1138 }, { "epoch": 4.936608557844691, "grad_norm": 0.7939054585691092, "learning_rate": 9.700367610300423e-06, "loss": 0.307, "loss_nan_ranks": 0, "loss_rank_avg": 0.3095425069332123, "step": 3115, "valid_targets_mean": 2848.7, "valid_targets_min": 1131 }, { "epoch": 4.944532488114104, "grad_norm": 0.7205066824623103, "learning_rate": 9.632700354798766e-06, "loss": 0.3006, "loss_nan_ranks": 0, "loss_rank_avg": 0.2746793031692505, "step": 3120, "valid_targets_mean": 3183.8, "valid_targets_min": 1716 }, { "epoch": 4.952456418383518, "grad_norm": 0.8435432284739308, "learning_rate": 9.565194993230176e-06, "loss": 0.3132, "loss_nan_ranks": 0, "loss_rank_avg": 0.33743882179260254, "step": 3125, "valid_targets_mean": 2504.1, "valid_targets_min": 933 }, { "epoch": 4.960380348652932, "grad_norm": 0.7878822964478979, "learning_rate": 9.49785257974656e-06, "loss": 0.2822, "loss_nan_ranks": 0, "loss_rank_avg": 0.2942264676094055, "step": 3130, "valid_targets_mean": 2571.7, "valid_targets_min": 1017 }, { "epoch": 4.9683042789223455, "grad_norm": 0.8361868331960012, "learning_rate": 9.430674165955218e-06, "loss": 0.3046, "loss_nan_ranks": 0, "loss_rank_avg": 0.34500449895858765, "step": 3135, "valid_targets_mean": 3657.2, "valid_targets_min": 1331 }, { "epoch": 4.976228209191759, "grad_norm": 0.6974763936046318, "learning_rate": 9.363660800902498e-06, "loss": 0.3157, "loss_nan_ranks": 0, "loss_rank_avg": 0.305804580450058, "step": 3140, "valid_targets_mean": 3425.0, "valid_targets_min": 1135 }, { "epoch": 4.984152139461173, "grad_norm": 0.8185536692198196, "learning_rate": 9.296813531057336e-06, "loss": 0.2933, "loss_nan_ranks": 0, "loss_rank_avg": 0.28771495819091797, "step": 3145, "valid_targets_mean": 2709.5, "valid_targets_min": 1177 }, { "epoch": 4.992076069730587, "grad_norm": 0.78537077588257, "learning_rate": 9.230133400294994e-06, "loss": 0.3112, "loss_nan_ranks": 0, "loss_rank_avg": 0.3354733884334564, "step": 3150, "valid_targets_mean": 2970.9, "valid_targets_min": 1264 }, { "epoch": 5.0, "grad_norm": 0.7377919783129347, "learning_rate": 9.163621449880686e-06, "loss": 0.3065, "loss_nan_ranks": 0, "loss_rank_avg": 0.2943228781223297, "step": 3155, "valid_targets_mean": 3264.5, "valid_targets_min": 854 }, { "epoch": 5.007923930269413, "grad_norm": 0.6897294221365783, "learning_rate": 9.097278718453366e-06, "loss": 0.2917, "loss_nan_ranks": 0, "loss_rank_avg": 0.24547956883907318, "step": 3160, "valid_targets_mean": 3132.8, "valid_targets_min": 926 }, { "epoch": 5.015847860538828, "grad_norm": 0.7613434863732377, "learning_rate": 9.0311062420095e-06, "loss": 0.29, "loss_nan_ranks": 0, "loss_rank_avg": 0.28858259320259094, "step": 3165, "valid_targets_mean": 3152.6, "valid_targets_min": 1006 }, { "epoch": 5.023771790808241, "grad_norm": 0.6810586489493294, "learning_rate": 8.965105053886864e-06, "loss": 0.2956, "loss_nan_ranks": 0, "loss_rank_avg": 0.31911516189575195, "step": 3170, "valid_targets_mean": 4410.9, "valid_targets_min": 1588 }, { "epoch": 5.0316957210776545, "grad_norm": 0.9023064359994762, "learning_rate": 8.899276184748454e-06, "loss": 0.2826, "loss_nan_ranks": 0, "loss_rank_avg": 0.28767329454421997, "step": 3175, "valid_targets_mean": 2300.8, "valid_targets_min": 824 }, { "epoch": 5.039619651347068, "grad_norm": 0.8159003566834867, "learning_rate": 8.833620662566325e-06, "loss": 0.287, "loss_nan_ranks": 0, "loss_rank_avg": 0.3218589127063751, "step": 3180, "valid_targets_mean": 3145.6, "valid_targets_min": 1378 }, { "epoch": 5.047543581616482, "grad_norm": 0.805782943916796, "learning_rate": 8.768139512605615e-06, "loss": 0.2739, "loss_nan_ranks": 0, "loss_rank_avg": 0.26077768206596375, "step": 3185, "valid_targets_mean": 3293.0, "valid_targets_min": 434 }, { "epoch": 5.055467511885896, "grad_norm": 0.7270822754678393, "learning_rate": 8.702833757408465e-06, "loss": 0.2806, "loss_nan_ranks": 0, "loss_rank_avg": 0.29586848616600037, "step": 3190, "valid_targets_mean": 3872.6, "valid_targets_min": 1007 }, { "epoch": 5.063391442155309, "grad_norm": 0.8662314523284074, "learning_rate": 8.637704416778106e-06, "loss": 0.2789, "loss_nan_ranks": 0, "loss_rank_avg": 0.25883880257606506, "step": 3195, "valid_targets_mean": 2555.5, "valid_targets_min": 1255 }, { "epoch": 5.071315372424722, "grad_norm": 0.9893594514085089, "learning_rate": 8.572752507762893e-06, "loss": 0.2984, "loss_nan_ranks": 0, "loss_rank_avg": 0.3071678876876831, "step": 3200, "valid_targets_mean": 2334.6, "valid_targets_min": 1084 }, { "epoch": 5.079239302694137, "grad_norm": 0.7663852834514877, "learning_rate": 8.50797904464044e-06, "loss": 0.2747, "loss_nan_ranks": 0, "loss_rank_avg": 0.2686847448348999, "step": 3205, "valid_targets_mean": 3020.4, "valid_targets_min": 974 }, { "epoch": 5.08716323296355, "grad_norm": 0.8272623217334393, "learning_rate": 8.443385038901801e-06, "loss": 0.2951, "loss_nan_ranks": 0, "loss_rank_avg": 0.3090386390686035, "step": 3210, "valid_targets_mean": 2945.6, "valid_targets_min": 1179 }, { "epoch": 5.0950871632329635, "grad_norm": 0.8759245976491827, "learning_rate": 8.378971499235627e-06, "loss": 0.2899, "loss_nan_ranks": 0, "loss_rank_avg": 0.3076953887939453, "step": 3215, "valid_targets_mean": 2491.4, "valid_targets_min": 786 }, { "epoch": 5.103011093502377, "grad_norm": 0.8719723671628756, "learning_rate": 8.31473943151247e-06, "loss": 0.2977, "loss_nan_ranks": 0, "loss_rank_avg": 0.2724665105342865, "step": 3220, "valid_targets_mean": 2282.7, "valid_targets_min": 729 }, { "epoch": 5.110935023771791, "grad_norm": 0.7575608712200748, "learning_rate": 8.250689838769021e-06, "loss": 0.3003, "loss_nan_ranks": 0, "loss_rank_avg": 0.27652713656425476, "step": 3225, "valid_targets_mean": 3152.2, "valid_targets_min": 1374 }, { "epoch": 5.118858954041205, "grad_norm": 0.7631967106769532, "learning_rate": 8.186823721192505e-06, "loss": 0.2932, "loss_nan_ranks": 0, "loss_rank_avg": 0.2842700481414795, "step": 3230, "valid_targets_mean": 3138.7, "valid_targets_min": 1766 }, { "epoch": 5.126782884310618, "grad_norm": 0.8153756836832209, "learning_rate": 8.123142076105004e-06, "loss": 0.3097, "loss_nan_ranks": 0, "loss_rank_avg": 0.2878100275993347, "step": 3235, "valid_targets_mean": 2801.4, "valid_targets_min": 1411 }, { "epoch": 5.134706814580031, "grad_norm": 0.8957597318522768, "learning_rate": 8.05964589794791e-06, "loss": 0.2876, "loss_nan_ranks": 0, "loss_rank_avg": 0.3458958864212036, "step": 3240, "valid_targets_mean": 2559.4, "valid_targets_min": 820 }, { "epoch": 5.142630744849446, "grad_norm": 0.7318674323785702, "learning_rate": 7.996336178266422e-06, "loss": 0.2941, "loss_nan_ranks": 0, "loss_rank_avg": 0.2750980854034424, "step": 3245, "valid_targets_mean": 3455.2, "valid_targets_min": 1764 }, { "epoch": 5.150554675118859, "grad_norm": 0.9159040940127984, "learning_rate": 7.933213905694003e-06, "loss": 0.3021, "loss_nan_ranks": 0, "loss_rank_avg": 0.3370858132839203, "step": 3250, "valid_targets_mean": 2564.6, "valid_targets_min": 901 }, { "epoch": 5.1584786053882725, "grad_norm": 0.7310111896825241, "learning_rate": 7.87028006593701e-06, "loss": 0.2986, "loss_nan_ranks": 0, "loss_rank_avg": 0.27499884366989136, "step": 3255, "valid_targets_mean": 3558.4, "valid_targets_min": 878 }, { "epoch": 5.166402535657686, "grad_norm": 0.6998508825943974, "learning_rate": 7.807535641759229e-06, "loss": 0.2742, "loss_nan_ranks": 0, "loss_rank_avg": 0.2822907567024231, "step": 3260, "valid_targets_mean": 3665.8, "valid_targets_min": 1305 }, { "epoch": 5.1743264659271, "grad_norm": 0.8038693569296806, "learning_rate": 7.744981612966603e-06, "loss": 0.2694, "loss_nan_ranks": 0, "loss_rank_avg": 0.2702692151069641, "step": 3265, "valid_targets_mean": 3427.2, "valid_targets_min": 1193 }, { "epoch": 5.182250396196514, "grad_norm": 0.8132637134761368, "learning_rate": 7.682618956391854e-06, "loss": 0.2967, "loss_nan_ranks": 0, "loss_rank_avg": 0.297921359539032, "step": 3270, "valid_targets_mean": 3114.1, "valid_targets_min": 933 }, { "epoch": 5.190174326465927, "grad_norm": 0.9332356904299489, "learning_rate": 7.62044864587931e-06, "loss": 0.2928, "loss_nan_ranks": 0, "loss_rank_avg": 0.29001176357269287, "step": 3275, "valid_targets_mean": 2984.0, "valid_targets_min": 1307 }, { "epoch": 5.19809825673534, "grad_norm": 0.8407249660339803, "learning_rate": 7.558471652269628e-06, "loss": 0.2794, "loss_nan_ranks": 0, "loss_rank_avg": 0.29336339235305786, "step": 3280, "valid_targets_mean": 3170.8, "valid_targets_min": 955 }, { "epoch": 5.206022187004755, "grad_norm": 0.7286788825357956, "learning_rate": 7.496688943384665e-06, "loss": 0.2782, "loss_nan_ranks": 0, "loss_rank_avg": 0.2957107424736023, "step": 3285, "valid_targets_mean": 3965.6, "valid_targets_min": 699 }, { "epoch": 5.213946117274168, "grad_norm": 0.843729926958082, "learning_rate": 7.435101484012377e-06, "loss": 0.2966, "loss_nan_ranks": 0, "loss_rank_avg": 0.26785874366760254, "step": 3290, "valid_targets_mean": 2523.9, "valid_targets_min": 1106 }, { "epoch": 5.2218700475435815, "grad_norm": 0.7543573233989669, "learning_rate": 7.37371023589172e-06, "loss": 0.2905, "loss_nan_ranks": 0, "loss_rank_avg": 0.30548304319381714, "step": 3295, "valid_targets_mean": 3348.4, "valid_targets_min": 1143 }, { "epoch": 5.229793977812995, "grad_norm": 0.8415736840199303, "learning_rate": 7.312516157697671e-06, "loss": 0.2811, "loss_nan_ranks": 0, "loss_rank_avg": 0.32893145084381104, "step": 3300, "valid_targets_mean": 3006.1, "valid_targets_min": 1188 }, { "epoch": 5.237717908082409, "grad_norm": 0.8688405311258023, "learning_rate": 7.251520205026206e-06, "loss": 0.279, "loss_nan_ranks": 0, "loss_rank_avg": 0.2774360775947571, "step": 3305, "valid_targets_mean": 2578.9, "valid_targets_min": 917 }, { "epoch": 5.245641838351823, "grad_norm": 0.741755679162456, "learning_rate": 7.190723330379441e-06, "loss": 0.2834, "loss_nan_ranks": 0, "loss_rank_avg": 0.26800817251205444, "step": 3310, "valid_targets_mean": 3866.8, "valid_targets_min": 1128 }, { "epoch": 5.253565768621236, "grad_norm": 0.8672010632197062, "learning_rate": 7.1301264831507034e-06, "loss": 0.2879, "loss_nan_ranks": 0, "loss_rank_avg": 0.30261340737342834, "step": 3315, "valid_targets_mean": 2493.1, "valid_targets_min": 879 }, { "epoch": 5.261489698890649, "grad_norm": 0.7745233459137596, "learning_rate": 7.0697306096097195e-06, "loss": 0.2764, "loss_nan_ranks": 0, "loss_rank_avg": 0.29366734623908997, "step": 3320, "valid_targets_mean": 3542.4, "valid_targets_min": 1182 }, { "epoch": 5.269413629160064, "grad_norm": 0.7143335848995784, "learning_rate": 7.0095366528878785e-06, "loss": 0.2854, "loss_nan_ranks": 0, "loss_rank_avg": 0.28641337156295776, "step": 3325, "valid_targets_mean": 3704.6, "valid_targets_min": 1336 }, { "epoch": 5.277337559429477, "grad_norm": 0.8434525424449542, "learning_rate": 6.949545552963432e-06, "loss": 0.2839, "loss_nan_ranks": 0, "loss_rank_avg": 0.28280267119407654, "step": 3330, "valid_targets_mean": 2677.4, "valid_targets_min": 882 }, { "epoch": 5.2852614896988905, "grad_norm": 0.7211383167902913, "learning_rate": 6.8897582466468935e-06, "loss": 0.2788, "loss_nan_ranks": 0, "loss_rank_avg": 0.23306918144226074, "step": 3335, "valid_targets_mean": 3320.4, "valid_targets_min": 1214 }, { "epoch": 5.293185419968304, "grad_norm": 0.7978182833247313, "learning_rate": 6.830175667566341e-06, "loss": 0.2881, "loss_nan_ranks": 0, "loss_rank_avg": 0.315056711435318, "step": 3340, "valid_targets_mean": 2939.9, "valid_targets_min": 1346 }, { "epoch": 5.301109350237718, "grad_norm": 0.7519981164582723, "learning_rate": 6.770798746152889e-06, "loss": 0.2987, "loss_nan_ranks": 0, "loss_rank_avg": 0.27680274844169617, "step": 3345, "valid_targets_mean": 3183.6, "valid_targets_min": 1318 }, { "epoch": 5.309033280507132, "grad_norm": 0.7260292170527266, "learning_rate": 6.711628409626116e-06, "loss": 0.3043, "loss_nan_ranks": 0, "loss_rank_avg": 0.2554418444633484, "step": 3350, "valid_targets_mean": 3416.9, "valid_targets_min": 936 }, { "epoch": 5.316957210776545, "grad_norm": 0.7180192291084321, "learning_rate": 6.652665581979638e-06, "loss": 0.2615, "loss_nan_ranks": 0, "loss_rank_avg": 0.24962565302848816, "step": 3355, "valid_targets_mean": 3221.9, "valid_targets_min": 1302 }, { "epoch": 5.324881141045958, "grad_norm": 0.8635374138802002, "learning_rate": 6.593911183966619e-06, "loss": 0.3023, "loss_nan_ranks": 0, "loss_rank_avg": 0.3145523965358734, "step": 3360, "valid_targets_mean": 3000.2, "valid_targets_min": 1210 }, { "epoch": 5.332805071315373, "grad_norm": 0.8699435358472265, "learning_rate": 6.53536613308543e-06, "loss": 0.2941, "loss_nan_ranks": 0, "loss_rank_avg": 0.29066410660743713, "step": 3365, "valid_targets_mean": 2882.2, "valid_targets_min": 1138 }, { "epoch": 5.340729001584786, "grad_norm": 0.7867640692640012, "learning_rate": 6.477031343565332e-06, "loss": 0.2849, "loss_nan_ranks": 0, "loss_rank_avg": 0.29037970304489136, "step": 3370, "valid_targets_mean": 3145.4, "valid_targets_min": 860 }, { "epoch": 5.3486529318541995, "grad_norm": 0.7507037278817914, "learning_rate": 6.418907726352153e-06, "loss": 0.2888, "loss_nan_ranks": 0, "loss_rank_avg": 0.2885250449180603, "step": 3375, "valid_targets_mean": 3860.5, "valid_targets_min": 1288 }, { "epoch": 5.356576862123613, "grad_norm": 0.7970118224353988, "learning_rate": 6.36099618909412e-06, "loss": 0.2946, "loss_nan_ranks": 0, "loss_rank_avg": 0.26279422640800476, "step": 3380, "valid_targets_mean": 2864.9, "valid_targets_min": 819 }, { "epoch": 5.364500792393027, "grad_norm": 0.7741426066555225, "learning_rate": 6.303297636127627e-06, "loss": 0.2896, "loss_nan_ranks": 0, "loss_rank_avg": 0.27045324444770813, "step": 3385, "valid_targets_mean": 3207.2, "valid_targets_min": 1124 }, { "epoch": 5.372424722662441, "grad_norm": 0.7127854092350832, "learning_rate": 6.245812968463176e-06, "loss": 0.2816, "loss_nan_ranks": 0, "loss_rank_avg": 0.2626931369304657, "step": 3390, "valid_targets_mean": 3690.8, "valid_targets_min": 1093 }, { "epoch": 5.380348652931854, "grad_norm": 0.7646869762243618, "learning_rate": 6.188543083771237e-06, "loss": 0.2981, "loss_nan_ranks": 0, "loss_rank_avg": 0.27869051694869995, "step": 3395, "valid_targets_mean": 3124.8, "valid_targets_min": 767 }, { "epoch": 5.3882725832012675, "grad_norm": 0.7964101106360405, "learning_rate": 6.131488876368303e-06, "loss": 0.2874, "loss_nan_ranks": 0, "loss_rank_avg": 0.3000558018684387, "step": 3400, "valid_targets_mean": 2870.7, "valid_targets_min": 694 }, { "epoch": 5.396196513470682, "grad_norm": 0.9014007365513332, "learning_rate": 6.074651237202862e-06, "loss": 0.2832, "loss_nan_ranks": 0, "loss_rank_avg": 0.2718481123447418, "step": 3405, "valid_targets_mean": 2537.0, "valid_targets_min": 1225 }, { "epoch": 5.404120443740095, "grad_norm": 0.8463931416869477, "learning_rate": 6.018031053841515e-06, "loss": 0.2897, "loss_nan_ranks": 0, "loss_rank_avg": 0.30765998363494873, "step": 3410, "valid_targets_mean": 2869.0, "valid_targets_min": 1410 }, { "epoch": 5.4120443740095086, "grad_norm": 0.776508481811668, "learning_rate": 5.9616292104551266e-06, "loss": 0.2887, "loss_nan_ranks": 0, "loss_rank_avg": 0.28548675775527954, "step": 3415, "valid_targets_mean": 3247.4, "valid_targets_min": 993 }, { "epoch": 5.419968304278922, "grad_norm": 0.8811837893257158, "learning_rate": 5.905446587804977e-06, "loss": 0.2841, "loss_nan_ranks": 0, "loss_rank_avg": 0.3118222653865814, "step": 3420, "valid_targets_mean": 2474.4, "valid_targets_min": 1138 }, { "epoch": 5.427892234548336, "grad_norm": 0.737052644355842, "learning_rate": 5.849484063229065e-06, "loss": 0.284, "loss_nan_ranks": 0, "loss_rank_avg": 0.26889342069625854, "step": 3425, "valid_targets_mean": 3359.2, "valid_targets_min": 1296 }, { "epoch": 5.43581616481775, "grad_norm": 0.8075780098541901, "learning_rate": 5.793742510628344e-06, "loss": 0.2934, "loss_nan_ranks": 0, "loss_rank_avg": 0.2839280366897583, "step": 3430, "valid_targets_mean": 2892.2, "valid_targets_min": 1268 }, { "epoch": 5.443740095087163, "grad_norm": 0.7504122925838632, "learning_rate": 5.738222800453139e-06, "loss": 0.2905, "loss_nan_ranks": 0, "loss_rank_avg": 0.3097327947616577, "step": 3435, "valid_targets_mean": 3614.0, "valid_targets_min": 1553 }, { "epoch": 5.4516640253565765, "grad_norm": 0.7821341583753948, "learning_rate": 5.682925799689498e-06, "loss": 0.2773, "loss_nan_ranks": 0, "loss_rank_avg": 0.30923694372177124, "step": 3440, "valid_targets_mean": 3298.6, "valid_targets_min": 805 }, { "epoch": 5.459587955625991, "grad_norm": 0.842641770651966, "learning_rate": 5.627852371845684e-06, "loss": 0.2746, "loss_nan_ranks": 0, "loss_rank_avg": 0.2851231098175049, "step": 3445, "valid_targets_mean": 2770.8, "valid_targets_min": 1158 }, { "epoch": 5.467511885895404, "grad_norm": 0.6353722332193599, "learning_rate": 5.573003376938697e-06, "loss": 0.2922, "loss_nan_ranks": 0, "loss_rank_avg": 0.29435908794403076, "step": 3450, "valid_targets_mean": 3954.3, "valid_targets_min": 1330 }, { "epoch": 5.475435816164818, "grad_norm": 0.7328969023306966, "learning_rate": 5.518379671480813e-06, "loss": 0.2783, "loss_nan_ranks": 0, "loss_rank_avg": 0.2865089178085327, "step": 3455, "valid_targets_mean": 3525.1, "valid_targets_min": 823 }, { "epoch": 5.483359746434231, "grad_norm": 0.7860142473044672, "learning_rate": 5.4639821084662455e-06, "loss": 0.2916, "loss_nan_ranks": 0, "loss_rank_avg": 0.29145336151123047, "step": 3460, "valid_targets_mean": 3054.6, "valid_targets_min": 1382 }, { "epoch": 5.491283676703645, "grad_norm": 0.6910554226534089, "learning_rate": 5.409811537357789e-06, "loss": 0.276, "loss_nan_ranks": 0, "loss_rank_avg": 0.25137072801589966, "step": 3465, "valid_targets_mean": 3725.8, "valid_targets_min": 1728 }, { "epoch": 5.499207606973059, "grad_norm": 0.8218007972441929, "learning_rate": 5.355868804073594e-06, "loss": 0.2812, "loss_nan_ranks": 0, "loss_rank_avg": 0.28947368264198303, "step": 3470, "valid_targets_mean": 2976.0, "valid_targets_min": 1010 }, { "epoch": 5.507131537242472, "grad_norm": 0.8486787865272499, "learning_rate": 5.302154750973909e-06, "loss": 0.2706, "loss_nan_ranks": 0, "loss_rank_avg": 0.28270223736763, "step": 3475, "valid_targets_mean": 2702.1, "valid_targets_min": 844 }, { "epoch": 5.5150554675118855, "grad_norm": 0.7386221051012911, "learning_rate": 5.24867021684798e-06, "loss": 0.2811, "loss_nan_ranks": 0, "loss_rank_avg": 0.26117268204689026, "step": 3480, "valid_targets_mean": 2879.7, "valid_targets_min": 1225 }, { "epoch": 5.5229793977813, "grad_norm": 0.8216354291445843, "learning_rate": 5.195416036900906e-06, "loss": 0.2744, "loss_nan_ranks": 0, "loss_rank_avg": 0.26249247789382935, "step": 3485, "valid_targets_mean": 3457.2, "valid_targets_min": 767 }, { "epoch": 5.530903328050713, "grad_norm": 1.2084085528993374, "learning_rate": 5.142393042740617e-06, "loss": 0.319, "loss_nan_ranks": 0, "loss_rank_avg": 0.29814475774765015, "step": 3490, "valid_targets_mean": 3182.1, "valid_targets_min": 305 }, { "epoch": 5.538827258320127, "grad_norm": 0.7634750141593889, "learning_rate": 5.089602062364898e-06, "loss": 0.28, "loss_nan_ranks": 0, "loss_rank_avg": 0.26985257863998413, "step": 3495, "valid_targets_mean": 2986.9, "valid_targets_min": 1617 }, { "epoch": 5.546751188589541, "grad_norm": 0.6904822066759423, "learning_rate": 5.037043920148434e-06, "loss": 0.2863, "loss_nan_ranks": 0, "loss_rank_avg": 0.2691362202167511, "step": 3500, "valid_targets_mean": 3526.2, "valid_targets_min": 1080 }, { "epoch": 5.554675118858954, "grad_norm": 0.7735767982702189, "learning_rate": 4.984719436829966e-06, "loss": 0.2824, "loss_nan_ranks": 0, "loss_rank_avg": 0.2815571129322052, "step": 3505, "valid_targets_mean": 2997.6, "valid_targets_min": 1134 }, { "epoch": 5.562599049128368, "grad_norm": 0.8692993197122556, "learning_rate": 4.932629429499436e-06, "loss": 0.2937, "loss_nan_ranks": 0, "loss_rank_avg": 0.33151981234550476, "step": 3510, "valid_targets_mean": 3003.9, "valid_targets_min": 965 }, { "epoch": 5.570522979397781, "grad_norm": 0.7646591093883555, "learning_rate": 4.880774711585276e-06, "loss": 0.3079, "loss_nan_ranks": 0, "loss_rank_avg": 0.31601202487945557, "step": 3515, "valid_targets_mean": 3189.0, "valid_targets_min": 1157 }, { "epoch": 5.5784469096671945, "grad_norm": 0.8965877881561789, "learning_rate": 4.829156092841663e-06, "loss": 0.2844, "loss_nan_ranks": 0, "loss_rank_avg": 0.32319316267967224, "step": 3520, "valid_targets_mean": 2551.0, "valid_targets_min": 663 }, { "epoch": 5.586370839936609, "grad_norm": 0.8160633796116353, "learning_rate": 4.777774379335885e-06, "loss": 0.285, "loss_nan_ranks": 0, "loss_rank_avg": 0.3042828440666199, "step": 3525, "valid_targets_mean": 3296.0, "valid_targets_min": 1741 }, { "epoch": 5.594294770206022, "grad_norm": 0.7884724935404464, "learning_rate": 4.726630373435783e-06, "loss": 0.2938, "loss_nan_ranks": 0, "loss_rank_avg": 0.2717769145965576, "step": 3530, "valid_targets_mean": 2871.7, "valid_targets_min": 1732 }, { "epoch": 5.602218700475436, "grad_norm": 0.7825057706764867, "learning_rate": 4.675724873797171e-06, "loss": 0.2926, "loss_nan_ranks": 0, "loss_rank_avg": 0.26800742745399475, "step": 3535, "valid_targets_mean": 3067.4, "valid_targets_min": 735 }, { "epoch": 5.61014263074485, "grad_norm": 0.9287978737031195, "learning_rate": 4.625058675351415e-06, "loss": 0.2973, "loss_nan_ranks": 0, "loss_rank_avg": 0.33994632959365845, "step": 3540, "valid_targets_mean": 2602.8, "valid_targets_min": 1256 }, { "epoch": 5.618066561014263, "grad_norm": 0.7094356128210746, "learning_rate": 4.5746325692929735e-06, "loss": 0.283, "loss_nan_ranks": 0, "loss_rank_avg": 0.2771075367927551, "step": 3545, "valid_targets_mean": 3757.5, "valid_targets_min": 916 }, { "epoch": 5.625990491283677, "grad_norm": 0.6859542644396153, "learning_rate": 4.524447343067089e-06, "loss": 0.2785, "loss_nan_ranks": 0, "loss_rank_avg": 0.2836745083332062, "step": 3550, "valid_targets_mean": 4243.0, "valid_targets_min": 1365 }, { "epoch": 5.63391442155309, "grad_norm": 0.7767300135724696, "learning_rate": 4.474503780357435e-06, "loss": 0.2766, "loss_nan_ranks": 0, "loss_rank_avg": 0.2820754647254944, "step": 3555, "valid_targets_mean": 2876.2, "valid_targets_min": 742 }, { "epoch": 5.6418383518225035, "grad_norm": 0.7629257100358653, "learning_rate": 4.424802661073946e-06, "loss": 0.2828, "loss_nan_ranks": 0, "loss_rank_avg": 0.27318716049194336, "step": 3560, "valid_targets_mean": 3280.9, "valid_targets_min": 1270 }, { "epoch": 5.649762282091918, "grad_norm": 0.7934856602984349, "learning_rate": 4.375344761340576e-06, "loss": 0.2829, "loss_nan_ranks": 0, "loss_rank_avg": 0.2571597099304199, "step": 3565, "valid_targets_mean": 2402.7, "valid_targets_min": 853 }, { "epoch": 5.657686212361331, "grad_norm": 0.8440924879483904, "learning_rate": 4.326130853483206e-06, "loss": 0.2937, "loss_nan_ranks": 0, "loss_rank_avg": 0.26417356729507446, "step": 3570, "valid_targets_mean": 2511.9, "valid_targets_min": 1487 }, { "epoch": 5.665610142630745, "grad_norm": 0.7334809221953392, "learning_rate": 4.277161706017605e-06, "loss": 0.2936, "loss_nan_ranks": 0, "loss_rank_avg": 0.28534117341041565, "step": 3575, "valid_targets_mean": 4596.6, "valid_targets_min": 1402 }, { "epoch": 5.673534072900159, "grad_norm": 0.8738186406944687, "learning_rate": 4.228438083637376e-06, "loss": 0.2948, "loss_nan_ranks": 0, "loss_rank_avg": 0.29095956683158875, "step": 3580, "valid_targets_mean": 3154.4, "valid_targets_min": 996 }, { "epoch": 5.681458003169572, "grad_norm": 0.8033107801600781, "learning_rate": 4.179960747202079e-06, "loss": 0.2872, "loss_nan_ranks": 0, "loss_rank_avg": 0.28336301445961, "step": 3585, "valid_targets_mean": 3012.1, "valid_targets_min": 1565 }, { "epoch": 5.689381933438986, "grad_norm": 0.7721918898048784, "learning_rate": 4.1317304537252804e-06, "loss": 0.2702, "loss_nan_ranks": 0, "loss_rank_avg": 0.260518342256546, "step": 3590, "valid_targets_mean": 3144.4, "valid_targets_min": 981 }, { "epoch": 5.697305863708399, "grad_norm": 0.694223463065273, "learning_rate": 4.0837479563627955e-06, "loss": 0.2758, "loss_nan_ranks": 0, "loss_rank_avg": 0.2553626298904419, "step": 3595, "valid_targets_mean": 3345.8, "valid_targets_min": 1444 }, { "epoch": 5.705229793977813, "grad_norm": 0.6331316194608342, "learning_rate": 4.03601400440089e-06, "loss": 0.2821, "loss_nan_ranks": 0, "loss_rank_avg": 0.2481665164232254, "step": 3600, "valid_targets_mean": 3937.8, "valid_targets_min": 944 }, { "epoch": 5.713153724247227, "grad_norm": 0.7590163702300113, "learning_rate": 3.988529343244573e-06, "loss": 0.2817, "loss_nan_ranks": 0, "loss_rank_avg": 0.28363344073295593, "step": 3605, "valid_targets_mean": 3357.2, "valid_targets_min": 1556 }, { "epoch": 5.72107765451664, "grad_norm": 0.7862970467968567, "learning_rate": 3.941294714406001e-06, "loss": 0.2943, "loss_nan_ranks": 0, "loss_rank_avg": 0.26843172311782837, "step": 3610, "valid_targets_mean": 2685.3, "valid_targets_min": 1441 }, { "epoch": 5.729001584786054, "grad_norm": 0.811895324185377, "learning_rate": 3.8943108554928396e-06, "loss": 0.2917, "loss_nan_ranks": 0, "loss_rank_avg": 0.29337239265441895, "step": 3615, "valid_targets_mean": 2627.5, "valid_targets_min": 767 }, { "epoch": 5.736925515055468, "grad_norm": 0.7818395934035374, "learning_rate": 3.8475785001968045e-06, "loss": 0.2905, "loss_nan_ranks": 0, "loss_rank_avg": 0.30510663986206055, "step": 3620, "valid_targets_mean": 3426.6, "valid_targets_min": 1372 }, { "epoch": 5.744849445324881, "grad_norm": 0.7237109014055133, "learning_rate": 3.8010983782821464e-06, "loss": 0.2659, "loss_nan_ranks": 0, "loss_rank_avg": 0.25533539056777954, "step": 3625, "valid_targets_mean": 3133.6, "valid_targets_min": 921 }, { "epoch": 5.752773375594295, "grad_norm": 0.723095303208419, "learning_rate": 3.7548712155743096e-06, "loss": 0.2844, "loss_nan_ranks": 0, "loss_rank_avg": 0.2870684862136841, "step": 3630, "valid_targets_mean": 3996.8, "valid_targets_min": 942 }, { "epoch": 5.760697305863708, "grad_norm": 0.8844100592127758, "learning_rate": 3.708897733948551e-06, "loss": 0.2897, "loss_nan_ranks": 0, "loss_rank_avg": 0.29853054881095886, "step": 3635, "valid_targets_mean": 2297.3, "valid_targets_min": 584 }, { "epoch": 5.768621236133122, "grad_norm": 0.7893659220405335, "learning_rate": 3.6631786513187017e-06, "loss": 0.2857, "loss_nan_ranks": 0, "loss_rank_avg": 0.2839739918708801, "step": 3640, "valid_targets_mean": 3098.4, "valid_targets_min": 1312 }, { "epoch": 5.776545166402536, "grad_norm": 0.7810985118615383, "learning_rate": 3.617714681625939e-06, "loss": 0.2857, "loss_nan_ranks": 0, "loss_rank_avg": 0.2782176733016968, "step": 3645, "valid_targets_mean": 3081.3, "valid_targets_min": 1199 }, { "epoch": 5.784469096671949, "grad_norm": 0.8015794756139869, "learning_rate": 3.5725065348276332e-06, "loss": 0.2964, "loss_nan_ranks": 0, "loss_rank_avg": 0.28658199310302734, "step": 3650, "valid_targets_mean": 3216.1, "valid_targets_min": 1163 }, { "epoch": 5.792393026941363, "grad_norm": 0.8065135711286809, "learning_rate": 3.5275549168862843e-06, "loss": 0.2971, "loss_nan_ranks": 0, "loss_rank_avg": 0.3158048391342163, "step": 3655, "valid_targets_mean": 3061.4, "valid_targets_min": 1504 }, { "epoch": 5.800316957210777, "grad_norm": 0.7907193883577602, "learning_rate": 3.482860529758467e-06, "loss": 0.2861, "loss_nan_ranks": 0, "loss_rank_avg": 0.2796323895454407, "step": 3660, "valid_targets_mean": 2935.3, "valid_targets_min": 1241 }, { "epoch": 5.80824088748019, "grad_norm": 0.8415609267338444, "learning_rate": 3.4384240713839034e-06, "loss": 0.3084, "loss_nan_ranks": 0, "loss_rank_avg": 0.3068225383758545, "step": 3665, "valid_targets_mean": 3065.4, "valid_targets_min": 1341 }, { "epoch": 5.816164817749604, "grad_norm": 1.0611550853060565, "learning_rate": 3.3942462356745188e-06, "loss": 0.2793, "loss_nan_ranks": 0, "loss_rank_avg": 0.285479873418808, "step": 3670, "valid_targets_mean": 3949.0, "valid_targets_min": 1399 }, { "epoch": 5.824088748019017, "grad_norm": 0.8018422821150991, "learning_rate": 3.350327712503665e-06, "loss": 0.296, "loss_nan_ranks": 0, "loss_rank_avg": 0.29329565167427063, "step": 3675, "valid_targets_mean": 3313.6, "valid_targets_min": 672 }, { "epoch": 5.832012678288431, "grad_norm": 0.8030610419531269, "learning_rate": 3.306669187695286e-06, "loss": 0.2761, "loss_nan_ranks": 0, "loss_rank_avg": 0.25516191124916077, "step": 3680, "valid_targets_mean": 2793.8, "valid_targets_min": 1390 }, { "epoch": 5.839936608557845, "grad_norm": 0.761756852048967, "learning_rate": 3.2632713430132502e-06, "loss": 0.2669, "loss_nan_ranks": 0, "loss_rank_avg": 0.2513202130794525, "step": 3685, "valid_targets_mean": 3200.6, "valid_targets_min": 1081 }, { "epoch": 5.847860538827258, "grad_norm": 1.1902444568785213, "learning_rate": 3.220134856150692e-06, "loss": 0.2894, "loss_nan_ranks": 0, "loss_rank_avg": 0.2957605719566345, "step": 3690, "valid_targets_mean": 2885.6, "valid_targets_min": 834 }, { "epoch": 5.855784469096672, "grad_norm": 0.7866773610863317, "learning_rate": 3.177260400719422e-06, "loss": 0.295, "loss_nan_ranks": 0, "loss_rank_avg": 0.28008750081062317, "step": 3695, "valid_targets_mean": 4172.1, "valid_targets_min": 1492 }, { "epoch": 5.863708399366086, "grad_norm": 0.8126826054651635, "learning_rate": 3.134648646239422e-06, "loss": 0.2904, "loss_nan_ranks": 0, "loss_rank_avg": 0.2800007462501526, "step": 3700, "valid_targets_mean": 2865.2, "valid_targets_min": 1157 }, { "epoch": 5.871632329635499, "grad_norm": 0.7014430955558992, "learning_rate": 3.092300258128369e-06, "loss": 0.28, "loss_nan_ranks": 0, "loss_rank_avg": 0.2964010238647461, "step": 3705, "valid_targets_mean": 3767.6, "valid_targets_min": 778 }, { "epoch": 5.879556259904913, "grad_norm": 0.9601998578307006, "learning_rate": 3.0502158976912733e-06, "loss": 0.2839, "loss_nan_ranks": 0, "loss_rank_avg": 0.2710258960723877, "step": 3710, "valid_targets_mean": 2326.4, "valid_targets_min": 1060 }, { "epoch": 5.887480190174326, "grad_norm": 0.8008616041237828, "learning_rate": 3.0083962221101193e-06, "loss": 0.2822, "loss_nan_ranks": 0, "loss_rank_avg": 0.27677208185195923, "step": 3715, "valid_targets_mean": 2879.9, "valid_targets_min": 1298 }, { "epoch": 5.89540412044374, "grad_norm": 0.7720062924445003, "learning_rate": 2.9668418844336356e-06, "loss": 0.2959, "loss_nan_ranks": 0, "loss_rank_avg": 0.26314905285835266, "step": 3720, "valid_targets_mean": 3117.0, "valid_targets_min": 1529 }, { "epoch": 5.903328050713154, "grad_norm": 0.964559252585821, "learning_rate": 2.9255535335670673e-06, "loss": 0.3036, "loss_nan_ranks": 0, "loss_rank_avg": 0.30997902154922485, "step": 3725, "valid_targets_mean": 2333.3, "valid_targets_min": 973 }, { "epoch": 5.911251980982567, "grad_norm": 0.863580039309836, "learning_rate": 2.8845318142620526e-06, "loss": 0.3075, "loss_nan_ranks": 0, "loss_rank_avg": 0.3259606957435608, "step": 3730, "valid_targets_mean": 2724.1, "valid_targets_min": 719 }, { "epoch": 5.919175911251981, "grad_norm": 0.7223684462952389, "learning_rate": 2.8437773671065796e-06, "loss": 0.2783, "loss_nan_ranks": 0, "loss_rank_avg": 0.2662881910800934, "step": 3735, "valid_targets_mean": 3433.8, "valid_targets_min": 845 }, { "epoch": 5.927099841521395, "grad_norm": 0.8997397517104827, "learning_rate": 2.803290828514935e-06, "loss": 0.3036, "loss_nan_ranks": 0, "loss_rank_avg": 0.2858402729034424, "step": 3740, "valid_targets_mean": 2252.3, "valid_targets_min": 795 }, { "epoch": 5.935023771790808, "grad_norm": 1.257589056146217, "learning_rate": 2.7630728307178166e-06, "loss": 0.2945, "loss_nan_ranks": 0, "loss_rank_avg": 0.3157416582107544, "step": 3745, "valid_targets_mean": 3201.3, "valid_targets_min": 1047 }, { "epoch": 5.942947702060222, "grad_norm": 1.004305514240146, "learning_rate": 2.723124001752415e-06, "loss": 0.3019, "loss_nan_ranks": 0, "loss_rank_avg": 0.294961541891098, "step": 3750, "valid_targets_mean": 1967.2, "valid_targets_min": 842 }, { "epoch": 5.950871632329635, "grad_norm": 0.9606671850132081, "learning_rate": 2.6834449654526463e-06, "loss": 0.2946, "loss_nan_ranks": 0, "loss_rank_avg": 0.34209227561950684, "step": 3755, "valid_targets_mean": 2170.5, "valid_targets_min": 720 }, { "epoch": 5.958795562599049, "grad_norm": 0.7957342434386907, "learning_rate": 2.6440363414393776e-06, "loss": 0.2809, "loss_nan_ranks": 0, "loss_rank_avg": 0.2978052496910095, "step": 3760, "valid_targets_mean": 2861.3, "valid_targets_min": 1318 }, { "epoch": 5.966719492868463, "grad_norm": 0.906718243376995, "learning_rate": 2.6048987451107667e-06, "loss": 0.305, "loss_nan_ranks": 0, "loss_rank_avg": 0.34471917152404785, "step": 3765, "valid_targets_mean": 2459.7, "valid_targets_min": 919 }, { "epoch": 5.974643423137876, "grad_norm": 0.9374249518211754, "learning_rate": 2.5660327876326596e-06, "loss": 0.2923, "loss_nan_ranks": 0, "loss_rank_avg": 0.31891578435897827, "step": 3770, "valid_targets_mean": 2455.0, "valid_targets_min": 949 }, { "epoch": 5.9825673534072905, "grad_norm": 0.7160565242876318, "learning_rate": 2.527439075929028e-06, "loss": 0.2773, "loss_nan_ranks": 0, "loss_rank_avg": 0.250852108001709, "step": 3775, "valid_targets_mean": 3327.8, "valid_targets_min": 1186 }, { "epoch": 5.990491283676704, "grad_norm": 0.8255785273755935, "learning_rate": 2.489118212672512e-06, "loss": 0.2854, "loss_nan_ranks": 0, "loss_rank_avg": 0.3088967204093933, "step": 3780, "valid_targets_mean": 2943.2, "valid_targets_min": 800 }, { "epoch": 5.998415213946117, "grad_norm": 0.6942790595633246, "learning_rate": 2.4510707962749813e-06, "loss": 0.2731, "loss_nan_ranks": 0, "loss_rank_avg": 0.31014499068260193, "step": 3785, "valid_targets_mean": 4262.9, "valid_targets_min": 1053 }, { "epoch": 6.006339144215531, "grad_norm": 0.8405826416690129, "learning_rate": 2.413297420878231e-06, "loss": 0.2736, "loss_nan_ranks": 0, "loss_rank_avg": 0.2536356449127197, "step": 3790, "valid_targets_mean": 2973.3, "valid_targets_min": 819 }, { "epoch": 6.014263074484944, "grad_norm": 0.9255627668051156, "learning_rate": 2.375798676344652e-06, "loss": 0.2809, "loss_nan_ranks": 0, "loss_rank_avg": 0.3057909607887268, "step": 3795, "valid_targets_mean": 2337.0, "valid_targets_min": 824 }, { "epoch": 6.022187004754358, "grad_norm": 0.7408039931277529, "learning_rate": 2.338575148248077e-06, "loss": 0.2651, "loss_nan_ranks": 0, "loss_rank_avg": 0.2888672649860382, "step": 3800, "valid_targets_mean": 3384.5, "valid_targets_min": 996 }, { "epoch": 6.030110935023772, "grad_norm": 0.744846896666886, "learning_rate": 2.3016274178645826e-06, "loss": 0.2702, "loss_nan_ranks": 0, "loss_rank_avg": 0.2156473994255066, "step": 3805, "valid_targets_mean": 3281.6, "valid_targets_min": 1175 }, { "epoch": 6.038034865293185, "grad_norm": 1.0372675808168368, "learning_rate": 2.264956062163448e-06, "loss": 0.282, "loss_nan_ranks": 0, "loss_rank_avg": 0.28580576181411743, "step": 3810, "valid_targets_mean": 3315.4, "valid_targets_min": 1034 }, { "epoch": 6.045958795562599, "grad_norm": 0.7812177830894746, "learning_rate": 2.2285616537981382e-06, "loss": 0.2923, "loss_nan_ranks": 0, "loss_rank_avg": 0.31875208020210266, "step": 3815, "valid_targets_mean": 3482.0, "valid_targets_min": 825 }, { "epoch": 6.053882725832013, "grad_norm": 0.9237011609509943, "learning_rate": 2.192444761097341e-06, "loss": 0.2904, "loss_nan_ranks": 0, "loss_rank_avg": 0.29322725534439087, "step": 3820, "valid_targets_mean": 2307.0, "valid_targets_min": 842 }, { "epoch": 6.061806656101426, "grad_norm": 0.8990191236648827, "learning_rate": 2.1566059480561276e-06, "loss": 0.285, "loss_nan_ranks": 0, "loss_rank_avg": 0.2766517698764801, "step": 3825, "valid_targets_mean": 2363.1, "valid_targets_min": 941 }, { "epoch": 6.06973058637084, "grad_norm": 0.7361355418620003, "learning_rate": 2.1210457743271173e-06, "loss": 0.2865, "loss_nan_ranks": 0, "loss_rank_avg": 0.2930822968482971, "step": 3830, "valid_targets_mean": 3734.8, "valid_targets_min": 1547 }, { "epoch": 6.077654516640253, "grad_norm": 0.9139892229625006, "learning_rate": 2.085764795211742e-06, "loss": 0.2707, "loss_nan_ranks": 0, "loss_rank_avg": 0.2555992603302002, "step": 3835, "valid_targets_mean": 3034.4, "valid_targets_min": 1277 }, { "epoch": 6.085578446909667, "grad_norm": 0.771123933373858, "learning_rate": 2.0507635616515896e-06, "loss": 0.2785, "loss_nan_ranks": 0, "loss_rank_avg": 0.2631310224533081, "step": 3840, "valid_targets_mean": 2985.9, "valid_targets_min": 1237 }, { "epoch": 6.093502377179081, "grad_norm": 0.7897490876583761, "learning_rate": 2.0160426202197782e-06, "loss": 0.2692, "loss_nan_ranks": 0, "loss_rank_avg": 0.2618263363838196, "step": 3845, "valid_targets_mean": 3156.4, "valid_targets_min": 1103 }, { "epoch": 6.101426307448494, "grad_norm": 0.7722775214717016, "learning_rate": 1.981602513112446e-06, "loss": 0.2793, "loss_nan_ranks": 0, "loss_rank_avg": 0.24826066195964813, "step": 3850, "valid_targets_mean": 3438.9, "valid_targets_min": 889 }, { "epoch": 6.1093502377179085, "grad_norm": 0.7058163459626046, "learning_rate": 1.947443778140259e-06, "loss": 0.2831, "loss_nan_ranks": 0, "loss_rank_avg": 0.3340873420238495, "step": 3855, "valid_targets_mean": 4009.1, "valid_targets_min": 613 }, { "epoch": 6.117274167987322, "grad_norm": 0.8569365221631509, "learning_rate": 1.9135669487200404e-06, "loss": 0.2814, "loss_nan_ranks": 0, "loss_rank_avg": 0.29067397117614746, "step": 3860, "valid_targets_mean": 3074.8, "valid_targets_min": 804 }, { "epoch": 6.125198098256735, "grad_norm": 0.7812766506289543, "learning_rate": 1.8799725538664138e-06, "loss": 0.2773, "loss_nan_ranks": 0, "loss_rank_avg": 0.24928317964076996, "step": 3865, "valid_targets_mean": 3012.5, "valid_targets_min": 756 }, { "epoch": 6.133122028526149, "grad_norm": 0.8199444138458281, "learning_rate": 1.8466611181835504e-06, "loss": 0.2884, "loss_nan_ranks": 0, "loss_rank_avg": 0.26236987113952637, "step": 3870, "valid_targets_mean": 2752.6, "valid_targets_min": 1398 }, { "epoch": 6.141045958795562, "grad_norm": 0.7536336080898335, "learning_rate": 1.813633161856998e-06, "loss": 0.2685, "loss_nan_ranks": 0, "loss_rank_avg": 0.2606717348098755, "step": 3875, "valid_targets_mean": 3515.2, "valid_targets_min": 1170 }, { "epoch": 6.148969889064976, "grad_norm": 1.296674137353546, "learning_rate": 1.7808892006455236e-06, "loss": 0.2696, "loss_nan_ranks": 0, "loss_rank_avg": 0.25334101915359497, "step": 3880, "valid_targets_mean": 3008.9, "valid_targets_min": 959 }, { "epoch": 6.15689381933439, "grad_norm": 0.8549376573866226, "learning_rate": 1.7484297458730903e-06, "loss": 0.2679, "loss_nan_ranks": 0, "loss_rank_avg": 0.27031368017196655, "step": 3885, "valid_targets_mean": 2541.9, "valid_targets_min": 1088 }, { "epoch": 6.164817749603803, "grad_norm": 0.8660477974763549, "learning_rate": 1.7162553044208397e-06, "loss": 0.2765, "loss_nan_ranks": 0, "loss_rank_avg": 0.27956318855285645, "step": 3890, "valid_targets_mean": 2584.7, "valid_targets_min": 836 }, { "epoch": 6.1727416798732175, "grad_norm": 0.711909383806564, "learning_rate": 1.6843663787192198e-06, "loss": 0.2566, "loss_nan_ranks": 0, "loss_rank_avg": 0.25135537981987, "step": 3895, "valid_targets_mean": 3468.3, "valid_targets_min": 1001 }, { "epoch": 6.180665610142631, "grad_norm": 0.7256194141801523, "learning_rate": 1.6527634667400905e-06, "loss": 0.2794, "loss_nan_ranks": 0, "loss_rank_avg": 0.2889530658721924, "step": 3900, "valid_targets_mean": 3539.7, "valid_targets_min": 747 }, { "epoch": 6.188589540412044, "grad_norm": 0.89965843002777, "learning_rate": 1.621447061988992e-06, "loss": 0.2734, "loss_nan_ranks": 0, "loss_rank_avg": 0.28266841173171997, "step": 3905, "valid_targets_mean": 2481.8, "valid_targets_min": 1242 }, { "epoch": 6.196513470681458, "grad_norm": 0.6424467869924108, "learning_rate": 1.5904176534974026e-06, "loss": 0.2785, "loss_nan_ranks": 0, "loss_rank_avg": 0.2667967677116394, "step": 3910, "valid_targets_mean": 4722.1, "valid_targets_min": 1482 }, { "epoch": 6.204437400950872, "grad_norm": 0.7166598681182121, "learning_rate": 1.559675725815124e-06, "loss": 0.2644, "loss_nan_ranks": 0, "loss_rank_avg": 0.2644422650337219, "step": 3915, "valid_targets_mean": 3448.1, "valid_targets_min": 1400 }, { "epoch": 6.212361331220285, "grad_norm": 0.6883227021978096, "learning_rate": 1.5292217590027126e-06, "loss": 0.275, "loss_nan_ranks": 0, "loss_rank_avg": 0.2776218056678772, "step": 3920, "valid_targets_mean": 3848.3, "valid_targets_min": 1314 }, { "epoch": 6.220285261489699, "grad_norm": 0.8216293331586425, "learning_rate": 1.4990562286239651e-06, "loss": 0.2916, "loss_nan_ranks": 0, "loss_rank_avg": 0.27567949891090393, "step": 3925, "valid_targets_mean": 2947.2, "valid_targets_min": 1357 }, { "epoch": 6.228209191759112, "grad_norm": 0.8066020986178258, "learning_rate": 1.4691796057385222e-06, "loss": 0.2906, "loss_nan_ranks": 0, "loss_rank_avg": 0.32604455947875977, "step": 3930, "valid_targets_mean": 3126.6, "valid_targets_min": 1571 }, { "epoch": 6.2361331220285265, "grad_norm": 0.7786528543223891, "learning_rate": 1.4395923568944792e-06, "loss": 0.2773, "loss_nan_ranks": 0, "loss_rank_avg": 0.2671036422252655, "step": 3935, "valid_targets_mean": 3246.4, "valid_targets_min": 720 }, { "epoch": 6.24405705229794, "grad_norm": 0.720991179266921, "learning_rate": 1.4102949441211333e-06, "loss": 0.2628, "loss_nan_ranks": 0, "loss_rank_avg": 0.2621596157550812, "step": 3940, "valid_targets_mean": 3775.2, "valid_targets_min": 1717 }, { "epoch": 6.251980982567353, "grad_norm": 0.8635951163563789, "learning_rate": 1.3812878249217375e-06, "loss": 0.2719, "loss_nan_ranks": 0, "loss_rank_avg": 0.2590984106063843, "step": 3945, "valid_targets_mean": 2491.5, "valid_targets_min": 830 }, { "epoch": 6.259904912836767, "grad_norm": 0.8055705967233836, "learning_rate": 1.3525714522663802e-06, "loss": 0.2886, "loss_nan_ranks": 0, "loss_rank_avg": 0.2969766855239868, "step": 3950, "valid_targets_mean": 3152.1, "valid_targets_min": 1546 }, { "epoch": 6.267828843106181, "grad_norm": 0.8212779657990703, "learning_rate": 1.3241462745849032e-06, "loss": 0.2755, "loss_nan_ranks": 0, "loss_rank_avg": 0.2703918516635895, "step": 3955, "valid_targets_mean": 2716.7, "valid_targets_min": 1124 }, { "epoch": 6.2757527733755945, "grad_norm": 0.7792393371884195, "learning_rate": 1.2960127357598907e-06, "loss": 0.2741, "loss_nan_ranks": 0, "loss_rank_avg": 0.29034721851348877, "step": 3960, "valid_targets_mean": 3387.6, "valid_targets_min": 1440 }, { "epoch": 6.283676703645008, "grad_norm": 0.7746891412107202, "learning_rate": 1.2681712751197561e-06, "loss": 0.2656, "loss_nan_ranks": 0, "loss_rank_avg": 0.27121007442474365, "step": 3965, "valid_targets_mean": 3463.2, "valid_targets_min": 1184 }, { "epoch": 6.291600633914421, "grad_norm": 0.7782249097983254, "learning_rate": 1.2406223274318619e-06, "loss": 0.2889, "loss_nan_ranks": 0, "loss_rank_avg": 0.2974588871002197, "step": 3970, "valid_targets_mean": 3313.4, "valid_targets_min": 1128 }, { "epoch": 6.2995245641838356, "grad_norm": 0.7412856374389678, "learning_rate": 1.2133663228957483e-06, "loss": 0.2672, "loss_nan_ranks": 0, "loss_rank_avg": 0.2881653606891632, "step": 3975, "valid_targets_mean": 3866.8, "valid_targets_min": 1073 }, { "epoch": 6.307448494453249, "grad_norm": 0.8312977029113554, "learning_rate": 1.186403687136397e-06, "loss": 0.2822, "loss_nan_ranks": 0, "loss_rank_avg": 0.27708035707473755, "step": 3980, "valid_targets_mean": 3342.8, "valid_targets_min": 933 }, { "epoch": 6.315372424722662, "grad_norm": 0.8197541649986204, "learning_rate": 1.1597348411976038e-06, "loss": 0.2835, "loss_nan_ranks": 0, "loss_rank_avg": 0.2698556184768677, "step": 3985, "valid_targets_mean": 3237.8, "valid_targets_min": 951 }, { "epoch": 6.323296354992076, "grad_norm": 0.8471159114422045, "learning_rate": 1.1333602015353896e-06, "loss": 0.2593, "loss_nan_ranks": 0, "loss_rank_avg": 0.26829445362091064, "step": 3990, "valid_targets_mean": 3004.6, "valid_targets_min": 928 }, { "epoch": 6.33122028526149, "grad_norm": 0.7503125828764259, "learning_rate": 1.1072801800114985e-06, "loss": 0.2783, "loss_nan_ranks": 0, "loss_rank_avg": 0.2777388393878937, "step": 3995, "valid_targets_mean": 3267.4, "valid_targets_min": 947 }, { "epoch": 6.3391442155309035, "grad_norm": 0.8175380063542717, "learning_rate": 1.0814951838869758e-06, "loss": 0.2937, "loss_nan_ranks": 0, "loss_rank_avg": 0.3123356103897095, "step": 4000, "valid_targets_mean": 2992.7, "valid_targets_min": 950 }, { "epoch": 6.347068145800317, "grad_norm": 0.6162025832470477, "learning_rate": 1.0560056158157938e-06, "loss": 0.258, "loss_nan_ranks": 0, "loss_rank_avg": 0.2392377257347107, "step": 4005, "valid_targets_mean": 4391.2, "valid_targets_min": 1106 }, { "epoch": 6.35499207606973, "grad_norm": 0.7072834519407339, "learning_rate": 1.0308118738385865e-06, "loss": 0.2742, "loss_nan_ranks": 0, "loss_rank_avg": 0.2674199938774109, "step": 4010, "valid_targets_mean": 4024.9, "valid_targets_min": 832 }, { "epoch": 6.362916006339145, "grad_norm": 0.7287197281341509, "learning_rate": 1.0059143513764003e-06, "loss": 0.2864, "loss_nan_ranks": 0, "loss_rank_avg": 0.2720893621444702, "step": 4015, "valid_targets_mean": 3626.2, "valid_targets_min": 1144 }, { "epoch": 6.370839936608558, "grad_norm": 0.7782133569731706, "learning_rate": 9.81313437224587e-07, "loss": 0.2712, "loss_nan_ranks": 0, "loss_rank_avg": 0.2739805579185486, "step": 4020, "valid_targets_mean": 3153.7, "valid_targets_min": 1323 }, { "epoch": 6.378763866877971, "grad_norm": 1.0460021255922092, "learning_rate": 9.57009515546703e-07, "loss": 0.2802, "loss_nan_ranks": 0, "loss_rank_avg": 0.28859415650367737, "step": 4025, "valid_targets_mean": 3569.7, "valid_targets_min": 724 }, { "epoch": 6.386687797147385, "grad_norm": 0.7562261910777165, "learning_rate": 9.330029658685302e-07, "loss": 0.2564, "loss_nan_ranks": 0, "loss_rank_avg": 0.27344030141830444, "step": 4030, "valid_targets_mean": 3449.7, "valid_targets_min": 1592 }, { "epoch": 6.394611727416799, "grad_norm": 0.8544761844509305, "learning_rate": 9.092941630721363e-07, "loss": 0.2943, "loss_nan_ranks": 0, "loss_rank_avg": 0.29668188095092773, "step": 4035, "valid_targets_mean": 2992.6, "valid_targets_min": 1013 }, { "epoch": 6.4025356576862125, "grad_norm": 0.6668053311414428, "learning_rate": 8.85883477390026e-07, "loss": 0.2447, "loss_nan_ranks": 0, "loss_rank_avg": 0.24657505750656128, "step": 4040, "valid_targets_mean": 3835.4, "valid_targets_min": 1336 }, { "epoch": 6.410459587955626, "grad_norm": 0.7216857447286184, "learning_rate": 8.627712743993655e-07, "loss": 0.2701, "loss_nan_ranks": 0, "loss_rank_avg": 0.2436390221118927, "step": 4045, "valid_targets_mean": 3372.4, "valid_targets_min": 1404 }, { "epoch": 6.418383518225039, "grad_norm": 1.0127403923030123, "learning_rate": 8.399579150162585e-07, "loss": 0.273, "loss_nan_ranks": 0, "loss_rank_avg": 0.2674424648284912, "step": 4050, "valid_targets_mean": 3369.4, "valid_targets_min": 1352 }, { "epoch": 6.426307448494454, "grad_norm": 0.8241874728542988, "learning_rate": 8.174437554901304e-07, "loss": 0.2989, "loss_nan_ranks": 0, "loss_rank_avg": 0.262814462184906, "step": 4055, "valid_targets_mean": 3054.7, "valid_targets_min": 967 }, { "epoch": 6.434231378763867, "grad_norm": 0.7415633298787859, "learning_rate": 7.9522914739814e-07, "loss": 0.2872, "loss_nan_ranks": 0, "loss_rank_avg": 0.257989764213562, "step": 4060, "valid_targets_mean": 3583.1, "valid_targets_min": 1582 }, { "epoch": 6.44215530903328, "grad_norm": 0.7949440857800341, "learning_rate": 7.733144376397184e-07, "loss": 0.2785, "loss_nan_ranks": 0, "loss_rank_avg": 0.28058376908302307, "step": 4065, "valid_targets_mean": 2917.6, "valid_targets_min": 969 }, { "epoch": 6.450079239302694, "grad_norm": 0.7943902641247984, "learning_rate": 7.516999684311277e-07, "loss": 0.2675, "loss_nan_ranks": 0, "loss_rank_avg": 0.26108643412590027, "step": 4070, "valid_targets_mean": 3074.9, "valid_targets_min": 904 }, { "epoch": 6.458003169572108, "grad_norm": 0.8282850201666918, "learning_rate": 7.303860773001248e-07, "loss": 0.2703, "loss_nan_ranks": 0, "loss_rank_avg": 0.2973766624927521, "step": 4075, "valid_targets_mean": 3289.0, "valid_targets_min": 1388 }, { "epoch": 6.4659270998415215, "grad_norm": 0.8612035667904403, "learning_rate": 7.093730970807034e-07, "loss": 0.2966, "loss_nan_ranks": 0, "loss_rank_avg": 0.2724660336971283, "step": 4080, "valid_targets_mean": 2506.1, "valid_targets_min": 1134 }, { "epoch": 6.473851030110935, "grad_norm": 0.7705878492600347, "learning_rate": 6.88661355907867e-07, "loss": 0.28, "loss_nan_ranks": 0, "loss_rank_avg": 0.2626793384552002, "step": 4085, "valid_targets_mean": 3173.4, "valid_targets_min": 1241 }, { "epoch": 6.481774960380348, "grad_norm": 0.8293774983470878, "learning_rate": 6.682511772125422e-07, "loss": 0.2936, "loss_nan_ranks": 0, "loss_rank_avg": 0.2623213529586792, "step": 4090, "valid_targets_mean": 2695.9, "valid_targets_min": 1083 }, { "epoch": 6.489698890649763, "grad_norm": 0.7185734573332064, "learning_rate": 6.481428797164957e-07, "loss": 0.277, "loss_nan_ranks": 0, "loss_rank_avg": 0.2767176628112793, "step": 4095, "valid_targets_mean": 3695.9, "valid_targets_min": 1610 }, { "epoch": 6.497622820919176, "grad_norm": 0.7192376832208326, "learning_rate": 6.283367774273785e-07, "loss": 0.2678, "loss_nan_ranks": 0, "loss_rank_avg": 0.2640265226364136, "step": 4100, "valid_targets_mean": 3505.2, "valid_targets_min": 749 }, { "epoch": 6.505546751188589, "grad_norm": 0.7821908648146034, "learning_rate": 6.088331796338032e-07, "loss": 0.2762, "loss_nan_ranks": 0, "loss_rank_avg": 0.2534036934375763, "step": 4105, "valid_targets_mean": 3527.4, "valid_targets_min": 1362 }, { "epoch": 6.513470681458003, "grad_norm": 0.8284059543758624, "learning_rate": 5.896323909005408e-07, "loss": 0.2658, "loss_nan_ranks": 0, "loss_rank_avg": 0.2960991859436035, "step": 4110, "valid_targets_mean": 2956.4, "valid_targets_min": 1221 }, { "epoch": 6.521394611727417, "grad_norm": 0.7318982088006352, "learning_rate": 5.707347110637363e-07, "loss": 0.2877, "loss_nan_ranks": 0, "loss_rank_avg": 0.2784423530101776, "step": 4115, "valid_targets_mean": 3589.7, "valid_targets_min": 1266 }, { "epoch": 6.5293185419968305, "grad_norm": 0.8037460574946733, "learning_rate": 5.521404352262427e-07, "loss": 0.2755, "loss_nan_ranks": 0, "loss_rank_avg": 0.2540718913078308, "step": 4120, "valid_targets_mean": 3112.4, "valid_targets_min": 809 }, { "epoch": 6.537242472266244, "grad_norm": 0.8562375564350958, "learning_rate": 5.338498537530146e-07, "loss": 0.2764, "loss_nan_ranks": 0, "loss_rank_avg": 0.2838800549507141, "step": 4125, "valid_targets_mean": 2713.3, "valid_targets_min": 613 }, { "epoch": 6.545166402535658, "grad_norm": 0.8404101038916709, "learning_rate": 5.158632522665619e-07, "loss": 0.306, "loss_nan_ranks": 0, "loss_rank_avg": 0.27864933013916016, "step": 4130, "valid_targets_mean": 2579.3, "valid_targets_min": 1006 }, { "epoch": 6.553090332805072, "grad_norm": 0.8903943414798002, "learning_rate": 4.981809116424985e-07, "loss": 0.2783, "loss_nan_ranks": 0, "loss_rank_avg": 0.276671826839447, "step": 4135, "valid_targets_mean": 2540.3, "valid_targets_min": 735 }, { "epoch": 6.561014263074485, "grad_norm": 0.7783873275285311, "learning_rate": 4.808031080051545e-07, "loss": 0.2749, "loss_nan_ranks": 0, "loss_rank_avg": 0.29601848125457764, "step": 4140, "valid_targets_mean": 3532.1, "valid_targets_min": 987 }, { "epoch": 6.568938193343898, "grad_norm": 0.8487222802895167, "learning_rate": 4.637301127232663e-07, "loss": 0.2693, "loss_nan_ranks": 0, "loss_rank_avg": 0.2824670672416687, "step": 4145, "valid_targets_mean": 2751.2, "valid_targets_min": 1035 }, { "epoch": 6.576862123613312, "grad_norm": 0.7810288925443892, "learning_rate": 4.4696219240573327e-07, "loss": 0.2796, "loss_nan_ranks": 0, "loss_rank_avg": 0.29629069566726685, "step": 4150, "valid_targets_mean": 3234.6, "valid_targets_min": 1025 }, { "epoch": 6.584786053882726, "grad_norm": 0.6639163886957854, "learning_rate": 4.3049960889745666e-07, "loss": 0.2898, "loss_nan_ranks": 0, "loss_rank_avg": 0.2679304778575897, "step": 4155, "valid_targets_mean": 4046.2, "valid_targets_min": 2034 }, { "epoch": 6.5927099841521395, "grad_norm": 0.766246752720584, "learning_rate": 4.143426192752542e-07, "loss": 0.2723, "loss_nan_ranks": 0, "loss_rank_avg": 0.2746524214744568, "step": 4160, "valid_targets_mean": 3666.3, "valid_targets_min": 1545 }, { "epoch": 6.600633914421553, "grad_norm": 0.8536786529200687, "learning_rate": 3.984914758438407e-07, "loss": 0.2995, "loss_nan_ranks": 0, "loss_rank_avg": 0.3148544728755951, "step": 4165, "valid_targets_mean": 3556.8, "valid_targets_min": 502 }, { "epoch": 6.608557844690967, "grad_norm": 0.8388466221341304, "learning_rate": 3.8294642613189603e-07, "loss": 0.2902, "loss_nan_ranks": 0, "loss_rank_avg": 0.2988848388195038, "step": 4170, "valid_targets_mean": 3141.4, "valid_targets_min": 1034 }, { "epoch": 6.616481774960381, "grad_norm": 0.8546205962148445, "learning_rate": 3.6770771288818563e-07, "loss": 0.2814, "loss_nan_ranks": 0, "loss_rank_avg": 0.2964688539505005, "step": 4175, "valid_targets_mean": 2680.8, "valid_targets_min": 1146 }, { "epoch": 6.624405705229794, "grad_norm": 0.6352285540163427, "learning_rate": 3.5277557407778605e-07, "loss": 0.2727, "loss_nan_ranks": 0, "loss_rank_avg": 0.26553648710250854, "step": 4180, "valid_targets_mean": 4059.6, "valid_targets_min": 1237 }, { "epoch": 6.632329635499207, "grad_norm": 0.9620640961546393, "learning_rate": 3.3815024287835895e-07, "loss": 0.2931, "loss_nan_ranks": 0, "loss_rank_avg": 0.3085815906524658, "step": 4185, "valid_targets_mean": 2293.6, "valid_targets_min": 768 }, { "epoch": 6.640253565768621, "grad_norm": 0.7540474372071029, "learning_rate": 3.2383194767650947e-07, "loss": 0.2763, "loss_nan_ranks": 0, "loss_rank_avg": 0.257649302482605, "step": 4190, "valid_targets_mean": 3436.9, "valid_targets_min": 1402 }, { "epoch": 6.648177496038035, "grad_norm": 0.8249666226190281, "learning_rate": 3.098209120642248e-07, "loss": 0.2866, "loss_nan_ranks": 0, "loss_rank_avg": 0.2894267737865448, "step": 4195, "valid_targets_mean": 3102.8, "valid_targets_min": 1485 }, { "epoch": 6.6561014263074485, "grad_norm": 0.7985618899920006, "learning_rate": 2.9611735483537684e-07, "loss": 0.2793, "loss_nan_ranks": 0, "loss_rank_avg": 0.29402169585227966, "step": 4200, "valid_targets_mean": 3086.1, "valid_targets_min": 923 }, { "epoch": 6.664025356576862, "grad_norm": 0.7971335823491561, "learning_rate": 2.827214899823183e-07, "loss": 0.2888, "loss_nan_ranks": 0, "loss_rank_avg": 0.28697848320007324, "step": 4205, "valid_targets_mean": 3342.2, "valid_targets_min": 1271 }, { "epoch": 6.671949286846276, "grad_norm": 0.9626143965275245, "learning_rate": 2.6963352669252095e-07, "loss": 0.2831, "loss_nan_ranks": 0, "loss_rank_avg": 0.29628515243530273, "step": 4210, "valid_targets_mean": 2125.6, "valid_targets_min": 698 }, { "epoch": 6.67987321711569, "grad_norm": 0.7980141278149887, "learning_rate": 2.568536693453272e-07, "loss": 0.2754, "loss_nan_ranks": 0, "loss_rank_avg": 0.2726362943649292, "step": 4215, "valid_targets_mean": 2887.1, "valid_targets_min": 1048 }, { "epoch": 6.687797147385103, "grad_norm": 0.8055430110182665, "learning_rate": 2.443821175087435e-07, "loss": 0.2713, "loss_nan_ranks": 0, "loss_rank_avg": 0.2402665913105011, "step": 4220, "valid_targets_mean": 2865.8, "valid_targets_min": 1197 }, { "epoch": 6.695721077654516, "grad_norm": 0.8616251532210281, "learning_rate": 2.3221906593634102e-07, "loss": 0.2712, "loss_nan_ranks": 0, "loss_rank_avg": 0.2799178957939148, "step": 4225, "valid_targets_mean": 3122.3, "valid_targets_min": 1305 }, { "epoch": 6.70364500792393, "grad_norm": 0.774098085179844, "learning_rate": 2.2036470456419767e-07, "loss": 0.2889, "loss_nan_ranks": 0, "loss_rank_avg": 0.32133832573890686, "step": 4230, "valid_targets_mean": 3208.2, "valid_targets_min": 1505 }, { "epoch": 6.711568938193344, "grad_norm": 0.7956195714820337, "learning_rate": 2.088192185079385e-07, "loss": 0.2789, "loss_nan_ranks": 0, "loss_rank_avg": 0.26833003759384155, "step": 4235, "valid_targets_mean": 2955.7, "valid_targets_min": 1027 }, { "epoch": 6.7194928684627575, "grad_norm": 0.8577430299273257, "learning_rate": 1.9758278805985574e-07, "loss": 0.2838, "loss_nan_ranks": 0, "loss_rank_avg": 0.32463526725769043, "step": 4240, "valid_targets_mean": 2802.4, "valid_targets_min": 1128 }, { "epoch": 6.727416798732171, "grad_norm": 0.6783344453017468, "learning_rate": 1.8665558868607325e-07, "loss": 0.2734, "loss_nan_ranks": 0, "loss_rank_avg": 0.2513703405857086, "step": 4245, "valid_targets_mean": 3795.2, "valid_targets_min": 1668 }, { "epoch": 6.735340729001585, "grad_norm": 0.6750719706575818, "learning_rate": 1.760377910238198e-07, "loss": 0.2862, "loss_nan_ranks": 0, "loss_rank_avg": 0.2817671597003937, "step": 4250, "valid_targets_mean": 3822.6, "valid_targets_min": 917 }, { "epoch": 6.743264659270999, "grad_norm": 0.7810619939316714, "learning_rate": 1.6572956087876014e-07, "loss": 0.2709, "loss_nan_ranks": 0, "loss_rank_avg": 0.29501527547836304, "step": 4255, "valid_targets_mean": 3182.8, "valid_targets_min": 1080 }, { "epoch": 6.751188589540412, "grad_norm": 0.9970801859894827, "learning_rate": 1.5573105922241037e-07, "loss": 0.2922, "loss_nan_ranks": 0, "loss_rank_avg": 0.3328208327293396, "step": 4260, "valid_targets_mean": 2217.5, "valid_targets_min": 1062 }, { "epoch": 6.759112519809825, "grad_norm": 0.7526770442896775, "learning_rate": 1.4604244218962005e-07, "loss": 0.2755, "loss_nan_ranks": 0, "loss_rank_avg": 0.2694515585899353, "step": 4265, "valid_targets_mean": 3435.8, "valid_targets_min": 1346 }, { "epoch": 6.767036450079239, "grad_norm": 0.8154643867852098, "learning_rate": 1.3666386107613173e-07, "loss": 0.2675, "loss_nan_ranks": 0, "loss_rank_avg": 0.26164501905441284, "step": 4270, "valid_targets_mean": 2867.2, "valid_targets_min": 955 }, { "epoch": 6.774960380348653, "grad_norm": 0.9005705221401481, "learning_rate": 1.2759546233622299e-07, "loss": 0.3002, "loss_nan_ranks": 0, "loss_rank_avg": 0.304414302110672, "step": 4275, "valid_targets_mean": 2569.8, "valid_targets_min": 906 }, { "epoch": 6.7828843106180665, "grad_norm": 0.9123716561532796, "learning_rate": 1.1883738758041941e-07, "loss": 0.2893, "loss_nan_ranks": 0, "loss_rank_avg": 0.289928138256073, "step": 4280, "valid_targets_mean": 2864.4, "valid_targets_min": 683 }, { "epoch": 6.79080824088748, "grad_norm": 0.735049289630845, "learning_rate": 1.1038977357328063e-07, "loss": 0.2871, "loss_nan_ranks": 0, "loss_rank_avg": 0.2669024169445038, "step": 4285, "valid_targets_mean": 3456.4, "valid_targets_min": 913 }, { "epoch": 6.798732171156894, "grad_norm": 0.7856993252453753, "learning_rate": 1.0225275223126219e-07, "loss": 0.2731, "loss_nan_ranks": 0, "loss_rank_avg": 0.2780317962169647, "step": 4290, "valid_targets_mean": 3268.8, "valid_targets_min": 1330 }, { "epoch": 6.806656101426308, "grad_norm": 0.800287247624352, "learning_rate": 9.442645062066602e-08, "loss": 0.2726, "loss_nan_ranks": 0, "loss_rank_avg": 0.28255707025527954, "step": 4295, "valid_targets_mean": 3144.7, "valid_targets_min": 1186 }, { "epoch": 6.814580031695721, "grad_norm": 0.7997304917655168, "learning_rate": 8.691099095564426e-08, "loss": 0.2849, "loss_nan_ranks": 0, "loss_rank_avg": 0.2793860137462616, "step": 4300, "valid_targets_mean": 3157.3, "valid_targets_min": 1311 }, { "epoch": 6.822503961965134, "grad_norm": 0.7116056078586471, "learning_rate": 7.970649059629853e-08, "loss": 0.3006, "loss_nan_ranks": 0, "loss_rank_avg": 0.3179277777671814, "step": 4305, "valid_targets_mean": 4103.9, "valid_targets_min": 1133 }, { "epoch": 6.830427892234549, "grad_norm": 0.7338611892910522, "learning_rate": 7.281306204684147e-08, "loss": 0.2888, "loss_nan_ranks": 0, "loss_rank_avg": 0.25144636631011963, "step": 4310, "valid_targets_mean": 3348.8, "valid_targets_min": 1437 }, { "epoch": 6.838351822503962, "grad_norm": 0.7686317688403141, "learning_rate": 6.623081295384248e-08, "loss": 0.292, "loss_nan_ranks": 0, "loss_rank_avg": 0.2780628800392151, "step": 4315, "valid_targets_mean": 3222.4, "valid_targets_min": 1381 }, { "epoch": 6.8462757527733755, "grad_norm": 0.7718844920164412, "learning_rate": 5.995984610455141e-08, "loss": 0.2763, "loss_nan_ranks": 0, "loss_rank_avg": 0.2787400484085083, "step": 4320, "valid_targets_mean": 3495.1, "valid_targets_min": 881 }, { "epoch": 6.854199683042789, "grad_norm": 1.1648381903860865, "learning_rate": 5.4000259425286415e-08, "loss": 0.2584, "loss_nan_ranks": 0, "loss_rank_avg": 0.2803596556186676, "step": 4325, "valid_targets_mean": 2394.1, "valid_targets_min": 969 }, { "epoch": 6.862123613312203, "grad_norm": 0.7006666990793252, "learning_rate": 4.835214597990856e-08, "loss": 0.2671, "loss_nan_ranks": 0, "loss_rank_avg": 0.2585388720035553, "step": 4330, "valid_targets_mean": 3829.1, "valid_targets_min": 748 }, { "epoch": 6.870047543581617, "grad_norm": 0.9365508753028423, "learning_rate": 4.301559396836519e-08, "loss": 0.2752, "loss_nan_ranks": 0, "loss_rank_avg": 0.2896960973739624, "step": 4335, "valid_targets_mean": 2411.0, "valid_targets_min": 1057 }, { "epoch": 6.87797147385103, "grad_norm": 0.7887978749058427, "learning_rate": 3.799068672531769e-08, "loss": 0.2875, "loss_nan_ranks": 0, "loss_rank_avg": 0.2780733108520508, "step": 4340, "valid_targets_mean": 3101.2, "valid_targets_min": 1149 }, { "epoch": 6.885895404120443, "grad_norm": 0.8049956083558146, "learning_rate": 3.3277502718835896e-08, "loss": 0.2829, "loss_nan_ranks": 0, "loss_rank_avg": 0.3052785396575928, "step": 4345, "valid_targets_mean": 3174.3, "valid_targets_min": 1707 }, { "epoch": 6.893819334389858, "grad_norm": 0.8368946913702296, "learning_rate": 2.8876115549176796e-08, "loss": 0.2724, "loss_nan_ranks": 0, "loss_rank_avg": 0.26890894770622253, "step": 4350, "valid_targets_mean": 2879.1, "valid_targets_min": 1387 }, { "epoch": 6.901743264659271, "grad_norm": 0.8341731874690929, "learning_rate": 2.4786593947625503e-08, "loss": 0.2854, "loss_nan_ranks": 0, "loss_rank_avg": 0.2666037082672119, "step": 4355, "valid_targets_mean": 2962.6, "valid_targets_min": 1371 }, { "epoch": 6.9096671949286845, "grad_norm": 0.8535984792313458, "learning_rate": 2.1009001775440518e-08, "loss": 0.2749, "loss_nan_ranks": 0, "loss_rank_avg": 0.3076822757720947, "step": 4360, "valid_targets_mean": 2713.1, "valid_targets_min": 984 }, { "epoch": 6.917591125198098, "grad_norm": 0.7324014319593888, "learning_rate": 1.7543398022832337e-08, "loss": 0.2632, "loss_nan_ranks": 0, "loss_rank_avg": 0.23690354824066162, "step": 4365, "valid_targets_mean": 3588.8, "valid_targets_min": 885 }, { "epoch": 6.925515055467512, "grad_norm": 0.7088032524121062, "learning_rate": 1.4389836808066382e-08, "loss": 0.2851, "loss_nan_ranks": 0, "loss_rank_avg": 0.2727454900741577, "step": 4370, "valid_targets_mean": 4242.9, "valid_targets_min": 1335 }, { "epoch": 6.933438985736926, "grad_norm": 0.8198153597362804, "learning_rate": 1.1548367376599257e-08, "loss": 0.291, "loss_nan_ranks": 0, "loss_rank_avg": 0.2867714762687683, "step": 4375, "valid_targets_mean": 3238.0, "valid_targets_min": 1153 }, { "epoch": 6.941362916006339, "grad_norm": 0.6663493051614263, "learning_rate": 9.019034100319347e-09, "loss": 0.2756, "loss_nan_ranks": 0, "loss_rank_avg": 0.25853022933006287, "step": 4380, "valid_targets_mean": 3799.1, "valid_targets_min": 823 }, { "epoch": 6.949286846275752, "grad_norm": 0.8065724319838463, "learning_rate": 6.801876476854041e-09, "loss": 0.2754, "loss_nan_ranks": 0, "loss_rank_avg": 0.2830263078212738, "step": 4385, "valid_targets_mean": 3164.6, "valid_targets_min": 1264 }, { "epoch": 6.957210776545167, "grad_norm": 0.9171202573479613, "learning_rate": 4.896929128943573e-09, "loss": 0.2924, "loss_nan_ranks": 0, "loss_rank_avg": 0.27494555711746216, "step": 4390, "valid_targets_mean": 2160.8, "valid_targets_min": 1141 }, { "epoch": 6.96513470681458, "grad_norm": 0.719951132738071, "learning_rate": 3.3042218039147643e-09, "loss": 0.284, "loss_nan_ranks": 0, "loss_rank_avg": 0.2768862843513489, "step": 4395, "valid_targets_mean": 3622.3, "valid_targets_min": 933 }, { "epoch": 6.9730586370839935, "grad_norm": 0.9290612308151752, "learning_rate": 2.0237793732036384e-09, "loss": 0.2665, "loss_nan_ranks": 0, "loss_rank_avg": 0.2643606960773468, "step": 4400, "valid_targets_mean": 2387.6, "valid_targets_min": 751 }, { "epoch": 6.980982567353407, "grad_norm": 0.9045790350311159, "learning_rate": 1.0556218319757172e-09, "loss": 0.2711, "loss_nan_ranks": 0, "loss_rank_avg": 0.2653629779815674, "step": 4405, "valid_targets_mean": 2927.2, "valid_targets_min": 1066 }, { "epoch": 6.988906497622821, "grad_norm": 0.8022249964923563, "learning_rate": 3.997642988107231e-10, "loss": 0.2734, "loss_nan_ranks": 0, "loss_rank_avg": 0.2766302824020386, "step": 4410, "valid_targets_mean": 3228.6, "valid_targets_min": 987 }, { "epoch": 6.996830427892235, "grad_norm": 0.8723843600795462, "learning_rate": 5.62170154649877e-11, "loss": 0.2769, "loss_nan_ranks": 0, "loss_rank_avg": 0.3014870285987854, "step": 4415, "valid_targets_mean": 2630.8, "valid_targets_min": 1016 }, { "epoch": 7.0, "loss_nan_ranks": 0, "loss_rank_avg": 0.24078989028930664, "step": 4417, "total_flos": 1125904534470656.0, "train_loss": 0.35793851753530226, "train_runtime": 26871.7295, "train_samples_per_second": 2.627, "train_steps_per_second": 0.164, "valid_targets_mean": 2557.6, "valid_targets_min": 1102 } ], "logging_steps": 5, "max_steps": 4417, "num_input_tokens_seen": 0, "num_train_epochs": 7, "save_steps": 1500, "stateful_callbacks": { "TrainerControl": { "args": { "should_epoch_stop": false, "should_evaluate": false, "should_log": false, "should_save": true, "should_training_stop": true }, "attributes": {} } }, "total_flos": 1125904534470656.0, "train_batch_size": 1, "trial_name": null, "trial_params": null }