{ "best_global_step": null, "best_metric": null, "best_model_checkpoint": null, "epoch": 7.0, "eval_steps": 500, "global_step": 4305, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.008136696501220505, "grad_norm": 16.090431037903322, "learning_rate": 3.7122969837587006e-07, "loss": 0.7715, "loss_nan_ranks": 0, "loss_rank_avg": 0.2875712513923645, "step": 5, "valid_targets_mean": 4549.8, "valid_targets_min": 252 }, { "epoch": 0.01627339300244101, "grad_norm": 13.600731709495204, "learning_rate": 8.352668213457077e-07, "loss": 0.7117, "loss_nan_ranks": 0, "loss_rank_avg": 0.35614049434661865, "step": 10, "valid_targets_mean": 8209.8, "valid_targets_min": 4066 }, { "epoch": 0.024410089503661515, "grad_norm": 14.14836434723303, "learning_rate": 1.2993039443155453e-06, "loss": 0.694, "loss_nan_ranks": 0, "loss_rank_avg": 0.250732421875, "step": 15, "valid_targets_mean": 4782.0, "valid_targets_min": 867 }, { "epoch": 0.03254678600488202, "grad_norm": 7.548954071846173, "learning_rate": 1.7633410672853829e-06, "loss": 0.6943, "loss_nan_ranks": 0, "loss_rank_avg": 0.22547389566898346, "step": 20, "valid_targets_mean": 5292.1, "valid_targets_min": 1196 }, { "epoch": 0.04068348250610252, "grad_norm": 6.231235771802954, "learning_rate": 2.2273781902552207e-06, "loss": 0.6218, "loss_nan_ranks": 0, "loss_rank_avg": 0.33196526765823364, "step": 25, "valid_targets_mean": 5366.5, "valid_targets_min": 2694 }, { "epoch": 0.04882017900732303, "grad_norm": 3.2220494398584676, "learning_rate": 2.691415313225058e-06, "loss": 0.5883, "loss_nan_ranks": 0, "loss_rank_avg": 0.2818257212638855, "step": 30, "valid_targets_mean": 5397.9, "valid_targets_min": 4217 }, { "epoch": 0.05695687550854353, "grad_norm": 1.9906473871157997, "learning_rate": 3.155452436194896e-06, "loss": 0.5962, "loss_nan_ranks": 0, "loss_rank_avg": 0.29219943284988403, "step": 35, "valid_targets_mean": 6485.5, "valid_targets_min": 4178 }, { "epoch": 0.06509357200976404, "grad_norm": 1.566586623976585, "learning_rate": 3.6194895591647333e-06, "loss": 0.5804, "loss_nan_ranks": 0, "loss_rank_avg": 0.31874755024909973, "step": 40, "valid_targets_mean": 5538.4, "valid_targets_min": 2206 }, { "epoch": 0.07323026851098453, "grad_norm": 0.8989747000335192, "learning_rate": 4.083526682134571e-06, "loss": 0.5337, "loss_nan_ranks": 0, "loss_rank_avg": 0.26823461055755615, "step": 45, "valid_targets_mean": 8599.2, "valid_targets_min": 2163 }, { "epoch": 0.08136696501220504, "grad_norm": 0.9319478495784349, "learning_rate": 4.547563805104409e-06, "loss": 0.5084, "loss_nan_ranks": 0, "loss_rank_avg": 0.24531835317611694, "step": 50, "valid_targets_mean": 5544.0, "valid_targets_min": 3675 }, { "epoch": 0.08950366151342555, "grad_norm": 0.8445321573859387, "learning_rate": 5.011600928074246e-06, "loss": 0.5385, "loss_nan_ranks": 0, "loss_rank_avg": 0.24889877438545227, "step": 55, "valid_targets_mean": 4860.2, "valid_targets_min": 2473 }, { "epoch": 0.09764035801464606, "grad_norm": 0.5631526521452107, "learning_rate": 5.4756380510440845e-06, "loss": 0.5077, "loss_nan_ranks": 0, "loss_rank_avg": 0.1919834017753601, "step": 60, "valid_targets_mean": 8965.6, "valid_targets_min": 1390 }, { "epoch": 0.10577705451586655, "grad_norm": 0.723751948401996, "learning_rate": 5.939675174013921e-06, "loss": 0.5264, "loss_nan_ranks": 0, "loss_rank_avg": 0.24049162864685059, "step": 65, "valid_targets_mean": 5572.6, "valid_targets_min": 987 }, { "epoch": 0.11391375101708706, "grad_norm": 0.6686399938539643, "learning_rate": 6.403712296983759e-06, "loss": 0.525, "loss_nan_ranks": 0, "loss_rank_avg": 0.2604122459888458, "step": 70, "valid_targets_mean": 5024.8, "valid_targets_min": 1360 }, { "epoch": 0.12205044751830757, "grad_norm": 0.6374560834798504, "learning_rate": 6.867749419953597e-06, "loss": 0.4679, "loss_nan_ranks": 0, "loss_rank_avg": 0.20338362455368042, "step": 75, "valid_targets_mean": 4254.9, "valid_targets_min": 1926 }, { "epoch": 0.13018714401952808, "grad_norm": 0.5787585870311817, "learning_rate": 7.331786542923435e-06, "loss": 0.4843, "loss_nan_ranks": 0, "loss_rank_avg": 0.21182265877723694, "step": 80, "valid_targets_mean": 6022.1, "valid_targets_min": 2763 }, { "epoch": 0.1383238405207486, "grad_norm": 0.67321565497922, "learning_rate": 7.795823665893271e-06, "loss": 0.4312, "loss_nan_ranks": 0, "loss_rank_avg": 0.23013588786125183, "step": 85, "valid_targets_mean": 5411.8, "valid_targets_min": 3173 }, { "epoch": 0.14646053702196907, "grad_norm": 0.6071366032342709, "learning_rate": 8.25986078886311e-06, "loss": 0.4646, "loss_nan_ranks": 0, "loss_rank_avg": 0.1693999469280243, "step": 90, "valid_targets_mean": 4955.9, "valid_targets_min": 1353 }, { "epoch": 0.15459723352318958, "grad_norm": 0.5269887432627762, "learning_rate": 8.723897911832948e-06, "loss": 0.456, "loss_nan_ranks": 0, "loss_rank_avg": 0.1908610761165619, "step": 95, "valid_targets_mean": 5783.5, "valid_targets_min": 2568 }, { "epoch": 0.16273393002441008, "grad_norm": 0.49470856135363345, "learning_rate": 9.187935034802784e-06, "loss": 0.4707, "loss_nan_ranks": 0, "loss_rank_avg": 0.16176165640354156, "step": 100, "valid_targets_mean": 5736.5, "valid_targets_min": 914 }, { "epoch": 0.1708706265256306, "grad_norm": 0.6634219296905246, "learning_rate": 9.651972157772623e-06, "loss": 0.4261, "loss_nan_ranks": 0, "loss_rank_avg": 0.21228602528572083, "step": 105, "valid_targets_mean": 4824.8, "valid_targets_min": 880 }, { "epoch": 0.1790073230268511, "grad_norm": 0.5503232838963362, "learning_rate": 1.011600928074246e-05, "loss": 0.4521, "loss_nan_ranks": 0, "loss_rank_avg": 0.21243637800216675, "step": 110, "valid_targets_mean": 4871.6, "valid_targets_min": 3180 }, { "epoch": 0.1871440195280716, "grad_norm": 0.5371175803438996, "learning_rate": 1.0580046403712299e-05, "loss": 0.4236, "loss_nan_ranks": 0, "loss_rank_avg": 0.18787938356399536, "step": 115, "valid_targets_mean": 6630.4, "valid_targets_min": 2886 }, { "epoch": 0.19528071602929212, "grad_norm": 0.592957013748528, "learning_rate": 1.1044083526682134e-05, "loss": 0.423, "loss_nan_ranks": 0, "loss_rank_avg": 0.21313674747943878, "step": 120, "valid_targets_mean": 4635.9, "valid_targets_min": 1984 }, { "epoch": 0.20341741253051263, "grad_norm": 0.5850643813081216, "learning_rate": 1.1508120649651972e-05, "loss": 0.441, "loss_nan_ranks": 0, "loss_rank_avg": 0.18926499783992767, "step": 125, "valid_targets_mean": 3976.4, "valid_targets_min": 2195 }, { "epoch": 0.2115541090317331, "grad_norm": 0.6154983784285487, "learning_rate": 1.197215777262181e-05, "loss": 0.4045, "loss_nan_ranks": 0, "loss_rank_avg": 0.32481032609939575, "step": 130, "valid_targets_mean": 7336.1, "valid_targets_min": 2261 }, { "epoch": 0.21969080553295361, "grad_norm": 0.5811910852740185, "learning_rate": 1.2436194895591649e-05, "loss": 0.3979, "loss_nan_ranks": 0, "loss_rank_avg": 0.19883839786052704, "step": 135, "valid_targets_mean": 4926.2, "valid_targets_min": 1380 }, { "epoch": 0.22782750203417412, "grad_norm": 0.562023919355631, "learning_rate": 1.2900232018561485e-05, "loss": 0.4539, "loss_nan_ranks": 0, "loss_rank_avg": 0.1847591996192932, "step": 140, "valid_targets_mean": 4817.6, "valid_targets_min": 472 }, { "epoch": 0.23596419853539463, "grad_norm": 0.72271568902011, "learning_rate": 1.3364269141531323e-05, "loss": 0.4195, "loss_nan_ranks": 0, "loss_rank_avg": 0.2751965820789337, "step": 145, "valid_targets_mean": 4217.8, "valid_targets_min": 1056 }, { "epoch": 0.24410089503661514, "grad_norm": 0.3938229955385366, "learning_rate": 1.3828306264501162e-05, "loss": 0.3832, "loss_nan_ranks": 0, "loss_rank_avg": 0.14872416853904724, "step": 150, "valid_targets_mean": 9482.1, "valid_targets_min": 1451 }, { "epoch": 0.25223759153783565, "grad_norm": 0.49221594968351173, "learning_rate": 1.4292343387471e-05, "loss": 0.3907, "loss_nan_ranks": 0, "loss_rank_avg": 0.20908868312835693, "step": 155, "valid_targets_mean": 6888.2, "valid_targets_min": 976 }, { "epoch": 0.26037428803905616, "grad_norm": 0.5545201308696927, "learning_rate": 1.4756380510440838e-05, "loss": 0.4102, "loss_nan_ranks": 0, "loss_rank_avg": 0.2789374887943268, "step": 160, "valid_targets_mean": 6530.2, "valid_targets_min": 3557 }, { "epoch": 0.26851098454027666, "grad_norm": 0.4586839023597891, "learning_rate": 1.5220417633410673e-05, "loss": 0.3853, "loss_nan_ranks": 0, "loss_rank_avg": 0.15098837018013, "step": 165, "valid_targets_mean": 6107.5, "valid_targets_min": 3366 }, { "epoch": 0.2766476810414972, "grad_norm": 0.5466087287399158, "learning_rate": 1.5684454756380513e-05, "loss": 0.3823, "loss_nan_ranks": 0, "loss_rank_avg": 0.18119701743125916, "step": 170, "valid_targets_mean": 5958.1, "valid_targets_min": 2636 }, { "epoch": 0.2847843775427177, "grad_norm": 0.7246628057096877, "learning_rate": 1.614849187935035e-05, "loss": 0.3878, "loss_nan_ranks": 0, "loss_rank_avg": 0.18207889795303345, "step": 175, "valid_targets_mean": 3833.5, "valid_targets_min": 731 }, { "epoch": 0.29292107404393813, "grad_norm": 0.538445461461904, "learning_rate": 1.661252900232019e-05, "loss": 0.3899, "loss_nan_ranks": 0, "loss_rank_avg": 0.20349320769309998, "step": 180, "valid_targets_mean": 5779.9, "valid_targets_min": 2408 }, { "epoch": 0.30105777054515864, "grad_norm": 0.5154736408446468, "learning_rate": 1.7076566125290022e-05, "loss": 0.3979, "loss_nan_ranks": 0, "loss_rank_avg": 0.14643463492393494, "step": 185, "valid_targets_mean": 5368.9, "valid_targets_min": 1130 }, { "epoch": 0.30919446704637915, "grad_norm": 0.5537361180002401, "learning_rate": 1.7540603248259862e-05, "loss": 0.3761, "loss_nan_ranks": 0, "loss_rank_avg": 0.24436548352241516, "step": 190, "valid_targets_mean": 6028.6, "valid_targets_min": 2328 }, { "epoch": 0.31733116354759966, "grad_norm": 0.5029342180508779, "learning_rate": 1.80046403712297e-05, "loss": 0.4093, "loss_nan_ranks": 0, "loss_rank_avg": 0.1840636283159256, "step": 195, "valid_targets_mean": 5353.9, "valid_targets_min": 2892 }, { "epoch": 0.32546786004882017, "grad_norm": 0.665787256003558, "learning_rate": 1.846867749419954e-05, "loss": 0.4148, "loss_nan_ranks": 0, "loss_rank_avg": 0.20056715607643127, "step": 200, "valid_targets_mean": 4300.5, "valid_targets_min": 2125 }, { "epoch": 0.3336045565500407, "grad_norm": 0.6052671481751055, "learning_rate": 1.8932714617169375e-05, "loss": 0.4007, "loss_nan_ranks": 0, "loss_rank_avg": 0.18301618099212646, "step": 205, "valid_targets_mean": 4318.6, "valid_targets_min": 1348 }, { "epoch": 0.3417412530512612, "grad_norm": 0.5974300039254363, "learning_rate": 1.9396751740139212e-05, "loss": 0.359, "loss_nan_ranks": 0, "loss_rank_avg": 0.1635710895061493, "step": 210, "valid_targets_mean": 4149.1, "valid_targets_min": 1341 }, { "epoch": 0.3498779495524817, "grad_norm": 0.5162532888002979, "learning_rate": 1.986078886310905e-05, "loss": 0.3616, "loss_nan_ranks": 0, "loss_rank_avg": 0.1892920732498169, "step": 215, "valid_targets_mean": 5807.4, "valid_targets_min": 3465 }, { "epoch": 0.3580146460537022, "grad_norm": 0.6211875321766217, "learning_rate": 2.0324825986078888e-05, "loss": 0.3707, "loss_nan_ranks": 0, "loss_rank_avg": 0.2048984169960022, "step": 220, "valid_targets_mean": 5146.1, "valid_targets_min": 3448 }, { "epoch": 0.3661513425549227, "grad_norm": 0.5629734837453833, "learning_rate": 2.0788863109048725e-05, "loss": 0.4264, "loss_nan_ranks": 0, "loss_rank_avg": 0.20716804265975952, "step": 225, "valid_targets_mean": 6232.1, "valid_targets_min": 3504 }, { "epoch": 0.3742880390561432, "grad_norm": 0.5754882541364582, "learning_rate": 2.125290023201856e-05, "loss": 0.3609, "loss_nan_ranks": 0, "loss_rank_avg": 0.17893140017986298, "step": 230, "valid_targets_mean": 5060.4, "valid_targets_min": 1097 }, { "epoch": 0.3824247355573637, "grad_norm": 0.4803589387079019, "learning_rate": 2.17169373549884e-05, "loss": 0.3729, "loss_nan_ranks": 0, "loss_rank_avg": 0.169406920671463, "step": 235, "valid_targets_mean": 10265.1, "valid_targets_min": 3654 }, { "epoch": 0.39056143205858423, "grad_norm": 0.5684141070472157, "learning_rate": 2.2180974477958238e-05, "loss": 0.356, "loss_nan_ranks": 0, "loss_rank_avg": 0.18647357821464539, "step": 240, "valid_targets_mean": 6180.6, "valid_targets_min": 4034 }, { "epoch": 0.39869812855980474, "grad_norm": 2.1822397438079113, "learning_rate": 2.2645011600928078e-05, "loss": 0.3773, "loss_nan_ranks": 0, "loss_rank_avg": 0.13844701647758484, "step": 245, "valid_targets_mean": 3962.9, "valid_targets_min": 1115 }, { "epoch": 0.40683482506102525, "grad_norm": 0.5269077214375306, "learning_rate": 2.3109048723897914e-05, "loss": 0.3638, "loss_nan_ranks": 0, "loss_rank_avg": 0.22004611790180206, "step": 250, "valid_targets_mean": 7061.2, "valid_targets_min": 1798 }, { "epoch": 0.4149715215622457, "grad_norm": 0.5440786293579026, "learning_rate": 2.357308584686775e-05, "loss": 0.3884, "loss_nan_ranks": 0, "loss_rank_avg": 0.17783966660499573, "step": 255, "valid_targets_mean": 6231.8, "valid_targets_min": 1180 }, { "epoch": 0.4231082180634662, "grad_norm": 0.5948755408238603, "learning_rate": 2.4037122969837587e-05, "loss": 0.3825, "loss_nan_ranks": 0, "loss_rank_avg": 0.17008402943611145, "step": 260, "valid_targets_mean": 5944.2, "valid_targets_min": 3162 }, { "epoch": 0.4312449145646867, "grad_norm": 0.6242241542196177, "learning_rate": 2.4501160092807427e-05, "loss": 0.3741, "loss_nan_ranks": 0, "loss_rank_avg": 0.24811501801013947, "step": 265, "valid_targets_mean": 6068.0, "valid_targets_min": 3582 }, { "epoch": 0.43938161106590723, "grad_norm": 0.6339502257062204, "learning_rate": 2.4965197215777264e-05, "loss": 0.378, "loss_nan_ranks": 0, "loss_rank_avg": 0.23643383383750916, "step": 270, "valid_targets_mean": 6240.1, "valid_targets_min": 3166 }, { "epoch": 0.44751830756712774, "grad_norm": 0.620013916375109, "learning_rate": 2.54292343387471e-05, "loss": 0.3781, "loss_nan_ranks": 0, "loss_rank_avg": 0.20989033579826355, "step": 275, "valid_targets_mean": 4992.1, "valid_targets_min": 1974 }, { "epoch": 0.45565500406834825, "grad_norm": 0.6062383822505677, "learning_rate": 2.589327146171694e-05, "loss": 0.3909, "loss_nan_ranks": 0, "loss_rank_avg": 0.165325328707695, "step": 280, "valid_targets_mean": 5992.2, "valid_targets_min": 2286 }, { "epoch": 0.46379170056956875, "grad_norm": 0.5313593137715071, "learning_rate": 2.6357308584686777e-05, "loss": 0.3599, "loss_nan_ranks": 0, "loss_rank_avg": 0.211288183927536, "step": 285, "valid_targets_mean": 8111.2, "valid_targets_min": 1743 }, { "epoch": 0.47192839707078926, "grad_norm": 0.6295506563199366, "learning_rate": 2.6821345707656617e-05, "loss": 0.4067, "loss_nan_ranks": 0, "loss_rank_avg": 0.2054595947265625, "step": 290, "valid_targets_mean": 5166.6, "valid_targets_min": 665 }, { "epoch": 0.48006509357200977, "grad_norm": 0.49592526684619054, "learning_rate": 2.7285382830626453e-05, "loss": 0.3392, "loss_nan_ranks": 0, "loss_rank_avg": 0.16820460557937622, "step": 295, "valid_targets_mean": 7745.8, "valid_targets_min": 4466 }, { "epoch": 0.4882017900732303, "grad_norm": 0.567789284281097, "learning_rate": 2.774941995359629e-05, "loss": 0.3658, "loss_nan_ranks": 0, "loss_rank_avg": 0.20403246581554413, "step": 300, "valid_targets_mean": 5828.9, "valid_targets_min": 3519 }, { "epoch": 0.4963384865744508, "grad_norm": 0.5994970137381144, "learning_rate": 2.8213457076566126e-05, "loss": 0.3616, "loss_nan_ranks": 0, "loss_rank_avg": 0.17800754308700562, "step": 305, "valid_targets_mean": 6173.2, "valid_targets_min": 2727 }, { "epoch": 0.5044751830756713, "grad_norm": 0.4507815805396529, "learning_rate": 2.8677494199535966e-05, "loss": 0.3422, "loss_nan_ranks": 0, "loss_rank_avg": 0.163581982254982, "step": 310, "valid_targets_mean": 7815.4, "valid_targets_min": 2591 }, { "epoch": 0.5126118795768918, "grad_norm": 0.5239390399565743, "learning_rate": 2.9141531322505803e-05, "loss": 0.3643, "loss_nan_ranks": 0, "loss_rank_avg": 0.17151904106140137, "step": 315, "valid_targets_mean": 6634.5, "valid_targets_min": 2709 }, { "epoch": 0.5207485760781123, "grad_norm": 0.5369612515514515, "learning_rate": 2.9605568445475643e-05, "loss": 0.3502, "loss_nan_ranks": 0, "loss_rank_avg": 0.18754036724567413, "step": 320, "valid_targets_mean": 7942.8, "valid_targets_min": 2731 }, { "epoch": 0.5288852725793328, "grad_norm": 0.5793782711405452, "learning_rate": 3.006960556844548e-05, "loss": 0.3665, "loss_nan_ranks": 0, "loss_rank_avg": 0.19467616081237793, "step": 325, "valid_targets_mean": 7150.4, "valid_targets_min": 3200 }, { "epoch": 0.5370219690805533, "grad_norm": 0.6555376050209063, "learning_rate": 3.053364269141532e-05, "loss": 0.3597, "loss_nan_ranks": 0, "loss_rank_avg": 0.22380053997039795, "step": 330, "valid_targets_mean": 5470.0, "valid_targets_min": 3328 }, { "epoch": 0.5451586655817738, "grad_norm": 0.47280019324486067, "learning_rate": 3.099767981438515e-05, "loss": 0.353, "loss_nan_ranks": 0, "loss_rank_avg": 0.1600561887025833, "step": 335, "valid_targets_mean": 7268.8, "valid_targets_min": 1187 }, { "epoch": 0.5532953620829943, "grad_norm": 0.5881598770087844, "learning_rate": 3.146171693735499e-05, "loss": 0.3822, "loss_nan_ranks": 0, "loss_rank_avg": 0.24715545773506165, "step": 340, "valid_targets_mean": 6853.9, "valid_targets_min": 3075 }, { "epoch": 0.5614320585842149, "grad_norm": 0.6391589883331622, "learning_rate": 3.1925754060324825e-05, "loss": 0.3614, "loss_nan_ranks": 0, "loss_rank_avg": 0.1951560229063034, "step": 345, "valid_targets_mean": 5299.4, "valid_targets_min": 1246 }, { "epoch": 0.5695687550854354, "grad_norm": 0.5623585142837345, "learning_rate": 3.2389791183294665e-05, "loss": 0.3891, "loss_nan_ranks": 0, "loss_rank_avg": 0.16995632648468018, "step": 350, "valid_targets_mean": 5440.2, "valid_targets_min": 2508 }, { "epoch": 0.5777054515866559, "grad_norm": 0.6219299756731129, "learning_rate": 3.2853828306264505e-05, "loss": 0.3645, "loss_nan_ranks": 0, "loss_rank_avg": 0.1758767068386078, "step": 355, "valid_targets_mean": 5666.1, "valid_targets_min": 4068 }, { "epoch": 0.5858421480878763, "grad_norm": 0.5685036390421684, "learning_rate": 3.3317865429234345e-05, "loss": 0.3647, "loss_nan_ranks": 0, "loss_rank_avg": 0.16862249374389648, "step": 360, "valid_targets_mean": 4828.4, "valid_targets_min": 3059 }, { "epoch": 0.5939788445890968, "grad_norm": 0.4625422720060745, "learning_rate": 3.378190255220418e-05, "loss": 0.3712, "loss_nan_ranks": 0, "loss_rank_avg": 0.1963481456041336, "step": 365, "valid_targets_mean": 7321.2, "valid_targets_min": 2340 }, { "epoch": 0.6021155410903173, "grad_norm": 0.5470733880761669, "learning_rate": 3.424593967517402e-05, "loss": 0.3691, "loss_nan_ranks": 0, "loss_rank_avg": 0.210045725107193, "step": 370, "valid_targets_mean": 6877.0, "valid_targets_min": 3491 }, { "epoch": 0.6102522375915378, "grad_norm": 0.6202487972326748, "learning_rate": 3.470997679814386e-05, "loss": 0.3772, "loss_nan_ranks": 0, "loss_rank_avg": 0.17183330655097961, "step": 375, "valid_targets_mean": 4664.4, "valid_targets_min": 1184 }, { "epoch": 0.6183889340927583, "grad_norm": 0.5221402160582946, "learning_rate": 3.517401392111369e-05, "loss": 0.3627, "loss_nan_ranks": 0, "loss_rank_avg": 0.12995409965515137, "step": 380, "valid_targets_mean": 4589.5, "valid_targets_min": 1355 }, { "epoch": 0.6265256305939788, "grad_norm": 0.5752601496871426, "learning_rate": 3.563805104408353e-05, "loss": 0.357, "loss_nan_ranks": 0, "loss_rank_avg": 0.1458801031112671, "step": 385, "valid_targets_mean": 4861.6, "valid_targets_min": 781 }, { "epoch": 0.6346623270951993, "grad_norm": 0.49073739472195316, "learning_rate": 3.6102088167053364e-05, "loss": 0.3394, "loss_nan_ranks": 0, "loss_rank_avg": 0.14129197597503662, "step": 390, "valid_targets_mean": 7941.0, "valid_targets_min": 1697 }, { "epoch": 0.6427990235964198, "grad_norm": 0.6724135988713974, "learning_rate": 3.6566125290023204e-05, "loss": 0.3407, "loss_nan_ranks": 0, "loss_rank_avg": 0.20702053606510162, "step": 395, "valid_targets_mean": 5088.1, "valid_targets_min": 3051 }, { "epoch": 0.6509357200976403, "grad_norm": 0.5361691867146933, "learning_rate": 3.7030162412993044e-05, "loss": 0.3382, "loss_nan_ranks": 0, "loss_rank_avg": 0.11901885271072388, "step": 400, "valid_targets_mean": 4371.2, "valid_targets_min": 667 }, { "epoch": 0.6590724165988608, "grad_norm": 0.5133700351880802, "learning_rate": 3.7494199535962884e-05, "loss": 0.3437, "loss_nan_ranks": 0, "loss_rank_avg": 0.19993503391742706, "step": 405, "valid_targets_mean": 7043.2, "valid_targets_min": 2275 }, { "epoch": 0.6672091131000814, "grad_norm": 0.6482819055800569, "learning_rate": 3.795823665893272e-05, "loss": 0.3395, "loss_nan_ranks": 0, "loss_rank_avg": 0.17060551047325134, "step": 410, "valid_targets_mean": 4805.9, "valid_targets_min": 2812 }, { "epoch": 0.6753458096013019, "grad_norm": 0.6390031583274932, "learning_rate": 3.842227378190256e-05, "loss": 0.3535, "loss_nan_ranks": 0, "loss_rank_avg": 0.21496957540512085, "step": 415, "valid_targets_mean": 5022.5, "valid_targets_min": 3145 }, { "epoch": 0.6834825061025224, "grad_norm": 0.5976519963434623, "learning_rate": 3.888631090487239e-05, "loss": 0.3517, "loss_nan_ranks": 0, "loss_rank_avg": 0.2512780427932739, "step": 420, "valid_targets_mean": 7279.9, "valid_targets_min": 1433 }, { "epoch": 0.6916192026037429, "grad_norm": 0.47064787232454297, "learning_rate": 3.935034802784223e-05, "loss": 0.3492, "loss_nan_ranks": 0, "loss_rank_avg": 0.13265804946422577, "step": 425, "valid_targets_mean": 7578.4, "valid_targets_min": 1208 }, { "epoch": 0.6997558991049634, "grad_norm": 0.6527567618207681, "learning_rate": 3.981438515081207e-05, "loss": 0.3574, "loss_nan_ranks": 0, "loss_rank_avg": 0.1878128945827484, "step": 430, "valid_targets_mean": 6056.6, "valid_targets_min": 839 }, { "epoch": 0.7078925956061839, "grad_norm": 0.5735509384032068, "learning_rate": 3.9999940813479674e-05, "loss": 0.3372, "loss_nan_ranks": 0, "loss_rank_avg": 0.1770503968000412, "step": 435, "valid_targets_mean": 6436.2, "valid_targets_min": 1048 }, { "epoch": 0.7160292921074044, "grad_norm": 0.6261328521415896, "learning_rate": 3.999957911934624e-05, "loss": 0.3515, "loss_nan_ranks": 0, "loss_rank_avg": 0.18041738867759705, "step": 440, "valid_targets_mean": 4812.4, "valid_targets_min": 978 }, { "epoch": 0.7241659886086249, "grad_norm": 0.6204622587345417, "learning_rate": 3.9998888618418865e-05, "loss": 0.3373, "loss_nan_ranks": 0, "loss_rank_avg": 0.1899314522743225, "step": 445, "valid_targets_mean": 5510.2, "valid_targets_min": 3204 }, { "epoch": 0.7323026851098454, "grad_norm": 3.299320631347469, "learning_rate": 3.999786932204985e-05, "loss": 0.3785, "loss_nan_ranks": 0, "loss_rank_avg": 0.1819208562374115, "step": 450, "valid_targets_mean": 4358.6, "valid_targets_min": 1771 }, { "epoch": 0.7404393816110659, "grad_norm": 0.5252880370409836, "learning_rate": 3.999652124699712e-05, "loss": 0.3475, "loss_nan_ranks": 0, "loss_rank_avg": 0.16896438598632812, "step": 455, "valid_targets_mean": 5077.8, "valid_targets_min": 1348 }, { "epoch": 0.7485760781122864, "grad_norm": 0.6698283241722841, "learning_rate": 3.999484441542395e-05, "loss": 0.3407, "loss_nan_ranks": 0, "loss_rank_avg": 0.1943579763174057, "step": 460, "valid_targets_mean": 6660.6, "valid_targets_min": 2219 }, { "epoch": 0.7567127746135069, "grad_norm": 0.5507163167952325, "learning_rate": 3.999283885489861e-05, "loss": 0.3414, "loss_nan_ranks": 0, "loss_rank_avg": 0.17113232612609863, "step": 465, "valid_targets_mean": 5965.8, "valid_targets_min": 821 }, { "epoch": 0.7648494711147275, "grad_norm": 0.5967720564945255, "learning_rate": 3.999050459839389e-05, "loss": 0.3584, "loss_nan_ranks": 0, "loss_rank_avg": 0.18689490854740143, "step": 470, "valid_targets_mean": 5054.9, "valid_targets_min": 2713 }, { "epoch": 0.772986167615948, "grad_norm": 0.47232445183793803, "learning_rate": 3.998784168428657e-05, "loss": 0.332, "loss_nan_ranks": 0, "loss_rank_avg": 0.15000829100608826, "step": 475, "valid_targets_mean": 8201.6, "valid_targets_min": 4044 }, { "epoch": 0.7811228641171685, "grad_norm": 0.621422144424275, "learning_rate": 3.998485015635677e-05, "loss": 0.3432, "loss_nan_ranks": 0, "loss_rank_avg": 0.1805095225572586, "step": 480, "valid_targets_mean": 5017.2, "valid_targets_min": 2360 }, { "epoch": 0.789259560618389, "grad_norm": 0.5384507298681502, "learning_rate": 3.998153006378727e-05, "loss": 0.3606, "loss_nan_ranks": 0, "loss_rank_avg": 0.14276368916034698, "step": 485, "valid_targets_mean": 5560.0, "valid_targets_min": 3450 }, { "epoch": 0.7973962571196095, "grad_norm": 0.5979879136613555, "learning_rate": 3.997788146116267e-05, "loss": 0.3246, "loss_nan_ranks": 0, "loss_rank_avg": 0.2316283881664276, "step": 490, "valid_targets_mean": 6350.8, "valid_targets_min": 1530 }, { "epoch": 0.80553295362083, "grad_norm": 0.5101547736138818, "learning_rate": 3.99739044084685e-05, "loss": 0.3342, "loss_nan_ranks": 0, "loss_rank_avg": 0.14997598528862, "step": 495, "valid_targets_mean": 5629.4, "valid_targets_min": 1916 }, { "epoch": 0.8136696501220505, "grad_norm": 0.5665977624248587, "learning_rate": 3.9969598971090225e-05, "loss": 0.3485, "loss_nan_ranks": 0, "loss_rank_avg": 0.16634723544120789, "step": 500, "valid_targets_mean": 5539.4, "valid_targets_min": 2190 }, { "epoch": 0.8218063466232709, "grad_norm": 0.5440024359106904, "learning_rate": 3.99649652198122e-05, "loss": 0.3367, "loss_nan_ranks": 0, "loss_rank_avg": 0.12725237011909485, "step": 505, "valid_targets_mean": 5113.1, "valid_targets_min": 2708 }, { "epoch": 0.8299430431244914, "grad_norm": 0.5290865318322414, "learning_rate": 3.9960003230816456e-05, "loss": 0.3289, "loss_nan_ranks": 0, "loss_rank_avg": 0.14404511451721191, "step": 510, "valid_targets_mean": 5173.8, "valid_targets_min": 3136 }, { "epoch": 0.8380797396257119, "grad_norm": 0.5770982920950211, "learning_rate": 3.9954713085681504e-05, "loss": 0.3588, "loss_nan_ranks": 0, "loss_rank_avg": 0.18526235222816467, "step": 515, "valid_targets_mean": 6702.4, "valid_targets_min": 4946 }, { "epoch": 0.8462164361269324, "grad_norm": 0.47568964474126807, "learning_rate": 3.994909487138096e-05, "loss": 0.329, "loss_nan_ranks": 0, "loss_rank_avg": 0.14243432879447937, "step": 520, "valid_targets_mean": 7471.1, "valid_targets_min": 1985 }, { "epoch": 0.8543531326281529, "grad_norm": 0.5983260323228816, "learning_rate": 3.994314868028212e-05, "loss": 0.3711, "loss_nan_ranks": 0, "loss_rank_avg": 0.2362203747034073, "step": 525, "valid_targets_mean": 6965.2, "valid_targets_min": 5206 }, { "epoch": 0.8624898291293734, "grad_norm": 0.5211844138476033, "learning_rate": 3.9936874610144445e-05, "loss": 0.3396, "loss_nan_ranks": 0, "loss_rank_avg": 0.15538473427295685, "step": 530, "valid_targets_mean": 5649.0, "valid_targets_min": 2480 }, { "epoch": 0.870626525630594, "grad_norm": 0.5747838948995959, "learning_rate": 3.993027276411793e-05, "loss": 0.3405, "loss_nan_ranks": 0, "loss_rank_avg": 0.14920654892921448, "step": 535, "valid_targets_mean": 5064.1, "valid_targets_min": 1328 }, { "epoch": 0.8787632221318145, "grad_norm": 0.7641456693399412, "learning_rate": 3.992334325074148e-05, "loss": 0.3486, "loss_nan_ranks": 0, "loss_rank_avg": 0.22456279397010803, "step": 540, "valid_targets_mean": 4989.8, "valid_targets_min": 1908 }, { "epoch": 0.886899918633035, "grad_norm": 0.6130711548025931, "learning_rate": 3.991608618394102e-05, "loss": 0.3533, "loss_nan_ranks": 0, "loss_rank_avg": 0.13783709704875946, "step": 545, "valid_targets_mean": 4486.8, "valid_targets_min": 2494 }, { "epoch": 0.8950366151342555, "grad_norm": 0.6595580159116637, "learning_rate": 3.9908501683027726e-05, "loss": 0.3288, "loss_nan_ranks": 0, "loss_rank_avg": 0.1897541582584381, "step": 550, "valid_targets_mean": 4604.0, "valid_targets_min": 3132 }, { "epoch": 0.903173311635476, "grad_norm": 0.5968370142818512, "learning_rate": 3.990058987269597e-05, "loss": 0.3331, "loss_nan_ranks": 0, "loss_rank_avg": 0.15421295166015625, "step": 555, "valid_targets_mean": 5379.5, "valid_targets_min": 1269 }, { "epoch": 0.9113100081366965, "grad_norm": 0.5675265201448391, "learning_rate": 3.9892350883021366e-05, "loss": 0.3461, "loss_nan_ranks": 0, "loss_rank_avg": 0.15991877019405365, "step": 560, "valid_targets_mean": 5252.5, "valid_targets_min": 1873 }, { "epoch": 0.919446704637917, "grad_norm": 0.4953887074657764, "learning_rate": 3.988378484945853e-05, "loss": 0.3102, "loss_nan_ranks": 0, "loss_rank_avg": 0.13573208451271057, "step": 565, "valid_targets_mean": 4776.0, "valid_targets_min": 1040 }, { "epoch": 0.9275834011391375, "grad_norm": 0.514455820774763, "learning_rate": 3.987489191283894e-05, "loss": 0.3416, "loss_nan_ranks": 0, "loss_rank_avg": 0.1836441606283188, "step": 570, "valid_targets_mean": 7845.2, "valid_targets_min": 4051 }, { "epoch": 0.935720097640358, "grad_norm": 0.6132417120301569, "learning_rate": 3.9865672219368574e-05, "loss": 0.3199, "loss_nan_ranks": 0, "loss_rank_avg": 0.20987677574157715, "step": 575, "valid_targets_mean": 7432.6, "valid_targets_min": 3210 }, { "epoch": 0.9438567941415785, "grad_norm": 0.5225003165533024, "learning_rate": 3.98561259206255e-05, "loss": 0.3344, "loss_nan_ranks": 0, "loss_rank_avg": 0.13004842400550842, "step": 580, "valid_targets_mean": 4851.6, "valid_targets_min": 873 }, { "epoch": 0.951993490642799, "grad_norm": 0.4373690128216657, "learning_rate": 3.984625317355743e-05, "loss": 0.3281, "loss_nan_ranks": 0, "loss_rank_avg": 0.152201846241951, "step": 585, "valid_targets_mean": 7664.9, "valid_targets_min": 3641 }, { "epoch": 0.9601301871440195, "grad_norm": 0.47431856596663735, "learning_rate": 3.983605414047908e-05, "loss": 0.3609, "loss_nan_ranks": 0, "loss_rank_avg": 0.21499404311180115, "step": 590, "valid_targets_mean": 7886.2, "valid_targets_min": 2797 }, { "epoch": 0.96826688364524, "grad_norm": 0.5715947847050505, "learning_rate": 3.982552898906956e-05, "loss": 0.3562, "loss_nan_ranks": 0, "loss_rank_avg": 0.20815590023994446, "step": 595, "valid_targets_mean": 5514.9, "valid_targets_min": 2081 }, { "epoch": 0.9764035801464606, "grad_norm": 0.6400810920406435, "learning_rate": 3.981467789236958e-05, "loss": 0.3419, "loss_nan_ranks": 0, "loss_rank_avg": 0.1813117265701294, "step": 600, "valid_targets_mean": 5263.9, "valid_targets_min": 850 }, { "epoch": 0.9845402766476811, "grad_norm": 0.507069029775432, "learning_rate": 3.98035010287786e-05, "loss": 0.3361, "loss_nan_ranks": 0, "loss_rank_avg": 0.15920934081077576, "step": 605, "valid_targets_mean": 6134.8, "valid_targets_min": 1505 }, { "epoch": 0.9926769731489016, "grad_norm": 0.5784988986931031, "learning_rate": 3.979199858205192e-05, "loss": 0.3263, "loss_nan_ranks": 0, "loss_rank_avg": 0.16542240977287292, "step": 610, "valid_targets_mean": 5547.0, "valid_targets_min": 597 }, { "epoch": 1.0, "grad_norm": 0.907765371978957, "learning_rate": 3.9780170741297655e-05, "loss": 0.3348, "loss_nan_ranks": 0, "loss_rank_avg": 0.36365807056427, "step": 615, "valid_targets_mean": 4512.4, "valid_targets_min": 2120 }, { "epoch": 1.0081366965012204, "grad_norm": 0.5028868621668272, "learning_rate": 3.976801770097361e-05, "loss": 0.32, "loss_nan_ranks": 0, "loss_rank_avg": 0.1552557647228241, "step": 620, "valid_targets_mean": 6936.5, "valid_targets_min": 4152 }, { "epoch": 1.016273393002441, "grad_norm": 0.5068697229571411, "learning_rate": 3.975553966088412e-05, "loss": 0.3018, "loss_nan_ranks": 0, "loss_rank_avg": 0.16703470051288605, "step": 625, "valid_targets_mean": 6322.5, "valid_targets_min": 1831 }, { "epoch": 1.0244100895036614, "grad_norm": 0.6214780240503095, "learning_rate": 3.9742736826176706e-05, "loss": 0.3306, "loss_nan_ranks": 0, "loss_rank_avg": 0.19309839606285095, "step": 630, "valid_targets_mean": 5129.1, "valid_targets_min": 1722 }, { "epoch": 1.032546786004882, "grad_norm": 0.5206937707201459, "learning_rate": 3.9729609407338745e-05, "loss": 0.3294, "loss_nan_ranks": 0, "loss_rank_avg": 0.1733720600605011, "step": 635, "valid_targets_mean": 5940.8, "valid_targets_min": 3375 }, { "epoch": 1.0406834825061024, "grad_norm": 0.558975152851932, "learning_rate": 3.971615762019401e-05, "loss": 0.3404, "loss_nan_ranks": 0, "loss_rank_avg": 0.17723140120506287, "step": 640, "valid_targets_mean": 5387.9, "valid_targets_min": 844 }, { "epoch": 1.048820179007323, "grad_norm": 0.52042070753551, "learning_rate": 3.970238168589911e-05, "loss": 0.3239, "loss_nan_ranks": 0, "loss_rank_avg": 0.16863638162612915, "step": 645, "valid_targets_mean": 5446.0, "valid_targets_min": 3303 }, { "epoch": 1.0569568755085434, "grad_norm": 0.52743590283002, "learning_rate": 3.968828183093984e-05, "loss": 0.3076, "loss_nan_ranks": 0, "loss_rank_avg": 0.1578497290611267, "step": 650, "valid_targets_mean": 6333.2, "valid_targets_min": 3859 }, { "epoch": 1.065093572009764, "grad_norm": 0.5709713263916416, "learning_rate": 3.9673858287127484e-05, "loss": 0.3016, "loss_nan_ranks": 0, "loss_rank_avg": 0.13569536805152893, "step": 655, "valid_targets_mean": 6296.2, "valid_targets_min": 4446 }, { "epoch": 1.0732302685109845, "grad_norm": 0.6034080046446395, "learning_rate": 3.965911129159501e-05, "loss": 0.3308, "loss_nan_ranks": 0, "loss_rank_avg": 0.1853494793176651, "step": 660, "valid_targets_mean": 5594.5, "valid_targets_min": 2807 }, { "epoch": 1.081366965012205, "grad_norm": 0.6783173009548439, "learning_rate": 3.9644041086793115e-05, "loss": 0.3322, "loss_nan_ranks": 0, "loss_rank_avg": 0.2208280861377716, "step": 665, "valid_targets_mean": 5207.0, "valid_targets_min": 2639 }, { "epoch": 1.0895036615134255, "grad_norm": 0.7073358550878341, "learning_rate": 3.9628647920486313e-05, "loss": 0.3372, "loss_nan_ranks": 0, "loss_rank_avg": 0.11236638575792313, "step": 670, "valid_targets_mean": 4536.8, "valid_targets_min": 2480 }, { "epoch": 1.097640358014646, "grad_norm": 0.5573022103538503, "learning_rate": 3.961293204574881e-05, "loss": 0.3426, "loss_nan_ranks": 0, "loss_rank_avg": 0.20048069953918457, "step": 675, "valid_targets_mean": 6317.4, "valid_targets_min": 2446 }, { "epoch": 1.1057770545158665, "grad_norm": 0.6274818878999071, "learning_rate": 3.959689372096034e-05, "loss": 0.3242, "loss_nan_ranks": 0, "loss_rank_avg": 0.19005917012691498, "step": 680, "valid_targets_mean": 6330.2, "valid_targets_min": 3816 }, { "epoch": 1.1139137510170871, "grad_norm": 0.6054646269903999, "learning_rate": 3.9580533209802e-05, "loss": 0.3085, "loss_nan_ranks": 0, "loss_rank_avg": 0.16152934730052948, "step": 685, "valid_targets_mean": 5820.4, "valid_targets_min": 4284 }, { "epoch": 1.1220504475183075, "grad_norm": 0.5033565392236059, "learning_rate": 3.9563850781251785e-05, "loss": 0.3274, "loss_nan_ranks": 0, "loss_rank_avg": 0.17019686102867126, "step": 690, "valid_targets_mean": 5422.2, "valid_targets_min": 1910 }, { "epoch": 1.1301871440195281, "grad_norm": 0.6054316108985657, "learning_rate": 3.954684670958027e-05, "loss": 0.3027, "loss_nan_ranks": 0, "loss_rank_avg": 0.1751125305891037, "step": 695, "valid_targets_mean": 5926.9, "valid_targets_min": 2434 }, { "epoch": 1.1383238405207485, "grad_norm": 0.5215439424842706, "learning_rate": 3.9529521274346036e-05, "loss": 0.3181, "loss_nan_ranks": 0, "loss_rank_avg": 0.1284661889076233, "step": 700, "valid_targets_mean": 5178.6, "valid_targets_min": 3204 }, { "epoch": 1.1464605370219692, "grad_norm": 0.5678065554082121, "learning_rate": 3.951187476039114e-05, "loss": 0.3532, "loss_nan_ranks": 0, "loss_rank_avg": 0.209128275513649, "step": 705, "valid_targets_mean": 6623.4, "valid_targets_min": 977 }, { "epoch": 1.1545972335231895, "grad_norm": 0.517064905402786, "learning_rate": 3.9493907457836355e-05, "loss": 0.3157, "loss_nan_ranks": 0, "loss_rank_avg": 0.1468493938446045, "step": 710, "valid_targets_mean": 5925.8, "valid_targets_min": 1771 }, { "epoch": 1.1627339300244102, "grad_norm": 0.5878396139579618, "learning_rate": 3.947561966207646e-05, "loss": 0.3283, "loss_nan_ranks": 0, "loss_rank_avg": 0.23921839892864227, "step": 715, "valid_targets_mean": 7141.8, "valid_targets_min": 4723 }, { "epoch": 1.1708706265256306, "grad_norm": 0.6620036041434723, "learning_rate": 3.945701167377537e-05, "loss": 0.314, "loss_nan_ranks": 0, "loss_rank_avg": 0.1856687366962433, "step": 720, "valid_targets_mean": 5410.5, "valid_targets_min": 1093 }, { "epoch": 1.1790073230268512, "grad_norm": 0.6212164485855235, "learning_rate": 3.9438083798861145e-05, "loss": 0.3013, "loss_nan_ranks": 0, "loss_rank_avg": 0.14771541953086853, "step": 725, "valid_targets_mean": 3694.8, "valid_targets_min": 1040 }, { "epoch": 1.1871440195280716, "grad_norm": 0.5515816569814562, "learning_rate": 3.9418836348521045e-05, "loss": 0.3499, "loss_nan_ranks": 0, "loss_rank_avg": 0.17307670414447784, "step": 730, "valid_targets_mean": 5327.5, "valid_targets_min": 3287 }, { "epoch": 1.1952807160292922, "grad_norm": 0.5104440783845825, "learning_rate": 3.939926963919635e-05, "loss": 0.3171, "loss_nan_ranks": 0, "loss_rank_avg": 0.1218840628862381, "step": 735, "valid_targets_mean": 6123.0, "valid_targets_min": 1751 }, { "epoch": 1.2034174125305126, "grad_norm": 0.4651258970343293, "learning_rate": 3.9379383992577166e-05, "loss": 0.3294, "loss_nan_ranks": 0, "loss_rank_avg": 0.14117637276649475, "step": 740, "valid_targets_mean": 5320.9, "valid_targets_min": 1282 }, { "epoch": 1.211554109031733, "grad_norm": 0.5744345931767872, "learning_rate": 3.9359179735597174e-05, "loss": 0.3076, "loss_nan_ranks": 0, "loss_rank_avg": 0.1502009928226471, "step": 745, "valid_targets_mean": 5779.2, "valid_targets_min": 1217 }, { "epoch": 1.2196908055329536, "grad_norm": 0.5866014778192581, "learning_rate": 3.9338657200428215e-05, "loss": 0.3116, "loss_nan_ranks": 0, "loss_rank_avg": 0.15397050976753235, "step": 750, "valid_targets_mean": 5608.9, "valid_targets_min": 2017 }, { "epoch": 1.2278275020341742, "grad_norm": 0.49106387973213833, "learning_rate": 3.931781672447482e-05, "loss": 0.3015, "loss_nan_ranks": 0, "loss_rank_avg": 0.1318609118461609, "step": 755, "valid_targets_mean": 5518.1, "valid_targets_min": 1324 }, { "epoch": 1.2359641985353946, "grad_norm": 0.535746593811322, "learning_rate": 3.9296658650368707e-05, "loss": 0.3423, "loss_nan_ranks": 0, "loss_rank_avg": 0.20755848288536072, "step": 760, "valid_targets_mean": 6305.9, "valid_targets_min": 2592 }, { "epoch": 1.244100895036615, "grad_norm": 0.7756294072634289, "learning_rate": 3.927518332596313e-05, "loss": 0.3199, "loss_nan_ranks": 0, "loss_rank_avg": 0.17277516424655914, "step": 765, "valid_targets_mean": 5248.5, "valid_targets_min": 1305 }, { "epoch": 1.2522375915378356, "grad_norm": 0.4743651921197624, "learning_rate": 3.925339110432716e-05, "loss": 0.3008, "loss_nan_ranks": 0, "loss_rank_avg": 0.13423749804496765, "step": 770, "valid_targets_mean": 6439.6, "valid_targets_min": 741 }, { "epoch": 1.2603742880390563, "grad_norm": 0.5214220787724717, "learning_rate": 3.923128234373984e-05, "loss": 0.3232, "loss_nan_ranks": 0, "loss_rank_avg": 0.18879708647727966, "step": 775, "valid_targets_mean": 7090.8, "valid_targets_min": 2174 }, { "epoch": 1.2685109845402767, "grad_norm": 0.5794444612757781, "learning_rate": 3.9208857407684356e-05, "loss": 0.3161, "loss_nan_ranks": 0, "loss_rank_avg": 0.12169642746448517, "step": 780, "valid_targets_mean": 3770.6, "valid_targets_min": 850 }, { "epoch": 1.276647681041497, "grad_norm": 0.9435889725374784, "learning_rate": 3.918611666484205e-05, "loss": 0.3243, "loss_nan_ranks": 0, "loss_rank_avg": 0.18906664848327637, "step": 785, "valid_targets_mean": 8074.6, "valid_targets_min": 4774 }, { "epoch": 1.2847843775427177, "grad_norm": 0.47698101778309643, "learning_rate": 3.9163060489086305e-05, "loss": 0.3169, "loss_nan_ranks": 0, "loss_rank_avg": 0.1338808387517929, "step": 790, "valid_targets_mean": 5215.4, "valid_targets_min": 1686 }, { "epoch": 1.292921074043938, "grad_norm": 0.5413947969675581, "learning_rate": 3.913968925947647e-05, "loss": 0.319, "loss_nan_ranks": 0, "loss_rank_avg": 0.09044672548770905, "step": 795, "valid_targets_mean": 5740.1, "valid_targets_min": 1164 }, { "epoch": 1.3010577705451587, "grad_norm": 0.4708777951982262, "learning_rate": 3.91160033602516e-05, "loss": 0.3296, "loss_nan_ranks": 0, "loss_rank_avg": 0.14017099142074585, "step": 800, "valid_targets_mean": 5497.0, "valid_targets_min": 2063 }, { "epoch": 1.309194467046379, "grad_norm": 0.49062883161248416, "learning_rate": 3.909200318082409e-05, "loss": 0.2945, "loss_nan_ranks": 0, "loss_rank_avg": 0.13735032081604004, "step": 805, "valid_targets_mean": 7376.5, "valid_targets_min": 2311 }, { "epoch": 1.3173311635475997, "grad_norm": 0.5599551574609924, "learning_rate": 3.906768911577337e-05, "loss": 0.3023, "loss_nan_ranks": 0, "loss_rank_avg": 0.14982812106609344, "step": 810, "valid_targets_mean": 5673.0, "valid_targets_min": 1423 }, { "epoch": 1.3254678600488201, "grad_norm": 0.5614503755525145, "learning_rate": 3.9043061564839325e-05, "loss": 0.3098, "loss_nan_ranks": 0, "loss_rank_avg": 0.14781512320041656, "step": 815, "valid_targets_mean": 4763.9, "valid_targets_min": 1955 }, { "epoch": 1.3336045565500407, "grad_norm": 0.4786045979460182, "learning_rate": 3.901812093291579e-05, "loss": 0.3153, "loss_nan_ranks": 0, "loss_rank_avg": 0.15768522024154663, "step": 820, "valid_targets_mean": 6786.4, "valid_targets_min": 2828 }, { "epoch": 1.3417412530512611, "grad_norm": 0.6560977260032284, "learning_rate": 3.8992867630043855e-05, "loss": 0.3185, "loss_nan_ranks": 0, "loss_rank_avg": 0.19212278723716736, "step": 825, "valid_targets_mean": 6104.2, "valid_targets_min": 2648 }, { "epoch": 1.3498779495524817, "grad_norm": 0.6879274724026825, "learning_rate": 3.896730207140512e-05, "loss": 0.3315, "loss_nan_ranks": 0, "loss_rank_avg": 0.1794552505016327, "step": 830, "valid_targets_mean": 4482.6, "valid_targets_min": 2414 }, { "epoch": 1.3580146460537021, "grad_norm": 0.5203653762780058, "learning_rate": 3.894142467731492e-05, "loss": 0.3268, "loss_nan_ranks": 0, "loss_rank_avg": 0.13266748189926147, "step": 835, "valid_targets_mean": 5549.0, "valid_targets_min": 1787 }, { "epoch": 1.3661513425549228, "grad_norm": 0.5135176764267754, "learning_rate": 3.891523587321534e-05, "loss": 0.291, "loss_nan_ranks": 0, "loss_rank_avg": 0.13733965158462524, "step": 840, "valid_targets_mean": 4990.9, "valid_targets_min": 975 }, { "epoch": 1.3742880390561432, "grad_norm": 0.550811284010829, "learning_rate": 3.888873608966828e-05, "loss": 0.3087, "loss_nan_ranks": 0, "loss_rank_avg": 0.17198342084884644, "step": 845, "valid_targets_mean": 6360.2, "valid_targets_min": 1126 }, { "epoch": 1.3824247355573638, "grad_norm": 0.46756550131963104, "learning_rate": 3.886192576234836e-05, "loss": 0.3135, "loss_nan_ranks": 0, "loss_rank_avg": 0.16204015910625458, "step": 850, "valid_targets_mean": 6772.0, "valid_targets_min": 1683 }, { "epoch": 1.3905614320585842, "grad_norm": 0.7407603671535479, "learning_rate": 3.883480533203574e-05, "loss": 0.3145, "loss_nan_ranks": 0, "loss_rank_avg": 0.13542041182518005, "step": 855, "valid_targets_mean": 5719.1, "valid_targets_min": 1115 }, { "epoch": 1.3986981285598048, "grad_norm": 0.49156469399841785, "learning_rate": 3.880737524460888e-05, "loss": 0.3135, "loss_nan_ranks": 0, "loss_rank_avg": 0.15303273499011993, "step": 860, "valid_targets_mean": 5483.2, "valid_targets_min": 1521 }, { "epoch": 1.4068348250610252, "grad_norm": 0.6176037825800013, "learning_rate": 3.877963595103725e-05, "loss": 0.3101, "loss_nan_ranks": 0, "loss_rank_avg": 0.16262325644493103, "step": 865, "valid_targets_mean": 5055.8, "valid_targets_min": 841 }, { "epoch": 1.4149715215622458, "grad_norm": 0.48552964622802863, "learning_rate": 3.875158790737383e-05, "loss": 0.3196, "loss_nan_ranks": 0, "loss_rank_avg": 0.07722240686416626, "step": 870, "valid_targets_mean": 5601.2, "valid_targets_min": 614 }, { "epoch": 1.4231082180634662, "grad_norm": 0.5920608654664343, "learning_rate": 3.87232315747477e-05, "loss": 0.3416, "loss_nan_ranks": 0, "loss_rank_avg": 0.2405494749546051, "step": 875, "valid_targets_mean": 5470.0, "valid_targets_min": 3268 }, { "epoch": 1.4312449145646866, "grad_norm": 0.5377494420110379, "learning_rate": 3.8694567419356414e-05, "loss": 0.3561, "loss_nan_ranks": 0, "loss_rank_avg": 0.14981283247470856, "step": 880, "valid_targets_mean": 6194.1, "valid_targets_min": 4085 }, { "epoch": 1.4393816110659072, "grad_norm": 0.5103348467193803, "learning_rate": 3.8665595912458346e-05, "loss": 0.3001, "loss_nan_ranks": 0, "loss_rank_avg": 0.11243285983800888, "step": 885, "valid_targets_mean": 4186.1, "valid_targets_min": 1883 }, { "epoch": 1.4475183075671278, "grad_norm": 0.49573235370231433, "learning_rate": 3.863631753036492e-05, "loss": 0.3084, "loss_nan_ranks": 0, "loss_rank_avg": 0.15874309837818146, "step": 890, "valid_targets_mean": 5946.5, "valid_targets_min": 1225 }, { "epoch": 1.4556550040683482, "grad_norm": 0.6018434178435743, "learning_rate": 3.860673275443283e-05, "loss": 0.2917, "loss_nan_ranks": 0, "loss_rank_avg": 0.1639241725206375, "step": 895, "valid_targets_mean": 4885.0, "valid_targets_min": 576 }, { "epoch": 1.4637917005695686, "grad_norm": 0.6566529428934831, "learning_rate": 3.857684207105606e-05, "loss": 0.3089, "loss_nan_ranks": 0, "loss_rank_avg": 0.16956907510757446, "step": 900, "valid_targets_mean": 5790.5, "valid_targets_min": 2026 }, { "epoch": 1.4719283970707893, "grad_norm": 0.6479521917332159, "learning_rate": 3.854664597165795e-05, "loss": 0.3106, "loss_nan_ranks": 0, "loss_rank_avg": 0.18413260579109192, "step": 905, "valid_targets_mean": 4738.2, "valid_targets_min": 956 }, { "epoch": 1.4800650935720099, "grad_norm": 0.6614607029109295, "learning_rate": 3.851614495268308e-05, "loss": 0.2903, "loss_nan_ranks": 0, "loss_rank_avg": 0.12402161210775375, "step": 910, "valid_targets_mean": 6095.1, "valid_targets_min": 1638 }, { "epoch": 1.4882017900732303, "grad_norm": 0.5271086668666808, "learning_rate": 3.848533951558912e-05, "loss": 0.3058, "loss_nan_ranks": 0, "loss_rank_avg": 0.1627025306224823, "step": 915, "valid_targets_mean": 5300.0, "valid_targets_min": 3448 }, { "epoch": 1.4963384865744507, "grad_norm": 0.4963158372629004, "learning_rate": 3.845423016683856e-05, "loss": 0.2982, "loss_nan_ranks": 0, "loss_rank_avg": 0.14617714285850525, "step": 920, "valid_targets_mean": 5295.8, "valid_targets_min": 2628 }, { "epoch": 1.5044751830756713, "grad_norm": 0.5240147926067843, "learning_rate": 3.842281741789044e-05, "loss": 0.3, "loss_nan_ranks": 0, "loss_rank_avg": 0.17961186170578003, "step": 925, "valid_targets_mean": 6973.5, "valid_targets_min": 3698 }, { "epoch": 1.512611879576892, "grad_norm": 0.5416943235639524, "learning_rate": 3.839110178519189e-05, "loss": 0.2817, "loss_nan_ranks": 0, "loss_rank_avg": 0.16294705867767334, "step": 930, "valid_targets_mean": 5591.8, "valid_targets_min": 1248 }, { "epoch": 1.5207485760781123, "grad_norm": 0.5293043927321138, "learning_rate": 3.835908379016966e-05, "loss": 0.3194, "loss_nan_ranks": 0, "loss_rank_avg": 0.18354995548725128, "step": 935, "valid_targets_mean": 6090.0, "valid_targets_min": 2196 }, { "epoch": 1.5288852725793327, "grad_norm": 0.6655706480297668, "learning_rate": 3.832676395922153e-05, "loss": 0.3233, "loss_nan_ranks": 0, "loss_rank_avg": 0.1539248526096344, "step": 940, "valid_targets_mean": 5697.2, "valid_targets_min": 1431 }, { "epoch": 1.5370219690805533, "grad_norm": 0.4426293049857693, "learning_rate": 3.82941428237077e-05, "loss": 0.3199, "loss_nan_ranks": 0, "loss_rank_avg": 0.14680266380310059, "step": 945, "valid_targets_mean": 7124.8, "valid_targets_min": 2558 }, { "epoch": 1.545158665581774, "grad_norm": 0.5298814060383792, "learning_rate": 3.826122091994198e-05, "loss": 0.3119, "loss_nan_ranks": 0, "loss_rank_avg": 0.19289115071296692, "step": 950, "valid_targets_mean": 6667.8, "valid_targets_min": 4416 }, { "epoch": 1.5532953620829943, "grad_norm": 0.5978964272190899, "learning_rate": 3.822799878918307e-05, "loss": 0.2975, "loss_nan_ranks": 0, "loss_rank_avg": 0.1660599559545517, "step": 955, "valid_targets_mean": 5468.9, "valid_targets_min": 2193 }, { "epoch": 1.5614320585842147, "grad_norm": 0.561888873495537, "learning_rate": 3.8194476977625556e-05, "loss": 0.289, "loss_nan_ranks": 0, "loss_rank_avg": 0.16075164079666138, "step": 960, "valid_targets_mean": 5366.9, "valid_targets_min": 2111 }, { "epoch": 1.5695687550854354, "grad_norm": 0.4590821633958237, "learning_rate": 3.8160656036391024e-05, "loss": 0.2967, "loss_nan_ranks": 0, "loss_rank_avg": 0.1680944561958313, "step": 965, "valid_targets_mean": 5881.0, "valid_targets_min": 1981 }, { "epoch": 1.577705451586656, "grad_norm": 0.5016615802728864, "learning_rate": 3.812653652151893e-05, "loss": 0.3151, "loss_nan_ranks": 0, "loss_rank_avg": 0.13341429829597473, "step": 970, "valid_targets_mean": 5605.9, "valid_targets_min": 611 }, { "epoch": 1.5858421480878762, "grad_norm": 0.5543813724974704, "learning_rate": 3.809211899395749e-05, "loss": 0.3306, "loss_nan_ranks": 0, "loss_rank_avg": 0.14888155460357666, "step": 975, "valid_targets_mean": 4731.4, "valid_targets_min": 2004 }, { "epoch": 1.5939788445890968, "grad_norm": 0.6038340910652956, "learning_rate": 3.8057404019554464e-05, "loss": 0.3164, "loss_nan_ranks": 0, "loss_rank_avg": 0.20221802592277527, "step": 980, "valid_targets_mean": 5403.4, "valid_targets_min": 2495 }, { "epoch": 1.6021155410903174, "grad_norm": 0.5913190155057948, "learning_rate": 3.802239216904782e-05, "loss": 0.2934, "loss_nan_ranks": 0, "loss_rank_avg": 0.12410770356655121, "step": 985, "valid_targets_mean": 3962.5, "valid_targets_min": 617 }, { "epoch": 1.6102522375915378, "grad_norm": 0.6202617073499859, "learning_rate": 3.79870840180564e-05, "loss": 0.3299, "loss_nan_ranks": 0, "loss_rank_avg": 0.21062825620174408, "step": 990, "valid_targets_mean": 5342.4, "valid_targets_min": 2829 }, { "epoch": 1.6183889340927582, "grad_norm": 0.42689752582314566, "learning_rate": 3.795148014707042e-05, "loss": 0.3248, "loss_nan_ranks": 0, "loss_rank_avg": 0.13294441998004913, "step": 995, "valid_targets_mean": 6876.8, "valid_targets_min": 3548 }, { "epoch": 1.6265256305939788, "grad_norm": 0.5097378796851677, "learning_rate": 3.791558114144192e-05, "loss": 0.3253, "loss_nan_ranks": 0, "loss_rank_avg": 0.1804441213607788, "step": 1000, "valid_targets_mean": 5285.4, "valid_targets_min": 492 }, { "epoch": 1.6346623270951994, "grad_norm": 0.6005808241710359, "learning_rate": 3.7879387591375174e-05, "loss": 0.3049, "loss_nan_ranks": 0, "loss_rank_avg": 0.1667994111776352, "step": 1005, "valid_targets_mean": 4509.6, "valid_targets_min": 1333 }, { "epoch": 1.6427990235964198, "grad_norm": 0.5231818030054007, "learning_rate": 3.7842900091916956e-05, "loss": 0.3145, "loss_nan_ranks": 0, "loss_rank_avg": 0.13126087188720703, "step": 1010, "valid_targets_mean": 4980.8, "valid_targets_min": 1418 }, { "epoch": 1.6509357200976402, "grad_norm": 0.5627337448855949, "learning_rate": 3.7806119242946785e-05, "loss": 0.3003, "loss_nan_ranks": 0, "loss_rank_avg": 0.15183790028095245, "step": 1015, "valid_targets_mean": 4827.0, "valid_targets_min": 1418 }, { "epoch": 1.6590724165988608, "grad_norm": 0.5414919926293886, "learning_rate": 3.7769045649167034e-05, "loss": 0.3154, "loss_nan_ranks": 0, "loss_rank_avg": 0.13620023429393768, "step": 1020, "valid_targets_mean": 5039.8, "valid_targets_min": 1019 }, { "epoch": 1.6672091131000815, "grad_norm": 0.7328913562496312, "learning_rate": 3.7731679920093e-05, "loss": 0.3137, "loss_nan_ranks": 0, "loss_rank_avg": 0.1815638542175293, "step": 1025, "valid_targets_mean": 5956.9, "valid_targets_min": 3557 }, { "epoch": 1.6753458096013019, "grad_norm": 0.4817503231027874, "learning_rate": 3.7694022670042894e-05, "loss": 0.3071, "loss_nan_ranks": 0, "loss_rank_avg": 0.1990923136472702, "step": 1030, "valid_targets_mean": 8180.1, "valid_targets_min": 2581 }, { "epoch": 1.6834825061025223, "grad_norm": 0.5371824559449501, "learning_rate": 3.765607451812773e-05, "loss": 0.2847, "loss_nan_ranks": 0, "loss_rank_avg": 0.14338502287864685, "step": 1035, "valid_targets_mean": 6586.2, "valid_targets_min": 2170 }, { "epoch": 1.6916192026037429, "grad_norm": 0.5238554557666614, "learning_rate": 3.7617836088241144e-05, "loss": 0.3082, "loss_nan_ranks": 0, "loss_rank_avg": 0.17069703340530396, "step": 1040, "valid_targets_mean": 7230.1, "valid_targets_min": 4015 }, { "epoch": 1.6997558991049635, "grad_norm": 0.5512994537952781, "learning_rate": 3.757930800904914e-05, "loss": 0.3302, "loss_nan_ranks": 0, "loss_rank_avg": 0.18536214530467987, "step": 1045, "valid_targets_mean": 5432.5, "valid_targets_min": 2706 }, { "epoch": 1.707892595606184, "grad_norm": 0.48107844360810964, "learning_rate": 3.754049091397976e-05, "loss": 0.2831, "loss_nan_ranks": 0, "loss_rank_avg": 0.14424890279769897, "step": 1050, "valid_targets_mean": 5978.6, "valid_targets_min": 2666 }, { "epoch": 1.7160292921074043, "grad_norm": 0.6075024591611888, "learning_rate": 3.7501385441212664e-05, "loss": 0.3182, "loss_nan_ranks": 0, "loss_rank_avg": 0.17810899019241333, "step": 1055, "valid_targets_mean": 4907.1, "valid_targets_min": 1817 }, { "epoch": 1.724165988608625, "grad_norm": 0.5996016937895567, "learning_rate": 3.746199223366863e-05, "loss": 0.3143, "loss_nan_ranks": 0, "loss_rank_avg": 0.1289026141166687, "step": 1060, "valid_targets_mean": 5785.2, "valid_targets_min": 2095 }, { "epoch": 1.7323026851098455, "grad_norm": 0.5765570637174628, "learning_rate": 3.7422311938999013e-05, "loss": 0.3179, "loss_nan_ranks": 0, "loss_rank_avg": 0.16623811423778534, "step": 1065, "valid_targets_mean": 4367.6, "valid_targets_min": 665 }, { "epoch": 1.740439381611066, "grad_norm": 0.5940920131339937, "learning_rate": 3.738234520957506e-05, "loss": 0.3068, "loss_nan_ranks": 0, "loss_rank_avg": 0.19219470024108887, "step": 1070, "valid_targets_mean": 6104.2, "valid_targets_min": 1766 }, { "epoch": 1.7485760781122863, "grad_norm": 0.5700715611730844, "learning_rate": 3.73420927024772e-05, "loss": 0.3197, "loss_nan_ranks": 0, "loss_rank_avg": 0.19549089670181274, "step": 1075, "valid_targets_mean": 5461.0, "valid_targets_min": 1614 }, { "epoch": 1.756712774613507, "grad_norm": 0.7143078330637325, "learning_rate": 3.730155507948426e-05, "loss": 0.3209, "loss_nan_ranks": 0, "loss_rank_avg": 0.13924923539161682, "step": 1080, "valid_targets_mean": 5168.4, "valid_targets_min": 2990 }, { "epoch": 1.7648494711147276, "grad_norm": 0.5056362879775232, "learning_rate": 3.726073300706256e-05, "loss": 0.3125, "loss_nan_ranks": 0, "loss_rank_avg": 0.2037101835012436, "step": 1085, "valid_targets_mean": 7316.2, "valid_targets_min": 4681 }, { "epoch": 1.772986167615948, "grad_norm": 0.6236146764427375, "learning_rate": 3.721962715635495e-05, "loss": 0.2814, "loss_nan_ranks": 0, "loss_rank_avg": 0.10541586577892303, "step": 1090, "valid_targets_mean": 6140.2, "valid_targets_min": 2053 }, { "epoch": 1.7811228641171684, "grad_norm": 0.4808526495829943, "learning_rate": 3.7178238203169804e-05, "loss": 0.3098, "loss_nan_ranks": 0, "loss_rank_avg": 0.11800515651702881, "step": 1095, "valid_targets_mean": 5675.6, "valid_targets_min": 3375 }, { "epoch": 1.789259560618389, "grad_norm": 0.5465172567640042, "learning_rate": 3.7136566827969895e-05, "loss": 0.3057, "loss_nan_ranks": 0, "loss_rank_avg": 0.11254914849996567, "step": 1100, "valid_targets_mean": 4710.8, "valid_targets_min": 3037 }, { "epoch": 1.7973962571196096, "grad_norm": 0.6709120787275277, "learning_rate": 3.70946137158612e-05, "loss": 0.3051, "loss_nan_ranks": 0, "loss_rank_avg": 0.1213892251253128, "step": 1105, "valid_targets_mean": 4375.8, "valid_targets_min": 767 }, { "epoch": 1.80553295362083, "grad_norm": 0.5484870209932681, "learning_rate": 3.705237955658166e-05, "loss": 0.3045, "loss_nan_ranks": 0, "loss_rank_avg": 0.12435522675514221, "step": 1110, "valid_targets_mean": 4072.5, "valid_targets_min": 628 }, { "epoch": 1.8136696501220504, "grad_norm": 0.5750687925217363, "learning_rate": 3.70098650444898e-05, "loss": 0.3174, "loss_nan_ranks": 0, "loss_rank_avg": 0.17003116011619568, "step": 1115, "valid_targets_mean": 5343.2, "valid_targets_min": 2628 }, { "epoch": 1.821806346623271, "grad_norm": 0.546589915088346, "learning_rate": 3.6967070878553346e-05, "loss": 0.2939, "loss_nan_ranks": 0, "loss_rank_avg": 0.13826923072338104, "step": 1120, "valid_targets_mean": 5285.4, "valid_targets_min": 1237 }, { "epoch": 1.8299430431244914, "grad_norm": 0.4773415462163218, "learning_rate": 3.692399776233775e-05, "loss": 0.3012, "loss_nan_ranks": 0, "loss_rank_avg": 0.16702383756637573, "step": 1125, "valid_targets_mean": 6414.5, "valid_targets_min": 913 }, { "epoch": 1.8380797396257118, "grad_norm": 0.5328441386714764, "learning_rate": 3.688064640399456e-05, "loss": 0.3206, "loss_nan_ranks": 0, "loss_rank_avg": 0.19889968633651733, "step": 1130, "valid_targets_mean": 5738.4, "valid_targets_min": 2918 }, { "epoch": 1.8462164361269324, "grad_norm": 0.6976118740867715, "learning_rate": 3.683701751624983e-05, "loss": 0.3086, "loss_nan_ranks": 0, "loss_rank_avg": 0.18962863087654114, "step": 1135, "valid_targets_mean": 4923.5, "valid_targets_min": 566 }, { "epoch": 1.854353132628153, "grad_norm": 0.5304211947920925, "learning_rate": 3.67931118163924e-05, "loss": 0.3114, "loss_nan_ranks": 0, "loss_rank_avg": 0.14399157464504242, "step": 1140, "valid_targets_mean": 4750.4, "valid_targets_min": 3074 }, { "epoch": 1.8624898291293734, "grad_norm": 0.5257505288021834, "learning_rate": 3.674893002626208e-05, "loss": 0.3281, "loss_nan_ranks": 0, "loss_rank_avg": 0.1668822169303894, "step": 1145, "valid_targets_mean": 4587.6, "valid_targets_min": 2853 }, { "epoch": 1.8706265256305938, "grad_norm": 0.5378879554200597, "learning_rate": 3.6704472872237786e-05, "loss": 0.2895, "loss_nan_ranks": 0, "loss_rank_avg": 0.13983070850372314, "step": 1150, "valid_targets_mean": 4616.9, "valid_targets_min": 1062 }, { "epoch": 1.8787632221318145, "grad_norm": 0.4433938061464499, "learning_rate": 3.665974108522562e-05, "loss": 0.2943, "loss_nan_ranks": 0, "loss_rank_avg": 0.13427463173866272, "step": 1155, "valid_targets_mean": 6249.2, "valid_targets_min": 4339 }, { "epoch": 1.886899918633035, "grad_norm": 0.5206360977809323, "learning_rate": 3.6614735400646824e-05, "loss": 0.3296, "loss_nan_ranks": 0, "loss_rank_avg": 0.16344305872917175, "step": 1160, "valid_targets_mean": 5424.0, "valid_targets_min": 1984 }, { "epoch": 1.8950366151342555, "grad_norm": 0.7386914345471229, "learning_rate": 3.6569456558425724e-05, "loss": 0.3082, "loss_nan_ranks": 0, "loss_rank_avg": 0.1590915322303772, "step": 1165, "valid_targets_mean": 4894.9, "valid_targets_min": 1686 }, { "epoch": 1.9031733116354759, "grad_norm": 0.5227919706663646, "learning_rate": 3.6523905302977524e-05, "loss": 0.2904, "loss_nan_ranks": 0, "loss_rank_avg": 0.14777085185050964, "step": 1170, "valid_targets_mean": 5690.5, "valid_targets_min": 2053 }, { "epoch": 1.9113100081366965, "grad_norm": 0.4725060339813615, "learning_rate": 3.64780823831961e-05, "loss": 0.3069, "loss_nan_ranks": 0, "loss_rank_avg": 0.11375989019870758, "step": 1175, "valid_targets_mean": 5967.5, "valid_targets_min": 2992 }, { "epoch": 1.9194467046379171, "grad_norm": 0.5531722742216661, "learning_rate": 3.643198855244167e-05, "loss": 0.3244, "loss_nan_ranks": 0, "loss_rank_avg": 0.16253279149532318, "step": 1180, "valid_targets_mean": 4639.1, "valid_targets_min": 536 }, { "epoch": 1.9275834011391375, "grad_norm": 0.5643086611406565, "learning_rate": 3.6385624568528424e-05, "loss": 0.341, "loss_nan_ranks": 0, "loss_rank_avg": 0.2203579545021057, "step": 1185, "valid_targets_mean": 5916.4, "valid_targets_min": 2444 }, { "epoch": 1.935720097640358, "grad_norm": 0.5188039070960107, "learning_rate": 3.6338991193712045e-05, "loss": 0.3237, "loss_nan_ranks": 0, "loss_rank_avg": 0.15397492051124573, "step": 1190, "valid_targets_mean": 5445.5, "valid_targets_min": 1156 }, { "epoch": 1.9438567941415785, "grad_norm": 0.5944670726923176, "learning_rate": 3.629208919467718e-05, "loss": 0.276, "loss_nan_ranks": 0, "loss_rank_avg": 0.10873277485370636, "step": 1195, "valid_targets_mean": 5434.2, "valid_targets_min": 1056 }, { "epoch": 1.9519934906427991, "grad_norm": 0.5820905612331527, "learning_rate": 3.624491934252487e-05, "loss": 0.2816, "loss_nan_ranks": 0, "loss_rank_avg": 0.17353525757789612, "step": 1200, "valid_targets_mean": 5973.5, "valid_targets_min": 2297 }, { "epoch": 1.9601301871440195, "grad_norm": 0.5328994536277564, "learning_rate": 3.619748241275981e-05, "loss": 0.3057, "loss_nan_ranks": 0, "loss_rank_avg": 0.15726155042648315, "step": 1205, "valid_targets_mean": 5639.8, "valid_targets_min": 2308 }, { "epoch": 1.96826688364524, "grad_norm": 0.5129359181321838, "learning_rate": 3.614977918527767e-05, "loss": 0.3115, "loss_nan_ranks": 0, "loss_rank_avg": 0.18390318751335144, "step": 1210, "valid_targets_mean": 5109.2, "valid_targets_min": 1159 }, { "epoch": 1.9764035801464606, "grad_norm": 0.5994511326540063, "learning_rate": 3.610181044435221e-05, "loss": 0.2885, "loss_nan_ranks": 0, "loss_rank_avg": 0.13535848259925842, "step": 1215, "valid_targets_mean": 3102.2, "valid_targets_min": 560 }, { "epoch": 1.9845402766476812, "grad_norm": 0.4870695756000568, "learning_rate": 3.605357697862242e-05, "loss": 0.3185, "loss_nan_ranks": 0, "loss_rank_avg": 0.12981772422790527, "step": 1220, "valid_targets_mean": 5653.2, "valid_targets_min": 1754 }, { "epoch": 1.9926769731489016, "grad_norm": 0.43943406829275067, "learning_rate": 3.6005079581079545e-05, "loss": 0.2837, "loss_nan_ranks": 0, "loss_rank_avg": 0.13087867200374603, "step": 1225, "valid_targets_mean": 5805.1, "valid_targets_min": 1258 }, { "epoch": 2.0, "grad_norm": 0.9516475150367983, "learning_rate": 3.595631904905406e-05, "loss": 0.275, "loss_nan_ranks": 0, "loss_rank_avg": 0.2887159287929535, "step": 1230, "valid_targets_mean": 6080.8, "valid_targets_min": 2494 }, { "epoch": 2.0081366965012206, "grad_norm": 0.6856718094729896, "learning_rate": 3.590729618420255e-05, "loss": 0.292, "loss_nan_ranks": 0, "loss_rank_avg": 0.12657839059829712, "step": 1235, "valid_targets_mean": 4212.5, "valid_targets_min": 1370 }, { "epoch": 2.016273393002441, "grad_norm": 0.558226531525447, "learning_rate": 3.585801179249452e-05, "loss": 0.3125, "loss_nan_ranks": 0, "loss_rank_avg": 0.1799025982618332, "step": 1240, "valid_targets_mean": 7292.6, "valid_targets_min": 3950 }, { "epoch": 2.0244100895036614, "grad_norm": 0.5075555500011202, "learning_rate": 3.5808466684199166e-05, "loss": 0.3104, "loss_nan_ranks": 0, "loss_rank_avg": 0.15327878296375275, "step": 1245, "valid_targets_mean": 6603.9, "valid_targets_min": 2080 }, { "epoch": 2.032546786004882, "grad_norm": 0.6541052075091615, "learning_rate": 3.575866167387204e-05, "loss": 0.2769, "loss_nan_ranks": 0, "loss_rank_avg": 0.10481029748916626, "step": 1250, "valid_targets_mean": 4328.6, "valid_targets_min": 1036 }, { "epoch": 2.0406834825061027, "grad_norm": 0.5007902862675059, "learning_rate": 3.570859758034165e-05, "loss": 0.3047, "loss_nan_ranks": 0, "loss_rank_avg": 0.11358005553483963, "step": 1255, "valid_targets_mean": 6206.4, "valid_targets_min": 966 }, { "epoch": 2.048820179007323, "grad_norm": 0.4639873782398551, "learning_rate": 3.565827522669605e-05, "loss": 0.2798, "loss_nan_ranks": 0, "loss_rank_avg": 0.18322622776031494, "step": 1260, "valid_targets_mean": 7581.5, "valid_targets_min": 1826 }, { "epoch": 2.0569568755085434, "grad_norm": 0.47229568303905795, "learning_rate": 3.5607695440269214e-05, "loss": 0.2589, "loss_nan_ranks": 0, "loss_rank_avg": 0.11020516604185104, "step": 1265, "valid_targets_mean": 5878.0, "valid_targets_min": 743 }, { "epoch": 2.065093572009764, "grad_norm": 0.4606387724405939, "learning_rate": 3.555685905262751e-05, "loss": 0.2607, "loss_nan_ranks": 0, "loss_rank_avg": 0.12334157526493073, "step": 1270, "valid_targets_mean": 7156.1, "valid_targets_min": 3306 }, { "epoch": 2.0732302685109847, "grad_norm": 0.5568749724181045, "learning_rate": 3.5505766899556026e-05, "loss": 0.283, "loss_nan_ranks": 0, "loss_rank_avg": 0.18671417236328125, "step": 1275, "valid_targets_mean": 5929.2, "valid_targets_min": 2774 }, { "epoch": 2.081366965012205, "grad_norm": 0.5320198579082824, "learning_rate": 3.5454419821044786e-05, "loss": 0.2846, "loss_nan_ranks": 0, "loss_rank_avg": 0.1624656319618225, "step": 1280, "valid_targets_mean": 5359.9, "valid_targets_min": 1879 }, { "epoch": 2.0895036615134255, "grad_norm": 0.4946581187629097, "learning_rate": 3.540281866127496e-05, "loss": 0.2829, "loss_nan_ranks": 0, "loss_rank_avg": 0.113202303647995, "step": 1285, "valid_targets_mean": 4963.8, "valid_targets_min": 590 }, { "epoch": 2.097640358014646, "grad_norm": 0.5314804091550819, "learning_rate": 3.5350964268605006e-05, "loss": 0.2986, "loss_nan_ranks": 0, "loss_rank_avg": 0.1298123598098755, "step": 1290, "valid_targets_mean": 5789.2, "valid_targets_min": 524 }, { "epoch": 2.1057770545158667, "grad_norm": 0.4608248324996564, "learning_rate": 3.5298857495556684e-05, "loss": 0.2679, "loss_nan_ranks": 0, "loss_rank_avg": 0.09899343550205231, "step": 1295, "valid_targets_mean": 6090.4, "valid_targets_min": 625 }, { "epoch": 2.113913751017087, "grad_norm": 0.6160654304320085, "learning_rate": 3.524649919880108e-05, "loss": 0.3006, "loss_nan_ranks": 0, "loss_rank_avg": 0.1561860293149948, "step": 1300, "valid_targets_mean": 5319.5, "valid_targets_min": 2221 }, { "epoch": 2.1220504475183075, "grad_norm": 0.6034183220777789, "learning_rate": 3.519389023914449e-05, "loss": 0.2731, "loss_nan_ranks": 0, "loss_rank_avg": 0.1617409586906433, "step": 1305, "valid_targets_mean": 4925.8, "valid_targets_min": 1622 }, { "epoch": 2.130187144019528, "grad_norm": 0.5445584399411685, "learning_rate": 3.5141031481514276e-05, "loss": 0.2927, "loss_nan_ranks": 0, "loss_rank_avg": 0.15059779584407806, "step": 1310, "valid_targets_mean": 4658.4, "valid_targets_min": 2734 }, { "epoch": 2.1383238405207488, "grad_norm": 0.5409881257424901, "learning_rate": 3.508792379494468e-05, "loss": 0.2813, "loss_nan_ranks": 0, "loss_rank_avg": 0.1463170051574707, "step": 1315, "valid_targets_mean": 5791.5, "valid_targets_min": 1064 }, { "epoch": 2.146460537021969, "grad_norm": 1.106581439320117, "learning_rate": 3.503456805256246e-05, "loss": 0.2767, "loss_nan_ranks": 0, "loss_rank_avg": 0.1498536616563797, "step": 1320, "valid_targets_mean": 5623.2, "valid_targets_min": 2620 }, { "epoch": 2.1545972335231895, "grad_norm": 0.4584831942256986, "learning_rate": 3.4980965131572616e-05, "loss": 0.2783, "loss_nan_ranks": 0, "loss_rank_avg": 0.14147350192070007, "step": 1325, "valid_targets_mean": 5904.6, "valid_targets_min": 3878 }, { "epoch": 2.16273393002441, "grad_norm": 0.4492273639183458, "learning_rate": 3.492711591324392e-05, "loss": 0.2733, "loss_nan_ranks": 0, "loss_rank_avg": 0.14748775959014893, "step": 1330, "valid_targets_mean": 5023.4, "valid_targets_min": 2861 }, { "epoch": 2.170870626525631, "grad_norm": 0.5811998512861577, "learning_rate": 3.487302128289445e-05, "loss": 0.3088, "loss_nan_ranks": 0, "loss_rank_avg": 0.11501553654670715, "step": 1335, "valid_targets_mean": 2852.8, "valid_targets_min": 977 }, { "epoch": 2.179007323026851, "grad_norm": 0.4764245873738506, "learning_rate": 3.481868212987702e-05, "loss": 0.2818, "loss_nan_ranks": 0, "loss_rank_avg": 0.1383422166109085, "step": 1340, "valid_targets_mean": 6408.1, "valid_targets_min": 2128 }, { "epoch": 2.1871440195280716, "grad_norm": 0.48558055183022075, "learning_rate": 3.476409934756456e-05, "loss": 0.2733, "loss_nan_ranks": 0, "loss_rank_avg": 0.1000407487154007, "step": 1345, "valid_targets_mean": 5105.9, "valid_targets_min": 542 }, { "epoch": 2.195280716029292, "grad_norm": 0.5180718638517471, "learning_rate": 3.470927383333544e-05, "loss": 0.2879, "loss_nan_ranks": 0, "loss_rank_avg": 0.10666623711585999, "step": 1350, "valid_targets_mean": 5258.9, "valid_targets_min": 3522 }, { "epoch": 2.203417412530513, "grad_norm": 0.5400230528001939, "learning_rate": 3.46542064885587e-05, "loss": 0.3084, "loss_nan_ranks": 0, "loss_rank_avg": 0.12988999485969543, "step": 1355, "valid_targets_mean": 4880.5, "valid_targets_min": 573 }, { "epoch": 2.211554109031733, "grad_norm": 0.45852170946065385, "learning_rate": 3.459889821857926e-05, "loss": 0.2836, "loss_nan_ranks": 0, "loss_rank_avg": 0.11199237406253815, "step": 1360, "valid_targets_mean": 4982.0, "valid_targets_min": 310 }, { "epoch": 2.2196908055329536, "grad_norm": 0.5665127278933965, "learning_rate": 3.4543349932702984e-05, "loss": 0.3028, "loss_nan_ranks": 0, "loss_rank_avg": 0.18964138627052307, "step": 1365, "valid_targets_mean": 6463.2, "valid_targets_min": 3622 }, { "epoch": 2.2278275020341742, "grad_norm": 0.5118619545403494, "learning_rate": 3.448756254418179e-05, "loss": 0.2826, "loss_nan_ranks": 0, "loss_rank_avg": 0.18084275722503662, "step": 1370, "valid_targets_mean": 5036.5, "valid_targets_min": 1393 }, { "epoch": 2.2359641985353944, "grad_norm": 0.4567137661572972, "learning_rate": 3.443153697019861e-05, "loss": 0.2964, "loss_nan_ranks": 0, "loss_rank_avg": 0.13496790826320648, "step": 1375, "valid_targets_mean": 6337.4, "valid_targets_min": 2816 }, { "epoch": 2.244100895036615, "grad_norm": 0.5129895131737416, "learning_rate": 3.437527413185227e-05, "loss": 0.294, "loss_nan_ranks": 0, "loss_rank_avg": 0.15807993710041046, "step": 1380, "valid_targets_mean": 6726.0, "valid_targets_min": 1732 }, { "epoch": 2.2522375915378356, "grad_norm": 0.658861425263113, "learning_rate": 3.431877495414242e-05, "loss": 0.295, "loss_nan_ranks": 0, "loss_rank_avg": 0.119639553129673, "step": 1385, "valid_targets_mean": 5690.6, "valid_targets_min": 1710 }, { "epoch": 2.2603742880390563, "grad_norm": 0.5053124575310604, "learning_rate": 3.42620403659543e-05, "loss": 0.2872, "loss_nan_ranks": 0, "loss_rank_avg": 0.14893598854541779, "step": 1390, "valid_targets_mean": 5824.2, "valid_targets_min": 741 }, { "epoch": 2.268510984540277, "grad_norm": 0.5549205480957295, "learning_rate": 3.420507130004341e-05, "loss": 0.2929, "loss_nan_ranks": 0, "loss_rank_avg": 0.14574193954467773, "step": 1395, "valid_targets_mean": 5895.8, "valid_targets_min": 3196 }, { "epoch": 2.276647681041497, "grad_norm": 0.5169854577549462, "learning_rate": 3.414786869302029e-05, "loss": 0.2715, "loss_nan_ranks": 0, "loss_rank_avg": 0.1294897347688675, "step": 1400, "valid_targets_mean": 4723.2, "valid_targets_min": 3238 }, { "epoch": 2.2847843775427177, "grad_norm": 0.4968472508374019, "learning_rate": 3.4090433485334996e-05, "loss": 0.2776, "loss_nan_ranks": 0, "loss_rank_avg": 0.13790994882583618, "step": 1405, "valid_targets_mean": 6752.5, "valid_targets_min": 2943 }, { "epoch": 2.2929210740439383, "grad_norm": 0.5185289577994608, "learning_rate": 3.403276662126173e-05, "loss": 0.2816, "loss_nan_ranks": 0, "loss_rank_avg": 0.1724536418914795, "step": 1410, "valid_targets_mean": 6443.1, "valid_targets_min": 1159 }, { "epoch": 2.3010577705451585, "grad_norm": 0.5649680792199295, "learning_rate": 3.397486904888328e-05, "loss": 0.2871, "loss_nan_ranks": 0, "loss_rank_avg": 0.13218429684638977, "step": 1415, "valid_targets_mean": 4330.9, "valid_targets_min": 2339 }, { "epoch": 2.309194467046379, "grad_norm": 0.5035857907328071, "learning_rate": 3.391674172007544e-05, "loss": 0.2884, "loss_nan_ranks": 0, "loss_rank_avg": 0.1316101849079132, "step": 1420, "valid_targets_mean": 4778.2, "valid_targets_min": 2482 }, { "epoch": 2.3173311635475997, "grad_norm": 0.5303641033831891, "learning_rate": 3.3858385590491347e-05, "loss": 0.298, "loss_nan_ranks": 0, "loss_rank_avg": 0.1569986343383789, "step": 1425, "valid_targets_mean": 6596.2, "valid_targets_min": 4475 }, { "epoch": 2.3254678600488203, "grad_norm": 0.48585758657147765, "learning_rate": 3.379980161954578e-05, "loss": 0.2653, "loss_nan_ranks": 0, "loss_rank_avg": 0.11201968044042587, "step": 1430, "valid_targets_mean": 5466.8, "valid_targets_min": 2472 }, { "epoch": 2.3336045565500405, "grad_norm": 0.4949945647060311, "learning_rate": 3.3740990770399404e-05, "loss": 0.3016, "loss_nan_ranks": 0, "loss_rank_avg": 0.15348434448242188, "step": 1435, "valid_targets_mean": 5463.9, "valid_targets_min": 2560 }, { "epoch": 2.341741253051261, "grad_norm": 0.51532488211287, "learning_rate": 3.368195400994289e-05, "loss": 0.2675, "loss_nan_ranks": 0, "loss_rank_avg": 0.14001132547855377, "step": 1440, "valid_targets_mean": 5797.4, "valid_targets_min": 3868 }, { "epoch": 2.3498779495524817, "grad_norm": 0.4954512879924778, "learning_rate": 3.362269230878107e-05, "loss": 0.2874, "loss_nan_ranks": 0, "loss_rank_avg": 0.1684633195400238, "step": 1445, "valid_targets_mean": 5250.2, "valid_targets_min": 484 }, { "epoch": 2.3580146460537024, "grad_norm": 0.5206552287941425, "learning_rate": 3.356320664121694e-05, "loss": 0.3099, "loss_nan_ranks": 0, "loss_rank_avg": 0.13183483481407166, "step": 1450, "valid_targets_mean": 5600.0, "valid_targets_min": 2037 }, { "epoch": 2.3661513425549225, "grad_norm": 0.5806830244648058, "learning_rate": 3.350349798523566e-05, "loss": 0.2887, "loss_nan_ranks": 0, "loss_rank_avg": 0.11899223923683167, "step": 1455, "valid_targets_mean": 4941.5, "valid_targets_min": 1237 }, { "epoch": 2.374288039056143, "grad_norm": 0.4835797115209612, "learning_rate": 3.344356732248849e-05, "loss": 0.2934, "loss_nan_ranks": 0, "loss_rank_avg": 0.12682092189788818, "step": 1460, "valid_targets_mean": 5932.6, "valid_targets_min": 2233 }, { "epoch": 2.382424735557364, "grad_norm": 0.46420895136183626, "learning_rate": 3.33834156382766e-05, "loss": 0.2705, "loss_nan_ranks": 0, "loss_rank_avg": 0.1228257492184639, "step": 1465, "valid_targets_mean": 6454.4, "valid_targets_min": 3734 }, { "epoch": 2.3905614320585844, "grad_norm": 0.4848046054819125, "learning_rate": 3.332304392153494e-05, "loss": 0.2776, "loss_nan_ranks": 0, "loss_rank_avg": 0.13247308135032654, "step": 1470, "valid_targets_mean": 5843.1, "valid_targets_min": 3532 }, { "epoch": 2.3986981285598046, "grad_norm": 0.5322468446136851, "learning_rate": 3.326245316481591e-05, "loss": 0.2844, "loss_nan_ranks": 0, "loss_rank_avg": 0.14443229138851166, "step": 1475, "valid_targets_mean": 5665.5, "valid_targets_min": 2645 }, { "epoch": 2.406834825061025, "grad_norm": 0.4953219209876432, "learning_rate": 3.320164436427311e-05, "loss": 0.2996, "loss_nan_ranks": 0, "loss_rank_avg": 0.12060455232858658, "step": 1480, "valid_targets_mean": 5264.1, "valid_targets_min": 3318 }, { "epoch": 2.414971521562246, "grad_norm": 0.5103794103032024, "learning_rate": 3.314061851964491e-05, "loss": 0.2823, "loss_nan_ranks": 0, "loss_rank_avg": 0.12996214628219604, "step": 1485, "valid_targets_mean": 4645.6, "valid_targets_min": 3056 }, { "epoch": 2.423108218063466, "grad_norm": 0.48812963792791125, "learning_rate": 3.307937663423804e-05, "loss": 0.2775, "loss_nan_ranks": 0, "loss_rank_avg": 0.13980984687805176, "step": 1490, "valid_targets_mean": 6567.1, "valid_targets_min": 3602 }, { "epoch": 2.4312449145646866, "grad_norm": 0.6781638230036592, "learning_rate": 3.3017919714911094e-05, "loss": 0.2775, "loss_nan_ranks": 0, "loss_rank_avg": 0.11503338813781738, "step": 1495, "valid_targets_mean": 5187.6, "valid_targets_min": 598 }, { "epoch": 2.4393816110659072, "grad_norm": 0.494679876515722, "learning_rate": 3.295624877205796e-05, "loss": 0.293, "loss_nan_ranks": 0, "loss_rank_avg": 0.12201376259326935, "step": 1500, "valid_targets_mean": 5504.5, "valid_targets_min": 1291 }, { "epoch": 2.447518307567128, "grad_norm": 0.6017430889988331, "learning_rate": 3.2894364819591224e-05, "loss": 0.2944, "loss_nan_ranks": 0, "loss_rank_avg": 0.154220849275589, "step": 1505, "valid_targets_mean": 4390.1, "valid_targets_min": 1214 }, { "epoch": 2.4556550040683485, "grad_norm": 0.5265681649533256, "learning_rate": 3.28322688749255e-05, "loss": 0.3226, "loss_nan_ranks": 0, "loss_rank_avg": 0.14010374248027802, "step": 1510, "valid_targets_mean": 4612.5, "valid_targets_min": 1296 }, { "epoch": 2.4637917005695686, "grad_norm": 0.551484588945014, "learning_rate": 3.2769961958960694e-05, "loss": 0.2759, "loss_nan_ranks": 0, "loss_rank_avg": 0.14503279328346252, "step": 1515, "valid_targets_mean": 5862.9, "valid_targets_min": 2141 }, { "epoch": 2.4719283970707893, "grad_norm": 0.5213608708077778, "learning_rate": 3.270744509606523e-05, "loss": 0.2875, "loss_nan_ranks": 0, "loss_rank_avg": 0.12514446675777435, "step": 1520, "valid_targets_mean": 5143.2, "valid_targets_min": 2810 }, { "epoch": 2.48006509357201, "grad_norm": 0.5609869887661976, "learning_rate": 3.26447193140592e-05, "loss": 0.2815, "loss_nan_ranks": 0, "loss_rank_avg": 0.16480261087417603, "step": 1525, "valid_targets_mean": 4906.8, "valid_targets_min": 2091 }, { "epoch": 2.48820179007323, "grad_norm": 0.45622929795341044, "learning_rate": 3.2581785644197456e-05, "loss": 0.2833, "loss_nan_ranks": 0, "loss_rank_avg": 0.10129719972610474, "step": 1530, "valid_targets_mean": 4956.2, "valid_targets_min": 2164 }, { "epoch": 2.4963384865744507, "grad_norm": 0.5164564778909829, "learning_rate": 3.251864512115271e-05, "loss": 0.3104, "loss_nan_ranks": 0, "loss_rank_avg": 0.2165476679801941, "step": 1535, "valid_targets_mean": 6606.1, "valid_targets_min": 2363 }, { "epoch": 2.5044751830756713, "grad_norm": 0.3983072775801996, "learning_rate": 3.2455298782998424e-05, "loss": 0.2737, "loss_nan_ranks": 0, "loss_rank_avg": 0.10032185167074203, "step": 1540, "valid_targets_mean": 8497.1, "valid_targets_min": 2843 }, { "epoch": 2.512611879576892, "grad_norm": 0.5732682239726878, "learning_rate": 3.2391747671191854e-05, "loss": 0.256, "loss_nan_ranks": 0, "loss_rank_avg": 0.12304198741912842, "step": 1545, "valid_targets_mean": 6310.2, "valid_targets_min": 2146 }, { "epoch": 2.5207485760781125, "grad_norm": 0.48301651904457216, "learning_rate": 3.2327992830556846e-05, "loss": 0.293, "loss_nan_ranks": 0, "loss_rank_avg": 0.1629238873720169, "step": 1550, "valid_targets_mean": 5748.8, "valid_targets_min": 845 }, { "epoch": 2.5288852725793327, "grad_norm": 0.4455251023255143, "learning_rate": 3.22640353092667e-05, "loss": 0.3035, "loss_nan_ranks": 0, "loss_rank_avg": 0.1761193573474884, "step": 1555, "valid_targets_mean": 5489.5, "valid_targets_min": 1059 }, { "epoch": 2.5370219690805533, "grad_norm": 0.4809788733224243, "learning_rate": 3.2199876158826915e-05, "loss": 0.2979, "loss_nan_ranks": 0, "loss_rank_avg": 0.1458398401737213, "step": 1560, "valid_targets_mean": 7149.8, "valid_targets_min": 3817 }, { "epoch": 2.545158665581774, "grad_norm": 0.45307852053685194, "learning_rate": 3.2135516434057915e-05, "loss": 0.2907, "loss_nan_ranks": 0, "loss_rank_avg": 0.11577823013067245, "step": 1565, "valid_targets_mean": 5393.9, "valid_targets_min": 2233 }, { "epoch": 2.553295362082994, "grad_norm": 0.49760950499062984, "learning_rate": 3.2070957193077705e-05, "loss": 0.2756, "loss_nan_ranks": 0, "loss_rank_avg": 0.12272712588310242, "step": 1570, "valid_targets_mean": 4861.1, "valid_targets_min": 3252 }, { "epoch": 2.5614320585842147, "grad_norm": 0.5355275643102434, "learning_rate": 3.200619949728448e-05, "loss": 0.2694, "loss_nan_ranks": 0, "loss_rank_avg": 0.1525430828332901, "step": 1575, "valid_targets_mean": 6466.9, "valid_targets_min": 3548 }, { "epoch": 2.5695687550854354, "grad_norm": 0.5018072667233595, "learning_rate": 3.194124441133916e-05, "loss": 0.2818, "loss_nan_ranks": 0, "loss_rank_avg": 0.14310288429260254, "step": 1580, "valid_targets_mean": 4550.6, "valid_targets_min": 2784 }, { "epoch": 2.577705451586656, "grad_norm": 0.5173938528400699, "learning_rate": 3.187609300314789e-05, "loss": 0.3062, "loss_nan_ranks": 0, "loss_rank_avg": 0.13510233163833618, "step": 1585, "valid_targets_mean": 5440.2, "valid_targets_min": 923 }, { "epoch": 2.585842148087876, "grad_norm": 0.5159504691075016, "learning_rate": 3.181074634384451e-05, "loss": 0.2891, "loss_nan_ranks": 0, "loss_rank_avg": 0.14067131280899048, "step": 1590, "valid_targets_mean": 5820.6, "valid_targets_min": 3059 }, { "epoch": 2.5939788445890968, "grad_norm": 0.5405735538422601, "learning_rate": 3.1745205507772876e-05, "loss": 0.2818, "loss_nan_ranks": 0, "loss_rank_avg": 0.12036160379648209, "step": 1595, "valid_targets_mean": 5669.1, "valid_targets_min": 2723 }, { "epoch": 2.6021155410903174, "grad_norm": 0.7407500991451971, "learning_rate": 3.16794715724693e-05, "loss": 0.2834, "loss_nan_ranks": 0, "loss_rank_avg": 0.15827390551567078, "step": 1600, "valid_targets_mean": 5583.9, "valid_targets_min": 2685 }, { "epoch": 2.6102522375915376, "grad_norm": 0.5099598998443594, "learning_rate": 3.161354561864474e-05, "loss": 0.2981, "loss_nan_ranks": 0, "loss_rank_avg": 0.1440209299325943, "step": 1605, "valid_targets_mean": 5326.2, "valid_targets_min": 1707 }, { "epoch": 2.618388934092758, "grad_norm": 0.5479785273711072, "learning_rate": 3.154742873016707e-05, "loss": 0.2871, "loss_nan_ranks": 0, "loss_rank_avg": 0.13522969186306, "step": 1610, "valid_targets_mean": 5222.2, "valid_targets_min": 1303 }, { "epoch": 2.626525630593979, "grad_norm": 0.47481378459752427, "learning_rate": 3.14811219940433e-05, "loss": 0.272, "loss_nan_ranks": 0, "loss_rank_avg": 0.13894972205162048, "step": 1615, "valid_targets_mean": 6755.9, "valid_targets_min": 3830 }, { "epoch": 2.6346623270951994, "grad_norm": 0.4650084315327305, "learning_rate": 3.141462650040161e-05, "loss": 0.2854, "loss_nan_ranks": 0, "loss_rank_avg": 0.1224336326122284, "step": 1620, "valid_targets_mean": 5373.9, "valid_targets_min": 1348 }, { "epoch": 2.64279902359642, "grad_norm": 0.5401018992903237, "learning_rate": 3.134794334247351e-05, "loss": 0.31, "loss_nan_ranks": 0, "loss_rank_avg": 0.1545572429895401, "step": 1625, "valid_targets_mean": 5654.0, "valid_targets_min": 1794 }, { "epoch": 2.6509357200976402, "grad_norm": 0.48016953909282284, "learning_rate": 3.1281073616575856e-05, "loss": 0.2915, "loss_nan_ranks": 0, "loss_rank_avg": 0.13257913291454315, "step": 1630, "valid_targets_mean": 5957.4, "valid_targets_min": 3444 }, { "epoch": 2.659072416598861, "grad_norm": 0.5599972237868494, "learning_rate": 3.121401842209279e-05, "loss": 0.2747, "loss_nan_ranks": 0, "loss_rank_avg": 0.22545486688613892, "step": 1635, "valid_targets_mean": 6662.0, "valid_targets_min": 3924 }, { "epoch": 2.6672091131000815, "grad_norm": 0.5099869798156484, "learning_rate": 3.114677886145768e-05, "loss": 0.2907, "loss_nan_ranks": 0, "loss_rank_avg": 0.15294325351715088, "step": 1640, "valid_targets_mean": 5627.6, "valid_targets_min": 2398 }, { "epoch": 2.6753458096013016, "grad_norm": 0.5577431582136917, "learning_rate": 3.107935604013501e-05, "loss": 0.2957, "loss_nan_ranks": 0, "loss_rank_avg": 0.1127748042345047, "step": 1645, "valid_targets_mean": 4538.1, "valid_targets_min": 1505 }, { "epoch": 2.6834825061025223, "grad_norm": 0.5463423029256798, "learning_rate": 3.101175106660219e-05, "loss": 0.3001, "loss_nan_ranks": 0, "loss_rank_avg": 0.1513296216726303, "step": 1650, "valid_targets_mean": 5564.5, "valid_targets_min": 1164 }, { "epoch": 2.691619202603743, "grad_norm": 0.6027625180902552, "learning_rate": 3.094396505233135e-05, "loss": 0.3009, "loss_nan_ranks": 0, "loss_rank_avg": 0.1423185020685196, "step": 1655, "valid_targets_mean": 4589.9, "valid_targets_min": 1015 }, { "epoch": 2.6997558991049635, "grad_norm": 0.43885668468200845, "learning_rate": 3.087599911177103e-05, "loss": 0.2798, "loss_nan_ranks": 0, "loss_rank_avg": 0.12957511842250824, "step": 1660, "valid_targets_mean": 7121.9, "valid_targets_min": 4396 }, { "epoch": 2.707892595606184, "grad_norm": 0.5377034711492127, "learning_rate": 3.0807854362327906e-05, "loss": 0.3039, "loss_nan_ranks": 0, "loss_rank_avg": 0.14502663910388947, "step": 1665, "valid_targets_mean": 5456.5, "valid_targets_min": 3570 }, { "epoch": 2.7160292921074043, "grad_norm": 0.5001336173501958, "learning_rate": 3.073953192434837e-05, "loss": 0.2666, "loss_nan_ranks": 0, "loss_rank_avg": 0.12598839402198792, "step": 1670, "valid_targets_mean": 4810.9, "valid_targets_min": 873 }, { "epoch": 2.724165988608625, "grad_norm": 0.5220789996194123, "learning_rate": 3.067103292110017e-05, "loss": 0.2806, "loss_nan_ranks": 0, "loss_rank_avg": 0.14378760755062103, "step": 1675, "valid_targets_mean": 4979.9, "valid_targets_min": 2252 }, { "epoch": 2.7323026851098455, "grad_norm": 0.5162691594592334, "learning_rate": 3.060235847875387e-05, "loss": 0.3052, "loss_nan_ranks": 0, "loss_rank_avg": 0.1796841025352478, "step": 1680, "valid_targets_mean": 6276.2, "valid_targets_min": 521 }, { "epoch": 2.7404393816110657, "grad_norm": 0.48029341615912935, "learning_rate": 3.05335097263644e-05, "loss": 0.2659, "loss_nan_ranks": 0, "loss_rank_avg": 0.125966876745224, "step": 1685, "valid_targets_mean": 5720.2, "valid_targets_min": 1338 }, { "epoch": 2.7485760781122863, "grad_norm": 0.4803595848509251, "learning_rate": 3.0464487795852463e-05, "loss": 0.2674, "loss_nan_ranks": 0, "loss_rank_avg": 0.09926225244998932, "step": 1690, "valid_targets_mean": 5128.4, "valid_targets_min": 1470 }, { "epoch": 2.756712774613507, "grad_norm": 0.5106278700225423, "learning_rate": 3.0395293821985906e-05, "loss": 0.2894, "loss_nan_ranks": 0, "loss_rank_avg": 0.12691687047481537, "step": 1695, "valid_targets_mean": 4647.5, "valid_targets_min": 1087 }, { "epoch": 2.7648494711147276, "grad_norm": 0.61727008379644, "learning_rate": 3.032592894236112e-05, "loss": 0.319, "loss_nan_ranks": 0, "loss_rank_avg": 0.1375855952501297, "step": 1700, "valid_targets_mean": 4063.8, "valid_targets_min": 1345 }, { "epoch": 2.772986167615948, "grad_norm": 0.5220802075309688, "learning_rate": 3.0256394297384273e-05, "loss": 0.256, "loss_nan_ranks": 0, "loss_rank_avg": 0.1398482620716095, "step": 1705, "valid_targets_mean": 5660.1, "valid_targets_min": 3984 }, { "epoch": 2.7811228641171684, "grad_norm": 0.5238354995617224, "learning_rate": 3.0186691030252614e-05, "loss": 0.2855, "loss_nan_ranks": 0, "loss_rank_avg": 0.132085919380188, "step": 1710, "valid_targets_mean": 5220.8, "valid_targets_min": 801 }, { "epoch": 2.789259560618389, "grad_norm": 0.499241003810301, "learning_rate": 3.0116820286935654e-05, "loss": 0.2921, "loss_nan_ranks": 0, "loss_rank_avg": 0.177951842546463, "step": 1715, "valid_targets_mean": 5724.1, "valid_targets_min": 2484 }, { "epoch": 2.7973962571196096, "grad_norm": 0.575750437435253, "learning_rate": 3.0046783216156315e-05, "loss": 0.29, "loss_nan_ranks": 0, "loss_rank_avg": 0.12942825257778168, "step": 1720, "valid_targets_mean": 4648.0, "valid_targets_min": 2633 }, { "epoch": 2.8055329536208298, "grad_norm": 0.5045556071219864, "learning_rate": 2.997658096937207e-05, "loss": 0.2791, "loss_nan_ranks": 0, "loss_rank_avg": 0.12483763694763184, "step": 1725, "valid_targets_mean": 5357.9, "valid_targets_min": 895 }, { "epoch": 2.8136696501220504, "grad_norm": 0.684348188778152, "learning_rate": 2.990621470075598e-05, "loss": 0.2684, "loss_nan_ranks": 0, "loss_rank_avg": 0.1319955587387085, "step": 1730, "valid_targets_mean": 5457.0, "valid_targets_min": 1374 }, { "epoch": 2.821806346623271, "grad_norm": 0.5671325911785545, "learning_rate": 2.9835685567177763e-05, "loss": 0.2708, "loss_nan_ranks": 0, "loss_rank_avg": 0.1548902690410614, "step": 1735, "valid_targets_mean": 5260.6, "valid_targets_min": 956 }, { "epoch": 2.8299430431244916, "grad_norm": 0.4629636978551261, "learning_rate": 2.9764994728184725e-05, "loss": 0.2788, "loss_nan_ranks": 0, "loss_rank_avg": 0.15818393230438232, "step": 1740, "valid_targets_mean": 6452.5, "valid_targets_min": 3759 }, { "epoch": 2.838079739625712, "grad_norm": 0.5953069122381895, "learning_rate": 2.9694143345982732e-05, "loss": 0.3008, "loss_nan_ranks": 0, "loss_rank_avg": 0.17098405957221985, "step": 1745, "valid_targets_mean": 5593.5, "valid_targets_min": 372 }, { "epoch": 2.8462164361269324, "grad_norm": 0.45172986591859304, "learning_rate": 2.9623132585417096e-05, "loss": 0.2713, "loss_nan_ranks": 0, "loss_rank_avg": 0.13527032732963562, "step": 1750, "valid_targets_mean": 6704.2, "valid_targets_min": 1353 }, { "epoch": 2.854353132628153, "grad_norm": 0.4975648396200817, "learning_rate": 2.9551963613953404e-05, "loss": 0.2949, "loss_nan_ranks": 0, "loss_rank_avg": 0.12178505957126617, "step": 1755, "valid_targets_mean": 6038.4, "valid_targets_min": 4521 }, { "epoch": 2.862489829129373, "grad_norm": 0.5414519194121625, "learning_rate": 2.948063760165835e-05, "loss": 0.2837, "loss_nan_ranks": 0, "loss_rank_avg": 0.12081147730350494, "step": 1760, "valid_targets_mean": 4120.1, "valid_targets_min": 537 }, { "epoch": 2.870626525630594, "grad_norm": 0.4366067141691184, "learning_rate": 2.9409155721180477e-05, "loss": 0.27, "loss_nan_ranks": 0, "loss_rank_avg": 0.1350255012512207, "step": 1765, "valid_targets_mean": 6225.4, "valid_targets_min": 3036 }, { "epoch": 2.8787632221318145, "grad_norm": 0.5500766155760595, "learning_rate": 2.9337519147730918e-05, "loss": 0.2847, "loss_nan_ranks": 0, "loss_rank_avg": 0.10548760741949081, "step": 1770, "valid_targets_mean": 4567.8, "valid_targets_min": 1523 }, { "epoch": 2.886899918633035, "grad_norm": 0.4435904826881841, "learning_rate": 2.9265729059064054e-05, "loss": 0.2812, "loss_nan_ranks": 0, "loss_rank_avg": 0.13118746876716614, "step": 1775, "valid_targets_mean": 6306.4, "valid_targets_min": 3141 }, { "epoch": 2.8950366151342557, "grad_norm": 0.7587627287786612, "learning_rate": 2.9193786635458178e-05, "loss": 0.2841, "loss_nan_ranks": 0, "loss_rank_avg": 0.18454968929290771, "step": 1780, "valid_targets_mean": 5579.1, "valid_targets_min": 1106 }, { "epoch": 2.903173311635476, "grad_norm": 0.4897525087855841, "learning_rate": 2.912169305969605e-05, "loss": 0.2812, "loss_nan_ranks": 0, "loss_rank_avg": 0.13022705912590027, "step": 1785, "valid_targets_mean": 6038.9, "valid_targets_min": 3288 }, { "epoch": 2.9113100081366965, "grad_norm": 0.3896829782222166, "learning_rate": 2.9049449517045497e-05, "loss": 0.2604, "loss_nan_ranks": 0, "loss_rank_avg": 0.11002755165100098, "step": 1790, "valid_targets_mean": 6118.0, "valid_targets_min": 2338 }, { "epoch": 2.919446704637917, "grad_norm": 0.3784633224945294, "learning_rate": 2.89770571952399e-05, "loss": 0.2515, "loss_nan_ranks": 0, "loss_rank_avg": 0.11330070346593857, "step": 1795, "valid_targets_mean": 8400.2, "valid_targets_min": 4155 }, { "epoch": 2.9275834011391373, "grad_norm": 0.49491264882028485, "learning_rate": 2.890451728445866e-05, "loss": 0.293, "loss_nan_ranks": 0, "loss_rank_avg": 0.18684348464012146, "step": 1800, "valid_targets_mean": 6696.6, "valid_targets_min": 3861 }, { "epoch": 2.935720097640358, "grad_norm": 0.47181247576364993, "learning_rate": 2.8831830977307644e-05, "loss": 0.2784, "loss_nan_ranks": 0, "loss_rank_avg": 0.16414770483970642, "step": 1805, "valid_targets_mean": 6644.9, "valid_targets_min": 1462 }, { "epoch": 2.9438567941415785, "grad_norm": 0.5155396891551823, "learning_rate": 2.8758999468799594e-05, "loss": 0.2881, "loss_nan_ranks": 0, "loss_rank_avg": 0.15796388685703278, "step": 1810, "valid_targets_mean": 4846.5, "valid_targets_min": 1632 }, { "epoch": 2.951993490642799, "grad_norm": 0.4514689977307621, "learning_rate": 2.868602395633444e-05, "loss": 0.2855, "loss_nan_ranks": 0, "loss_rank_avg": 0.19608153402805328, "step": 1815, "valid_targets_mean": 7106.8, "valid_targets_min": 3883 }, { "epoch": 2.9601301871440198, "grad_norm": 0.5846021256028041, "learning_rate": 2.861290563967965e-05, "loss": 0.315, "loss_nan_ranks": 0, "loss_rank_avg": 0.0958099514245987, "step": 1820, "valid_targets_mean": 2989.9, "valid_targets_min": 1378 }, { "epoch": 2.96826688364524, "grad_norm": 0.4539261325479636, "learning_rate": 2.8539645720950474e-05, "loss": 0.2935, "loss_nan_ranks": 0, "loss_rank_avg": 0.15887710452079773, "step": 1825, "valid_targets_mean": 5430.4, "valid_targets_min": 2053 }, { "epoch": 2.9764035801464606, "grad_norm": 0.5167204311608852, "learning_rate": 2.8466245404590226e-05, "loss": 0.3094, "loss_nan_ranks": 0, "loss_rank_avg": 0.17045152187347412, "step": 1830, "valid_targets_mean": 6415.8, "valid_targets_min": 2274 }, { "epoch": 2.984540276647681, "grad_norm": 0.4910802890132026, "learning_rate": 2.8392705897350425e-05, "loss": 0.2902, "loss_nan_ranks": 0, "loss_rank_avg": 0.15125080943107605, "step": 1835, "valid_targets_mean": 5811.2, "valid_targets_min": 2158 }, { "epoch": 2.9926769731489014, "grad_norm": 0.46505504808407744, "learning_rate": 2.8319028408270983e-05, "loss": 0.2751, "loss_nan_ranks": 0, "loss_rank_avg": 0.15869152545928955, "step": 1840, "valid_targets_mean": 7832.1, "valid_targets_min": 3792 }, { "epoch": 3.0, "grad_norm": 0.7018093322068503, "learning_rate": 2.8245214148660364e-05, "loss": 0.3069, "loss_nan_ranks": 0, "loss_rank_avg": 0.32103702425956726, "step": 1845, "valid_targets_mean": 5602.2, "valid_targets_min": 2942 }, { "epoch": 3.0081366965012206, "grad_norm": 0.557545342235143, "learning_rate": 2.8171264332075588e-05, "loss": 0.256, "loss_nan_ranks": 0, "loss_rank_avg": 0.12069088220596313, "step": 1850, "valid_targets_mean": 4822.1, "valid_targets_min": 3071 }, { "epoch": 3.016273393002441, "grad_norm": 0.5055444788767136, "learning_rate": 2.809718017430236e-05, "loss": 0.246, "loss_nan_ranks": 0, "loss_rank_avg": 0.1308608502149582, "step": 1855, "valid_targets_mean": 5950.2, "valid_targets_min": 2493 }, { "epoch": 3.0244100895036614, "grad_norm": 0.564974769389222, "learning_rate": 2.8022962893335023e-05, "loss": 0.2619, "loss_nan_ranks": 0, "loss_rank_avg": 0.13714183866977692, "step": 1860, "valid_targets_mean": 4790.5, "valid_targets_min": 1710 }, { "epoch": 3.032546786004882, "grad_norm": 0.5368918165884716, "learning_rate": 2.7948613709356565e-05, "loss": 0.2881, "loss_nan_ranks": 0, "loss_rank_avg": 0.11848818510770798, "step": 1865, "valid_targets_mean": 5709.6, "valid_targets_min": 1869 }, { "epoch": 3.0406834825061027, "grad_norm": 0.6202460762235937, "learning_rate": 2.7874133844718557e-05, "loss": 0.2756, "loss_nan_ranks": 0, "loss_rank_avg": 0.15099003911018372, "step": 1870, "valid_targets_mean": 5946.1, "valid_targets_min": 3788 }, { "epoch": 3.048820179007323, "grad_norm": 0.47945587720363, "learning_rate": 2.7799524523921038e-05, "loss": 0.2634, "loss_nan_ranks": 0, "loss_rank_avg": 0.14982934296131134, "step": 1875, "valid_targets_mean": 4646.1, "valid_targets_min": 1010 }, { "epoch": 3.0569568755085434, "grad_norm": 0.5981553209252303, "learning_rate": 2.77247869735924e-05, "loss": 0.2785, "loss_nan_ranks": 0, "loss_rank_avg": 0.13525862991809845, "step": 1880, "valid_targets_mean": 5607.5, "valid_targets_min": 3276 }, { "epoch": 3.065093572009764, "grad_norm": 0.5197959262649877, "learning_rate": 2.764992242246921e-05, "loss": 0.2799, "loss_nan_ranks": 0, "loss_rank_avg": 0.12702880799770355, "step": 1885, "valid_targets_mean": 5396.0, "valid_targets_min": 2859 }, { "epoch": 3.0732302685109847, "grad_norm": 0.4896279271559394, "learning_rate": 2.7574932101376034e-05, "loss": 0.2628, "loss_nan_ranks": 0, "loss_rank_avg": 0.10663357377052307, "step": 1890, "valid_targets_mean": 5472.4, "valid_targets_min": 2781 }, { "epoch": 3.081366965012205, "grad_norm": 0.6197885493966871, "learning_rate": 2.749981724320516e-05, "loss": 0.2829, "loss_nan_ranks": 0, "loss_rank_avg": 0.14642459154129028, "step": 1895, "valid_targets_mean": 4172.6, "valid_targets_min": 867 }, { "epoch": 3.0895036615134255, "grad_norm": 0.4909453144584929, "learning_rate": 2.7424579082896357e-05, "loss": 0.2836, "loss_nan_ranks": 0, "loss_rank_avg": 0.1485298126935959, "step": 1900, "valid_targets_mean": 5413.5, "valid_targets_min": 2571 }, { "epoch": 3.097640358014646, "grad_norm": 0.4913841836660842, "learning_rate": 2.7349218857416587e-05, "loss": 0.2716, "loss_nan_ranks": 0, "loss_rank_avg": 0.16140612959861755, "step": 1905, "valid_targets_mean": 6672.6, "valid_targets_min": 1381 }, { "epoch": 3.1057770545158667, "grad_norm": 0.5286751495746139, "learning_rate": 2.7273737805739614e-05, "loss": 0.2696, "loss_nan_ranks": 0, "loss_rank_avg": 0.09970603883266449, "step": 1910, "valid_targets_mean": 4983.8, "valid_targets_min": 926 }, { "epoch": 3.113913751017087, "grad_norm": 0.4922716591309361, "learning_rate": 2.719813716882569e-05, "loss": 0.2483, "loss_nan_ranks": 0, "loss_rank_avg": 0.1322004795074463, "step": 1915, "valid_targets_mean": 7345.9, "valid_targets_min": 4037 }, { "epoch": 3.1220504475183075, "grad_norm": 0.4932161067767006, "learning_rate": 2.7122418189601118e-05, "loss": 0.2599, "loss_nan_ranks": 0, "loss_rank_avg": 0.12052470445632935, "step": 1920, "valid_targets_mean": 5224.1, "valid_targets_min": 3445 }, { "epoch": 3.130187144019528, "grad_norm": 0.49943776929619677, "learning_rate": 2.7046582112937837e-05, "loss": 0.2513, "loss_nan_ranks": 0, "loss_rank_avg": 0.13334211707115173, "step": 1925, "valid_targets_mean": 7433.6, "valid_targets_min": 1974 }, { "epoch": 3.1383238405207488, "grad_norm": 0.44357138068663077, "learning_rate": 2.697063018563295e-05, "loss": 0.2647, "loss_nan_ranks": 0, "loss_rank_avg": 0.11824844032526016, "step": 1930, "valid_targets_mean": 6402.1, "valid_targets_min": 3582 }, { "epoch": 3.146460537021969, "grad_norm": 0.6216470540080042, "learning_rate": 2.6894563656388217e-05, "loss": 0.2757, "loss_nan_ranks": 0, "loss_rank_avg": 0.16654358804225922, "step": 1935, "valid_targets_mean": 4445.5, "valid_targets_min": 652 }, { "epoch": 3.1545972335231895, "grad_norm": 0.5203431916047961, "learning_rate": 2.681838377578954e-05, "loss": 0.2685, "loss_nan_ranks": 0, "loss_rank_avg": 0.13338005542755127, "step": 1940, "valid_targets_mean": 6740.8, "valid_targets_min": 3477 }, { "epoch": 3.16273393002441, "grad_norm": 0.548730057587269, "learning_rate": 2.6742091796286388e-05, "loss": 0.2799, "loss_nan_ranks": 0, "loss_rank_avg": 0.14711609482765198, "step": 1945, "valid_targets_mean": 5364.9, "valid_targets_min": 1328 }, { "epoch": 3.170870626525631, "grad_norm": 0.5303267033016945, "learning_rate": 2.6665688972171215e-05, "loss": 0.2777, "loss_nan_ranks": 0, "loss_rank_avg": 0.1701548993587494, "step": 1950, "valid_targets_mean": 5727.0, "valid_targets_min": 4151 }, { "epoch": 3.179007323026851, "grad_norm": 0.5676758975951339, "learning_rate": 2.658917655955884e-05, "loss": 0.2623, "loss_nan_ranks": 0, "loss_rank_avg": 0.15539327263832092, "step": 1955, "valid_targets_mean": 4853.1, "valid_targets_min": 2899 }, { "epoch": 3.1871440195280716, "grad_norm": 0.4484115372218612, "learning_rate": 2.651255581636578e-05, "loss": 0.2759, "loss_nan_ranks": 0, "loss_rank_avg": 0.16180385649204254, "step": 1960, "valid_targets_mean": 7725.1, "valid_targets_min": 4420 }, { "epoch": 3.195280716029292, "grad_norm": 0.5105638327238713, "learning_rate": 2.6435828002289596e-05, "loss": 0.2798, "loss_nan_ranks": 0, "loss_rank_avg": 0.12511882185935974, "step": 1965, "valid_targets_mean": 5482.6, "valid_targets_min": 2480 }, { "epoch": 3.203417412530513, "grad_norm": 0.45443106401153505, "learning_rate": 2.6358994378788163e-05, "loss": 0.2499, "loss_nan_ranks": 0, "loss_rank_avg": 0.1377660185098648, "step": 1970, "valid_targets_mean": 6621.2, "valid_targets_min": 3045 }, { "epoch": 3.211554109031733, "grad_norm": 0.5569701717755269, "learning_rate": 2.6282056209058936e-05, "loss": 0.2908, "loss_nan_ranks": 0, "loss_rank_avg": 0.12813882529735565, "step": 1975, "valid_targets_mean": 4760.6, "valid_targets_min": 1870 }, { "epoch": 3.2196908055329536, "grad_norm": 0.5403643934008627, "learning_rate": 2.6205014758018176e-05, "loss": 0.2731, "loss_nan_ranks": 0, "loss_rank_avg": 0.126073956489563, "step": 1980, "valid_targets_mean": 5044.4, "valid_targets_min": 3035 }, { "epoch": 3.2278275020341742, "grad_norm": 0.4746581189512608, "learning_rate": 2.6127871292280165e-05, "loss": 0.2654, "loss_nan_ranks": 0, "loss_rank_avg": 0.11351381242275238, "step": 1985, "valid_targets_mean": 6290.9, "valid_targets_min": 1744 }, { "epoch": 3.2359641985353944, "grad_norm": 0.5001109013797744, "learning_rate": 2.6050627080136376e-05, "loss": 0.2457, "loss_nan_ranks": 0, "loss_rank_avg": 0.1430266797542572, "step": 1990, "valid_targets_mean": 4843.6, "valid_targets_min": 2324 }, { "epoch": 3.244100895036615, "grad_norm": 0.4495739039013548, "learning_rate": 2.5973283391534615e-05, "loss": 0.2627, "loss_nan_ranks": 0, "loss_rank_avg": 0.09228505194187164, "step": 1995, "valid_targets_mean": 4507.0, "valid_targets_min": 2149 }, { "epoch": 3.2522375915378356, "grad_norm": 0.48980120047593206, "learning_rate": 2.589584149805817e-05, "loss": 0.2619, "loss_nan_ranks": 0, "loss_rank_avg": 0.13319309055805206, "step": 2000, "valid_targets_mean": 7194.9, "valid_targets_min": 977 }, { "epoch": 3.2603742880390563, "grad_norm": 0.4812607915960625, "learning_rate": 2.581830267290486e-05, "loss": 0.2546, "loss_nan_ranks": 0, "loss_rank_avg": 0.1082778349518776, "step": 2005, "valid_targets_mean": 6961.8, "valid_targets_min": 3516 }, { "epoch": 3.268510984540277, "grad_norm": 0.570112545383423, "learning_rate": 2.574066819086613e-05, "loss": 0.2555, "loss_nan_ranks": 0, "loss_rank_avg": 0.134844571352005, "step": 2010, "valid_targets_mean": 4588.6, "valid_targets_min": 1036 }, { "epoch": 3.276647681041497, "grad_norm": 0.4362815156888107, "learning_rate": 2.5662939328306113e-05, "loss": 0.2709, "loss_nan_ranks": 0, "loss_rank_avg": 0.16294899582862854, "step": 2015, "valid_targets_mean": 8057.6, "valid_targets_min": 2510 }, { "epoch": 3.2847843775427177, "grad_norm": 0.4089077124565424, "learning_rate": 2.5585117363140592e-05, "loss": 0.2671, "loss_nan_ranks": 0, "loss_rank_avg": 0.12175396829843521, "step": 2020, "valid_targets_mean": 6774.1, "valid_targets_min": 3456 }, { "epoch": 3.2929210740439383, "grad_norm": 0.502187014362583, "learning_rate": 2.5507203574816043e-05, "loss": 0.2777, "loss_nan_ranks": 0, "loss_rank_avg": 0.16614243388175964, "step": 2025, "valid_targets_mean": 6135.8, "valid_targets_min": 2329 }, { "epoch": 3.3010577705451585, "grad_norm": 0.4730402208775795, "learning_rate": 2.542919924428856e-05, "loss": 0.2754, "loss_nan_ranks": 0, "loss_rank_avg": 0.16762784123420715, "step": 2030, "valid_targets_mean": 5869.8, "valid_targets_min": 1504 }, { "epoch": 3.309194467046379, "grad_norm": 0.5339111572346003, "learning_rate": 2.5351105654002838e-05, "loss": 0.2747, "loss_nan_ranks": 0, "loss_rank_avg": 0.1370839774608612, "step": 2035, "valid_targets_mean": 5234.9, "valid_targets_min": 2162 }, { "epoch": 3.3173311635475997, "grad_norm": 0.6413302863152066, "learning_rate": 2.527292408787104e-05, "loss": 0.2634, "loss_nan_ranks": 0, "loss_rank_avg": 0.16920380294322968, "step": 2040, "valid_targets_mean": 4609.8, "valid_targets_min": 1040 }, { "epoch": 3.3254678600488203, "grad_norm": 0.470230236442957, "learning_rate": 2.5194655831251712e-05, "loss": 0.2456, "loss_nan_ranks": 0, "loss_rank_avg": 0.12207140028476715, "step": 2045, "valid_targets_mean": 5943.4, "valid_targets_min": 2111 }, { "epoch": 3.3336045565500405, "grad_norm": 0.48456012812970206, "learning_rate": 2.5116302170928678e-05, "loss": 0.251, "loss_nan_ranks": 0, "loss_rank_avg": 0.11639226973056793, "step": 2050, "valid_targets_mean": 5307.0, "valid_targets_min": 784 }, { "epoch": 3.341741253051261, "grad_norm": 0.5523702500052676, "learning_rate": 2.5037864395089822e-05, "loss": 0.2893, "loss_nan_ranks": 0, "loss_rank_avg": 0.106050044298172, "step": 2055, "valid_targets_mean": 4106.2, "valid_targets_min": 1187 }, { "epoch": 3.3498779495524817, "grad_norm": 0.6268239379014566, "learning_rate": 2.495934379330597e-05, "loss": 0.2669, "loss_nan_ranks": 0, "loss_rank_avg": 0.13571971654891968, "step": 2060, "valid_targets_mean": 4496.1, "valid_targets_min": 1237 }, { "epoch": 3.3580146460537024, "grad_norm": 0.5211118227275444, "learning_rate": 2.4880741656509656e-05, "loss": 0.2577, "loss_nan_ranks": 0, "loss_rank_avg": 0.18967539072036743, "step": 2065, "valid_targets_mean": 5973.8, "valid_targets_min": 2874 }, { "epoch": 3.3661513425549225, "grad_norm": 0.4867184690553686, "learning_rate": 2.4802059276973904e-05, "loss": 0.2744, "loss_nan_ranks": 0, "loss_rank_avg": 0.08832257986068726, "step": 2070, "valid_targets_mean": 6020.0, "valid_targets_min": 2571 }, { "epoch": 3.374288039056143, "grad_norm": 0.40231974560194717, "learning_rate": 2.4723297948290982e-05, "loss": 0.2559, "loss_nan_ranks": 0, "loss_rank_avg": 0.13233518600463867, "step": 2075, "valid_targets_mean": 9070.0, "valid_targets_min": 3459 }, { "epoch": 3.382424735557364, "grad_norm": 0.5154449145165141, "learning_rate": 2.464445896535113e-05, "loss": 0.2836, "loss_nan_ranks": 0, "loss_rank_avg": 0.1818242222070694, "step": 2080, "valid_targets_mean": 6717.2, "valid_targets_min": 4298 }, { "epoch": 3.3905614320585844, "grad_norm": 0.5379336133652549, "learning_rate": 2.45655436243213e-05, "loss": 0.2693, "loss_nan_ranks": 0, "loss_rank_avg": 0.12027017772197723, "step": 2085, "valid_targets_mean": 5752.2, "valid_targets_min": 3219 }, { "epoch": 3.3986981285598046, "grad_norm": 0.4175221191336141, "learning_rate": 2.44865532226238e-05, "loss": 0.2774, "loss_nan_ranks": 0, "loss_rank_avg": 0.1881314218044281, "step": 2090, "valid_targets_mean": 8001.6, "valid_targets_min": 2705 }, { "epoch": 3.406834825061025, "grad_norm": 0.5961468554541282, "learning_rate": 2.4407489058915004e-05, "loss": 0.2874, "loss_nan_ranks": 0, "loss_rank_avg": 0.1391357183456421, "step": 2095, "valid_targets_mean": 4966.1, "valid_targets_min": 3157 }, { "epoch": 3.414971521562246, "grad_norm": 0.4943897075326212, "learning_rate": 2.4328352433063966e-05, "loss": 0.2752, "loss_nan_ranks": 0, "loss_rank_avg": 0.14456993341445923, "step": 2100, "valid_targets_mean": 7371.6, "valid_targets_min": 4929 }, { "epoch": 3.423108218063466, "grad_norm": 0.4798546004908442, "learning_rate": 2.4249144646131083e-05, "loss": 0.2545, "loss_nan_ranks": 0, "loss_rank_avg": 0.12103509902954102, "step": 2105, "valid_targets_mean": 5275.5, "valid_targets_min": 2062 }, { "epoch": 3.4312449145646866, "grad_norm": 0.6024466670234377, "learning_rate": 2.4169867000346684e-05, "loss": 0.2631, "loss_nan_ranks": 0, "loss_rank_avg": 0.1351066529750824, "step": 2110, "valid_targets_mean": 4428.4, "valid_targets_min": 1064 }, { "epoch": 3.4393816110659072, "grad_norm": 0.5447078874142987, "learning_rate": 2.4090520799089612e-05, "loss": 0.2866, "loss_nan_ranks": 0, "loss_rank_avg": 0.157949760556221, "step": 2115, "valid_targets_mean": 5712.9, "valid_targets_min": 2100 }, { "epoch": 3.447518307567128, "grad_norm": 0.5293454552675316, "learning_rate": 2.4011107346865844e-05, "loss": 0.2892, "loss_nan_ranks": 0, "loss_rank_avg": 0.19082076847553253, "step": 2120, "valid_targets_mean": 6204.5, "valid_targets_min": 3697 }, { "epoch": 3.4556550040683485, "grad_norm": 0.496357535543296, "learning_rate": 2.393162794928697e-05, "loss": 0.2499, "loss_nan_ranks": 0, "loss_rank_avg": 0.1595294177532196, "step": 2125, "valid_targets_mean": 7122.4, "valid_targets_min": 2914 }, { "epoch": 3.4637917005695686, "grad_norm": 0.5390530304141364, "learning_rate": 2.385208391304879e-05, "loss": 0.2581, "loss_nan_ranks": 0, "loss_rank_avg": 0.13380271196365356, "step": 2130, "valid_targets_mean": 5964.4, "valid_targets_min": 4317 }, { "epoch": 3.4719283970707893, "grad_norm": 0.48671301947421164, "learning_rate": 2.3772476545909794e-05, "loss": 0.2717, "loss_nan_ranks": 0, "loss_rank_avg": 0.0984102338552475, "step": 2135, "valid_targets_mean": 5276.6, "valid_targets_min": 2773 }, { "epoch": 3.48006509357201, "grad_norm": 0.5168171595907421, "learning_rate": 2.3692807156669684e-05, "loss": 0.2883, "loss_nan_ranks": 0, "loss_rank_avg": 0.10761836171150208, "step": 2140, "valid_targets_mean": 5127.4, "valid_targets_min": 1005 }, { "epoch": 3.48820179007323, "grad_norm": 0.45917243865127705, "learning_rate": 2.3613077055147855e-05, "loss": 0.2871, "loss_nan_ranks": 0, "loss_rank_avg": 0.11678306758403778, "step": 2145, "valid_targets_mean": 6023.4, "valid_targets_min": 1403 }, { "epoch": 3.4963384865744507, "grad_norm": 1.0802408916637594, "learning_rate": 2.3533287552161833e-05, "loss": 0.2818, "loss_nan_ranks": 0, "loss_rank_avg": 0.12424206733703613, "step": 2150, "valid_targets_mean": 4101.6, "valid_targets_min": 1208 }, { "epoch": 3.5044751830756713, "grad_norm": 0.9725147310489535, "learning_rate": 2.345343995950577e-05, "loss": 0.2819, "loss_nan_ranks": 0, "loss_rank_avg": 0.11299556493759155, "step": 2155, "valid_targets_mean": 5489.8, "valid_targets_min": 2994 }, { "epoch": 3.512611879576892, "grad_norm": 0.5277612614291434, "learning_rate": 2.3373535589928827e-05, "loss": 0.2793, "loss_nan_ranks": 0, "loss_rank_avg": 0.14234156906604767, "step": 2160, "valid_targets_mean": 5168.0, "valid_targets_min": 1637 }, { "epoch": 3.5207485760781125, "grad_norm": 0.4577806901348409, "learning_rate": 2.3293575757113635e-05, "loss": 0.2645, "loss_nan_ranks": 0, "loss_rank_avg": 0.11869750916957855, "step": 2165, "valid_targets_mean": 5705.0, "valid_targets_min": 3465 }, { "epoch": 3.5288852725793327, "grad_norm": 0.48813053590763633, "learning_rate": 2.3213561775654678e-05, "loss": 0.2769, "loss_nan_ranks": 0, "loss_rank_avg": 0.13192936778068542, "step": 2170, "valid_targets_mean": 5435.0, "valid_targets_min": 2039 }, { "epoch": 3.5370219690805533, "grad_norm": 0.5417864760687305, "learning_rate": 2.3133494961036655e-05, "loss": 0.2679, "loss_nan_ranks": 0, "loss_rank_avg": 0.14656861126422882, "step": 2175, "valid_targets_mean": 4186.5, "valid_targets_min": 3036 }, { "epoch": 3.545158665581774, "grad_norm": 0.5079700581274689, "learning_rate": 2.305337662961292e-05, "loss": 0.2951, "loss_nan_ranks": 0, "loss_rank_avg": 0.15438416600227356, "step": 2180, "valid_targets_mean": 5634.9, "valid_targets_min": 1514 }, { "epoch": 3.553295362082994, "grad_norm": 0.4302507514212832, "learning_rate": 2.2973208098583767e-05, "loss": 0.2528, "loss_nan_ranks": 0, "loss_rank_avg": 0.1305883228778839, "step": 2185, "valid_targets_mean": 7573.4, "valid_targets_min": 3714 }, { "epoch": 3.5614320585842147, "grad_norm": 0.4784814526634792, "learning_rate": 2.2892990685974815e-05, "loss": 0.2319, "loss_nan_ranks": 0, "loss_rank_avg": 0.13934920728206635, "step": 2190, "valid_targets_mean": 6661.2, "valid_targets_min": 2725 }, { "epoch": 3.5695687550854354, "grad_norm": 0.5218194964987156, "learning_rate": 2.2812725710615328e-05, "loss": 0.2586, "loss_nan_ranks": 0, "loss_rank_avg": 0.1036933958530426, "step": 2195, "valid_targets_mean": 4396.5, "valid_targets_min": 530 }, { "epoch": 3.577705451586656, "grad_norm": 0.3915528153922062, "learning_rate": 2.2732414492116538e-05, "loss": 0.2549, "loss_nan_ranks": 0, "loss_rank_avg": 0.11413315683603287, "step": 2200, "valid_targets_mean": 7739.1, "valid_targets_min": 988 }, { "epoch": 3.585842148087876, "grad_norm": 0.5474376964212345, "learning_rate": 2.2652058350849955e-05, "loss": 0.2694, "loss_nan_ranks": 0, "loss_rank_avg": 0.12832045555114746, "step": 2205, "valid_targets_mean": 4460.6, "valid_targets_min": 844 }, { "epoch": 3.5939788445890968, "grad_norm": 0.4513603679012204, "learning_rate": 2.2571658607925624e-05, "loss": 0.2594, "loss_nan_ranks": 0, "loss_rank_avg": 0.11507508158683777, "step": 2210, "valid_targets_mean": 6023.5, "valid_targets_min": 2711 }, { "epoch": 3.6021155410903174, "grad_norm": 0.4358199903498031, "learning_rate": 2.2491216585170458e-05, "loss": 0.2594, "loss_nan_ranks": 0, "loss_rank_avg": 0.08925238251686096, "step": 2215, "valid_targets_mean": 5539.4, "valid_targets_min": 841 }, { "epoch": 3.6102522375915376, "grad_norm": 0.5033142192460704, "learning_rate": 2.2410733605106462e-05, "loss": 0.2567, "loss_nan_ranks": 0, "loss_rank_avg": 0.07945795357227325, "step": 2220, "valid_targets_mean": 4576.6, "valid_targets_min": 1937 }, { "epoch": 3.618388934092758, "grad_norm": 0.5295724882881188, "learning_rate": 2.233021099092902e-05, "loss": 0.2528, "loss_nan_ranks": 0, "loss_rank_avg": 0.1273106187582016, "step": 2225, "valid_targets_mean": 5181.6, "valid_targets_min": 3580 }, { "epoch": 3.626525630593979, "grad_norm": 0.49909534425266827, "learning_rate": 2.224965006648512e-05, "loss": 0.2615, "loss_nan_ranks": 0, "loss_rank_avg": 0.11837124824523926, "step": 2230, "valid_targets_mean": 6526.1, "valid_targets_min": 956 }, { "epoch": 3.6346623270951994, "grad_norm": 0.48550502453666, "learning_rate": 2.2169052156251585e-05, "loss": 0.3001, "loss_nan_ranks": 0, "loss_rank_avg": 0.13036608695983887, "step": 2235, "valid_targets_mean": 5403.1, "valid_targets_min": 1572 }, { "epoch": 3.64279902359642, "grad_norm": 0.6877569373231779, "learning_rate": 2.2088418585313346e-05, "loss": 0.2613, "loss_nan_ranks": 0, "loss_rank_avg": 0.15400430560112, "step": 2240, "valid_targets_mean": 4920.0, "valid_targets_min": 1879 }, { "epoch": 3.6509357200976402, "grad_norm": 0.5449931803254913, "learning_rate": 2.200775067934158e-05, "loss": 0.2866, "loss_nan_ranks": 0, "loss_rank_avg": 0.11476185917854309, "step": 2245, "valid_targets_mean": 4997.9, "valid_targets_min": 1732 }, { "epoch": 3.659072416598861, "grad_norm": 0.4525544723604396, "learning_rate": 2.192704976457198e-05, "loss": 0.2555, "loss_nan_ranks": 0, "loss_rank_avg": 0.1380799114704132, "step": 2250, "valid_targets_mean": 6882.5, "valid_targets_min": 4428 }, { "epoch": 3.6672091131000815, "grad_norm": 0.5174034196077824, "learning_rate": 2.1846317167782923e-05, "loss": 0.2481, "loss_nan_ranks": 0, "loss_rank_avg": 0.152031809091568, "step": 2255, "valid_targets_mean": 5447.2, "valid_targets_min": 2463 }, { "epoch": 3.6753458096013016, "grad_norm": 0.44137473000448374, "learning_rate": 2.1765554216273652e-05, "loss": 0.268, "loss_nan_ranks": 0, "loss_rank_avg": 0.1166839748620987, "step": 2260, "valid_targets_mean": 6610.4, "valid_targets_min": 3051 }, { "epoch": 3.6834825061025223, "grad_norm": 0.5023783889425373, "learning_rate": 2.1684762237842466e-05, "loss": 0.2741, "loss_nan_ranks": 0, "loss_rank_avg": 0.20356138050556183, "step": 2265, "valid_targets_mean": 6716.1, "valid_targets_min": 2851 }, { "epoch": 3.691619202603743, "grad_norm": 0.5649370975103999, "learning_rate": 2.1603942560764884e-05, "loss": 0.2678, "loss_nan_ranks": 0, "loss_rank_avg": 0.14867046475410461, "step": 2270, "valid_targets_mean": 4637.0, "valid_targets_min": 1356 }, { "epoch": 3.6997558991049635, "grad_norm": 0.43128962161492657, "learning_rate": 2.1523096513771825e-05, "loss": 0.245, "loss_nan_ranks": 0, "loss_rank_avg": 0.11670452356338501, "step": 2275, "valid_targets_mean": 6769.8, "valid_targets_min": 3135 }, { "epoch": 3.707892595606184, "grad_norm": 0.6107884039191125, "learning_rate": 2.1442225426027724e-05, "loss": 0.2688, "loss_nan_ranks": 0, "loss_rank_avg": 0.1622416079044342, "step": 2280, "valid_targets_mean": 4730.1, "valid_targets_min": 2457 }, { "epoch": 3.7160292921074043, "grad_norm": 0.42009628659466286, "learning_rate": 2.1361330627108724e-05, "loss": 0.2786, "loss_nan_ranks": 0, "loss_rank_avg": 0.14188794791698456, "step": 2285, "valid_targets_mean": 8693.0, "valid_targets_min": 3303 }, { "epoch": 3.724165988608625, "grad_norm": 0.4593106062963763, "learning_rate": 2.128041344698078e-05, "loss": 0.2391, "loss_nan_ranks": 0, "loss_rank_avg": 0.10363125801086426, "step": 2290, "valid_targets_mean": 4878.5, "valid_targets_min": 1828 }, { "epoch": 3.7323026851098455, "grad_norm": 0.43814883641270597, "learning_rate": 2.1199475215977817e-05, "loss": 0.2665, "loss_nan_ranks": 0, "loss_rank_avg": 0.10538579523563385, "step": 2295, "valid_targets_mean": 5957.1, "valid_targets_min": 2916 }, { "epoch": 3.7404393816110657, "grad_norm": 0.5103737751157224, "learning_rate": 2.1118517264779858e-05, "loss": 0.2475, "loss_nan_ranks": 0, "loss_rank_avg": 0.12744760513305664, "step": 2300, "valid_targets_mean": 4476.2, "valid_targets_min": 1892 }, { "epoch": 3.7485760781122863, "grad_norm": 0.47819552478708083, "learning_rate": 2.103754092439112e-05, "loss": 0.2823, "loss_nan_ranks": 0, "loss_rank_avg": 0.11515910178422928, "step": 2305, "valid_targets_mean": 6143.5, "valid_targets_min": 1626 }, { "epoch": 3.756712774613507, "grad_norm": 0.5649450823382121, "learning_rate": 2.095654752611817e-05, "loss": 0.26, "loss_nan_ranks": 0, "loss_rank_avg": 0.15299847722053528, "step": 2310, "valid_targets_mean": 5482.8, "valid_targets_min": 624 }, { "epoch": 3.7648494711147276, "grad_norm": 0.43149118197396086, "learning_rate": 2.087553840154801e-05, "loss": 0.2658, "loss_nan_ranks": 0, "loss_rank_avg": 0.12518690526485443, "step": 2315, "valid_targets_mean": 6021.2, "valid_targets_min": 2664 }, { "epoch": 3.772986167615948, "grad_norm": 0.4891027718138667, "learning_rate": 2.0794514882526196e-05, "loss": 0.2526, "loss_nan_ranks": 0, "loss_rank_avg": 0.11703081429004669, "step": 2320, "valid_targets_mean": 4964.6, "valid_targets_min": 397 }, { "epoch": 3.7811228641171684, "grad_norm": 0.48601703764578974, "learning_rate": 2.0713478301134935e-05, "loss": 0.2882, "loss_nan_ranks": 0, "loss_rank_avg": 0.13128621876239777, "step": 2325, "valid_targets_mean": 6682.8, "valid_targets_min": 2997 }, { "epoch": 3.789259560618389, "grad_norm": 0.5447061578281931, "learning_rate": 2.063242998967118e-05, "loss": 0.2512, "loss_nan_ranks": 0, "loss_rank_avg": 0.12155985832214355, "step": 2330, "valid_targets_mean": 4736.2, "valid_targets_min": 2174 }, { "epoch": 3.7973962571196096, "grad_norm": 0.45017085915069277, "learning_rate": 2.0551371280624758e-05, "loss": 0.2551, "loss_nan_ranks": 0, "loss_rank_avg": 0.158024862408638, "step": 2335, "valid_targets_mean": 8097.1, "valid_targets_min": 4594 }, { "epoch": 3.8055329536208298, "grad_norm": 0.48647898978382154, "learning_rate": 2.0470303506656414e-05, "loss": 0.2515, "loss_nan_ranks": 0, "loss_rank_avg": 0.12568457424640656, "step": 2340, "valid_targets_mean": 4161.4, "valid_targets_min": 611 }, { "epoch": 3.8136696501220504, "grad_norm": 0.5446656209319005, "learning_rate": 2.0389228000575953e-05, "loss": 0.2726, "loss_nan_ranks": 0, "loss_rank_avg": 0.16627874970436096, "step": 2345, "valid_targets_mean": 5223.8, "valid_targets_min": 3621 }, { "epoch": 3.821806346623271, "grad_norm": 0.5378101789966692, "learning_rate": 2.0308146095320275e-05, "loss": 0.2669, "loss_nan_ranks": 0, "loss_rank_avg": 0.11316706240177155, "step": 2350, "valid_targets_mean": 5668.1, "valid_targets_min": 2857 }, { "epoch": 3.8299430431244916, "grad_norm": 0.4704455377437423, "learning_rate": 2.0227059123931504e-05, "loss": 0.2663, "loss_nan_ranks": 0, "loss_rank_avg": 0.14419454336166382, "step": 2355, "valid_targets_mean": 6657.2, "valid_targets_min": 2752 }, { "epoch": 3.838079739625712, "grad_norm": 0.4545925318504704, "learning_rate": 2.0145968419535045e-05, "loss": 0.2594, "loss_nan_ranks": 0, "loss_rank_avg": 0.0803401917219162, "step": 2360, "valid_targets_mean": 5352.0, "valid_targets_min": 2022 }, { "epoch": 3.8462164361269324, "grad_norm": 0.5261750953052919, "learning_rate": 2.0064875315317674e-05, "loss": 0.2661, "loss_nan_ranks": 0, "loss_rank_avg": 0.1119522899389267, "step": 2365, "valid_targets_mean": 5081.0, "valid_targets_min": 1380 }, { "epoch": 3.854353132628153, "grad_norm": 0.5977456077727262, "learning_rate": 1.998378114450565e-05, "loss": 0.2568, "loss_nan_ranks": 0, "loss_rank_avg": 0.10629862546920776, "step": 2370, "valid_targets_mean": 4967.9, "valid_targets_min": 559 }, { "epoch": 3.862489829129373, "grad_norm": 0.6008964888102649, "learning_rate": 1.9902687240342722e-05, "loss": 0.2568, "loss_nan_ranks": 0, "loss_rank_avg": 0.11401569843292236, "step": 2375, "valid_targets_mean": 4733.9, "valid_targets_min": 2100 }, { "epoch": 3.870626525630594, "grad_norm": 0.5127247595415064, "learning_rate": 1.982159493606829e-05, "loss": 0.2573, "loss_nan_ranks": 0, "loss_rank_avg": 0.1426711082458496, "step": 2380, "valid_targets_mean": 5931.9, "valid_targets_min": 4307 }, { "epoch": 3.8787632221318145, "grad_norm": 0.5231212605718677, "learning_rate": 1.9740505564895436e-05, "loss": 0.262, "loss_nan_ranks": 0, "loss_rank_avg": 0.15910865366458893, "step": 2385, "valid_targets_mean": 5790.6, "valid_targets_min": 3166 }, { "epoch": 3.886899918633035, "grad_norm": 0.5112833558456881, "learning_rate": 1.9659420459989026e-05, "loss": 0.2742, "loss_nan_ranks": 0, "loss_rank_avg": 0.12127886712551117, "step": 2390, "valid_targets_mean": 4869.2, "valid_targets_min": 3034 }, { "epoch": 3.8950366151342557, "grad_norm": 0.4557114664235136, "learning_rate": 1.9578340954443784e-05, "loss": 0.2623, "loss_nan_ranks": 0, "loss_rank_avg": 0.132114976644516, "step": 2395, "valid_targets_mean": 6727.5, "valid_targets_min": 360 }, { "epoch": 3.903173311635476, "grad_norm": 0.5394796995535039, "learning_rate": 1.949726838126237e-05, "loss": 0.2658, "loss_nan_ranks": 0, "loss_rank_avg": 0.15240266919136047, "step": 2400, "valid_targets_mean": 5102.9, "valid_targets_min": 2064 }, { "epoch": 3.9113100081366965, "grad_norm": 0.5486897951018997, "learning_rate": 1.941620407333347e-05, "loss": 0.2623, "loss_nan_ranks": 0, "loss_rank_avg": 0.12607380747795105, "step": 2405, "valid_targets_mean": 4510.5, "valid_targets_min": 1648 }, { "epoch": 3.919446704637917, "grad_norm": 0.42322274272575794, "learning_rate": 1.933514936340991e-05, "loss": 0.249, "loss_nan_ranks": 0, "loss_rank_avg": 0.06517419964075089, "step": 2410, "valid_targets_mean": 5701.9, "valid_targets_min": 1451 }, { "epoch": 3.9275834011391373, "grad_norm": 0.49141277897204666, "learning_rate": 1.9254105584086683e-05, "loss": 0.2733, "loss_nan_ranks": 0, "loss_rank_avg": 0.12552395462989807, "step": 2415, "valid_targets_mean": 5657.6, "valid_targets_min": 3092 }, { "epoch": 3.935720097640358, "grad_norm": 0.5126538411225738, "learning_rate": 1.9173074067779102e-05, "loss": 0.2653, "loss_nan_ranks": 0, "loss_rank_avg": 0.13129568099975586, "step": 2420, "valid_targets_mean": 5424.1, "valid_targets_min": 2023 }, { "epoch": 3.9438567941415785, "grad_norm": 0.4865930267161227, "learning_rate": 1.9092056146700844e-05, "loss": 0.2623, "loss_nan_ranks": 0, "loss_rank_avg": 0.12925077974796295, "step": 2425, "valid_targets_mean": 5372.9, "valid_targets_min": 3511 }, { "epoch": 3.951993490642799, "grad_norm": 0.5288677950325463, "learning_rate": 1.9011053152842087e-05, "loss": 0.267, "loss_nan_ranks": 0, "loss_rank_avg": 0.1401764452457428, "step": 2430, "valid_targets_mean": 5477.1, "valid_targets_min": 958 }, { "epoch": 3.9601301871440198, "grad_norm": 0.5471093288120334, "learning_rate": 1.89300664179476e-05, "loss": 0.2784, "loss_nan_ranks": 0, "loss_rank_avg": 0.1709902137517929, "step": 2435, "valid_targets_mean": 5307.8, "valid_targets_min": 1418 }, { "epoch": 3.96826688364524, "grad_norm": 0.6064125532966921, "learning_rate": 1.8849097273494827e-05, "loss": 0.2833, "loss_nan_ranks": 0, "loss_rank_avg": 0.1471061408519745, "step": 2440, "valid_targets_mean": 5405.4, "valid_targets_min": 582 }, { "epoch": 3.9764035801464606, "grad_norm": 0.41587136888702764, "learning_rate": 1.8768147050672028e-05, "loss": 0.2637, "loss_nan_ranks": 0, "loss_rank_avg": 0.09928697347640991, "step": 2445, "valid_targets_mean": 6103.5, "valid_targets_min": 1364 }, { "epoch": 3.984540276647681, "grad_norm": 0.5513050609197007, "learning_rate": 1.8687217080356365e-05, "loss": 0.277, "loss_nan_ranks": 0, "loss_rank_avg": 0.12455247342586517, "step": 2450, "valid_targets_mean": 3710.2, "valid_targets_min": 468 }, { "epoch": 3.9926769731489014, "grad_norm": 0.5016492346972834, "learning_rate": 1.8606308693092035e-05, "loss": 0.2655, "loss_nan_ranks": 0, "loss_rank_avg": 0.10865034908056259, "step": 2455, "valid_targets_mean": 4436.8, "valid_targets_min": 2339 }, { "epoch": 4.0, "grad_norm": 0.6629905256300082, "learning_rate": 1.8525423219068423e-05, "loss": 0.2677, "loss_nan_ranks": 0, "loss_rank_avg": 0.2965284585952759, "step": 2460, "valid_targets_mean": 5677.5, "valid_targets_min": 2822 }, { "epoch": 4.008136696501221, "grad_norm": 0.5129517123763623, "learning_rate": 1.844456198809817e-05, "loss": 0.2333, "loss_nan_ranks": 0, "loss_rank_avg": 0.10877451300621033, "step": 2465, "valid_targets_mean": 5123.9, "valid_targets_min": 2568 }, { "epoch": 4.016273393002441, "grad_norm": 0.473163436849981, "learning_rate": 1.8363726329595356e-05, "loss": 0.2384, "loss_nan_ranks": 0, "loss_rank_avg": 0.14932730793952942, "step": 2470, "valid_targets_mean": 7151.4, "valid_targets_min": 3539 }, { "epoch": 4.024410089503662, "grad_norm": 0.4124240574592047, "learning_rate": 1.828291757255364e-05, "loss": 0.2381, "loss_nan_ranks": 0, "loss_rank_avg": 0.11770130693912506, "step": 2475, "valid_targets_mean": 8133.2, "valid_targets_min": 3713 }, { "epoch": 4.032546786004882, "grad_norm": 0.6586399627241981, "learning_rate": 1.8202137045524383e-05, "loss": 0.2623, "loss_nan_ranks": 0, "loss_rank_avg": 0.13058783113956451, "step": 2480, "valid_targets_mean": 6915.6, "valid_targets_min": 4175 }, { "epoch": 4.040683482506102, "grad_norm": 0.5513424168769842, "learning_rate": 1.812138607659486e-05, "loss": 0.2313, "loss_nan_ranks": 0, "loss_rank_avg": 0.12268248945474625, "step": 2485, "valid_targets_mean": 5776.4, "valid_targets_min": 2434 }, { "epoch": 4.048820179007323, "grad_norm": 0.5252916649047769, "learning_rate": 1.8040665993366355e-05, "loss": 0.2389, "loss_nan_ranks": 0, "loss_rank_avg": 0.13886849582195282, "step": 2490, "valid_targets_mean": 5557.5, "valid_targets_min": 2120 }, { "epoch": 4.0569568755085434, "grad_norm": 0.5060252786002666, "learning_rate": 1.795997812293239e-05, "loss": 0.2565, "loss_nan_ranks": 0, "loss_rank_avg": 0.20440292358398438, "step": 2495, "valid_targets_mean": 8090.6, "valid_targets_min": 3649 }, { "epoch": 4.065093572009764, "grad_norm": 0.5304099045808806, "learning_rate": 1.7879323791856875e-05, "loss": 0.264, "loss_nan_ranks": 0, "loss_rank_avg": 0.11923650652170181, "step": 2500, "valid_targets_mean": 5128.9, "valid_targets_min": 3118 }, { "epoch": 4.073230268510985, "grad_norm": 0.5848838368779085, "learning_rate": 1.7798704326152317e-05, "loss": 0.257, "loss_nan_ranks": 0, "loss_rank_avg": 0.19044384360313416, "step": 2505, "valid_targets_mean": 6830.1, "valid_targets_min": 4289 }, { "epoch": 4.081366965012205, "grad_norm": 0.5705122461346422, "learning_rate": 1.7718121051258016e-05, "loss": 0.262, "loss_nan_ranks": 0, "loss_rank_avg": 0.14008468389511108, "step": 2510, "valid_targets_mean": 5542.6, "valid_targets_min": 2108 }, { "epoch": 4.089503661513426, "grad_norm": 0.441927710137963, "learning_rate": 1.763757529201826e-05, "loss": 0.2531, "loss_nan_ranks": 0, "loss_rank_avg": 0.12376945465803146, "step": 2515, "valid_targets_mean": 6966.4, "valid_targets_min": 1952 }, { "epoch": 4.097640358014646, "grad_norm": 0.7043747925369948, "learning_rate": 1.7557068372660562e-05, "loss": 0.2438, "loss_nan_ranks": 0, "loss_rank_avg": 0.12836799025535583, "step": 2520, "valid_targets_mean": 4607.2, "valid_targets_min": 2518 }, { "epoch": 4.105777054515866, "grad_norm": 0.5410005564912586, "learning_rate": 1.747660161677387e-05, "loss": 0.255, "loss_nan_ranks": 0, "loss_rank_avg": 0.15527786314487457, "step": 2525, "valid_targets_mean": 6187.5, "valid_targets_min": 1744 }, { "epoch": 4.113913751017087, "grad_norm": 0.4912342111176402, "learning_rate": 1.7396176347286838e-05, "loss": 0.2581, "loss_nan_ranks": 0, "loss_rank_avg": 0.1411733329296112, "step": 2530, "valid_targets_mean": 6837.1, "valid_targets_min": 2828 }, { "epoch": 4.1220504475183075, "grad_norm": 0.5865774973750087, "learning_rate": 1.7315793886446036e-05, "loss": 0.2557, "loss_nan_ranks": 0, "loss_rank_avg": 0.1618509590625763, "step": 2535, "valid_targets_mean": 5910.0, "valid_targets_min": 3286 }, { "epoch": 4.130187144019528, "grad_norm": 0.626903542457007, "learning_rate": 1.7235455555794236e-05, "loss": 0.2373, "loss_nan_ranks": 0, "loss_rank_avg": 0.13324236869812012, "step": 2540, "valid_targets_mean": 5587.8, "valid_targets_min": 2551 }, { "epoch": 4.138323840520749, "grad_norm": 0.5795141806915454, "learning_rate": 1.7155162676148682e-05, "loss": 0.2257, "loss_nan_ranks": 0, "loss_rank_avg": 0.12815946340560913, "step": 2545, "valid_targets_mean": 5687.1, "valid_targets_min": 1514 }, { "epoch": 4.146460537021969, "grad_norm": 0.5206487840907027, "learning_rate": 1.707491656757936e-05, "loss": 0.2287, "loss_nan_ranks": 0, "loss_rank_avg": 0.14685989916324615, "step": 2550, "valid_targets_mean": 6729.9, "valid_targets_min": 1309 }, { "epoch": 4.15459723352319, "grad_norm": 0.5418721063841692, "learning_rate": 1.6994718549387332e-05, "loss": 0.2367, "loss_nan_ranks": 0, "loss_rank_avg": 0.11401748657226562, "step": 2555, "valid_targets_mean": 4553.0, "valid_targets_min": 914 }, { "epoch": 4.16273393002441, "grad_norm": 0.5304635472704533, "learning_rate": 1.6914569940083004e-05, "loss": 0.2657, "loss_nan_ranks": 0, "loss_rank_avg": 0.15515920519828796, "step": 2560, "valid_targets_mean": 5698.4, "valid_targets_min": 3076 }, { "epoch": 4.17087062652563, "grad_norm": 0.5577644314206343, "learning_rate": 1.6834472057364462e-05, "loss": 0.2403, "loss_nan_ranks": 0, "loss_rank_avg": 0.1251552402973175, "step": 2565, "valid_targets_mean": 5167.2, "valid_targets_min": 897 }, { "epoch": 4.179007323026851, "grad_norm": 0.516551191316929, "learning_rate": 1.6754426218095827e-05, "loss": 0.2421, "loss_nan_ranks": 0, "loss_rank_avg": 0.13127167522907257, "step": 2570, "valid_targets_mean": 5867.4, "valid_targets_min": 3286 }, { "epoch": 4.187144019528072, "grad_norm": 0.4789758761612466, "learning_rate": 1.6674433738285573e-05, "loss": 0.2587, "loss_nan_ranks": 0, "loss_rank_avg": 0.1123281717300415, "step": 2575, "valid_targets_mean": 6434.2, "valid_targets_min": 3024 }, { "epoch": 4.195280716029292, "grad_norm": 0.5647313559781841, "learning_rate": 1.6594495933064926e-05, "loss": 0.2499, "loss_nan_ranks": 0, "loss_rank_avg": 0.16273194551467896, "step": 2580, "valid_targets_mean": 5906.6, "valid_targets_min": 3636 }, { "epoch": 4.203417412530513, "grad_norm": 0.4660706331602136, "learning_rate": 1.6514614116666213e-05, "loss": 0.2664, "loss_nan_ranks": 0, "loss_rank_avg": 0.11347354203462601, "step": 2585, "valid_targets_mean": 7309.0, "valid_targets_min": 2153 }, { "epoch": 4.211554109031733, "grad_norm": 0.5253962224050552, "learning_rate": 1.6434789602401264e-05, "loss": 0.2525, "loss_nan_ranks": 0, "loss_rank_avg": 0.1410287618637085, "step": 2590, "valid_targets_mean": 6679.8, "valid_targets_min": 1391 }, { "epoch": 4.219690805532954, "grad_norm": 0.5081317554456144, "learning_rate": 1.6355023702639835e-05, "loss": 0.2676, "loss_nan_ranks": 0, "loss_rank_avg": 0.10498687624931335, "step": 2595, "valid_targets_mean": 5955.5, "valid_targets_min": 1427 }, { "epoch": 4.227827502034174, "grad_norm": 0.5133995179689695, "learning_rate": 1.6275317728787995e-05, "loss": 0.2626, "loss_nan_ranks": 0, "loss_rank_avg": 0.15336143970489502, "step": 2600, "valid_targets_mean": 6639.5, "valid_targets_min": 3253 }, { "epoch": 4.235964198535394, "grad_norm": 0.6025044099778876, "learning_rate": 1.6195672991266627e-05, "loss": 0.2436, "loss_nan_ranks": 0, "loss_rank_avg": 0.1540364921092987, "step": 2605, "valid_targets_mean": 5138.1, "valid_targets_min": 1887 }, { "epoch": 4.244100895036615, "grad_norm": 0.5322557851182275, "learning_rate": 1.6116090799489817e-05, "loss": 0.263, "loss_nan_ranks": 0, "loss_rank_avg": 0.13185200095176697, "step": 2610, "valid_targets_mean": 6066.1, "valid_targets_min": 3914 }, { "epoch": 4.252237591537836, "grad_norm": 0.5441188482256656, "learning_rate": 1.603657246184337e-05, "loss": 0.2449, "loss_nan_ranks": 0, "loss_rank_avg": 0.12901723384857178, "step": 2615, "valid_targets_mean": 4693.8, "valid_targets_min": 1555 }, { "epoch": 4.260374288039056, "grad_norm": 0.5849782251122515, "learning_rate": 1.5957119285663276e-05, "loss": 0.2555, "loss_nan_ranks": 0, "loss_rank_avg": 0.11500156670808792, "step": 2620, "valid_targets_mean": 5282.9, "valid_targets_min": 2751 }, { "epoch": 4.268510984540277, "grad_norm": 0.48316160524922036, "learning_rate": 1.5877732577214227e-05, "loss": 0.2713, "loss_nan_ranks": 0, "loss_rank_avg": 0.12493854761123657, "step": 2625, "valid_targets_mean": 6715.5, "valid_targets_min": 2447 }, { "epoch": 4.2766476810414975, "grad_norm": 0.5053057310492522, "learning_rate": 1.5798413641668152e-05, "loss": 0.2486, "loss_nan_ranks": 0, "loss_rank_avg": 0.10976533591747284, "step": 2630, "valid_targets_mean": 5234.4, "valid_targets_min": 3316 }, { "epoch": 4.284784377542717, "grad_norm": 0.5519671887282555, "learning_rate": 1.5719163783082735e-05, "loss": 0.2687, "loss_nan_ranks": 0, "loss_rank_avg": 0.11516216397285461, "step": 2635, "valid_targets_mean": 4224.4, "valid_targets_min": 2866 }, { "epoch": 4.292921074043938, "grad_norm": 0.5225037254497872, "learning_rate": 1.563998430437999e-05, "loss": 0.2536, "loss_nan_ranks": 0, "loss_rank_avg": 0.17195287346839905, "step": 2640, "valid_targets_mean": 5706.8, "valid_targets_min": 3850 }, { "epoch": 4.3010577705451585, "grad_norm": 0.598135661385332, "learning_rate": 1.556087650732483e-05, "loss": 0.2216, "loss_nan_ranks": 0, "loss_rank_avg": 0.13336588442325592, "step": 2645, "valid_targets_mean": 4468.4, "valid_targets_min": 3203 }, { "epoch": 4.309194467046379, "grad_norm": 0.5569556750382165, "learning_rate": 1.5481841692503696e-05, "loss": 0.2596, "loss_nan_ranks": 0, "loss_rank_avg": 0.1275118738412857, "step": 2650, "valid_targets_mean": 6468.5, "valid_targets_min": 2076 }, { "epoch": 4.3173311635476, "grad_norm": 0.5748124791778696, "learning_rate": 1.5402881159303132e-05, "loss": 0.2641, "loss_nan_ranks": 0, "loss_rank_avg": 0.13305258750915527, "step": 2655, "valid_targets_mean": 5509.2, "valid_targets_min": 4168 }, { "epoch": 4.32546786004882, "grad_norm": 0.5867859868511631, "learning_rate": 1.5323996205888444e-05, "loss": 0.2625, "loss_nan_ranks": 0, "loss_rank_avg": 0.10594667494297028, "step": 2660, "valid_targets_mean": 4375.5, "valid_targets_min": 1215 }, { "epoch": 4.333604556550041, "grad_norm": 0.5536999755590897, "learning_rate": 1.5245188129182352e-05, "loss": 0.2466, "loss_nan_ranks": 0, "loss_rank_avg": 0.15136541426181793, "step": 2665, "valid_targets_mean": 6034.4, "valid_targets_min": 2955 }, { "epoch": 4.341741253051262, "grad_norm": 0.45096926773078744, "learning_rate": 1.5166458224843666e-05, "loss": 0.2356, "loss_nan_ranks": 0, "loss_rank_avg": 0.15225692093372345, "step": 2670, "valid_targets_mean": 7230.6, "valid_targets_min": 4046 }, { "epoch": 4.349877949552481, "grad_norm": 0.4876695137087219, "learning_rate": 1.5087807787246018e-05, "loss": 0.2478, "loss_nan_ranks": 0, "loss_rank_avg": 0.1192513108253479, "step": 2675, "valid_targets_mean": 6170.1, "valid_targets_min": 4160 }, { "epoch": 4.358014646053702, "grad_norm": 0.518906460408022, "learning_rate": 1.5009238109456519e-05, "loss": 0.2588, "loss_nan_ranks": 0, "loss_rank_avg": 0.11651073396205902, "step": 2680, "valid_targets_mean": 5396.5, "valid_targets_min": 2022 }, { "epoch": 4.3661513425549225, "grad_norm": 0.49929632927019785, "learning_rate": 1.4930750483214545e-05, "loss": 0.2338, "loss_nan_ranks": 0, "loss_rank_avg": 0.12936654686927795, "step": 2685, "valid_targets_mean": 6563.0, "valid_targets_min": 3114 }, { "epoch": 4.374288039056143, "grad_norm": 0.6156782440298237, "learning_rate": 1.485234619891049e-05, "loss": 0.2538, "loss_nan_ranks": 0, "loss_rank_avg": 0.11831729114055634, "step": 2690, "valid_targets_mean": 3777.8, "valid_targets_min": 1211 }, { "epoch": 4.382424735557364, "grad_norm": 0.49361613525157977, "learning_rate": 1.4774026545564542e-05, "loss": 0.2493, "loss_nan_ranks": 0, "loss_rank_avg": 0.13980375230312347, "step": 2695, "valid_targets_mean": 6734.5, "valid_targets_min": 3579 }, { "epoch": 4.390561432058584, "grad_norm": 0.4945912218477993, "learning_rate": 1.4695792810805513e-05, "loss": 0.2634, "loss_nan_ranks": 0, "loss_rank_avg": 0.11305113881826401, "step": 2700, "valid_targets_mean": 4944.9, "valid_targets_min": 2712 }, { "epoch": 4.398698128559805, "grad_norm": 0.5756325553240135, "learning_rate": 1.4617646280849642e-05, "loss": 0.2774, "loss_nan_ranks": 0, "loss_rank_avg": 0.12662610411643982, "step": 2705, "valid_targets_mean": 4155.1, "valid_targets_min": 2861 }, { "epoch": 4.406834825061026, "grad_norm": 0.4985205743712053, "learning_rate": 1.4539588240479465e-05, "loss": 0.2523, "loss_nan_ranks": 0, "loss_rank_avg": 0.12237317860126495, "step": 2710, "valid_targets_mean": 6090.8, "valid_targets_min": 4559 }, { "epoch": 4.414971521562245, "grad_norm": 0.5203081116851938, "learning_rate": 1.4461619973022687e-05, "loss": 0.2471, "loss_nan_ranks": 0, "loss_rank_avg": 0.1582365483045578, "step": 2715, "valid_targets_mean": 5534.2, "valid_targets_min": 2713 }, { "epoch": 4.423108218063466, "grad_norm": 0.5071779116892461, "learning_rate": 1.4383742760331076e-05, "loss": 0.2458, "loss_nan_ranks": 0, "loss_rank_avg": 0.10871212184429169, "step": 2720, "valid_targets_mean": 5417.2, "valid_targets_min": 1808 }, { "epoch": 4.431244914564687, "grad_norm": 0.5122608576322747, "learning_rate": 1.4305957882759427e-05, "loss": 0.2536, "loss_nan_ranks": 0, "loss_rank_avg": 0.09927636384963989, "step": 2725, "valid_targets_mean": 4650.1, "valid_targets_min": 544 }, { "epoch": 4.439381611065907, "grad_norm": 0.6181215239682092, "learning_rate": 1.4228266619144453e-05, "loss": 0.2658, "loss_nan_ranks": 0, "loss_rank_avg": 0.1790265142917633, "step": 2730, "valid_targets_mean": 5120.4, "valid_targets_min": 2997 }, { "epoch": 4.447518307567128, "grad_norm": 0.568948631389522, "learning_rate": 1.4150670246783799e-05, "loss": 0.229, "loss_nan_ranks": 0, "loss_rank_avg": 0.12507446110248566, "step": 2735, "valid_targets_mean": 4760.6, "valid_targets_min": 2546 }, { "epoch": 4.4556550040683485, "grad_norm": 0.49435152766723117, "learning_rate": 1.4073170041415028e-05, "loss": 0.2428, "loss_nan_ranks": 0, "loss_rank_avg": 0.1444876343011856, "step": 2740, "valid_targets_mean": 6215.4, "valid_targets_min": 3236 }, { "epoch": 4.463791700569569, "grad_norm": 0.6181766282098673, "learning_rate": 1.3995767277194665e-05, "loss": 0.2429, "loss_nan_ranks": 0, "loss_rank_avg": 0.10405126214027405, "step": 2745, "valid_targets_mean": 4468.4, "valid_targets_min": 724 }, { "epoch": 4.471928397070789, "grad_norm": 0.41154847544209594, "learning_rate": 1.391846322667722e-05, "loss": 0.2338, "loss_nan_ranks": 0, "loss_rank_avg": 0.0906953513622284, "step": 2750, "valid_targets_mean": 5218.9, "valid_targets_min": 2520 }, { "epoch": 4.480065093572009, "grad_norm": 0.6572132993720595, "learning_rate": 1.3841259160794298e-05, "loss": 0.256, "loss_nan_ranks": 0, "loss_rank_avg": 0.12475261837244034, "step": 2755, "valid_targets_mean": 6810.9, "valid_targets_min": 2340 }, { "epoch": 4.48820179007323, "grad_norm": 0.5336969527360339, "learning_rate": 1.3764156348833666e-05, "loss": 0.2492, "loss_nan_ranks": 0, "loss_rank_avg": 0.12281182408332825, "step": 2760, "valid_targets_mean": 6573.4, "valid_targets_min": 984 }, { "epoch": 4.496338486574451, "grad_norm": 0.568863776583933, "learning_rate": 1.3687156058418422e-05, "loss": 0.2305, "loss_nan_ranks": 0, "loss_rank_avg": 0.1258392333984375, "step": 2765, "valid_targets_mean": 4216.4, "valid_targets_min": 2142 }, { "epoch": 4.504475183075671, "grad_norm": 0.5202434927147002, "learning_rate": 1.3610259555486152e-05, "loss": 0.2665, "loss_nan_ranks": 0, "loss_rank_avg": 0.14846715331077576, "step": 2770, "valid_targets_mean": 5878.0, "valid_targets_min": 880 }, { "epoch": 4.512611879576892, "grad_norm": 0.620131546040906, "learning_rate": 1.3533468104268078e-05, "loss": 0.275, "loss_nan_ranks": 0, "loss_rank_avg": 0.1723940074443817, "step": 2775, "valid_targets_mean": 5155.9, "valid_targets_min": 902 }, { "epoch": 4.5207485760781125, "grad_norm": 0.49196921841926167, "learning_rate": 1.3456782967268316e-05, "loss": 0.2492, "loss_nan_ranks": 0, "loss_rank_avg": 0.12150443345308304, "step": 2780, "valid_targets_mean": 5932.6, "valid_targets_min": 3864 }, { "epoch": 4.528885272579333, "grad_norm": 0.4638624677398862, "learning_rate": 1.3380205405243096e-05, "loss": 0.2423, "loss_nan_ranks": 0, "loss_rank_avg": 0.09334471076726913, "step": 2785, "valid_targets_mean": 5831.0, "valid_targets_min": 2304 }, { "epoch": 4.537021969080554, "grad_norm": 0.582037329244977, "learning_rate": 1.3303736677180044e-05, "loss": 0.2357, "loss_nan_ranks": 0, "loss_rank_avg": 0.17545725405216217, "step": 2790, "valid_targets_mean": 5931.8, "valid_targets_min": 1744 }, { "epoch": 4.5451586655817735, "grad_norm": 0.40849974141197115, "learning_rate": 1.322737804027749e-05, "loss": 0.2452, "loss_nan_ranks": 0, "loss_rank_avg": 0.11623605340719223, "step": 2795, "valid_targets_mean": 8913.4, "valid_targets_min": 3525 }, { "epoch": 4.553295362082994, "grad_norm": 0.5932308533815444, "learning_rate": 1.315113074992378e-05, "loss": 0.255, "loss_nan_ranks": 0, "loss_rank_avg": 0.11075286567211151, "step": 2800, "valid_targets_mean": 6780.4, "valid_targets_min": 4594 }, { "epoch": 4.561432058584215, "grad_norm": 0.5613236786122735, "learning_rate": 1.3074996059676644e-05, "loss": 0.2383, "loss_nan_ranks": 0, "loss_rank_avg": 0.12261034548282623, "step": 2805, "valid_targets_mean": 6014.5, "valid_targets_min": 1412 }, { "epoch": 4.569568755085435, "grad_norm": 0.6145107752409859, "learning_rate": 1.2998975221242596e-05, "loss": 0.2341, "loss_nan_ranks": 0, "loss_rank_avg": 0.11969676613807678, "step": 2810, "valid_targets_mean": 6176.0, "valid_targets_min": 2517 }, { "epoch": 4.577705451586656, "grad_norm": 0.5116817887496089, "learning_rate": 1.292306948445634e-05, "loss": 0.2527, "loss_nan_ranks": 0, "loss_rank_avg": 0.09205292165279388, "step": 2815, "valid_targets_mean": 4062.6, "valid_targets_min": 1865 }, { "epoch": 4.585842148087877, "grad_norm": 0.5032628834115105, "learning_rate": 1.2847280097260245e-05, "loss": 0.2361, "loss_nan_ranks": 0, "loss_rank_avg": 0.10667150467634201, "step": 2820, "valid_targets_mean": 5223.2, "valid_targets_min": 1628 }, { "epoch": 4.593978844589097, "grad_norm": 0.519138895357275, "learning_rate": 1.2771608305683798e-05, "loss": 0.2423, "loss_nan_ranks": 0, "loss_rank_avg": 0.1109437346458435, "step": 2825, "valid_targets_mean": 5241.1, "valid_targets_min": 2067 }, { "epoch": 4.602115541090317, "grad_norm": 0.525394243588212, "learning_rate": 1.269605535382314e-05, "loss": 0.2547, "loss_nan_ranks": 0, "loss_rank_avg": 0.16636374592781067, "step": 2830, "valid_targets_mean": 6438.2, "valid_targets_min": 558 }, { "epoch": 4.610252237591538, "grad_norm": 0.5191821565520898, "learning_rate": 1.2620622483820604e-05, "loss": 0.2402, "loss_nan_ranks": 0, "loss_rank_avg": 0.11650275439023972, "step": 2835, "valid_targets_mean": 4864.6, "valid_targets_min": 524 }, { "epoch": 4.618388934092758, "grad_norm": 0.5627143798214106, "learning_rate": 1.2545310935844288e-05, "loss": 0.2473, "loss_nan_ranks": 0, "loss_rank_avg": 0.09677013009786606, "step": 2840, "valid_targets_mean": 3457.5, "valid_targets_min": 360 }, { "epoch": 4.626525630593979, "grad_norm": 0.5874185551809977, "learning_rate": 1.2470121948067693e-05, "loss": 0.2656, "loss_nan_ranks": 0, "loss_rank_avg": 0.1323344111442566, "step": 2845, "valid_targets_mean": 5520.2, "valid_targets_min": 2752 }, { "epoch": 4.634662327095199, "grad_norm": 0.5568858672026162, "learning_rate": 1.2395056756649328e-05, "loss": 0.241, "loss_nan_ranks": 0, "loss_rank_avg": 0.13221968710422516, "step": 2850, "valid_targets_mean": 5042.0, "valid_targets_min": 1374 }, { "epoch": 4.64279902359642, "grad_norm": 0.4669743898337823, "learning_rate": 1.2320116595712413e-05, "loss": 0.2599, "loss_nan_ranks": 0, "loss_rank_avg": 0.10005086660385132, "step": 2855, "valid_targets_mean": 6354.0, "valid_targets_min": 2977 }, { "epoch": 4.650935720097641, "grad_norm": 0.890197194306011, "learning_rate": 1.224530269732457e-05, "loss": 0.2535, "loss_nan_ranks": 0, "loss_rank_avg": 0.11468639224767685, "step": 2860, "valid_targets_mean": 4317.4, "valid_targets_min": 1349 }, { "epoch": 4.65907241659886, "grad_norm": 0.523673019189796, "learning_rate": 1.2170616291477595e-05, "loss": 0.2532, "loss_nan_ranks": 0, "loss_rank_avg": 0.10656925290822983, "step": 2865, "valid_targets_mean": 5904.4, "valid_targets_min": 513 }, { "epoch": 4.667209113100081, "grad_norm": 0.5080582692191867, "learning_rate": 1.2096058606067205e-05, "loss": 0.257, "loss_nan_ranks": 0, "loss_rank_avg": 0.10707581788301468, "step": 2870, "valid_targets_mean": 4963.8, "valid_targets_min": 2731 }, { "epoch": 4.675345809601302, "grad_norm": 0.5988092562512479, "learning_rate": 1.2021630866872877e-05, "loss": 0.2523, "loss_nan_ranks": 0, "loss_rank_avg": 0.1406228244304657, "step": 2875, "valid_targets_mean": 5334.5, "valid_targets_min": 1531 }, { "epoch": 4.683482506102522, "grad_norm": 0.41508039808193575, "learning_rate": 1.1947334297537675e-05, "loss": 0.2564, "loss_nan_ranks": 0, "loss_rank_avg": 0.07547567784786224, "step": 2880, "valid_targets_mean": 6389.6, "valid_targets_min": 1338 }, { "epoch": 4.691619202603743, "grad_norm": 0.4920978401058176, "learning_rate": 1.1873170119548134e-05, "loss": 0.2433, "loss_nan_ranks": 0, "loss_rank_avg": 0.12869910895824432, "step": 2885, "valid_targets_mean": 6174.5, "valid_targets_min": 1998 }, { "epoch": 4.6997558991049635, "grad_norm": 0.5167942635637724, "learning_rate": 1.1799139552214202e-05, "loss": 0.2656, "loss_nan_ranks": 0, "loss_rank_avg": 0.16343358159065247, "step": 2890, "valid_targets_mean": 5750.2, "valid_targets_min": 3412 }, { "epoch": 4.707892595606184, "grad_norm": 0.6239170640519179, "learning_rate": 1.1725243812649168e-05, "loss": 0.25, "loss_nan_ranks": 0, "loss_rank_avg": 0.14894859492778778, "step": 2895, "valid_targets_mean": 5554.4, "valid_targets_min": 4602 }, { "epoch": 4.716029292107405, "grad_norm": 0.5652543437239146, "learning_rate": 1.1651484115749647e-05, "loss": 0.2542, "loss_nan_ranks": 0, "loss_rank_avg": 0.13217860460281372, "step": 2900, "valid_targets_mean": 4814.0, "valid_targets_min": 1908 }, { "epoch": 4.724165988608625, "grad_norm": 0.43613616950750617, "learning_rate": 1.1577861674175645e-05, "loss": 0.2434, "loss_nan_ranks": 0, "loss_rank_avg": 0.11000243574380875, "step": 2905, "valid_targets_mean": 6706.0, "valid_targets_min": 2946 }, { "epoch": 4.732302685109845, "grad_norm": 0.5312582849880375, "learning_rate": 1.1504377698330575e-05, "loss": 0.2636, "loss_nan_ranks": 0, "loss_rank_avg": 0.10568075627088547, "step": 2910, "valid_targets_mean": 4921.6, "valid_targets_min": 2460 }, { "epoch": 4.740439381611066, "grad_norm": 0.47078207010849765, "learning_rate": 1.1431033396341391e-05, "loss": 0.2561, "loss_nan_ranks": 0, "loss_rank_avg": 0.1127002015709877, "step": 2915, "valid_targets_mean": 6926.8, "valid_targets_min": 1427 }, { "epoch": 4.748576078112286, "grad_norm": 0.5215888340298842, "learning_rate": 1.1357829974038703e-05, "loss": 0.2688, "loss_nan_ranks": 0, "loss_rank_avg": 0.1564989537000656, "step": 2920, "valid_targets_mean": 6785.0, "valid_targets_min": 3423 }, { "epoch": 4.756712774613507, "grad_norm": 0.5470344569640518, "learning_rate": 1.1284768634936971e-05, "loss": 0.2485, "loss_nan_ranks": 0, "loss_rank_avg": 0.187900573015213, "step": 2925, "valid_targets_mean": 6071.8, "valid_targets_min": 2555 }, { "epoch": 4.764849471114728, "grad_norm": 0.5184922299861338, "learning_rate": 1.1211850580214703e-05, "loss": 0.2424, "loss_nan_ranks": 0, "loss_rank_avg": 0.10915215313434601, "step": 2930, "valid_targets_mean": 5272.6, "valid_targets_min": 774 }, { "epoch": 4.772986167615948, "grad_norm": 0.5260960542301046, "learning_rate": 1.1139077008694712e-05, "loss": 0.2485, "loss_nan_ranks": 0, "loss_rank_avg": 0.16236786544322968, "step": 2935, "valid_targets_mean": 6286.5, "valid_targets_min": 1737 }, { "epoch": 4.781122864117169, "grad_norm": 0.5220847375110784, "learning_rate": 1.1066449116824428e-05, "loss": 0.2454, "loss_nan_ranks": 0, "loss_rank_avg": 0.12581384181976318, "step": 2940, "valid_targets_mean": 5605.1, "valid_targets_min": 4296 }, { "epoch": 4.7892595606183885, "grad_norm": 0.48555117830549954, "learning_rate": 1.099396809865618e-05, "loss": 0.2653, "loss_nan_ranks": 0, "loss_rank_avg": 0.10319238156080246, "step": 2945, "valid_targets_mean": 5697.5, "valid_targets_min": 1837 }, { "epoch": 4.797396257119609, "grad_norm": 0.5192267689139981, "learning_rate": 1.0921635145827611e-05, "loss": 0.2416, "loss_nan_ranks": 0, "loss_rank_avg": 0.1321655809879303, "step": 2950, "valid_targets_mean": 6476.0, "valid_targets_min": 3020 }, { "epoch": 4.80553295362083, "grad_norm": 0.5076930593639264, "learning_rate": 1.0849451447542054e-05, "loss": 0.2495, "loss_nan_ranks": 0, "loss_rank_avg": 0.11374587565660477, "step": 2955, "valid_targets_mean": 6396.4, "valid_targets_min": 1826 }, { "epoch": 4.81366965012205, "grad_norm": 0.6351691391627748, "learning_rate": 1.0777418190549018e-05, "loss": 0.2512, "loss_nan_ranks": 0, "loss_rank_avg": 0.2092050015926361, "step": 2960, "valid_targets_mean": 4927.0, "valid_targets_min": 803 }, { "epoch": 4.821806346623271, "grad_norm": 0.55668226084915, "learning_rate": 1.070553655912463e-05, "loss": 0.2685, "loss_nan_ranks": 0, "loss_rank_avg": 0.11320999264717102, "step": 2965, "valid_targets_mean": 4125.8, "valid_targets_min": 1163 }, { "epoch": 4.829943043124492, "grad_norm": 0.4950231660068158, "learning_rate": 1.0633807735052202e-05, "loss": 0.2639, "loss_nan_ranks": 0, "loss_rank_avg": 0.11982996016740799, "step": 2970, "valid_targets_mean": 4853.8, "valid_targets_min": 2324 }, { "epoch": 4.838079739625712, "grad_norm": 0.7573897869396419, "learning_rate": 1.056223289760278e-05, "loss": 0.2399, "loss_nan_ranks": 0, "loss_rank_avg": 0.10986106842756271, "step": 2975, "valid_targets_mean": 6308.2, "valid_targets_min": 2719 }, { "epoch": 4.846216436126932, "grad_norm": 0.5238872739771269, "learning_rate": 1.0490813223515764e-05, "loss": 0.2487, "loss_nan_ranks": 0, "loss_rank_avg": 0.12110009789466858, "step": 2980, "valid_targets_mean": 6574.9, "valid_targets_min": 3849 }, { "epoch": 4.854353132628153, "grad_norm": 0.6054997927877389, "learning_rate": 1.0419549886979582e-05, "loss": 0.2585, "loss_nan_ranks": 0, "loss_rank_avg": 0.14355552196502686, "step": 2985, "valid_targets_mean": 4339.4, "valid_targets_min": 947 }, { "epoch": 4.862489829129373, "grad_norm": 0.5891493401006247, "learning_rate": 1.0348444059612338e-05, "loss": 0.2537, "loss_nan_ranks": 0, "loss_rank_avg": 0.12982431054115295, "step": 2990, "valid_targets_mean": 4962.1, "valid_targets_min": 3174 }, { "epoch": 4.870626525630594, "grad_norm": 0.49481010220886834, "learning_rate": 1.0277496910442596e-05, "loss": 0.2613, "loss_nan_ranks": 0, "loss_rank_avg": 0.11110454797744751, "step": 2995, "valid_targets_mean": 5967.2, "valid_targets_min": 767 }, { "epoch": 4.8787632221318145, "grad_norm": 0.45375461974264514, "learning_rate": 1.0206709605890133e-05, "loss": 0.2626, "loss_nan_ranks": 0, "loss_rank_avg": 0.1309911608695984, "step": 3000, "valid_targets_mean": 5787.9, "valid_targets_min": 3290 }, { "epoch": 4.886899918633035, "grad_norm": 0.4717289745698522, "learning_rate": 1.0136083309746765e-05, "loss": 0.2623, "loss_nan_ranks": 0, "loss_rank_avg": 0.18679049611091614, "step": 3005, "valid_targets_mean": 8518.8, "valid_targets_min": 5241 }, { "epoch": 4.895036615134256, "grad_norm": 0.4826417818565528, "learning_rate": 1.006561918315724e-05, "loss": 0.2595, "loss_nan_ranks": 0, "loss_rank_avg": 0.14399048686027527, "step": 3010, "valid_targets_mean": 6302.8, "valid_targets_min": 4959 }, { "epoch": 4.903173311635476, "grad_norm": 0.626033134101394, "learning_rate": 9.995318384600112e-06, "loss": 0.2513, "loss_nan_ranks": 0, "loss_rank_avg": 0.13014422357082367, "step": 3015, "valid_targets_mean": 6003.1, "valid_targets_min": 1225 }, { "epoch": 4.911310008136697, "grad_norm": 0.530085231028136, "learning_rate": 9.92518206986871e-06, "loss": 0.2395, "loss_nan_ranks": 0, "loss_rank_avg": 0.09500178694725037, "step": 3020, "valid_targets_mean": 4791.5, "valid_targets_min": 524 }, { "epoch": 4.919446704637917, "grad_norm": 0.645773429216433, "learning_rate": 9.855211392052139e-06, "loss": 0.2584, "loss_nan_ranks": 0, "loss_rank_avg": 0.1401991993188858, "step": 3025, "valid_targets_mean": 4193.1, "valid_targets_min": 2546 }, { "epoch": 4.927583401139137, "grad_norm": 0.5337804157823813, "learning_rate": 9.78540750151632e-06, "loss": 0.2467, "loss_nan_ranks": 0, "loss_rank_avg": 0.13427186012268066, "step": 3030, "valid_targets_mean": 5285.6, "valid_targets_min": 1577 }, { "epoch": 4.935720097640358, "grad_norm": 1.9302688171029854, "learning_rate": 9.715771545885076e-06, "loss": 0.2668, "loss_nan_ranks": 0, "loss_rank_avg": 0.14041340351104736, "step": 3035, "valid_targets_mean": 7417.6, "valid_targets_min": 3274 }, { "epoch": 4.9438567941415785, "grad_norm": 0.5343935268176057, "learning_rate": 9.646304670021263e-06, "loss": 0.2528, "loss_nan_ranks": 0, "loss_rank_avg": 0.1480150669813156, "step": 3040, "valid_targets_mean": 6581.8, "valid_targets_min": 1927 }, { "epoch": 4.951993490642799, "grad_norm": 0.569875399697325, "learning_rate": 9.577008016007956e-06, "loss": 0.2683, "loss_nan_ranks": 0, "loss_rank_avg": 0.17220965027809143, "step": 3045, "valid_targets_mean": 5431.8, "valid_targets_min": 1040 }, { "epoch": 4.96013018714402, "grad_norm": 0.47006455437543826, "learning_rate": 9.50788272312966e-06, "loss": 0.2623, "loss_nan_ranks": 0, "loss_rank_avg": 0.1282365322113037, "step": 3050, "valid_targets_mean": 6441.4, "valid_targets_min": 427 }, { "epoch": 4.96826688364524, "grad_norm": 0.5349848814276844, "learning_rate": 9.43892992785358e-06, "loss": 0.2595, "loss_nan_ranks": 0, "loss_rank_avg": 0.12551423907279968, "step": 3055, "valid_targets_mean": 5614.6, "valid_targets_min": 2311 }, { "epoch": 4.97640358014646, "grad_norm": 0.5428356503095221, "learning_rate": 9.370150763810966e-06, "loss": 0.2569, "loss_nan_ranks": 0, "loss_rank_avg": 0.10237240791320801, "step": 3060, "valid_targets_mean": 4330.6, "valid_targets_min": 2059 }, { "epoch": 4.984540276647681, "grad_norm": 0.48029744452868756, "learning_rate": 9.301546361778424e-06, "loss": 0.2457, "loss_nan_ranks": 0, "loss_rank_avg": 0.13645213842391968, "step": 3065, "valid_targets_mean": 8541.2, "valid_targets_min": 2287 }, { "epoch": 4.992676973148901, "grad_norm": 0.6660157157795131, "learning_rate": 9.233117849659367e-06, "loss": 0.273, "loss_nan_ranks": 0, "loss_rank_avg": 0.12218661606311798, "step": 3070, "valid_targets_mean": 5242.0, "valid_targets_min": 3400 }, { "epoch": 5.0, "grad_norm": 0.6496835877212901, "learning_rate": 9.164866352465447e-06, "loss": 0.2478, "loss_nan_ranks": 0, "loss_rank_avg": 0.23714704811573029, "step": 3075, "valid_targets_mean": 6213.5, "valid_targets_min": 4269 }, { "epoch": 5.008136696501221, "grad_norm": 0.5523377269177591, "learning_rate": 9.096792992298089e-06, "loss": 0.2474, "loss_nan_ranks": 0, "loss_rank_avg": 0.14559800922870636, "step": 3080, "valid_targets_mean": 5338.9, "valid_targets_min": 1860 }, { "epoch": 5.016273393002441, "grad_norm": 0.48621978067676924, "learning_rate": 9.028898888330005e-06, "loss": 0.2405, "loss_nan_ranks": 0, "loss_rank_avg": 0.11603275686502457, "step": 3085, "valid_targets_mean": 7716.8, "valid_targets_min": 4160 }, { "epoch": 5.024410089503662, "grad_norm": 0.4888228209250331, "learning_rate": 8.961185156786815e-06, "loss": 0.2584, "loss_nan_ranks": 0, "loss_rank_avg": 0.15556365251541138, "step": 3090, "valid_targets_mean": 7306.2, "valid_targets_min": 1730 }, { "epoch": 5.032546786004882, "grad_norm": 0.5604592596720499, "learning_rate": 8.893652910928698e-06, "loss": 0.236, "loss_nan_ranks": 0, "loss_rank_avg": 0.09606099128723145, "step": 3095, "valid_targets_mean": 4868.5, "valid_targets_min": 867 }, { "epoch": 5.040683482506102, "grad_norm": 0.5312703952374581, "learning_rate": 8.826303261032072e-06, "loss": 0.2596, "loss_nan_ranks": 0, "loss_rank_avg": 0.14954786002635956, "step": 3100, "valid_targets_mean": 5175.0, "valid_targets_min": 3054 }, { "epoch": 5.048820179007323, "grad_norm": 0.49989048406424097, "learning_rate": 8.759137314371378e-06, "loss": 0.245, "loss_nan_ranks": 0, "loss_rank_avg": 0.10760124027729034, "step": 3105, "valid_targets_mean": 6618.8, "valid_targets_min": 2164 }, { "epoch": 5.0569568755085434, "grad_norm": 0.7886032990488385, "learning_rate": 8.692156175200823e-06, "loss": 0.2505, "loss_nan_ranks": 0, "loss_rank_avg": 0.1214192658662796, "step": 3110, "valid_targets_mean": 6027.0, "valid_targets_min": 2787 }, { "epoch": 5.065093572009764, "grad_norm": 0.48898341530084205, "learning_rate": 8.625360944736262e-06, "loss": 0.2436, "loss_nan_ranks": 0, "loss_rank_avg": 0.11569772660732269, "step": 3115, "valid_targets_mean": 6272.9, "valid_targets_min": 372 }, { "epoch": 5.073230268510985, "grad_norm": 0.5956493423805724, "learning_rate": 8.558752721137089e-06, "loss": 0.2469, "loss_nan_ranks": 0, "loss_rank_avg": 0.1290283203125, "step": 3120, "valid_targets_mean": 5507.6, "valid_targets_min": 3024 }, { "epoch": 5.081366965012205, "grad_norm": 0.5660632743523386, "learning_rate": 8.492332599488157e-06, "loss": 0.2324, "loss_nan_ranks": 0, "loss_rank_avg": 0.10170029103755951, "step": 3125, "valid_targets_mean": 4242.0, "valid_targets_min": 541 }, { "epoch": 5.089503661513426, "grad_norm": 0.5887922517647676, "learning_rate": 8.42610167178183e-06, "loss": 0.2397, "loss_nan_ranks": 0, "loss_rank_avg": 0.15197445452213287, "step": 3130, "valid_targets_mean": 5382.2, "valid_targets_min": 3204 }, { "epoch": 5.097640358014646, "grad_norm": 0.487011491561986, "learning_rate": 8.360061026899962e-06, "loss": 0.2207, "loss_nan_ranks": 0, "loss_rank_avg": 0.12325992435216904, "step": 3135, "valid_targets_mean": 8065.1, "valid_targets_min": 3117 }, { "epoch": 5.105777054515866, "grad_norm": 0.5182417975398911, "learning_rate": 8.294211750596035e-06, "loss": 0.2457, "loss_nan_ranks": 0, "loss_rank_avg": 0.09405682235956192, "step": 3140, "valid_targets_mean": 5815.0, "valid_targets_min": 466 }, { "epoch": 5.113913751017087, "grad_norm": 0.5322887135274532, "learning_rate": 8.228554925477306e-06, "loss": 0.2349, "loss_nan_ranks": 0, "loss_rank_avg": 0.11751969158649445, "step": 3145, "valid_targets_mean": 6338.4, "valid_targets_min": 2067 }, { "epoch": 5.1220504475183075, "grad_norm": 0.5012197400585588, "learning_rate": 8.163091630987e-06, "loss": 0.2327, "loss_nan_ranks": 0, "loss_rank_avg": 0.16712604463100433, "step": 3150, "valid_targets_mean": 6505.2, "valid_targets_min": 2195 }, { "epoch": 5.130187144019528, "grad_norm": 0.5774573904412683, "learning_rate": 8.097822943386563e-06, "loss": 0.2308, "loss_nan_ranks": 0, "loss_rank_avg": 0.14454790949821472, "step": 3155, "valid_targets_mean": 5446.6, "valid_targets_min": 2004 }, { "epoch": 5.138323840520749, "grad_norm": 0.5165060277624411, "learning_rate": 8.03274993573797e-06, "loss": 0.2424, "loss_nan_ranks": 0, "loss_rank_avg": 0.14901450276374817, "step": 3160, "valid_targets_mean": 6276.4, "valid_targets_min": 3350 }, { "epoch": 5.146460537021969, "grad_norm": 0.4804753447195192, "learning_rate": 7.96787367788609e-06, "loss": 0.2401, "loss_nan_ranks": 0, "loss_rank_avg": 0.11782047897577286, "step": 3165, "valid_targets_mean": 6550.2, "valid_targets_min": 1879 }, { "epoch": 5.15459723352319, "grad_norm": 0.6535091078691466, "learning_rate": 7.903195236441086e-06, "loss": 0.2505, "loss_nan_ranks": 0, "loss_rank_avg": 0.11725549399852753, "step": 3170, "valid_targets_mean": 6698.9, "valid_targets_min": 1744 }, { "epoch": 5.16273393002441, "grad_norm": 0.4259935959590437, "learning_rate": 7.838715674760874e-06, "loss": 0.2298, "loss_nan_ranks": 0, "loss_rank_avg": 0.0984138548374176, "step": 3175, "valid_targets_mean": 7291.5, "valid_targets_min": 2757 }, { "epoch": 5.17087062652563, "grad_norm": 0.5362331748478609, "learning_rate": 7.774436052933675e-06, "loss": 0.2413, "loss_nan_ranks": 0, "loss_rank_avg": 0.1301015317440033, "step": 3180, "valid_targets_mean": 5733.1, "valid_targets_min": 2704 }, { "epoch": 5.179007323026851, "grad_norm": 0.4742304640079011, "learning_rate": 7.710357427760541e-06, "loss": 0.2339, "loss_nan_ranks": 0, "loss_rank_avg": 0.11534355580806732, "step": 3185, "valid_targets_mean": 7236.4, "valid_targets_min": 897 }, { "epoch": 5.187144019528072, "grad_norm": 0.5344847333949452, "learning_rate": 7.646480852738008e-06, "loss": 0.2286, "loss_nan_ranks": 0, "loss_rank_avg": 0.11348524689674377, "step": 3190, "valid_targets_mean": 6580.0, "valid_targets_min": 1862 }, { "epoch": 5.195280716029292, "grad_norm": 0.5127549344284401, "learning_rate": 7.5828073780407575e-06, "loss": 0.2188, "loss_nan_ranks": 0, "loss_rank_avg": 0.12163542211055756, "step": 3195, "valid_targets_mean": 7134.1, "valid_targets_min": 4067 }, { "epoch": 5.203417412530513, "grad_norm": 0.43286097887389563, "learning_rate": 7.51933805050439e-06, "loss": 0.2315, "loss_nan_ranks": 0, "loss_rank_avg": 0.11376143991947174, "step": 3200, "valid_targets_mean": 9556.1, "valid_targets_min": 3383 }, { "epoch": 5.211554109031733, "grad_norm": 0.574180003978773, "learning_rate": 7.45607391360816e-06, "loss": 0.243, "loss_nan_ranks": 0, "loss_rank_avg": 0.0861620083451271, "step": 3205, "valid_targets_mean": 3932.6, "valid_targets_min": 1533 }, { "epoch": 5.219690805532954, "grad_norm": 0.6356603119387289, "learning_rate": 7.393016007457858e-06, "loss": 0.2561, "loss_nan_ranks": 0, "loss_rank_avg": 0.19337713718414307, "step": 3210, "valid_targets_mean": 6120.9, "valid_targets_min": 3426 }, { "epoch": 5.227827502034174, "grad_norm": 0.7725829783966397, "learning_rate": 7.3301653687687005e-06, "loss": 0.2272, "loss_nan_ranks": 0, "loss_rank_avg": 0.1038031131029129, "step": 3215, "valid_targets_mean": 5630.2, "valid_targets_min": 1724 }, { "epoch": 5.235964198535394, "grad_norm": 0.6539324695436758, "learning_rate": 7.2675230308482715e-06, "loss": 0.2431, "loss_nan_ranks": 0, "loss_rank_avg": 0.12459734082221985, "step": 3220, "valid_targets_mean": 7373.1, "valid_targets_min": 4269 }, { "epoch": 5.244100895036615, "grad_norm": 0.5030860212842273, "learning_rate": 7.205090023579575e-06, "loss": 0.2533, "loss_nan_ranks": 0, "loss_rank_avg": 0.12467215210199356, "step": 3225, "valid_targets_mean": 6925.0, "valid_targets_min": 2743 }, { "epoch": 5.252237591537836, "grad_norm": 0.5831950972097935, "learning_rate": 7.142867373404054e-06, "loss": 0.2374, "loss_nan_ranks": 0, "loss_rank_avg": 0.120590440928936, "step": 3230, "valid_targets_mean": 5793.6, "valid_targets_min": 1388 }, { "epoch": 5.260374288039056, "grad_norm": 0.550231410324282, "learning_rate": 7.080856103304739e-06, "loss": 0.237, "loss_nan_ranks": 0, "loss_rank_avg": 0.12391173839569092, "step": 3235, "valid_targets_mean": 5339.4, "valid_targets_min": 3466 }, { "epoch": 5.268510984540277, "grad_norm": 0.5759308774766279, "learning_rate": 7.019057232789432e-06, "loss": 0.2432, "loss_nan_ranks": 0, "loss_rank_avg": 0.11659073829650879, "step": 3240, "valid_targets_mean": 4783.8, "valid_targets_min": 1721 }, { "epoch": 5.2766476810414975, "grad_norm": 0.6119869770255949, "learning_rate": 6.95747177787393e-06, "loss": 0.2461, "loss_nan_ranks": 0, "loss_rank_avg": 0.12066857516765594, "step": 3245, "valid_targets_mean": 5504.8, "valid_targets_min": 2771 }, { "epoch": 5.284784377542717, "grad_norm": 0.4599465517768359, "learning_rate": 6.896100751065355e-06, "loss": 0.2296, "loss_nan_ranks": 0, "loss_rank_avg": 0.10617942363023758, "step": 3250, "valid_targets_mean": 6689.1, "valid_targets_min": 4081 }, { "epoch": 5.292921074043938, "grad_norm": 0.6272025768366799, "learning_rate": 6.834945161345458e-06, "loss": 0.2316, "loss_nan_ranks": 0, "loss_rank_avg": 0.12755145132541656, "step": 3255, "valid_targets_mean": 5025.0, "valid_targets_min": 1015 }, { "epoch": 5.3010577705451585, "grad_norm": 0.6127725285042429, "learning_rate": 6.7740060141540735e-06, "loss": 0.2573, "loss_nan_ranks": 0, "loss_rank_avg": 0.13596072793006897, "step": 3260, "valid_targets_mean": 3870.8, "valid_targets_min": 614 }, { "epoch": 5.309194467046379, "grad_norm": 0.6393405669196937, "learning_rate": 6.713284311372559e-06, "loss": 0.261, "loss_nan_ranks": 0, "loss_rank_avg": 0.13608285784721375, "step": 3265, "valid_targets_mean": 3831.1, "valid_targets_min": 1395 }, { "epoch": 5.3173311635476, "grad_norm": 0.519005266223286, "learning_rate": 6.652781051307347e-06, "loss": 0.26, "loss_nan_ranks": 0, "loss_rank_avg": 0.09571771323680878, "step": 3270, "valid_targets_mean": 5871.8, "valid_targets_min": 1771 }, { "epoch": 5.32546786004882, "grad_norm": 0.4801756872745154, "learning_rate": 6.592497228673515e-06, "loss": 0.2335, "loss_nan_ranks": 0, "loss_rank_avg": 0.09945647418498993, "step": 3275, "valid_targets_mean": 5828.0, "valid_targets_min": 3637 }, { "epoch": 5.333604556550041, "grad_norm": 0.6255645015728781, "learning_rate": 6.532433834578449e-06, "loss": 0.2354, "loss_nan_ranks": 0, "loss_rank_avg": 0.1372753381729126, "step": 3280, "valid_targets_mean": 5747.9, "valid_targets_min": 2363 }, { "epoch": 5.341741253051262, "grad_norm": 0.5792091744981441, "learning_rate": 6.472591856505526e-06, "loss": 0.2479, "loss_nan_ranks": 0, "loss_rank_avg": 0.12719324231147766, "step": 3285, "valid_targets_mean": 5969.4, "valid_targets_min": 3258 }, { "epoch": 5.349877949552481, "grad_norm": 0.46470017871854946, "learning_rate": 6.412972278297893e-06, "loss": 0.2525, "loss_nan_ranks": 0, "loss_rank_avg": 0.0882813110947609, "step": 3290, "valid_targets_mean": 6402.1, "valid_targets_min": 774 }, { "epoch": 5.358014646053702, "grad_norm": 0.521223858319776, "learning_rate": 6.353576080142309e-06, "loss": 0.2289, "loss_nan_ranks": 0, "loss_rank_avg": 0.11632373183965683, "step": 3295, "valid_targets_mean": 6959.1, "valid_targets_min": 5246 }, { "epoch": 5.3661513425549225, "grad_norm": 0.5413214801922716, "learning_rate": 6.294404238552994e-06, "loss": 0.2363, "loss_nan_ranks": 0, "loss_rank_avg": 0.13462717831134796, "step": 3300, "valid_targets_mean": 6453.6, "valid_targets_min": 3165 }, { "epoch": 5.374288039056143, "grad_norm": 0.5573148190013232, "learning_rate": 6.235457726355591e-06, "loss": 0.2378, "loss_nan_ranks": 0, "loss_rank_avg": 0.08801619708538055, "step": 3305, "valid_targets_mean": 4524.6, "valid_targets_min": 903 }, { "epoch": 5.382424735557364, "grad_norm": 0.606307196821786, "learning_rate": 6.176737512671182e-06, "loss": 0.243, "loss_nan_ranks": 0, "loss_rank_avg": 0.13813389837741852, "step": 3310, "valid_targets_mean": 4672.2, "valid_targets_min": 1451 }, { "epoch": 5.390561432058584, "grad_norm": 0.6132589856336323, "learning_rate": 6.11824456290034e-06, "loss": 0.2434, "loss_nan_ranks": 0, "loss_rank_avg": 0.1388852894306183, "step": 3315, "valid_targets_mean": 7884.9, "valid_targets_min": 3424 }, { "epoch": 5.398698128559805, "grad_norm": 0.5924080709083809, "learning_rate": 6.05997983870727e-06, "loss": 0.2343, "loss_nan_ranks": 0, "loss_rank_avg": 0.17288537323474884, "step": 3320, "valid_targets_mean": 4974.5, "valid_targets_min": 1145 }, { "epoch": 5.406834825061026, "grad_norm": 0.5457228907298186, "learning_rate": 6.00194429800399e-06, "loss": 0.2486, "loss_nan_ranks": 0, "loss_rank_avg": 0.13619005680084229, "step": 3325, "valid_targets_mean": 5901.8, "valid_targets_min": 1958 }, { "epoch": 5.414971521562245, "grad_norm": 0.5079754475219553, "learning_rate": 5.944138894934582e-06, "loss": 0.2362, "loss_nan_ranks": 0, "loss_rank_avg": 0.13231110572814941, "step": 3330, "valid_targets_mean": 4886.6, "valid_targets_min": 1461 }, { "epoch": 5.423108218063466, "grad_norm": 0.5492790566828493, "learning_rate": 5.886564579859504e-06, "loss": 0.2228, "loss_nan_ranks": 0, "loss_rank_avg": 0.10987076908349991, "step": 3335, "valid_targets_mean": 4042.6, "valid_targets_min": 397 }, { "epoch": 5.431244914564687, "grad_norm": 0.5765503149421513, "learning_rate": 5.829222299339969e-06, "loss": 0.2256, "loss_nan_ranks": 0, "loss_rank_avg": 0.09734175354242325, "step": 3340, "valid_targets_mean": 4017.5, "valid_targets_min": 687 }, { "epoch": 5.439381611065907, "grad_norm": 0.4945201441893148, "learning_rate": 5.772112996122403e-06, "loss": 0.2588, "loss_nan_ranks": 0, "loss_rank_avg": 0.12293386459350586, "step": 3345, "valid_targets_mean": 6276.8, "valid_targets_min": 1669 }, { "epoch": 5.447518307567128, "grad_norm": 0.5241675442790266, "learning_rate": 5.715237609122896e-06, "loss": 0.2226, "loss_nan_ranks": 0, "loss_rank_avg": 0.13944748044013977, "step": 3350, "valid_targets_mean": 6314.0, "valid_targets_min": 4246 }, { "epoch": 5.4556550040683485, "grad_norm": 0.5086698627055527, "learning_rate": 5.658597073411816e-06, "loss": 0.2394, "loss_nan_ranks": 0, "loss_rank_avg": 0.10946042835712433, "step": 3355, "valid_targets_mean": 4947.4, "valid_targets_min": 803 }, { "epoch": 5.463791700569569, "grad_norm": 0.5087935856854946, "learning_rate": 5.602192320198401e-06, "loss": 0.2447, "loss_nan_ranks": 0, "loss_rank_avg": 0.11571265012025833, "step": 3360, "valid_targets_mean": 4712.5, "valid_targets_min": 768 }, { "epoch": 5.471928397070789, "grad_norm": 0.6209480221847946, "learning_rate": 5.546024276815467e-06, "loss": 0.2363, "loss_nan_ranks": 0, "loss_rank_avg": 0.12471382319927216, "step": 3365, "valid_targets_mean": 6229.0, "valid_targets_min": 2774 }, { "epoch": 5.480065093572009, "grad_norm": 0.5740469197183198, "learning_rate": 5.490093866704171e-06, "loss": 0.2464, "loss_nan_ranks": 0, "loss_rank_avg": 0.15511798858642578, "step": 3370, "valid_targets_mean": 5492.1, "valid_targets_min": 2163 }, { "epoch": 5.48820179007323, "grad_norm": 0.5005163631534619, "learning_rate": 5.434402009398798e-06, "loss": 0.2506, "loss_nan_ranks": 0, "loss_rank_avg": 0.10742124915122986, "step": 3375, "valid_targets_mean": 5065.9, "valid_targets_min": 1052 }, { "epoch": 5.496338486574451, "grad_norm": 0.5671784567412589, "learning_rate": 5.378949620511671e-06, "loss": 0.2348, "loss_nan_ranks": 0, "loss_rank_avg": 0.11315690726041794, "step": 3380, "valid_targets_mean": 3717.4, "valid_targets_min": 1470 }, { "epoch": 5.504475183075671, "grad_norm": 0.4360799056624353, "learning_rate": 5.3237376117180854e-06, "loss": 0.2393, "loss_nan_ranks": 0, "loss_rank_avg": 0.0977911725640297, "step": 3385, "valid_targets_mean": 6910.8, "valid_targets_min": 3082 }, { "epoch": 5.512611879576892, "grad_norm": 0.5142900343224198, "learning_rate": 5.268766890741315e-06, "loss": 0.2582, "loss_nan_ranks": 0, "loss_rank_avg": 0.13378457725048065, "step": 3390, "valid_targets_mean": 6389.2, "valid_targets_min": 3445 }, { "epoch": 5.5207485760781125, "grad_norm": 0.5602434630005119, "learning_rate": 5.214038361337719e-06, "loss": 0.2594, "loss_nan_ranks": 0, "loss_rank_avg": 0.10973970592021942, "step": 3395, "valid_targets_mean": 4815.2, "valid_targets_min": 1484 }, { "epoch": 5.528885272579333, "grad_norm": 0.5342812643462996, "learning_rate": 5.159552923281841e-06, "loss": 0.259, "loss_nan_ranks": 0, "loss_rank_avg": 0.0758785754442215, "step": 3400, "valid_targets_mean": 4529.4, "valid_targets_min": 2360 }, { "epoch": 5.537021969080554, "grad_norm": 0.5716216749186573, "learning_rate": 5.105311472351639e-06, "loss": 0.2308, "loss_nan_ranks": 0, "loss_rank_avg": 0.121833935379982, "step": 3405, "valid_targets_mean": 5706.9, "valid_targets_min": 4080 }, { "epoch": 5.5451586655817735, "grad_norm": 0.43346386249748464, "learning_rate": 5.051314900313764e-06, "loss": 0.2351, "loss_nan_ranks": 0, "loss_rank_avg": 0.07879453897476196, "step": 3410, "valid_targets_mean": 5555.4, "valid_targets_min": 3770 }, { "epoch": 5.553295362082994, "grad_norm": 0.49340156082331843, "learning_rate": 4.997564094908878e-06, "loss": 0.2508, "loss_nan_ranks": 0, "loss_rank_avg": 0.12145587801933289, "step": 3415, "valid_targets_mean": 6155.6, "valid_targets_min": 2387 }, { "epoch": 5.561432058584215, "grad_norm": 0.47890012005963234, "learning_rate": 4.944059939837082e-06, "loss": 0.2475, "loss_nan_ranks": 0, "loss_rank_avg": 0.12839338183403015, "step": 3420, "valid_targets_mean": 6536.0, "valid_targets_min": 1825 }, { "epoch": 5.569568755085435, "grad_norm": 0.4903125361830746, "learning_rate": 4.890803314743371e-06, "loss": 0.255, "loss_nan_ranks": 0, "loss_rank_avg": 0.11269734799861908, "step": 3425, "valid_targets_mean": 5621.2, "valid_targets_min": 3511 }, { "epoch": 5.577705451586656, "grad_norm": 0.5283918720724791, "learning_rate": 4.837795095203175e-06, "loss": 0.2306, "loss_nan_ranks": 0, "loss_rank_avg": 0.10433046519756317, "step": 3430, "valid_targets_mean": 5621.9, "valid_targets_min": 2251 }, { "epoch": 5.585842148087877, "grad_norm": 0.6026011579728354, "learning_rate": 4.785036152707969e-06, "loss": 0.2434, "loss_nan_ranks": 0, "loss_rank_avg": 0.12681570649147034, "step": 3435, "valid_targets_mean": 4668.2, "valid_targets_min": 2544 }, { "epoch": 5.593978844589097, "grad_norm": 0.6061374193583238, "learning_rate": 4.732527354650951e-06, "loss": 0.2432, "loss_nan_ranks": 0, "loss_rank_avg": 0.13143488764762878, "step": 3440, "valid_targets_mean": 4703.0, "valid_targets_min": 1974 }, { "epoch": 5.602115541090317, "grad_norm": 0.5221796158770693, "learning_rate": 4.68026956431276e-06, "loss": 0.2277, "loss_nan_ranks": 0, "loss_rank_avg": 0.149415522813797, "step": 3445, "valid_targets_mean": 6412.0, "valid_targets_min": 4008 }, { "epoch": 5.610252237591538, "grad_norm": 0.576901307893142, "learning_rate": 4.628263640847304e-06, "loss": 0.2455, "loss_nan_ranks": 0, "loss_rank_avg": 0.12277019023895264, "step": 3450, "valid_targets_mean": 5465.6, "valid_targets_min": 3759 }, { "epoch": 5.618388934092758, "grad_norm": 0.5641514509002485, "learning_rate": 4.5765104392676205e-06, "loss": 0.2356, "loss_nan_ranks": 0, "loss_rank_avg": 0.13894778490066528, "step": 3455, "valid_targets_mean": 5405.1, "valid_targets_min": 1513 }, { "epoch": 5.626525630593979, "grad_norm": 0.7340535896041918, "learning_rate": 4.525010810431825e-06, "loss": 0.2406, "loss_nan_ranks": 0, "loss_rank_avg": 0.13835415244102478, "step": 3460, "valid_targets_mean": 3785.0, "valid_targets_min": 2039 }, { "epoch": 5.634662327095199, "grad_norm": 0.5034917359869234, "learning_rate": 4.4737656010291366e-06, "loss": 0.2356, "loss_nan_ranks": 0, "loss_rank_avg": 0.1569593846797943, "step": 3465, "valid_targets_mean": 8556.2, "valid_targets_min": 4927 }, { "epoch": 5.64279902359642, "grad_norm": 0.6255736017643779, "learning_rate": 4.422775653565934e-06, "loss": 0.2356, "loss_nan_ranks": 0, "loss_rank_avg": 0.10940764844417572, "step": 3470, "valid_targets_mean": 4768.1, "valid_targets_min": 1338 }, { "epoch": 5.650935720097641, "grad_norm": 0.46222130787565185, "learning_rate": 4.372041806351914e-06, "loss": 0.2516, "loss_nan_ranks": 0, "loss_rank_avg": 0.12370267510414124, "step": 3475, "valid_targets_mean": 6039.4, "valid_targets_min": 2221 }, { "epoch": 5.65907241659886, "grad_norm": 0.7151061983633159, "learning_rate": 4.321564893486312e-06, "loss": 0.2519, "loss_nan_ranks": 0, "loss_rank_avg": 0.10197927057743073, "step": 3480, "valid_targets_mean": 5656.9, "valid_targets_min": 3191 }, { "epoch": 5.667209113100081, "grad_norm": 0.4612178221303647, "learning_rate": 4.271345744844182e-06, "loss": 0.2125, "loss_nan_ranks": 0, "loss_rank_avg": 0.07878731191158295, "step": 3485, "valid_targets_mean": 5026.6, "valid_targets_min": 781 }, { "epoch": 5.675345809601302, "grad_norm": 0.5034775896468006, "learning_rate": 4.2213851860627696e-06, "loss": 0.2415, "loss_nan_ranks": 0, "loss_rank_avg": 0.11451518535614014, "step": 3490, "valid_targets_mean": 5065.0, "valid_targets_min": 3912 }, { "epoch": 5.683482506102522, "grad_norm": 0.48370829828670214, "learning_rate": 4.171684038527914e-06, "loss": 0.2475, "loss_nan_ranks": 0, "loss_rank_avg": 0.1177678257226944, "step": 3495, "valid_targets_mean": 5450.1, "valid_targets_min": 2203 }, { "epoch": 5.691619202603743, "grad_norm": 0.4915476071311832, "learning_rate": 4.12224311936056e-06, "loss": 0.2312, "loss_nan_ranks": 0, "loss_rank_avg": 0.11996840685606003, "step": 3500, "valid_targets_mean": 7179.9, "valid_targets_min": 4365 }, { "epoch": 5.6997558991049635, "grad_norm": 0.5337016634168994, "learning_rate": 4.073063241403316e-06, "loss": 0.2425, "loss_nan_ranks": 0, "loss_rank_avg": 0.12122653424739838, "step": 3505, "valid_targets_mean": 5070.0, "valid_targets_min": 784 }, { "epoch": 5.707892595606184, "grad_norm": 0.5853690423707902, "learning_rate": 4.024145213207103e-06, "loss": 0.2474, "loss_nan_ranks": 0, "loss_rank_avg": 0.10927228629589081, "step": 3510, "valid_targets_mean": 4184.2, "valid_targets_min": 867 }, { "epoch": 5.716029292107405, "grad_norm": 0.5353891362994679, "learning_rate": 3.975489839017846e-06, "loss": 0.2312, "loss_nan_ranks": 0, "loss_rank_avg": 0.12216495722532272, "step": 3515, "valid_targets_mean": 5225.1, "valid_targets_min": 949 }, { "epoch": 5.724165988608625, "grad_norm": 0.9481430336242733, "learning_rate": 3.9270979187632516e-06, "loss": 0.2422, "loss_nan_ranks": 0, "loss_rank_avg": 0.12332406640052795, "step": 3520, "valid_targets_mean": 5509.9, "valid_targets_min": 2682 }, { "epoch": 5.732302685109845, "grad_norm": 0.47893060639696544, "learning_rate": 3.878970248039678e-06, "loss": 0.2557, "loss_nan_ranks": 0, "loss_rank_avg": 0.1404319554567337, "step": 3525, "valid_targets_mean": 7358.9, "valid_targets_min": 3809 }, { "epoch": 5.740439381611066, "grad_norm": 0.509875821596104, "learning_rate": 3.831107618099026e-06, "loss": 0.2331, "loss_nan_ranks": 0, "loss_rank_avg": 0.19203639030456543, "step": 3530, "valid_targets_mean": 6786.8, "valid_targets_min": 2958 }, { "epoch": 5.748576078112286, "grad_norm": 0.47911534628300395, "learning_rate": 3.7835108158357537e-06, "loss": 0.2331, "loss_nan_ranks": 0, "loss_rank_avg": 0.12184299528598785, "step": 3535, "valid_targets_mean": 7290.6, "valid_targets_min": 3489 }, { "epoch": 5.756712774613507, "grad_norm": 0.45486474848191916, "learning_rate": 3.7361806237739264e-06, "loss": 0.2317, "loss_nan_ranks": 0, "loss_rank_avg": 0.08215008676052094, "step": 3540, "valid_targets_mean": 5637.9, "valid_targets_min": 1196 }, { "epoch": 5.764849471114728, "grad_norm": 0.5210595475392571, "learning_rate": 3.689117820054351e-06, "loss": 0.2434, "loss_nan_ranks": 0, "loss_rank_avg": 0.08964404463768005, "step": 3545, "valid_targets_mean": 5758.0, "valid_targets_min": 2964 }, { "epoch": 5.772986167615948, "grad_norm": 0.5267608109326574, "learning_rate": 3.6423231784217918e-06, "loss": 0.2421, "loss_nan_ranks": 0, "loss_rank_avg": 0.14031247794628143, "step": 3550, "valid_targets_mean": 6369.0, "valid_targets_min": 1512 }, { "epoch": 5.781122864117169, "grad_norm": 0.5326050285350579, "learning_rate": 3.595797468212241e-06, "loss": 0.2419, "loss_nan_ranks": 0, "loss_rank_avg": 0.10683193802833557, "step": 3555, "valid_targets_mean": 4920.4, "valid_targets_min": 806 }, { "epoch": 5.7892595606183885, "grad_norm": 0.47240098718567736, "learning_rate": 3.549541454340284e-06, "loss": 0.2249, "loss_nan_ranks": 0, "loss_rank_avg": 0.07187937200069427, "step": 3560, "valid_targets_mean": 4559.9, "valid_targets_min": 556 }, { "epoch": 5.797396257119609, "grad_norm": 0.5523118981586366, "learning_rate": 3.503555897286499e-06, "loss": 0.2582, "loss_nan_ranks": 0, "loss_rank_avg": 0.1383015513420105, "step": 3565, "valid_targets_mean": 6232.8, "valid_targets_min": 3199 }, { "epoch": 5.80553295362083, "grad_norm": 0.47382486470602847, "learning_rate": 3.4578415530849794e-06, "loss": 0.2435, "loss_nan_ranks": 0, "loss_rank_avg": 0.10226757824420929, "step": 3570, "valid_targets_mean": 6907.6, "valid_targets_min": 2369 }, { "epoch": 5.81366965012205, "grad_norm": 0.559498744815589, "learning_rate": 3.4123991733108852e-06, "loss": 0.248, "loss_nan_ranks": 0, "loss_rank_avg": 0.11900554597377777, "step": 3575, "valid_targets_mean": 4755.1, "valid_targets_min": 1019 }, { "epoch": 5.821806346623271, "grad_norm": 0.5114120203304382, "learning_rate": 3.3672295050680946e-06, "loss": 0.2333, "loss_nan_ranks": 0, "loss_rank_avg": 0.14657077193260193, "step": 3580, "valid_targets_mean": 6173.2, "valid_targets_min": 3078 }, { "epoch": 5.829943043124492, "grad_norm": 0.9817994961771758, "learning_rate": 3.322333290976936e-06, "loss": 0.2523, "loss_nan_ranks": 0, "loss_rank_avg": 0.13037019968032837, "step": 3585, "valid_targets_mean": 4806.9, "valid_targets_min": 948 }, { "epoch": 5.838079739625712, "grad_norm": 0.49960877842083473, "learning_rate": 3.2777112691619473e-06, "loss": 0.2481, "loss_nan_ranks": 0, "loss_rank_avg": 0.11504438519477844, "step": 3590, "valid_targets_mean": 5366.2, "valid_targets_min": 3196 }, { "epoch": 5.846216436126932, "grad_norm": 0.5060382703438006, "learning_rate": 3.233364173239766e-06, "loss": 0.234, "loss_nan_ranks": 0, "loss_rank_avg": 0.11748774349689484, "step": 3595, "valid_targets_mean": 5511.2, "valid_targets_min": 2098 }, { "epoch": 5.854353132628153, "grad_norm": 0.5646071765030719, "learning_rate": 3.189292732307052e-06, "loss": 0.2311, "loss_nan_ranks": 0, "loss_rank_avg": 0.11946381628513336, "step": 3600, "valid_targets_mean": 5497.6, "valid_targets_min": 3401 }, { "epoch": 5.862489829129373, "grad_norm": 1.9085216141047994, "learning_rate": 3.1454976709285124e-06, "loss": 0.2563, "loss_nan_ranks": 0, "loss_rank_avg": 0.12498481571674347, "step": 3605, "valid_targets_mean": 5483.4, "valid_targets_min": 756 }, { "epoch": 5.870626525630594, "grad_norm": 0.6119847782021685, "learning_rate": 3.1019797091249938e-06, "loss": 0.2352, "loss_nan_ranks": 0, "loss_rank_avg": 0.1357029676437378, "step": 3610, "valid_targets_mean": 4750.2, "valid_targets_min": 1614 }, { "epoch": 5.8787632221318145, "grad_norm": 0.5952452103733551, "learning_rate": 3.058739562361621e-06, "loss": 0.245, "loss_nan_ranks": 0, "loss_rank_avg": 0.12497454881668091, "step": 3615, "valid_targets_mean": 4917.1, "valid_targets_min": 3716 }, { "epoch": 5.886899918633035, "grad_norm": 0.5378260436755556, "learning_rate": 3.015777941536058e-06, "loss": 0.2383, "loss_nan_ranks": 0, "loss_rank_avg": 0.10903813689947128, "step": 3620, "valid_targets_mean": 4843.9, "valid_targets_min": 2199 }, { "epoch": 5.895036615134256, "grad_norm": 0.5888457289118504, "learning_rate": 2.973095552966805e-06, "loss": 0.2584, "loss_nan_ranks": 0, "loss_rank_avg": 0.13942526280879974, "step": 3625, "valid_targets_mean": 5965.9, "valid_targets_min": 3408 }, { "epoch": 5.903173311635476, "grad_norm": 0.5111041219072542, "learning_rate": 2.9306930983816005e-06, "loss": 0.2357, "loss_nan_ranks": 0, "loss_rank_avg": 0.15496578812599182, "step": 3630, "valid_targets_mean": 6038.0, "valid_targets_min": 1693 }, { "epoch": 5.911310008136697, "grad_norm": 0.5794364971608068, "learning_rate": 2.8885712749058737e-06, "loss": 0.2496, "loss_nan_ranks": 0, "loss_rank_avg": 0.1413809061050415, "step": 3635, "valid_targets_mean": 5439.6, "valid_targets_min": 1362 }, { "epoch": 5.919446704637917, "grad_norm": 0.498196696749723, "learning_rate": 2.8467307750512808e-06, "loss": 0.2649, "loss_nan_ranks": 0, "loss_rank_avg": 0.14829573035240173, "step": 3640, "valid_targets_mean": 7339.1, "valid_targets_min": 1391 }, { "epoch": 5.927583401139137, "grad_norm": 0.5485087375601867, "learning_rate": 2.80517228670433e-06, "loss": 0.2395, "loss_nan_ranks": 0, "loss_rank_avg": 0.12239962071180344, "step": 3645, "valid_targets_mean": 5950.1, "valid_targets_min": 1544 }, { "epoch": 5.935720097640358, "grad_norm": 0.9852713752535961, "learning_rate": 2.7638964931150637e-06, "loss": 0.258, "loss_nan_ranks": 0, "loss_rank_avg": 0.13210991024971008, "step": 3650, "valid_targets_mean": 5893.9, "valid_targets_min": 1385 }, { "epoch": 5.9438567941415785, "grad_norm": 0.5176163129021438, "learning_rate": 2.7229040728858323e-06, "loss": 0.2477, "loss_nan_ranks": 0, "loss_rank_avg": 0.10251633077859879, "step": 3655, "valid_targets_mean": 5866.8, "valid_targets_min": 2058 }, { "epoch": 5.951993490642799, "grad_norm": 0.553870107905142, "learning_rate": 2.6821956999601306e-06, "loss": 0.2427, "loss_nan_ranks": 0, "loss_rank_avg": 0.11761283129453659, "step": 3660, "valid_targets_mean": 4549.0, "valid_targets_min": 504 }, { "epoch": 5.96013018714402, "grad_norm": 0.5622284508277662, "learning_rate": 2.641772043611521e-06, "loss": 0.2462, "loss_nan_ranks": 0, "loss_rank_avg": 0.11832987517118454, "step": 3665, "valid_targets_mean": 5334.1, "valid_targets_min": 1997 }, { "epoch": 5.96826688364524, "grad_norm": 0.6002412417162024, "learning_rate": 2.6016337684326342e-06, "loss": 0.2257, "loss_nan_ranks": 0, "loss_rank_avg": 0.1252046376466751, "step": 3670, "valid_targets_mean": 5856.5, "valid_targets_min": 670 }, { "epoch": 5.97640358014646, "grad_norm": 0.5820259812808503, "learning_rate": 2.5617815343242327e-06, "loss": 0.2502, "loss_nan_ranks": 0, "loss_rank_avg": 0.15230754017829895, "step": 3675, "valid_targets_mean": 5588.6, "valid_targets_min": 1374 }, { "epoch": 5.984540276647681, "grad_norm": 0.5006926676913205, "learning_rate": 2.522215996484374e-06, "loss": 0.2351, "loss_nan_ranks": 0, "loss_rank_avg": 0.10319880396127701, "step": 3680, "valid_targets_mean": 5475.5, "valid_targets_min": 2095 }, { "epoch": 5.992676973148901, "grad_norm": 0.4818010996292355, "learning_rate": 2.4829378053976318e-06, "loss": 0.226, "loss_nan_ranks": 0, "loss_rank_avg": 0.12096649408340454, "step": 3685, "valid_targets_mean": 6174.9, "valid_targets_min": 3864 }, { "epoch": 6.0, "grad_norm": 0.7286610952593501, "learning_rate": 2.4439476068243927e-06, "loss": 0.2288, "loss_nan_ranks": 0, "loss_rank_avg": 0.2138330638408661, "step": 3690, "valid_targets_mean": 5464.5, "valid_targets_min": 1291 }, { "epoch": 6.008136696501221, "grad_norm": 0.5858367728890088, "learning_rate": 2.4052460417902613e-06, "loss": 0.2364, "loss_nan_ranks": 0, "loss_rank_avg": 0.14344994723796844, "step": 3695, "valid_targets_mean": 5086.1, "valid_targets_min": 1582 }, { "epoch": 6.016273393002441, "grad_norm": 0.5202481454299519, "learning_rate": 2.3668337465754985e-06, "loss": 0.2395, "loss_nan_ranks": 0, "loss_rank_avg": 0.10779225826263428, "step": 3700, "valid_targets_mean": 6387.1, "valid_targets_min": 2931 }, { "epoch": 6.024410089503662, "grad_norm": 0.45889546479866966, "learning_rate": 2.3287113527045823e-06, "loss": 0.228, "loss_nan_ranks": 0, "loss_rank_avg": 0.1384791135787964, "step": 3705, "valid_targets_mean": 8278.0, "valid_targets_min": 3366 }, { "epoch": 6.032546786004882, "grad_norm": 0.5089628731085755, "learning_rate": 2.2908794869358044e-06, "loss": 0.2524, "loss_nan_ranks": 0, "loss_rank_avg": 0.15829752385616302, "step": 3710, "valid_targets_mean": 6261.4, "valid_targets_min": 2457 }, { "epoch": 6.040683482506102, "grad_norm": 0.5462143117486035, "learning_rate": 2.253338771250977e-06, "loss": 0.2276, "loss_nan_ranks": 0, "loss_rank_avg": 0.08127269148826599, "step": 3715, "valid_targets_mean": 3890.1, "valid_targets_min": 1056 }, { "epoch": 6.048820179007323, "grad_norm": 0.5707430580005115, "learning_rate": 2.216089822845211e-06, "loss": 0.2298, "loss_nan_ranks": 0, "loss_rank_avg": 0.09576968103647232, "step": 3720, "valid_targets_mean": 4583.1, "valid_targets_min": 606 }, { "epoch": 6.0569568755085434, "grad_norm": 0.4608492749702116, "learning_rate": 2.1791332541167497e-06, "loss": 0.2159, "loss_nan_ranks": 0, "loss_rank_avg": 0.0854940190911293, "step": 3725, "valid_targets_mean": 5545.5, "valid_targets_min": 1019 }, { "epoch": 6.065093572009764, "grad_norm": 0.5002751592382064, "learning_rate": 2.142469672656935e-06, "loss": 0.2319, "loss_nan_ranks": 0, "loss_rank_avg": 0.10318467766046524, "step": 3730, "valid_targets_mean": 6957.6, "valid_targets_min": 3822 }, { "epoch": 6.073230268510985, "grad_norm": 0.570462395210286, "learning_rate": 2.106099681240179e-06, "loss": 0.2221, "loss_nan_ranks": 0, "loss_rank_avg": 0.09837909042835236, "step": 3735, "valid_targets_mean": 4815.5, "valid_targets_min": 1144 }, { "epoch": 6.081366965012205, "grad_norm": 0.5408066637162211, "learning_rate": 2.07002387781408e-06, "loss": 0.2275, "loss_nan_ranks": 0, "loss_rank_avg": 0.15398940443992615, "step": 3740, "valid_targets_mean": 5805.0, "valid_targets_min": 3641 }, { "epoch": 6.089503661513426, "grad_norm": 0.6160653619825817, "learning_rate": 2.0342428554895788e-06, "loss": 0.2604, "loss_nan_ranks": 0, "loss_rank_avg": 0.10584094375371933, "step": 3745, "valid_targets_mean": 4334.1, "valid_targets_min": 767 }, { "epoch": 6.097640358014646, "grad_norm": 0.48826990351762456, "learning_rate": 1.998757202531223e-06, "loss": 0.2392, "loss_nan_ranks": 0, "loss_rank_avg": 0.09239885210990906, "step": 3750, "valid_targets_mean": 5868.6, "valid_targets_min": 391 }, { "epoch": 6.105777054515866, "grad_norm": 0.6379627065382744, "learning_rate": 1.9635675023474764e-06, "loss": 0.2399, "loss_nan_ranks": 0, "loss_rank_avg": 0.11344724893569946, "step": 3755, "valid_targets_mean": 5121.8, "valid_targets_min": 2171 }, { "epoch": 6.113913751017087, "grad_norm": 0.5446797282952438, "learning_rate": 1.92867433348114e-06, "loss": 0.2327, "loss_nan_ranks": 0, "loss_rank_avg": 0.09264282137155533, "step": 3760, "valid_targets_mean": 4778.0, "valid_targets_min": 1570 }, { "epoch": 6.1220504475183075, "grad_norm": 0.626815073545696, "learning_rate": 1.8940782695998305e-06, "loss": 0.241, "loss_nan_ranks": 0, "loss_rank_avg": 0.10249383747577667, "step": 3765, "valid_targets_mean": 5221.0, "valid_targets_min": 3398 }, { "epoch": 6.130187144019528, "grad_norm": 0.5214124493423383, "learning_rate": 1.859779879486565e-06, "loss": 0.2405, "loss_nan_ranks": 0, "loss_rank_avg": 0.13012221455574036, "step": 3770, "valid_targets_mean": 6414.4, "valid_targets_min": 947 }, { "epoch": 6.138323840520749, "grad_norm": 0.4894257977488121, "learning_rate": 1.8257797270303924e-06, "loss": 0.2386, "loss_nan_ranks": 0, "loss_rank_avg": 0.08547305315732956, "step": 3775, "valid_targets_mean": 5550.0, "valid_targets_min": 1010 }, { "epoch": 6.146460537021969, "grad_norm": 0.4914282914782947, "learning_rate": 1.792078371217132e-06, "loss": 0.226, "loss_nan_ranks": 0, "loss_rank_avg": 0.1106870174407959, "step": 3780, "valid_targets_mean": 6550.1, "valid_targets_min": 2920 }, { "epoch": 6.15459723352319, "grad_norm": 0.5426971061042444, "learning_rate": 1.7586763661201821e-06, "loss": 0.2432, "loss_nan_ranks": 0, "loss_rank_avg": 0.0976264476776123, "step": 3785, "valid_targets_mean": 5254.1, "valid_targets_min": 1979 }, { "epoch": 6.16273393002441, "grad_norm": 0.5986618193157306, "learning_rate": 1.7255742608914095e-06, "loss": 0.2421, "loss_nan_ranks": 0, "loss_rank_avg": 0.14822298288345337, "step": 3790, "valid_targets_mean": 5250.0, "valid_targets_min": 1139 }, { "epoch": 6.17087062652563, "grad_norm": 0.5924847870251507, "learning_rate": 1.6927725997521171e-06, "loss": 0.2428, "loss_nan_ranks": 0, "loss_rank_avg": 0.11596965044736862, "step": 3795, "valid_targets_mean": 5393.9, "valid_targets_min": 3392 }, { "epoch": 6.179007323026851, "grad_norm": 0.5014703652224826, "learning_rate": 1.6602719219841135e-06, "loss": 0.2281, "loss_nan_ranks": 0, "loss_rank_avg": 0.09786193817853928, "step": 3800, "valid_targets_mean": 7391.9, "valid_targets_min": 3280 }, { "epoch": 6.187144019528072, "grad_norm": 0.5273515456482646, "learning_rate": 1.6280727619208202e-06, "loss": 0.2386, "loss_nan_ranks": 0, "loss_rank_avg": 0.12879054248332977, "step": 3805, "valid_targets_mean": 5833.8, "valid_targets_min": 1693 }, { "epoch": 6.195280716029292, "grad_norm": 0.5379631945457531, "learning_rate": 1.5961756489385117e-06, "loss": 0.2508, "loss_nan_ranks": 0, "loss_rank_avg": 0.13405945897102356, "step": 3810, "valid_targets_mean": 6324.8, "valid_targets_min": 3480 }, { "epoch": 6.203417412530513, "grad_norm": 0.5506482251419262, "learning_rate": 1.5645811074475915e-06, "loss": 0.2417, "loss_nan_ranks": 0, "loss_rank_avg": 0.1008005291223526, "step": 3815, "valid_targets_mean": 5211.1, "valid_targets_min": 2095 }, { "epoch": 6.211554109031733, "grad_norm": 0.5525468218833477, "learning_rate": 1.533289656883985e-06, "loss": 0.25, "loss_nan_ranks": 0, "loss_rank_avg": 0.12161102890968323, "step": 3820, "valid_targets_mean": 5366.6, "valid_targets_min": 1201 }, { "epoch": 6.219690805532954, "grad_norm": 1.3205892043820247, "learning_rate": 1.5023018117005995e-06, "loss": 0.2254, "loss_nan_ranks": 0, "loss_rank_avg": 0.13536399602890015, "step": 3825, "valid_targets_mean": 5411.5, "valid_targets_min": 976 }, { "epoch": 6.227827502034174, "grad_norm": 0.6399965745417111, "learning_rate": 1.4716180813588566e-06, "loss": 0.2439, "loss_nan_ranks": 0, "loss_rank_avg": 0.14973969757556915, "step": 3830, "valid_targets_mean": 5368.0, "valid_targets_min": 3462 }, { "epoch": 6.235964198535394, "grad_norm": 0.5609556474306848, "learning_rate": 1.44123897032032e-06, "loss": 0.2327, "loss_nan_ranks": 0, "loss_rank_avg": 0.13443996012210846, "step": 3835, "valid_targets_mean": 5981.2, "valid_targets_min": 3215 }, { "epoch": 6.244100895036615, "grad_norm": 0.6385228076191484, "learning_rate": 1.411164978038404e-06, "loss": 0.2434, "loss_nan_ranks": 0, "loss_rank_avg": 0.1237209141254425, "step": 3840, "valid_targets_mean": 4783.6, "valid_targets_min": 1112 }, { "epoch": 6.252237591537836, "grad_norm": 0.6555481944926224, "learning_rate": 1.3813965989501687e-06, "loss": 0.2284, "loss_nan_ranks": 0, "loss_rank_avg": 0.10206277668476105, "step": 3845, "valid_targets_mean": 6029.4, "valid_targets_min": 1648 }, { "epoch": 6.260374288039056, "grad_norm": 0.5440883938396228, "learning_rate": 1.3519343224681758e-06, "loss": 0.2357, "loss_nan_ranks": 0, "loss_rank_avg": 0.13689102232456207, "step": 3850, "valid_targets_mean": 5527.1, "valid_targets_min": 2357 }, { "epoch": 6.268510984540277, "grad_norm": 0.5738449854156686, "learning_rate": 1.3227786329724479e-06, "loss": 0.2403, "loss_nan_ranks": 0, "loss_rank_avg": 0.13260340690612793, "step": 3855, "valid_targets_mean": 4806.5, "valid_targets_min": 1773 }, { "epoch": 6.2766476810414975, "grad_norm": 0.5551324266480604, "learning_rate": 1.2939300098025177e-06, "loss": 0.2333, "loss_nan_ranks": 0, "loss_rank_avg": 0.14535200595855713, "step": 3860, "valid_targets_mean": 5923.5, "valid_targets_min": 919 }, { "epoch": 6.284784377542717, "grad_norm": 0.6073163759364055, "learning_rate": 1.2653889272495223e-06, "loss": 0.2492, "loss_nan_ranks": 0, "loss_rank_avg": 0.10163906216621399, "step": 3865, "valid_targets_mean": 4454.5, "valid_targets_min": 427 }, { "epoch": 6.292921074043938, "grad_norm": 0.6023482154559401, "learning_rate": 1.2371558545484375e-06, "loss": 0.2533, "loss_nan_ranks": 0, "loss_rank_avg": 0.13912144303321838, "step": 3870, "valid_targets_mean": 4576.5, "valid_targets_min": 2053 }, { "epoch": 6.3010577705451585, "grad_norm": 0.4614699781457518, "learning_rate": 1.2092312558703333e-06, "loss": 0.2353, "loss_nan_ranks": 0, "loss_rank_avg": 0.09365392476320267, "step": 3875, "valid_targets_mean": 5213.4, "valid_targets_min": 2221 }, { "epoch": 6.309194467046379, "grad_norm": 0.5158867835539471, "learning_rate": 1.181615590314762e-06, "loss": 0.2338, "loss_nan_ranks": 0, "loss_rank_avg": 0.12160620093345642, "step": 3880, "valid_targets_mean": 6346.5, "valid_targets_min": 3619 }, { "epoch": 6.3173311635476, "grad_norm": 2.2609058090585687, "learning_rate": 1.1543093119021976e-06, "loss": 0.2232, "loss_nan_ranks": 0, "loss_rank_avg": 0.13036061823368073, "step": 3885, "valid_targets_mean": 4674.4, "valid_targets_min": 1355 }, { "epoch": 6.32546786004882, "grad_norm": 0.6835770950079834, "learning_rate": 1.1273128695665814e-06, "loss": 0.2398, "loss_nan_ranks": 0, "loss_rank_avg": 0.16928444802761078, "step": 3890, "valid_targets_mean": 5820.9, "valid_targets_min": 1498 }, { "epoch": 6.333604556550041, "grad_norm": 0.5664875984145479, "learning_rate": 1.1006267071479359e-06, "loss": 0.2381, "loss_nan_ranks": 0, "loss_rank_avg": 0.10270114988088608, "step": 3895, "valid_targets_mean": 5303.8, "valid_targets_min": 1183 }, { "epoch": 6.341741253051262, "grad_norm": 0.4578194482636973, "learning_rate": 1.074251263385071e-06, "loss": 0.2391, "loss_nan_ranks": 0, "loss_rank_avg": 0.08202557265758514, "step": 3900, "valid_targets_mean": 6897.5, "valid_targets_min": 2742 }, { "epoch": 6.349877949552481, "grad_norm": 0.5720561944484039, "learning_rate": 1.0481869719083647e-06, "loss": 0.2629, "loss_nan_ranks": 0, "loss_rank_avg": 0.12599898874759674, "step": 3905, "valid_targets_mean": 4984.6, "valid_targets_min": 1067 }, { "epoch": 6.358014646053702, "grad_norm": 0.5346739530338187, "learning_rate": 1.022434261232641e-06, "loss": 0.2399, "loss_nan_ranks": 0, "loss_rank_avg": 0.18678709864616394, "step": 3910, "valid_targets_mean": 7899.0, "valid_targets_min": 2439 }, { "epoch": 6.3661513425549225, "grad_norm": 0.5245267855591524, "learning_rate": 9.969935547501208e-07, "loss": 0.2414, "loss_nan_ranks": 0, "loss_rank_avg": 0.1010551005601883, "step": 3915, "valid_targets_mean": 5726.0, "valid_targets_min": 2426 }, { "epoch": 6.374288039056143, "grad_norm": 0.577988469761867, "learning_rate": 9.718652707234667e-07, "loss": 0.2296, "loss_nan_ranks": 0, "loss_rank_avg": 0.15215085446834564, "step": 3920, "valid_targets_mean": 6691.8, "valid_targets_min": 741 }, { "epoch": 6.382424735557364, "grad_norm": 0.5313322523199454, "learning_rate": 9.47049822278896e-07, "loss": 0.2479, "loss_nan_ranks": 0, "loss_rank_avg": 0.1224609836935997, "step": 3925, "valid_targets_mean": 7647.4, "valid_targets_min": 3864 }, { "epoch": 6.390561432058584, "grad_norm": 0.5506328179742512, "learning_rate": 9.225476173993941e-07, "loss": 0.2332, "loss_nan_ranks": 0, "loss_rank_avg": 0.11494912952184677, "step": 3930, "valid_targets_mean": 5041.4, "valid_targets_min": 1844 }, { "epoch": 6.398698128559805, "grad_norm": 0.6221746878029165, "learning_rate": 8.983590589180125e-07, "loss": 0.2382, "loss_nan_ranks": 0, "loss_rank_avg": 0.13699518144130707, "step": 3935, "valid_targets_mean": 4982.8, "valid_targets_min": 596 }, { "epoch": 6.406834825061026, "grad_norm": 0.5322907918953855, "learning_rate": 8.744845445112337e-07, "loss": 0.2373, "loss_nan_ranks": 0, "loss_rank_avg": 0.14416161179542542, "step": 3940, "valid_targets_mean": 6786.8, "valid_targets_min": 3528 }, { "epoch": 6.414971521562245, "grad_norm": 0.6032735858410141, "learning_rate": 8.50924466692451e-07, "loss": 0.2294, "loss_nan_ranks": 0, "loss_rank_avg": 0.12138237059116364, "step": 3945, "valid_targets_mean": 5486.4, "valid_targets_min": 1091 }, { "epoch": 6.423108218063466, "grad_norm": 0.6020791332482403, "learning_rate": 8.276792128054967e-07, "loss": 0.2359, "loss_nan_ranks": 0, "loss_rank_avg": 0.11796577274799347, "step": 3950, "valid_targets_mean": 4668.9, "valid_targets_min": 2761 }, { "epoch": 6.431244914564687, "grad_norm": 0.550955973668879, "learning_rate": 8.047491650182815e-07, "loss": 0.2229, "loss_nan_ranks": 0, "loss_rank_avg": 0.14780160784721375, "step": 3955, "valid_targets_mean": 5403.9, "valid_targets_min": 1514 }, { "epoch": 6.439381611065907, "grad_norm": 0.5899929467979808, "learning_rate": 7.821347003165125e-07, "loss": 0.2282, "loss_nan_ranks": 0, "loss_rank_avg": 0.13076281547546387, "step": 3960, "valid_targets_mean": 5458.2, "valid_targets_min": 715 }, { "epoch": 6.447518307567128, "grad_norm": 0.46432249628629235, "learning_rate": 7.598361904974982e-07, "loss": 0.227, "loss_nan_ranks": 0, "loss_rank_avg": 0.103657066822052, "step": 3965, "valid_targets_mean": 5980.2, "valid_targets_min": 4230 }, { "epoch": 6.4556550040683485, "grad_norm": 0.7371030234438611, "learning_rate": 7.378540021640313e-07, "loss": 0.2259, "loss_nan_ranks": 0, "loss_rank_avg": 0.07392923533916473, "step": 3970, "valid_targets_mean": 4101.2, "valid_targets_min": 756 }, { "epoch": 6.463791700569569, "grad_norm": 0.5682466131911814, "learning_rate": 7.161884967183552e-07, "loss": 0.2439, "loss_nan_ranks": 0, "loss_rank_avg": 0.1610821634531021, "step": 3975, "valid_targets_mean": 6404.6, "valid_targets_min": 2554 }, { "epoch": 6.471928397070789, "grad_norm": 0.5442753436375526, "learning_rate": 6.948400303562386e-07, "loss": 0.242, "loss_nan_ranks": 0, "loss_rank_avg": 0.13828691840171814, "step": 3980, "valid_targets_mean": 6081.0, "valid_targets_min": 1105 }, { "epoch": 6.480065093572009, "grad_norm": 0.5290599896063467, "learning_rate": 6.738089540611059e-07, "loss": 0.2064, "loss_nan_ranks": 0, "loss_rank_avg": 0.12780803442001343, "step": 3985, "valid_targets_mean": 5326.5, "valid_targets_min": 3083 }, { "epoch": 6.48820179007323, "grad_norm": 0.4829545021115107, "learning_rate": 6.530956135982713e-07, "loss": 0.2223, "loss_nan_ranks": 0, "loss_rank_avg": 0.07991525530815125, "step": 3990, "valid_targets_mean": 5208.4, "valid_targets_min": 988 }, { "epoch": 6.496338486574451, "grad_norm": 0.4941367346868645, "learning_rate": 6.327003495092565e-07, "loss": 0.2217, "loss_nan_ranks": 0, "loss_rank_avg": 0.09314847737550735, "step": 3995, "valid_targets_mean": 6371.6, "valid_targets_min": 3403 }, { "epoch": 6.504475183075671, "grad_norm": 0.603169711820912, "learning_rate": 6.126234971061861e-07, "loss": 0.2104, "loss_nan_ranks": 0, "loss_rank_avg": 0.14228929579257965, "step": 4000, "valid_targets_mean": 5264.0, "valid_targets_min": 542 }, { "epoch": 6.512611879576892, "grad_norm": 0.5710471143580141, "learning_rate": 5.928653864662815e-07, "loss": 0.2392, "loss_nan_ranks": 0, "loss_rank_avg": 0.15178368985652924, "step": 4005, "valid_targets_mean": 5708.6, "valid_targets_min": 3584 }, { "epoch": 6.5207485760781125, "grad_norm": 0.4842323415856468, "learning_rate": 5.734263424264242e-07, "loss": 0.2311, "loss_nan_ranks": 0, "loss_rank_avg": 0.0898006483912468, "step": 4010, "valid_targets_mean": 5642.4, "valid_targets_min": 1473 }, { "epoch": 6.528885272579333, "grad_norm": 0.5617774998939432, "learning_rate": 5.543066845778345e-07, "loss": 0.2341, "loss_nan_ranks": 0, "loss_rank_avg": 0.14239703118801117, "step": 4015, "valid_targets_mean": 4555.8, "valid_targets_min": 1628 }, { "epoch": 6.537021969080554, "grad_norm": 0.5072944150418117, "learning_rate": 5.355067272607928e-07, "loss": 0.2381, "loss_nan_ranks": 0, "loss_rank_avg": 0.11048190295696259, "step": 4020, "valid_targets_mean": 7035.8, "valid_targets_min": 803 }, { "epoch": 6.5451586655817735, "grad_norm": 0.4954909171386829, "learning_rate": 5.170267795594886e-07, "loss": 0.2159, "loss_nan_ranks": 0, "loss_rank_avg": 0.11649087071418762, "step": 4025, "valid_targets_mean": 6345.4, "valid_targets_min": 2927 }, { "epoch": 6.553295362082994, "grad_norm": 0.6103860123458417, "learning_rate": 4.988671452969329e-07, "loss": 0.2303, "loss_nan_ranks": 0, "loss_rank_avg": 0.10858224332332611, "step": 4030, "valid_targets_mean": 4031.6, "valid_targets_min": 2584 }, { "epoch": 6.561432058584215, "grad_norm": 0.539076716156704, "learning_rate": 4.810281230299674e-07, "loss": 0.2384, "loss_nan_ranks": 0, "loss_rank_avg": 0.10688619315624237, "step": 4035, "valid_targets_mean": 4906.5, "valid_targets_min": 1837 }, { "epoch": 6.569568755085435, "grad_norm": 0.5451844058939661, "learning_rate": 4.6351000604434537e-07, "loss": 0.2302, "loss_nan_ranks": 0, "loss_rank_avg": 0.13301129639148712, "step": 4040, "valid_targets_mean": 6030.0, "valid_targets_min": 3338 }, { "epoch": 6.577705451586656, "grad_norm": 0.6364692773603006, "learning_rate": 4.463130823499273e-07, "loss": 0.2342, "loss_nan_ranks": 0, "loss_rank_avg": 0.1468641757965088, "step": 4045, "valid_targets_mean": 5677.6, "valid_targets_min": 560 }, { "epoch": 6.585842148087877, "grad_norm": 0.5318256719237091, "learning_rate": 4.2943763467592436e-07, "loss": 0.2393, "loss_nan_ranks": 0, "loss_rank_avg": 0.10516038537025452, "step": 4050, "valid_targets_mean": 4711.4, "valid_targets_min": 1877 }, { "epoch": 6.593978844589097, "grad_norm": 0.5509512683634988, "learning_rate": 4.12883940466271e-07, "loss": 0.2359, "loss_nan_ranks": 0, "loss_rank_avg": 0.10421756654977798, "step": 4055, "valid_targets_mean": 4614.4, "valid_targets_min": 2460 }, { "epoch": 6.602115541090317, "grad_norm": 0.5200751439970589, "learning_rate": 3.9665227187505097e-07, "loss": 0.232, "loss_nan_ranks": 0, "loss_rank_avg": 0.10616647452116013, "step": 4060, "valid_targets_mean": 4184.4, "valid_targets_min": 2193 }, { "epoch": 6.610252237591538, "grad_norm": 0.5747208042923473, "learning_rate": 3.8074289576202295e-07, "loss": 0.2396, "loss_nan_ranks": 0, "loss_rank_avg": 0.11532352864742279, "step": 4065, "valid_targets_mean": 4391.8, "valid_targets_min": 2875 }, { "epoch": 6.618388934092758, "grad_norm": 0.5442269160669613, "learning_rate": 3.6515607368824203e-07, "loss": 0.249, "loss_nan_ranks": 0, "loss_rank_avg": 0.14139285683631897, "step": 4070, "valid_targets_mean": 5408.9, "valid_targets_min": 1305 }, { "epoch": 6.626525630593979, "grad_norm": 0.6566336791778115, "learning_rate": 3.498920619117474e-07, "loss": 0.2525, "loss_nan_ranks": 0, "loss_rank_avg": 0.10617846250534058, "step": 4075, "valid_targets_mean": 4429.5, "valid_targets_min": 1337 }, { "epoch": 6.634662327095199, "grad_norm": 0.5122404519465269, "learning_rate": 3.3495111138336147e-07, "loss": 0.2161, "loss_nan_ranks": 0, "loss_rank_avg": 0.10197494924068451, "step": 4080, "valid_targets_mean": 4975.5, "valid_targets_min": 1614 }, { "epoch": 6.64279902359642, "grad_norm": 0.6028082911064025, "learning_rate": 3.203334677425529e-07, "loss": 0.2185, "loss_nan_ranks": 0, "loss_rank_avg": 0.09473268687725067, "step": 4085, "valid_targets_mean": 3829.1, "valid_targets_min": 1555 }, { "epoch": 6.650935720097641, "grad_norm": 0.5205649448698142, "learning_rate": 3.060393713134091e-07, "loss": 0.2438, "loss_nan_ranks": 0, "loss_rank_avg": 0.1434570699930191, "step": 4090, "valid_targets_mean": 6809.5, "valid_targets_min": 1572 }, { "epoch": 6.65907241659886, "grad_norm": 0.5601018905652814, "learning_rate": 2.920690571006768e-07, "loss": 0.2317, "loss_nan_ranks": 0, "loss_rank_avg": 0.12937568128108978, "step": 4095, "valid_targets_mean": 7661.0, "valid_targets_min": 1771 }, { "epoch": 6.667209113100081, "grad_norm": 0.6361282605163243, "learning_rate": 2.784227547858964e-07, "loss": 0.2281, "loss_nan_ranks": 0, "loss_rank_avg": 0.0899709165096283, "step": 4100, "valid_targets_mean": 4337.1, "valid_targets_min": 484 }, { "epoch": 6.675345809601302, "grad_norm": 0.5508211250858578, "learning_rate": 2.651006887236385e-07, "loss": 0.2437, "loss_nan_ranks": 0, "loss_rank_avg": 0.09255590289831161, "step": 4105, "valid_targets_mean": 5757.0, "valid_targets_min": 3592 }, { "epoch": 6.683482506102522, "grad_norm": 0.5929185382963317, "learning_rate": 2.52103077937802e-07, "loss": 0.2272, "loss_nan_ranks": 0, "loss_rank_avg": 0.11462150514125824, "step": 4110, "valid_targets_mean": 8654.9, "valid_targets_min": 687 }, { "epoch": 6.691619202603743, "grad_norm": 0.5406995619531852, "learning_rate": 2.394301361180218e-07, "loss": 0.2228, "loss_nan_ranks": 0, "loss_rank_avg": 0.09833990037441254, "step": 4115, "valid_targets_mean": 5543.6, "valid_targets_min": 1684 }, { "epoch": 6.6997558991049635, "grad_norm": 0.5202765802597007, "learning_rate": 2.2708207161615147e-07, "loss": 0.2468, "loss_nan_ranks": 0, "loss_rank_avg": 0.12440069019794464, "step": 4120, "valid_targets_mean": 6339.9, "valid_targets_min": 2935 }, { "epoch": 6.707892595606184, "grad_norm": 0.5477566339180919, "learning_rate": 2.150590874428371e-07, "loss": 0.2523, "loss_nan_ranks": 0, "loss_rank_avg": 0.16028626263141632, "step": 4125, "valid_targets_mean": 6068.5, "valid_targets_min": 665 }, { "epoch": 6.716029292107405, "grad_norm": 0.5263469114319956, "learning_rate": 2.0336138126417994e-07, "loss": 0.2271, "loss_nan_ranks": 0, "loss_rank_avg": 0.12802526354789734, "step": 4130, "valid_targets_mean": 6818.8, "valid_targets_min": 3843 }, { "epoch": 6.724165988608625, "grad_norm": 0.6239937148070356, "learning_rate": 1.9198914539849455e-07, "loss": 0.2216, "loss_nan_ranks": 0, "loss_rank_avg": 0.10577556490898132, "step": 4135, "valid_targets_mean": 4284.1, "valid_targets_min": 524 }, { "epoch": 6.732302685109845, "grad_norm": 0.5786354008011593, "learning_rate": 1.8094256681313593e-07, "loss": 0.2474, "loss_nan_ranks": 0, "loss_rank_avg": 0.17910592257976532, "step": 4140, "valid_targets_mean": 5484.6, "valid_targets_min": 1652 }, { "epoch": 6.740439381611066, "grad_norm": 0.6573268588625598, "learning_rate": 1.702218271214262e-07, "loss": 0.2349, "loss_nan_ranks": 0, "loss_rank_avg": 0.12595227360725403, "step": 4145, "valid_targets_mean": 4625.1, "valid_targets_min": 1444 }, { "epoch": 6.748576078112286, "grad_norm": 0.4184562575542007, "learning_rate": 1.598271025796816e-07, "loss": 0.2231, "loss_nan_ranks": 0, "loss_rank_avg": 0.09041139483451843, "step": 4150, "valid_targets_mean": 5593.0, "valid_targets_min": 1619 }, { "epoch": 6.756712774613507, "grad_norm": 0.49775516096636063, "learning_rate": 1.4975856408429912e-07, "loss": 0.2491, "loss_nan_ranks": 0, "loss_rank_avg": 0.12942853569984436, "step": 4155, "valid_targets_mean": 4617.5, "valid_targets_min": 1893 }, { "epoch": 6.764849471114728, "grad_norm": 0.5158152468576911, "learning_rate": 1.4001637716895445e-07, "loss": 0.2393, "loss_nan_ranks": 0, "loss_rank_avg": 0.12505996227264404, "step": 4160, "valid_targets_mean": 5568.4, "valid_targets_min": 2868 }, { "epoch": 6.772986167615948, "grad_norm": 0.45862764208578194, "learning_rate": 1.3060070200188179e-07, "loss": 0.2396, "loss_nan_ranks": 0, "loss_rank_avg": 0.09306715428829193, "step": 4165, "valid_targets_mean": 7481.6, "valid_targets_min": 1395 }, { "epoch": 6.781122864117169, "grad_norm": 0.5484801191580874, "learning_rate": 1.215116933832361e-07, "loss": 0.2237, "loss_nan_ranks": 0, "loss_rank_avg": 0.0996013730764389, "step": 4170, "valid_targets_mean": 5064.8, "valid_targets_min": 1288 }, { "epoch": 6.7892595606183885, "grad_norm": 0.5432376350068135, "learning_rate": 1.1274950074255053e-07, "loss": 0.2303, "loss_nan_ranks": 0, "loss_rank_avg": 0.14020952582359314, "step": 4175, "valid_targets_mean": 5912.4, "valid_targets_min": 3887 }, { "epoch": 6.797396257119609, "grad_norm": 0.63592955162879, "learning_rate": 1.0431426813628298e-07, "loss": 0.2326, "loss_nan_ranks": 0, "loss_rank_avg": 0.14750230312347412, "step": 4180, "valid_targets_mean": 6155.6, "valid_targets_min": 2960 }, { "epoch": 6.80553295362083, "grad_norm": 0.5502827308580879, "learning_rate": 9.62061342454379e-08, "loss": 0.2434, "loss_nan_ranks": 0, "loss_rank_avg": 0.08104512095451355, "step": 4185, "valid_targets_mean": 4188.5, "valid_targets_min": 1325 }, { "epoch": 6.81366965012205, "grad_norm": 0.5325444503557673, "learning_rate": 8.842523237329925e-08, "loss": 0.2459, "loss_nan_ranks": 0, "loss_rank_avg": 0.12346133589744568, "step": 4190, "valid_targets_mean": 6763.8, "valid_targets_min": 1068 }, { "epoch": 6.821806346623271, "grad_norm": 0.546512190706496, "learning_rate": 8.097169044322561e-08, "loss": 0.2315, "loss_nan_ranks": 0, "loss_rank_avg": 0.1239863932132721, "step": 4195, "valid_targets_mean": 5937.0, "valid_targets_min": 2620 }, { "epoch": 6.829943043124492, "grad_norm": 0.5906532640459007, "learning_rate": 7.38456309965585e-08, "loss": 0.2467, "loss_nan_ranks": 0, "loss_rank_avg": 0.12631988525390625, "step": 4200, "valid_targets_mean": 5960.2, "valid_targets_min": 2942 }, { "epoch": 6.838079739625712, "grad_norm": 0.6953061985356663, "learning_rate": 6.7047171190604e-08, "loss": 0.2305, "loss_nan_ranks": 0, "loss_rank_avg": 0.13684195280075073, "step": 4205, "valid_targets_mean": 4888.6, "valid_targets_min": 2983 }, { "epoch": 6.846216436126932, "grad_norm": 0.5425415272735113, "learning_rate": 6.057642279669874e-08, "loss": 0.2589, "loss_nan_ranks": 0, "loss_rank_avg": 0.10478918999433517, "step": 4210, "valid_targets_mean": 4543.4, "valid_targets_min": 1180 }, { "epoch": 6.854353132628153, "grad_norm": 0.48291552518428543, "learning_rate": 5.4433492198386895e-08, "loss": 0.2596, "loss_nan_ranks": 0, "loss_rank_avg": 0.16383056342601776, "step": 4215, "valid_targets_mean": 7361.4, "valid_targets_min": 4819 }, { "epoch": 6.862489829129373, "grad_norm": 0.5655144988352875, "learning_rate": 4.861848038965722e-08, "loss": 0.2372, "loss_nan_ranks": 0, "loss_rank_avg": 0.1411811113357544, "step": 4220, "valid_targets_mean": 5598.1, "valid_targets_min": 2990 }, { "epoch": 6.870626525630594, "grad_norm": 0.477678998506917, "learning_rate": 4.313148297328873e-08, "loss": 0.2522, "loss_nan_ranks": 0, "loss_rank_avg": 0.14228369295597076, "step": 4225, "valid_targets_mean": 6497.6, "valid_targets_min": 3097 }, { "epoch": 6.8787632221318145, "grad_norm": 0.581502670933742, "learning_rate": 3.797259015928534e-08, "loss": 0.2586, "loss_nan_ranks": 0, "loss_rank_avg": 0.15068471431732178, "step": 4230, "valid_targets_mean": 4712.4, "valid_targets_min": 2505 }, { "epoch": 6.886899918633035, "grad_norm": 0.4756280191630647, "learning_rate": 3.314188676338148e-08, "loss": 0.2493, "loss_nan_ranks": 0, "loss_rank_avg": 0.1089138463139534, "step": 4235, "valid_targets_mean": 5755.9, "valid_targets_min": 2892 }, { "epoch": 6.895036615134256, "grad_norm": 0.5398206094881605, "learning_rate": 2.863945220565434e-08, "loss": 0.2367, "loss_nan_ranks": 0, "loss_rank_avg": 0.11508828401565552, "step": 4240, "valid_targets_mean": 5286.5, "valid_targets_min": 2360 }, { "epoch": 6.903173311635476, "grad_norm": 0.5717657037216582, "learning_rate": 2.4465360509211555e-08, "loss": 0.2308, "loss_nan_ranks": 0, "loss_rank_avg": 0.13908590376377106, "step": 4245, "valid_targets_mean": 5737.0, "valid_targets_min": 2518 }, { "epoch": 6.911310008136697, "grad_norm": 0.5554985915270165, "learning_rate": 2.0619680298983313e-08, "loss": 0.2441, "loss_nan_ranks": 0, "loss_rank_avg": 0.11254111677408218, "step": 4250, "valid_targets_mean": 4905.9, "valid_targets_min": 792 }, { "epoch": 6.919446704637917, "grad_norm": 0.5218369286912145, "learning_rate": 1.7102474800592128e-08, "loss": 0.2359, "loss_nan_ranks": 0, "loss_rank_avg": 0.13761496543884277, "step": 4255, "valid_targets_mean": 5413.0, "valid_targets_min": 2422 }, { "epoch": 6.927583401139137, "grad_norm": 0.5381548129002338, "learning_rate": 1.3913801839307017e-08, "loss": 0.2511, "loss_nan_ranks": 0, "loss_rank_avg": 0.14477401971817017, "step": 4260, "valid_targets_mean": 6205.5, "valid_targets_min": 558 }, { "epoch": 6.935720097640358, "grad_norm": 0.44713106150780874, "learning_rate": 1.105371383909759e-08, "loss": 0.2383, "loss_nan_ranks": 0, "loss_rank_avg": 0.10858777165412903, "step": 4265, "valid_targets_mean": 8534.0, "valid_targets_min": 1522 }, { "epoch": 6.9438567941415785, "grad_norm": 0.5274514347290213, "learning_rate": 8.522257821770296e-09, "loss": 0.2491, "loss_nan_ranks": 0, "loss_rank_avg": 0.1236865222454071, "step": 4270, "valid_targets_mean": 6043.4, "valid_targets_min": 3334 }, { "epoch": 6.951993490642799, "grad_norm": 0.5801773088235224, "learning_rate": 6.319475406200148e-09, "loss": 0.2203, "loss_nan_ranks": 0, "loss_rank_avg": 0.11447873711585999, "step": 4275, "valid_targets_mean": 4326.0, "valid_targets_min": 2843 }, { "epoch": 6.96013018714402, "grad_norm": 0.5965479996719061, "learning_rate": 4.445402807637944e-09, "loss": 0.2364, "loss_nan_ranks": 0, "loss_rank_avg": 0.13095706701278687, "step": 4280, "valid_targets_mean": 5125.6, "valid_targets_min": 3083 }, { "epoch": 6.96826688364524, "grad_norm": 0.596073208594123, "learning_rate": 2.9000708371240695e-09, "loss": 0.2456, "loss_nan_ranks": 0, "loss_rank_avg": 0.12374962121248245, "step": 4285, "valid_targets_mean": 4898.1, "valid_targets_min": 1390 }, { "epoch": 6.97640358014646, "grad_norm": 0.547455008958649, "learning_rate": 1.6835049009755745e-09, "loss": 0.2368, "loss_nan_ranks": 0, "loss_rank_avg": 0.13343475759029388, "step": 4290, "valid_targets_mean": 6155.8, "valid_targets_min": 1121 }, { "epoch": 6.984540276647681, "grad_norm": 0.5017858705960277, "learning_rate": 7.9572500036873e-10, "loss": 0.2129, "loss_nan_ranks": 0, "loss_rank_avg": 0.11443660408258438, "step": 4295, "valid_targets_mean": 7366.5, "valid_targets_min": 3418 }, { "epoch": 6.992676973148901, "grad_norm": 0.5649590473030836, "learning_rate": 2.367457310170629e-10, "loss": 0.2423, "loss_nan_ranks": 0, "loss_rank_avg": 0.168892502784729, "step": 4300, "valid_targets_mean": 6009.1, "valid_targets_min": 3140 }, { "epoch": 7.0, "grad_norm": 0.6042592466198581, "learning_rate": 6.5762829204452095e-12, "loss": 0.2148, "loss_nan_ranks": 0, "loss_rank_avg": 0.17104065418243408, "step": 4305, "valid_targets_mean": 7242.6, "valid_targets_min": 3287 }, { "epoch": 7.0, "loss_nan_ranks": 0, "loss_rank_avg": 0.17104065418243408, "step": 4305, "total_flos": 2.6783135993776046e+18, "train_loss": 0.2845736916749181, "train_runtime": 62000.2676, "train_samples_per_second": 1.109, "train_steps_per_second": 0.069, "valid_targets_mean": 7242.6, "valid_targets_min": 3287 } ], "logging_steps": 5, "max_steps": 4305, "num_input_tokens_seen": 0, "num_train_epochs": 7, "save_steps": 1500, "stateful_callbacks": { "TrainerControl": { "args": { "should_epoch_stop": false, "should_evaluate": false, "should_log": false, "should_save": true, "should_training_stop": true }, "attributes": {} } }, "total_flos": 2.6783135993776046e+18, "train_batch_size": 1, "trial_name": null, "trial_params": null }