{ "best_global_step": null, "best_metric": null, "best_model_checkpoint": null, "epoch": 7.0, "eval_steps": 500, "global_step": 4389, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.007974481658692184, "grad_norm": 22.539601593654673, "learning_rate": 3.644646924829157e-07, "loss": 0.7236, "loss_nan_ranks": 0, "loss_rank_avg": 0.7600098848342896, "step": 5, "valid_targets_mean": 4851.9, "valid_targets_min": 237 }, { "epoch": 0.01594896331738437, "grad_norm": 23.275682007480874, "learning_rate": 8.200455580865605e-07, "loss": 0.7422, "loss_nan_ranks": 0, "loss_rank_avg": 0.7550889253616333, "step": 10, "valid_targets_mean": 4153.7, "valid_targets_min": 269 }, { "epoch": 0.023923444976076555, "grad_norm": 21.554468206830432, "learning_rate": 1.2756264236902052e-06, "loss": 0.7207, "loss_nan_ranks": 0, "loss_rank_avg": 0.7336411476135254, "step": 15, "valid_targets_mean": 5106.7, "valid_targets_min": 266 }, { "epoch": 0.03189792663476874, "grad_norm": 17.34512536090768, "learning_rate": 1.7312072892938498e-06, "loss": 0.6838, "loss_nan_ranks": 0, "loss_rank_avg": 0.7120847702026367, "step": 20, "valid_targets_mean": 4411.2, "valid_targets_min": 235 }, { "epoch": 0.03987240829346093, "grad_norm": 9.588441353519025, "learning_rate": 2.1867881548974945e-06, "loss": 0.6246, "loss_nan_ranks": 0, "loss_rank_avg": 0.6012063026428223, "step": 25, "valid_targets_mean": 4489.4, "valid_targets_min": 200 }, { "epoch": 0.04784688995215311, "grad_norm": 4.870389531616145, "learning_rate": 2.642369020501139e-06, "loss": 0.5402, "loss_nan_ranks": 0, "loss_rank_avg": 0.4939027726650238, "step": 30, "valid_targets_mean": 5847.0, "valid_targets_min": 315 }, { "epoch": 0.05582137161084529, "grad_norm": 2.7658562996335365, "learning_rate": 3.0979498861047843e-06, "loss": 0.5073, "loss_nan_ranks": 0, "loss_rank_avg": 0.4871441423892975, "step": 35, "valid_targets_mean": 5392.2, "valid_targets_min": 495 }, { "epoch": 0.06379585326953748, "grad_norm": 1.6108362387448016, "learning_rate": 3.5535307517084285e-06, "loss": 0.4935, "loss_nan_ranks": 0, "loss_rank_avg": 0.47061264514923096, "step": 40, "valid_targets_mean": 5388.4, "valid_targets_min": 208 }, { "epoch": 0.07177033492822966, "grad_norm": 1.3386250154648769, "learning_rate": 4.009111617312073e-06, "loss": 0.4709, "loss_nan_ranks": 0, "loss_rank_avg": 0.4864431619644165, "step": 45, "valid_targets_mean": 4927.4, "valid_targets_min": 817 }, { "epoch": 0.07974481658692185, "grad_norm": 0.9037410217035577, "learning_rate": 4.464692482915718e-06, "loss": 0.436, "loss_nan_ranks": 0, "loss_rank_avg": 0.37901973724365234, "step": 50, "valid_targets_mean": 5363.9, "valid_targets_min": 344 }, { "epoch": 0.08771929824561403, "grad_norm": 0.8962668028470888, "learning_rate": 4.920273348519363e-06, "loss": 0.4353, "loss_nan_ranks": 0, "loss_rank_avg": 0.42550718784332275, "step": 55, "valid_targets_mean": 4650.9, "valid_targets_min": 214 }, { "epoch": 0.09569377990430622, "grad_norm": 0.7175155926848071, "learning_rate": 5.375854214123008e-06, "loss": 0.3996, "loss_nan_ranks": 0, "loss_rank_avg": 0.379960298538208, "step": 60, "valid_targets_mean": 5349.0, "valid_targets_min": 1052 }, { "epoch": 0.10366826156299841, "grad_norm": 0.6623643426461047, "learning_rate": 5.831435079726651e-06, "loss": 0.4053, "loss_nan_ranks": 0, "loss_rank_avg": 0.43091630935668945, "step": 65, "valid_targets_mean": 5121.9, "valid_targets_min": 207 }, { "epoch": 0.11164274322169059, "grad_norm": 0.6754894343009573, "learning_rate": 6.287015945330297e-06, "loss": 0.3789, "loss_nan_ranks": 0, "loss_rank_avg": 0.43398618698120117, "step": 70, "valid_targets_mean": 4971.6, "valid_targets_min": 290 }, { "epoch": 0.11961722488038277, "grad_norm": 0.5515059112771347, "learning_rate": 6.742596810933942e-06, "loss": 0.377, "loss_nan_ranks": 0, "loss_rank_avg": 0.36535507440567017, "step": 75, "valid_targets_mean": 5889.2, "valid_targets_min": 237 }, { "epoch": 0.12759170653907495, "grad_norm": 0.5773732873387002, "learning_rate": 7.1981776765375854e-06, "loss": 0.3822, "loss_nan_ranks": 0, "loss_rank_avg": 0.3957010507583618, "step": 80, "valid_targets_mean": 5604.6, "valid_targets_min": 1493 }, { "epoch": 0.13556618819776714, "grad_norm": 0.551936709789771, "learning_rate": 7.65375854214123e-06, "loss": 0.367, "loss_nan_ranks": 0, "loss_rank_avg": 0.3580014705657959, "step": 85, "valid_targets_mean": 5206.6, "valid_targets_min": 239 }, { "epoch": 0.14354066985645933, "grad_norm": 0.5490810118496819, "learning_rate": 8.109339407744875e-06, "loss": 0.3317, "loss_nan_ranks": 0, "loss_rank_avg": 0.33477139472961426, "step": 90, "valid_targets_mean": 5279.1, "valid_targets_min": 366 }, { "epoch": 0.15151515151515152, "grad_norm": 0.5212462100646008, "learning_rate": 8.564920273348521e-06, "loss": 0.3344, "loss_nan_ranks": 0, "loss_rank_avg": 0.3179510235786438, "step": 95, "valid_targets_mean": 5520.1, "valid_targets_min": 551 }, { "epoch": 0.1594896331738437, "grad_norm": 0.5483602561286001, "learning_rate": 9.020501138952164e-06, "loss": 0.3226, "loss_nan_ranks": 0, "loss_rank_avg": 0.3079075217247009, "step": 100, "valid_targets_mean": 4469.1, "valid_targets_min": 247 }, { "epoch": 0.1674641148325359, "grad_norm": 0.5163840976300561, "learning_rate": 9.47608200455581e-06, "loss": 0.3105, "loss_nan_ranks": 0, "loss_rank_avg": 0.2911684513092041, "step": 105, "valid_targets_mean": 4836.1, "valid_targets_min": 245 }, { "epoch": 0.17543859649122806, "grad_norm": 0.49241293958882054, "learning_rate": 9.931662870159453e-06, "loss": 0.3284, "loss_nan_ranks": 0, "loss_rank_avg": 0.32421791553497314, "step": 110, "valid_targets_mean": 4989.3, "valid_targets_min": 259 }, { "epoch": 0.18341307814992025, "grad_norm": 0.6731661811960075, "learning_rate": 1.03872437357631e-05, "loss": 0.3137, "loss_nan_ranks": 0, "loss_rank_avg": 0.3411160111427307, "step": 115, "valid_targets_mean": 3303.2, "valid_targets_min": 220 }, { "epoch": 0.19138755980861244, "grad_norm": 0.6093925029848669, "learning_rate": 1.0842824601366744e-05, "loss": 0.3187, "loss_nan_ranks": 0, "loss_rank_avg": 0.30621105432510376, "step": 120, "valid_targets_mean": 5066.4, "valid_targets_min": 269 }, { "epoch": 0.19936204146730463, "grad_norm": 0.5593908924009113, "learning_rate": 1.1298405466970387e-05, "loss": 0.3142, "loss_nan_ranks": 0, "loss_rank_avg": 0.3183234632015228, "step": 125, "valid_targets_mean": 6049.1, "valid_targets_min": 346 }, { "epoch": 0.20733652312599682, "grad_norm": 0.6050357561923428, "learning_rate": 1.1753986332574032e-05, "loss": 0.3054, "loss_nan_ranks": 0, "loss_rank_avg": 0.3018328547477722, "step": 130, "valid_targets_mean": 4385.7, "valid_targets_min": 241 }, { "epoch": 0.215311004784689, "grad_norm": 0.49058884266137975, "learning_rate": 1.2209567198177677e-05, "loss": 0.2968, "loss_nan_ranks": 0, "loss_rank_avg": 0.29568153619766235, "step": 135, "valid_targets_mean": 5280.4, "valid_targets_min": 260 }, { "epoch": 0.22328548644338117, "grad_norm": 0.4997292646119957, "learning_rate": 1.2665148063781323e-05, "loss": 0.3086, "loss_nan_ranks": 0, "loss_rank_avg": 0.3315421938896179, "step": 140, "valid_targets_mean": 6060.2, "valid_targets_min": 237 }, { "epoch": 0.23125996810207336, "grad_norm": 0.5787387582389717, "learning_rate": 1.3120728929384968e-05, "loss": 0.3011, "loss_nan_ranks": 0, "loss_rank_avg": 0.29679274559020996, "step": 145, "valid_targets_mean": 3525.4, "valid_targets_min": 226 }, { "epoch": 0.23923444976076555, "grad_norm": 0.5372974158957257, "learning_rate": 1.357630979498861e-05, "loss": 0.3089, "loss_nan_ranks": 0, "loss_rank_avg": 0.28743451833724976, "step": 150, "valid_targets_mean": 4102.1, "valid_targets_min": 224 }, { "epoch": 0.24720893141945774, "grad_norm": 0.4870503108003043, "learning_rate": 1.4031890660592255e-05, "loss": 0.2994, "loss_nan_ranks": 0, "loss_rank_avg": 0.2642919421195984, "step": 155, "valid_targets_mean": 5220.6, "valid_targets_min": 253 }, { "epoch": 0.2551834130781499, "grad_norm": 0.5266528254525839, "learning_rate": 1.4487471526195902e-05, "loss": 0.2805, "loss_nan_ranks": 0, "loss_rank_avg": 0.28630515933036804, "step": 160, "valid_targets_mean": 5168.8, "valid_targets_min": 255 }, { "epoch": 0.2631578947368421, "grad_norm": 0.5363668887252679, "learning_rate": 1.4943052391799546e-05, "loss": 0.281, "loss_nan_ranks": 0, "loss_rank_avg": 0.2562587559223175, "step": 165, "valid_targets_mean": 4222.8, "valid_targets_min": 229 }, { "epoch": 0.2711323763955343, "grad_norm": 0.5652284763255125, "learning_rate": 1.539863325740319e-05, "loss": 0.2808, "loss_nan_ranks": 0, "loss_rank_avg": 0.27037516236305237, "step": 170, "valid_targets_mean": 4190.6, "valid_targets_min": 206 }, { "epoch": 0.27910685805422647, "grad_norm": 0.5317822792661527, "learning_rate": 1.5854214123006836e-05, "loss": 0.2886, "loss_nan_ranks": 0, "loss_rank_avg": 0.2907927334308624, "step": 175, "valid_targets_mean": 5068.0, "valid_targets_min": 161 }, { "epoch": 0.28708133971291866, "grad_norm": 0.5849656228564338, "learning_rate": 1.630979498861048e-05, "loss": 0.2857, "loss_nan_ranks": 0, "loss_rank_avg": 0.30426454544067383, "step": 180, "valid_targets_mean": 4185.5, "valid_targets_min": 437 }, { "epoch": 0.29505582137161085, "grad_norm": 0.43284955804317315, "learning_rate": 1.6765375854214125e-05, "loss": 0.2777, "loss_nan_ranks": 0, "loss_rank_avg": 0.2738342881202698, "step": 185, "valid_targets_mean": 6524.4, "valid_targets_min": 245 }, { "epoch": 0.30303030303030304, "grad_norm": 0.5173143108613342, "learning_rate": 1.722095671981777e-05, "loss": 0.2886, "loss_nan_ranks": 0, "loss_rank_avg": 0.29575982689857483, "step": 190, "valid_targets_mean": 4829.8, "valid_targets_min": 238 }, { "epoch": 0.31100478468899523, "grad_norm": 0.4761442663752431, "learning_rate": 1.7676537585421415e-05, "loss": 0.2853, "loss_nan_ranks": 0, "loss_rank_avg": 0.29583317041397095, "step": 195, "valid_targets_mean": 5772.1, "valid_targets_min": 1205 }, { "epoch": 0.3189792663476874, "grad_norm": 0.5018234043143022, "learning_rate": 1.813211845102506e-05, "loss": 0.2836, "loss_nan_ranks": 0, "loss_rank_avg": 0.31572768092155457, "step": 200, "valid_targets_mean": 5848.1, "valid_targets_min": 763 }, { "epoch": 0.3269537480063796, "grad_norm": 0.5455291918243139, "learning_rate": 1.8587699316628704e-05, "loss": 0.275, "loss_nan_ranks": 0, "loss_rank_avg": 0.2614780366420746, "step": 205, "valid_targets_mean": 4031.1, "valid_targets_min": 234 }, { "epoch": 0.3349282296650718, "grad_norm": 0.5022211222995883, "learning_rate": 1.904328018223235e-05, "loss": 0.2829, "loss_nan_ranks": 0, "loss_rank_avg": 0.27170923352241516, "step": 210, "valid_targets_mean": 5658.9, "valid_targets_min": 683 }, { "epoch": 0.34290271132376393, "grad_norm": 0.5363369685681201, "learning_rate": 1.9498861047835993e-05, "loss": 0.2654, "loss_nan_ranks": 0, "loss_rank_avg": 0.27169087529182434, "step": 215, "valid_targets_mean": 5476.3, "valid_targets_min": 3242 }, { "epoch": 0.3508771929824561, "grad_norm": 0.5138610867517525, "learning_rate": 1.9954441913439638e-05, "loss": 0.2785, "loss_nan_ranks": 0, "loss_rank_avg": 0.24844178557395935, "step": 220, "valid_targets_mean": 4867.3, "valid_targets_min": 222 }, { "epoch": 0.3588516746411483, "grad_norm": 0.45211684676685016, "learning_rate": 2.0410022779043283e-05, "loss": 0.2635, "loss_nan_ranks": 0, "loss_rank_avg": 0.25427666306495667, "step": 225, "valid_targets_mean": 6399.5, "valid_targets_min": 1011 }, { "epoch": 0.3668261562998405, "grad_norm": 0.5281985035133087, "learning_rate": 2.0865603644646927e-05, "loss": 0.2784, "loss_nan_ranks": 0, "loss_rank_avg": 0.26478126645088196, "step": 230, "valid_targets_mean": 4467.6, "valid_targets_min": 234 }, { "epoch": 0.3748006379585327, "grad_norm": 0.49350328076325595, "learning_rate": 2.1321184510250572e-05, "loss": 0.2785, "loss_nan_ranks": 0, "loss_rank_avg": 0.2781916856765747, "step": 235, "valid_targets_mean": 5363.7, "valid_targets_min": 308 }, { "epoch": 0.3827751196172249, "grad_norm": 0.5171735546449495, "learning_rate": 2.1776765375854217e-05, "loss": 0.2594, "loss_nan_ranks": 0, "loss_rank_avg": 0.2462097555398941, "step": 240, "valid_targets_mean": 4708.7, "valid_targets_min": 283 }, { "epoch": 0.39074960127591707, "grad_norm": 0.5406966523586195, "learning_rate": 2.223234624145786e-05, "loss": 0.2584, "loss_nan_ranks": 0, "loss_rank_avg": 0.27877381443977356, "step": 245, "valid_targets_mean": 4887.6, "valid_targets_min": 309 }, { "epoch": 0.39872408293460926, "grad_norm": 0.6896080417250773, "learning_rate": 2.2687927107061506e-05, "loss": 0.2626, "loss_nan_ranks": 0, "loss_rank_avg": 0.2548321783542633, "step": 250, "valid_targets_mean": 5287.0, "valid_targets_min": 239 }, { "epoch": 0.40669856459330145, "grad_norm": 0.5173014170367707, "learning_rate": 2.314350797266515e-05, "loss": 0.2683, "loss_nan_ranks": 0, "loss_rank_avg": 0.25407731533050537, "step": 255, "valid_targets_mean": 5538.5, "valid_targets_min": 224 }, { "epoch": 0.41467304625199364, "grad_norm": 0.5161188756710522, "learning_rate": 2.3599088838268792e-05, "loss": 0.2675, "loss_nan_ranks": 0, "loss_rank_avg": 0.23988167941570282, "step": 260, "valid_targets_mean": 4940.8, "valid_targets_min": 271 }, { "epoch": 0.4226475279106858, "grad_norm": 0.6956583936758113, "learning_rate": 2.4054669703872436e-05, "loss": 0.25, "loss_nan_ranks": 0, "loss_rank_avg": 0.24012714624404907, "step": 265, "valid_targets_mean": 3144.9, "valid_targets_min": 248 }, { "epoch": 0.430622009569378, "grad_norm": 0.7718804998493908, "learning_rate": 2.4510250569476085e-05, "loss": 0.2637, "loss_nan_ranks": 0, "loss_rank_avg": 0.2716878056526184, "step": 270, "valid_targets_mean": 5462.4, "valid_targets_min": 3412 }, { "epoch": 0.43859649122807015, "grad_norm": 0.5600994786468025, "learning_rate": 2.496583143507973e-05, "loss": 0.2562, "loss_nan_ranks": 0, "loss_rank_avg": 0.2530458867549896, "step": 275, "valid_targets_mean": 4378.4, "valid_targets_min": 235 }, { "epoch": 0.44657097288676234, "grad_norm": 0.5749427915716706, "learning_rate": 2.5421412300683374e-05, "loss": 0.251, "loss_nan_ranks": 0, "loss_rank_avg": 0.26579219102859497, "step": 280, "valid_targets_mean": 4329.8, "valid_targets_min": 243 }, { "epoch": 0.45454545454545453, "grad_norm": 0.5715496983969146, "learning_rate": 2.587699316628702e-05, "loss": 0.2645, "loss_nan_ranks": 0, "loss_rank_avg": 0.2740967571735382, "step": 285, "valid_targets_mean": 4174.0, "valid_targets_min": 466 }, { "epoch": 0.4625199362041467, "grad_norm": 0.5046434387262629, "learning_rate": 2.6332574031890663e-05, "loss": 0.2637, "loss_nan_ranks": 0, "loss_rank_avg": 0.2572627663612366, "step": 290, "valid_targets_mean": 5345.4, "valid_targets_min": 285 }, { "epoch": 0.4704944178628389, "grad_norm": 0.4924149138472084, "learning_rate": 2.6788154897494308e-05, "loss": 0.265, "loss_nan_ranks": 0, "loss_rank_avg": 0.25392043590545654, "step": 295, "valid_targets_mean": 4933.1, "valid_targets_min": 209 }, { "epoch": 0.4784688995215311, "grad_norm": 0.6346007282511187, "learning_rate": 2.7243735763097953e-05, "loss": 0.2578, "loss_nan_ranks": 0, "loss_rank_avg": 0.26829683780670166, "step": 300, "valid_targets_mean": 4915.8, "valid_targets_min": 628 }, { "epoch": 0.4864433811802233, "grad_norm": 0.5963249286669925, "learning_rate": 2.7699316628701597e-05, "loss": 0.2702, "loss_nan_ranks": 0, "loss_rank_avg": 0.2773645520210266, "step": 305, "valid_targets_mean": 4269.3, "valid_targets_min": 188 }, { "epoch": 0.4944178628389155, "grad_norm": 0.4926305295857678, "learning_rate": 2.815489749430524e-05, "loss": 0.2518, "loss_nan_ranks": 0, "loss_rank_avg": 0.2462100088596344, "step": 310, "valid_targets_mean": 5357.4, "valid_targets_min": 447 }, { "epoch": 0.5023923444976076, "grad_norm": 0.6162803917326616, "learning_rate": 2.8610478359908883e-05, "loss": 0.2793, "loss_nan_ranks": 0, "loss_rank_avg": 0.2961190640926361, "step": 315, "valid_targets_mean": 4947.2, "valid_targets_min": 353 }, { "epoch": 0.5103668261562998, "grad_norm": 0.4585210580601163, "learning_rate": 2.906605922551253e-05, "loss": 0.2474, "loss_nan_ranks": 0, "loss_rank_avg": 0.2386709600687027, "step": 320, "valid_targets_mean": 6055.6, "valid_targets_min": 901 }, { "epoch": 0.518341307814992, "grad_norm": 0.47805452614285815, "learning_rate": 2.9521640091116176e-05, "loss": 0.2436, "loss_nan_ranks": 0, "loss_rank_avg": 0.2311428189277649, "step": 325, "valid_targets_mean": 5337.5, "valid_targets_min": 550 }, { "epoch": 0.5263157894736842, "grad_norm": 0.567045162516125, "learning_rate": 2.997722095671982e-05, "loss": 0.2544, "loss_nan_ranks": 0, "loss_rank_avg": 0.24028460681438446, "step": 330, "valid_targets_mean": 4772.8, "valid_targets_min": 214 }, { "epoch": 0.5342902711323764, "grad_norm": 0.5319903869888214, "learning_rate": 3.0432801822323465e-05, "loss": 0.262, "loss_nan_ranks": 0, "loss_rank_avg": 0.26871269941329956, "step": 335, "valid_targets_mean": 5710.7, "valid_targets_min": 1852 }, { "epoch": 0.5422647527910686, "grad_norm": 0.5268481071254558, "learning_rate": 3.088838268792711e-05, "loss": 0.2539, "loss_nan_ranks": 0, "loss_rank_avg": 0.25552791357040405, "step": 340, "valid_targets_mean": 4551.9, "valid_targets_min": 239 }, { "epoch": 0.5502392344497608, "grad_norm": 0.5246127684755286, "learning_rate": 3.1343963553530755e-05, "loss": 0.2513, "loss_nan_ranks": 0, "loss_rank_avg": 0.24578902125358582, "step": 345, "valid_targets_mean": 4407.8, "valid_targets_min": 245 }, { "epoch": 0.5582137161084529, "grad_norm": 0.5463821322401736, "learning_rate": 3.17995444191344e-05, "loss": 0.2686, "loss_nan_ranks": 0, "loss_rank_avg": 0.2530014216899872, "step": 350, "valid_targets_mean": 5196.0, "valid_targets_min": 258 }, { "epoch": 0.5661881977671451, "grad_norm": 0.5577611010208283, "learning_rate": 3.2255125284738044e-05, "loss": 0.2642, "loss_nan_ranks": 0, "loss_rank_avg": 0.2547740340232849, "step": 355, "valid_targets_mean": 4768.6, "valid_targets_min": 255 }, { "epoch": 0.5741626794258373, "grad_norm": 0.5348299340224125, "learning_rate": 3.271070615034169e-05, "loss": 0.2508, "loss_nan_ranks": 0, "loss_rank_avg": 0.24138829112052917, "step": 360, "valid_targets_mean": 6000.2, "valid_targets_min": 4248 }, { "epoch": 0.5821371610845295, "grad_norm": 0.5208781233506476, "learning_rate": 3.316628701594533e-05, "loss": 0.2476, "loss_nan_ranks": 0, "loss_rank_avg": 0.25419485569000244, "step": 365, "valid_targets_mean": 5256.7, "valid_targets_min": 439 }, { "epoch": 0.5901116427432217, "grad_norm": 0.49107029316580497, "learning_rate": 3.362186788154898e-05, "loss": 0.2506, "loss_nan_ranks": 0, "loss_rank_avg": 0.2487025111913681, "step": 370, "valid_targets_mean": 5005.3, "valid_targets_min": 252 }, { "epoch": 0.5980861244019139, "grad_norm": 0.6062940329738492, "learning_rate": 3.407744874715262e-05, "loss": 0.2525, "loss_nan_ranks": 0, "loss_rank_avg": 0.24524852633476257, "step": 375, "valid_targets_mean": 4933.1, "valid_targets_min": 377 }, { "epoch": 0.6060606060606061, "grad_norm": 0.5256030165269368, "learning_rate": 3.453302961275627e-05, "loss": 0.2568, "loss_nan_ranks": 0, "loss_rank_avg": 0.22848409414291382, "step": 380, "valid_targets_mean": 4897.2, "valid_targets_min": 337 }, { "epoch": 0.6140350877192983, "grad_norm": 0.7317569754705133, "learning_rate": 3.498861047835991e-05, "loss": 0.2546, "loss_nan_ranks": 0, "loss_rank_avg": 0.2637185752391815, "step": 385, "valid_targets_mean": 3556.1, "valid_targets_min": 748 }, { "epoch": 0.6220095693779905, "grad_norm": 0.450094616900918, "learning_rate": 3.5444191343963557e-05, "loss": 0.2413, "loss_nan_ranks": 0, "loss_rank_avg": 0.2506665587425232, "step": 390, "valid_targets_mean": 6679.1, "valid_targets_min": 2470 }, { "epoch": 0.6299840510366826, "grad_norm": 0.5519907109153948, "learning_rate": 3.58997722095672e-05, "loss": 0.2519, "loss_nan_ranks": 0, "loss_rank_avg": 0.2557337284088135, "step": 395, "valid_targets_mean": 4688.7, "valid_targets_min": 276 }, { "epoch": 0.6379585326953748, "grad_norm": 0.4923228611797438, "learning_rate": 3.6355353075170846e-05, "loss": 0.2468, "loss_nan_ranks": 0, "loss_rank_avg": 0.2390061914920807, "step": 400, "valid_targets_mean": 4348.0, "valid_targets_min": 235 }, { "epoch": 0.645933014354067, "grad_norm": 0.58492013354936, "learning_rate": 3.681093394077449e-05, "loss": 0.2499, "loss_nan_ranks": 0, "loss_rank_avg": 0.23605602979660034, "step": 405, "valid_targets_mean": 3866.8, "valid_targets_min": 263 }, { "epoch": 0.6539074960127592, "grad_norm": 0.5800372174854277, "learning_rate": 3.7266514806378135e-05, "loss": 0.237, "loss_nan_ranks": 0, "loss_rank_avg": 0.2580878436565399, "step": 410, "valid_targets_mean": 4487.8, "valid_targets_min": 728 }, { "epoch": 0.6618819776714514, "grad_norm": 0.5700368613429726, "learning_rate": 3.772209567198178e-05, "loss": 0.2499, "loss_nan_ranks": 0, "loss_rank_avg": 0.24940025806427002, "step": 415, "valid_targets_mean": 4252.4, "valid_targets_min": 185 }, { "epoch": 0.6698564593301436, "grad_norm": 0.5691664020081905, "learning_rate": 3.8177676537585425e-05, "loss": 0.2427, "loss_nan_ranks": 0, "loss_rank_avg": 0.23814374208450317, "step": 420, "valid_targets_mean": 4767.3, "valid_targets_min": 226 }, { "epoch": 0.6778309409888357, "grad_norm": 0.5041552220249231, "learning_rate": 3.863325740318907e-05, "loss": 0.2569, "loss_nan_ranks": 0, "loss_rank_avg": 0.26317381858825684, "step": 425, "valid_targets_mean": 5216.6, "valid_targets_min": 213 }, { "epoch": 0.6858054226475279, "grad_norm": 0.5191567542690365, "learning_rate": 3.9088838268792714e-05, "loss": 0.2376, "loss_nan_ranks": 0, "loss_rank_avg": 0.2395055890083313, "step": 430, "valid_targets_mean": 4498.9, "valid_targets_min": 606 }, { "epoch": 0.69377990430622, "grad_norm": 0.507951082676675, "learning_rate": 3.954441913439636e-05, "loss": 0.231, "loss_nan_ranks": 0, "loss_rank_avg": 0.23812133073806763, "step": 435, "valid_targets_mean": 4862.8, "valid_targets_min": 599 }, { "epoch": 0.7017543859649122, "grad_norm": 0.4415015257689068, "learning_rate": 4e-05, "loss": 0.26, "loss_nan_ranks": 0, "loss_rank_avg": 0.284793496131897, "step": 440, "valid_targets_mean": 7053.9, "valid_targets_min": 726 }, { "epoch": 0.7097288676236044, "grad_norm": 0.4687788595713669, "learning_rate": 3.9999841858814384e-05, "loss": 0.2429, "loss_nan_ranks": 0, "loss_rank_avg": 0.22677697241306305, "step": 445, "valid_targets_mean": 5137.8, "valid_targets_min": 332 }, { "epoch": 0.7177033492822966, "grad_norm": 0.4729761272261808, "learning_rate": 3.999936743775839e-05, "loss": 0.2354, "loss_nan_ranks": 0, "loss_rank_avg": 0.208622008562088, "step": 450, "valid_targets_mean": 4527.2, "valid_targets_min": 238 }, { "epoch": 0.7256778309409888, "grad_norm": 0.555015237464751, "learning_rate": 3.9998576744334574e-05, "loss": 0.2428, "loss_nan_ranks": 0, "loss_rank_avg": 0.21826383471488953, "step": 455, "valid_targets_mean": 4742.9, "valid_targets_min": 302 }, { "epoch": 0.733652312599681, "grad_norm": 0.5310365582781416, "learning_rate": 3.999746979104705e-05, "loss": 0.2393, "loss_nan_ranks": 0, "loss_rank_avg": 0.25395524501800537, "step": 460, "valid_targets_mean": 5156.8, "valid_targets_min": 237 }, { "epoch": 0.7416267942583732, "grad_norm": 0.4553894968924494, "learning_rate": 3.999604659540131e-05, "loss": 0.2519, "loss_nan_ranks": 0, "loss_rank_avg": 0.2229715883731842, "step": 465, "valid_targets_mean": 5806.7, "valid_targets_min": 227 }, { "epoch": 0.7496012759170654, "grad_norm": 0.553859237915477, "learning_rate": 3.999430717990395e-05, "loss": 0.2467, "loss_nan_ranks": 0, "loss_rank_avg": 0.24489501118659973, "step": 470, "valid_targets_mean": 4576.5, "valid_targets_min": 393 }, { "epoch": 0.7575757575757576, "grad_norm": 0.5150108769606636, "learning_rate": 3.999225157206228e-05, "loss": 0.2369, "loss_nan_ranks": 0, "loss_rank_avg": 0.23615041375160217, "step": 475, "valid_targets_mean": 5394.9, "valid_targets_min": 426 }, { "epoch": 0.7655502392344498, "grad_norm": 0.6385286959140647, "learning_rate": 3.998987980438393e-05, "loss": 0.2286, "loss_nan_ranks": 0, "loss_rank_avg": 0.22305330634117126, "step": 480, "valid_targets_mean": 5164.2, "valid_targets_min": 223 }, { "epoch": 0.773524720893142, "grad_norm": 0.4830051792435215, "learning_rate": 3.9987191914376306e-05, "loss": 0.2385, "loss_nan_ranks": 0, "loss_rank_avg": 0.2323000133037567, "step": 485, "valid_targets_mean": 4675.6, "valid_targets_min": 242 }, { "epoch": 0.7814992025518341, "grad_norm": 0.5028756759202847, "learning_rate": 3.998418794454604e-05, "loss": 0.2311, "loss_nan_ranks": 0, "loss_rank_avg": 0.21495231986045837, "step": 490, "valid_targets_mean": 4435.6, "valid_targets_min": 253 }, { "epoch": 0.7894736842105263, "grad_norm": 0.5087547658254494, "learning_rate": 3.998086794239825e-05, "loss": 0.2352, "loss_nan_ranks": 0, "loss_rank_avg": 0.23997387290000916, "step": 495, "valid_targets_mean": 5214.6, "valid_targets_min": 252 }, { "epoch": 0.7974481658692185, "grad_norm": 0.4669380659732096, "learning_rate": 3.997723196043585e-05, "loss": 0.2308, "loss_nan_ranks": 0, "loss_rank_avg": 0.22620384395122528, "step": 500, "valid_targets_mean": 4997.2, "valid_targets_min": 220 }, { "epoch": 0.8054226475279107, "grad_norm": 0.5551348865851036, "learning_rate": 3.9973280056158695e-05, "loss": 0.2466, "loss_nan_ranks": 0, "loss_rank_avg": 0.25103485584259033, "step": 505, "valid_targets_mean": 5329.7, "valid_targets_min": 243 }, { "epoch": 0.8133971291866029, "grad_norm": 0.49318722832524914, "learning_rate": 3.9969012292062655e-05, "loss": 0.2472, "loss_nan_ranks": 0, "loss_rank_avg": 0.25136399269104004, "step": 510, "valid_targets_mean": 5802.3, "valid_targets_min": 342 }, { "epoch": 0.8213716108452951, "grad_norm": 0.5198628597650791, "learning_rate": 3.996442873563866e-05, "loss": 0.2298, "loss_nan_ranks": 0, "loss_rank_avg": 0.2384355366230011, "step": 515, "valid_targets_mean": 5362.5, "valid_targets_min": 256 }, { "epoch": 0.8293460925039873, "grad_norm": 0.5205934398395562, "learning_rate": 3.9959529459371624e-05, "loss": 0.2508, "loss_nan_ranks": 0, "loss_rank_avg": 0.2787361443042755, "step": 520, "valid_targets_mean": 5885.7, "valid_targets_min": 228 }, { "epoch": 0.8373205741626795, "grad_norm": 0.5252409924659849, "learning_rate": 3.9954314540739284e-05, "loss": 0.2467, "loss_nan_ranks": 0, "loss_rank_avg": 0.2512431740760803, "step": 525, "valid_targets_mean": 5641.8, "valid_targets_min": 1587 }, { "epoch": 0.8452950558213717, "grad_norm": 0.4704007226125745, "learning_rate": 3.994878406221097e-05, "loss": 0.2277, "loss_nan_ranks": 0, "loss_rank_avg": 0.23621171712875366, "step": 530, "valid_targets_mean": 5600.2, "valid_targets_min": 536 }, { "epoch": 0.8532695374800638, "grad_norm": 0.6083127057740186, "learning_rate": 3.994293811124632e-05, "loss": 0.2325, "loss_nan_ranks": 0, "loss_rank_avg": 0.2614426612854004, "step": 535, "valid_targets_mean": 5253.0, "valid_targets_min": 238 }, { "epoch": 0.861244019138756, "grad_norm": 0.4746686115421954, "learning_rate": 3.993677678029392e-05, "loss": 0.2363, "loss_nan_ranks": 0, "loss_rank_avg": 0.24418990314006805, "step": 540, "valid_targets_mean": 5040.0, "valid_targets_min": 1001 }, { "epoch": 0.8692185007974481, "grad_norm": 0.49549218402068856, "learning_rate": 3.9930300166789765e-05, "loss": 0.2377, "loss_nan_ranks": 0, "loss_rank_avg": 0.25148677825927734, "step": 545, "valid_targets_mean": 5570.9, "valid_targets_min": 319 }, { "epoch": 0.8771929824561403, "grad_norm": 0.5269114935537167, "learning_rate": 3.992350837315581e-05, "loss": 0.2454, "loss_nan_ranks": 0, "loss_rank_avg": 0.2529415786266327, "step": 550, "valid_targets_mean": 4481.4, "valid_targets_min": 418 }, { "epoch": 0.8851674641148325, "grad_norm": 0.4966140006866359, "learning_rate": 3.991640150679826e-05, "loss": 0.2427, "loss_nan_ranks": 0, "loss_rank_avg": 0.23965132236480713, "step": 555, "valid_targets_mean": 4778.5, "valid_targets_min": 193 }, { "epoch": 0.8931419457735247, "grad_norm": 0.46356963034858145, "learning_rate": 3.990897968010596e-05, "loss": 0.2335, "loss_nan_ranks": 0, "loss_rank_avg": 0.22081106901168823, "step": 560, "valid_targets_mean": 4536.8, "valid_targets_min": 318 }, { "epoch": 0.9011164274322169, "grad_norm": 0.5158811337778442, "learning_rate": 3.990124301044855e-05, "loss": 0.2425, "loss_nan_ranks": 0, "loss_rank_avg": 0.25084495544433594, "step": 565, "valid_targets_mean": 5180.1, "valid_targets_min": 262 }, { "epoch": 0.9090909090909091, "grad_norm": 0.4577837821562966, "learning_rate": 3.989319162017465e-05, "loss": 0.2462, "loss_nan_ranks": 0, "loss_rank_avg": 0.23798081278800964, "step": 570, "valid_targets_mean": 5647.1, "valid_targets_min": 292 }, { "epoch": 0.9170653907496013, "grad_norm": 0.44187500790924766, "learning_rate": 3.988482563660989e-05, "loss": 0.2329, "loss_nan_ranks": 0, "loss_rank_avg": 0.23343367874622345, "step": 575, "valid_targets_mean": 5496.6, "valid_targets_min": 179 }, { "epoch": 0.9250398724082934, "grad_norm": 0.5270106574297865, "learning_rate": 3.987614519205493e-05, "loss": 0.2376, "loss_nan_ranks": 0, "loss_rank_avg": 0.23939090967178345, "step": 580, "valid_targets_mean": 5919.2, "valid_targets_min": 1221 }, { "epoch": 0.9330143540669856, "grad_norm": 0.463729984008716, "learning_rate": 3.986715042378334e-05, "loss": 0.223, "loss_nan_ranks": 0, "loss_rank_avg": 0.22995294630527496, "step": 585, "valid_targets_mean": 5917.2, "valid_targets_min": 852 }, { "epoch": 0.9409888357256778, "grad_norm": 0.47283664295456057, "learning_rate": 3.985784147403947e-05, "loss": 0.2434, "loss_nan_ranks": 0, "loss_rank_avg": 0.2240312099456787, "step": 590, "valid_targets_mean": 5174.1, "valid_targets_min": 536 }, { "epoch": 0.94896331738437, "grad_norm": 0.5658848917368027, "learning_rate": 3.9848218490036144e-05, "loss": 0.2318, "loss_nan_ranks": 0, "loss_rank_avg": 0.232914000749588, "step": 595, "valid_targets_mean": 5265.4, "valid_targets_min": 732 }, { "epoch": 0.9569377990430622, "grad_norm": 0.4239055430774934, "learning_rate": 3.983828162395238e-05, "loss": 0.2299, "loss_nan_ranks": 0, "loss_rank_avg": 0.20710644125938416, "step": 600, "valid_targets_mean": 6367.3, "valid_targets_min": 1579 }, { "epoch": 0.9649122807017544, "grad_norm": 0.44068282934869724, "learning_rate": 3.9828031032930944e-05, "loss": 0.2381, "loss_nan_ranks": 0, "loss_rank_avg": 0.23547522723674774, "step": 605, "valid_targets_mean": 5768.8, "valid_targets_min": 342 }, { "epoch": 0.9728867623604466, "grad_norm": 0.4301339156888651, "learning_rate": 3.98174668790759e-05, "loss": 0.2346, "loss_nan_ranks": 0, "loss_rank_avg": 0.22576510906219482, "step": 610, "valid_targets_mean": 5758.6, "valid_targets_min": 250 }, { "epoch": 0.9808612440191388, "grad_norm": 0.4083465304334347, "learning_rate": 3.9806589329450045e-05, "loss": 0.2266, "loss_nan_ranks": 0, "loss_rank_avg": 0.21958738565444946, "step": 615, "valid_targets_mean": 6139.3, "valid_targets_min": 258 }, { "epoch": 0.988835725677831, "grad_norm": 0.5589998597597372, "learning_rate": 3.979539855607222e-05, "loss": 0.2419, "loss_nan_ranks": 0, "loss_rank_avg": 0.2316368967294693, "step": 620, "valid_targets_mean": 4443.0, "valid_targets_min": 293 }, { "epoch": 0.9968102073365231, "grad_norm": 0.49386174717125697, "learning_rate": 3.9783894735914646e-05, "loss": 0.2376, "loss_nan_ranks": 0, "loss_rank_avg": 0.23019137978553772, "step": 625, "valid_targets_mean": 5904.1, "valid_targets_min": 407 }, { "epoch": 1.0047846889952152, "grad_norm": 0.44385071840879137, "learning_rate": 3.9772078050900105e-05, "loss": 0.2167, "loss_nan_ranks": 0, "loss_rank_avg": 0.19644610583782196, "step": 630, "valid_targets_mean": 5611.9, "valid_targets_min": 342 }, { "epoch": 1.0127591706539074, "grad_norm": 0.48156890413963743, "learning_rate": 3.9759948687899055e-05, "loss": 0.2338, "loss_nan_ranks": 0, "loss_rank_avg": 0.2283916473388672, "step": 635, "valid_targets_mean": 4642.0, "valid_targets_min": 226 }, { "epoch": 1.0207336523125996, "grad_norm": 0.5551974573135551, "learning_rate": 3.974750683872667e-05, "loss": 0.2355, "loss_nan_ranks": 0, "loss_rank_avg": 0.2257927656173706, "step": 640, "valid_targets_mean": 4712.1, "valid_targets_min": 253 }, { "epoch": 1.0287081339712918, "grad_norm": 0.5112679546587456, "learning_rate": 3.973475270013984e-05, "loss": 0.2084, "loss_nan_ranks": 0, "loss_rank_avg": 0.2036946564912796, "step": 645, "valid_targets_mean": 3350.3, "valid_targets_min": 220 }, { "epoch": 1.036682615629984, "grad_norm": 0.5657504932352997, "learning_rate": 3.972168647383402e-05, "loss": 0.2221, "loss_nan_ranks": 0, "loss_rank_avg": 0.2104548066854477, "step": 650, "valid_targets_mean": 5710.1, "valid_targets_min": 975 }, { "epoch": 1.0446570972886762, "grad_norm": 0.498819802151185, "learning_rate": 3.970830836644006e-05, "loss": 0.2293, "loss_nan_ranks": 0, "loss_rank_avg": 0.2443195879459381, "step": 655, "valid_targets_mean": 4341.6, "valid_targets_min": 237 }, { "epoch": 1.0526315789473684, "grad_norm": 0.4777708787250058, "learning_rate": 3.9694618589520945e-05, "loss": 0.2214, "loss_nan_ranks": 0, "loss_rank_avg": 0.21855522692203522, "step": 660, "valid_targets_mean": 6137.1, "valid_targets_min": 3874 }, { "epoch": 1.0606060606060606, "grad_norm": 0.42516424950849196, "learning_rate": 3.9680617359568414e-05, "loss": 0.2276, "loss_nan_ranks": 0, "loss_rank_avg": 0.22529324889183044, "step": 665, "valid_targets_mean": 5659.9, "valid_targets_min": 265 }, { "epoch": 1.0685805422647527, "grad_norm": 0.43957454727525247, "learning_rate": 3.966630489799959e-05, "loss": 0.2146, "loss_nan_ranks": 0, "loss_rank_avg": 0.20638194680213928, "step": 670, "valid_targets_mean": 5418.2, "valid_targets_min": 605 }, { "epoch": 1.076555023923445, "grad_norm": 0.480992229013917, "learning_rate": 3.9651681431153445e-05, "loss": 0.2214, "loss_nan_ranks": 0, "loss_rank_avg": 0.21741151809692383, "step": 675, "valid_targets_mean": 5676.9, "valid_targets_min": 653 }, { "epoch": 1.0845295055821371, "grad_norm": 0.5286831646993043, "learning_rate": 3.96367471902872e-05, "loss": 0.2179, "loss_nan_ranks": 0, "loss_rank_avg": 0.22559064626693726, "step": 680, "valid_targets_mean": 4749.8, "valid_targets_min": 1138 }, { "epoch": 1.0925039872408293, "grad_norm": 0.48401700631042965, "learning_rate": 3.9621502411572705e-05, "loss": 0.2281, "loss_nan_ranks": 0, "loss_rank_avg": 0.21404454112052917, "step": 685, "valid_targets_mean": 5151.9, "valid_targets_min": 492 }, { "epoch": 1.1004784688995215, "grad_norm": 0.49933746338574914, "learning_rate": 3.960594733609273e-05, "loss": 0.2256, "loss_nan_ranks": 0, "loss_rank_avg": 0.24951139092445374, "step": 690, "valid_targets_mean": 5677.1, "valid_targets_min": 414 }, { "epoch": 1.1084529505582137, "grad_norm": 0.5374555564691006, "learning_rate": 3.9590082209837054e-05, "loss": 0.2358, "loss_nan_ranks": 0, "loss_rank_avg": 0.23958654701709747, "step": 695, "valid_targets_mean": 4576.1, "valid_targets_min": 250 }, { "epoch": 1.1164274322169059, "grad_norm": 0.43156726192991535, "learning_rate": 3.957390728369867e-05, "loss": 0.2239, "loss_nan_ranks": 0, "loss_rank_avg": 0.22211644053459167, "step": 700, "valid_targets_mean": 5652.7, "valid_targets_min": 240 }, { "epoch": 1.124401913875598, "grad_norm": 0.5290650459685178, "learning_rate": 3.955742281346979e-05, "loss": 0.2223, "loss_nan_ranks": 0, "loss_rank_avg": 0.24193495512008667, "step": 705, "valid_targets_mean": 4738.0, "valid_targets_min": 1201 }, { "epoch": 1.1323763955342903, "grad_norm": 0.4590727414985068, "learning_rate": 3.9540629059837767e-05, "loss": 0.2187, "loss_nan_ranks": 0, "loss_rank_avg": 0.20210333168506622, "step": 710, "valid_targets_mean": 5049.0, "valid_targets_min": 386 }, { "epoch": 1.1403508771929824, "grad_norm": 0.5441856418870333, "learning_rate": 3.952352628838102e-05, "loss": 0.2215, "loss_nan_ranks": 0, "loss_rank_avg": 0.20969565212726593, "step": 715, "valid_targets_mean": 4226.9, "valid_targets_min": 249 }, { "epoch": 1.1483253588516746, "grad_norm": 0.5380939962565157, "learning_rate": 3.95061147695648e-05, "loss": 0.2278, "loss_nan_ranks": 0, "loss_rank_avg": 0.240693137049675, "step": 720, "valid_targets_mean": 4818.9, "valid_targets_min": 549 }, { "epoch": 1.1562998405103668, "grad_norm": 0.5686689166363135, "learning_rate": 3.9488394778736935e-05, "loss": 0.2306, "loss_nan_ranks": 0, "loss_rank_avg": 0.24537625908851624, "step": 725, "valid_targets_mean": 3922.4, "valid_targets_min": 129 }, { "epoch": 1.164274322169059, "grad_norm": 0.4593411130317016, "learning_rate": 3.947036659612345e-05, "loss": 0.2152, "loss_nan_ranks": 0, "loss_rank_avg": 0.20501753687858582, "step": 730, "valid_targets_mean": 4789.3, "valid_targets_min": 242 }, { "epoch": 1.1722488038277512, "grad_norm": 0.5929679220372989, "learning_rate": 3.945203050682418e-05, "loss": 0.2225, "loss_nan_ranks": 0, "loss_rank_avg": 0.2176203429698944, "step": 735, "valid_targets_mean": 5827.9, "valid_targets_min": 1421 }, { "epoch": 1.1802232854864434, "grad_norm": 0.49571444514839247, "learning_rate": 3.94333868008082e-05, "loss": 0.2285, "loss_nan_ranks": 0, "loss_rank_avg": 0.22823849320411682, "step": 740, "valid_targets_mean": 4559.8, "valid_targets_min": 955 }, { "epoch": 1.1881977671451356, "grad_norm": 0.47051475648971036, "learning_rate": 3.94144357729093e-05, "loss": 0.2413, "loss_nan_ranks": 0, "loss_rank_avg": 0.21944183111190796, "step": 745, "valid_targets_mean": 5556.9, "valid_targets_min": 241 }, { "epoch": 1.1961722488038278, "grad_norm": 0.4545193137066266, "learning_rate": 3.939517772282127e-05, "loss": 0.226, "loss_nan_ranks": 0, "loss_rank_avg": 0.2306528091430664, "step": 750, "valid_targets_mean": 5773.1, "valid_targets_min": 339 }, { "epoch": 1.20414673046252, "grad_norm": 0.5070293389053494, "learning_rate": 3.93756129550932e-05, "loss": 0.22, "loss_nan_ranks": 0, "loss_rank_avg": 0.2366933524608612, "step": 755, "valid_targets_mean": 4809.0, "valid_targets_min": 225 }, { "epoch": 1.2121212121212122, "grad_norm": 0.4581327620567569, "learning_rate": 3.935574177912465e-05, "loss": 0.2217, "loss_nan_ranks": 0, "loss_rank_avg": 0.23561245203018188, "step": 760, "valid_targets_mean": 5730.1, "valid_targets_min": 431 }, { "epoch": 1.2200956937799043, "grad_norm": 0.44689390466942713, "learning_rate": 3.9335564509160746e-05, "loss": 0.2294, "loss_nan_ranks": 0, "loss_rank_avg": 0.25527051091194153, "step": 765, "valid_targets_mean": 5937.5, "valid_targets_min": 308 }, { "epoch": 1.2280701754385965, "grad_norm": 0.5105030340361397, "learning_rate": 3.931508146428724e-05, "loss": 0.2228, "loss_nan_ranks": 0, "loss_rank_avg": 0.21357367932796478, "step": 770, "valid_targets_mean": 4240.1, "valid_targets_min": 238 }, { "epoch": 1.2360446570972887, "grad_norm": 0.4285106295808272, "learning_rate": 3.929429296842542e-05, "loss": 0.2216, "loss_nan_ranks": 0, "loss_rank_avg": 0.22223004698753357, "step": 775, "valid_targets_mean": 5140.4, "valid_targets_min": 207 }, { "epoch": 1.244019138755981, "grad_norm": 0.5033088319271173, "learning_rate": 3.927319935032703e-05, "loss": 0.2244, "loss_nan_ranks": 0, "loss_rank_avg": 0.2382790595293045, "step": 780, "valid_targets_mean": 4656.1, "valid_targets_min": 190 }, { "epoch": 1.251993620414673, "grad_norm": 0.4832920433952073, "learning_rate": 3.925180094356905e-05, "loss": 0.2183, "loss_nan_ranks": 0, "loss_rank_avg": 0.22841961681842804, "step": 785, "valid_targets_mean": 4821.2, "valid_targets_min": 332 }, { "epoch": 1.2599681020733653, "grad_norm": 0.5541953861894534, "learning_rate": 3.9230098086548414e-05, "loss": 0.2138, "loss_nan_ranks": 0, "loss_rank_avg": 0.22924378514289856, "step": 790, "valid_targets_mean": 5035.1, "valid_targets_min": 387 }, { "epoch": 1.2679425837320575, "grad_norm": 0.45492743605486735, "learning_rate": 3.920809112247668e-05, "loss": 0.2249, "loss_nan_ranks": 0, "loss_rank_avg": 0.2217010259628296, "step": 795, "valid_targets_mean": 5301.2, "valid_targets_min": 280 }, { "epoch": 1.2759170653907497, "grad_norm": 0.4050403811606527, "learning_rate": 3.918578039937459e-05, "loss": 0.2214, "loss_nan_ranks": 0, "loss_rank_avg": 0.20149385929107666, "step": 800, "valid_targets_mean": 6168.7, "valid_targets_min": 3585 }, { "epoch": 1.2838915470494419, "grad_norm": 0.49884758775784616, "learning_rate": 3.916316627006656e-05, "loss": 0.218, "loss_nan_ranks": 0, "loss_rank_avg": 0.22389544546604156, "step": 805, "valid_targets_mean": 4229.8, "valid_targets_min": 205 }, { "epoch": 1.291866028708134, "grad_norm": 0.5437724639192097, "learning_rate": 3.914024909217511e-05, "loss": 0.2186, "loss_nan_ranks": 0, "loss_rank_avg": 0.21842722594738007, "step": 810, "valid_targets_mean": 5059.4, "valid_targets_min": 261 }, { "epoch": 1.2998405103668262, "grad_norm": 0.4614914901673496, "learning_rate": 3.911702922811522e-05, "loss": 0.2129, "loss_nan_ranks": 0, "loss_rank_avg": 0.22969508171081543, "step": 815, "valid_targets_mean": 5216.5, "valid_targets_min": 944 }, { "epoch": 1.3078149920255182, "grad_norm": 0.41670448262684845, "learning_rate": 3.909350704508856e-05, "loss": 0.2196, "loss_nan_ranks": 0, "loss_rank_avg": 0.21079647541046143, "step": 820, "valid_targets_mean": 5512.1, "valid_targets_min": 985 }, { "epoch": 1.3157894736842106, "grad_norm": 0.4532640251959151, "learning_rate": 3.906968291507773e-05, "loss": 0.21, "loss_nan_ranks": 0, "loss_rank_avg": 0.2069890946149826, "step": 825, "valid_targets_mean": 4720.1, "valid_targets_min": 223 }, { "epoch": 1.3237639553429026, "grad_norm": 0.5068128448354305, "learning_rate": 3.904555721484034e-05, "loss": 0.2205, "loss_nan_ranks": 0, "loss_rank_avg": 0.22296027839183807, "step": 830, "valid_targets_mean": 4510.1, "valid_targets_min": 213 }, { "epoch": 1.331738437001595, "grad_norm": 0.44758555237161834, "learning_rate": 3.9021130325903076e-05, "loss": 0.2124, "loss_nan_ranks": 0, "loss_rank_avg": 0.22679689526557922, "step": 835, "valid_targets_mean": 4813.0, "valid_targets_min": 491 }, { "epoch": 1.339712918660287, "grad_norm": 0.4343562516139951, "learning_rate": 3.899640263455566e-05, "loss": 0.2251, "loss_nan_ranks": 0, "loss_rank_avg": 0.20167089998722076, "step": 840, "valid_targets_mean": 5034.6, "valid_targets_min": 250 }, { "epoch": 1.3476874003189794, "grad_norm": 0.4572454435644633, "learning_rate": 3.897137453184472e-05, "loss": 0.2187, "loss_nan_ranks": 0, "loss_rank_avg": 0.20767706632614136, "step": 845, "valid_targets_mean": 5134.5, "valid_targets_min": 278 }, { "epoch": 1.3556618819776713, "grad_norm": 0.5014219811560465, "learning_rate": 3.894604641356767e-05, "loss": 0.2398, "loss_nan_ranks": 0, "loss_rank_avg": 0.20389358699321747, "step": 850, "valid_targets_mean": 3887.2, "valid_targets_min": 210 }, { "epoch": 1.3636363636363638, "grad_norm": 0.48510005391738675, "learning_rate": 3.8920418680266346e-05, "loss": 0.2184, "loss_nan_ranks": 0, "loss_rank_avg": 0.22810472548007965, "step": 855, "valid_targets_mean": 5032.4, "valid_targets_min": 391 }, { "epoch": 1.3716108452950557, "grad_norm": 0.5183414139626299, "learning_rate": 3.889449173722077e-05, "loss": 0.2163, "loss_nan_ranks": 0, "loss_rank_avg": 0.2274407297372818, "step": 860, "valid_targets_mean": 4475.8, "valid_targets_min": 272 }, { "epoch": 1.3795853269537481, "grad_norm": 0.5158129823910096, "learning_rate": 3.8868265994442694e-05, "loss": 0.2221, "loss_nan_ranks": 0, "loss_rank_avg": 0.2289605587720871, "step": 865, "valid_targets_mean": 4482.9, "valid_targets_min": 298 }, { "epoch": 1.38755980861244, "grad_norm": 0.46178793662898315, "learning_rate": 3.8841741866669126e-05, "loss": 0.2158, "loss_nan_ranks": 0, "loss_rank_avg": 0.20329372584819794, "step": 870, "valid_targets_mean": 4624.8, "valid_targets_min": 201 }, { "epoch": 1.3955342902711323, "grad_norm": 0.43110143764599795, "learning_rate": 3.881491977335577e-05, "loss": 0.2145, "loss_nan_ranks": 0, "loss_rank_avg": 0.2101316750049591, "step": 875, "valid_targets_mean": 5321.4, "valid_targets_min": 213 }, { "epoch": 1.4035087719298245, "grad_norm": 0.503740796436895, "learning_rate": 3.878780013867038e-05, "loss": 0.2139, "loss_nan_ranks": 0, "loss_rank_avg": 0.20829784870147705, "step": 880, "valid_targets_mean": 4938.4, "valid_targets_min": 208 }, { "epoch": 1.4114832535885167, "grad_norm": 0.46875611927410893, "learning_rate": 3.8760383391486074e-05, "loss": 0.2159, "loss_nan_ranks": 0, "loss_rank_avg": 0.2217826247215271, "step": 885, "valid_targets_mean": 5166.4, "valid_targets_min": 1977 }, { "epoch": 1.4194577352472089, "grad_norm": 0.40715680224468764, "learning_rate": 3.873266996537456e-05, "loss": 0.2223, "loss_nan_ranks": 0, "loss_rank_avg": 0.2007824033498764, "step": 890, "valid_targets_mean": 6011.9, "valid_targets_min": 1107 }, { "epoch": 1.427432216905901, "grad_norm": 0.4538795595368198, "learning_rate": 3.8704660298599225e-05, "loss": 0.2182, "loss_nan_ranks": 0, "loss_rank_avg": 0.19974635541439056, "step": 895, "valid_targets_mean": 5461.1, "valid_targets_min": 233 }, { "epoch": 1.4354066985645932, "grad_norm": 0.3925116796629304, "learning_rate": 3.867635483410827e-05, "loss": 0.2176, "loss_nan_ranks": 0, "loss_rank_avg": 0.19021229445934296, "step": 900, "valid_targets_mean": 5960.0, "valid_targets_min": 287 }, { "epoch": 1.4433811802232854, "grad_norm": 0.4526958366149273, "learning_rate": 3.864775401952767e-05, "loss": 0.2162, "loss_nan_ranks": 0, "loss_rank_avg": 0.224770188331604, "step": 905, "valid_targets_mean": 4794.1, "valid_targets_min": 385 }, { "epoch": 1.4513556618819776, "grad_norm": 0.47739345174396636, "learning_rate": 3.8618858307154085e-05, "loss": 0.2207, "loss_nan_ranks": 0, "loss_rank_avg": 0.21421770751476288, "step": 910, "valid_targets_mean": 4971.1, "valid_targets_min": 229 }, { "epoch": 1.4593301435406698, "grad_norm": 0.48441435233113955, "learning_rate": 3.8589668153947743e-05, "loss": 0.2103, "loss_nan_ranks": 0, "loss_rank_avg": 0.2115284949541092, "step": 915, "valid_targets_mean": 4584.6, "valid_targets_min": 613 }, { "epoch": 1.467304625199362, "grad_norm": 0.48463948682962943, "learning_rate": 3.8560184021525194e-05, "loss": 0.211, "loss_nan_ranks": 0, "loss_rank_avg": 0.21348783373832703, "step": 920, "valid_targets_mean": 4442.5, "valid_targets_min": 192 }, { "epoch": 1.4752791068580542, "grad_norm": 0.4451502603868636, "learning_rate": 3.853040637615199e-05, "loss": 0.2228, "loss_nan_ranks": 0, "loss_rank_avg": 0.23046502470970154, "step": 925, "valid_targets_mean": 4936.4, "valid_targets_min": 395 }, { "epoch": 1.4832535885167464, "grad_norm": 0.40199972450433025, "learning_rate": 3.850033568873536e-05, "loss": 0.2083, "loss_nan_ranks": 0, "loss_rank_avg": 0.19406135380268097, "step": 930, "valid_targets_mean": 5947.2, "valid_targets_min": 479 }, { "epoch": 1.4912280701754386, "grad_norm": 0.5368761175611442, "learning_rate": 3.8469972434816706e-05, "loss": 0.2023, "loss_nan_ranks": 0, "loss_rank_avg": 0.21021592617034912, "step": 935, "valid_targets_mean": 4767.3, "valid_targets_min": 243 }, { "epoch": 1.4992025518341308, "grad_norm": 0.3986721112323499, "learning_rate": 3.843931709456414e-05, "loss": 0.2082, "loss_nan_ranks": 0, "loss_rank_avg": 0.19780415296554565, "step": 940, "valid_targets_mean": 5795.1, "valid_targets_min": 861 }, { "epoch": 1.507177033492823, "grad_norm": 0.4587666035993858, "learning_rate": 3.840837015276483e-05, "loss": 0.2194, "loss_nan_ranks": 0, "loss_rank_avg": 0.22320160269737244, "step": 945, "valid_targets_mean": 5755.1, "valid_targets_min": 941 }, { "epoch": 1.5151515151515151, "grad_norm": 0.45703951269412757, "learning_rate": 3.83771320988174e-05, "loss": 0.2238, "loss_nan_ranks": 0, "loss_rank_avg": 0.22210641205310822, "step": 950, "valid_targets_mean": 4737.4, "valid_targets_min": 399 }, { "epoch": 1.5231259968102073, "grad_norm": 0.48709993942146484, "learning_rate": 3.834560342672413e-05, "loss": 0.2219, "loss_nan_ranks": 0, "loss_rank_avg": 0.22919026017189026, "step": 955, "valid_targets_mean": 5368.0, "valid_targets_min": 471 }, { "epoch": 1.5311004784688995, "grad_norm": 0.5327015189373576, "learning_rate": 3.831378463508318e-05, "loss": 0.211, "loss_nan_ranks": 0, "loss_rank_avg": 0.20985502004623413, "step": 960, "valid_targets_mean": 3672.7, "valid_targets_min": 255 }, { "epoch": 1.5390749601275917, "grad_norm": 0.4889458724924527, "learning_rate": 3.8281676227080694e-05, "loss": 0.2207, "loss_nan_ranks": 0, "loss_rank_avg": 0.23470205068588257, "step": 965, "valid_targets_mean": 4279.4, "valid_targets_min": 545 }, { "epoch": 1.547049441786284, "grad_norm": 0.4816208661066147, "learning_rate": 3.824927871048284e-05, "loss": 0.2105, "loss_nan_ranks": 0, "loss_rank_avg": 0.22319866716861725, "step": 970, "valid_targets_mean": 5811.1, "valid_targets_min": 691 }, { "epoch": 1.555023923444976, "grad_norm": 0.49629303617677123, "learning_rate": 3.8216592597627797e-05, "loss": 0.2097, "loss_nan_ranks": 0, "loss_rank_avg": 0.20921722054481506, "step": 975, "valid_targets_mean": 4481.5, "valid_targets_min": 458 }, { "epoch": 1.5629984051036683, "grad_norm": 0.4486748383761303, "learning_rate": 3.818361840541761e-05, "loss": 0.2232, "loss_nan_ranks": 0, "loss_rank_avg": 0.2034325897693634, "step": 980, "valid_targets_mean": 5753.4, "valid_targets_min": 249 }, { "epoch": 1.5709728867623605, "grad_norm": 0.4704184941444946, "learning_rate": 3.815035665531008e-05, "loss": 0.2154, "loss_nan_ranks": 0, "loss_rank_avg": 0.2329174280166626, "step": 985, "valid_targets_mean": 5679.9, "valid_targets_min": 794 }, { "epoch": 1.5789473684210527, "grad_norm": 0.7126080076891846, "learning_rate": 3.811680787331047e-05, "loss": 0.2114, "loss_nan_ranks": 0, "loss_rank_avg": 0.20356056094169617, "step": 990, "valid_targets_mean": 4500.5, "valid_targets_min": 200 }, { "epoch": 1.5869218500797448, "grad_norm": 0.4362810483573207, "learning_rate": 3.8082972589963175e-05, "loss": 0.221, "loss_nan_ranks": 0, "loss_rank_avg": 0.25651684403419495, "step": 995, "valid_targets_mean": 5741.7, "valid_targets_min": 485 }, { "epoch": 1.594896331738437, "grad_norm": 0.5308816657896737, "learning_rate": 3.80488513403434e-05, "loss": 0.2149, "loss_nan_ranks": 0, "loss_rank_avg": 0.22023651003837585, "step": 1000, "valid_targets_mean": 3424.5, "valid_targets_min": 259 }, { "epoch": 1.6028708133971292, "grad_norm": 0.4510219809474634, "learning_rate": 3.8014444664048616e-05, "loss": 0.2197, "loss_nan_ranks": 0, "loss_rank_avg": 0.21104635298252106, "step": 1005, "valid_targets_mean": 5196.3, "valid_targets_min": 240 }, { "epoch": 1.6108452950558214, "grad_norm": 0.4803455404102778, "learning_rate": 3.797975310519009e-05, "loss": 0.2168, "loss_nan_ranks": 0, "loss_rank_avg": 0.21788547933101654, "step": 1010, "valid_targets_mean": 4816.5, "valid_targets_min": 274 }, { "epoch": 1.6188197767145136, "grad_norm": 0.47472698938848756, "learning_rate": 3.794477721238425e-05, "loss": 0.2243, "loss_nan_ranks": 0, "loss_rank_avg": 0.23355194926261902, "step": 1015, "valid_targets_mean": 4637.8, "valid_targets_min": 234 }, { "epoch": 1.6267942583732058, "grad_norm": 0.4147989370142633, "learning_rate": 3.7909517538744e-05, "loss": 0.2116, "loss_nan_ranks": 0, "loss_rank_avg": 0.19726088643074036, "step": 1020, "valid_targets_mean": 5528.1, "valid_targets_min": 713 }, { "epoch": 1.6347687400318978, "grad_norm": 0.43057872861456375, "learning_rate": 3.7873974641870006e-05, "loss": 0.2224, "loss_nan_ranks": 0, "loss_rank_avg": 0.23569004237651825, "step": 1025, "valid_targets_mean": 5202.3, "valid_targets_min": 429 }, { "epoch": 1.6427432216905902, "grad_norm": 0.4944214692564835, "learning_rate": 3.7838149083841856e-05, "loss": 0.2137, "loss_nan_ranks": 0, "loss_rank_avg": 0.22196251153945923, "step": 1030, "valid_targets_mean": 4496.9, "valid_targets_min": 367 }, { "epoch": 1.6507177033492821, "grad_norm": 0.484950405225721, "learning_rate": 3.7802041431209166e-05, "loss": 0.2114, "loss_nan_ranks": 0, "loss_rank_avg": 0.22201311588287354, "step": 1035, "valid_targets_mean": 5337.4, "valid_targets_min": 276 }, { "epoch": 1.6586921850079746, "grad_norm": 0.46643309909033687, "learning_rate": 3.776565225498264e-05, "loss": 0.225, "loss_nan_ranks": 0, "loss_rank_avg": 0.20948752760887146, "step": 1040, "valid_targets_mean": 5726.2, "valid_targets_min": 216 }, { "epoch": 1.6666666666666665, "grad_norm": 0.4505057278309987, "learning_rate": 3.7728982130625025e-05, "loss": 0.2078, "loss_nan_ranks": 0, "loss_rank_avg": 0.21404105424880981, "step": 1045, "valid_targets_mean": 5463.8, "valid_targets_min": 624 }, { "epoch": 1.674641148325359, "grad_norm": 0.4632571232381542, "learning_rate": 3.769203163804202e-05, "loss": 0.2185, "loss_nan_ranks": 0, "loss_rank_avg": 0.2386375069618225, "step": 1050, "valid_targets_mean": 4372.1, "valid_targets_min": 212 }, { "epoch": 1.682615629984051, "grad_norm": 0.5885949234294394, "learning_rate": 3.7654801361573076e-05, "loss": 0.2053, "loss_nan_ranks": 0, "loss_rank_avg": 0.2116532027721405, "step": 1055, "valid_targets_mean": 3293.9, "valid_targets_min": 164 }, { "epoch": 1.6905901116427433, "grad_norm": 0.476396006242146, "learning_rate": 3.761729188998222e-05, "loss": 0.2122, "loss_nan_ranks": 0, "loss_rank_avg": 0.2132015824317932, "step": 1060, "valid_targets_mean": 4883.0, "valid_targets_min": 234 }, { "epoch": 1.6985645933014353, "grad_norm": 0.4415064752469964, "learning_rate": 3.757950381644868e-05, "loss": 0.2159, "loss_nan_ranks": 0, "loss_rank_avg": 0.18930253386497498, "step": 1065, "valid_targets_mean": 4347.8, "valid_targets_min": 201 }, { "epoch": 1.7065390749601277, "grad_norm": 0.4918318431688853, "learning_rate": 3.7541437738557524e-05, "loss": 0.2149, "loss_nan_ranks": 0, "loss_rank_avg": 0.22140301764011383, "step": 1070, "valid_targets_mean": 4014.4, "valid_targets_min": 266 }, { "epoch": 1.7145135566188197, "grad_norm": 0.4757910103440479, "learning_rate": 3.750309425829022e-05, "loss": 0.2108, "loss_nan_ranks": 0, "loss_rank_avg": 0.22511640191078186, "step": 1075, "valid_targets_mean": 4329.7, "valid_targets_min": 234 }, { "epoch": 1.722488038277512, "grad_norm": 0.418880480295893, "learning_rate": 3.746447398201512e-05, "loss": 0.209, "loss_nan_ranks": 0, "loss_rank_avg": 0.2123282253742218, "step": 1080, "valid_targets_mean": 6908.0, "valid_targets_min": 4942 }, { "epoch": 1.730462519936204, "grad_norm": 0.49617766079766823, "learning_rate": 3.7425577520477846e-05, "loss": 0.2081, "loss_nan_ranks": 0, "loss_rank_avg": 0.21871669590473175, "step": 1085, "valid_targets_mean": 4811.3, "valid_targets_min": 198 }, { "epoch": 1.7384370015948964, "grad_norm": 0.4598780604045823, "learning_rate": 3.738640548879166e-05, "loss": 0.2136, "loss_nan_ranks": 0, "loss_rank_avg": 0.20024099946022034, "step": 1090, "valid_targets_mean": 4600.0, "valid_targets_min": 295 }, { "epoch": 1.7464114832535884, "grad_norm": 0.4184329372379239, "learning_rate": 3.7346958506427696e-05, "loss": 0.2174, "loss_nan_ranks": 0, "loss_rank_avg": 0.20633798837661743, "step": 1095, "valid_targets_mean": 6165.7, "valid_targets_min": 4183 }, { "epoch": 1.7543859649122808, "grad_norm": 0.4797137007699827, "learning_rate": 3.730723719720523e-05, "loss": 0.2141, "loss_nan_ranks": 0, "loss_rank_avg": 0.21521145105361938, "step": 1100, "valid_targets_mean": 4948.5, "valid_targets_min": 238 }, { "epoch": 1.7623604465709728, "grad_norm": 0.464012546044584, "learning_rate": 3.7267242189281746e-05, "loss": 0.213, "loss_nan_ranks": 0, "loss_rank_avg": 0.2169262021780014, "step": 1105, "valid_targets_mean": 6075.7, "valid_targets_min": 2766 }, { "epoch": 1.7703349282296652, "grad_norm": 0.47591074751434326, "learning_rate": 3.722697411514305e-05, "loss": 0.2158, "loss_nan_ranks": 0, "loss_rank_avg": 0.22949981689453125, "step": 1110, "valid_targets_mean": 5401.1, "valid_targets_min": 251 }, { "epoch": 1.7783094098883572, "grad_norm": 0.4993896425623004, "learning_rate": 3.7186433611593225e-05, "loss": 0.2052, "loss_nan_ranks": 0, "loss_rank_avg": 0.1904512345790863, "step": 1115, "valid_targets_mean": 5432.9, "valid_targets_min": 238 }, { "epoch": 1.7862838915470496, "grad_norm": 0.45815865946027584, "learning_rate": 3.7145621319744614e-05, "loss": 0.2192, "loss_nan_ranks": 0, "loss_rank_avg": 0.2207677662372589, "step": 1120, "valid_targets_mean": 5302.4, "valid_targets_min": 193 }, { "epoch": 1.7942583732057416, "grad_norm": 0.4341993760317199, "learning_rate": 3.7104537885007635e-05, "loss": 0.2176, "loss_nan_ranks": 0, "loss_rank_avg": 0.21209567785263062, "step": 1125, "valid_targets_mean": 5470.0, "valid_targets_min": 291 }, { "epoch": 1.802232854864434, "grad_norm": 0.4329735980280842, "learning_rate": 3.7063183957080594e-05, "loss": 0.2219, "loss_nan_ranks": 0, "loss_rank_avg": 0.21948090195655823, "step": 1130, "valid_targets_mean": 6026.4, "valid_targets_min": 971 }, { "epoch": 1.810207336523126, "grad_norm": 0.4481414703783188, "learning_rate": 3.7021560189939416e-05, "loss": 0.2191, "loss_nan_ranks": 0, "loss_rank_avg": 0.2207806408405304, "step": 1135, "valid_targets_mean": 5682.9, "valid_targets_min": 1396 }, { "epoch": 1.8181818181818183, "grad_norm": 0.522534265852767, "learning_rate": 3.697966724182729e-05, "loss": 0.2026, "loss_nan_ranks": 0, "loss_rank_avg": 0.21881750226020813, "step": 1140, "valid_targets_mean": 5429.8, "valid_targets_min": 447 }, { "epoch": 1.8261562998405103, "grad_norm": 0.4974497276431288, "learning_rate": 3.6937505775244246e-05, "loss": 0.1947, "loss_nan_ranks": 0, "loss_rank_avg": 0.190834641456604, "step": 1145, "valid_targets_mean": 4105.1, "valid_targets_min": 215 }, { "epoch": 1.8341307814992025, "grad_norm": 0.4079277949685025, "learning_rate": 3.689507645693674e-05, "loss": 0.2247, "loss_nan_ranks": 0, "loss_rank_avg": 0.22405077517032623, "step": 1150, "valid_targets_mean": 5792.1, "valid_targets_min": 686 }, { "epoch": 1.8421052631578947, "grad_norm": 0.49811626292486966, "learning_rate": 3.6852379957887025e-05, "loss": 0.2173, "loss_nan_ranks": 0, "loss_rank_avg": 0.2030624896287918, "step": 1155, "valid_targets_mean": 5252.1, "valid_targets_min": 455 }, { "epoch": 1.8500797448165869, "grad_norm": 0.4204561756675584, "learning_rate": 3.6809416953302606e-05, "loss": 0.2132, "loss_nan_ranks": 0, "loss_rank_avg": 0.20025420188903809, "step": 1160, "valid_targets_mean": 5681.7, "valid_targets_min": 1357 }, { "epoch": 1.858054226475279, "grad_norm": 0.44519682325171034, "learning_rate": 3.676618812260553e-05, "loss": 0.1999, "loss_nan_ranks": 0, "loss_rank_avg": 0.21237683296203613, "step": 1165, "valid_targets_mean": 5172.7, "valid_targets_min": 315 }, { "epoch": 1.8660287081339713, "grad_norm": 0.39822025331588046, "learning_rate": 3.672269414942166e-05, "loss": 0.2119, "loss_nan_ranks": 0, "loss_rank_avg": 0.20583263039588928, "step": 1170, "valid_targets_mean": 6143.7, "valid_targets_min": 4416 }, { "epoch": 1.8740031897926634, "grad_norm": 0.4171821917382488, "learning_rate": 3.6678935721569825e-05, "loss": 0.2015, "loss_nan_ranks": 0, "loss_rank_avg": 0.19881102442741394, "step": 1175, "valid_targets_mean": 5497.3, "valid_targets_min": 315 }, { "epoch": 1.8819776714513556, "grad_norm": 0.4738173624083104, "learning_rate": 3.663491353105101e-05, "loss": 0.2101, "loss_nan_ranks": 0, "loss_rank_avg": 0.21670684218406677, "step": 1180, "valid_targets_mean": 4734.4, "valid_targets_min": 252 }, { "epoch": 1.8899521531100478, "grad_norm": 0.38986990747488626, "learning_rate": 3.659062827403735e-05, "loss": 0.2035, "loss_nan_ranks": 0, "loss_rank_avg": 0.19631826877593994, "step": 1185, "valid_targets_mean": 5470.2, "valid_targets_min": 544 }, { "epoch": 1.89792663476874, "grad_norm": 0.43069168920501544, "learning_rate": 3.654608065086115e-05, "loss": 0.2265, "loss_nan_ranks": 0, "loss_rank_avg": 0.22201283276081085, "step": 1190, "valid_targets_mean": 5315.6, "valid_targets_min": 1025 }, { "epoch": 1.9059011164274322, "grad_norm": 0.4756282213697449, "learning_rate": 3.650127136600379e-05, "loss": 0.2121, "loss_nan_ranks": 0, "loss_rank_avg": 0.20297697186470032, "step": 1195, "valid_targets_mean": 4748.2, "valid_targets_min": 220 }, { "epoch": 1.9138755980861244, "grad_norm": 0.42489920562160244, "learning_rate": 3.645620112808464e-05, "loss": 0.2062, "loss_nan_ranks": 0, "loss_rank_avg": 0.20593520998954773, "step": 1200, "valid_targets_mean": 5418.3, "valid_targets_min": 253 }, { "epoch": 1.9218500797448166, "grad_norm": 0.4334876163320044, "learning_rate": 3.641087064984977e-05, "loss": 0.2315, "loss_nan_ranks": 0, "loss_rank_avg": 0.22070161998271942, "step": 1205, "valid_targets_mean": 4694.1, "valid_targets_min": 258 }, { "epoch": 1.9298245614035088, "grad_norm": 0.4516336012066562, "learning_rate": 3.636528064816073e-05, "loss": 0.2119, "loss_nan_ranks": 0, "loss_rank_avg": 0.20581312477588654, "step": 1210, "valid_targets_mean": 4649.5, "valid_targets_min": 401 }, { "epoch": 1.937799043062201, "grad_norm": 0.4767246444943567, "learning_rate": 3.6319431843983223e-05, "loss": 0.2086, "loss_nan_ranks": 0, "loss_rank_avg": 0.21031825244426727, "step": 1215, "valid_targets_mean": 5190.2, "valid_targets_min": 1234 }, { "epoch": 1.9457735247208932, "grad_norm": 0.4411208057237242, "learning_rate": 3.6273324962375676e-05, "loss": 0.2169, "loss_nan_ranks": 0, "loss_rank_avg": 0.20570659637451172, "step": 1220, "valid_targets_mean": 4742.9, "valid_targets_min": 277 }, { "epoch": 1.9537480063795853, "grad_norm": 0.43422619282432606, "learning_rate": 3.622696073247777e-05, "loss": 0.2223, "loss_nan_ranks": 0, "loss_rank_avg": 0.23021955788135529, "step": 1225, "valid_targets_mean": 5510.6, "valid_targets_min": 220 }, { "epoch": 1.9617224880382775, "grad_norm": 0.3958863238593673, "learning_rate": 3.6180339887498953e-05, "loss": 0.2082, "loss_nan_ranks": 0, "loss_rank_avg": 0.21620529890060425, "step": 1230, "valid_targets_mean": 5932.4, "valid_targets_min": 3927 }, { "epoch": 1.9696969696969697, "grad_norm": 0.450040729571919, "learning_rate": 3.613346316470678e-05, "loss": 0.2142, "loss_nan_ranks": 0, "loss_rank_avg": 0.21761035919189453, "step": 1235, "valid_targets_mean": 5147.7, "valid_targets_min": 197 }, { "epoch": 1.977671451355662, "grad_norm": 0.41291052485814267, "learning_rate": 3.60863313054153e-05, "loss": 0.2093, "loss_nan_ranks": 0, "loss_rank_avg": 0.2143172323703766, "step": 1240, "valid_targets_mean": 5364.6, "valid_targets_min": 198 }, { "epoch": 1.985645933014354, "grad_norm": 0.4220642316941175, "learning_rate": 3.6038945054973334e-05, "loss": 0.2027, "loss_nan_ranks": 0, "loss_rank_avg": 0.18891289830207825, "step": 1245, "valid_targets_mean": 4778.4, "valid_targets_min": 350 }, { "epoch": 1.9936204146730463, "grad_norm": 0.41397715465144314, "learning_rate": 3.599130516275266e-05, "loss": 0.2081, "loss_nan_ranks": 0, "loss_rank_avg": 0.21088147163391113, "step": 1250, "valid_targets_mean": 5391.7, "valid_targets_min": 1017 }, { "epoch": 2.0015948963317385, "grad_norm": 0.3643446187203916, "learning_rate": 3.594341238213618e-05, "loss": 0.2026, "loss_nan_ranks": 0, "loss_rank_avg": 0.199854776263237, "step": 1255, "valid_targets_mean": 7008.9, "valid_targets_min": 1310 }, { "epoch": 2.0095693779904304, "grad_norm": 0.5089005502007752, "learning_rate": 3.589526747050601e-05, "loss": 0.1978, "loss_nan_ranks": 0, "loss_rank_avg": 0.19922807812690735, "step": 1260, "valid_targets_mean": 5693.9, "valid_targets_min": 253 }, { "epoch": 2.017543859649123, "grad_norm": 0.503959442172207, "learning_rate": 3.584687118923149e-05, "loss": 0.1918, "loss_nan_ranks": 0, "loss_rank_avg": 0.1943974494934082, "step": 1265, "valid_targets_mean": 4555.7, "valid_targets_min": 294 }, { "epoch": 2.025518341307815, "grad_norm": 0.479827670134503, "learning_rate": 3.579822430365714e-05, "loss": 0.2024, "loss_nan_ranks": 0, "loss_rank_avg": 0.20069649815559387, "step": 1270, "valid_targets_mean": 5865.2, "valid_targets_min": 319 }, { "epoch": 2.0334928229665072, "grad_norm": 0.531555659296794, "learning_rate": 3.57493275830906e-05, "loss": 0.2025, "loss_nan_ranks": 0, "loss_rank_avg": 0.18816310167312622, "step": 1275, "valid_targets_mean": 4013.8, "valid_targets_min": 257 }, { "epoch": 2.041467304625199, "grad_norm": 0.4535957632544287, "learning_rate": 3.570018180079037e-05, "loss": 0.1963, "loss_nan_ranks": 0, "loss_rank_avg": 0.182516947388649, "step": 1280, "valid_targets_mean": 4548.5, "valid_targets_min": 404 }, { "epoch": 2.0494417862838916, "grad_norm": 0.4102394127837868, "learning_rate": 3.5650787733953715e-05, "loss": 0.1967, "loss_nan_ranks": 0, "loss_rank_avg": 0.1951259821653366, "step": 1285, "valid_targets_mean": 5618.1, "valid_targets_min": 485 }, { "epoch": 2.0574162679425836, "grad_norm": 0.4455885359883081, "learning_rate": 3.560114616370425e-05, "loss": 0.1901, "loss_nan_ranks": 0, "loss_rank_avg": 0.18562662601470947, "step": 1290, "valid_targets_mean": 5641.9, "valid_targets_min": 1013 }, { "epoch": 2.065390749601276, "grad_norm": 0.428626874635782, "learning_rate": 3.555125787507964e-05, "loss": 0.1904, "loss_nan_ranks": 0, "loss_rank_avg": 0.18140408396720886, "step": 1295, "valid_targets_mean": 5703.9, "valid_targets_min": 880 }, { "epoch": 2.073365231259968, "grad_norm": 0.4584548418763648, "learning_rate": 3.550112365701921e-05, "loss": 0.1934, "loss_nan_ranks": 0, "loss_rank_avg": 0.18239644169807434, "step": 1300, "valid_targets_mean": 4791.1, "valid_targets_min": 306 }, { "epoch": 2.0813397129186604, "grad_norm": 0.43039743066547864, "learning_rate": 3.545074430235142e-05, "loss": 0.1952, "loss_nan_ranks": 0, "loss_rank_avg": 0.17609882354736328, "step": 1305, "valid_targets_mean": 5186.6, "valid_targets_min": 993 }, { "epoch": 2.0893141945773523, "grad_norm": 0.570297651690843, "learning_rate": 3.540012060778137e-05, "loss": 0.1953, "loss_nan_ranks": 0, "loss_rank_avg": 0.1940477192401886, "step": 1310, "valid_targets_mean": 5585.9, "valid_targets_min": 2335 }, { "epoch": 2.0972886762360448, "grad_norm": 0.5667347176037617, "learning_rate": 3.534925337387816e-05, "loss": 0.2077, "loss_nan_ranks": 0, "loss_rank_avg": 0.23207005858421326, "step": 1315, "valid_targets_mean": 4650.1, "valid_targets_min": 988 }, { "epoch": 2.1052631578947367, "grad_norm": 0.437965181451973, "learning_rate": 3.529814340506226e-05, "loss": 0.1944, "loss_nan_ranks": 0, "loss_rank_avg": 0.18409255146980286, "step": 1320, "valid_targets_mean": 5324.3, "valid_targets_min": 498 }, { "epoch": 2.113237639553429, "grad_norm": 0.48750716332724386, "learning_rate": 3.524679150959277e-05, "loss": 0.2052, "loss_nan_ranks": 0, "loss_rank_avg": 0.19646605849266052, "step": 1325, "valid_targets_mean": 5267.9, "valid_targets_min": 242 }, { "epoch": 2.121212121212121, "grad_norm": 0.4674875720772593, "learning_rate": 3.519519849955466e-05, "loss": 0.1934, "loss_nan_ranks": 0, "loss_rank_avg": 0.184675931930542, "step": 1330, "valid_targets_mean": 5060.6, "valid_targets_min": 231 }, { "epoch": 2.1291866028708135, "grad_norm": 0.412128726013319, "learning_rate": 3.514336519084591e-05, "loss": 0.2034, "loss_nan_ranks": 0, "loss_rank_avg": 0.19906136393547058, "step": 1335, "valid_targets_mean": 6195.8, "valid_targets_min": 1126 }, { "epoch": 2.1371610845295055, "grad_norm": 0.454372966625409, "learning_rate": 3.509129240316461e-05, "loss": 0.1961, "loss_nan_ranks": 0, "loss_rank_avg": 0.1770518273115158, "step": 1340, "valid_targets_mean": 4886.6, "valid_targets_min": 229 }, { "epoch": 2.145135566188198, "grad_norm": 0.41470060548444787, "learning_rate": 3.5038980959995985e-05, "loss": 0.2001, "loss_nan_ranks": 0, "loss_rank_avg": 0.21732914447784424, "step": 1345, "valid_targets_mean": 5456.9, "valid_targets_min": 431 }, { "epoch": 2.15311004784689, "grad_norm": 0.5082279794924567, "learning_rate": 3.498643168859941e-05, "loss": 0.195, "loss_nan_ranks": 0, "loss_rank_avg": 0.2050442099571228, "step": 1350, "valid_targets_mean": 3737.6, "valid_targets_min": 237 }, { "epoch": 2.1610845295055823, "grad_norm": 0.4465994627612317, "learning_rate": 3.493364541999529e-05, "loss": 0.1982, "loss_nan_ranks": 0, "loss_rank_avg": 0.1864827573299408, "step": 1355, "valid_targets_mean": 5549.5, "valid_targets_min": 265 }, { "epoch": 2.1690590111642742, "grad_norm": 0.4959175879648974, "learning_rate": 3.488062298895194e-05, "loss": 0.1926, "loss_nan_ranks": 0, "loss_rank_avg": 0.19287291169166565, "step": 1360, "valid_targets_mean": 5856.5, "valid_targets_min": 187 }, { "epoch": 2.1770334928229667, "grad_norm": 0.44527239357999826, "learning_rate": 3.482736523397237e-05, "loss": 0.1966, "loss_nan_ranks": 0, "loss_rank_avg": 0.1782650649547577, "step": 1365, "valid_targets_mean": 6042.2, "valid_targets_min": 283 }, { "epoch": 2.1850079744816586, "grad_norm": 0.48649563144503055, "learning_rate": 3.4773872997281026e-05, "loss": 0.1998, "loss_nan_ranks": 0, "loss_rank_avg": 0.19013699889183044, "step": 1370, "valid_targets_mean": 4519.7, "valid_targets_min": 234 }, { "epoch": 2.192982456140351, "grad_norm": 0.45009208736512063, "learning_rate": 3.472014712481048e-05, "loss": 0.2011, "loss_nan_ranks": 0, "loss_rank_avg": 0.20921623706817627, "step": 1375, "valid_targets_mean": 5785.2, "valid_targets_min": 1188 }, { "epoch": 2.200956937799043, "grad_norm": 0.47367304566980717, "learning_rate": 3.466618846618806e-05, "loss": 0.1865, "loss_nan_ranks": 0, "loss_rank_avg": 0.19029450416564941, "step": 1380, "valid_targets_mean": 4545.1, "valid_targets_min": 218 }, { "epoch": 2.2089314194577354, "grad_norm": 0.44532555731302303, "learning_rate": 3.461199787472238e-05, "loss": 0.1949, "loss_nan_ranks": 0, "loss_rank_avg": 0.2194649875164032, "step": 1385, "valid_targets_mean": 6045.2, "valid_targets_min": 353 }, { "epoch": 2.2169059011164274, "grad_norm": 0.4574540062857725, "learning_rate": 3.455757620738989e-05, "loss": 0.2019, "loss_nan_ranks": 0, "loss_rank_avg": 0.2010454535484314, "step": 1390, "valid_targets_mean": 5319.1, "valid_targets_min": 192 }, { "epoch": 2.22488038277512, "grad_norm": 0.4137662066758735, "learning_rate": 3.450292432482127e-05, "loss": 0.1936, "loss_nan_ranks": 0, "loss_rank_avg": 0.1860542595386505, "step": 1395, "valid_targets_mean": 5334.2, "valid_targets_min": 254 }, { "epoch": 2.2328548644338118, "grad_norm": 0.5266331960391181, "learning_rate": 3.444804309128789e-05, "loss": 0.19, "loss_nan_ranks": 0, "loss_rank_avg": 0.20332130789756775, "step": 1400, "valid_targets_mean": 4094.9, "valid_targets_min": 276 }, { "epoch": 2.240829346092504, "grad_norm": 0.4275504408813166, "learning_rate": 3.439293337468808e-05, "loss": 0.1886, "loss_nan_ranks": 0, "loss_rank_avg": 0.20420581102371216, "step": 1405, "valid_targets_mean": 5697.4, "valid_targets_min": 280 }, { "epoch": 2.248803827751196, "grad_norm": 0.6098551773610512, "learning_rate": 3.4337596046533426e-05, "loss": 0.2025, "loss_nan_ranks": 0, "loss_rank_avg": 0.2192438542842865, "step": 1410, "valid_targets_mean": 4067.2, "valid_targets_min": 273 }, { "epoch": 2.2567783094098885, "grad_norm": 0.46223066080996034, "learning_rate": 3.4282031981935e-05, "loss": 0.1949, "loss_nan_ranks": 0, "loss_rank_avg": 0.19895970821380615, "step": 1415, "valid_targets_mean": 5468.5, "valid_targets_min": 241 }, { "epoch": 2.2647527910685805, "grad_norm": 0.4816233736428177, "learning_rate": 3.42262420595895e-05, "loss": 0.1914, "loss_nan_ranks": 0, "loss_rank_avg": 0.20274695754051208, "step": 1420, "valid_targets_mean": 4453.4, "valid_targets_min": 243 }, { "epoch": 2.2727272727272725, "grad_norm": 0.5447011231170933, "learning_rate": 3.417022716176539e-05, "loss": 0.1957, "loss_nan_ranks": 0, "loss_rank_avg": 0.23817561566829681, "step": 1425, "valid_targets_mean": 4389.7, "valid_targets_min": 207 }, { "epoch": 2.280701754385965, "grad_norm": 0.4065575430290217, "learning_rate": 3.411398817428889e-05, "loss": 0.2022, "loss_nan_ranks": 0, "loss_rank_avg": 0.17134660482406616, "step": 1430, "valid_targets_mean": 5676.4, "valid_targets_min": 287 }, { "epoch": 2.2886762360446573, "grad_norm": 0.42839943743721853, "learning_rate": 3.4057525986530016e-05, "loss": 0.1921, "loss_nan_ranks": 0, "loss_rank_avg": 0.1901647001504898, "step": 1435, "valid_targets_mean": 5106.8, "valid_targets_min": 231 }, { "epoch": 2.2966507177033493, "grad_norm": 0.5843289079352976, "learning_rate": 3.400084149138851e-05, "loss": 0.1981, "loss_nan_ranks": 0, "loss_rank_avg": 0.19277843832969666, "step": 1440, "valid_targets_mean": 5061.8, "valid_targets_min": 248 }, { "epoch": 2.3046251993620412, "grad_norm": 0.41359975340834615, "learning_rate": 3.394393558527969e-05, "loss": 0.189, "loss_nan_ranks": 0, "loss_rank_avg": 0.1865783929824829, "step": 1445, "valid_targets_mean": 4914.6, "valid_targets_min": 215 }, { "epoch": 2.3125996810207337, "grad_norm": 0.8413467284644864, "learning_rate": 3.388680916812031e-05, "loss": 0.1935, "loss_nan_ranks": 0, "loss_rank_avg": 0.19681130349636078, "step": 1450, "valid_targets_mean": 3662.1, "valid_targets_min": 231 }, { "epoch": 2.320574162679426, "grad_norm": 0.42971911311204314, "learning_rate": 3.382946314331429e-05, "loss": 0.2018, "loss_nan_ranks": 0, "loss_rank_avg": 0.1996922791004181, "step": 1455, "valid_targets_mean": 5618.2, "valid_targets_min": 238 }, { "epoch": 2.328548644338118, "grad_norm": 0.44153231073372906, "learning_rate": 3.377189841773848e-05, "loss": 0.1869, "loss_nan_ranks": 0, "loss_rank_avg": 0.1980620175600052, "step": 1460, "valid_targets_mean": 6170.3, "valid_targets_min": 231 }, { "epoch": 2.33652312599681, "grad_norm": 0.5293878213403573, "learning_rate": 3.371411590172827e-05, "loss": 0.1906, "loss_nan_ranks": 0, "loss_rank_avg": 0.18319925665855408, "step": 1465, "valid_targets_mean": 5088.3, "valid_targets_min": 293 }, { "epoch": 2.3444976076555024, "grad_norm": 0.6426703391266552, "learning_rate": 3.365611650906321e-05, "loss": 0.2076, "loss_nan_ranks": 0, "loss_rank_avg": 0.20919805765151978, "step": 1470, "valid_targets_mean": 4000.6, "valid_targets_min": 245 }, { "epoch": 2.352472089314195, "grad_norm": 0.3978379280431999, "learning_rate": 3.359790115695259e-05, "loss": 0.1828, "loss_nan_ranks": 0, "loss_rank_avg": 0.18329757452011108, "step": 1475, "valid_targets_mean": 5595.2, "valid_targets_min": 236 }, { "epoch": 2.360446570972887, "grad_norm": 0.4545853833674734, "learning_rate": 3.353947076602088e-05, "loss": 0.1964, "loss_nan_ranks": 0, "loss_rank_avg": 0.20800280570983887, "step": 1480, "valid_targets_mean": 4826.0, "valid_targets_min": 240 }, { "epoch": 2.3684210526315788, "grad_norm": 0.44645999692405564, "learning_rate": 3.34808262602932e-05, "loss": 0.2067, "loss_nan_ranks": 0, "loss_rank_avg": 0.20406398177146912, "step": 1485, "valid_targets_mean": 5473.4, "valid_targets_min": 352 }, { "epoch": 2.376395534290271, "grad_norm": 0.445133870638968, "learning_rate": 3.342196856718074e-05, "loss": 0.196, "loss_nan_ranks": 0, "loss_rank_avg": 0.2017001211643219, "step": 1490, "valid_targets_mean": 6088.2, "valid_targets_min": 661 }, { "epoch": 2.384370015948963, "grad_norm": 0.597332937011485, "learning_rate": 3.336289861746602e-05, "loss": 0.1933, "loss_nan_ranks": 0, "loss_rank_avg": 0.19852346181869507, "step": 1495, "valid_targets_mean": 4930.6, "valid_targets_min": 234 }, { "epoch": 2.3923444976076556, "grad_norm": 0.45394616672617394, "learning_rate": 3.330361734528823e-05, "loss": 0.2008, "loss_nan_ranks": 0, "loss_rank_avg": 0.190562903881073, "step": 1500, "valid_targets_mean": 4513.7, "valid_targets_min": 471 }, { "epoch": 2.4003189792663475, "grad_norm": 0.4805966610484533, "learning_rate": 3.324412568812844e-05, "loss": 0.1841, "loss_nan_ranks": 0, "loss_rank_avg": 0.20358845591545105, "step": 1505, "valid_targets_mean": 4287.1, "valid_targets_min": 242 }, { "epoch": 2.40829346092504, "grad_norm": 0.42131026059287974, "learning_rate": 3.318442458679477e-05, "loss": 0.2057, "loss_nan_ranks": 0, "loss_rank_avg": 0.19886666536331177, "step": 1510, "valid_targets_mean": 5740.6, "valid_targets_min": 1204 }, { "epoch": 2.416267942583732, "grad_norm": 0.4625097603216523, "learning_rate": 3.312451498540751e-05, "loss": 0.2086, "loss_nan_ranks": 0, "loss_rank_avg": 0.2181396782398224, "step": 1515, "valid_targets_mean": 4945.9, "valid_targets_min": 208 }, { "epoch": 2.4242424242424243, "grad_norm": 0.7157764991804577, "learning_rate": 3.306439783138421e-05, "loss": 0.2016, "loss_nan_ranks": 0, "loss_rank_avg": 0.18493902683258057, "step": 1520, "valid_targets_mean": 4290.6, "valid_targets_min": 233 }, { "epoch": 2.4322169059011163, "grad_norm": 0.48585805226131235, "learning_rate": 3.3004074075424666e-05, "loss": 0.1971, "loss_nan_ranks": 0, "loss_rank_avg": 0.1977916955947876, "step": 1525, "valid_targets_mean": 4688.1, "valid_targets_min": 371 }, { "epoch": 2.4401913875598087, "grad_norm": 0.4127665889358799, "learning_rate": 3.29435446714959e-05, "loss": 0.1918, "loss_nan_ranks": 0, "loss_rank_avg": 0.21614857017993927, "step": 1530, "valid_targets_mean": 5571.1, "valid_targets_min": 247 }, { "epoch": 2.4481658692185007, "grad_norm": 0.42425666745682966, "learning_rate": 3.288281057681709e-05, "loss": 0.2026, "loss_nan_ranks": 0, "loss_rank_avg": 0.20173463225364685, "step": 1535, "valid_targets_mean": 5986.9, "valid_targets_min": 3398 }, { "epoch": 2.456140350877193, "grad_norm": 0.4248076718805002, "learning_rate": 3.28218727518444e-05, "loss": 0.1986, "loss_nan_ranks": 0, "loss_rank_avg": 0.1972285509109497, "step": 1540, "valid_targets_mean": 6004.7, "valid_targets_min": 312 }, { "epoch": 2.464114832535885, "grad_norm": 0.3922347541694817, "learning_rate": 3.2760732160255835e-05, "loss": 0.191, "loss_nan_ranks": 0, "loss_rank_avg": 0.18398353457450867, "step": 1545, "valid_targets_mean": 5221.8, "valid_targets_min": 257 }, { "epoch": 2.4720893141945774, "grad_norm": 0.4303243717469087, "learning_rate": 3.269938976893595e-05, "loss": 0.2019, "loss_nan_ranks": 0, "loss_rank_avg": 0.21553900837898254, "step": 1550, "valid_targets_mean": 5332.7, "valid_targets_min": 385 }, { "epoch": 2.4800637958532694, "grad_norm": 0.4854770545469238, "learning_rate": 3.2637846547960596e-05, "loss": 0.1945, "loss_nan_ranks": 0, "loss_rank_avg": 0.17565301060676575, "step": 1555, "valid_targets_mean": 4513.3, "valid_targets_min": 265 }, { "epoch": 2.488038277511962, "grad_norm": 0.43977338387056625, "learning_rate": 3.2576103470581564e-05, "loss": 0.188, "loss_nan_ranks": 0, "loss_rank_avg": 0.19088605046272278, "step": 1560, "valid_targets_mean": 4912.8, "valid_targets_min": 237 }, { "epoch": 2.496012759170654, "grad_norm": 0.4520785254838387, "learning_rate": 3.25141615132112e-05, "loss": 0.191, "loss_nan_ranks": 0, "loss_rank_avg": 0.20245029032230377, "step": 1565, "valid_targets_mean": 5112.1, "valid_targets_min": 897 }, { "epoch": 2.503987240829346, "grad_norm": 0.5068509455429572, "learning_rate": 3.245202165540697e-05, "loss": 0.1907, "loss_nan_ranks": 0, "loss_rank_avg": 0.19341543316841125, "step": 1570, "valid_targets_mean": 4056.7, "valid_targets_min": 234 }, { "epoch": 2.511961722488038, "grad_norm": 0.5435007785354973, "learning_rate": 3.238968487985594e-05, "loss": 0.2003, "loss_nan_ranks": 0, "loss_rank_avg": 0.22572636604309082, "step": 1575, "valid_targets_mean": 5079.7, "valid_targets_min": 470 }, { "epoch": 2.5199362041467306, "grad_norm": 0.45017998405884907, "learning_rate": 3.232715217235927e-05, "loss": 0.1912, "loss_nan_ranks": 0, "loss_rank_avg": 0.1891011893749237, "step": 1580, "valid_targets_mean": 4659.2, "valid_targets_min": 269 }, { "epoch": 2.5279106858054226, "grad_norm": 0.46614430155117725, "learning_rate": 3.226442452181662e-05, "loss": 0.1958, "loss_nan_ranks": 0, "loss_rank_avg": 0.21900171041488647, "step": 1585, "valid_targets_mean": 4712.8, "valid_targets_min": 290 }, { "epoch": 2.535885167464115, "grad_norm": 0.4179797529076482, "learning_rate": 3.220150292021049e-05, "loss": 0.2014, "loss_nan_ranks": 0, "loss_rank_avg": 0.20042002201080322, "step": 1590, "valid_targets_mean": 5453.1, "valid_targets_min": 397 }, { "epoch": 2.543859649122807, "grad_norm": 0.3941065291864704, "learning_rate": 3.213838836259055e-05, "loss": 0.1877, "loss_nan_ranks": 0, "loss_rank_avg": 0.1991400420665741, "step": 1595, "valid_targets_mean": 6182.4, "valid_targets_min": 1366 }, { "epoch": 2.5518341307814993, "grad_norm": 0.5251204241670916, "learning_rate": 3.2075081847057886e-05, "loss": 0.192, "loss_nan_ranks": 0, "loss_rank_avg": 0.1915452778339386, "step": 1600, "valid_targets_mean": 5069.6, "valid_targets_min": 315 }, { "epoch": 2.5598086124401913, "grad_norm": 0.4344757969866471, "learning_rate": 3.201158437474925e-05, "loss": 0.2098, "loss_nan_ranks": 0, "loss_rank_avg": 0.20345640182495117, "step": 1605, "valid_targets_mean": 5158.1, "valid_targets_min": 291 }, { "epoch": 2.5677830940988837, "grad_norm": 0.486960352408697, "learning_rate": 3.194789694982119e-05, "loss": 0.2066, "loss_nan_ranks": 0, "loss_rank_avg": 0.20748808979988098, "step": 1610, "valid_targets_mean": 4422.7, "valid_targets_min": 313 }, { "epoch": 2.5757575757575757, "grad_norm": 0.40817659538238277, "learning_rate": 3.1884020579434216e-05, "loss": 0.1962, "loss_nan_ranks": 0, "loss_rank_avg": 0.19428619742393494, "step": 1615, "valid_targets_mean": 5725.4, "valid_targets_min": 1368 }, { "epoch": 2.583732057416268, "grad_norm": 0.5274105752709692, "learning_rate": 3.181995627373679e-05, "loss": 0.2008, "loss_nan_ranks": 0, "loss_rank_avg": 0.1966966688632965, "step": 1620, "valid_targets_mean": 4958.5, "valid_targets_min": 244 }, { "epoch": 2.59170653907496, "grad_norm": 0.6069953846941016, "learning_rate": 3.1755705045849465e-05, "loss": 0.2006, "loss_nan_ranks": 0, "loss_rank_avg": 0.21730463206768036, "step": 1625, "valid_targets_mean": 5876.8, "valid_targets_min": 231 }, { "epoch": 2.5996810207336525, "grad_norm": 0.4266434532453334, "learning_rate": 3.1691267911848765e-05, "loss": 0.1997, "loss_nan_ranks": 0, "loss_rank_avg": 0.19540351629257202, "step": 1630, "valid_targets_mean": 6337.5, "valid_targets_min": 1361 }, { "epoch": 2.6076555023923444, "grad_norm": 0.4740580478639372, "learning_rate": 3.1626645890751167e-05, "loss": 0.194, "loss_nan_ranks": 0, "loss_rank_avg": 0.20163899660110474, "step": 1635, "valid_targets_mean": 4218.8, "valid_targets_min": 375 }, { "epoch": 2.6156299840510364, "grad_norm": 0.45637845415807304, "learning_rate": 3.156184000449697e-05, "loss": 0.1913, "loss_nan_ranks": 0, "loss_rank_avg": 0.20877380669116974, "step": 1640, "valid_targets_mean": 5568.1, "valid_targets_min": 1781 }, { "epoch": 2.623604465709729, "grad_norm": 0.4308877600902401, "learning_rate": 3.149685127793415e-05, "loss": 0.2019, "loss_nan_ranks": 0, "loss_rank_avg": 0.18682101368904114, "step": 1645, "valid_targets_mean": 5184.0, "valid_targets_min": 234 }, { "epoch": 2.6315789473684212, "grad_norm": 0.4189163208718231, "learning_rate": 3.143168073880214e-05, "loss": 0.1924, "loss_nan_ranks": 0, "loss_rank_avg": 0.18947117030620575, "step": 1650, "valid_targets_mean": 7086.4, "valid_targets_min": 3741 }, { "epoch": 2.639553429027113, "grad_norm": 0.5597913294956877, "learning_rate": 3.1366329417715556e-05, "loss": 0.1994, "loss_nan_ranks": 0, "loss_rank_avg": 0.20389412343502045, "step": 1655, "valid_targets_mean": 2807.3, "valid_targets_min": 245 }, { "epoch": 2.647527910685805, "grad_norm": 0.4577649992315954, "learning_rate": 3.1300798348147954e-05, "loss": 0.203, "loss_nan_ranks": 0, "loss_rank_avg": 0.21411626040935516, "step": 1660, "valid_targets_mean": 4915.6, "valid_targets_min": 244 }, { "epoch": 2.6555023923444976, "grad_norm": 0.5697741917006428, "learning_rate": 3.123508856641542e-05, "loss": 0.1887, "loss_nan_ranks": 0, "loss_rank_avg": 0.18438398838043213, "step": 1665, "valid_targets_mean": 2729.6, "valid_targets_min": 212 }, { "epoch": 2.66347687400319, "grad_norm": 0.4954551623019788, "learning_rate": 3.116920111166025e-05, "loss": 0.1923, "loss_nan_ranks": 0, "loss_rank_avg": 0.19248652458190918, "step": 1670, "valid_targets_mean": 5454.8, "valid_targets_min": 1300 }, { "epoch": 2.671451355661882, "grad_norm": 0.6574670833738052, "learning_rate": 3.1103137025834456e-05, "loss": 0.1985, "loss_nan_ranks": 0, "loss_rank_avg": 0.20095154643058777, "step": 1675, "valid_targets_mean": 4381.1, "valid_targets_min": 227 }, { "epoch": 2.679425837320574, "grad_norm": 0.5132611155528096, "learning_rate": 3.103689735368333e-05, "loss": 0.1927, "loss_nan_ranks": 0, "loss_rank_avg": 0.1844911277294159, "step": 1680, "valid_targets_mean": 5391.4, "valid_targets_min": 252 }, { "epoch": 2.6874003189792663, "grad_norm": 0.4212211839126058, "learning_rate": 3.097048314272889e-05, "loss": 0.1864, "loss_nan_ranks": 0, "loss_rank_avg": 0.18505148589611053, "step": 1685, "valid_targets_mean": 5102.6, "valid_targets_min": 300 }, { "epoch": 2.6953748006379588, "grad_norm": 0.4423902059794495, "learning_rate": 3.090389544325335e-05, "loss": 0.1873, "loss_nan_ranks": 0, "loss_rank_avg": 0.1688818335533142, "step": 1690, "valid_targets_mean": 4878.3, "valid_targets_min": 324 }, { "epoch": 2.7033492822966507, "grad_norm": 0.5581123858755366, "learning_rate": 3.08371353082825e-05, "loss": 0.1986, "loss_nan_ranks": 0, "loss_rank_avg": 0.19731852412223816, "step": 1695, "valid_targets_mean": 3715.7, "valid_targets_min": 251 }, { "epoch": 2.7113237639553427, "grad_norm": 0.42350710595986724, "learning_rate": 3.0770203793568994e-05, "loss": 0.1864, "loss_nan_ranks": 0, "loss_rank_avg": 0.16717937588691711, "step": 1700, "valid_targets_mean": 4077.0, "valid_targets_min": 233 }, { "epoch": 2.719298245614035, "grad_norm": 0.49090848376444596, "learning_rate": 3.0703101957575765e-05, "loss": 0.1815, "loss_nan_ranks": 0, "loss_rank_avg": 0.15885134041309357, "step": 1705, "valid_targets_mean": 4482.4, "valid_targets_min": 243 }, { "epoch": 2.7272727272727275, "grad_norm": 0.6436929861619126, "learning_rate": 3.0635830861459204e-05, "loss": 0.1885, "loss_nan_ranks": 0, "loss_rank_avg": 0.18233323097229004, "step": 1710, "valid_targets_mean": 4834.9, "valid_targets_min": 195 }, { "epoch": 2.7352472089314195, "grad_norm": 0.46088720776870845, "learning_rate": 3.056839156905239e-05, "loss": 0.1983, "loss_nan_ranks": 0, "loss_rank_avg": 0.1806366741657257, "step": 1715, "valid_targets_mean": 4546.9, "valid_targets_min": 237 }, { "epoch": 2.7432216905901115, "grad_norm": 0.4474922756938493, "learning_rate": 3.0500785146848303e-05, "loss": 0.1911, "loss_nan_ranks": 0, "loss_rank_avg": 0.22203987836837769, "step": 1720, "valid_targets_mean": 5486.4, "valid_targets_min": 3263 }, { "epoch": 2.751196172248804, "grad_norm": 0.4954321658053421, "learning_rate": 3.04330126639829e-05, "loss": 0.1929, "loss_nan_ranks": 0, "loss_rank_avg": 0.19901606440544128, "step": 1725, "valid_targets_mean": 4870.5, "valid_targets_min": 344 }, { "epoch": 2.7591706539074963, "grad_norm": 0.4289601290987771, "learning_rate": 3.0365075192218278e-05, "loss": 0.1855, "loss_nan_ranks": 0, "loss_rank_avg": 0.18361328542232513, "step": 1730, "valid_targets_mean": 5532.9, "valid_targets_min": 361 }, { "epoch": 2.7671451355661882, "grad_norm": 0.43515257338738716, "learning_rate": 3.0296973805925663e-05, "loss": 0.1953, "loss_nan_ranks": 0, "loss_rank_avg": 0.1985451728105545, "step": 1735, "valid_targets_mean": 4923.9, "valid_targets_min": 205 }, { "epoch": 2.77511961722488, "grad_norm": 0.49286906233457306, "learning_rate": 3.022870958206845e-05, "loss": 0.1901, "loss_nan_ranks": 0, "loss_rank_avg": 0.22014012932777405, "step": 1740, "valid_targets_mean": 4225.8, "valid_targets_min": 241 }, { "epoch": 2.7830940988835726, "grad_norm": 0.46268729106701734, "learning_rate": 3.0160283600185168e-05, "loss": 0.1977, "loss_nan_ranks": 0, "loss_rank_avg": 0.1991043984889984, "step": 1745, "valid_targets_mean": 5857.8, "valid_targets_min": 2502 }, { "epoch": 2.7910685805422646, "grad_norm": 0.43987550309271245, "learning_rate": 3.0091696942372412e-05, "loss": 0.1939, "loss_nan_ranks": 0, "loss_rank_avg": 0.22454778850078583, "step": 1750, "valid_targets_mean": 5287.6, "valid_targets_min": 426 }, { "epoch": 2.799043062200957, "grad_norm": 0.3909802203598762, "learning_rate": 3.002295069326772e-05, "loss": 0.1953, "loss_nan_ranks": 0, "loss_rank_avg": 0.18474428355693817, "step": 1755, "valid_targets_mean": 6217.1, "valid_targets_min": 798 }, { "epoch": 2.807017543859649, "grad_norm": 0.4519033373142686, "learning_rate": 2.9954045940032423e-05, "loss": 0.1995, "loss_nan_ranks": 0, "loss_rank_avg": 0.2228385955095291, "step": 1760, "valid_targets_mean": 4893.2, "valid_targets_min": 796 }, { "epoch": 2.8149920255183414, "grad_norm": 0.443167897058933, "learning_rate": 2.988498377233446e-05, "loss": 0.1957, "loss_nan_ranks": 0, "loss_rank_avg": 0.19619905948638916, "step": 1765, "valid_targets_mean": 4660.5, "valid_targets_min": 537 }, { "epoch": 2.8229665071770333, "grad_norm": 0.40577323628578027, "learning_rate": 2.981576528233114e-05, "loss": 0.1875, "loss_nan_ranks": 0, "loss_rank_avg": 0.1754124015569687, "step": 1770, "valid_targets_mean": 5301.9, "valid_targets_min": 1010 }, { "epoch": 2.8309409888357258, "grad_norm": 0.7482306867842724, "learning_rate": 2.9746391564651867e-05, "loss": 0.1858, "loss_nan_ranks": 0, "loss_rank_avg": 0.19741225242614746, "step": 1775, "valid_targets_mean": 5149.7, "valid_targets_min": 442 }, { "epoch": 2.8389154704944177, "grad_norm": 0.4247278253753553, "learning_rate": 2.9676863716380845e-05, "loss": 0.1809, "loss_nan_ranks": 0, "loss_rank_avg": 0.17590616643428802, "step": 1780, "valid_targets_mean": 4805.6, "valid_targets_min": 245 }, { "epoch": 2.84688995215311, "grad_norm": 0.3967661509113751, "learning_rate": 2.9607182837039697e-05, "loss": 0.1945, "loss_nan_ranks": 0, "loss_rank_avg": 0.19023631513118744, "step": 1785, "valid_targets_mean": 5670.9, "valid_targets_min": 342 }, { "epoch": 2.854864433811802, "grad_norm": 0.469096556872057, "learning_rate": 2.9537350028570126e-05, "loss": 0.1982, "loss_nan_ranks": 0, "loss_rank_avg": 0.1898074746131897, "step": 1790, "valid_targets_mean": 5681.8, "valid_targets_min": 589 }, { "epoch": 2.8628389154704945, "grad_norm": 0.47473047259461487, "learning_rate": 2.946736639531643e-05, "loss": 0.1922, "loss_nan_ranks": 0, "loss_rank_avg": 0.18150553107261658, "step": 1795, "valid_targets_mean": 3808.1, "valid_targets_min": 222 }, { "epoch": 2.8708133971291865, "grad_norm": 0.5204904028442524, "learning_rate": 2.9397233044008092e-05, "loss": 0.1949, "loss_nan_ranks": 0, "loss_rank_avg": 0.23707595467567444, "step": 1800, "valid_targets_mean": 4178.8, "valid_targets_min": 220 }, { "epoch": 2.878787878787879, "grad_norm": 0.47501836141359854, "learning_rate": 2.9326951083742243e-05, "loss": 0.1874, "loss_nan_ranks": 0, "loss_rank_avg": 0.19446857273578644, "step": 1805, "valid_targets_mean": 4535.6, "valid_targets_min": 389 }, { "epoch": 2.886762360446571, "grad_norm": 0.42948864890631583, "learning_rate": 2.925652162596613e-05, "loss": 0.1808, "loss_nan_ranks": 0, "loss_rank_avg": 0.17343220114707947, "step": 1810, "valid_targets_mean": 4889.4, "valid_targets_min": 236 }, { "epoch": 2.8947368421052633, "grad_norm": 0.5059534986758673, "learning_rate": 2.9185945784459558e-05, "loss": 0.1953, "loss_nan_ranks": 0, "loss_rank_avg": 0.2241000235080719, "step": 1815, "valid_targets_mean": 5150.2, "valid_targets_min": 330 }, { "epoch": 2.9027113237639552, "grad_norm": 0.47658050657237366, "learning_rate": 2.9115224675317252e-05, "loss": 0.1884, "loss_nan_ranks": 0, "loss_rank_avg": 0.21023055911064148, "step": 1820, "valid_targets_mean": 4221.5, "valid_targets_min": 214 }, { "epoch": 2.9106858054226477, "grad_norm": 0.41994426403573426, "learning_rate": 2.9044359416931206e-05, "loss": 0.1975, "loss_nan_ranks": 0, "loss_rank_avg": 0.1868569403886795, "step": 1825, "valid_targets_mean": 5305.3, "valid_targets_min": 350 }, { "epoch": 2.9186602870813396, "grad_norm": 0.41704691170495495, "learning_rate": 2.897335112997302e-05, "loss": 0.1977, "loss_nan_ranks": 0, "loss_rank_avg": 0.18512971699237823, "step": 1830, "valid_targets_mean": 5721.6, "valid_targets_min": 1638 }, { "epoch": 2.926634768740032, "grad_norm": 0.44070738637909757, "learning_rate": 2.8902200937376173e-05, "loss": 0.196, "loss_nan_ranks": 0, "loss_rank_avg": 0.187473863363266, "step": 1835, "valid_targets_mean": 4991.3, "valid_targets_min": 220 }, { "epoch": 2.934609250398724, "grad_norm": 0.41564417066878323, "learning_rate": 2.8830909964318242e-05, "loss": 0.1865, "loss_nan_ranks": 0, "loss_rank_avg": 0.1944010853767395, "step": 1840, "valid_targets_mean": 5204.4, "valid_targets_min": 254 }, { "epoch": 2.9425837320574164, "grad_norm": 0.4711330801343301, "learning_rate": 2.875947933820312e-05, "loss": 0.1909, "loss_nan_ranks": 0, "loss_rank_avg": 0.18439987301826477, "step": 1845, "valid_targets_mean": 4334.9, "valid_targets_min": 358 }, { "epoch": 2.9505582137161084, "grad_norm": 0.4312204583935454, "learning_rate": 2.868791018864321e-05, "loss": 0.1933, "loss_nan_ranks": 0, "loss_rank_avg": 0.2141954004764557, "step": 1850, "valid_targets_mean": 5918.7, "valid_targets_min": 729 }, { "epoch": 2.958532695374801, "grad_norm": 0.3992293087829351, "learning_rate": 2.861620364744151e-05, "loss": 0.1956, "loss_nan_ranks": 0, "loss_rank_avg": 0.1783233880996704, "step": 1855, "valid_targets_mean": 5647.2, "valid_targets_min": 265 }, { "epoch": 2.9665071770334928, "grad_norm": 0.4507956223008353, "learning_rate": 2.854436084857379e-05, "loss": 0.186, "loss_nan_ranks": 0, "loss_rank_avg": 0.17667381465435028, "step": 1860, "valid_targets_mean": 4852.1, "valid_targets_min": 213 }, { "epoch": 2.974481658692185, "grad_norm": 0.4773163155858111, "learning_rate": 2.847238292817057e-05, "loss": 0.1976, "loss_nan_ranks": 0, "loss_rank_avg": 0.20969876646995544, "step": 1865, "valid_targets_mean": 4586.2, "valid_targets_min": 445 }, { "epoch": 2.982456140350877, "grad_norm": 0.4528434719614539, "learning_rate": 2.8400271024499212e-05, "loss": 0.1935, "loss_nan_ranks": 0, "loss_rank_avg": 0.2054166942834854, "step": 1870, "valid_targets_mean": 4955.4, "valid_targets_min": 226 }, { "epoch": 2.990430622009569, "grad_norm": 0.3885619872358622, "learning_rate": 2.832802627794593e-05, "loss": 0.1919, "loss_nan_ranks": 0, "loss_rank_avg": 0.1787319779396057, "step": 1875, "valid_targets_mean": 5796.7, "valid_targets_min": 237 }, { "epoch": 2.9984051036682615, "grad_norm": 0.42804120084625014, "learning_rate": 2.8255649830997704e-05, "loss": 0.1853, "loss_nan_ranks": 0, "loss_rank_avg": 0.17473948001861572, "step": 1880, "valid_targets_mean": 5018.7, "valid_targets_min": 268 }, { "epoch": 3.006379585326954, "grad_norm": 0.433732961845131, "learning_rate": 2.8183142828224238e-05, "loss": 0.1856, "loss_nan_ranks": 0, "loss_rank_avg": 0.17086060345172882, "step": 1885, "valid_targets_mean": 5365.8, "valid_targets_min": 974 }, { "epoch": 3.014354066985646, "grad_norm": 0.4863024499849261, "learning_rate": 2.811050641625988e-05, "loss": 0.1787, "loss_nan_ranks": 0, "loss_rank_avg": 0.191526398062706, "step": 1890, "valid_targets_mean": 5307.4, "valid_targets_min": 280 }, { "epoch": 3.0223285486443383, "grad_norm": 0.4706758519016476, "learning_rate": 2.8037741743785458e-05, "loss": 0.1817, "loss_nan_ranks": 0, "loss_rank_avg": 0.18275225162506104, "step": 1895, "valid_targets_mean": 5210.0, "valid_targets_min": 1063 }, { "epoch": 3.0303030303030303, "grad_norm": 0.48525571024905406, "learning_rate": 2.796484996151013e-05, "loss": 0.1832, "loss_nan_ranks": 0, "loss_rank_avg": 0.1842869222164154, "step": 1900, "valid_targets_mean": 4938.5, "valid_targets_min": 346 }, { "epoch": 3.0382775119617227, "grad_norm": 0.412438730549393, "learning_rate": 2.7891832222153188e-05, "loss": 0.1752, "loss_nan_ranks": 0, "loss_rank_avg": 0.17894425988197327, "step": 1905, "valid_targets_mean": 6566.9, "valid_targets_min": 3239 }, { "epoch": 3.0462519936204147, "grad_norm": 0.4304985686601505, "learning_rate": 2.7818689680425807e-05, "loss": 0.1746, "loss_nan_ranks": 0, "loss_rank_avg": 0.17525765299797058, "step": 1910, "valid_targets_mean": 5481.5, "valid_targets_min": 217 }, { "epoch": 3.054226475279107, "grad_norm": 0.3943796487066891, "learning_rate": 2.7745423493012827e-05, "loss": 0.1758, "loss_nan_ranks": 0, "loss_rank_avg": 0.17475299537181854, "step": 1915, "valid_targets_mean": 5954.4, "valid_targets_min": 286 }, { "epoch": 3.062200956937799, "grad_norm": 0.4539894149791786, "learning_rate": 2.767203481855441e-05, "loss": 0.1799, "loss_nan_ranks": 0, "loss_rank_avg": 0.19275791943073273, "step": 1920, "valid_targets_mean": 5459.8, "valid_targets_min": 715 }, { "epoch": 3.0701754385964914, "grad_norm": 0.5140612143362417, "learning_rate": 2.7598524817627764e-05, "loss": 0.1778, "loss_nan_ranks": 0, "loss_rank_avg": 0.18038983643054962, "step": 1925, "valid_targets_mean": 5190.4, "valid_targets_min": 253 }, { "epoch": 3.0781499202551834, "grad_norm": 0.5065917391396272, "learning_rate": 2.7524894652728754e-05, "loss": 0.1739, "loss_nan_ranks": 0, "loss_rank_avg": 0.17167213559150696, "step": 1930, "valid_targets_mean": 5318.8, "valid_targets_min": 210 }, { "epoch": 3.0861244019138754, "grad_norm": 0.4869400509228171, "learning_rate": 2.7451145488253544e-05, "loss": 0.1774, "loss_nan_ranks": 0, "loss_rank_avg": 0.19056691229343414, "step": 1935, "valid_targets_mean": 4080.8, "valid_targets_min": 198 }, { "epoch": 3.094098883572568, "grad_norm": 0.43805490959459653, "learning_rate": 2.7377278490480157e-05, "loss": 0.1741, "loss_nan_ranks": 0, "loss_rank_avg": 0.18080243468284607, "step": 1940, "valid_targets_mean": 5616.9, "valid_targets_min": 1092 }, { "epoch": 3.1020733652312598, "grad_norm": 0.5757191060457126, "learning_rate": 2.730329482755006e-05, "loss": 0.1829, "loss_nan_ranks": 0, "loss_rank_avg": 0.19692851603031158, "step": 1945, "valid_targets_mean": 4502.3, "valid_targets_min": 285 }, { "epoch": 3.110047846889952, "grad_norm": 0.4558677202034122, "learning_rate": 2.7229195669449667e-05, "loss": 0.1938, "loss_nan_ranks": 0, "loss_rank_avg": 0.19101294875144958, "step": 1950, "valid_targets_mean": 5041.2, "valid_targets_min": 213 }, { "epoch": 3.118022328548644, "grad_norm": 0.5737066377290475, "learning_rate": 2.7154982187991855e-05, "loss": 0.1745, "loss_nan_ranks": 0, "loss_rank_avg": 0.17446887493133545, "step": 1955, "valid_targets_mean": 4123.6, "valid_targets_min": 164 }, { "epoch": 3.1259968102073366, "grad_norm": 0.4748676581841484, "learning_rate": 2.7080655556797406e-05, "loss": 0.1726, "loss_nan_ranks": 0, "loss_rank_avg": 0.1776636242866516, "step": 1960, "valid_targets_mean": 4680.4, "valid_targets_min": 277 }, { "epoch": 3.1339712918660285, "grad_norm": 0.6049727128355192, "learning_rate": 2.700621695127649e-05, "loss": 0.1865, "loss_nan_ranks": 0, "loss_rank_avg": 0.19648462533950806, "step": 1965, "valid_targets_mean": 3179.7, "valid_targets_min": 239 }, { "epoch": 3.141945773524721, "grad_norm": 0.904407825912653, "learning_rate": 2.693166754861003e-05, "loss": 0.1773, "loss_nan_ranks": 0, "loss_rank_avg": 0.16663089394569397, "step": 1970, "valid_targets_mean": 5391.8, "valid_targets_min": 944 }, { "epoch": 3.149920255183413, "grad_norm": 0.4709363791045733, "learning_rate": 2.685700852773113e-05, "loss": 0.187, "loss_nan_ranks": 0, "loss_rank_avg": 0.18905910849571228, "step": 1975, "valid_targets_mean": 4695.8, "valid_targets_min": 229 }, { "epoch": 3.1578947368421053, "grad_norm": 0.42759989366433276, "learning_rate": 2.6782241069306395e-05, "loss": 0.1835, "loss_nan_ranks": 0, "loss_rank_avg": 0.15810883045196533, "step": 1980, "valid_targets_mean": 4624.4, "valid_targets_min": 264 }, { "epoch": 3.1658692185007973, "grad_norm": 0.5668755951710633, "learning_rate": 2.6707366355717268e-05, "loss": 0.1752, "loss_nan_ranks": 0, "loss_rank_avg": 0.19498129189014435, "step": 1985, "valid_targets_mean": 3415.8, "valid_targets_min": 237 }, { "epoch": 3.1738437001594897, "grad_norm": 0.5117307401139212, "learning_rate": 2.663238557104136e-05, "loss": 0.175, "loss_nan_ranks": 0, "loss_rank_avg": 0.18552227318286896, "step": 1990, "valid_targets_mean": 5261.2, "valid_targets_min": 1556 }, { "epoch": 3.1818181818181817, "grad_norm": 0.4511472489219715, "learning_rate": 2.655729990103368e-05, "loss": 0.1814, "loss_nan_ranks": 0, "loss_rank_avg": 0.19818511605262756, "step": 1995, "valid_targets_mean": 4634.6, "valid_targets_min": 238 }, { "epoch": 3.189792663476874, "grad_norm": 0.45119915336535704, "learning_rate": 2.648211053310792e-05, "loss": 0.1748, "loss_nan_ranks": 0, "loss_rank_avg": 0.17265570163726807, "step": 2000, "valid_targets_mean": 4349.8, "valid_targets_min": 274 }, { "epoch": 3.197767145135566, "grad_norm": 0.5099187438099473, "learning_rate": 2.6406818656317654e-05, "loss": 0.176, "loss_nan_ranks": 0, "loss_rank_avg": 0.18631012737751007, "step": 2005, "valid_targets_mean": 5041.1, "valid_targets_min": 186 }, { "epoch": 3.2057416267942584, "grad_norm": 0.43152334301712886, "learning_rate": 2.6331425461337557e-05, "loss": 0.1785, "loss_nan_ranks": 0, "loss_rank_avg": 0.20323804020881653, "step": 2010, "valid_targets_mean": 5194.4, "valid_targets_min": 363 }, { "epoch": 3.2137161084529504, "grad_norm": 0.5058093159841838, "learning_rate": 2.6255932140444546e-05, "loss": 0.1807, "loss_nan_ranks": 0, "loss_rank_avg": 0.1969982385635376, "step": 2015, "valid_targets_mean": 4715.8, "valid_targets_min": 564 }, { "epoch": 3.221690590111643, "grad_norm": 0.5417933534703635, "learning_rate": 2.618033988749895e-05, "loss": 0.1774, "loss_nan_ranks": 0, "loss_rank_avg": 0.17095516622066498, "step": 2020, "valid_targets_mean": 5090.6, "valid_targets_min": 549 }, { "epoch": 3.229665071770335, "grad_norm": 0.5215923504113277, "learning_rate": 2.6104649897925622e-05, "loss": 0.1812, "loss_nan_ranks": 0, "loss_rank_avg": 0.18847623467445374, "step": 2025, "valid_targets_mean": 4847.3, "valid_targets_min": 250 }, { "epoch": 3.237639553429027, "grad_norm": 0.4854778649654015, "learning_rate": 2.602886336869503e-05, "loss": 0.1845, "loss_nan_ranks": 0, "loss_rank_avg": 0.18689140677452087, "step": 2030, "valid_targets_mean": 4723.2, "valid_targets_min": 696 }, { "epoch": 3.245614035087719, "grad_norm": 0.41371731832822933, "learning_rate": 2.595298149830433e-05, "loss": 0.1725, "loss_nan_ranks": 0, "loss_rank_avg": 0.168317049741745, "step": 2035, "valid_targets_mean": 5431.8, "valid_targets_min": 449 }, { "epoch": 3.2535885167464116, "grad_norm": 0.4766656293066071, "learning_rate": 2.5877005486758424e-05, "loss": 0.1788, "loss_nan_ranks": 0, "loss_rank_avg": 0.16988810896873474, "step": 2040, "valid_targets_mean": 4498.4, "valid_targets_min": 259 }, { "epoch": 3.2615629984051036, "grad_norm": 0.4657699021786932, "learning_rate": 2.5800936535550954e-05, "loss": 0.1811, "loss_nan_ranks": 0, "loss_rank_avg": 0.19996368885040283, "step": 2045, "valid_targets_mean": 5065.3, "valid_targets_min": 389 }, { "epoch": 3.269537480063796, "grad_norm": 0.579537992120868, "learning_rate": 2.5724775847645345e-05, "loss": 0.1866, "loss_nan_ranks": 0, "loss_rank_avg": 0.1846703290939331, "step": 2050, "valid_targets_mean": 3962.0, "valid_targets_min": 356 }, { "epoch": 3.277511961722488, "grad_norm": 0.43962432468601853, "learning_rate": 2.5648524627455738e-05, "loss": 0.1696, "loss_nan_ranks": 0, "loss_rank_avg": 0.17168590426445007, "step": 2055, "valid_targets_mean": 4880.3, "valid_targets_min": 241 }, { "epoch": 3.2854864433811803, "grad_norm": 0.43976364075492486, "learning_rate": 2.557218408082798e-05, "loss": 0.1633, "loss_nan_ranks": 0, "loss_rank_avg": 0.17411866784095764, "step": 2060, "valid_targets_mean": 5362.1, "valid_targets_min": 842 }, { "epoch": 3.2934609250398723, "grad_norm": 0.4166736194901456, "learning_rate": 2.5495755415020504e-05, "loss": 0.1835, "loss_nan_ranks": 0, "loss_rank_avg": 0.17816022038459778, "step": 2065, "valid_targets_mean": 5734.4, "valid_targets_min": 905 }, { "epoch": 3.3014354066985647, "grad_norm": 0.4697125475765612, "learning_rate": 2.5419239838685325e-05, "loss": 0.185, "loss_nan_ranks": 0, "loss_rank_avg": 0.1751966029405594, "step": 2070, "valid_targets_mean": 4562.7, "valid_targets_min": 285 }, { "epoch": 3.3094098883572567, "grad_norm": 0.4671449458327588, "learning_rate": 2.5342638561848817e-05, "loss": 0.1792, "loss_nan_ranks": 0, "loss_rank_avg": 0.16543221473693848, "step": 2075, "valid_targets_mean": 4974.4, "valid_targets_min": 226 }, { "epoch": 3.317384370015949, "grad_norm": 0.40997152428438766, "learning_rate": 2.526595279589265e-05, "loss": 0.1721, "loss_nan_ranks": 0, "loss_rank_avg": 0.1541728526353836, "step": 2080, "valid_targets_mean": 4638.1, "valid_targets_min": 226 }, { "epoch": 3.325358851674641, "grad_norm": 0.4771138092691609, "learning_rate": 2.5189183753534634e-05, "loss": 0.1837, "loss_nan_ranks": 0, "loss_rank_avg": 0.1681135892868042, "step": 2085, "valid_targets_mean": 4536.9, "valid_targets_min": 210 }, { "epoch": 3.3333333333333335, "grad_norm": 0.43928713346598164, "learning_rate": 2.5112332648809495e-05, "loss": 0.1681, "loss_nan_ranks": 0, "loss_rank_avg": 0.14815892279148102, "step": 2090, "valid_targets_mean": 5117.4, "valid_targets_min": 229 }, { "epoch": 3.3413078149920254, "grad_norm": 0.4313014172799839, "learning_rate": 2.503540069704973e-05, "loss": 0.1772, "loss_nan_ranks": 0, "loss_rank_avg": 0.17248690128326416, "step": 2095, "valid_targets_mean": 4849.8, "valid_targets_min": 241 }, { "epoch": 3.349282296650718, "grad_norm": 0.4133044248197675, "learning_rate": 2.4958389114866326e-05, "loss": 0.1712, "loss_nan_ranks": 0, "loss_rank_avg": 0.17558759450912476, "step": 2100, "valid_targets_mean": 5708.4, "valid_targets_min": 266 }, { "epoch": 3.35725677830941, "grad_norm": 0.4626815305223826, "learning_rate": 2.488129912012958e-05, "loss": 0.1806, "loss_nan_ranks": 0, "loss_rank_avg": 0.18145158886909485, "step": 2105, "valid_targets_mean": 5372.7, "valid_targets_min": 290 }, { "epoch": 3.3652312599681022, "grad_norm": 0.5376199276841933, "learning_rate": 2.4804131931949823e-05, "loss": 0.1848, "loss_nan_ranks": 0, "loss_rank_avg": 0.20464350283145905, "step": 2110, "valid_targets_mean": 3939.8, "valid_targets_min": 471 }, { "epoch": 3.373205741626794, "grad_norm": 0.39017410377798123, "learning_rate": 2.4726888770658103e-05, "loss": 0.1717, "loss_nan_ranks": 0, "loss_rank_avg": 0.16700437664985657, "step": 2115, "valid_targets_mean": 6394.6, "valid_targets_min": 239 }, { "epoch": 3.3811802232854866, "grad_norm": 0.4501347693294624, "learning_rate": 2.4649570857786928e-05, "loss": 0.1804, "loss_nan_ranks": 0, "loss_rank_avg": 0.18887585401535034, "step": 2120, "valid_targets_mean": 5312.3, "valid_targets_min": 257 }, { "epoch": 3.3891547049441786, "grad_norm": 0.3953602084293926, "learning_rate": 2.4572179416050953e-05, "loss": 0.1792, "loss_nan_ranks": 0, "loss_rank_avg": 0.16343992948532104, "step": 2125, "valid_targets_mean": 5817.3, "valid_targets_min": 243 }, { "epoch": 3.397129186602871, "grad_norm": 0.5007835737617361, "learning_rate": 2.449471566932761e-05, "loss": 0.1856, "loss_nan_ranks": 0, "loss_rank_avg": 0.17662839591503143, "step": 2130, "valid_targets_mean": 4295.5, "valid_targets_min": 226 }, { "epoch": 3.405103668261563, "grad_norm": 0.4957544588950391, "learning_rate": 2.4417180842637764e-05, "loss": 0.1749, "loss_nan_ranks": 0, "loss_rank_avg": 0.17977860569953918, "step": 2135, "valid_targets_mean": 3976.7, "valid_targets_min": 194 }, { "epoch": 3.4130781499202554, "grad_norm": 0.38831190373740015, "learning_rate": 2.4339576162126362e-05, "loss": 0.1686, "loss_nan_ranks": 0, "loss_rank_avg": 0.16816681623458862, "step": 2140, "valid_targets_mean": 5675.8, "valid_targets_min": 319 }, { "epoch": 3.4210526315789473, "grad_norm": 0.9616520701738128, "learning_rate": 2.4261902855043027e-05, "loss": 0.1753, "loss_nan_ranks": 0, "loss_rank_avg": 0.17975673079490662, "step": 2145, "valid_targets_mean": 4098.2, "valid_targets_min": 603 }, { "epoch": 3.4290271132376393, "grad_norm": 0.4782879314316972, "learning_rate": 2.418416214972265e-05, "loss": 0.186, "loss_nan_ranks": 0, "loss_rank_avg": 0.17841896414756775, "step": 2150, "valid_targets_mean": 4659.6, "valid_targets_min": 223 }, { "epoch": 3.4370015948963317, "grad_norm": 0.4811275110351178, "learning_rate": 2.4106355275565937e-05, "loss": 0.1706, "loss_nan_ranks": 0, "loss_rank_avg": 0.17591729760169983, "step": 2155, "valid_targets_mean": 4179.1, "valid_targets_min": 238 }, { "epoch": 3.444976076555024, "grad_norm": 0.3982427739209225, "learning_rate": 2.4028483463020053e-05, "loss": 0.1743, "loss_nan_ranks": 0, "loss_rank_avg": 0.15703259408473969, "step": 2160, "valid_targets_mean": 5950.8, "valid_targets_min": 3447 }, { "epoch": 3.452950558213716, "grad_norm": 0.4924681333200768, "learning_rate": 2.3950547943559056e-05, "loss": 0.1721, "loss_nan_ranks": 0, "loss_rank_avg": 0.16207414865493774, "step": 2165, "valid_targets_mean": 5059.4, "valid_targets_min": 244 }, { "epoch": 3.460925039872408, "grad_norm": 0.4085937153688259, "learning_rate": 2.3872549949664493e-05, "loss": 0.1785, "loss_nan_ranks": 0, "loss_rank_avg": 0.17049971222877502, "step": 2170, "valid_targets_mean": 5347.9, "valid_targets_min": 283 }, { "epoch": 3.4688995215311005, "grad_norm": 0.4421895807116598, "learning_rate": 2.3794490714805897e-05, "loss": 0.1826, "loss_nan_ranks": 0, "loss_rank_avg": 0.17558689415454865, "step": 2175, "valid_targets_mean": 5187.2, "valid_targets_min": 381 }, { "epoch": 3.476874003189793, "grad_norm": 0.419246164689495, "learning_rate": 2.3716371473421242e-05, "loss": 0.1803, "loss_nan_ranks": 0, "loss_rank_avg": 0.20042678713798523, "step": 2180, "valid_targets_mean": 5921.3, "valid_targets_min": 705 }, { "epoch": 3.484848484848485, "grad_norm": 0.4534306165338507, "learning_rate": 2.36381934608975e-05, "loss": 0.1808, "loss_nan_ranks": 0, "loss_rank_avg": 0.17749859392642975, "step": 2185, "valid_targets_mean": 5067.5, "valid_targets_min": 230 }, { "epoch": 3.492822966507177, "grad_norm": 0.5306038480542064, "learning_rate": 2.3559957913551014e-05, "loss": 0.1767, "loss_nan_ranks": 0, "loss_rank_avg": 0.18456803262233734, "step": 2190, "valid_targets_mean": 5680.9, "valid_targets_min": 237 }, { "epoch": 3.5007974481658692, "grad_norm": 0.49172607407811136, "learning_rate": 2.3481666068607994e-05, "loss": 0.1818, "loss_nan_ranks": 0, "loss_rank_avg": 0.1954020857810974, "step": 2195, "valid_targets_mean": 4640.9, "valid_targets_min": 357 }, { "epoch": 3.5087719298245617, "grad_norm": 0.41516895750937666, "learning_rate": 2.3403319164184986e-05, "loss": 0.1794, "loss_nan_ranks": 0, "loss_rank_avg": 0.15638519823551178, "step": 2200, "valid_targets_mean": 5532.4, "valid_targets_min": 958 }, { "epoch": 3.5167464114832536, "grad_norm": 0.4251311303323281, "learning_rate": 2.3324918439269206e-05, "loss": 0.1783, "loss_nan_ranks": 0, "loss_rank_avg": 0.1633860468864441, "step": 2205, "valid_targets_mean": 5711.6, "valid_targets_min": 3042 }, { "epoch": 3.5247208931419456, "grad_norm": 0.41401228714505406, "learning_rate": 2.3246465133699024e-05, "loss": 0.1724, "loss_nan_ranks": 0, "loss_rank_avg": 0.15223251283168793, "step": 2210, "valid_targets_mean": 5461.5, "valid_targets_min": 1728 }, { "epoch": 3.532695374800638, "grad_norm": 0.43338985811687897, "learning_rate": 2.31679604881443e-05, "loss": 0.1881, "loss_nan_ranks": 0, "loss_rank_avg": 0.23456290364265442, "step": 2215, "valid_targets_mean": 6196.2, "valid_targets_min": 234 }, { "epoch": 3.5406698564593304, "grad_norm": 0.4391172774731024, "learning_rate": 2.3089405744086823e-05, "loss": 0.1807, "loss_nan_ranks": 0, "loss_rank_avg": 0.16365471482276917, "step": 2220, "valid_targets_mean": 4690.2, "valid_targets_min": 237 }, { "epoch": 3.5486443381180224, "grad_norm": 0.41279470884015235, "learning_rate": 2.3010802143800626e-05, "loss": 0.1673, "loss_nan_ranks": 0, "loss_rank_avg": 0.17660290002822876, "step": 2225, "valid_targets_mean": 5499.1, "valid_targets_min": 255 }, { "epoch": 3.5566188197767143, "grad_norm": 0.4616887719700764, "learning_rate": 2.2932150930332363e-05, "loss": 0.1808, "loss_nan_ranks": 0, "loss_rank_avg": 0.1628832221031189, "step": 2230, "valid_targets_mean": 4519.4, "valid_targets_min": 236 }, { "epoch": 3.5645933014354068, "grad_norm": 0.4143421206391745, "learning_rate": 2.2853453347481635e-05, "loss": 0.1806, "loss_nan_ranks": 0, "loss_rank_avg": 0.17244276404380798, "step": 2235, "valid_targets_mean": 5402.8, "valid_targets_min": 227 }, { "epoch": 3.5725677830940987, "grad_norm": 0.4491746905194006, "learning_rate": 2.277471063978137e-05, "loss": 0.1872, "loss_nan_ranks": 0, "loss_rank_avg": 0.15876632928848267, "step": 2240, "valid_targets_mean": 4808.6, "valid_targets_min": 231 }, { "epoch": 3.580542264752791, "grad_norm": 0.5060019043175118, "learning_rate": 2.2695924052478065e-05, "loss": 0.1723, "loss_nan_ranks": 0, "loss_rank_avg": 0.17421862483024597, "step": 2245, "valid_targets_mean": 4258.2, "valid_targets_min": 260 }, { "epoch": 3.588516746411483, "grad_norm": 0.41387766339051296, "learning_rate": 2.2617094831512167e-05, "loss": 0.1765, "loss_nan_ranks": 0, "loss_rank_avg": 0.17327752709388733, "step": 2250, "valid_targets_mean": 6265.3, "valid_targets_min": 2950 }, { "epoch": 3.5964912280701755, "grad_norm": 0.4611729813954408, "learning_rate": 2.253822422349831e-05, "loss": 0.1805, "loss_nan_ranks": 0, "loss_rank_avg": 0.1817869246006012, "step": 2255, "valid_targets_mean": 4701.2, "valid_targets_min": 397 }, { "epoch": 3.6044657097288675, "grad_norm": 0.43026115082741934, "learning_rate": 2.2459313475705645e-05, "loss": 0.1748, "loss_nan_ranks": 0, "loss_rank_avg": 0.1769014596939087, "step": 2260, "valid_targets_mean": 5325.2, "valid_targets_min": 205 }, { "epoch": 3.61244019138756, "grad_norm": 0.5249375671075871, "learning_rate": 2.23803638360381e-05, "loss": 0.1838, "loss_nan_ranks": 0, "loss_rank_avg": 0.18358995020389557, "step": 2265, "valid_targets_mean": 3656.4, "valid_targets_min": 199 }, { "epoch": 3.620414673046252, "grad_norm": 0.4541299825413091, "learning_rate": 2.2301376553014625e-05, "loss": 0.1812, "loss_nan_ranks": 0, "loss_rank_avg": 0.1612316220998764, "step": 2270, "valid_targets_mean": 4446.9, "valid_targets_min": 245 }, { "epoch": 3.6283891547049443, "grad_norm": 0.5119351564216902, "learning_rate": 2.2222352875749493e-05, "loss": 0.1797, "loss_nan_ranks": 0, "loss_rank_avg": 0.19726499915122986, "step": 2275, "valid_targets_mean": 5226.8, "valid_targets_min": 395 }, { "epoch": 3.6363636363636362, "grad_norm": 0.4597152452341196, "learning_rate": 2.214329405393249e-05, "loss": 0.1721, "loss_nan_ranks": 0, "loss_rank_avg": 0.1666208803653717, "step": 2280, "valid_targets_mean": 4824.7, "valid_targets_min": 1500 }, { "epoch": 3.6443381180223287, "grad_norm": 0.41930922950793337, "learning_rate": 2.2064201337809212e-05, "loss": 0.1704, "loss_nan_ranks": 0, "loss_rank_avg": 0.17563220858573914, "step": 2285, "valid_targets_mean": 5103.7, "valid_targets_min": 2380 }, { "epoch": 3.6523125996810206, "grad_norm": 0.551536941032092, "learning_rate": 2.1985075978161236e-05, "loss": 0.1731, "loss_nan_ranks": 0, "loss_rank_avg": 0.1810903698205948, "step": 2290, "valid_targets_mean": 4225.5, "valid_targets_min": 238 }, { "epoch": 3.660287081339713, "grad_norm": 0.46416383882322815, "learning_rate": 2.1905919226286385e-05, "loss": 0.1836, "loss_nan_ranks": 0, "loss_rank_avg": 0.1780536025762558, "step": 2295, "valid_targets_mean": 4323.2, "valid_targets_min": 349 }, { "epoch": 3.668261562998405, "grad_norm": 0.4379742235735547, "learning_rate": 2.1826732333978924e-05, "loss": 0.1733, "loss_nan_ranks": 0, "loss_rank_avg": 0.1874227225780487, "step": 2300, "valid_targets_mean": 4977.4, "valid_targets_min": 236 }, { "epoch": 3.6762360446570974, "grad_norm": 0.4619563699283561, "learning_rate": 2.1747516553509755e-05, "loss": 0.183, "loss_nan_ranks": 0, "loss_rank_avg": 0.17133791744709015, "step": 2305, "valid_targets_mean": 4711.6, "valid_targets_min": 245 }, { "epoch": 3.6842105263157894, "grad_norm": 0.489064170185469, "learning_rate": 2.166827313760662e-05, "loss": 0.1765, "loss_nan_ranks": 0, "loss_rank_avg": 0.1689237505197525, "step": 2310, "valid_targets_mean": 4220.6, "valid_targets_min": 358 }, { "epoch": 3.692185007974482, "grad_norm": 0.44106248237446816, "learning_rate": 2.1589003339434292e-05, "loss": 0.1692, "loss_nan_ranks": 0, "loss_rank_avg": 0.1686490774154663, "step": 2315, "valid_targets_mean": 4874.4, "valid_targets_min": 216 }, { "epoch": 3.7001594896331738, "grad_norm": 0.44652285565230415, "learning_rate": 2.150970841257476e-05, "loss": 0.1722, "loss_nan_ranks": 0, "loss_rank_avg": 0.18092358112335205, "step": 2320, "valid_targets_mean": 4935.1, "valid_targets_min": 242 }, { "epoch": 3.708133971291866, "grad_norm": 0.41008613997039367, "learning_rate": 2.1430389611007393e-05, "loss": 0.1727, "loss_nan_ranks": 0, "loss_rank_avg": 0.1724787950515747, "step": 2325, "valid_targets_mean": 5347.4, "valid_targets_min": 306 }, { "epoch": 3.716108452950558, "grad_norm": 0.4552446615706991, "learning_rate": 2.135104818908913e-05, "loss": 0.1812, "loss_nan_ranks": 0, "loss_rank_avg": 0.17449814081192017, "step": 2330, "valid_targets_mean": 5358.0, "valid_targets_min": 258 }, { "epoch": 3.7240829346092506, "grad_norm": 0.5705362385621706, "learning_rate": 2.1271685401534617e-05, "loss": 0.1702, "loss_nan_ranks": 0, "loss_rank_avg": 0.17245930433273315, "step": 2335, "valid_targets_mean": 5281.9, "valid_targets_min": 252 }, { "epoch": 3.7320574162679425, "grad_norm": 0.45629997713629283, "learning_rate": 2.11923025033964e-05, "loss": 0.1787, "loss_nan_ranks": 0, "loss_rank_avg": 0.18641863763332367, "step": 2340, "valid_targets_mean": 4875.7, "valid_targets_min": 244 }, { "epoch": 3.740031897926635, "grad_norm": 0.5004011387408458, "learning_rate": 2.111290075004503e-05, "loss": 0.1702, "loss_nan_ranks": 0, "loss_rank_avg": 0.1716715544462204, "step": 2345, "valid_targets_mean": 3934.6, "valid_targets_min": 242 }, { "epoch": 3.748006379585327, "grad_norm": 0.46246492036373593, "learning_rate": 2.103348139714925e-05, "loss": 0.1797, "loss_nan_ranks": 0, "loss_rank_avg": 0.1724526733160019, "step": 2350, "valid_targets_mean": 4492.5, "valid_targets_min": 238 }, { "epoch": 3.7559808612440193, "grad_norm": 0.5448173548752107, "learning_rate": 2.0954045700656126e-05, "loss": 0.1844, "loss_nan_ranks": 0, "loss_rank_avg": 0.17832358181476593, "step": 2355, "valid_targets_mean": 3425.9, "valid_targets_min": 205 }, { "epoch": 3.7639553429027113, "grad_norm": 0.5015418002105231, "learning_rate": 2.0874594916771174e-05, "loss": 0.1756, "loss_nan_ranks": 0, "loss_rank_avg": 0.18966464698314667, "step": 2360, "valid_targets_mean": 4649.9, "valid_targets_min": 428 }, { "epoch": 3.7719298245614032, "grad_norm": 0.4569286157077601, "learning_rate": 2.079513030193852e-05, "loss": 0.176, "loss_nan_ranks": 0, "loss_rank_avg": 0.15085861086845398, "step": 2365, "valid_targets_mean": 4497.1, "valid_targets_min": 650 }, { "epoch": 3.7799043062200957, "grad_norm": 0.5131210924769427, "learning_rate": 2.071565311282099e-05, "loss": 0.1745, "loss_nan_ranks": 0, "loss_rank_avg": 0.16978487372398376, "step": 2370, "valid_targets_mean": 3804.6, "valid_targets_min": 255 }, { "epoch": 3.787878787878788, "grad_norm": 0.4053676310724288, "learning_rate": 2.063616460628029e-05, "loss": 0.1798, "loss_nan_ranks": 0, "loss_rank_avg": 0.1770038604736328, "step": 2375, "valid_targets_mean": 5768.6, "valid_targets_min": 227 }, { "epoch": 3.79585326953748, "grad_norm": 0.4533781362163844, "learning_rate": 2.0556666039357084e-05, "loss": 0.1764, "loss_nan_ranks": 0, "loss_rank_avg": 0.17858347296714783, "step": 2380, "valid_targets_mean": 5566.5, "valid_targets_min": 252 }, { "epoch": 3.803827751196172, "grad_norm": 0.4188217594597362, "learning_rate": 2.047715866925113e-05, "loss": 0.1786, "loss_nan_ranks": 0, "loss_rank_avg": 0.18884845077991486, "step": 2385, "valid_targets_mean": 5425.9, "valid_targets_min": 259 }, { "epoch": 3.8118022328548644, "grad_norm": 0.4764124493876062, "learning_rate": 2.0397643753301403e-05, "loss": 0.1749, "loss_nan_ranks": 0, "loss_rank_avg": 0.16345086693763733, "step": 2390, "valid_targets_mean": 5698.1, "valid_targets_min": 286 }, { "epoch": 3.819776714513557, "grad_norm": 0.48932350458239837, "learning_rate": 2.0318122548966225e-05, "loss": 0.1733, "loss_nan_ranks": 0, "loss_rank_avg": 0.17059862613677979, "step": 2395, "valid_targets_mean": 4492.2, "valid_targets_min": 427 }, { "epoch": 3.827751196172249, "grad_norm": 0.4210708424627556, "learning_rate": 2.0238596313803337e-05, "loss": 0.1834, "loss_nan_ranks": 0, "loss_rank_avg": 0.16127406060695648, "step": 2400, "valid_targets_mean": 6233.4, "valid_targets_min": 4329 }, { "epoch": 3.8357256778309408, "grad_norm": 0.46048380449758947, "learning_rate": 2.015906630545005e-05, "loss": 0.1731, "loss_nan_ranks": 0, "loss_rank_avg": 0.19462665915489197, "step": 2405, "valid_targets_mean": 4631.4, "valid_targets_min": 409 }, { "epoch": 3.843700159489633, "grad_norm": 0.42862173152229316, "learning_rate": 2.0079533781603352e-05, "loss": 0.1756, "loss_nan_ranks": 0, "loss_rank_avg": 0.18994180858135223, "step": 2410, "valid_targets_mean": 4918.5, "valid_targets_min": 332 }, { "epoch": 3.8516746411483256, "grad_norm": 0.5010059874905928, "learning_rate": 2e-05, "loss": 0.1844, "loss_nan_ranks": 0, "loss_rank_avg": 0.20106858015060425, "step": 2415, "valid_targets_mean": 4281.1, "valid_targets_min": 262 }, { "epoch": 3.8596491228070176, "grad_norm": 0.4072491507266973, "learning_rate": 1.9920466218396655e-05, "loss": 0.1761, "loss_nan_ranks": 0, "loss_rank_avg": 0.16354908049106598, "step": 2420, "valid_targets_mean": 4883.2, "valid_targets_min": 245 }, { "epoch": 3.8676236044657095, "grad_norm": 0.4810942686183941, "learning_rate": 1.9840933694549956e-05, "loss": 0.1837, "loss_nan_ranks": 0, "loss_rank_avg": 0.18778419494628906, "step": 2425, "valid_targets_mean": 4466.9, "valid_targets_min": 240 }, { "epoch": 3.875598086124402, "grad_norm": 0.4057684960139382, "learning_rate": 1.976140368619667e-05, "loss": 0.1713, "loss_nan_ranks": 0, "loss_rank_avg": 0.1536000519990921, "step": 2430, "valid_targets_mean": 5985.8, "valid_targets_min": 244 }, { "epoch": 3.8835725677830943, "grad_norm": 0.4211890086346668, "learning_rate": 1.9681877451033778e-05, "loss": 0.1789, "loss_nan_ranks": 0, "loss_rank_avg": 0.17464828491210938, "step": 2435, "valid_targets_mean": 5423.5, "valid_targets_min": 373 }, { "epoch": 3.8915470494417863, "grad_norm": 0.47758132116301366, "learning_rate": 1.9602356246698597e-05, "loss": 0.1881, "loss_nan_ranks": 0, "loss_rank_avg": 0.19579948484897614, "step": 2440, "valid_targets_mean": 4473.9, "valid_targets_min": 211 }, { "epoch": 3.8995215311004783, "grad_norm": 0.43785459648367925, "learning_rate": 1.9522841330748877e-05, "loss": 0.1714, "loss_nan_ranks": 0, "loss_rank_avg": 0.16913919150829315, "step": 2445, "valid_targets_mean": 5518.2, "valid_targets_min": 876 }, { "epoch": 3.9074960127591707, "grad_norm": 0.4718315228758523, "learning_rate": 1.944333396064292e-05, "loss": 0.1763, "loss_nan_ranks": 0, "loss_rank_avg": 0.16812896728515625, "step": 2450, "valid_targets_mean": 4544.7, "valid_targets_min": 228 }, { "epoch": 3.915470494417863, "grad_norm": 0.41246881276557107, "learning_rate": 1.936383539371971e-05, "loss": 0.1774, "loss_nan_ranks": 0, "loss_rank_avg": 0.186811625957489, "step": 2455, "valid_targets_mean": 5773.6, "valid_targets_min": 244 }, { "epoch": 3.923444976076555, "grad_norm": 0.4236112780842354, "learning_rate": 1.9284346887179016e-05, "loss": 0.1748, "loss_nan_ranks": 0, "loss_rank_avg": 0.1823834776878357, "step": 2460, "valid_targets_mean": 5392.7, "valid_targets_min": 269 }, { "epoch": 3.931419457735247, "grad_norm": 0.48575329642988746, "learning_rate": 1.9204869698061493e-05, "loss": 0.1741, "loss_nan_ranks": 0, "loss_rank_avg": 0.17913323640823364, "step": 2465, "valid_targets_mean": 4545.8, "valid_targets_min": 189 }, { "epoch": 3.9393939393939394, "grad_norm": 0.4391863078677367, "learning_rate": 1.9125405083228833e-05, "loss": 0.1893, "loss_nan_ranks": 0, "loss_rank_avg": 0.18172624707221985, "step": 2470, "valid_targets_mean": 5295.9, "valid_targets_min": 250 }, { "epoch": 3.9473684210526314, "grad_norm": 0.43686870532771416, "learning_rate": 1.9045954299343884e-05, "loss": 0.1892, "loss_nan_ranks": 0, "loss_rank_avg": 0.18156322836875916, "step": 2475, "valid_targets_mean": 5534.2, "valid_targets_min": 735 }, { "epoch": 3.955342902711324, "grad_norm": 0.4410672277323973, "learning_rate": 1.896651860285076e-05, "loss": 0.1782, "loss_nan_ranks": 0, "loss_rank_avg": 0.16273203492164612, "step": 2480, "valid_targets_mean": 5046.9, "valid_targets_min": 244 }, { "epoch": 3.963317384370016, "grad_norm": 0.4379301215701126, "learning_rate": 1.8887099249954976e-05, "loss": 0.1868, "loss_nan_ranks": 0, "loss_rank_avg": 0.18227660655975342, "step": 2485, "valid_targets_mean": 5287.8, "valid_targets_min": 1155 }, { "epoch": 3.971291866028708, "grad_norm": 0.41662085884964606, "learning_rate": 1.8807697496603604e-05, "loss": 0.171, "loss_nan_ranks": 0, "loss_rank_avg": 0.1678864061832428, "step": 2490, "valid_targets_mean": 5324.2, "valid_targets_min": 445 }, { "epoch": 3.9792663476874, "grad_norm": 0.4373979648967585, "learning_rate": 1.8728314598465386e-05, "loss": 0.1731, "loss_nan_ranks": 0, "loss_rank_avg": 0.18611688911914825, "step": 2495, "valid_targets_mean": 5373.3, "valid_targets_min": 382 }, { "epoch": 3.9872408293460926, "grad_norm": 0.457053493882227, "learning_rate": 1.8648951810910878e-05, "loss": 0.1798, "loss_nan_ranks": 0, "loss_rank_avg": 0.1983267068862915, "step": 2500, "valid_targets_mean": 5981.6, "valid_targets_min": 342 }, { "epoch": 3.9952153110047846, "grad_norm": 0.43207203226320035, "learning_rate": 1.856961038899261e-05, "loss": 0.1737, "loss_nan_ranks": 0, "loss_rank_avg": 0.1594964861869812, "step": 2505, "valid_targets_mean": 4767.2, "valid_targets_min": 248 }, { "epoch": 4.003189792663477, "grad_norm": 0.44162771304729975, "learning_rate": 1.849029158742525e-05, "loss": 0.1662, "loss_nan_ranks": 0, "loss_rank_avg": 0.17399078607559204, "step": 2510, "valid_targets_mean": 4869.1, "valid_targets_min": 259 }, { "epoch": 4.011164274322169, "grad_norm": 0.4100149325744668, "learning_rate": 1.8410996660565714e-05, "loss": 0.167, "loss_nan_ranks": 0, "loss_rank_avg": 0.16074588894844055, "step": 2515, "valid_targets_mean": 5768.7, "valid_targets_min": 495 }, { "epoch": 4.019138755980861, "grad_norm": 0.4871133329160863, "learning_rate": 1.8331726862393385e-05, "loss": 0.1723, "loss_nan_ranks": 0, "loss_rank_avg": 0.16799892485141754, "step": 2520, "valid_targets_mean": 5172.4, "valid_targets_min": 980 }, { "epoch": 4.027113237639553, "grad_norm": 0.46342804287893813, "learning_rate": 1.8252483446490245e-05, "loss": 0.1701, "loss_nan_ranks": 0, "loss_rank_avg": 0.1649300903081894, "step": 2525, "valid_targets_mean": 5258.1, "valid_targets_min": 226 }, { "epoch": 4.035087719298246, "grad_norm": 0.4888182281978054, "learning_rate": 1.8173267666021075e-05, "loss": 0.1685, "loss_nan_ranks": 0, "loss_rank_avg": 0.13286834955215454, "step": 2530, "valid_targets_mean": 3738.4, "valid_targets_min": 225 }, { "epoch": 4.043062200956938, "grad_norm": 0.439511550487397, "learning_rate": 1.8094080773713615e-05, "loss": 0.1647, "loss_nan_ranks": 0, "loss_rank_avg": 0.16421306133270264, "step": 2535, "valid_targets_mean": 5328.5, "valid_targets_min": 248 }, { "epoch": 4.05103668261563, "grad_norm": 0.39916496188969774, "learning_rate": 1.8014924021838774e-05, "loss": 0.1624, "loss_nan_ranks": 0, "loss_rank_avg": 0.19473597407341003, "step": 2540, "valid_targets_mean": 6501.2, "valid_targets_min": 798 }, { "epoch": 4.059011164274322, "grad_norm": 0.45532784154246636, "learning_rate": 1.7935798662190798e-05, "loss": 0.1671, "loss_nan_ranks": 0, "loss_rank_avg": 0.18312832713127136, "step": 2545, "valid_targets_mean": 5164.4, "valid_targets_min": 1592 }, { "epoch": 4.0669856459330145, "grad_norm": 0.39457706368906487, "learning_rate": 1.785670594606752e-05, "loss": 0.1632, "loss_nan_ranks": 0, "loss_rank_avg": 0.14157655835151672, "step": 2550, "valid_targets_mean": 5789.8, "valid_targets_min": 241 }, { "epoch": 4.074960127591707, "grad_norm": 0.44152278033105163, "learning_rate": 1.777764712425052e-05, "loss": 0.1627, "loss_nan_ranks": 0, "loss_rank_avg": 0.16815263032913208, "step": 2555, "valid_targets_mean": 5426.9, "valid_targets_min": 362 }, { "epoch": 4.082934609250398, "grad_norm": 0.4297478681585869, "learning_rate": 1.7698623446985378e-05, "loss": 0.1646, "loss_nan_ranks": 0, "loss_rank_avg": 0.1471405178308487, "step": 2560, "valid_targets_mean": 5570.6, "valid_targets_min": 221 }, { "epoch": 4.090909090909091, "grad_norm": 0.443891814693673, "learning_rate": 1.7619636163961907e-05, "loss": 0.162, "loss_nan_ranks": 0, "loss_rank_avg": 0.15766510367393494, "step": 2565, "valid_targets_mean": 5007.6, "valid_targets_min": 243 }, { "epoch": 4.098883572567783, "grad_norm": 0.6970765377465047, "learning_rate": 1.754068652429436e-05, "loss": 0.1604, "loss_nan_ranks": 0, "loss_rank_avg": 0.15241992473602295, "step": 2570, "valid_targets_mean": 4964.9, "valid_targets_min": 257 }, { "epoch": 4.106858054226476, "grad_norm": 0.5016042784027481, "learning_rate": 1.74617757765017e-05, "loss": 0.1696, "loss_nan_ranks": 0, "loss_rank_avg": 0.15563294291496277, "step": 2575, "valid_targets_mean": 4340.1, "valid_targets_min": 200 }, { "epoch": 4.114832535885167, "grad_norm": 0.4424438379039299, "learning_rate": 1.738290516848784e-05, "loss": 0.1683, "loss_nan_ranks": 0, "loss_rank_avg": 0.17813259363174438, "step": 2580, "valid_targets_mean": 5369.1, "valid_targets_min": 251 }, { "epoch": 4.12280701754386, "grad_norm": 0.45797415814975423, "learning_rate": 1.730407594752194e-05, "loss": 0.1627, "loss_nan_ranks": 0, "loss_rank_avg": 0.16528105735778809, "step": 2585, "valid_targets_mean": 5390.3, "valid_targets_min": 269 }, { "epoch": 4.130781499202552, "grad_norm": 0.5111816555204367, "learning_rate": 1.722528936021864e-05, "loss": 0.165, "loss_nan_ranks": 0, "loss_rank_avg": 0.1601203978061676, "step": 2590, "valid_targets_mean": 3531.6, "valid_targets_min": 315 }, { "epoch": 4.138755980861244, "grad_norm": 0.3767954932539586, "learning_rate": 1.714654665251837e-05, "loss": 0.1704, "loss_nan_ranks": 0, "loss_rank_avg": 0.1518028825521469, "step": 2595, "valid_targets_mean": 6542.2, "valid_targets_min": 1157 }, { "epoch": 4.146730462519936, "grad_norm": 0.46197127874950683, "learning_rate": 1.7067849069667644e-05, "loss": 0.1679, "loss_nan_ranks": 0, "loss_rank_avg": 0.1635223627090454, "step": 2600, "valid_targets_mean": 4890.6, "valid_targets_min": 538 }, { "epoch": 4.154704944178628, "grad_norm": 0.590965129504492, "learning_rate": 1.6989197856199377e-05, "loss": 0.1627, "loss_nan_ranks": 0, "loss_rank_avg": 0.14913973212242126, "step": 2605, "valid_targets_mean": 5326.4, "valid_targets_min": 255 }, { "epoch": 4.162679425837321, "grad_norm": 0.4398420111040478, "learning_rate": 1.6910594255913177e-05, "loss": 0.1611, "loss_nan_ranks": 0, "loss_rank_avg": 0.16554518043994904, "step": 2610, "valid_targets_mean": 5232.0, "valid_targets_min": 911 }, { "epoch": 4.170653907496013, "grad_norm": 1.2896108249705025, "learning_rate": 1.6832039511855702e-05, "loss": 0.1641, "loss_nan_ranks": 0, "loss_rank_avg": 0.1797063648700714, "step": 2615, "valid_targets_mean": 4964.2, "valid_targets_min": 252 }, { "epoch": 4.178628389154705, "grad_norm": 0.4916215767968524, "learning_rate": 1.6753534866300983e-05, "loss": 0.1618, "loss_nan_ranks": 0, "loss_rank_avg": 0.162457674741745, "step": 2620, "valid_targets_mean": 4723.4, "valid_targets_min": 525 }, { "epoch": 4.186602870813397, "grad_norm": 0.436093385151016, "learning_rate": 1.6675081560730804e-05, "loss": 0.1672, "loss_nan_ranks": 0, "loss_rank_avg": 0.1415684074163437, "step": 2625, "valid_targets_mean": 4707.8, "valid_targets_min": 245 }, { "epoch": 4.1945773524720895, "grad_norm": 0.3767766840818539, "learning_rate": 1.6596680835815024e-05, "loss": 0.1628, "loss_nan_ranks": 0, "loss_rank_avg": 0.15540149807929993, "step": 2630, "valid_targets_mean": 7057.1, "valid_targets_min": 4854 }, { "epoch": 4.202551834130782, "grad_norm": 0.5066458024848639, "learning_rate": 1.651833393139201e-05, "loss": 0.1641, "loss_nan_ranks": 0, "loss_rank_avg": 0.16125883162021637, "step": 2635, "valid_targets_mean": 3526.9, "valid_targets_min": 238 }, { "epoch": 4.2105263157894735, "grad_norm": 0.4523713268939122, "learning_rate": 1.6440042086449e-05, "loss": 0.169, "loss_nan_ranks": 0, "loss_rank_avg": 0.16887378692626953, "step": 2640, "valid_targets_mean": 5442.1, "valid_targets_min": 1251 }, { "epoch": 4.218500797448166, "grad_norm": 0.4669348386422092, "learning_rate": 1.6361806539102508e-05, "loss": 0.1691, "loss_nan_ranks": 0, "loss_rank_avg": 0.16306337714195251, "step": 2645, "valid_targets_mean": 5191.7, "valid_targets_min": 232 }, { "epoch": 4.226475279106858, "grad_norm": 0.44072670778662126, "learning_rate": 1.628362852657876e-05, "loss": 0.1595, "loss_nan_ranks": 0, "loss_rank_avg": 0.1595107614994049, "step": 2650, "valid_targets_mean": 5289.1, "valid_targets_min": 377 }, { "epoch": 4.23444976076555, "grad_norm": 0.4181461806366608, "learning_rate": 1.620550928519411e-05, "loss": 0.1577, "loss_nan_ranks": 0, "loss_rank_avg": 0.15849584341049194, "step": 2655, "valid_targets_mean": 4996.6, "valid_targets_min": 378 }, { "epoch": 4.242424242424242, "grad_norm": 0.43195277822271283, "learning_rate": 1.612745005033551e-05, "loss": 0.1672, "loss_nan_ranks": 0, "loss_rank_avg": 0.16953721642494202, "step": 2660, "valid_targets_mean": 5369.8, "valid_targets_min": 243 }, { "epoch": 4.250398724082935, "grad_norm": 0.41229933540536656, "learning_rate": 1.6049452056440948e-05, "loss": 0.1676, "loss_nan_ranks": 0, "loss_rank_avg": 0.17528899013996124, "step": 2665, "valid_targets_mean": 6492.4, "valid_targets_min": 3730 }, { "epoch": 4.258373205741627, "grad_norm": 0.4711001749394507, "learning_rate": 1.597151653697995e-05, "loss": 0.16, "loss_nan_ranks": 0, "loss_rank_avg": 0.156410813331604, "step": 2670, "valid_targets_mean": 4710.2, "valid_targets_min": 329 }, { "epoch": 4.266347687400319, "grad_norm": 0.42542209328206093, "learning_rate": 1.5893644724434066e-05, "loss": 0.1637, "loss_nan_ranks": 0, "loss_rank_avg": 0.16571450233459473, "step": 2675, "valid_targets_mean": 5378.8, "valid_targets_min": 393 }, { "epoch": 4.274322169059011, "grad_norm": 0.6303378780815382, "learning_rate": 1.581583785027736e-05, "loss": 0.1649, "loss_nan_ranks": 0, "loss_rank_avg": 0.1706840693950653, "step": 2680, "valid_targets_mean": 4807.1, "valid_targets_min": 235 }, { "epoch": 4.282296650717703, "grad_norm": 0.48966028379629584, "learning_rate": 1.5738097144956976e-05, "loss": 0.1607, "loss_nan_ranks": 0, "loss_rank_avg": 0.15253716707229614, "step": 2685, "valid_targets_mean": 4374.9, "valid_targets_min": 287 }, { "epoch": 4.290271132376396, "grad_norm": 0.41033469363863073, "learning_rate": 1.566042383787364e-05, "loss": 0.1665, "loss_nan_ranks": 0, "loss_rank_avg": 0.15829625725746155, "step": 2690, "valid_targets_mean": 6175.6, "valid_targets_min": 224 }, { "epoch": 4.298245614035087, "grad_norm": 0.40731073913252946, "learning_rate": 1.558281915736224e-05, "loss": 0.1582, "loss_nan_ranks": 0, "loss_rank_avg": 0.14746209979057312, "step": 2695, "valid_targets_mean": 5612.4, "valid_targets_min": 245 }, { "epoch": 4.30622009569378, "grad_norm": 0.5078322157963522, "learning_rate": 1.550528433067239e-05, "loss": 0.1662, "loss_nan_ranks": 0, "loss_rank_avg": 0.16952064633369446, "step": 2700, "valid_targets_mean": 5778.9, "valid_targets_min": 878 }, { "epoch": 4.314194577352472, "grad_norm": 0.5507289227344653, "learning_rate": 1.5427820583949054e-05, "loss": 0.157, "loss_nan_ranks": 0, "loss_rank_avg": 0.15994137525558472, "step": 2705, "valid_targets_mean": 4218.4, "valid_targets_min": 239 }, { "epoch": 4.3221690590111645, "grad_norm": 0.408459346880975, "learning_rate": 1.5350429142213075e-05, "loss": 0.1572, "loss_nan_ranks": 0, "loss_rank_avg": 0.14765138924121857, "step": 2710, "valid_targets_mean": 5390.0, "valid_targets_min": 272 }, { "epoch": 4.330143540669856, "grad_norm": 0.4621251709763953, "learning_rate": 1.5273111229341907e-05, "loss": 0.1633, "loss_nan_ranks": 0, "loss_rank_avg": 0.16809380054473877, "step": 2715, "valid_targets_mean": 4960.4, "valid_targets_min": 251 }, { "epoch": 4.3381180223285485, "grad_norm": 0.4859821294927119, "learning_rate": 1.5195868068050185e-05, "loss": 0.1654, "loss_nan_ranks": 0, "loss_rank_avg": 0.15256614983081818, "step": 2720, "valid_targets_mean": 4789.8, "valid_targets_min": 265 }, { "epoch": 4.346092503987241, "grad_norm": 0.44208802195312985, "learning_rate": 1.5118700879870426e-05, "loss": 0.1698, "loss_nan_ranks": 0, "loss_rank_avg": 0.16697990894317627, "step": 2725, "valid_targets_mean": 5019.8, "valid_targets_min": 227 }, { "epoch": 4.354066985645933, "grad_norm": 0.39327145737658015, "learning_rate": 1.5041610885133681e-05, "loss": 0.1671, "loss_nan_ranks": 0, "loss_rank_avg": 0.17563647031784058, "step": 2730, "valid_targets_mean": 6262.4, "valid_targets_min": 4299 }, { "epoch": 4.362041467304625, "grad_norm": 0.5020697131026288, "learning_rate": 1.496459930295028e-05, "loss": 0.1608, "loss_nan_ranks": 0, "loss_rank_avg": 0.158511221408844, "step": 2735, "valid_targets_mean": 5749.7, "valid_targets_min": 347 }, { "epoch": 4.370015948963317, "grad_norm": 0.435040583369635, "learning_rate": 1.4887667351190508e-05, "loss": 0.1564, "loss_nan_ranks": 0, "loss_rank_avg": 0.15348437428474426, "step": 2740, "valid_targets_mean": 5452.8, "valid_targets_min": 866 }, { "epoch": 4.37799043062201, "grad_norm": 0.4713309684053475, "learning_rate": 1.4810816246465374e-05, "loss": 0.1678, "loss_nan_ranks": 0, "loss_rank_avg": 0.18029925227165222, "step": 2745, "valid_targets_mean": 4950.2, "valid_targets_min": 238 }, { "epoch": 4.385964912280702, "grad_norm": 0.4989171949325947, "learning_rate": 1.4734047204107358e-05, "loss": 0.1574, "loss_nan_ranks": 0, "loss_rank_avg": 0.162031888961792, "step": 2750, "valid_targets_mean": 5264.2, "valid_targets_min": 797 }, { "epoch": 4.393939393939394, "grad_norm": 0.4481729316372481, "learning_rate": 1.4657361438151192e-05, "loss": 0.156, "loss_nan_ranks": 0, "loss_rank_avg": 0.17081616818904877, "step": 2755, "valid_targets_mean": 4965.4, "valid_targets_min": 281 }, { "epoch": 4.401913875598086, "grad_norm": 0.5035101448803713, "learning_rate": 1.458076016131468e-05, "loss": 0.1644, "loss_nan_ranks": 0, "loss_rank_avg": 0.17901387810707092, "step": 2760, "valid_targets_mean": 4425.4, "valid_targets_min": 230 }, { "epoch": 4.409888357256778, "grad_norm": 0.439004055065166, "learning_rate": 1.4504244584979494e-05, "loss": 0.1681, "loss_nan_ranks": 0, "loss_rank_avg": 0.1770099699497223, "step": 2765, "valid_targets_mean": 5970.6, "valid_targets_min": 280 }, { "epoch": 4.417862838915471, "grad_norm": 0.4559810410634476, "learning_rate": 1.442781591917203e-05, "loss": 0.1709, "loss_nan_ranks": 0, "loss_rank_avg": 0.16673271358013153, "step": 2770, "valid_targets_mean": 5037.8, "valid_targets_min": 342 }, { "epoch": 4.425837320574162, "grad_norm": 0.49141320176391684, "learning_rate": 1.4351475372544262e-05, "loss": 0.177, "loss_nan_ranks": 0, "loss_rank_avg": 0.17553502321243286, "step": 2775, "valid_targets_mean": 5215.1, "valid_targets_min": 241 }, { "epoch": 4.433811802232855, "grad_norm": 0.4548580416328493, "learning_rate": 1.4275224152354658e-05, "loss": 0.1599, "loss_nan_ranks": 0, "loss_rank_avg": 0.15424610674381256, "step": 2780, "valid_targets_mean": 5256.7, "valid_targets_min": 227 }, { "epoch": 4.441786283891547, "grad_norm": 0.43788067033156486, "learning_rate": 1.4199063464449047e-05, "loss": 0.1635, "loss_nan_ranks": 0, "loss_rank_avg": 0.14916040003299713, "step": 2785, "valid_targets_mean": 5186.2, "valid_targets_min": 530 }, { "epoch": 4.44976076555024, "grad_norm": 0.4517238770171476, "learning_rate": 1.4122994513241587e-05, "loss": 0.1634, "loss_nan_ranks": 0, "loss_rank_avg": 0.15957307815551758, "step": 2790, "valid_targets_mean": 4431.6, "valid_targets_min": 311 }, { "epoch": 4.457735247208931, "grad_norm": 0.4470813659837837, "learning_rate": 1.4047018501695677e-05, "loss": 0.1679, "loss_nan_ranks": 0, "loss_rank_avg": 0.16156211495399475, "step": 2795, "valid_targets_mean": 4721.2, "valid_targets_min": 361 }, { "epoch": 4.4657097288676235, "grad_norm": 0.48463023071484423, "learning_rate": 1.3971136631304978e-05, "loss": 0.1736, "loss_nan_ranks": 0, "loss_rank_avg": 0.17857998609542847, "step": 2800, "valid_targets_mean": 4501.1, "valid_targets_min": 721 }, { "epoch": 4.473684210526316, "grad_norm": 0.463251002628163, "learning_rate": 1.3895350102074386e-05, "loss": 0.1639, "loss_nan_ranks": 0, "loss_rank_avg": 0.17204450070858002, "step": 2805, "valid_targets_mean": 5583.7, "valid_targets_min": 237 }, { "epoch": 4.481658692185008, "grad_norm": 0.43951674293696763, "learning_rate": 1.3819660112501054e-05, "loss": 0.1591, "loss_nan_ranks": 0, "loss_rank_avg": 0.15155509114265442, "step": 2810, "valid_targets_mean": 5825.9, "valid_targets_min": 897 }, { "epoch": 4.4896331738437, "grad_norm": 0.48668589039422894, "learning_rate": 1.3744067859555461e-05, "loss": 0.167, "loss_nan_ranks": 0, "loss_rank_avg": 0.16631749272346497, "step": 2815, "valid_targets_mean": 4816.9, "valid_targets_min": 250 }, { "epoch": 4.497607655502392, "grad_norm": 0.4474999184326488, "learning_rate": 1.3668574538662451e-05, "loss": 0.1627, "loss_nan_ranks": 0, "loss_rank_avg": 0.17684899270534515, "step": 2820, "valid_targets_mean": 5176.1, "valid_targets_min": 243 }, { "epoch": 4.505582137161085, "grad_norm": 0.4462277446311322, "learning_rate": 1.3593181343682353e-05, "loss": 0.1635, "loss_nan_ranks": 0, "loss_rank_avg": 0.16628840565681458, "step": 2825, "valid_targets_mean": 5292.2, "valid_targets_min": 309 }, { "epoch": 4.513556618819777, "grad_norm": 0.5107987331641045, "learning_rate": 1.3517889466892085e-05, "loss": 0.1605, "loss_nan_ranks": 0, "loss_rank_avg": 0.15675923228263855, "step": 2830, "valid_targets_mean": 3909.9, "valid_targets_min": 296 }, { "epoch": 4.521531100478469, "grad_norm": 0.46641473919470094, "learning_rate": 1.3442700098966326e-05, "loss": 0.1576, "loss_nan_ranks": 0, "loss_rank_avg": 0.16455984115600586, "step": 2835, "valid_targets_mean": 4710.5, "valid_targets_min": 298 }, { "epoch": 4.529505582137161, "grad_norm": 0.5015636399760796, "learning_rate": 1.3367614428958646e-05, "loss": 0.1605, "loss_nan_ranks": 0, "loss_rank_avg": 0.17463116347789764, "step": 2840, "valid_targets_mean": 4366.3, "valid_targets_min": 265 }, { "epoch": 4.5374800637958534, "grad_norm": 0.5206414572728846, "learning_rate": 1.3292633644282735e-05, "loss": 0.172, "loss_nan_ranks": 0, "loss_rank_avg": 0.18271681666374207, "step": 2845, "valid_targets_mean": 4655.6, "valid_targets_min": 237 }, { "epoch": 4.545454545454545, "grad_norm": 0.612470158692335, "learning_rate": 1.3217758930693608e-05, "loss": 0.1578, "loss_nan_ranks": 0, "loss_rank_avg": 0.15408973395824432, "step": 2850, "valid_targets_mean": 4344.2, "valid_targets_min": 234 }, { "epoch": 4.553429027113237, "grad_norm": 0.38141520226279213, "learning_rate": 1.314299147226887e-05, "loss": 0.1555, "loss_nan_ranks": 0, "loss_rank_avg": 0.14755874872207642, "step": 2855, "valid_targets_mean": 5986.4, "valid_targets_min": 880 }, { "epoch": 4.56140350877193, "grad_norm": 0.4310034608873921, "learning_rate": 1.3068332451389969e-05, "loss": 0.1539, "loss_nan_ranks": 0, "loss_rank_avg": 0.1514865756034851, "step": 2860, "valid_targets_mean": 6271.6, "valid_targets_min": 4306 }, { "epoch": 4.569377990430622, "grad_norm": 0.4356530709450213, "learning_rate": 1.2993783048723515e-05, "loss": 0.1615, "loss_nan_ranks": 0, "loss_rank_avg": 0.15877559781074524, "step": 2865, "valid_targets_mean": 5407.3, "valid_targets_min": 399 }, { "epoch": 4.577352472089315, "grad_norm": 0.564670837742309, "learning_rate": 1.2919344443202602e-05, "loss": 0.1612, "loss_nan_ranks": 0, "loss_rank_avg": 0.14960314333438873, "step": 2870, "valid_targets_mean": 3163.2, "valid_targets_min": 218 }, { "epoch": 4.585326953748006, "grad_norm": 0.4785084988426857, "learning_rate": 1.2845017812008158e-05, "loss": 0.1628, "loss_nan_ranks": 0, "loss_rank_avg": 0.1763634979724884, "step": 2875, "valid_targets_mean": 4772.2, "valid_targets_min": 222 }, { "epoch": 4.5933014354066986, "grad_norm": 0.42494589929233484, "learning_rate": 1.277080433055034e-05, "loss": 0.1615, "loss_nan_ranks": 0, "loss_rank_avg": 0.16085359454154968, "step": 2880, "valid_targets_mean": 5689.2, "valid_targets_min": 225 }, { "epoch": 4.601275917065391, "grad_norm": 0.47807251510580745, "learning_rate": 1.2696705172449944e-05, "loss": 0.1578, "loss_nan_ranks": 0, "loss_rank_avg": 0.15512213110923767, "step": 2885, "valid_targets_mean": 4743.9, "valid_targets_min": 185 }, { "epoch": 4.6092503987240825, "grad_norm": 0.45580307365244943, "learning_rate": 1.2622721509519846e-05, "loss": 0.1674, "loss_nan_ranks": 0, "loss_rank_avg": 0.17423364520072937, "step": 2890, "valid_targets_mean": 4932.5, "valid_targets_min": 373 }, { "epoch": 4.617224880382775, "grad_norm": 0.5794992528529187, "learning_rate": 1.2548854511746461e-05, "loss": 0.1649, "loss_nan_ranks": 0, "loss_rank_avg": 0.17313656210899353, "step": 2895, "valid_targets_mean": 4594.8, "valid_targets_min": 223 }, { "epoch": 4.625199362041467, "grad_norm": 0.4094555332819473, "learning_rate": 1.247510534727125e-05, "loss": 0.1663, "loss_nan_ranks": 0, "loss_rank_avg": 0.15635088086128235, "step": 2900, "valid_targets_mean": 5626.6, "valid_targets_min": 414 }, { "epoch": 4.63317384370016, "grad_norm": 0.4677979868665022, "learning_rate": 1.240147518237224e-05, "loss": 0.1615, "loss_nan_ranks": 0, "loss_rank_avg": 0.1597626507282257, "step": 2905, "valid_targets_mean": 4849.3, "valid_targets_min": 258 }, { "epoch": 4.641148325358852, "grad_norm": 0.4603270505711866, "learning_rate": 1.2327965181445593e-05, "loss": 0.1637, "loss_nan_ranks": 0, "loss_rank_avg": 0.16551506519317627, "step": 2910, "valid_targets_mean": 5237.4, "valid_targets_min": 2288 }, { "epoch": 4.649122807017544, "grad_norm": 0.4366408749058765, "learning_rate": 1.2254576506987182e-05, "loss": 0.1649, "loss_nan_ranks": 0, "loss_rank_avg": 0.1736927628517151, "step": 2915, "valid_targets_mean": 5546.3, "valid_targets_min": 350 }, { "epoch": 4.657097288676236, "grad_norm": 0.43355175444421734, "learning_rate": 1.21813103195742e-05, "loss": 0.1643, "loss_nan_ranks": 0, "loss_rank_avg": 0.15354032814502716, "step": 2920, "valid_targets_mean": 5324.1, "valid_targets_min": 218 }, { "epoch": 4.6650717703349285, "grad_norm": 0.5608093339511655, "learning_rate": 1.2108167777846815e-05, "loss": 0.1684, "loss_nan_ranks": 0, "loss_rank_avg": 0.16178153455257416, "step": 2925, "valid_targets_mean": 5233.4, "valid_targets_min": 242 }, { "epoch": 4.67304625199362, "grad_norm": 0.5169396036803482, "learning_rate": 1.203515003848987e-05, "loss": 0.1746, "loss_nan_ranks": 0, "loss_rank_avg": 0.18358519673347473, "step": 2930, "valid_targets_mean": 4139.6, "valid_targets_min": 333 }, { "epoch": 4.681020733652312, "grad_norm": 0.5322766631274986, "learning_rate": 1.1962258256214545e-05, "loss": 0.1664, "loss_nan_ranks": 0, "loss_rank_avg": 0.16810274124145508, "step": 2935, "valid_targets_mean": 3680.1, "valid_targets_min": 235 }, { "epoch": 4.688995215311005, "grad_norm": 0.4507589408310588, "learning_rate": 1.1889493583740124e-05, "loss": 0.1639, "loss_nan_ranks": 0, "loss_rank_avg": 0.14625227451324463, "step": 2940, "valid_targets_mean": 5085.9, "valid_targets_min": 234 }, { "epoch": 4.696969696969697, "grad_norm": 0.5558750405081903, "learning_rate": 1.1816857171775767e-05, "loss": 0.1615, "loss_nan_ranks": 0, "loss_rank_avg": 0.1795760989189148, "step": 2945, "valid_targets_mean": 5080.6, "valid_targets_min": 226 }, { "epoch": 4.70494417862839, "grad_norm": 0.481514040881239, "learning_rate": 1.1744350169002308e-05, "loss": 0.172, "loss_nan_ranks": 0, "loss_rank_avg": 0.16550910472869873, "step": 2950, "valid_targets_mean": 4276.0, "valid_targets_min": 220 }, { "epoch": 4.712918660287081, "grad_norm": 0.46285391513788915, "learning_rate": 1.1671973722054077e-05, "loss": 0.1631, "loss_nan_ranks": 0, "loss_rank_avg": 0.15627330541610718, "step": 2955, "valid_targets_mean": 5210.4, "valid_targets_min": 325 }, { "epoch": 4.720893141945774, "grad_norm": 0.4381563224190673, "learning_rate": 1.159972897550079e-05, "loss": 0.1648, "loss_nan_ranks": 0, "loss_rank_avg": 0.16192206740379333, "step": 2960, "valid_targets_mean": 5571.1, "valid_targets_min": 1626 }, { "epoch": 4.728867623604466, "grad_norm": 0.5236440592598125, "learning_rate": 1.1527617071829447e-05, "loss": 0.1532, "loss_nan_ranks": 0, "loss_rank_avg": 0.1626909375190735, "step": 2965, "valid_targets_mean": 5419.7, "valid_targets_min": 732 }, { "epoch": 4.7368421052631575, "grad_norm": 0.6260805242947385, "learning_rate": 1.145563915142622e-05, "loss": 0.1634, "loss_nan_ranks": 0, "loss_rank_avg": 0.17754967510700226, "step": 2970, "valid_targets_mean": 4668.6, "valid_targets_min": 214 }, { "epoch": 4.74481658692185, "grad_norm": 0.43717068230202355, "learning_rate": 1.1383796352558489e-05, "loss": 0.1621, "loss_nan_ranks": 0, "loss_rank_avg": 0.1576494425535202, "step": 2975, "valid_targets_mean": 5962.7, "valid_targets_min": 235 }, { "epoch": 4.752791068580542, "grad_norm": 0.5329045016777196, "learning_rate": 1.1312089811356803e-05, "loss": 0.1748, "loss_nan_ranks": 0, "loss_rank_avg": 0.1734808087348938, "step": 2980, "valid_targets_mean": 4494.7, "valid_targets_min": 327 }, { "epoch": 4.760765550239235, "grad_norm": 0.46495559769894873, "learning_rate": 1.1240520661796882e-05, "loss": 0.162, "loss_nan_ranks": 0, "loss_rank_avg": 0.16236670315265656, "step": 2985, "valid_targets_mean": 4686.7, "valid_targets_min": 200 }, { "epoch": 4.768740031897926, "grad_norm": 0.43626568077375366, "learning_rate": 1.1169090035681772e-05, "loss": 0.1652, "loss_nan_ranks": 0, "loss_rank_avg": 0.1571044623851776, "step": 2990, "valid_targets_mean": 5496.3, "valid_targets_min": 190 }, { "epoch": 4.776714513556619, "grad_norm": 0.45169170298100625, "learning_rate": 1.109779906262383e-05, "loss": 0.1649, "loss_nan_ranks": 0, "loss_rank_avg": 0.15914367139339447, "step": 2995, "valid_targets_mean": 5026.9, "valid_targets_min": 238 }, { "epoch": 4.784688995215311, "grad_norm": 0.4655091549732474, "learning_rate": 1.102664887002698e-05, "loss": 0.1681, "loss_nan_ranks": 0, "loss_rank_avg": 0.16559766232967377, "step": 3000, "valid_targets_mean": 4727.7, "valid_targets_min": 817 }, { "epoch": 4.7926634768740035, "grad_norm": 0.5136371479792501, "learning_rate": 1.0955640583068802e-05, "loss": 0.1693, "loss_nan_ranks": 0, "loss_rank_avg": 0.1526031494140625, "step": 3005, "valid_targets_mean": 4957.2, "valid_targets_min": 224 }, { "epoch": 4.800637958532695, "grad_norm": 0.5016448829784496, "learning_rate": 1.0884775324682755e-05, "loss": 0.1664, "loss_nan_ranks": 0, "loss_rank_avg": 0.17114630341529846, "step": 3010, "valid_targets_mean": 4075.6, "valid_targets_min": 191 }, { "epoch": 4.8086124401913874, "grad_norm": 0.444367284493778, "learning_rate": 1.081405421554044e-05, "loss": 0.1647, "loss_nan_ranks": 0, "loss_rank_avg": 0.16200141608715057, "step": 3015, "valid_targets_mean": 6258.1, "valid_targets_min": 388 }, { "epoch": 4.81658692185008, "grad_norm": 0.4237329819210327, "learning_rate": 1.074347837403387e-05, "loss": 0.1667, "loss_nan_ranks": 0, "loss_rank_avg": 0.15558627247810364, "step": 3020, "valid_targets_mean": 5657.1, "valid_targets_min": 349 }, { "epoch": 4.824561403508772, "grad_norm": 0.5176039560323095, "learning_rate": 1.067304891625776e-05, "loss": 0.1724, "loss_nan_ranks": 0, "loss_rank_avg": 0.16431066393852234, "step": 3025, "valid_targets_mean": 4240.2, "valid_targets_min": 296 }, { "epoch": 4.832535885167464, "grad_norm": 0.528814370807462, "learning_rate": 1.0602766955991913e-05, "loss": 0.1607, "loss_nan_ranks": 0, "loss_rank_avg": 0.1717158555984497, "step": 3030, "valid_targets_mean": 4902.6, "valid_targets_min": 492 }, { "epoch": 4.840510366826156, "grad_norm": 0.44331350492759686, "learning_rate": 1.053263360468358e-05, "loss": 0.1623, "loss_nan_ranks": 0, "loss_rank_avg": 0.16708722710609436, "step": 3035, "valid_targets_mean": 5435.2, "valid_targets_min": 246 }, { "epoch": 4.848484848484849, "grad_norm": 0.44468265380219274, "learning_rate": 1.0462649971429884e-05, "loss": 0.1595, "loss_nan_ranks": 0, "loss_rank_avg": 0.16008290648460388, "step": 3040, "valid_targets_mean": 5562.2, "valid_targets_min": 237 }, { "epoch": 4.856459330143541, "grad_norm": 0.465252421331791, "learning_rate": 1.0392817162960304e-05, "loss": 0.1571, "loss_nan_ranks": 0, "loss_rank_avg": 0.159569650888443, "step": 3045, "valid_targets_mean": 4934.4, "valid_targets_min": 779 }, { "epoch": 4.8644338118022326, "grad_norm": 0.5128838331578629, "learning_rate": 1.0323136283619167e-05, "loss": 0.1704, "loss_nan_ranks": 0, "loss_rank_avg": 0.1651550829410553, "step": 3050, "valid_targets_mean": 4564.1, "valid_targets_min": 215 }, { "epoch": 4.872408293460925, "grad_norm": 0.45912144059548055, "learning_rate": 1.0253608435348136e-05, "loss": 0.1668, "loss_nan_ranks": 0, "loss_rank_avg": 0.16643419861793518, "step": 3055, "valid_targets_mean": 5427.7, "valid_targets_min": 229 }, { "epoch": 4.880382775119617, "grad_norm": 0.4460208854541763, "learning_rate": 1.0184234717668867e-05, "loss": 0.1644, "loss_nan_ranks": 0, "loss_rank_avg": 0.16689209640026093, "step": 3060, "valid_targets_mean": 4700.7, "valid_targets_min": 230 }, { "epoch": 4.88835725677831, "grad_norm": 0.4135934097283204, "learning_rate": 1.0115016227665544e-05, "loss": 0.1609, "loss_nan_ranks": 0, "loss_rank_avg": 0.13867491483688354, "step": 3065, "valid_targets_mean": 5309.3, "valid_targets_min": 577 }, { "epoch": 4.896331738437001, "grad_norm": 0.47533139658434936, "learning_rate": 1.0045954059967577e-05, "loss": 0.158, "loss_nan_ranks": 0, "loss_rank_avg": 0.15308788418769836, "step": 3070, "valid_targets_mean": 4834.2, "valid_targets_min": 390 }, { "epoch": 4.904306220095694, "grad_norm": 0.5327287831119275, "learning_rate": 9.977049306732287e-06, "loss": 0.1649, "loss_nan_ranks": 0, "loss_rank_avg": 0.17162764072418213, "step": 3075, "valid_targets_mean": 4897.1, "valid_targets_min": 238 }, { "epoch": 4.912280701754386, "grad_norm": 0.4904017524563081, "learning_rate": 9.908303057627591e-06, "loss": 0.1534, "loss_nan_ranks": 0, "loss_rank_avg": 0.14119388163089752, "step": 3080, "valid_targets_mean": 4725.4, "valid_targets_min": 228 }, { "epoch": 4.920255183413078, "grad_norm": 0.4970617612422358, "learning_rate": 9.83971639981484e-06, "loss": 0.1605, "loss_nan_ranks": 0, "loss_rank_avg": 0.15496879816055298, "step": 3085, "valid_targets_mean": 4607.4, "valid_targets_min": 408 }, { "epoch": 4.92822966507177, "grad_norm": 0.45864620988450583, "learning_rate": 9.771290417931559e-06, "loss": 0.1724, "loss_nan_ranks": 0, "loss_rank_avg": 0.17323030531406403, "step": 3090, "valid_targets_mean": 5090.6, "valid_targets_min": 293 }, { "epoch": 4.9362041467304625, "grad_norm": 0.42808519157930736, "learning_rate": 9.703026194074342e-06, "loss": 0.1612, "loss_nan_ranks": 0, "loss_rank_avg": 0.1540815681219101, "step": 3095, "valid_targets_mean": 5067.4, "valid_targets_min": 327 }, { "epoch": 4.944178628389155, "grad_norm": 0.5865902968093246, "learning_rate": 9.634924807781729e-06, "loss": 0.168, "loss_nan_ranks": 0, "loss_rank_avg": 0.1912127435207367, "step": 3100, "valid_targets_mean": 5640.5, "valid_targets_min": 246 }, { "epoch": 4.952153110047847, "grad_norm": 0.4717173764137801, "learning_rate": 9.566987336017102e-06, "loss": 0.1613, "loss_nan_ranks": 0, "loss_rank_avg": 0.16661816835403442, "step": 3105, "valid_targets_mean": 4765.6, "valid_targets_min": 311 }, { "epoch": 4.960127591706539, "grad_norm": 0.40260436168463637, "learning_rate": 9.499214853151699e-06, "loss": 0.1621, "loss_nan_ranks": 0, "loss_rank_avg": 0.1473720371723175, "step": 3110, "valid_targets_mean": 5560.6, "valid_targets_min": 229 }, { "epoch": 4.968102073365231, "grad_norm": 0.6016222748580632, "learning_rate": 9.431608430947619e-06, "loss": 0.1639, "loss_nan_ranks": 0, "loss_rank_avg": 0.16205176711082458, "step": 3115, "valid_targets_mean": 4679.3, "valid_targets_min": 252 }, { "epoch": 4.976076555023924, "grad_norm": 0.5889165021406836, "learning_rate": 9.364169138540805e-06, "loss": 0.1639, "loss_nan_ranks": 0, "loss_rank_avg": 0.17166294157505035, "step": 3120, "valid_targets_mean": 5065.7, "valid_targets_min": 407 }, { "epoch": 4.984051036682615, "grad_norm": 0.4790845449767566, "learning_rate": 9.296898042424237e-06, "loss": 0.1676, "loss_nan_ranks": 0, "loss_rank_avg": 0.18419404327869415, "step": 3125, "valid_targets_mean": 4631.6, "valid_targets_min": 286 }, { "epoch": 4.992025518341308, "grad_norm": 0.598447892968231, "learning_rate": 9.229796206431015e-06, "loss": 0.1657, "loss_nan_ranks": 0, "loss_rank_avg": 0.18810789287090302, "step": 3130, "valid_targets_mean": 5094.1, "valid_targets_min": 294 }, { "epoch": 5.0, "grad_norm": 0.4721586914499431, "learning_rate": 9.162864691717513e-06, "loss": 0.1626, "loss_nan_ranks": 0, "loss_rank_avg": 0.15202680230140686, "step": 3135, "valid_targets_mean": 4077.1, "valid_targets_min": 246 }, { "epoch": 5.007974481658692, "grad_norm": 0.45686843030415786, "learning_rate": 9.096104556746654e-06, "loss": 0.1565, "loss_nan_ranks": 0, "loss_rank_avg": 0.14485131204128265, "step": 3140, "valid_targets_mean": 4520.2, "valid_targets_min": 212 }, { "epoch": 5.015948963317384, "grad_norm": 0.4413073850480446, "learning_rate": 9.029516857271115e-06, "loss": 0.1667, "loss_nan_ranks": 0, "loss_rank_avg": 0.16614249348640442, "step": 3145, "valid_targets_mean": 5247.7, "valid_targets_min": 407 }, { "epoch": 5.023923444976076, "grad_norm": 0.45791139693185595, "learning_rate": 8.963102646316677e-06, "loss": 0.1553, "loss_nan_ranks": 0, "loss_rank_avg": 0.14995019137859344, "step": 3150, "valid_targets_mean": 5282.4, "valid_targets_min": 241 }, { "epoch": 5.031897926634769, "grad_norm": 0.5267991798971836, "learning_rate": 8.896862974165553e-06, "loss": 0.1506, "loss_nan_ranks": 0, "loss_rank_avg": 0.15393409132957458, "step": 3155, "valid_targets_mean": 3715.2, "valid_targets_min": 223 }, { "epoch": 5.039872408293461, "grad_norm": 0.4667594466034452, "learning_rate": 8.830798888339756e-06, "loss": 0.1537, "loss_nan_ranks": 0, "loss_rank_avg": 0.14532789587974548, "step": 3160, "valid_targets_mean": 4772.7, "valid_targets_min": 203 }, { "epoch": 5.047846889952153, "grad_norm": 0.443279890846053, "learning_rate": 8.764911433584581e-06, "loss": 0.1437, "loss_nan_ranks": 0, "loss_rank_avg": 0.14291726052761078, "step": 3165, "valid_targets_mean": 5765.4, "valid_targets_min": 538 }, { "epoch": 5.055821371610845, "grad_norm": 0.5471455934145786, "learning_rate": 8.699201651852056e-06, "loss": 0.1605, "loss_nan_ranks": 0, "loss_rank_avg": 0.1686840057373047, "step": 3170, "valid_targets_mean": 4019.4, "valid_targets_min": 373 }, { "epoch": 5.0637958532695375, "grad_norm": 0.49683984011851123, "learning_rate": 8.633670582284446e-06, "loss": 0.1501, "loss_nan_ranks": 0, "loss_rank_avg": 0.15907122194766998, "step": 3175, "valid_targets_mean": 5820.6, "valid_targets_min": 540 }, { "epoch": 5.07177033492823, "grad_norm": 0.5606716282540908, "learning_rate": 8.56831926119787e-06, "loss": 0.1582, "loss_nan_ranks": 0, "loss_rank_avg": 0.14971384406089783, "step": 3180, "valid_targets_mean": 3764.8, "valid_targets_min": 225 }, { "epoch": 5.0797448165869215, "grad_norm": 0.43047185858023407, "learning_rate": 8.503148722065851e-06, "loss": 0.1504, "loss_nan_ranks": 0, "loss_rank_avg": 0.13558684289455414, "step": 3185, "valid_targets_mean": 5010.2, "valid_targets_min": 243 }, { "epoch": 5.087719298245614, "grad_norm": 0.46301730293349586, "learning_rate": 8.43815999550303e-06, "loss": 0.1468, "loss_nan_ranks": 0, "loss_rank_avg": 0.14114761352539062, "step": 3190, "valid_targets_mean": 4802.3, "valid_targets_min": 650 }, { "epoch": 5.095693779904306, "grad_norm": 0.46169394066738256, "learning_rate": 8.373354109248842e-06, "loss": 0.1588, "loss_nan_ranks": 0, "loss_rank_avg": 0.17059487104415894, "step": 3195, "valid_targets_mean": 5362.9, "valid_targets_min": 477 }, { "epoch": 5.103668261562999, "grad_norm": 0.4737706843985567, "learning_rate": 8.308732088151245e-06, "loss": 0.1471, "loss_nan_ranks": 0, "loss_rank_avg": 0.14929816126823425, "step": 3200, "valid_targets_mean": 5279.0, "valid_targets_min": 1123 }, { "epoch": 5.11164274322169, "grad_norm": 0.558320078734975, "learning_rate": 8.24429495415054e-06, "loss": 0.1611, "loss_nan_ranks": 0, "loss_rank_avg": 0.14897915720939636, "step": 3205, "valid_targets_mean": 3327.8, "valid_targets_min": 198 }, { "epoch": 5.119617224880383, "grad_norm": 0.4969563956951489, "learning_rate": 8.180043726263216e-06, "loss": 0.1538, "loss_nan_ranks": 0, "loss_rank_avg": 0.1674622893333435, "step": 3210, "valid_targets_mean": 4794.8, "valid_targets_min": 234 }, { "epoch": 5.127591706539075, "grad_norm": 0.4433365316202014, "learning_rate": 8.115979420565794e-06, "loss": 0.1548, "loss_nan_ranks": 0, "loss_rank_avg": 0.14808738231658936, "step": 3215, "valid_targets_mean": 5291.6, "valid_targets_min": 448 }, { "epoch": 5.1355661881977674, "grad_norm": 0.4863373730285094, "learning_rate": 8.052103050178806e-06, "loss": 0.1667, "loss_nan_ranks": 0, "loss_rank_avg": 0.1640024185180664, "step": 3220, "valid_targets_mean": 5062.5, "valid_targets_min": 760 }, { "epoch": 5.143540669856459, "grad_norm": 0.4930454760697995, "learning_rate": 7.988415625250755e-06, "loss": 0.1458, "loss_nan_ranks": 0, "loss_rank_avg": 0.14119328558444977, "step": 3225, "valid_targets_mean": 4849.4, "valid_targets_min": 258 }, { "epoch": 5.151515151515151, "grad_norm": 0.4113425375075243, "learning_rate": 7.924918152942117e-06, "loss": 0.1469, "loss_nan_ranks": 0, "loss_rank_avg": 0.13915401697158813, "step": 3230, "valid_targets_mean": 5780.1, "valid_targets_min": 1144 }, { "epoch": 5.159489633173844, "grad_norm": 0.4727008507251189, "learning_rate": 7.861611637409462e-06, "loss": 0.157, "loss_nan_ranks": 0, "loss_rank_avg": 0.16318866610527039, "step": 3235, "valid_targets_mean": 4842.1, "valid_targets_min": 586 }, { "epoch": 5.167464114832536, "grad_norm": 0.4828095943833063, "learning_rate": 7.798497079789513e-06, "loss": 0.1554, "loss_nan_ranks": 0, "loss_rank_avg": 0.16433711349964142, "step": 3240, "valid_targets_mean": 4624.4, "valid_targets_min": 274 }, { "epoch": 5.175438596491228, "grad_norm": 0.4744135193352567, "learning_rate": 7.735575478183381e-06, "loss": 0.1473, "loss_nan_ranks": 0, "loss_rank_avg": 0.1755599081516266, "step": 3245, "valid_targets_mean": 5212.1, "valid_targets_min": 333 }, { "epoch": 5.18341307814992, "grad_norm": 0.4581602183709319, "learning_rate": 7.672847827640735e-06, "loss": 0.1507, "loss_nan_ranks": 0, "loss_rank_avg": 0.14598888158798218, "step": 3250, "valid_targets_mean": 4947.1, "valid_targets_min": 367 }, { "epoch": 5.1913875598086126, "grad_norm": 0.44432426152642096, "learning_rate": 7.610315120144067e-06, "loss": 0.1494, "loss_nan_ranks": 0, "loss_rank_avg": 0.15802133083343506, "step": 3255, "valid_targets_mean": 5613.7, "valid_targets_min": 230 }, { "epoch": 5.199362041467305, "grad_norm": 0.45090931602424295, "learning_rate": 7.5479783445930414e-06, "loss": 0.1508, "loss_nan_ranks": 0, "loss_rank_avg": 0.14497801661491394, "step": 3260, "valid_targets_mean": 5019.5, "valid_targets_min": 241 }, { "epoch": 5.2073365231259965, "grad_norm": 0.48834864182029514, "learning_rate": 7.485838486788803e-06, "loss": 0.1606, "loss_nan_ranks": 0, "loss_rank_avg": 0.15974393486976624, "step": 3265, "valid_targets_mean": 6540.7, "valid_targets_min": 4632 }, { "epoch": 5.215311004784689, "grad_norm": 0.4491148244141114, "learning_rate": 7.4238965294184374e-06, "loss": 0.1452, "loss_nan_ranks": 0, "loss_rank_avg": 0.14351961016654968, "step": 3270, "valid_targets_mean": 5034.4, "valid_targets_min": 207 }, { "epoch": 5.223285486443381, "grad_norm": 0.4459921331500691, "learning_rate": 7.362153452039409e-06, "loss": 0.1579, "loss_nan_ranks": 0, "loss_rank_avg": 0.1467072069644928, "step": 3275, "valid_targets_mean": 5784.2, "valid_targets_min": 993 }, { "epoch": 5.231259968102074, "grad_norm": 0.48106320041218886, "learning_rate": 7.300610231064056e-06, "loss": 0.1491, "loss_nan_ranks": 0, "loss_rank_avg": 0.14502954483032227, "step": 3280, "valid_targets_mean": 4507.9, "valid_targets_min": 236 }, { "epoch": 5.239234449760765, "grad_norm": 0.4864889224714647, "learning_rate": 7.239267839744166e-06, "loss": 0.1576, "loss_nan_ranks": 0, "loss_rank_avg": 0.16197340190410614, "step": 3285, "valid_targets_mean": 4953.2, "valid_targets_min": 255 }, { "epoch": 5.247208931419458, "grad_norm": 0.4604998630393094, "learning_rate": 7.178127248155604e-06, "loss": 0.1547, "loss_nan_ranks": 0, "loss_rank_avg": 0.14153867959976196, "step": 3290, "valid_targets_mean": 4488.4, "valid_targets_min": 272 }, { "epoch": 5.25518341307815, "grad_norm": 0.49236439922059083, "learning_rate": 7.117189423182917e-06, "loss": 0.1592, "loss_nan_ranks": 0, "loss_rank_avg": 0.15775446593761444, "step": 3295, "valid_targets_mean": 5084.4, "valid_targets_min": 210 }, { "epoch": 5.2631578947368425, "grad_norm": 0.47838707598832375, "learning_rate": 7.056455328504104e-06, "loss": 0.164, "loss_nan_ranks": 0, "loss_rank_avg": 0.15875396132469177, "step": 3300, "valid_targets_mean": 4948.1, "valid_targets_min": 215 }, { "epoch": 5.271132376395534, "grad_norm": 0.5433755427176816, "learning_rate": 6.995925924575342e-06, "loss": 0.15, "loss_nan_ranks": 0, "loss_rank_avg": 0.13437744975090027, "step": 3305, "valid_targets_mean": 4722.6, "valid_targets_min": 222 }, { "epoch": 5.279106858054226, "grad_norm": 0.4815763895098848, "learning_rate": 6.935602168615792e-06, "loss": 0.1527, "loss_nan_ranks": 0, "loss_rank_avg": 0.14211152493953705, "step": 3310, "valid_targets_mean": 4732.8, "valid_targets_min": 221 }, { "epoch": 5.287081339712919, "grad_norm": 0.4447410196842261, "learning_rate": 6.875485014592493e-06, "loss": 0.1503, "loss_nan_ranks": 0, "loss_rank_avg": 0.14757999777793884, "step": 3315, "valid_targets_mean": 5167.4, "valid_targets_min": 363 }, { "epoch": 5.295055821371611, "grad_norm": 0.4251332258800115, "learning_rate": 6.815575413205235e-06, "loss": 0.1469, "loss_nan_ranks": 0, "loss_rank_avg": 0.13727967441082, "step": 3320, "valid_targets_mean": 5821.2, "valid_targets_min": 240 }, { "epoch": 5.303030303030303, "grad_norm": 0.49143529385732765, "learning_rate": 6.755874311871562e-06, "loss": 0.1582, "loss_nan_ranks": 0, "loss_rank_avg": 0.14603282511234283, "step": 3325, "valid_targets_mean": 5343.0, "valid_targets_min": 235 }, { "epoch": 5.311004784688995, "grad_norm": 0.4426387776988706, "learning_rate": 6.696382654711777e-06, "loss": 0.1596, "loss_nan_ranks": 0, "loss_rank_avg": 0.15520070493221283, "step": 3330, "valid_targets_mean": 5272.8, "valid_targets_min": 235 }, { "epoch": 5.318979266347688, "grad_norm": 0.4049094841075801, "learning_rate": 6.637101382533986e-06, "loss": 0.1498, "loss_nan_ranks": 0, "loss_rank_avg": 0.14739316701889038, "step": 3335, "valid_targets_mean": 6374.6, "valid_targets_min": 402 }, { "epoch": 5.32695374800638, "grad_norm": 0.4913045824856341, "learning_rate": 6.578031432819263e-06, "loss": 0.1597, "loss_nan_ranks": 0, "loss_rank_avg": 0.1726195514202118, "step": 3340, "valid_targets_mean": 5006.8, "valid_targets_min": 314 }, { "epoch": 5.3349282296650715, "grad_norm": 0.4627985926205782, "learning_rate": 6.5191737397068015e-06, "loss": 0.1514, "loss_nan_ranks": 0, "loss_rank_avg": 0.1454908698797226, "step": 3345, "valid_targets_mean": 5310.7, "valid_targets_min": 589 }, { "epoch": 5.342902711323764, "grad_norm": 0.5210475663646326, "learning_rate": 6.460529233979127e-06, "loss": 0.1496, "loss_nan_ranks": 0, "loss_rank_avg": 0.15867014229297638, "step": 3350, "valid_targets_mean": 4499.4, "valid_targets_min": 248 }, { "epoch": 5.350877192982456, "grad_norm": 0.49981873498821056, "learning_rate": 6.402098843047417e-06, "loss": 0.1511, "loss_nan_ranks": 0, "loss_rank_avg": 0.1456516683101654, "step": 3355, "valid_targets_mean": 5316.4, "valid_targets_min": 598 }, { "epoch": 5.358851674641148, "grad_norm": 0.5064676891648265, "learning_rate": 6.343883490936791e-06, "loss": 0.1562, "loss_nan_ranks": 0, "loss_rank_avg": 0.1448066532611847, "step": 3360, "valid_targets_mean": 4308.1, "valid_targets_min": 233 }, { "epoch": 5.36682615629984, "grad_norm": 0.47905838596998346, "learning_rate": 6.285884098271739e-06, "loss": 0.1645, "loss_nan_ranks": 0, "loss_rank_avg": 0.15558141469955444, "step": 3365, "valid_targets_mean": 5043.6, "valid_targets_min": 243 }, { "epoch": 5.374800637958533, "grad_norm": 0.48629149557224766, "learning_rate": 6.228101582261532e-06, "loss": 0.154, "loss_nan_ranks": 0, "loss_rank_avg": 0.16721400618553162, "step": 3370, "valid_targets_mean": 4973.9, "valid_targets_min": 497 }, { "epoch": 5.382775119617225, "grad_norm": 0.4850858183720529, "learning_rate": 6.170536856685716e-06, "loss": 0.1535, "loss_nan_ranks": 0, "loss_rank_avg": 0.15335974097251892, "step": 3375, "valid_targets_mean": 4478.9, "valid_targets_min": 223 }, { "epoch": 5.3907496012759175, "grad_norm": 0.4833072145728141, "learning_rate": 6.113190831879698e-06, "loss": 0.1616, "loss_nan_ranks": 0, "loss_rank_avg": 0.16516146063804626, "step": 3380, "valid_targets_mean": 5205.5, "valid_targets_min": 235 }, { "epoch": 5.398724082934609, "grad_norm": 0.4835288113090004, "learning_rate": 6.056064414720317e-06, "loss": 0.1565, "loss_nan_ranks": 0, "loss_rank_avg": 0.16842329502105713, "step": 3385, "valid_targets_mean": 5243.1, "valid_targets_min": 411 }, { "epoch": 5.4066985645933014, "grad_norm": 0.43313320847470577, "learning_rate": 5.999158508611496e-06, "loss": 0.1511, "loss_nan_ranks": 0, "loss_rank_avg": 0.1504177451133728, "step": 3390, "valid_targets_mean": 5215.4, "valid_targets_min": 465 }, { "epoch": 5.414673046251994, "grad_norm": 0.49036685155823234, "learning_rate": 5.942474013469983e-06, "loss": 0.1526, "loss_nan_ranks": 0, "loss_rank_avg": 0.1608334183692932, "step": 3395, "valid_targets_mean": 4751.9, "valid_targets_min": 285 }, { "epoch": 5.422647527910685, "grad_norm": 0.574663879399246, "learning_rate": 5.886011825711117e-06, "loss": 0.1466, "loss_nan_ranks": 0, "loss_rank_avg": 0.15289413928985596, "step": 3400, "valid_targets_mean": 5535.6, "valid_targets_min": 242 }, { "epoch": 5.430622009569378, "grad_norm": 0.5322494164948655, "learning_rate": 5.829772838234615e-06, "loss": 0.1546, "loss_nan_ranks": 0, "loss_rank_avg": 0.15102876722812653, "step": 3405, "valid_targets_mean": 3683.2, "valid_targets_min": 240 }, { "epoch": 5.43859649122807, "grad_norm": 0.5187498623215531, "learning_rate": 5.773757940410503e-06, "loss": 0.153, "loss_nan_ranks": 0, "loss_rank_avg": 0.14615221321582794, "step": 3410, "valid_targets_mean": 4623.8, "valid_targets_min": 346 }, { "epoch": 5.446570972886763, "grad_norm": 0.4685828114508998, "learning_rate": 5.7179680180650055e-06, "loss": 0.1611, "loss_nan_ranks": 0, "loss_rank_avg": 0.15752843022346497, "step": 3415, "valid_targets_mean": 5684.5, "valid_targets_min": 300 }, { "epoch": 5.454545454545454, "grad_norm": 0.522889077511281, "learning_rate": 5.6624039534665775e-06, "loss": 0.162, "loss_nan_ranks": 0, "loss_rank_avg": 0.1590261310338974, "step": 3420, "valid_targets_mean": 4173.8, "valid_targets_min": 233 }, { "epoch": 5.4625199362041466, "grad_norm": 0.4756762932324726, "learning_rate": 5.607066625311925e-06, "loss": 0.1549, "loss_nan_ranks": 0, "loss_rank_avg": 0.19886696338653564, "step": 3425, "valid_targets_mean": 5566.5, "valid_targets_min": 164 }, { "epoch": 5.470494417862839, "grad_norm": 0.47917438890986686, "learning_rate": 5.55195690871211e-06, "loss": 0.1565, "loss_nan_ranks": 0, "loss_rank_avg": 0.160795658826828, "step": 3430, "valid_targets_mean": 4546.6, "valid_targets_min": 446 }, { "epoch": 5.478468899521531, "grad_norm": 0.7787098363738806, "learning_rate": 5.497075675178727e-06, "loss": 0.157, "loss_nan_ranks": 0, "loss_rank_avg": 0.1853606253862381, "step": 3435, "valid_targets_mean": 4119.0, "valid_targets_min": 224 }, { "epoch": 5.486443381180223, "grad_norm": 0.5471104540057793, "learning_rate": 5.442423792610118e-06, "loss": 0.1521, "loss_nan_ranks": 0, "loss_rank_avg": 0.13731586933135986, "step": 3440, "valid_targets_mean": 4580.0, "valid_targets_min": 238 }, { "epoch": 5.494417862838915, "grad_norm": 0.43633058177704404, "learning_rate": 5.388002125277627e-06, "loss": 0.1529, "loss_nan_ranks": 0, "loss_rank_avg": 0.1393011510372162, "step": 3445, "valid_targets_mean": 5709.1, "valid_targets_min": 2356 }, { "epoch": 5.502392344497608, "grad_norm": 0.500544121947255, "learning_rate": 5.333811533811945e-06, "loss": 0.1525, "loss_nan_ranks": 0, "loss_rank_avg": 0.16812501847743988, "step": 3450, "valid_targets_mean": 4662.3, "valid_targets_min": 404 }, { "epoch": 5.5103668261563, "grad_norm": 0.4321968671668473, "learning_rate": 5.2798528751895265e-06, "loss": 0.1565, "loss_nan_ranks": 0, "loss_rank_avg": 0.1472059190273285, "step": 3455, "valid_targets_mean": 5412.5, "valid_targets_min": 260 }, { "epoch": 5.518341307814992, "grad_norm": 0.516188282731035, "learning_rate": 5.226127002718984e-06, "loss": 0.1507, "loss_nan_ranks": 0, "loss_rank_avg": 0.1455184817314148, "step": 3460, "valid_targets_mean": 4234.6, "valid_targets_min": 243 }, { "epoch": 5.526315789473684, "grad_norm": 0.4966018837171216, "learning_rate": 5.1726347660276424e-06, "loss": 0.1562, "loss_nan_ranks": 0, "loss_rank_avg": 0.1486985981464386, "step": 3465, "valid_targets_mean": 5566.6, "valid_targets_min": 226 }, { "epoch": 5.5342902711323765, "grad_norm": 0.4791331897643804, "learning_rate": 5.119377011048066e-06, "loss": 0.1548, "loss_nan_ranks": 0, "loss_rank_avg": 0.13465863466262817, "step": 3470, "valid_targets_mean": 3971.8, "valid_targets_min": 239 }, { "epoch": 5.542264752791069, "grad_norm": 0.6285282708036979, "learning_rate": 5.066354580004713e-06, "loss": 0.1599, "loss_nan_ranks": 0, "loss_rank_avg": 0.15100893378257751, "step": 3475, "valid_targets_mean": 3005.4, "valid_targets_min": 269 }, { "epoch": 5.55023923444976, "grad_norm": 0.4915313605987961, "learning_rate": 5.013568311400599e-06, "loss": 0.1529, "loss_nan_ranks": 0, "loss_rank_avg": 0.14344826340675354, "step": 3480, "valid_targets_mean": 6651.2, "valid_targets_min": 236 }, { "epoch": 5.558213716108453, "grad_norm": 0.5181311764118561, "learning_rate": 4.96101904000402e-06, "loss": 0.1522, "loss_nan_ranks": 0, "loss_rank_avg": 0.16833406686782837, "step": 3485, "valid_targets_mean": 4451.7, "valid_targets_min": 298 }, { "epoch": 5.566188197767145, "grad_norm": 0.44911434199256317, "learning_rate": 4.908707596835396e-06, "loss": 0.1565, "loss_nan_ranks": 0, "loss_rank_avg": 0.16398075222969055, "step": 3490, "valid_targets_mean": 5795.6, "valid_targets_min": 243 }, { "epoch": 5.574162679425838, "grad_norm": 0.48887673542216, "learning_rate": 4.856634809154093e-06, "loss": 0.1555, "loss_nan_ranks": 0, "loss_rank_avg": 0.14630258083343506, "step": 3495, "valid_targets_mean": 4798.6, "valid_targets_min": 395 }, { "epoch": 5.582137161084529, "grad_norm": 0.4795845324226209, "learning_rate": 4.804801500445338e-06, "loss": 0.1548, "loss_nan_ranks": 0, "loss_rank_avg": 0.16289225220680237, "step": 3500, "valid_targets_mean": 4453.1, "valid_targets_min": 245 }, { "epoch": 5.590111642743222, "grad_norm": 0.49292253026437766, "learning_rate": 4.753208490407233e-06, "loss": 0.1631, "loss_nan_ranks": 0, "loss_rank_avg": 0.18191534280776978, "step": 3505, "valid_targets_mean": 4498.8, "valid_targets_min": 489 }, { "epoch": 5.598086124401914, "grad_norm": 0.5089760135607062, "learning_rate": 4.701856594937744e-06, "loss": 0.1556, "loss_nan_ranks": 0, "loss_rank_avg": 0.13293233513832092, "step": 3510, "valid_targets_mean": 3764.9, "valid_targets_min": 215 }, { "epoch": 5.606060606060606, "grad_norm": 0.4746190959310646, "learning_rate": 4.650746626121838e-06, "loss": 0.1544, "loss_nan_ranks": 0, "loss_rank_avg": 0.13995599746704102, "step": 3515, "valid_targets_mean": 4787.4, "valid_targets_min": 199 }, { "epoch": 5.614035087719298, "grad_norm": 0.5034639146801175, "learning_rate": 4.5998793922186315e-06, "loss": 0.1543, "loss_nan_ranks": 0, "loss_rank_avg": 0.15416234731674194, "step": 3520, "valid_targets_mean": 4616.1, "valid_targets_min": 246 }, { "epoch": 5.62200956937799, "grad_norm": 0.46111743578791226, "learning_rate": 4.549255697648576e-06, "loss": 0.1604, "loss_nan_ranks": 0, "loss_rank_avg": 0.152305006980896, "step": 3525, "valid_targets_mean": 4995.6, "valid_targets_min": 227 }, { "epoch": 5.629984051036683, "grad_norm": 0.4608602450555988, "learning_rate": 4.498876342980796e-06, "loss": 0.1472, "loss_nan_ranks": 0, "loss_rank_avg": 0.1579793095588684, "step": 3530, "valid_targets_mean": 5248.8, "valid_targets_min": 255 }, { "epoch": 5.637958532695375, "grad_norm": 0.4733308675485752, "learning_rate": 4.448742124920368e-06, "loss": 0.1536, "loss_nan_ranks": 0, "loss_rank_avg": 0.14798873662948608, "step": 3535, "valid_targets_mean": 5376.5, "valid_targets_min": 221 }, { "epoch": 5.645933014354067, "grad_norm": 0.6093609437426408, "learning_rate": 4.39885383629576e-06, "loss": 0.1576, "loss_nan_ranks": 0, "loss_rank_avg": 0.16494160890579224, "step": 3540, "valid_targets_mean": 5107.6, "valid_targets_min": 242 }, { "epoch": 5.653907496012759, "grad_norm": 0.4704193599073439, "learning_rate": 4.349212266046285e-06, "loss": 0.1586, "loss_nan_ranks": 0, "loss_rank_avg": 0.16326230764389038, "step": 3545, "valid_targets_mean": 5324.4, "valid_targets_min": 269 }, { "epoch": 5.6618819776714515, "grad_norm": 0.4657747975162824, "learning_rate": 4.299818199209629e-06, "loss": 0.1603, "loss_nan_ranks": 0, "loss_rank_avg": 0.17422260344028473, "step": 3550, "valid_targets_mean": 4970.7, "valid_targets_min": 1396 }, { "epoch": 5.669856459330144, "grad_norm": 0.420515044849732, "learning_rate": 4.250672416909407e-06, "loss": 0.15, "loss_nan_ranks": 0, "loss_rank_avg": 0.1514442265033722, "step": 3555, "valid_targets_mean": 5760.6, "valid_targets_min": 1570 }, { "epoch": 5.6778309409888355, "grad_norm": 0.41516338928503643, "learning_rate": 4.201775696342862e-06, "loss": 0.1545, "loss_nan_ranks": 0, "loss_rank_avg": 0.16060051321983337, "step": 3560, "valid_targets_mean": 6413.8, "valid_targets_min": 3600 }, { "epoch": 5.685805422647528, "grad_norm": 0.46906623700170114, "learning_rate": 4.153128810768517e-06, "loss": 0.153, "loss_nan_ranks": 0, "loss_rank_avg": 0.16279572248458862, "step": 3565, "valid_targets_mean": 4736.4, "valid_targets_min": 208 }, { "epoch": 5.69377990430622, "grad_norm": 0.5015754356988779, "learning_rate": 4.104732529493991e-06, "loss": 0.1576, "loss_nan_ranks": 0, "loss_rank_avg": 0.18926894664764404, "step": 3570, "valid_targets_mean": 4425.1, "valid_targets_min": 227 }, { "epoch": 5.701754385964913, "grad_norm": 0.45105806384824143, "learning_rate": 4.056587617863825e-06, "loss": 0.1578, "loss_nan_ranks": 0, "loss_rank_avg": 0.17029494047164917, "step": 3575, "valid_targets_mean": 5617.8, "valid_targets_min": 460 }, { "epoch": 5.709728867623604, "grad_norm": 0.49175639523779135, "learning_rate": 4.008694837247345e-06, "loss": 0.1582, "loss_nan_ranks": 0, "loss_rank_avg": 0.18568654358386993, "step": 3580, "valid_targets_mean": 6270.6, "valid_targets_min": 244 }, { "epoch": 5.717703349282297, "grad_norm": 0.6769881677170507, "learning_rate": 3.961054945026674e-06, "loss": 0.1507, "loss_nan_ranks": 0, "loss_rank_avg": 0.1355312615633011, "step": 3585, "valid_targets_mean": 4165.9, "valid_targets_min": 218 }, { "epoch": 5.725677830940989, "grad_norm": 0.5133023315898203, "learning_rate": 3.913668694584705e-06, "loss": 0.154, "loss_nan_ranks": 0, "loss_rank_avg": 0.15609794855117798, "step": 3590, "valid_targets_mean": 4151.4, "valid_targets_min": 220 }, { "epoch": 5.733652312599681, "grad_norm": 0.44064504684893196, "learning_rate": 3.866536835293227e-06, "loss": 0.1506, "loss_nan_ranks": 0, "loss_rank_avg": 0.14749088883399963, "step": 3595, "valid_targets_mean": 5171.5, "valid_targets_min": 281 }, { "epoch": 5.741626794258373, "grad_norm": 0.4520697005826577, "learning_rate": 3.819660112501053e-06, "loss": 0.1526, "loss_nan_ranks": 0, "loss_rank_avg": 0.14739054441452026, "step": 3600, "valid_targets_mean": 5231.6, "valid_targets_min": 227 }, { "epoch": 5.749601275917065, "grad_norm": 0.4991227138203837, "learning_rate": 3.773039267522227e-06, "loss": 0.1542, "loss_nan_ranks": 0, "loss_rank_avg": 0.16402383148670197, "step": 3605, "valid_targets_mean": 4534.4, "valid_targets_min": 625 }, { "epoch": 5.757575757575758, "grad_norm": 0.4986065297798539, "learning_rate": 3.72667503762433e-06, "loss": 0.153, "loss_nan_ranks": 0, "loss_rank_avg": 0.1630692034959793, "step": 3610, "valid_targets_mean": 5159.6, "valid_targets_min": 389 }, { "epoch": 5.76555023923445, "grad_norm": 0.4049459898514612, "learning_rate": 3.680568156016786e-06, "loss": 0.1556, "loss_nan_ranks": 0, "loss_rank_avg": 0.1414915919303894, "step": 3615, "valid_targets_mean": 6273.9, "valid_targets_min": 3956 }, { "epoch": 5.773524720893142, "grad_norm": 0.543662044908981, "learning_rate": 3.6347193518392776e-06, "loss": 0.1488, "loss_nan_ranks": 0, "loss_rank_avg": 0.1631641983985901, "step": 3620, "valid_targets_mean": 3520.4, "valid_targets_min": 242 }, { "epoch": 5.781499202551834, "grad_norm": 0.5132679429264033, "learning_rate": 3.58912935015024e-06, "loss": 0.1588, "loss_nan_ranks": 0, "loss_rank_avg": 0.17440487444400787, "step": 3625, "valid_targets_mean": 4255.1, "valid_targets_min": 328 }, { "epoch": 5.7894736842105265, "grad_norm": 0.5053310023786863, "learning_rate": 3.543798871915367e-06, "loss": 0.1522, "loss_nan_ranks": 0, "loss_rank_avg": 0.15172672271728516, "step": 3630, "valid_targets_mean": 4452.2, "valid_targets_min": 227 }, { "epoch": 5.797448165869218, "grad_norm": 0.4684784598941, "learning_rate": 3.498728633996209e-06, "loss": 0.1592, "loss_nan_ranks": 0, "loss_rank_avg": 0.14971506595611572, "step": 3635, "valid_targets_mean": 5225.2, "valid_targets_min": 230 }, { "epoch": 5.8054226475279105, "grad_norm": 0.46115162406236737, "learning_rate": 3.453919349138859e-06, "loss": 0.1486, "loss_nan_ranks": 0, "loss_rank_avg": 0.14659349620342255, "step": 3640, "valid_targets_mean": 5709.1, "valid_targets_min": 299 }, { "epoch": 5.813397129186603, "grad_norm": 0.46020022381518416, "learning_rate": 3.4093717259626514e-06, "loss": 0.1611, "loss_nan_ranks": 0, "loss_rank_avg": 0.13591623306274414, "step": 3645, "valid_targets_mean": 4973.1, "valid_targets_min": 765 }, { "epoch": 5.821371610845295, "grad_norm": 0.47367553344910285, "learning_rate": 3.365086468948988e-06, "loss": 0.1543, "loss_nan_ranks": 0, "loss_rank_avg": 0.1700918823480606, "step": 3650, "valid_targets_mean": 5319.5, "valid_targets_min": 225 }, { "epoch": 5.829346092503988, "grad_norm": 0.6505180384813233, "learning_rate": 3.321064278430175e-06, "loss": 0.1543, "loss_nan_ranks": 0, "loss_rank_avg": 0.1515679657459259, "step": 3655, "valid_targets_mean": 4172.9, "valid_targets_min": 212 }, { "epoch": 5.837320574162679, "grad_norm": 0.49312956238364775, "learning_rate": 3.277305850578345e-06, "loss": 0.1566, "loss_nan_ranks": 0, "loss_rank_avg": 0.14799179136753082, "step": 3660, "valid_targets_mean": 4885.3, "valid_targets_min": 227 }, { "epoch": 5.845295055821372, "grad_norm": 0.4184102214187514, "learning_rate": 3.2338118773944684e-06, "loss": 0.1507, "loss_nan_ranks": 0, "loss_rank_avg": 0.1451129913330078, "step": 3665, "valid_targets_mean": 6137.9, "valid_targets_min": 2702 }, { "epoch": 5.853269537480064, "grad_norm": 0.4917317516199451, "learning_rate": 3.1905830466973975e-06, "loss": 0.1502, "loss_nan_ranks": 0, "loss_rank_avg": 0.15702003240585327, "step": 3670, "valid_targets_mean": 5106.1, "valid_targets_min": 264 }, { "epoch": 5.861244019138756, "grad_norm": 0.4628847616665014, "learning_rate": 3.14762004211298e-06, "loss": 0.1559, "loss_nan_ranks": 0, "loss_rank_avg": 0.16175755858421326, "step": 3675, "valid_targets_mean": 5198.9, "valid_targets_min": 214 }, { "epoch": 5.869218500797448, "grad_norm": 0.47601217080416275, "learning_rate": 3.1049235430632696e-06, "loss": 0.1471, "loss_nan_ranks": 0, "loss_rank_avg": 0.15074549615383148, "step": 3680, "valid_targets_mean": 4520.1, "valid_targets_min": 233 }, { "epoch": 5.87719298245614, "grad_norm": 0.5834218075207638, "learning_rate": 3.062494224755759e-06, "loss": 0.1689, "loss_nan_ranks": 0, "loss_rank_avg": 0.2231508493423462, "step": 3685, "valid_targets_mean": 4244.4, "valid_targets_min": 232 }, { "epoch": 5.885167464114833, "grad_norm": 0.4766868558186829, "learning_rate": 3.0203327581727195e-06, "loss": 0.1539, "loss_nan_ranks": 0, "loss_rank_avg": 0.1613055020570755, "step": 3690, "valid_targets_mean": 4811.6, "valid_targets_min": 255 }, { "epoch": 5.893141945773524, "grad_norm": 0.44876715014880975, "learning_rate": 2.9784398100605937e-06, "loss": 0.1504, "loss_nan_ranks": 0, "loss_rank_avg": 0.14462366700172424, "step": 3695, "valid_targets_mean": 5235.1, "valid_targets_min": 278 }, { "epoch": 5.901116427432217, "grad_norm": 0.4510142737031215, "learning_rate": 2.9368160429194127e-06, "loss": 0.1481, "loss_nan_ranks": 0, "loss_rank_avg": 0.13386178016662598, "step": 3700, "valid_targets_mean": 5353.9, "valid_targets_min": 283 }, { "epoch": 5.909090909090909, "grad_norm": 0.4556921018996119, "learning_rate": 2.895462114992371e-06, "loss": 0.1607, "loss_nan_ranks": 0, "loss_rank_avg": 0.17346566915512085, "step": 3705, "valid_targets_mean": 5930.0, "valid_targets_min": 252 }, { "epoch": 5.917065390749602, "grad_norm": 0.4682379596121741, "learning_rate": 2.8543786802553943e-06, "loss": 0.152, "loss_nan_ranks": 0, "loss_rank_avg": 0.1504223793745041, "step": 3710, "valid_targets_mean": 4891.8, "valid_targets_min": 244 }, { "epoch": 5.925039872408293, "grad_norm": 0.5028889161289527, "learning_rate": 2.813566388406781e-06, "loss": 0.1594, "loss_nan_ranks": 0, "loss_rank_avg": 0.16947460174560547, "step": 3715, "valid_targets_mean": 5198.4, "valid_targets_min": 238 }, { "epoch": 5.9330143540669855, "grad_norm": 0.42820894853940544, "learning_rate": 2.773025884856957e-06, "loss": 0.1558, "loss_nan_ranks": 0, "loss_rank_avg": 0.14061594009399414, "step": 3720, "valid_targets_mean": 5816.4, "valid_targets_min": 469 }, { "epoch": 5.940988835725678, "grad_norm": 0.4664774104232858, "learning_rate": 2.7327578107182585e-06, "loss": 0.1464, "loss_nan_ranks": 0, "loss_rank_avg": 0.13510872423648834, "step": 3725, "valid_targets_mean": 5545.6, "valid_targets_min": 273 }, { "epoch": 5.94896331738437, "grad_norm": 0.5238401849218677, "learning_rate": 2.692762802794775e-06, "loss": 0.158, "loss_nan_ranks": 0, "loss_rank_avg": 0.16264596581459045, "step": 3730, "valid_targets_mean": 4376.4, "valid_targets_min": 230 }, { "epoch": 5.956937799043062, "grad_norm": 0.45087693055845296, "learning_rate": 2.6530414935723104e-06, "loss": 0.156, "loss_nan_ranks": 0, "loss_rank_avg": 0.1532100886106491, "step": 3735, "valid_targets_mean": 4878.6, "valid_targets_min": 259 }, { "epoch": 5.964912280701754, "grad_norm": 0.4438179509578052, "learning_rate": 2.6135945112083506e-06, "loss": 0.1464, "loss_nan_ranks": 0, "loss_rank_avg": 0.14241643249988556, "step": 3740, "valid_targets_mean": 4956.2, "valid_targets_min": 379 }, { "epoch": 5.972886762360447, "grad_norm": 0.5549037871035863, "learning_rate": 2.574422479522156e-06, "loss": 0.1524, "loss_nan_ranks": 0, "loss_rank_avg": 0.1596030294895172, "step": 3745, "valid_targets_mean": 4997.6, "valid_targets_min": 549 }, { "epoch": 5.980861244019139, "grad_norm": 0.5895868584381605, "learning_rate": 2.535526017984884e-06, "loss": 0.1604, "loss_nan_ranks": 0, "loss_rank_avg": 0.16880738735198975, "step": 3750, "valid_targets_mean": 3346.3, "valid_targets_min": 199 }, { "epoch": 5.988835725677831, "grad_norm": 0.5130364660857234, "learning_rate": 2.4969057417097807e-06, "loss": 0.1555, "loss_nan_ranks": 0, "loss_rank_avg": 0.15060560405254364, "step": 3755, "valid_targets_mean": 3963.4, "valid_targets_min": 314 }, { "epoch": 5.996810207336523, "grad_norm": 0.4976543721703397, "learning_rate": 2.458562261442483e-06, "loss": 0.1487, "loss_nan_ranks": 0, "loss_rank_avg": 0.13388743996620178, "step": 3760, "valid_targets_mean": 5151.2, "valid_targets_min": 245 }, { "epoch": 6.0047846889952154, "grad_norm": 0.44928966826086414, "learning_rate": 2.4204961835513263e-06, "loss": 0.1572, "loss_nan_ranks": 0, "loss_rank_avg": 0.16202214360237122, "step": 3765, "valid_targets_mean": 5942.7, "valid_targets_min": 388 }, { "epoch": 6.012759170653908, "grad_norm": 0.4062032075083199, "learning_rate": 2.3827081100177797e-06, "loss": 0.1532, "loss_nan_ranks": 0, "loss_rank_avg": 0.1397780179977417, "step": 3770, "valid_targets_mean": 6125.1, "valid_targets_min": 223 }, { "epoch": 6.020733652312599, "grad_norm": 0.44993434313584385, "learning_rate": 2.3451986384269266e-06, "loss": 0.1517, "loss_nan_ranks": 0, "loss_rank_avg": 0.1594015508890152, "step": 3775, "valid_targets_mean": 5130.2, "valid_targets_min": 269 }, { "epoch": 6.028708133971292, "grad_norm": 0.4875301922172514, "learning_rate": 2.307968361957993e-06, "loss": 0.1533, "loss_nan_ranks": 0, "loss_rank_avg": 0.14149093627929688, "step": 3780, "valid_targets_mean": 4876.2, "valid_targets_min": 404 }, { "epoch": 6.036682615629984, "grad_norm": 0.4629594770445272, "learning_rate": 2.2710178693749805e-06, "loss": 0.15, "loss_nan_ranks": 0, "loss_rank_avg": 0.16642490029335022, "step": 3785, "valid_targets_mean": 4987.9, "valid_targets_min": 254 }, { "epoch": 6.044657097288677, "grad_norm": 0.5166944673117188, "learning_rate": 2.2343477450173665e-06, "loss": 0.149, "loss_nan_ranks": 0, "loss_rank_avg": 0.17281094193458557, "step": 3790, "valid_targets_mean": 4621.1, "valid_targets_min": 215 }, { "epoch": 6.052631578947368, "grad_norm": 0.47068452452288745, "learning_rate": 2.197958568790839e-06, "loss": 0.1486, "loss_nan_ranks": 0, "loss_rank_avg": 0.15370580554008484, "step": 3795, "valid_targets_mean": 4905.4, "valid_targets_min": 912 }, { "epoch": 6.0606060606060606, "grad_norm": 0.4549056607289303, "learning_rate": 2.161850916158148e-06, "loss": 0.1492, "loss_nan_ranks": 0, "loss_rank_avg": 0.16554537415504456, "step": 3800, "valid_targets_mean": 5324.4, "valid_targets_min": 240 }, { "epoch": 6.068580542264753, "grad_norm": 0.4845167729156862, "learning_rate": 2.1260253581299996e-06, "loss": 0.1534, "loss_nan_ranks": 0, "loss_rank_avg": 0.14590927958488464, "step": 3805, "valid_targets_mean": 4456.4, "valid_targets_min": 545 }, { "epoch": 6.076555023923445, "grad_norm": 0.4653335767771134, "learning_rate": 2.0904824612560046e-06, "loss": 0.1508, "loss_nan_ranks": 0, "loss_rank_avg": 0.1586759090423584, "step": 3810, "valid_targets_mean": 4953.6, "valid_targets_min": 407 }, { "epoch": 6.084529505582137, "grad_norm": 0.48055135656708736, "learning_rate": 2.0552227876157536e-06, "loss": 0.1545, "loss_nan_ranks": 0, "loss_rank_avg": 0.13218027353286743, "step": 3815, "valid_targets_mean": 5003.9, "valid_targets_min": 205 }, { "epoch": 6.092503987240829, "grad_norm": 0.4867289410365764, "learning_rate": 2.020246894809912e-06, "loss": 0.1431, "loss_nan_ranks": 0, "loss_rank_avg": 0.14842218160629272, "step": 3820, "valid_targets_mean": 4870.1, "valid_targets_min": 223 }, { "epoch": 6.100478468899522, "grad_norm": 0.4788267536406092, "learning_rate": 1.9855553359513836e-06, "loss": 0.1476, "loss_nan_ranks": 0, "loss_rank_avg": 0.16526566445827484, "step": 3825, "valid_targets_mean": 4967.4, "valid_targets_min": 347 }, { "epoch": 6.108452950558214, "grad_norm": 0.44362145470110076, "learning_rate": 1.9511486596566054e-06, "loss": 0.1456, "loss_nan_ranks": 0, "loss_rank_avg": 0.13952435553073883, "step": 3830, "valid_targets_mean": 5323.2, "valid_targets_min": 732 }, { "epoch": 6.116427432216906, "grad_norm": 0.44421535025224507, "learning_rate": 1.917027410036825e-06, "loss": 0.1534, "loss_nan_ranks": 0, "loss_rank_avg": 0.15196619927883148, "step": 3835, "valid_targets_mean": 5453.3, "valid_targets_min": 680 }, { "epoch": 6.124401913875598, "grad_norm": 0.48619880208308525, "learning_rate": 1.8831921266895348e-06, "loss": 0.1531, "loss_nan_ranks": 0, "loss_rank_avg": 0.1549423336982727, "step": 3840, "valid_targets_mean": 4936.4, "valid_targets_min": 292 }, { "epoch": 6.1323763955342905, "grad_norm": 0.4933266469826171, "learning_rate": 1.8496433446899197e-06, "loss": 0.146, "loss_nan_ranks": 0, "loss_rank_avg": 0.14725814759731293, "step": 3845, "valid_targets_mean": 4630.4, "valid_targets_min": 371 }, { "epoch": 6.140350877192983, "grad_norm": 0.4355406021657482, "learning_rate": 1.8163815945823881e-06, "loss": 0.1407, "loss_nan_ranks": 0, "loss_rank_avg": 0.13551683723926544, "step": 3850, "valid_targets_mean": 6277.8, "valid_targets_min": 369 }, { "epoch": 6.148325358851674, "grad_norm": 0.44639648871243803, "learning_rate": 1.7834074023722082e-06, "loss": 0.1484, "loss_nan_ranks": 0, "loss_rank_avg": 0.13991107046604156, "step": 3855, "valid_targets_mean": 5152.2, "valid_targets_min": 231 }, { "epoch": 6.156299840510367, "grad_norm": 0.489541279190905, "learning_rate": 1.7507212895171632e-06, "loss": 0.1532, "loss_nan_ranks": 0, "loss_rank_avg": 0.15481799840927124, "step": 3860, "valid_targets_mean": 5027.0, "valid_targets_min": 318 }, { "epoch": 6.164274322169059, "grad_norm": 0.5049501309051616, "learning_rate": 1.7183237729193081e-06, "loss": 0.148, "loss_nan_ranks": 0, "loss_rank_avg": 0.16344068944454193, "step": 3865, "valid_targets_mean": 4705.1, "valid_targets_min": 444 }, { "epoch": 6.172248803827751, "grad_norm": 0.5079803335616084, "learning_rate": 1.6862153649168211e-06, "loss": 0.1471, "loss_nan_ranks": 0, "loss_rank_avg": 0.15662287175655365, "step": 3870, "valid_targets_mean": 4186.4, "valid_targets_min": 241 }, { "epoch": 6.180223285486443, "grad_norm": 0.5116936150655245, "learning_rate": 1.6543965732758737e-06, "loss": 0.1454, "loss_nan_ranks": 0, "loss_rank_avg": 0.1334778070449829, "step": 3875, "valid_targets_mean": 4322.1, "valid_targets_min": 326 }, { "epoch": 6.188197767145136, "grad_norm": 0.45160368109673826, "learning_rate": 1.6228679011826032e-06, "loss": 0.1491, "loss_nan_ranks": 0, "loss_rank_avg": 0.16378632187843323, "step": 3880, "valid_targets_mean": 5385.4, "valid_targets_min": 547 }, { "epoch": 6.196172248803828, "grad_norm": 0.4571770596267456, "learning_rate": 1.591629847235172e-06, "loss": 0.1476, "loss_nan_ranks": 0, "loss_rank_avg": 0.14328834414482117, "step": 3885, "valid_targets_mean": 5291.6, "valid_targets_min": 598 }, { "epoch": 6.2041467304625195, "grad_norm": 0.4692079789797092, "learning_rate": 1.5606829054358686e-06, "loss": 0.1419, "loss_nan_ranks": 0, "loss_rank_avg": 0.150887131690979, "step": 3890, "valid_targets_mean": 5435.4, "valid_targets_min": 1139 }, { "epoch": 6.212121212121212, "grad_norm": 0.426069274473679, "learning_rate": 1.5300275651832963e-06, "loss": 0.1517, "loss_nan_ranks": 0, "loss_rank_avg": 0.14551419019699097, "step": 3895, "valid_targets_mean": 6428.3, "valid_targets_min": 1623 }, { "epoch": 6.220095693779904, "grad_norm": 0.6045869058817608, "learning_rate": 1.499664311264648e-06, "loss": 0.1423, "loss_nan_ranks": 0, "loss_rank_avg": 0.14620190858840942, "step": 3900, "valid_targets_mean": 4127.7, "valid_targets_min": 252 }, { "epoch": 6.228070175438597, "grad_norm": 0.5782970704223566, "learning_rate": 1.4695936238480135e-06, "loss": 0.1515, "loss_nan_ranks": 0, "loss_rank_avg": 0.1496705263853073, "step": 3905, "valid_targets_mean": 3291.6, "valid_targets_min": 240 }, { "epoch": 6.236044657097288, "grad_norm": 0.47876040223726124, "learning_rate": 1.4398159784748144e-06, "loss": 0.1464, "loss_nan_ranks": 0, "loss_rank_avg": 0.15745174884796143, "step": 3910, "valid_targets_mean": 5079.1, "valid_targets_min": 266 }, { "epoch": 6.244019138755981, "grad_norm": 0.5126346829344415, "learning_rate": 1.4103318460522598e-06, "loss": 0.1527, "loss_nan_ranks": 0, "loss_rank_avg": 0.16566559672355652, "step": 3915, "valid_targets_mean": 4192.6, "valid_targets_min": 273 }, { "epoch": 6.251993620414673, "grad_norm": 0.5416124300618265, "learning_rate": 1.3811416928459177e-06, "loss": 0.1492, "loss_nan_ranks": 0, "loss_rank_avg": 0.15463967621326447, "step": 3920, "valid_targets_mean": 4478.5, "valid_targets_min": 272 }, { "epoch": 6.2599681020733655, "grad_norm": 0.4448108644678357, "learning_rate": 1.3522459804723353e-06, "loss": 0.1464, "loss_nan_ranks": 0, "loss_rank_avg": 0.1516856849193573, "step": 3925, "valid_targets_mean": 5685.1, "valid_targets_min": 711 }, { "epoch": 6.267942583732057, "grad_norm": 0.4289450178961959, "learning_rate": 1.3236451658917293e-06, "loss": 0.1466, "loss_nan_ranks": 0, "loss_rank_avg": 0.15075251460075378, "step": 3930, "valid_targets_mean": 5997.5, "valid_targets_min": 2915 }, { "epoch": 6.2759170653907494, "grad_norm": 0.46681109243000163, "learning_rate": 1.2953397014007728e-06, "loss": 0.1524, "loss_nan_ranks": 0, "loss_rank_avg": 0.14777758717536926, "step": 3935, "valid_targets_mean": 5023.1, "valid_targets_min": 390 }, { "epoch": 6.283891547049442, "grad_norm": 0.42835960080586744, "learning_rate": 1.2673300346254447e-06, "loss": 0.1415, "loss_nan_ranks": 0, "loss_rank_avg": 0.13789385557174683, "step": 3940, "valid_targets_mean": 5225.6, "valid_targets_min": 289 }, { "epoch": 6.291866028708134, "grad_norm": 0.5196426280217668, "learning_rate": 1.239616608513925e-06, "loss": 0.1535, "loss_nan_ranks": 0, "loss_rank_avg": 0.15100279450416565, "step": 3945, "valid_targets_mean": 4081.2, "valid_targets_min": 286 }, { "epoch": 6.299840510366826, "grad_norm": 0.5022813022318281, "learning_rate": 1.2121998613296259e-06, "loss": 0.1531, "loss_nan_ranks": 0, "loss_rank_avg": 0.14675407111644745, "step": 3950, "valid_targets_mean": 5395.9, "valid_targets_min": 412 }, { "epoch": 6.307814992025518, "grad_norm": 0.44890211526343465, "learning_rate": 1.1850802266442396e-06, "loss": 0.1531, "loss_nan_ranks": 0, "loss_rank_avg": 0.1509132981300354, "step": 3955, "valid_targets_mean": 5812.4, "valid_targets_min": 2642 }, { "epoch": 6.315789473684211, "grad_norm": 0.5061776876413504, "learning_rate": 1.1582581333308784e-06, "loss": 0.1557, "loss_nan_ranks": 0, "loss_rank_avg": 0.14476345479488373, "step": 3960, "valid_targets_mean": 4706.8, "valid_targets_min": 408 }, { "epoch": 6.323763955342903, "grad_norm": 0.5217658882608658, "learning_rate": 1.1317340055573122e-06, "loss": 0.144, "loss_nan_ranks": 0, "loss_rank_avg": 0.14775893092155457, "step": 3965, "valid_targets_mean": 3739.5, "valid_targets_min": 199 }, { "epoch": 6.3317384370015946, "grad_norm": 0.5118859450723333, "learning_rate": 1.1055082627792357e-06, "loss": 0.1483, "loss_nan_ranks": 0, "loss_rank_avg": 0.16105467081069946, "step": 3970, "valid_targets_mean": 4756.9, "valid_targets_min": 293 }, { "epoch": 6.339712918660287, "grad_norm": 0.5054678322271705, "learning_rate": 1.0795813197336602e-06, "loss": 0.1506, "loss_nan_ranks": 0, "loss_rank_avg": 0.12841784954071045, "step": 3975, "valid_targets_mean": 4324.1, "valid_targets_min": 251 }, { "epoch": 6.347687400318979, "grad_norm": 0.5102069371772863, "learning_rate": 1.0539535864323391e-06, "loss": 0.1466, "loss_nan_ranks": 0, "loss_rank_avg": 0.164170041680336, "step": 3980, "valid_targets_mean": 4642.5, "valid_targets_min": 212 }, { "epoch": 6.355661881977672, "grad_norm": 0.47695267618075876, "learning_rate": 1.0286254681552777e-06, "loss": 0.1519, "loss_nan_ranks": 0, "loss_rank_avg": 0.15313708782196045, "step": 3985, "valid_targets_mean": 5626.9, "valid_targets_min": 273 }, { "epoch": 6.363636363636363, "grad_norm": 0.43091234410044393, "learning_rate": 1.0035973654443466e-06, "loss": 0.1469, "loss_nan_ranks": 0, "loss_rank_avg": 0.15081724524497986, "step": 3990, "valid_targets_mean": 5959.9, "valid_targets_min": 284 }, { "epoch": 6.371610845295056, "grad_norm": 0.5340840931679183, "learning_rate": 9.788696740969295e-07, "loss": 0.1516, "loss_nan_ranks": 0, "loss_rank_avg": 0.14918410778045654, "step": 3995, "valid_targets_mean": 4531.4, "valid_targets_min": 1210 }, { "epoch": 6.379585326953748, "grad_norm": 0.4247409219481503, "learning_rate": 9.544427851596661e-07, "loss": 0.1501, "loss_nan_ranks": 0, "loss_rank_avg": 0.14433777332305908, "step": 4000, "valid_targets_mean": 6152.6, "valid_targets_min": 241 }, { "epoch": 6.3875598086124405, "grad_norm": 0.4895024880775478, "learning_rate": 9.303170849222764e-07, "loss": 0.1469, "loss_nan_ranks": 0, "loss_rank_avg": 0.1440003663301468, "step": 4005, "valid_targets_mean": 4668.4, "valid_targets_min": 300 }, { "epoch": 6.395534290271132, "grad_norm": 0.429988312127633, "learning_rate": 9.064929549114421e-07, "loss": 0.161, "loss_nan_ranks": 0, "loss_rank_avg": 0.1483185589313507, "step": 4010, "valid_targets_mean": 6485.9, "valid_targets_min": 3764 }, { "epoch": 6.4035087719298245, "grad_norm": 0.46137829910478273, "learning_rate": 8.829707718847835e-07, "loss": 0.1584, "loss_nan_ranks": 0, "loss_rank_avg": 0.15009953081607819, "step": 4015, "valid_targets_mean": 5219.5, "valid_targets_min": 341 }, { "epoch": 6.411483253588517, "grad_norm": 0.47612714642052334, "learning_rate": 8.597509078248923e-07, "loss": 0.1408, "loss_nan_ranks": 0, "loss_rank_avg": 0.14877188205718994, "step": 4020, "valid_targets_mean": 5458.4, "valid_targets_min": 263 }, { "epoch": 6.419457735247209, "grad_norm": 0.4790590020325636, "learning_rate": 8.368337299334461e-07, "loss": 0.1494, "loss_nan_ranks": 0, "loss_rank_avg": 0.14202189445495605, "step": 4025, "valid_targets_mean": 4610.4, "valid_targets_min": 221 }, { "epoch": 6.427432216905901, "grad_norm": 0.43486828774128805, "learning_rate": 8.142196006254144e-07, "loss": 0.1528, "loss_nan_ranks": 0, "loss_rank_avg": 0.14796648919582367, "step": 4030, "valid_targets_mean": 5326.4, "valid_targets_min": 357 }, { "epoch": 6.435406698564593, "grad_norm": 0.4703735281341048, "learning_rate": 7.919088775233264e-07, "loss": 0.1494, "loss_nan_ranks": 0, "loss_rank_avg": 0.155422180891037, "step": 4035, "valid_targets_mean": 5504.8, "valid_targets_min": 220 }, { "epoch": 6.443381180223286, "grad_norm": 0.535947939565035, "learning_rate": 7.699019134515917e-07, "loss": 0.1526, "loss_nan_ranks": 0, "loss_rank_avg": 0.15502360463142395, "step": 4040, "valid_targets_mean": 4319.9, "valid_targets_min": 285 }, { "epoch": 6.451355661881978, "grad_norm": 0.4818703555632311, "learning_rate": 7.48199056430956e-07, "loss": 0.1559, "loss_nan_ranks": 0, "loss_rank_avg": 0.1630256175994873, "step": 4045, "valid_targets_mean": 5285.6, "valid_targets_min": 208 }, { "epoch": 6.45933014354067, "grad_norm": 0.5035873377823161, "learning_rate": 7.268006496729762e-07, "loss": 0.1496, "loss_nan_ranks": 0, "loss_rank_avg": 0.15067459642887115, "step": 4050, "valid_targets_mean": 5337.9, "valid_targets_min": 174 }, { "epoch": 6.467304625199362, "grad_norm": 0.502747428173728, "learning_rate": 7.057070315745851e-07, "loss": 0.1486, "loss_nan_ranks": 0, "loss_rank_avg": 0.1535114347934723, "step": 4055, "valid_targets_mean": 4404.4, "valid_targets_min": 201 }, { "epoch": 6.475279106858054, "grad_norm": 0.4016268682691944, "learning_rate": 6.849185357127686e-07, "loss": 0.1524, "loss_nan_ranks": 0, "loss_rank_avg": 0.1472223699092865, "step": 4060, "valid_targets_mean": 5625.4, "valid_targets_min": 252 }, { "epoch": 6.483253588516747, "grad_norm": 0.500867474532203, "learning_rate": 6.64435490839257e-07, "loss": 0.1468, "loss_nan_ranks": 0, "loss_rank_avg": 0.15104928612709045, "step": 4065, "valid_targets_mean": 5525.7, "valid_targets_min": 233 }, { "epoch": 6.491228070175438, "grad_norm": 0.4376815836110299, "learning_rate": 6.442582208753578e-07, "loss": 0.1541, "loss_nan_ranks": 0, "loss_rank_avg": 0.15212634205818176, "step": 4070, "valid_targets_mean": 6167.4, "valid_targets_min": 372 }, { "epoch": 6.499202551834131, "grad_norm": 0.4925011711593379, "learning_rate": 6.243870449068068e-07, "loss": 0.1485, "loss_nan_ranks": 0, "loss_rank_avg": 0.13938778638839722, "step": 4075, "valid_targets_mean": 4858.9, "valid_targets_min": 293 }, { "epoch": 6.507177033492823, "grad_norm": 0.5028373020409859, "learning_rate": 6.048222771787382e-07, "loss": 0.1514, "loss_nan_ranks": 0, "loss_rank_avg": 0.14744833111763, "step": 4080, "valid_targets_mean": 4449.3, "valid_targets_min": 285 }, { "epoch": 6.515151515151516, "grad_norm": 0.4451538888037021, "learning_rate": 5.85564227090707e-07, "loss": 0.1558, "loss_nan_ranks": 0, "loss_rank_avg": 0.15033164620399475, "step": 4085, "valid_targets_mean": 5139.9, "valid_targets_min": 227 }, { "epoch": 6.523125996810207, "grad_norm": 0.49448838566482495, "learning_rate": 5.666131991917989e-07, "loss": 0.1485, "loss_nan_ranks": 0, "loss_rank_avg": 0.14017827808856964, "step": 4090, "valid_targets_mean": 5041.9, "valid_targets_min": 233 }, { "epoch": 6.5311004784688995, "grad_norm": 0.5416350180533349, "learning_rate": 5.479694931758194e-07, "loss": 0.1503, "loss_nan_ranks": 0, "loss_rank_avg": 0.1785852611064911, "step": 4095, "valid_targets_mean": 5573.2, "valid_targets_min": 437 }, { "epoch": 6.539074960127592, "grad_norm": 0.5628948990040651, "learning_rate": 5.296334038765483e-07, "loss": 0.1567, "loss_nan_ranks": 0, "loss_rank_avg": 0.1577194631099701, "step": 4100, "valid_targets_mean": 4427.6, "valid_targets_min": 477 }, { "epoch": 6.5470494417862835, "grad_norm": 0.48315562844847276, "learning_rate": 5.116052212630696e-07, "loss": 0.1493, "loss_nan_ranks": 0, "loss_rank_avg": 0.14190314710140228, "step": 4105, "valid_targets_mean": 4638.1, "valid_targets_min": 238 }, { "epoch": 6.555023923444976, "grad_norm": 0.4649105580146512, "learning_rate": 4.938852304352026e-07, "loss": 0.1542, "loss_nan_ranks": 0, "loss_rank_avg": 0.1748298704624176, "step": 4110, "valid_targets_mean": 6575.4, "valid_targets_min": 783 }, { "epoch": 6.562998405103668, "grad_norm": 0.4586563960264318, "learning_rate": 4.7647371161898547e-07, "loss": 0.1491, "loss_nan_ranks": 0, "loss_rank_avg": 0.14360040426254272, "step": 4115, "valid_targets_mean": 5360.1, "valid_targets_min": 332 }, { "epoch": 6.570972886762361, "grad_norm": 0.45085707891473675, "learning_rate": 4.593709401622359e-07, "loss": 0.1556, "loss_nan_ranks": 0, "loss_rank_avg": 0.1483638733625412, "step": 4120, "valid_targets_mean": 5548.3, "valid_targets_min": 283 }, { "epoch": 6.578947368421053, "grad_norm": 0.46458186030605464, "learning_rate": 4.425771865302153e-07, "loss": 0.1394, "loss_nan_ranks": 0, "loss_rank_avg": 0.13930150866508484, "step": 4125, "valid_targets_mean": 5190.6, "valid_targets_min": 350 }, { "epoch": 6.586921850079745, "grad_norm": 0.43541944344062583, "learning_rate": 4.2609271630133174e-07, "loss": 0.1569, "loss_nan_ranks": 0, "loss_rank_avg": 0.1533948928117752, "step": 4130, "valid_targets_mean": 5871.0, "valid_targets_min": 231 }, { "epoch": 6.594896331738437, "grad_norm": 0.5031511197247889, "learning_rate": 4.099177901629525e-07, "loss": 0.1611, "loss_nan_ranks": 0, "loss_rank_avg": 0.139293372631073, "step": 4135, "valid_targets_mean": 3976.4, "valid_targets_min": 185 }, { "epoch": 6.6028708133971294, "grad_norm": 0.5019363115194629, "learning_rate": 3.9405266390727836e-07, "loss": 0.1515, "loss_nan_ranks": 0, "loss_rank_avg": 0.16090963780879974, "step": 4140, "valid_targets_mean": 5086.2, "valid_targets_min": 195 }, { "epoch": 6.610845295055821, "grad_norm": 0.4844497814826883, "learning_rate": 3.7849758842729344e-07, "loss": 0.1531, "loss_nan_ranks": 0, "loss_rank_avg": 0.16627800464630127, "step": 4145, "valid_targets_mean": 5407.1, "valid_targets_min": 199 }, { "epoch": 6.618819776714513, "grad_norm": 0.4591731715598886, "learning_rate": 3.632528097128085e-07, "loss": 0.1521, "loss_nan_ranks": 0, "loss_rank_avg": 0.14857414364814758, "step": 4150, "valid_targets_mean": 5256.8, "valid_targets_min": 229 }, { "epoch": 6.626794258373206, "grad_norm": 0.5202929604535261, "learning_rate": 3.48318568846564e-07, "loss": 0.1494, "loss_nan_ranks": 0, "loss_rank_avg": 0.1455889195203781, "step": 4155, "valid_targets_mean": 4872.8, "valid_targets_min": 247 }, { "epoch": 6.634768740031898, "grad_norm": 0.4705904446828977, "learning_rate": 3.336951020004087e-07, "loss": 0.1433, "loss_nan_ranks": 0, "loss_rank_avg": 0.14285165071487427, "step": 4160, "valid_targets_mean": 5109.5, "valid_targets_min": 200 }, { "epoch": 6.64274322169059, "grad_norm": 0.45577635857265425, "learning_rate": 3.1938264043158694e-07, "loss": 0.1504, "loss_nan_ranks": 0, "loss_rank_avg": 0.13021527230739594, "step": 4165, "valid_targets_mean": 4774.4, "valid_targets_min": 435 }, { "epoch": 6.650717703349282, "grad_norm": 0.4486128504903437, "learning_rate": 3.05381410479062e-07, "loss": 0.1398, "loss_nan_ranks": 0, "loss_rank_avg": 0.1472494751214981, "step": 4170, "valid_targets_mean": 5558.4, "valid_targets_min": 536 }, { "epoch": 6.6586921850079746, "grad_norm": 0.4535891529882187, "learning_rate": 2.916916335599407e-07, "loss": 0.1479, "loss_nan_ranks": 0, "loss_rank_avg": 0.1309969127178192, "step": 4175, "valid_targets_mean": 5063.6, "valid_targets_min": 443 }, { "epoch": 6.666666666666667, "grad_norm": 0.5137615372694194, "learning_rate": 2.783135261659831e-07, "loss": 0.1438, "loss_nan_ranks": 0, "loss_rank_avg": 0.131601944565773, "step": 4180, "valid_targets_mean": 4253.1, "valid_targets_min": 180 }, { "epoch": 6.6746411483253585, "grad_norm": 0.4956512141213648, "learning_rate": 2.6524729986016293e-07, "loss": 0.1581, "loss_nan_ranks": 0, "loss_rank_avg": 0.1345309317111969, "step": 4185, "valid_targets_mean": 4681.8, "valid_targets_min": 370 }, { "epoch": 6.682615629984051, "grad_norm": 0.4322804982850078, "learning_rate": 2.524931612733328e-07, "loss": 0.1503, "loss_nan_ranks": 0, "loss_rank_avg": 0.1334218680858612, "step": 4190, "valid_targets_mean": 5158.1, "valid_targets_min": 1221 }, { "epoch": 6.690590111642743, "grad_norm": 0.5524770921264247, "learning_rate": 2.400513121009529e-07, "loss": 0.1473, "loss_nan_ranks": 0, "loss_rank_avg": 0.13881897926330566, "step": 4195, "valid_targets_mean": 5170.0, "valid_targets_min": 217 }, { "epoch": 6.698564593301436, "grad_norm": 0.4416808616196191, "learning_rate": 2.279219490998985e-07, "loss": 0.1484, "loss_nan_ranks": 0, "loss_rank_avg": 0.14825358986854553, "step": 4200, "valid_targets_mean": 5345.4, "valid_targets_min": 192 }, { "epoch": 6.706539074960127, "grad_norm": 0.41557160123119896, "learning_rate": 2.161052640853578e-07, "loss": 0.1471, "loss_nan_ranks": 0, "loss_rank_avg": 0.15103837847709656, "step": 4205, "valid_targets_mean": 6218.0, "valid_targets_min": 3267 }, { "epoch": 6.71451355661882, "grad_norm": 0.4665005539147527, "learning_rate": 2.0460144392778768e-07, "loss": 0.1423, "loss_nan_ranks": 0, "loss_rank_avg": 0.14628729224205017, "step": 4210, "valid_targets_mean": 5114.4, "valid_targets_min": 184 }, { "epoch": 6.722488038277512, "grad_norm": 0.41678070100960785, "learning_rate": 1.9341067054996277e-07, "loss": 0.1538, "loss_nan_ranks": 0, "loss_rank_avg": 0.13423167169094086, "step": 4215, "valid_targets_mean": 6462.1, "valid_targets_min": 707 }, { "epoch": 6.7304625199362045, "grad_norm": 0.5329553956676955, "learning_rate": 1.8253312092409992e-07, "loss": 0.1441, "loss_nan_ranks": 0, "loss_rank_avg": 0.16593559086322784, "step": 4220, "valid_targets_mean": 4739.5, "valid_targets_min": 458 }, { "epoch": 6.738437001594896, "grad_norm": 0.4077664732039775, "learning_rate": 1.7196896706906273e-07, "loss": 0.1493, "loss_nan_ranks": 0, "loss_rank_avg": 0.14922519028186798, "step": 4225, "valid_targets_mean": 6259.2, "valid_targets_min": 1201 }, { "epoch": 6.746411483253588, "grad_norm": 0.4572419979041358, "learning_rate": 1.6171837604762597e-07, "loss": 0.142, "loss_nan_ranks": 0, "loss_rank_avg": 0.14641094207763672, "step": 4230, "valid_targets_mean": 5254.2, "valid_targets_min": 598 }, { "epoch": 6.754385964912281, "grad_norm": 0.494702420453681, "learning_rate": 1.5178150996385755e-07, "loss": 0.1516, "loss_nan_ranks": 0, "loss_rank_avg": 0.1475975215435028, "step": 4235, "valid_targets_mean": 4546.5, "valid_targets_min": 232 }, { "epoch": 6.762360446570973, "grad_norm": 0.4796385200530194, "learning_rate": 1.421585259605318e-07, "loss": 0.1478, "loss_nan_ranks": 0, "loss_rank_avg": 0.1568702608346939, "step": 4240, "valid_targets_mean": 5172.8, "valid_targets_min": 260 }, { "epoch": 6.770334928229665, "grad_norm": 0.43075191213287334, "learning_rate": 1.3284957621666039e-07, "loss": 0.1412, "loss_nan_ranks": 0, "loss_rank_avg": 0.14368301630020142, "step": 4245, "valid_targets_mean": 5836.8, "valid_targets_min": 1704 }, { "epoch": 6.778309409888357, "grad_norm": 0.4851600090501543, "learning_rate": 1.2385480794507853e-07, "loss": 0.1531, "loss_nan_ranks": 0, "loss_rank_avg": 0.13613252341747284, "step": 4250, "valid_targets_mean": 5194.1, "valid_targets_min": 224 }, { "epoch": 6.78628389154705, "grad_norm": 0.49076420450563607, "learning_rate": 1.1517436339011589e-07, "loss": 0.1597, "loss_nan_ranks": 0, "loss_rank_avg": 0.1567186713218689, "step": 4255, "valid_targets_mean": 4560.8, "valid_targets_min": 306 }, { "epoch": 6.794258373205742, "grad_norm": 0.481268750942527, "learning_rate": 1.0680837982535607e-07, "loss": 0.1517, "loss_nan_ranks": 0, "loss_rank_avg": 0.13878720998764038, "step": 4260, "valid_targets_mean": 5214.8, "valid_targets_min": 247 }, { "epoch": 6.8022328548644335, "grad_norm": 0.525692133957443, "learning_rate": 9.875698955145174e-08, "loss": 0.1463, "loss_nan_ranks": 0, "loss_rank_avg": 0.12678062915802002, "step": 4265, "valid_targets_mean": 4339.8, "valid_targets_min": 242 }, { "epoch": 6.810207336523126, "grad_norm": 0.42621079495304015, "learning_rate": 9.102031989404403e-08, "loss": 0.1599, "loss_nan_ranks": 0, "loss_rank_avg": 0.1495763659477234, "step": 4270, "valid_targets_mean": 5675.7, "valid_targets_min": 642 }, { "epoch": 6.818181818181818, "grad_norm": 0.4580655646450462, "learning_rate": 8.359849320174196e-08, "loss": 0.1499, "loss_nan_ranks": 0, "loss_rank_avg": 0.15296252071857452, "step": 4275, "valid_targets_mean": 5290.6, "valid_targets_min": 261 }, { "epoch": 6.826156299840511, "grad_norm": 0.424793015484167, "learning_rate": 7.649162684419731e-08, "loss": 0.1459, "loss_nan_ranks": 0, "loss_rank_avg": 0.1285790205001831, "step": 4280, "valid_targets_mean": 5851.7, "valid_targets_min": 997 }, { "epoch": 6.834130781499202, "grad_norm": 0.6009179207598535, "learning_rate": 6.969983321023499e-08, "loss": 0.1455, "loss_nan_ranks": 0, "loss_rank_avg": 0.15977022051811218, "step": 4285, "valid_targets_mean": 4550.5, "valid_targets_min": 446 }, { "epoch": 6.842105263157895, "grad_norm": 0.43101483729428003, "learning_rate": 6.322321970608337e-08, "loss": 0.1429, "loss_nan_ranks": 0, "loss_rank_avg": 0.13828077912330627, "step": 4290, "valid_targets_mean": 6386.3, "valid_targets_min": 205 }, { "epoch": 6.850079744816587, "grad_norm": 0.4465415769876545, "learning_rate": 5.7061888753677796e-08, "loss": 0.1473, "loss_nan_ranks": 0, "loss_rank_avg": 0.1383409947156906, "step": 4295, "valid_targets_mean": 5717.8, "valid_targets_min": 262 }, { "epoch": 6.858054226475279, "grad_norm": 0.5473085555335196, "learning_rate": 5.121593778903755e-08, "loss": 0.1451, "loss_nan_ranks": 0, "loss_rank_avg": 0.14721372723579407, "step": 4300, "valid_targets_mean": 4142.8, "valid_targets_min": 239 }, { "epoch": 6.866028708133971, "grad_norm": 0.4853378564035753, "learning_rate": 4.5685459260722544e-08, "loss": 0.1539, "loss_nan_ranks": 0, "loss_rank_avg": 0.15751667320728302, "step": 4305, "valid_targets_mean": 5418.1, "valid_targets_min": 238 }, { "epoch": 6.8740031897926634, "grad_norm": 0.4931042806071698, "learning_rate": 4.047054062837452e-08, "loss": 0.1523, "loss_nan_ranks": 0, "loss_rank_avg": 0.14012879133224487, "step": 4310, "valid_targets_mean": 4697.9, "valid_targets_min": 230 }, { "epoch": 6.881977671451356, "grad_norm": 0.8971037686738282, "learning_rate": 3.55712643613404e-08, "loss": 0.1549, "loss_nan_ranks": 0, "loss_rank_avg": 0.15433238446712494, "step": 4315, "valid_targets_mean": 4864.7, "valid_targets_min": 205 }, { "epoch": 6.889952153110048, "grad_norm": 0.4692472893763074, "learning_rate": 3.0987707937351066e-08, "loss": 0.1539, "loss_nan_ranks": 0, "loss_rank_avg": 0.1405605673789978, "step": 4320, "valid_targets_mean": 4847.9, "valid_targets_min": 302 }, { "epoch": 6.89792663476874, "grad_norm": 0.47088407985998104, "learning_rate": 2.6719943841311268e-08, "loss": 0.1397, "loss_nan_ranks": 0, "loss_rank_avg": 0.14168399572372437, "step": 4325, "valid_targets_mean": 4563.3, "valid_targets_min": 186 }, { "epoch": 6.905901116427432, "grad_norm": 0.4156838063505349, "learning_rate": 2.2768039564151635e-08, "loss": 0.1483, "loss_nan_ranks": 0, "loss_rank_avg": 0.1466359794139862, "step": 4330, "valid_targets_mean": 6131.1, "valid_targets_min": 222 }, { "epoch": 6.913875598086125, "grad_norm": 0.45459420575813153, "learning_rate": 1.913205760175174e-08, "loss": 0.1477, "loss_nan_ranks": 0, "loss_rank_avg": 0.1472633183002472, "step": 4335, "valid_targets_mean": 5499.1, "valid_targets_min": 918 }, { "epoch": 6.921850079744816, "grad_norm": 0.5393281054744222, "learning_rate": 1.5812055453963136e-08, "loss": 0.1507, "loss_nan_ranks": 0, "loss_rank_avg": 0.1455461084842682, "step": 4340, "valid_targets_mean": 4090.8, "valid_targets_min": 223 }, { "epoch": 6.9298245614035086, "grad_norm": 0.4636075944477561, "learning_rate": 1.280808562369229e-08, "loss": 0.1462, "loss_nan_ranks": 0, "loss_rank_avg": 0.15545576810836792, "step": 4345, "valid_targets_mean": 5444.2, "valid_targets_min": 306 }, { "epoch": 6.937799043062201, "grad_norm": 0.4669452035057073, "learning_rate": 1.01201956160768e-08, "loss": 0.1512, "loss_nan_ranks": 0, "loss_rank_avg": 0.16182288527488708, "step": 4350, "valid_targets_mean": 5502.8, "valid_targets_min": 237 }, { "epoch": 6.945773524720893, "grad_norm": 0.5151990228437675, "learning_rate": 7.74842793772601e-09, "loss": 0.1502, "loss_nan_ranks": 0, "loss_rank_avg": 0.16319866478443146, "step": 4355, "valid_targets_mean": 4926.0, "valid_targets_min": 294 }, { "epoch": 6.953748006379586, "grad_norm": 0.4990613508241575, "learning_rate": 5.692820096054874e-09, "loss": 0.1568, "loss_nan_ranks": 0, "loss_rank_avg": 0.18269044160842896, "step": 4360, "valid_targets_mean": 5456.6, "valid_targets_min": 353 }, { "epoch": 6.961722488038277, "grad_norm": 0.4688789910525006, "learning_rate": 3.9534045986888706e-09, "loss": 0.144, "loss_nan_ranks": 0, "loss_rank_avg": 0.1274082511663437, "step": 4365, "valid_targets_mean": 4650.2, "valid_targets_min": 253 }, { "epoch": 6.96969696969697, "grad_norm": 0.47324806337291064, "learning_rate": 2.530208952953306e-09, "loss": 0.1482, "loss_nan_ranks": 0, "loss_rank_avg": 0.16023960709571838, "step": 4370, "valid_targets_mean": 5175.2, "valid_targets_min": 188 }, { "epoch": 6.977671451355662, "grad_norm": 0.5245943580661637, "learning_rate": 1.4232556654314445e-09, "loss": 0.1481, "loss_nan_ranks": 0, "loss_rank_avg": 0.14867472648620605, "step": 4375, "valid_targets_mean": 4396.8, "valid_targets_min": 217 }, { "epoch": 6.985645933014354, "grad_norm": 0.49879412018200225, "learning_rate": 6.325622416136767e-10, "loss": 0.1505, "loss_nan_ranks": 0, "loss_rank_avg": 0.16116350889205933, "step": 4380, "valid_targets_mean": 5194.9, "valid_targets_min": 606 }, { "epoch": 6.993620414673046, "grad_norm": 0.5977785482250375, "learning_rate": 1.581411856199644e-10, "loss": 0.1541, "loss_nan_ranks": 0, "loss_rank_avg": 0.16265273094177246, "step": 4385, "valid_targets_mean": 4349.9, "valid_targets_min": 237 }, { "epoch": 7.0, "loss_nan_ranks": 0, "loss_rank_avg": 0.1386960744857788, "step": 4389, "total_flos": 1630450968166400.0, "train_loss": 0.1932186623672386, "train_runtime": 23240.6244, "train_samples_per_second": 3.017, "train_steps_per_second": 0.189, "valid_targets_mean": 4301.4, "valid_targets_min": 221 } ], "logging_steps": 5, "max_steps": 4389, "num_input_tokens_seen": 0, "num_train_epochs": 7, "save_steps": 1500, "stateful_callbacks": { "TrainerControl": { "args": { "should_epoch_stop": false, "should_evaluate": false, "should_log": false, "should_save": true, "should_training_stop": true }, "attributes": {} } }, "total_flos": 1630450968166400.0, "train_batch_size": 1, "trial_name": null, "trial_params": null }