{ "best_global_step": null, "best_metric": null, "best_model_checkpoint": null, "epoch": 7.0, "eval_steps": 500, "global_step": 4333, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.008077544426494346, "grad_norm": 17.94031922937094, "learning_rate": 3.686635944700461e-07, "loss": 0.6301, "loss_nan_ranks": 0, "loss_rank_avg": 0.6101559400558472, "step": 5, "valid_targets_mean": 5131.6, "valid_targets_min": 2456 }, { "epoch": 0.01615508885298869, "grad_norm": 18.031251271375503, "learning_rate": 8.294930875576038e-07, "loss": 0.6434, "loss_nan_ranks": 0, "loss_rank_avg": 0.6626201868057251, "step": 10, "valid_targets_mean": 4924.7, "valid_targets_min": 2511 }, { "epoch": 0.024232633279483037, "grad_norm": 15.80671655943195, "learning_rate": 1.2903225806451614e-06, "loss": 0.5987, "loss_nan_ranks": 0, "loss_rank_avg": 0.6084240078926086, "step": 15, "valid_targets_mean": 5216.2, "valid_targets_min": 2840 }, { "epoch": 0.03231017770597738, "grad_norm": 12.200268087793992, "learning_rate": 1.751152073732719e-06, "loss": 0.5488, "loss_nan_ranks": 0, "loss_rank_avg": 0.5271545052528381, "step": 20, "valid_targets_mean": 5782.9, "valid_targets_min": 3261 }, { "epoch": 0.04038772213247173, "grad_norm": 7.84942309438541, "learning_rate": 2.211981566820277e-06, "loss": 0.5143, "loss_nan_ranks": 0, "loss_rank_avg": 0.48371779918670654, "step": 25, "valid_targets_mean": 5333.9, "valid_targets_min": 3236 }, { "epoch": 0.048465266558966075, "grad_norm": 4.200322718651227, "learning_rate": 2.6728110599078343e-06, "loss": 0.4757, "loss_nan_ranks": 0, "loss_rank_avg": 0.444708913564682, "step": 30, "valid_targets_mean": 5335.8, "valid_targets_min": 3982 }, { "epoch": 0.05654281098546042, "grad_norm": 2.5697926973071, "learning_rate": 3.1336405529953917e-06, "loss": 0.4407, "loss_nan_ranks": 0, "loss_rank_avg": 0.4613327383995056, "step": 35, "valid_targets_mean": 5051.0, "valid_targets_min": 3053 }, { "epoch": 0.06462035541195477, "grad_norm": 1.2615763319708777, "learning_rate": 3.5944700460829495e-06, "loss": 0.412, "loss_nan_ranks": 0, "loss_rank_avg": 0.38105225563049316, "step": 40, "valid_targets_mean": 6270.6, "valid_targets_min": 4347 }, { "epoch": 0.07269789983844911, "grad_norm": 1.2005219937697187, "learning_rate": 4.055299539170508e-06, "loss": 0.3991, "loss_nan_ranks": 0, "loss_rank_avg": 0.3904378414154053, "step": 45, "valid_targets_mean": 4399.7, "valid_targets_min": 773 }, { "epoch": 0.08077544426494346, "grad_norm": 0.8711539509364695, "learning_rate": 4.516129032258065e-06, "loss": 0.3806, "loss_nan_ranks": 0, "loss_rank_avg": 0.3860582709312439, "step": 50, "valid_targets_mean": 5580.8, "valid_targets_min": 2625 }, { "epoch": 0.0888529886914378, "grad_norm": 0.7806846326439755, "learning_rate": 4.976958525345623e-06, "loss": 0.3699, "loss_nan_ranks": 0, "loss_rank_avg": 0.3754419684410095, "step": 55, "valid_targets_mean": 5052.6, "valid_targets_min": 915 }, { "epoch": 0.09693053311793215, "grad_norm": 0.6803342618147262, "learning_rate": 5.43778801843318e-06, "loss": 0.3472, "loss_nan_ranks": 0, "loss_rank_avg": 0.3440122604370117, "step": 60, "valid_targets_mean": 4892.2, "valid_targets_min": 1595 }, { "epoch": 0.1050080775444265, "grad_norm": 0.5873054899995456, "learning_rate": 5.8986175115207375e-06, "loss": 0.3444, "loss_nan_ranks": 0, "loss_rank_avg": 0.3376592993736267, "step": 65, "valid_targets_mean": 5686.4, "valid_targets_min": 3311 }, { "epoch": 0.11308562197092084, "grad_norm": 0.5812104869467237, "learning_rate": 6.359447004608295e-06, "loss": 0.3351, "loss_nan_ranks": 0, "loss_rank_avg": 0.32878339290618896, "step": 70, "valid_targets_mean": 5069.1, "valid_targets_min": 2942 }, { "epoch": 0.12116316639741519, "grad_norm": 0.6110766171265148, "learning_rate": 6.820276497695853e-06, "loss": 0.3314, "loss_nan_ranks": 0, "loss_rank_avg": 0.32319021224975586, "step": 75, "valid_targets_mean": 5218.8, "valid_targets_min": 3039 }, { "epoch": 0.12924071082390953, "grad_norm": 0.5275806578865466, "learning_rate": 7.28110599078341e-06, "loss": 0.3181, "loss_nan_ranks": 0, "loss_rank_avg": 0.2842397391796112, "step": 80, "valid_targets_mean": 5314.7, "valid_targets_min": 936 }, { "epoch": 0.13731825525040386, "grad_norm": 0.5043499827664671, "learning_rate": 7.741935483870968e-06, "loss": 0.3135, "loss_nan_ranks": 0, "loss_rank_avg": 0.29710888862609863, "step": 85, "valid_targets_mean": 5840.7, "valid_targets_min": 3092 }, { "epoch": 0.14539579967689822, "grad_norm": 0.46665023880464535, "learning_rate": 8.202764976958527e-06, "loss": 0.3041, "loss_nan_ranks": 0, "loss_rank_avg": 0.30811554193496704, "step": 90, "valid_targets_mean": 5763.2, "valid_targets_min": 2093 }, { "epoch": 0.15347334410339256, "grad_norm": 0.479007494945398, "learning_rate": 8.663594470046084e-06, "loss": 0.2898, "loss_nan_ranks": 0, "loss_rank_avg": 0.27862054109573364, "step": 95, "valid_targets_mean": 5151.4, "valid_targets_min": 3499 }, { "epoch": 0.16155088852988692, "grad_norm": 0.46977805962833913, "learning_rate": 9.124423963133642e-06, "loss": 0.2857, "loss_nan_ranks": 0, "loss_rank_avg": 0.27801576256752014, "step": 100, "valid_targets_mean": 5621.1, "valid_targets_min": 2984 }, { "epoch": 0.16962843295638125, "grad_norm": 0.5413430637817005, "learning_rate": 9.5852534562212e-06, "loss": 0.2824, "loss_nan_ranks": 0, "loss_rank_avg": 0.27780991792678833, "step": 105, "valid_targets_mean": 5530.5, "valid_targets_min": 3262 }, { "epoch": 0.1777059773828756, "grad_norm": 0.4854713237809568, "learning_rate": 1.0046082949308758e-05, "loss": 0.2841, "loss_nan_ranks": 0, "loss_rank_avg": 0.29190337657928467, "step": 110, "valid_targets_mean": 5010.4, "valid_targets_min": 2172 }, { "epoch": 0.18578352180936994, "grad_norm": 0.43214061276729393, "learning_rate": 1.0506912442396313e-05, "loss": 0.2842, "loss_nan_ranks": 0, "loss_rank_avg": 0.2443092167377472, "step": 115, "valid_targets_mean": 5622.8, "valid_targets_min": 2807 }, { "epoch": 0.1938610662358643, "grad_norm": 0.4667686489049157, "learning_rate": 1.096774193548387e-05, "loss": 0.2985, "loss_nan_ranks": 0, "loss_rank_avg": 0.29900214076042175, "step": 120, "valid_targets_mean": 5740.0, "valid_targets_min": 2342 }, { "epoch": 0.20193861066235863, "grad_norm": 0.47079196966589154, "learning_rate": 1.1428571428571429e-05, "loss": 0.2718, "loss_nan_ranks": 0, "loss_rank_avg": 0.2535105049610138, "step": 125, "valid_targets_mean": 5683.8, "valid_targets_min": 3121 }, { "epoch": 0.210016155088853, "grad_norm": 0.48737229402291704, "learning_rate": 1.1889400921658986e-05, "loss": 0.2677, "loss_nan_ranks": 0, "loss_rank_avg": 0.2664521038532257, "step": 130, "valid_targets_mean": 5758.3, "valid_targets_min": 3031 }, { "epoch": 0.21809369951534732, "grad_norm": 0.44438273857452876, "learning_rate": 1.2350230414746545e-05, "loss": 0.254, "loss_nan_ranks": 0, "loss_rank_avg": 0.24761803448200226, "step": 135, "valid_targets_mean": 5854.6, "valid_targets_min": 2705 }, { "epoch": 0.22617124394184168, "grad_norm": 0.484602203573656, "learning_rate": 1.2811059907834102e-05, "loss": 0.2591, "loss_nan_ranks": 0, "loss_rank_avg": 0.2663928270339966, "step": 140, "valid_targets_mean": 4858.4, "valid_targets_min": 3166 }, { "epoch": 0.23424878836833601, "grad_norm": 0.8373509253059376, "learning_rate": 1.327188940092166e-05, "loss": 0.2545, "loss_nan_ranks": 0, "loss_rank_avg": 0.23110944032669067, "step": 145, "valid_targets_mean": 5774.5, "valid_targets_min": 3857 }, { "epoch": 0.24232633279483037, "grad_norm": 0.4744523854954822, "learning_rate": 1.3732718894009217e-05, "loss": 0.2515, "loss_nan_ranks": 0, "loss_rank_avg": 0.2517966628074646, "step": 150, "valid_targets_mean": 5936.8, "valid_targets_min": 3820 }, { "epoch": 0.25040387722132473, "grad_norm": 0.4436732050116699, "learning_rate": 1.4193548387096776e-05, "loss": 0.2664, "loss_nan_ranks": 0, "loss_rank_avg": 0.2502896189689636, "step": 155, "valid_targets_mean": 5545.9, "valid_targets_min": 3053 }, { "epoch": 0.25848142164781907, "grad_norm": 0.5326764127215488, "learning_rate": 1.4654377880184335e-05, "loss": 0.2446, "loss_nan_ranks": 0, "loss_rank_avg": 0.2557904124259949, "step": 160, "valid_targets_mean": 4778.4, "valid_targets_min": 2787 }, { "epoch": 0.2665589660743134, "grad_norm": 0.5742888836203236, "learning_rate": 1.511520737327189e-05, "loss": 0.2506, "loss_nan_ranks": 0, "loss_rank_avg": 0.2368374466896057, "step": 165, "valid_targets_mean": 4304.3, "valid_targets_min": 982 }, { "epoch": 0.27463651050080773, "grad_norm": 0.516540542996034, "learning_rate": 1.5576036866359447e-05, "loss": 0.2448, "loss_nan_ranks": 0, "loss_rank_avg": 0.23024621605873108, "step": 170, "valid_targets_mean": 5190.8, "valid_targets_min": 3596 }, { "epoch": 0.2827140549273021, "grad_norm": 0.49927626067384623, "learning_rate": 1.6036866359447006e-05, "loss": 0.2536, "loss_nan_ranks": 0, "loss_rank_avg": 0.26048240065574646, "step": 175, "valid_targets_mean": 5276.1, "valid_targets_min": 3502 }, { "epoch": 0.29079159935379645, "grad_norm": 0.5279070782491759, "learning_rate": 1.6497695852534564e-05, "loss": 0.2599, "loss_nan_ranks": 0, "loss_rank_avg": 0.26732373237609863, "step": 180, "valid_targets_mean": 5403.4, "valid_targets_min": 3363 }, { "epoch": 0.2988691437802908, "grad_norm": 0.7686728653284448, "learning_rate": 1.695852534562212e-05, "loss": 0.2502, "loss_nan_ranks": 0, "loss_rank_avg": 0.24225091934204102, "step": 185, "valid_targets_mean": 5036.5, "valid_targets_min": 3044 }, { "epoch": 0.3069466882067851, "grad_norm": 0.5401854168098045, "learning_rate": 1.741935483870968e-05, "loss": 0.2427, "loss_nan_ranks": 0, "loss_rank_avg": 0.23782731592655182, "step": 190, "valid_targets_mean": 4939.9, "valid_targets_min": 3655 }, { "epoch": 0.3150242326332795, "grad_norm": 0.4741183912318437, "learning_rate": 1.7880184331797237e-05, "loss": 0.2358, "loss_nan_ranks": 0, "loss_rank_avg": 0.23438788950443268, "step": 195, "valid_targets_mean": 5697.8, "valid_targets_min": 3818 }, { "epoch": 0.32310177705977383, "grad_norm": 0.5649501345080572, "learning_rate": 1.8341013824884796e-05, "loss": 0.2449, "loss_nan_ranks": 0, "loss_rank_avg": 0.2522869110107422, "step": 200, "valid_targets_mean": 5545.6, "valid_targets_min": 2987 }, { "epoch": 0.33117932148626816, "grad_norm": 0.5024588642048885, "learning_rate": 1.880184331797235e-05, "loss": 0.2459, "loss_nan_ranks": 0, "loss_rank_avg": 0.25441572070121765, "step": 205, "valid_targets_mean": 5945.6, "valid_targets_min": 3733 }, { "epoch": 0.3392568659127625, "grad_norm": 0.4723024425418466, "learning_rate": 1.926267281105991e-05, "loss": 0.228, "loss_nan_ranks": 0, "loss_rank_avg": 0.22206412255764008, "step": 210, "valid_targets_mean": 5697.2, "valid_targets_min": 3558 }, { "epoch": 0.3473344103392569, "grad_norm": 0.6726911987350219, "learning_rate": 1.9723502304147465e-05, "loss": 0.2514, "loss_nan_ranks": 0, "loss_rank_avg": 0.28493285179138184, "step": 215, "valid_targets_mean": 5278.5, "valid_targets_min": 3333 }, { "epoch": 0.3554119547657512, "grad_norm": 0.4932617145639215, "learning_rate": 2.0184331797235024e-05, "loss": 0.2348, "loss_nan_ranks": 0, "loss_rank_avg": 0.24521911144256592, "step": 220, "valid_targets_mean": 5599.8, "valid_targets_min": 3656 }, { "epoch": 0.36348949919224555, "grad_norm": 0.7642926488649742, "learning_rate": 2.0645161290322582e-05, "loss": 0.2364, "loss_nan_ranks": 0, "loss_rank_avg": 0.23008081316947937, "step": 225, "valid_targets_mean": 4490.4, "valid_targets_min": 2678 }, { "epoch": 0.3715670436187399, "grad_norm": 0.4615383980334948, "learning_rate": 2.110599078341014e-05, "loss": 0.2451, "loss_nan_ranks": 0, "loss_rank_avg": 0.2407582700252533, "step": 230, "valid_targets_mean": 5580.6, "valid_targets_min": 1278 }, { "epoch": 0.37964458804523427, "grad_norm": 0.48203999030444306, "learning_rate": 2.1566820276497696e-05, "loss": 0.2462, "loss_nan_ranks": 0, "loss_rank_avg": 0.2535155117511749, "step": 235, "valid_targets_mean": 5543.1, "valid_targets_min": 3751 }, { "epoch": 0.3877221324717286, "grad_norm": 0.5148221390988014, "learning_rate": 2.2027649769585255e-05, "loss": 0.2353, "loss_nan_ranks": 0, "loss_rank_avg": 0.2425214797258377, "step": 240, "valid_targets_mean": 5763.6, "valid_targets_min": 3036 }, { "epoch": 0.39579967689822293, "grad_norm": 0.46547764871482555, "learning_rate": 2.2488479262672814e-05, "loss": 0.2425, "loss_nan_ranks": 0, "loss_rank_avg": 0.25116443634033203, "step": 245, "valid_targets_mean": 5522.1, "valid_targets_min": 2416 }, { "epoch": 0.40387722132471726, "grad_norm": 0.5077942282172957, "learning_rate": 2.2949308755760372e-05, "loss": 0.2362, "loss_nan_ranks": 0, "loss_rank_avg": 0.22106090188026428, "step": 250, "valid_targets_mean": 4705.5, "valid_targets_min": 2789 }, { "epoch": 0.41195476575121165, "grad_norm": 0.4787719956412287, "learning_rate": 2.3410138248847928e-05, "loss": 0.2346, "loss_nan_ranks": 0, "loss_rank_avg": 0.2345045804977417, "step": 255, "valid_targets_mean": 5413.2, "valid_targets_min": 2585 }, { "epoch": 0.420032310177706, "grad_norm": 0.485030743771553, "learning_rate": 2.3870967741935486e-05, "loss": 0.2306, "loss_nan_ranks": 0, "loss_rank_avg": 0.22481679916381836, "step": 260, "valid_targets_mean": 5144.9, "valid_targets_min": 2641 }, { "epoch": 0.4281098546042003, "grad_norm": 0.4205207190362599, "learning_rate": 2.4331797235023045e-05, "loss": 0.2358, "loss_nan_ranks": 0, "loss_rank_avg": 0.21444383263587952, "step": 265, "valid_targets_mean": 6273.4, "valid_targets_min": 2606 }, { "epoch": 0.43618739903069464, "grad_norm": 0.5211610541894309, "learning_rate": 2.4792626728110604e-05, "loss": 0.249, "loss_nan_ranks": 0, "loss_rank_avg": 0.2537360191345215, "step": 270, "valid_targets_mean": 5275.8, "valid_targets_min": 2861 }, { "epoch": 0.44426494345718903, "grad_norm": 0.4770920801732771, "learning_rate": 2.525345622119816e-05, "loss": 0.2366, "loss_nan_ranks": 0, "loss_rank_avg": 0.23997442424297333, "step": 275, "valid_targets_mean": 5575.6, "valid_targets_min": 3039 }, { "epoch": 0.45234248788368336, "grad_norm": 0.4570395047899931, "learning_rate": 2.5714285714285718e-05, "loss": 0.231, "loss_nan_ranks": 0, "loss_rank_avg": 0.23134195804595947, "step": 280, "valid_targets_mean": 6000.9, "valid_targets_min": 3196 }, { "epoch": 0.4604200323101777, "grad_norm": 0.5166087876373537, "learning_rate": 2.6175115207373277e-05, "loss": 0.2356, "loss_nan_ranks": 0, "loss_rank_avg": 0.2255057841539383, "step": 285, "valid_targets_mean": 4838.3, "valid_targets_min": 3099 }, { "epoch": 0.46849757673667203, "grad_norm": 0.49241744642017077, "learning_rate": 2.663594470046083e-05, "loss": 0.2282, "loss_nan_ranks": 0, "loss_rank_avg": 0.23905658721923828, "step": 290, "valid_targets_mean": 5878.9, "valid_targets_min": 3158 }, { "epoch": 0.4765751211631664, "grad_norm": 0.5151431055676697, "learning_rate": 2.7096774193548387e-05, "loss": 0.238, "loss_nan_ranks": 0, "loss_rank_avg": 0.2637583017349243, "step": 295, "valid_targets_mean": 5450.1, "valid_targets_min": 3154 }, { "epoch": 0.48465266558966075, "grad_norm": 0.5264942287162724, "learning_rate": 2.7557603686635946e-05, "loss": 0.2284, "loss_nan_ranks": 0, "loss_rank_avg": 0.24266698956489563, "step": 300, "valid_targets_mean": 5319.9, "valid_targets_min": 3183 }, { "epoch": 0.4927302100161551, "grad_norm": 0.5615744267117123, "learning_rate": 2.8018433179723505e-05, "loss": 0.2227, "loss_nan_ranks": 0, "loss_rank_avg": 0.23225907981395721, "step": 305, "valid_targets_mean": 5445.9, "valid_targets_min": 1904 }, { "epoch": 0.5008077544426495, "grad_norm": 0.4460039656784886, "learning_rate": 2.847926267281106e-05, "loss": 0.2255, "loss_nan_ranks": 0, "loss_rank_avg": 0.22618719935417175, "step": 310, "valid_targets_mean": 5620.4, "valid_targets_min": 2755 }, { "epoch": 0.5088852988691438, "grad_norm": 0.5221362994436883, "learning_rate": 2.894009216589862e-05, "loss": 0.229, "loss_nan_ranks": 0, "loss_rank_avg": 0.23870401084423065, "step": 315, "valid_targets_mean": 5645.4, "valid_targets_min": 3330 }, { "epoch": 0.5169628432956381, "grad_norm": 0.49079495003474594, "learning_rate": 2.9400921658986177e-05, "loss": 0.2267, "loss_nan_ranks": 0, "loss_rank_avg": 0.22571909427642822, "step": 320, "valid_targets_mean": 5016.4, "valid_targets_min": 3153 }, { "epoch": 0.5250403877221325, "grad_norm": 0.6884266293843466, "learning_rate": 2.9861751152073736e-05, "loss": 0.2207, "loss_nan_ranks": 0, "loss_rank_avg": 0.2298227846622467, "step": 325, "valid_targets_mean": 5508.1, "valid_targets_min": 2791 }, { "epoch": 0.5331179321486268, "grad_norm": 0.4402543092747063, "learning_rate": 3.032258064516129e-05, "loss": 0.2171, "loss_nan_ranks": 0, "loss_rank_avg": 0.21528840065002441, "step": 330, "valid_targets_mean": 6062.5, "valid_targets_min": 3032 }, { "epoch": 0.5411954765751211, "grad_norm": 0.4982840307868996, "learning_rate": 3.078341013824885e-05, "loss": 0.2218, "loss_nan_ranks": 0, "loss_rank_avg": 0.21430733799934387, "step": 335, "valid_targets_mean": 5194.5, "valid_targets_min": 3011 }, { "epoch": 0.5492730210016155, "grad_norm": 0.47525498968315927, "learning_rate": 3.124423963133641e-05, "loss": 0.2222, "loss_nan_ranks": 0, "loss_rank_avg": 0.23421087861061096, "step": 340, "valid_targets_mean": 5589.8, "valid_targets_min": 2991 }, { "epoch": 0.5573505654281099, "grad_norm": 0.48962076056010556, "learning_rate": 3.170506912442397e-05, "loss": 0.2267, "loss_nan_ranks": 0, "loss_rank_avg": 0.23705869913101196, "step": 345, "valid_targets_mean": 5420.9, "valid_targets_min": 3046 }, { "epoch": 0.5654281098546042, "grad_norm": 0.5248601937434871, "learning_rate": 3.2165898617511526e-05, "loss": 0.2208, "loss_nan_ranks": 0, "loss_rank_avg": 0.20738640427589417, "step": 350, "valid_targets_mean": 4991.7, "valid_targets_min": 3306 }, { "epoch": 0.5735056542810986, "grad_norm": 0.5529134517454101, "learning_rate": 3.2626728110599085e-05, "loss": 0.2236, "loss_nan_ranks": 0, "loss_rank_avg": 0.2433146983385086, "step": 355, "valid_targets_mean": 5450.4, "valid_targets_min": 2867 }, { "epoch": 0.5815831987075929, "grad_norm": 0.5074738580262357, "learning_rate": 3.3087557603686637e-05, "loss": 0.2144, "loss_nan_ranks": 0, "loss_rank_avg": 0.21955862641334534, "step": 360, "valid_targets_mean": 5322.2, "valid_targets_min": 3236 }, { "epoch": 0.5896607431340872, "grad_norm": 0.5076742089256605, "learning_rate": 3.3548387096774195e-05, "loss": 0.2229, "loss_nan_ranks": 0, "loss_rank_avg": 0.2087869644165039, "step": 365, "valid_targets_mean": 5765.1, "valid_targets_min": 3093 }, { "epoch": 0.5977382875605816, "grad_norm": 0.5278251933504018, "learning_rate": 3.4009216589861754e-05, "loss": 0.2196, "loss_nan_ranks": 0, "loss_rank_avg": 0.2305276095867157, "step": 370, "valid_targets_mean": 4804.2, "valid_targets_min": 3003 }, { "epoch": 0.6058158319870759, "grad_norm": 0.4826719162983493, "learning_rate": 3.447004608294931e-05, "loss": 0.2263, "loss_nan_ranks": 0, "loss_rank_avg": 0.23459242284297943, "step": 375, "valid_targets_mean": 5528.1, "valid_targets_min": 3357 }, { "epoch": 0.6138933764135702, "grad_norm": 0.6320625812833691, "learning_rate": 3.493087557603687e-05, "loss": 0.2187, "loss_nan_ranks": 0, "loss_rank_avg": 0.2187860608100891, "step": 380, "valid_targets_mean": 5503.6, "valid_targets_min": 3016 }, { "epoch": 0.6219709208400647, "grad_norm": 0.47007347965400653, "learning_rate": 3.539170506912443e-05, "loss": 0.219, "loss_nan_ranks": 0, "loss_rank_avg": 0.20786529779434204, "step": 385, "valid_targets_mean": 5985.6, "valid_targets_min": 2796 }, { "epoch": 0.630048465266559, "grad_norm": 0.4630795250015434, "learning_rate": 3.585253456221198e-05, "loss": 0.2187, "loss_nan_ranks": 0, "loss_rank_avg": 0.19715559482574463, "step": 390, "valid_targets_mean": 4612.4, "valid_targets_min": 1713 }, { "epoch": 0.6381260096930533, "grad_norm": 0.5023966582999537, "learning_rate": 3.631336405529954e-05, "loss": 0.2291, "loss_nan_ranks": 0, "loss_rank_avg": 0.2126794159412384, "step": 395, "valid_targets_mean": 5234.2, "valid_targets_min": 3174 }, { "epoch": 0.6462035541195477, "grad_norm": 0.5251269446671685, "learning_rate": 3.67741935483871e-05, "loss": 0.2214, "loss_nan_ranks": 0, "loss_rank_avg": 0.20799562335014343, "step": 400, "valid_targets_mean": 5003.8, "valid_targets_min": 3258 }, { "epoch": 0.654281098546042, "grad_norm": 0.4819749890049641, "learning_rate": 3.723502304147466e-05, "loss": 0.2086, "loss_nan_ranks": 0, "loss_rank_avg": 0.21949312090873718, "step": 405, "valid_targets_mean": 5259.9, "valid_targets_min": 3497 }, { "epoch": 0.6623586429725363, "grad_norm": 0.5188610703053317, "learning_rate": 3.7695852534562217e-05, "loss": 0.213, "loss_nan_ranks": 0, "loss_rank_avg": 0.22154083847999573, "step": 410, "valid_targets_mean": 5679.1, "valid_targets_min": 3014 }, { "epoch": 0.6704361873990307, "grad_norm": 0.5039417340983822, "learning_rate": 3.815668202764977e-05, "loss": 0.2212, "loss_nan_ranks": 0, "loss_rank_avg": 0.20660996437072754, "step": 415, "valid_targets_mean": 5197.8, "valid_targets_min": 1997 }, { "epoch": 0.678513731825525, "grad_norm": 0.7798249907735217, "learning_rate": 3.861751152073733e-05, "loss": 0.2075, "loss_nan_ranks": 0, "loss_rank_avg": 0.2136276513338089, "step": 420, "valid_targets_mean": 4663.6, "valid_targets_min": 2738 }, { "epoch": 0.6865912762520194, "grad_norm": 0.6066741003505866, "learning_rate": 3.9078341013824886e-05, "loss": 0.2176, "loss_nan_ranks": 0, "loss_rank_avg": 0.21756117045879364, "step": 425, "valid_targets_mean": 5574.6, "valid_targets_min": 3514 }, { "epoch": 0.6946688206785138, "grad_norm": 0.5223178069456903, "learning_rate": 3.9539170506912445e-05, "loss": 0.2074, "loss_nan_ranks": 0, "loss_rank_avg": 0.21287712454795837, "step": 430, "valid_targets_mean": 4827.9, "valid_targets_min": 2644 }, { "epoch": 0.7027463651050081, "grad_norm": 0.6672575878387428, "learning_rate": 4e-05, "loss": 0.225, "loss_nan_ranks": 0, "loss_rank_avg": 0.2201261818408966, "step": 435, "valid_targets_mean": 5125.8, "valid_targets_min": 3199 }, { "epoch": 0.7108239095315024, "grad_norm": 0.5201189718514464, "learning_rate": 3.999983769470204e-05, "loss": 0.215, "loss_nan_ranks": 0, "loss_rank_avg": 0.19945184886455536, "step": 440, "valid_targets_mean": 4788.5, "valid_targets_min": 3072 }, { "epoch": 0.7189014539579968, "grad_norm": 0.5370932365597184, "learning_rate": 3.999935078144245e-05, "loss": 0.2192, "loss_nan_ranks": 0, "loss_rank_avg": 0.2333751916885376, "step": 445, "valid_targets_mean": 5377.1, "valid_targets_min": 2867 }, { "epoch": 0.7269789983844911, "grad_norm": 0.47353136343989644, "learning_rate": 3.99985392681241e-05, "loss": 0.2166, "loss_nan_ranks": 0, "loss_rank_avg": 0.2093178629875183, "step": 450, "valid_targets_mean": 5342.3, "valid_targets_min": 3433 }, { "epoch": 0.7350565428109854, "grad_norm": 0.46778639574510306, "learning_rate": 3.999740316791827e-05, "loss": 0.2017, "loss_nan_ranks": 0, "loss_rank_avg": 0.19645030796527863, "step": 455, "valid_targets_mean": 5162.6, "valid_targets_min": 2735 }, { "epoch": 0.7431340872374798, "grad_norm": 0.5039905355084849, "learning_rate": 3.999594249926448e-05, "loss": 0.2197, "loss_nan_ranks": 0, "loss_rank_avg": 0.21575768291950226, "step": 460, "valid_targets_mean": 5144.1, "valid_targets_min": 2666 }, { "epoch": 0.7512116316639742, "grad_norm": 0.4533789907763941, "learning_rate": 3.999415728587014e-05, "loss": 0.2122, "loss_nan_ranks": 0, "loss_rank_avg": 0.2194235473871231, "step": 465, "valid_targets_mean": 5687.6, "valid_targets_min": 3098 }, { "epoch": 0.7592891760904685, "grad_norm": 0.510641703733595, "learning_rate": 3.999204755671023e-05, "loss": 0.2295, "loss_nan_ranks": 0, "loss_rank_avg": 0.23498345911502838, "step": 470, "valid_targets_mean": 5974.1, "valid_targets_min": 3649 }, { "epoch": 0.7673667205169629, "grad_norm": 0.4919939945918816, "learning_rate": 3.998961334602676e-05, "loss": 0.2198, "loss_nan_ranks": 0, "loss_rank_avg": 0.2350984811782837, "step": 475, "valid_targets_mean": 5363.2, "valid_targets_min": 3018 }, { "epoch": 0.7754442649434572, "grad_norm": 0.4966404337232152, "learning_rate": 3.998685469332826e-05, "loss": 0.2176, "loss_nan_ranks": 0, "loss_rank_avg": 0.22934846580028534, "step": 480, "valid_targets_mean": 5015.6, "valid_targets_min": 2629 }, { "epoch": 0.7835218093699515, "grad_norm": 0.4663688220948183, "learning_rate": 3.998377164338912e-05, "loss": 0.2188, "loss_nan_ranks": 0, "loss_rank_avg": 0.19937145709991455, "step": 485, "valid_targets_mean": 4668.9, "valid_targets_min": 2626 }, { "epoch": 0.7915993537964459, "grad_norm": 0.43392124152029365, "learning_rate": 3.9980364246248886e-05, "loss": 0.2094, "loss_nan_ranks": 0, "loss_rank_avg": 0.21592256426811218, "step": 490, "valid_targets_mean": 6146.0, "valid_targets_min": 3710 }, { "epoch": 0.7996768982229402, "grad_norm": 0.4987695829826951, "learning_rate": 3.997663255721141e-05, "loss": 0.2169, "loss_nan_ranks": 0, "loss_rank_avg": 0.20188398659229279, "step": 495, "valid_targets_mean": 5604.4, "valid_targets_min": 3111 }, { "epoch": 0.8077544426494345, "grad_norm": 0.42396799291927767, "learning_rate": 3.9972576636843976e-05, "loss": 0.2103, "loss_nan_ranks": 0, "loss_rank_avg": 0.19645419716835022, "step": 500, "valid_targets_mean": 5397.3, "valid_targets_min": 3259 }, { "epoch": 0.815831987075929, "grad_norm": 0.4615497571346846, "learning_rate": 3.9968196550976335e-05, "loss": 0.2084, "loss_nan_ranks": 0, "loss_rank_avg": 0.20108461380004883, "step": 505, "valid_targets_mean": 5036.8, "valid_targets_min": 3462 }, { "epoch": 0.8239095315024233, "grad_norm": 0.45009318204805604, "learning_rate": 3.99634923706996e-05, "loss": 0.2156, "loss_nan_ranks": 0, "loss_rank_avg": 0.214469313621521, "step": 510, "valid_targets_mean": 5153.3, "valid_targets_min": 951 }, { "epoch": 0.8319870759289176, "grad_norm": 0.4672244800718876, "learning_rate": 3.99584641723651e-05, "loss": 0.2138, "loss_nan_ranks": 0, "loss_rank_avg": 0.22961321473121643, "step": 515, "valid_targets_mean": 5477.1, "valid_targets_min": 3372 }, { "epoch": 0.840064620355412, "grad_norm": 0.5295100729321306, "learning_rate": 3.995311203758315e-05, "loss": 0.1954, "loss_nan_ranks": 0, "loss_rank_avg": 0.19334357976913452, "step": 520, "valid_targets_mean": 5322.9, "valid_targets_min": 2539 }, { "epoch": 0.8481421647819063, "grad_norm": 0.44621467111732166, "learning_rate": 3.9947436053221765e-05, "loss": 0.203, "loss_nan_ranks": 0, "loss_rank_avg": 0.1929529756307602, "step": 525, "valid_targets_mean": 5034.4, "valid_targets_min": 2613 }, { "epoch": 0.8562197092084006, "grad_norm": 0.45403900653095236, "learning_rate": 3.9941436311405146e-05, "loss": 0.2146, "loss_nan_ranks": 0, "loss_rank_avg": 0.19396071135997772, "step": 530, "valid_targets_mean": 5233.5, "valid_targets_min": 2868 }, { "epoch": 0.864297253634895, "grad_norm": 0.46795099266112605, "learning_rate": 3.9935112909512296e-05, "loss": 0.2138, "loss_nan_ranks": 0, "loss_rank_avg": 0.19735530018806458, "step": 535, "valid_targets_mean": 5340.6, "valid_targets_min": 2698 }, { "epoch": 0.8723747980613893, "grad_norm": 0.44225098932497453, "learning_rate": 3.992846595017538e-05, "loss": 0.2062, "loss_nan_ranks": 0, "loss_rank_avg": 0.19745707511901855, "step": 540, "valid_targets_mean": 5411.4, "valid_targets_min": 2974 }, { "epoch": 0.8804523424878837, "grad_norm": 0.4699030453155565, "learning_rate": 3.9921495541278055e-05, "loss": 0.201, "loss_nan_ranks": 0, "loss_rank_avg": 0.22131837904453278, "step": 545, "valid_targets_mean": 5369.1, "valid_targets_min": 3132 }, { "epoch": 0.8885298869143781, "grad_norm": 0.4484267118953338, "learning_rate": 3.991420179595377e-05, "loss": 0.2042, "loss_nan_ranks": 0, "loss_rank_avg": 0.19803202152252197, "step": 550, "valid_targets_mean": 5474.4, "valid_targets_min": 3240 }, { "epoch": 0.8966074313408724, "grad_norm": 0.4363172999484147, "learning_rate": 3.990658483258386e-05, "loss": 0.2075, "loss_nan_ranks": 0, "loss_rank_avg": 0.20177263021469116, "step": 555, "valid_targets_mean": 5468.0, "valid_targets_min": 3611 }, { "epoch": 0.9046849757673667, "grad_norm": 0.42726472894471124, "learning_rate": 3.989864477479568e-05, "loss": 0.2086, "loss_nan_ranks": 0, "loss_rank_avg": 0.19797097146511078, "step": 560, "valid_targets_mean": 5297.5, "valid_targets_min": 3148 }, { "epoch": 0.9127625201938611, "grad_norm": 0.8604100735139655, "learning_rate": 3.989038175146058e-05, "loss": 0.1994, "loss_nan_ranks": 0, "loss_rank_avg": 0.1961522400379181, "step": 565, "valid_targets_mean": 4621.4, "valid_targets_min": 2523 }, { "epoch": 0.9208400646203554, "grad_norm": 0.5029110628980737, "learning_rate": 3.98817958966918e-05, "loss": 0.212, "loss_nan_ranks": 0, "loss_rank_avg": 0.20313574373722076, "step": 570, "valid_targets_mean": 5248.2, "valid_targets_min": 2731 }, { "epoch": 0.9289176090468497, "grad_norm": 0.4875542838449614, "learning_rate": 3.9872887349842314e-05, "loss": 0.2066, "loss_nan_ranks": 0, "loss_rank_avg": 0.2127552330493927, "step": 575, "valid_targets_mean": 5201.7, "valid_targets_min": 3392 }, { "epoch": 0.9369951534733441, "grad_norm": 0.43717989119834383, "learning_rate": 3.9863656255502564e-05, "loss": 0.2088, "loss_nan_ranks": 0, "loss_rank_avg": 0.21224826574325562, "step": 580, "valid_targets_mean": 5225.4, "valid_targets_min": 3381 }, { "epoch": 0.9450726978998385, "grad_norm": 0.4616037851520303, "learning_rate": 3.985410276349809e-05, "loss": 0.2075, "loss_nan_ranks": 0, "loss_rank_avg": 0.17695999145507812, "step": 585, "valid_targets_mean": 5687.9, "valid_targets_min": 2938 }, { "epoch": 0.9531502423263328, "grad_norm": 0.4463582506367317, "learning_rate": 3.984422702888714e-05, "loss": 0.2002, "loss_nan_ranks": 0, "loss_rank_avg": 0.1981690526008606, "step": 590, "valid_targets_mean": 6257.0, "valid_targets_min": 3446 }, { "epoch": 0.9612277867528272, "grad_norm": 0.480542991208568, "learning_rate": 3.983402921195811e-05, "loss": 0.2052, "loss_nan_ranks": 0, "loss_rank_avg": 0.1909128725528717, "step": 595, "valid_targets_mean": 5778.5, "valid_targets_min": 2941 }, { "epoch": 0.9693053311793215, "grad_norm": 0.3902770147091619, "learning_rate": 3.982350947822697e-05, "loss": 0.1947, "loss_nan_ranks": 0, "loss_rank_avg": 0.1805838793516159, "step": 600, "valid_targets_mean": 5756.9, "valid_targets_min": 3440 }, { "epoch": 0.9773828756058158, "grad_norm": 0.4131148462914201, "learning_rate": 3.981266799843458e-05, "loss": 0.1985, "loss_nan_ranks": 0, "loss_rank_avg": 0.18150508403778076, "step": 605, "valid_targets_mean": 5193.4, "valid_targets_min": 2566 }, { "epoch": 0.9854604200323102, "grad_norm": 0.4235370608617834, "learning_rate": 3.9801504948543896e-05, "loss": 0.2027, "loss_nan_ranks": 0, "loss_rank_avg": 0.19405357539653778, "step": 610, "valid_targets_mean": 5936.7, "valid_targets_min": 3174 }, { "epoch": 0.9935379644588045, "grad_norm": 0.4516255003041157, "learning_rate": 3.979002050973713e-05, "loss": 0.1997, "loss_nan_ranks": 0, "loss_rank_avg": 0.18916358053684235, "step": 615, "valid_targets_mean": 5747.1, "valid_targets_min": 2721 }, { "epoch": 1.001615508885299, "grad_norm": 0.461759410912527, "learning_rate": 3.9778214868412814e-05, "loss": 0.2055, "loss_nan_ranks": 0, "loss_rank_avg": 0.19580666720867157, "step": 620, "valid_targets_mean": 5032.6, "valid_targets_min": 2931 }, { "epoch": 1.0096930533117932, "grad_norm": 0.4503702954517947, "learning_rate": 3.9766088216182757e-05, "loss": 0.2, "loss_nan_ranks": 0, "loss_rank_avg": 0.19610512256622314, "step": 625, "valid_targets_mean": 5503.9, "valid_targets_min": 3242 }, { "epoch": 1.0177705977382876, "grad_norm": 0.38535465367440225, "learning_rate": 3.975364074986895e-05, "loss": 0.1926, "loss_nan_ranks": 0, "loss_rank_avg": 0.1850084364414215, "step": 630, "valid_targets_mean": 5991.6, "valid_targets_min": 2942 }, { "epoch": 1.0258481421647818, "grad_norm": 0.49310881925785266, "learning_rate": 3.974087267150037e-05, "loss": 0.1896, "loss_nan_ranks": 0, "loss_rank_avg": 0.18842723965644836, "step": 635, "valid_targets_mean": 5075.8, "valid_targets_min": 3002 }, { "epoch": 1.0339256865912763, "grad_norm": 0.43908988379157626, "learning_rate": 3.972778418830969e-05, "loss": 0.1946, "loss_nan_ranks": 0, "loss_rank_avg": 0.19962944090366364, "step": 640, "valid_targets_mean": 5342.0, "valid_targets_min": 2747 }, { "epoch": 1.0420032310177707, "grad_norm": 0.4331538096922879, "learning_rate": 3.971437551272992e-05, "loss": 0.1919, "loss_nan_ranks": 0, "loss_rank_avg": 0.21022823452949524, "step": 645, "valid_targets_mean": 6027.9, "valid_targets_min": 3154 }, { "epoch": 1.050080775444265, "grad_norm": 0.5019102025271842, "learning_rate": 3.970064686239098e-05, "loss": 0.2003, "loss_nan_ranks": 0, "loss_rank_avg": 0.20737481117248535, "step": 650, "valid_targets_mean": 5382.2, "valid_targets_min": 2603 }, { "epoch": 1.0581583198707594, "grad_norm": 0.5083170777115193, "learning_rate": 3.968659846011614e-05, "loss": 0.1951, "loss_nan_ranks": 0, "loss_rank_avg": 0.20576795935630798, "step": 655, "valid_targets_mean": 5068.6, "valid_targets_min": 3324 }, { "epoch": 1.0662358642972536, "grad_norm": 0.5345249950524992, "learning_rate": 3.9672230533918394e-05, "loss": 0.1948, "loss_nan_ranks": 0, "loss_rank_avg": 0.20422016084194183, "step": 660, "valid_targets_mean": 4944.4, "valid_targets_min": 2800 }, { "epoch": 1.074313408723748, "grad_norm": 0.45969874071534583, "learning_rate": 3.965754331699681e-05, "loss": 0.2059, "loss_nan_ranks": 0, "loss_rank_avg": 0.21545246243476868, "step": 665, "valid_targets_mean": 5249.9, "valid_targets_min": 3535 }, { "epoch": 1.0823909531502423, "grad_norm": 0.448125663434801, "learning_rate": 3.96425370477327e-05, "loss": 0.1806, "loss_nan_ranks": 0, "loss_rank_avg": 0.18208260834217072, "step": 670, "valid_targets_mean": 5157.9, "valid_targets_min": 3169 }, { "epoch": 1.0904684975767367, "grad_norm": 0.4135195037949607, "learning_rate": 3.962721196968575e-05, "loss": 0.1843, "loss_nan_ranks": 0, "loss_rank_avg": 0.1834549605846405, "step": 675, "valid_targets_mean": 5862.1, "valid_targets_min": 1603 }, { "epoch": 1.098546042003231, "grad_norm": 0.44798067711582557, "learning_rate": 3.961156833159012e-05, "loss": 0.1985, "loss_nan_ranks": 0, "loss_rank_avg": 0.19529622793197632, "step": 680, "valid_targets_mean": 5122.6, "valid_targets_min": 3054 }, { "epoch": 1.1066235864297254, "grad_norm": 0.42894997437857857, "learning_rate": 3.959560638735033e-05, "loss": 0.1919, "loss_nan_ranks": 0, "loss_rank_avg": 0.20408596098423004, "step": 685, "valid_targets_mean": 5497.6, "valid_targets_min": 1227 }, { "epoch": 1.1147011308562198, "grad_norm": 0.4528612328531972, "learning_rate": 3.9579326396037194e-05, "loss": 0.2021, "loss_nan_ranks": 0, "loss_rank_avg": 0.20387399196624756, "step": 690, "valid_targets_mean": 5263.1, "valid_targets_min": 3358 }, { "epoch": 1.122778675282714, "grad_norm": 0.5306644692965696, "learning_rate": 3.95627286218836e-05, "loss": 0.1899, "loss_nan_ranks": 0, "loss_rank_avg": 0.1954362839460373, "step": 695, "valid_targets_mean": 5552.9, "valid_targets_min": 3140 }, { "epoch": 1.1308562197092085, "grad_norm": 0.4038746508777421, "learning_rate": 3.9545813334280196e-05, "loss": 0.2006, "loss_nan_ranks": 0, "loss_rank_avg": 0.22040167450904846, "step": 700, "valid_targets_mean": 6317.6, "valid_targets_min": 3279 }, { "epoch": 1.1389337641357027, "grad_norm": 0.48511839796376943, "learning_rate": 3.952858080777109e-05, "loss": 0.1927, "loss_nan_ranks": 0, "loss_rank_avg": 0.18491333723068237, "step": 705, "valid_targets_mean": 4990.2, "valid_targets_min": 3120 }, { "epoch": 1.1470113085621971, "grad_norm": 0.4163906032254929, "learning_rate": 3.951103132204929e-05, "loss": 0.1957, "loss_nan_ranks": 0, "loss_rank_avg": 0.18463069200515747, "step": 710, "valid_targets_mean": 5359.3, "valid_targets_min": 3578 }, { "epoch": 1.1550888529886914, "grad_norm": 0.4707109747768151, "learning_rate": 3.9493165161952273e-05, "loss": 0.1903, "loss_nan_ranks": 0, "loss_rank_avg": 0.2015255093574524, "step": 715, "valid_targets_mean": 5115.6, "valid_targets_min": 3198 }, { "epoch": 1.1631663974151858, "grad_norm": 0.4360586669061346, "learning_rate": 3.947498261745727e-05, "loss": 0.1886, "loss_nan_ranks": 0, "loss_rank_avg": 0.21659937500953674, "step": 720, "valid_targets_mean": 5570.9, "valid_targets_min": 3109 }, { "epoch": 1.1712439418416802, "grad_norm": 0.4909905395226162, "learning_rate": 3.9456483983676605e-05, "loss": 0.1923, "loss_nan_ranks": 0, "loss_rank_avg": 0.1849258691072464, "step": 725, "valid_targets_mean": 4441.8, "valid_targets_min": 2975 }, { "epoch": 1.1793214862681745, "grad_norm": 0.3961239491997915, "learning_rate": 3.943766956085291e-05, "loss": 0.1932, "loss_nan_ranks": 0, "loss_rank_avg": 0.18745461106300354, "step": 730, "valid_targets_mean": 5738.1, "valid_targets_min": 3693 }, { "epoch": 1.187399030694669, "grad_norm": 0.4504001793054616, "learning_rate": 3.941853965435425e-05, "loss": 0.1935, "loss_nan_ranks": 0, "loss_rank_avg": 0.20162153244018555, "step": 735, "valid_targets_mean": 5464.8, "valid_targets_min": 3482 }, { "epoch": 1.1954765751211631, "grad_norm": 0.4192116804539455, "learning_rate": 3.939909457466912e-05, "loss": 0.2014, "loss_nan_ranks": 0, "loss_rank_avg": 0.19164562225341797, "step": 740, "valid_targets_mean": 5500.5, "valid_targets_min": 3403 }, { "epoch": 1.2035541195476576, "grad_norm": 0.40950065823595944, "learning_rate": 3.937933463740147e-05, "loss": 0.189, "loss_nan_ranks": 0, "loss_rank_avg": 0.19027677178382874, "step": 745, "valid_targets_mean": 5712.7, "valid_targets_min": 3948 }, { "epoch": 1.2116316639741518, "grad_norm": 0.49384646135843263, "learning_rate": 3.9359260163265565e-05, "loss": 0.1929, "loss_nan_ranks": 0, "loss_rank_avg": 0.20605245232582092, "step": 750, "valid_targets_mean": 5703.0, "valid_targets_min": 3153 }, { "epoch": 1.2197092084006462, "grad_norm": 0.43935835645833166, "learning_rate": 3.933887147808074e-05, "loss": 0.1872, "loss_nan_ranks": 0, "loss_rank_avg": 0.19032615423202515, "step": 755, "valid_targets_mean": 5017.1, "valid_targets_min": 3492 }, { "epoch": 1.2277867528271407, "grad_norm": 0.4246915116255467, "learning_rate": 3.9318168912766165e-05, "loss": 0.1914, "loss_nan_ranks": 0, "loss_rank_avg": 0.17201930284500122, "step": 760, "valid_targets_mean": 4913.5, "valid_targets_min": 2726 }, { "epoch": 1.235864297253635, "grad_norm": 0.4371494767513589, "learning_rate": 3.929715280333544e-05, "loss": 0.1956, "loss_nan_ranks": 0, "loss_rank_avg": 0.1912434995174408, "step": 765, "valid_targets_mean": 5462.5, "valid_targets_min": 3552 }, { "epoch": 1.2439418416801293, "grad_norm": 0.4254249509205848, "learning_rate": 3.927582349089115e-05, "loss": 0.1832, "loss_nan_ranks": 0, "loss_rank_avg": 0.18086455762386322, "step": 770, "valid_targets_mean": 5954.0, "valid_targets_min": 2815 }, { "epoch": 1.2520193861066236, "grad_norm": 0.49992158133323245, "learning_rate": 3.9254181321619354e-05, "loss": 0.1959, "loss_nan_ranks": 0, "loss_rank_avg": 0.21536007523536682, "step": 775, "valid_targets_mean": 6339.7, "valid_targets_min": 2654 }, { "epoch": 1.260096930533118, "grad_norm": 0.4391153689958113, "learning_rate": 3.923222664678391e-05, "loss": 0.197, "loss_nan_ranks": 0, "loss_rank_avg": 0.20235435664653778, "step": 780, "valid_targets_mean": 5025.3, "valid_targets_min": 3189 }, { "epoch": 1.2681744749596122, "grad_norm": 0.45436181679553417, "learning_rate": 3.9209959822720825e-05, "loss": 0.1824, "loss_nan_ranks": 0, "loss_rank_avg": 0.18655994534492493, "step": 785, "valid_targets_mean": 5029.0, "valid_targets_min": 3026 }, { "epoch": 1.2762520193861067, "grad_norm": 0.4123558934830543, "learning_rate": 3.918738121083244e-05, "loss": 0.1855, "loss_nan_ranks": 0, "loss_rank_avg": 0.18062835931777954, "step": 790, "valid_targets_mean": 6172.1, "valid_targets_min": 4072 }, { "epoch": 1.284329563812601, "grad_norm": 0.4648329512789721, "learning_rate": 3.916449117758162e-05, "loss": 0.1919, "loss_nan_ranks": 0, "loss_rank_avg": 0.20275992155075073, "step": 795, "valid_targets_mean": 5446.8, "valid_targets_min": 2875 }, { "epoch": 1.2924071082390953, "grad_norm": 0.43193021218404604, "learning_rate": 3.9141290094485695e-05, "loss": 0.1892, "loss_nan_ranks": 0, "loss_rank_avg": 0.1833624541759491, "step": 800, "valid_targets_mean": 5321.3, "valid_targets_min": 2904 }, { "epoch": 1.3004846526655895, "grad_norm": 0.4754726363482082, "learning_rate": 3.911777833811056e-05, "loss": 0.1989, "loss_nan_ranks": 0, "loss_rank_avg": 0.19616547226905823, "step": 805, "valid_targets_mean": 5313.9, "valid_targets_min": 3515 }, { "epoch": 1.308562197092084, "grad_norm": 0.45079727006553794, "learning_rate": 3.909395629006446e-05, "loss": 0.1944, "loss_nan_ranks": 0, "loss_rank_avg": 0.19740955531597137, "step": 810, "valid_targets_mean": 6083.8, "valid_targets_min": 3641 }, { "epoch": 1.3166397415185784, "grad_norm": 0.6882667145706619, "learning_rate": 3.906982433699188e-05, "loss": 0.1874, "loss_nan_ranks": 0, "loss_rank_avg": 0.19484448432922363, "step": 815, "valid_targets_mean": 5730.5, "valid_targets_min": 3268 }, { "epoch": 1.3247172859450727, "grad_norm": 0.4089270681222454, "learning_rate": 3.9045382870567176e-05, "loss": 0.1857, "loss_nan_ranks": 0, "loss_rank_avg": 0.18390175700187683, "step": 820, "valid_targets_mean": 5482.7, "valid_targets_min": 1648 }, { "epoch": 1.332794830371567, "grad_norm": 0.45501691325829674, "learning_rate": 3.9020632287488306e-05, "loss": 0.1859, "loss_nan_ranks": 0, "loss_rank_avg": 0.18795420229434967, "step": 825, "valid_targets_mean": 5459.8, "valid_targets_min": 2946 }, { "epoch": 1.3408723747980613, "grad_norm": 0.4032112523950925, "learning_rate": 3.899557298947036e-05, "loss": 0.1899, "loss_nan_ranks": 0, "loss_rank_avg": 0.1787724494934082, "step": 830, "valid_targets_mean": 5734.0, "valid_targets_min": 3219 }, { "epoch": 1.3489499192245558, "grad_norm": 0.6157000030569536, "learning_rate": 3.897020538323901e-05, "loss": 0.1947, "loss_nan_ranks": 0, "loss_rank_avg": 0.18250499665737152, "step": 835, "valid_targets_mean": 4282.5, "valid_targets_min": 935 }, { "epoch": 1.35702746365105, "grad_norm": 0.4289416257934381, "learning_rate": 3.894452988052393e-05, "loss": 0.1946, "loss_nan_ranks": 0, "loss_rank_avg": 0.20244619250297546, "step": 840, "valid_targets_mean": 5285.2, "valid_targets_min": 3236 }, { "epoch": 1.3651050080775444, "grad_norm": 0.443933802902784, "learning_rate": 3.8918546898052163e-05, "loss": 0.1878, "loss_nan_ranks": 0, "loss_rank_avg": 0.1882239729166031, "step": 845, "valid_targets_mean": 5619.4, "valid_targets_min": 2782 }, { "epoch": 1.3731825525040389, "grad_norm": 0.42620992362285304, "learning_rate": 3.889225685754126e-05, "loss": 0.1887, "loss_nan_ranks": 0, "loss_rank_avg": 0.19183053076267242, "step": 850, "valid_targets_mean": 5213.1, "valid_targets_min": 3058 }, { "epoch": 1.381260096930533, "grad_norm": 0.4479107119801428, "learning_rate": 3.8865660185692506e-05, "loss": 0.1883, "loss_nan_ranks": 0, "loss_rank_avg": 0.19001539051532745, "step": 855, "valid_targets_mean": 4980.0, "valid_targets_min": 2417 }, { "epoch": 1.3893376413570275, "grad_norm": 0.4378497546979614, "learning_rate": 3.883875731418399e-05, "loss": 0.1829, "loss_nan_ranks": 0, "loss_rank_avg": 0.18882623314857483, "step": 860, "valid_targets_mean": 5717.3, "valid_targets_min": 3232 }, { "epoch": 1.3974151857835218, "grad_norm": 0.449776610356312, "learning_rate": 3.881154867966356e-05, "loss": 0.1932, "loss_nan_ranks": 0, "loss_rank_avg": 0.19307288527488708, "step": 865, "valid_targets_mean": 5585.6, "valid_targets_min": 3062 }, { "epoch": 1.4054927302100162, "grad_norm": 0.42148035811696744, "learning_rate": 3.878403472374176e-05, "loss": 0.1852, "loss_nan_ranks": 0, "loss_rank_avg": 0.18191015720367432, "step": 870, "valid_targets_mean": 5366.6, "valid_targets_min": 3470 }, { "epoch": 1.4135702746365104, "grad_norm": 0.4657919244437453, "learning_rate": 3.875621589298469e-05, "loss": 0.1888, "loss_nan_ranks": 0, "loss_rank_avg": 0.19623816013336182, "step": 875, "valid_targets_mean": 5090.8, "valid_targets_min": 256 }, { "epoch": 1.4216478190630049, "grad_norm": 0.5048847662100151, "learning_rate": 3.872809263890669e-05, "loss": 0.1868, "loss_nan_ranks": 0, "loss_rank_avg": 0.1963757425546646, "step": 880, "valid_targets_mean": 5389.4, "valid_targets_min": 3219 }, { "epoch": 1.4297253634894993, "grad_norm": 0.44706704838768546, "learning_rate": 3.8699665417963104e-05, "loss": 0.1928, "loss_nan_ranks": 0, "loss_rank_avg": 0.1936870962381363, "step": 885, "valid_targets_mean": 5634.3, "valid_targets_min": 3611 }, { "epoch": 1.4378029079159935, "grad_norm": 0.45989658582019405, "learning_rate": 3.867093469154275e-05, "loss": 0.1945, "loss_nan_ranks": 0, "loss_rank_avg": 0.18847247958183289, "step": 890, "valid_targets_mean": 4658.3, "valid_targets_min": 2568 }, { "epoch": 1.445880452342488, "grad_norm": 0.44383505996365463, "learning_rate": 3.864190092596058e-05, "loss": 0.184, "loss_nan_ranks": 0, "loss_rank_avg": 0.19026578962802887, "step": 895, "valid_targets_mean": 5617.9, "valid_targets_min": 2564 }, { "epoch": 1.4539579967689822, "grad_norm": 0.4194199111124668, "learning_rate": 3.861256459244996e-05, "loss": 0.1909, "loss_nan_ranks": 0, "loss_rank_avg": 0.17383940517902374, "step": 900, "valid_targets_mean": 5795.9, "valid_targets_min": 3262 }, { "epoch": 1.4620355411954766, "grad_norm": 0.4255109011676174, "learning_rate": 3.858292616715514e-05, "loss": 0.1848, "loss_nan_ranks": 0, "loss_rank_avg": 0.19212770462036133, "step": 905, "valid_targets_mean": 5731.1, "valid_targets_min": 2999 }, { "epoch": 1.4701130856219708, "grad_norm": 0.4319447738916833, "learning_rate": 3.855298613112346e-05, "loss": 0.1902, "loss_nan_ranks": 0, "loss_rank_avg": 0.1939164698123932, "step": 910, "valid_targets_mean": 5160.8, "valid_targets_min": 3688 }, { "epoch": 1.4781906300484653, "grad_norm": 0.4272240749656332, "learning_rate": 3.852274497029757e-05, "loss": 0.1892, "loss_nan_ranks": 0, "loss_rank_avg": 0.19081246852874756, "step": 915, "valid_targets_mean": 5302.4, "valid_targets_min": 2299 }, { "epoch": 1.4862681744749597, "grad_norm": 0.46589612683429193, "learning_rate": 3.849220317550753e-05, "loss": 0.1894, "loss_nan_ranks": 0, "loss_rank_avg": 0.18594548106193542, "step": 920, "valid_targets_mean": 5551.4, "valid_targets_min": 3274 }, { "epoch": 1.494345718901454, "grad_norm": 0.4239255105833143, "learning_rate": 3.846136124246285e-05, "loss": 0.1844, "loss_nan_ranks": 0, "loss_rank_avg": 0.1909162998199463, "step": 925, "valid_targets_mean": 5199.1, "valid_targets_min": 3129 }, { "epoch": 1.5024232633279482, "grad_norm": 0.422429353264246, "learning_rate": 3.843021967174444e-05, "loss": 0.1881, "loss_nan_ranks": 0, "loss_rank_avg": 0.19193074107170105, "step": 930, "valid_targets_mean": 5211.6, "valid_targets_min": 2783 }, { "epoch": 1.5105008077544426, "grad_norm": 0.41284494740761696, "learning_rate": 3.8398778968796504e-05, "loss": 0.1848, "loss_nan_ranks": 0, "loss_rank_avg": 0.18506529927253723, "step": 935, "valid_targets_mean": 5035.5, "valid_targets_min": 2843 }, { "epoch": 1.518578352180937, "grad_norm": 0.46260388072253517, "learning_rate": 3.836703964391829e-05, "loss": 0.1911, "loss_nan_ranks": 0, "loss_rank_avg": 0.17804807424545288, "step": 940, "valid_targets_mean": 4760.1, "valid_targets_min": 2700 }, { "epoch": 1.5266558966074313, "grad_norm": 0.4539090096449715, "learning_rate": 3.833500221225587e-05, "loss": 0.1905, "loss_nan_ranks": 0, "loss_rank_avg": 0.196572944521904, "step": 945, "valid_targets_mean": 5048.2, "valid_targets_min": 2911 }, { "epoch": 1.5347334410339257, "grad_norm": 0.3711320418441143, "learning_rate": 3.830266719379372e-05, "loss": 0.1779, "loss_nan_ranks": 0, "loss_rank_avg": 0.16216923296451569, "step": 950, "valid_targets_mean": 5451.4, "valid_targets_min": 2728 }, { "epoch": 1.5428109854604202, "grad_norm": 0.4053523215280699, "learning_rate": 3.827003511334634e-05, "loss": 0.188, "loss_nan_ranks": 0, "loss_rank_avg": 0.1896899789571762, "step": 955, "valid_targets_mean": 5590.5, "valid_targets_min": 3036 }, { "epoch": 1.5508885298869144, "grad_norm": 0.4143801981662257, "learning_rate": 3.8237106500549665e-05, "loss": 0.1836, "loss_nan_ranks": 0, "loss_rank_avg": 0.18760329484939575, "step": 960, "valid_targets_mean": 5340.1, "valid_targets_min": 3031 }, { "epoch": 1.5589660743134086, "grad_norm": 0.43435463117874407, "learning_rate": 3.8203881889852546e-05, "loss": 0.1973, "loss_nan_ranks": 0, "loss_rank_avg": 0.19068461656570435, "step": 965, "valid_targets_mean": 5864.2, "valid_targets_min": 2487 }, { "epoch": 1.567043618739903, "grad_norm": 0.398129305740008, "learning_rate": 3.8170361820508e-05, "loss": 0.1869, "loss_nan_ranks": 0, "loss_rank_avg": 0.18233898282051086, "step": 970, "valid_targets_mean": 5440.2, "valid_targets_min": 3231 }, { "epoch": 1.5751211631663975, "grad_norm": 0.3950559172966164, "learning_rate": 3.813654683656451e-05, "loss": 0.1789, "loss_nan_ranks": 0, "loss_rank_avg": 0.1903170347213745, "step": 975, "valid_targets_mean": 5554.0, "valid_targets_min": 3331 }, { "epoch": 1.5831987075928917, "grad_norm": 0.42327581866709485, "learning_rate": 3.810243748685719e-05, "loss": 0.1953, "loss_nan_ranks": 0, "loss_rank_avg": 0.1960287094116211, "step": 980, "valid_targets_mean": 5807.6, "valid_targets_min": 3432 }, { "epoch": 1.5912762520193862, "grad_norm": 0.426598665566564, "learning_rate": 3.806803432499885e-05, "loss": 0.1867, "loss_nan_ranks": 0, "loss_rank_avg": 0.17561861872673035, "step": 985, "valid_targets_mean": 5001.1, "valid_targets_min": 3431 }, { "epoch": 1.5993537964458806, "grad_norm": 0.40412602556538074, "learning_rate": 3.803333790937105e-05, "loss": 0.1838, "loss_nan_ranks": 0, "loss_rank_avg": 0.18966534733772278, "step": 990, "valid_targets_mean": 5509.1, "valid_targets_min": 2404 }, { "epoch": 1.6074313408723748, "grad_norm": 0.4340842659419959, "learning_rate": 3.7998348803114976e-05, "loss": 0.192, "loss_nan_ranks": 0, "loss_rank_avg": 0.1840440034866333, "step": 995, "valid_targets_mean": 5310.2, "valid_targets_min": 2912 }, { "epoch": 1.615508885298869, "grad_norm": 0.4111931761292879, "learning_rate": 3.7963067574122366e-05, "loss": 0.1888, "loss_nan_ranks": 0, "loss_rank_avg": 0.1781894564628601, "step": 1000, "valid_targets_mean": 5349.6, "valid_targets_min": 2450 }, { "epoch": 1.6235864297253635, "grad_norm": 0.4087537870046933, "learning_rate": 3.7927494795026265e-05, "loss": 0.1971, "loss_nan_ranks": 0, "loss_rank_avg": 0.19502080976963043, "step": 1005, "valid_targets_mean": 5933.0, "valid_targets_min": 3385 }, { "epoch": 1.631663974151858, "grad_norm": 0.4394450939693841, "learning_rate": 3.789163104319172e-05, "loss": 0.1864, "loss_nan_ranks": 0, "loss_rank_avg": 0.17000094056129456, "step": 1010, "valid_targets_mean": 4293.8, "valid_targets_min": 3014 }, { "epoch": 1.6397415185783522, "grad_norm": 0.4179986706849446, "learning_rate": 3.785547690070642e-05, "loss": 0.1914, "loss_nan_ranks": 0, "loss_rank_avg": 0.20335310697555542, "step": 1015, "valid_targets_mean": 4971.2, "valid_targets_min": 1935 }, { "epoch": 1.6478190630048464, "grad_norm": 0.41354564827824025, "learning_rate": 3.7819032954371265e-05, "loss": 0.1858, "loss_nan_ranks": 0, "loss_rank_avg": 0.19064179062843323, "step": 1020, "valid_targets_mean": 4628.4, "valid_targets_min": 915 }, { "epoch": 1.655896607431341, "grad_norm": 0.4510503380733471, "learning_rate": 3.7782299795690794e-05, "loss": 0.1815, "loss_nan_ranks": 0, "loss_rank_avg": 0.17823462188243866, "step": 1025, "valid_targets_mean": 4513.6, "valid_targets_min": 3031 }, { "epoch": 1.6639741518578353, "grad_norm": 0.4359485981028798, "learning_rate": 3.774527802086364e-05, "loss": 0.1826, "loss_nan_ranks": 0, "loss_rank_avg": 0.174652099609375, "step": 1030, "valid_targets_mean": 5560.6, "valid_targets_min": 3401 }, { "epoch": 1.6720516962843295, "grad_norm": 0.40463728071035676, "learning_rate": 3.770796823077283e-05, "loss": 0.1939, "loss_nan_ranks": 0, "loss_rank_avg": 0.18872065842151642, "step": 1035, "valid_targets_mean": 5051.6, "valid_targets_min": 936 }, { "epoch": 1.680129240710824, "grad_norm": 0.4285363767291524, "learning_rate": 3.767037103097602e-05, "loss": 0.1813, "loss_nan_ranks": 0, "loss_rank_avg": 0.19253358244895935, "step": 1040, "valid_targets_mean": 4814.4, "valid_targets_min": 826 }, { "epoch": 1.6882067851373184, "grad_norm": 0.42583910093778676, "learning_rate": 3.7632487031695675e-05, "loss": 0.1844, "loss_nan_ranks": 0, "loss_rank_avg": 0.18691575527191162, "step": 1045, "valid_targets_mean": 4759.1, "valid_targets_min": 2459 }, { "epoch": 1.6962843295638126, "grad_norm": 0.43279804450379034, "learning_rate": 3.7594316847809186e-05, "loss": 0.1937, "loss_nan_ranks": 0, "loss_rank_avg": 0.20354296267032623, "step": 1050, "valid_targets_mean": 5009.4, "valid_targets_min": 1970 }, { "epoch": 1.7043618739903068, "grad_norm": 0.4184227732912941, "learning_rate": 3.755586109883885e-05, "loss": 0.1824, "loss_nan_ranks": 0, "loss_rank_avg": 0.1752951741218567, "step": 1055, "valid_targets_mean": 5004.6, "valid_targets_min": 2373 }, { "epoch": 1.7124394184168013, "grad_norm": 0.3799780135092674, "learning_rate": 3.751712040894184e-05, "loss": 0.1893, "loss_nan_ranks": 0, "loss_rank_avg": 0.19882872700691223, "step": 1060, "valid_targets_mean": 6411.0, "valid_targets_min": 4081 }, { "epoch": 1.7205169628432957, "grad_norm": 0.41181195585953756, "learning_rate": 3.7478095406900095e-05, "loss": 0.1813, "loss_nan_ranks": 0, "loss_rank_avg": 0.20096594095230103, "step": 1065, "valid_targets_mean": 5860.9, "valid_targets_min": 3251 }, { "epoch": 1.72859450726979, "grad_norm": 0.42902723973896295, "learning_rate": 3.743878672611007e-05, "loss": 0.186, "loss_nan_ranks": 0, "loss_rank_avg": 0.18756358325481415, "step": 1070, "valid_targets_mean": 5537.8, "valid_targets_min": 3196 }, { "epoch": 1.7366720516962844, "grad_norm": 0.41118928927546355, "learning_rate": 3.7399195004572466e-05, "loss": 0.1795, "loss_nan_ranks": 0, "loss_rank_avg": 0.19546402990818024, "step": 1075, "valid_targets_mean": 5526.4, "valid_targets_min": 2809 }, { "epoch": 1.7447495961227788, "grad_norm": 0.4324303457609878, "learning_rate": 3.735932088488191e-05, "loss": 0.1814, "loss_nan_ranks": 0, "loss_rank_avg": 0.18632230162620544, "step": 1080, "valid_targets_mean": 5635.8, "valid_targets_min": 916 }, { "epoch": 1.752827140549273, "grad_norm": 0.4055121110771316, "learning_rate": 3.731916501421649e-05, "loss": 0.1869, "loss_nan_ranks": 0, "loss_rank_avg": 0.18193931877613068, "step": 1085, "valid_targets_mean": 5442.8, "valid_targets_min": 3361 }, { "epoch": 1.7609046849757672, "grad_norm": 0.527999221110702, "learning_rate": 3.727872804432726e-05, "loss": 0.1832, "loss_nan_ranks": 0, "loss_rank_avg": 0.20073384046554565, "step": 1090, "valid_targets_mean": 5310.4, "valid_targets_min": 3223 }, { "epoch": 1.7689822294022617, "grad_norm": 0.4274858774477681, "learning_rate": 3.7238010631527666e-05, "loss": 0.1834, "loss_nan_ranks": 0, "loss_rank_avg": 0.18347422778606415, "step": 1095, "valid_targets_mean": 5612.4, "valid_targets_min": 3423 }, { "epoch": 1.7770597738287561, "grad_norm": 0.42927802221254874, "learning_rate": 3.719701343668289e-05, "loss": 0.1927, "loss_nan_ranks": 0, "loss_rank_avg": 0.1750662922859192, "step": 1100, "valid_targets_mean": 4959.8, "valid_targets_min": 3136 }, { "epoch": 1.7851373182552503, "grad_norm": 0.3628087054837778, "learning_rate": 3.715573712519911e-05, "loss": 0.1832, "loss_nan_ranks": 0, "loss_rank_avg": 0.17887043952941895, "step": 1105, "valid_targets_mean": 5815.1, "valid_targets_min": 4014 }, { "epoch": 1.7932148626817448, "grad_norm": 0.4266388200490565, "learning_rate": 3.711418236701275e-05, "loss": 0.193, "loss_nan_ranks": 0, "loss_rank_avg": 0.21544912457466125, "step": 1110, "valid_targets_mean": 5051.7, "valid_targets_min": 2386 }, { "epoch": 1.8012924071082392, "grad_norm": 0.4136868601031113, "learning_rate": 3.707234983657954e-05, "loss": 0.1871, "loss_nan_ranks": 0, "loss_rank_avg": 0.18486517667770386, "step": 1115, "valid_targets_mean": 5495.8, "valid_targets_min": 1305 }, { "epoch": 1.8093699515347335, "grad_norm": 0.402967118487239, "learning_rate": 3.703024021286362e-05, "loss": 0.1892, "loss_nan_ranks": 0, "loss_rank_avg": 0.20577257871627808, "step": 1120, "valid_targets_mean": 5403.4, "valid_targets_min": 2698 }, { "epoch": 1.8174474959612277, "grad_norm": 0.42496692219736487, "learning_rate": 3.698785417932649e-05, "loss": 0.1902, "loss_nan_ranks": 0, "loss_rank_avg": 0.17963314056396484, "step": 1125, "valid_targets_mean": 5468.1, "valid_targets_min": 2550 }, { "epoch": 1.8255250403877221, "grad_norm": 0.39479948585929464, "learning_rate": 3.694519242391592e-05, "loss": 0.1895, "loss_nan_ranks": 0, "loss_rank_avg": 0.18878337740898132, "step": 1130, "valid_targets_mean": 5651.1, "valid_targets_min": 4059 }, { "epoch": 1.8336025848142166, "grad_norm": 0.4389945003529063, "learning_rate": 3.6902255639054806e-05, "loss": 0.1871, "loss_nan_ranks": 0, "loss_rank_avg": 0.18954357504844666, "step": 1135, "valid_targets_mean": 5592.6, "valid_targets_min": 3598 }, { "epoch": 1.8416801292407108, "grad_norm": 0.41830928765826586, "learning_rate": 3.685904452162992e-05, "loss": 0.185, "loss_nan_ranks": 0, "loss_rank_avg": 0.18112030625343323, "step": 1140, "valid_targets_mean": 4664.1, "valid_targets_min": 2236 }, { "epoch": 1.849757673667205, "grad_norm": 0.41070471823717275, "learning_rate": 3.681555977298059e-05, "loss": 0.1967, "loss_nan_ranks": 0, "loss_rank_avg": 0.2223418653011322, "step": 1145, "valid_targets_mean": 5106.7, "valid_targets_min": 2678 }, { "epoch": 1.8578352180936997, "grad_norm": 0.3916635528154224, "learning_rate": 3.677180209888733e-05, "loss": 0.1874, "loss_nan_ranks": 0, "loss_rank_avg": 0.17309582233428955, "step": 1150, "valid_targets_mean": 5281.2, "valid_targets_min": 2840 }, { "epoch": 1.865912762520194, "grad_norm": 0.4439330061230736, "learning_rate": 3.672777220956035e-05, "loss": 0.1853, "loss_nan_ranks": 0, "loss_rank_avg": 0.1888798475265503, "step": 1155, "valid_targets_mean": 4692.0, "valid_targets_min": 2598 }, { "epoch": 1.8739903069466881, "grad_norm": 0.4098709425390136, "learning_rate": 3.6683470819628104e-05, "loss": 0.1905, "loss_nan_ranks": 0, "loss_rank_avg": 0.2108800709247589, "step": 1160, "valid_targets_mean": 6092.9, "valid_targets_min": 3524 }, { "epoch": 1.8820678513731826, "grad_norm": 0.3506145878762836, "learning_rate": 3.663889864812562e-05, "loss": 0.179, "loss_nan_ranks": 0, "loss_rank_avg": 0.15639182925224304, "step": 1165, "valid_targets_mean": 5912.6, "valid_targets_min": 3557 }, { "epoch": 1.890145395799677, "grad_norm": 0.4280367169398799, "learning_rate": 3.6594056418482844e-05, "loss": 0.1792, "loss_nan_ranks": 0, "loss_rank_avg": 0.1831849217414856, "step": 1170, "valid_targets_mean": 4734.1, "valid_targets_min": 2709 }, { "epoch": 1.8982229402261712, "grad_norm": 0.402531733486501, "learning_rate": 3.6548944858512926e-05, "loss": 0.1853, "loss_nan_ranks": 0, "loss_rank_avg": 0.19320084154605865, "step": 1175, "valid_targets_mean": 5464.7, "valid_targets_min": 3488 }, { "epoch": 1.9063004846526654, "grad_norm": 0.426933703454056, "learning_rate": 3.650356470040038e-05, "loss": 0.1847, "loss_nan_ranks": 0, "loss_rank_avg": 0.17539432644844055, "step": 1180, "valid_targets_mean": 4791.7, "valid_targets_min": 1595 }, { "epoch": 1.9143780290791599, "grad_norm": 0.39173229481194327, "learning_rate": 3.645791668068923e-05, "loss": 0.1886, "loss_nan_ranks": 0, "loss_rank_avg": 0.20481710135936737, "step": 1185, "valid_targets_mean": 5580.2, "valid_targets_min": 3431 }, { "epoch": 1.9224555735056543, "grad_norm": 0.3534776648862029, "learning_rate": 3.6412001540271e-05, "loss": 0.1776, "loss_nan_ranks": 0, "loss_rank_avg": 0.17972326278686523, "step": 1190, "valid_targets_mean": 6481.8, "valid_targets_min": 3058 }, { "epoch": 1.9305331179321485, "grad_norm": 0.44528228054460384, "learning_rate": 3.6365820024372754e-05, "loss": 0.1828, "loss_nan_ranks": 0, "loss_rank_avg": 0.1828109472990036, "step": 1195, "valid_targets_mean": 5294.1, "valid_targets_min": 2729 }, { "epoch": 1.938610662358643, "grad_norm": 0.6772035127037407, "learning_rate": 3.6319372882544966e-05, "loss": 0.1893, "loss_nan_ranks": 0, "loss_rank_avg": 0.1858840435743332, "step": 1200, "valid_targets_mean": 5217.1, "valid_targets_min": 1086 }, { "epoch": 1.9466882067851374, "grad_norm": 0.3861931899139504, "learning_rate": 3.627266086864935e-05, "loss": 0.2012, "loss_nan_ranks": 0, "loss_rank_avg": 0.1952175348997116, "step": 1205, "valid_targets_mean": 5899.5, "valid_targets_min": 3731 }, { "epoch": 1.9547657512116317, "grad_norm": 0.43872850575648026, "learning_rate": 3.622568474084664e-05, "loss": 0.1825, "loss_nan_ranks": 0, "loss_rank_avg": 0.16384650766849518, "step": 1210, "valid_targets_mean": 4261.4, "valid_targets_min": 1412 }, { "epoch": 1.9628432956381259, "grad_norm": 0.37399241885571466, "learning_rate": 3.6178445261584275e-05, "loss": 0.1814, "loss_nan_ranks": 0, "loss_rank_avg": 0.1738545447587967, "step": 1215, "valid_targets_mean": 5521.0, "valid_targets_min": 2739 }, { "epoch": 1.9709208400646203, "grad_norm": 0.41605738475702797, "learning_rate": 3.6130943197584036e-05, "loss": 0.1859, "loss_nan_ranks": 0, "loss_rank_avg": 0.18516364693641663, "step": 1220, "valid_targets_mean": 5404.1, "valid_targets_min": 3228 }, { "epoch": 1.9789983844911148, "grad_norm": 0.4085987552814228, "learning_rate": 3.608317931982958e-05, "loss": 0.1859, "loss_nan_ranks": 0, "loss_rank_avg": 0.19084042310714722, "step": 1225, "valid_targets_mean": 5928.6, "valid_targets_min": 3101 }, { "epoch": 1.987075928917609, "grad_norm": 0.36877496540693433, "learning_rate": 3.6035154403553965e-05, "loss": 0.171, "loss_nan_ranks": 0, "loss_rank_avg": 0.174210324883461, "step": 1230, "valid_targets_mean": 5422.4, "valid_targets_min": 2923 }, { "epoch": 1.9951534733441034, "grad_norm": 0.426933061586902, "learning_rate": 3.5986869228227005e-05, "loss": 0.1826, "loss_nan_ranks": 0, "loss_rank_avg": 0.18611037731170654, "step": 1235, "valid_targets_mean": 4997.9, "valid_targets_min": 1502 }, { "epoch": 2.003231017770598, "grad_norm": 0.401606174889642, "learning_rate": 3.593832457754269e-05, "loss": 0.172, "loss_nan_ranks": 0, "loss_rank_avg": 0.1687077432870865, "step": 1240, "valid_targets_mean": 5052.2, "valid_targets_min": 3015 }, { "epoch": 2.011308562197092, "grad_norm": 0.40606330051530004, "learning_rate": 3.588952123940642e-05, "loss": 0.1664, "loss_nan_ranks": 0, "loss_rank_avg": 0.16908740997314453, "step": 1245, "valid_targets_mean": 5349.8, "valid_targets_min": 2523 }, { "epoch": 2.0193861066235863, "grad_norm": 0.4274105385686568, "learning_rate": 3.584046000592222e-05, "loss": 0.1634, "loss_nan_ranks": 0, "loss_rank_avg": 0.15948118269443512, "step": 1250, "valid_targets_mean": 5093.5, "valid_targets_min": 3262 }, { "epoch": 2.027463651050081, "grad_norm": 0.45256421704515376, "learning_rate": 3.5791141673379906e-05, "loss": 0.1644, "loss_nan_ranks": 0, "loss_rank_avg": 0.16202068328857422, "step": 1255, "valid_targets_mean": 5621.1, "valid_targets_min": 3673 }, { "epoch": 2.035541195476575, "grad_norm": 0.3862372173341649, "learning_rate": 3.574156704224215e-05, "loss": 0.1719, "loss_nan_ranks": 0, "loss_rank_avg": 0.14887890219688416, "step": 1260, "valid_targets_mean": 5471.6, "valid_targets_min": 3034 }, { "epoch": 2.0436187399030694, "grad_norm": 0.43883940614494954, "learning_rate": 3.569173691713147e-05, "loss": 0.1661, "loss_nan_ranks": 0, "loss_rank_avg": 0.17507337033748627, "step": 1265, "valid_targets_mean": 4869.2, "valid_targets_min": 3110 }, { "epoch": 2.0516962843295636, "grad_norm": 0.4077056739419978, "learning_rate": 3.5641652106817194e-05, "loss": 0.17, "loss_nan_ranks": 0, "loss_rank_avg": 0.1628391593694687, "step": 1270, "valid_targets_mean": 4946.0, "valid_targets_min": 3397 }, { "epoch": 2.0597738287560583, "grad_norm": 0.3920400314649599, "learning_rate": 3.559131342420235e-05, "loss": 0.1655, "loss_nan_ranks": 0, "loss_rank_avg": 0.16144214570522308, "step": 1275, "valid_targets_mean": 5687.8, "valid_targets_min": 3219 }, { "epoch": 2.0678513731825525, "grad_norm": 0.4697014734112868, "learning_rate": 3.554072168631039e-05, "loss": 0.1689, "loss_nan_ranks": 0, "loss_rank_avg": 0.16841688752174377, "step": 1280, "valid_targets_mean": 5773.9, "valid_targets_min": 2827 }, { "epoch": 2.0759289176090467, "grad_norm": 0.41851856710048596, "learning_rate": 3.5489877714272064e-05, "loss": 0.1722, "loss_nan_ranks": 0, "loss_rank_avg": 0.17223848402500153, "step": 1285, "valid_targets_mean": 5887.8, "valid_targets_min": 3573 }, { "epoch": 2.0840064620355414, "grad_norm": 0.3877542211888081, "learning_rate": 3.543878233331194e-05, "loss": 0.173, "loss_nan_ranks": 0, "loss_rank_avg": 0.16172486543655396, "step": 1290, "valid_targets_mean": 5461.9, "valid_targets_min": 3066 }, { "epoch": 2.0920840064620356, "grad_norm": 0.4405751263169863, "learning_rate": 3.538743637273515e-05, "loss": 0.1632, "loss_nan_ranks": 0, "loss_rank_avg": 0.156228169798851, "step": 1295, "valid_targets_mean": 5554.2, "valid_targets_min": 3937 }, { "epoch": 2.10016155088853, "grad_norm": 0.44672479309346075, "learning_rate": 3.5335840665913814e-05, "loss": 0.171, "loss_nan_ranks": 0, "loss_rank_avg": 0.1716388314962387, "step": 1300, "valid_targets_mean": 4500.0, "valid_targets_min": 2274 }, { "epoch": 2.108239095315024, "grad_norm": 0.43396813723890304, "learning_rate": 3.5283996050273606e-05, "loss": 0.176, "loss_nan_ranks": 0, "loss_rank_avg": 0.17064327001571655, "step": 1305, "valid_targets_mean": 5100.9, "valid_targets_min": 2093 }, { "epoch": 2.1163166397415187, "grad_norm": 0.43545641516471767, "learning_rate": 3.523190336728009e-05, "loss": 0.1649, "loss_nan_ranks": 0, "loss_rank_avg": 0.16103370487689972, "step": 1310, "valid_targets_mean": 4831.9, "valid_targets_min": 3058 }, { "epoch": 2.124394184168013, "grad_norm": 0.4303303750630934, "learning_rate": 3.517956346242512e-05, "loss": 0.1791, "loss_nan_ranks": 0, "loss_rank_avg": 0.16605603694915771, "step": 1315, "valid_targets_mean": 4949.8, "valid_targets_min": 3379 }, { "epoch": 2.132471728594507, "grad_norm": 0.3785254380964551, "learning_rate": 3.512697718521308e-05, "loss": 0.1703, "loss_nan_ranks": 0, "loss_rank_avg": 0.157035693526268, "step": 1320, "valid_targets_mean": 5796.8, "valid_targets_min": 2571 }, { "epoch": 2.1405492730210014, "grad_norm": 0.4479990330504035, "learning_rate": 3.5074145389147095e-05, "loss": 0.1707, "loss_nan_ranks": 0, "loss_rank_avg": 0.18853747844696045, "step": 1325, "valid_targets_mean": 5415.8, "valid_targets_min": 2539 }, { "epoch": 2.148626817447496, "grad_norm": 0.4332672460538596, "learning_rate": 3.502106893171523e-05, "loss": 0.1703, "loss_nan_ranks": 0, "loss_rank_avg": 0.17232483625411987, "step": 1330, "valid_targets_mean": 5326.8, "valid_targets_min": 2771 }, { "epoch": 2.1567043618739903, "grad_norm": 0.4158673008862669, "learning_rate": 3.4967748674376494e-05, "loss": 0.173, "loss_nan_ranks": 0, "loss_rank_avg": 0.18939775228500366, "step": 1335, "valid_targets_mean": 5557.8, "valid_targets_min": 3100 }, { "epoch": 2.1647819063004845, "grad_norm": 0.42762701762425376, "learning_rate": 3.4914185482546915e-05, "loss": 0.1641, "loss_nan_ranks": 0, "loss_rank_avg": 0.16821393370628357, "step": 1340, "valid_targets_mean": 5204.9, "valid_targets_min": 2956 }, { "epoch": 2.172859450726979, "grad_norm": 0.39851109399748474, "learning_rate": 3.4860380225585475e-05, "loss": 0.1775, "loss_nan_ranks": 0, "loss_rank_avg": 0.17029531300067902, "step": 1345, "valid_targets_mean": 5027.6, "valid_targets_min": 2571 }, { "epoch": 2.1809369951534734, "grad_norm": 0.4168775245127039, "learning_rate": 3.480633377678e-05, "loss": 0.1682, "loss_nan_ranks": 0, "loss_rank_avg": 0.15992960333824158, "step": 1350, "valid_targets_mean": 4966.4, "valid_targets_min": 720 }, { "epoch": 2.1890145395799676, "grad_norm": 0.475573654602836, "learning_rate": 3.475204701333298e-05, "loss": 0.1677, "loss_nan_ranks": 0, "loss_rank_avg": 0.1710505187511444, "step": 1355, "valid_targets_mean": 4562.9, "valid_targets_min": 2976 }, { "epoch": 2.197092084006462, "grad_norm": 0.41742134982113543, "learning_rate": 3.469752081634736e-05, "loss": 0.1631, "loss_nan_ranks": 0, "loss_rank_avg": 0.17456302046775818, "step": 1360, "valid_targets_mean": 5109.5, "valid_targets_min": 2370 }, { "epoch": 2.2051696284329565, "grad_norm": 0.5028864896919181, "learning_rate": 3.464275607081219e-05, "loss": 0.1656, "loss_nan_ranks": 0, "loss_rank_avg": 0.15900300443172455, "step": 1365, "valid_targets_mean": 4860.5, "valid_targets_min": 1502 }, { "epoch": 2.2132471728594507, "grad_norm": 0.3673834965367812, "learning_rate": 3.458775366558832e-05, "loss": 0.1737, "loss_nan_ranks": 0, "loss_rank_avg": 0.17337435483932495, "step": 1370, "valid_targets_mean": 6093.9, "valid_targets_min": 3429 }, { "epoch": 2.221324717285945, "grad_norm": 0.41072037713762377, "learning_rate": 3.4532514493393914e-05, "loss": 0.1718, "loss_nan_ranks": 0, "loss_rank_avg": 0.17573903501033783, "step": 1375, "valid_targets_mean": 5765.9, "valid_targets_min": 2648 }, { "epoch": 2.2294022617124396, "grad_norm": 0.4284254331283453, "learning_rate": 3.4477039450790015e-05, "loss": 0.1675, "loss_nan_ranks": 0, "loss_rank_avg": 0.16634736955165863, "step": 1380, "valid_targets_mean": 5872.1, "valid_targets_min": 3221 }, { "epoch": 2.237479806138934, "grad_norm": 0.6490092475424905, "learning_rate": 3.4421329438165944e-05, "loss": 0.1679, "loss_nan_ranks": 0, "loss_rank_avg": 0.15642938017845154, "step": 1385, "valid_targets_mean": 4863.2, "valid_targets_min": 2800 }, { "epoch": 2.245557350565428, "grad_norm": 0.4532650779405078, "learning_rate": 3.436538535972473e-05, "loss": 0.1663, "loss_nan_ranks": 0, "loss_rank_avg": 0.16853484511375427, "step": 1390, "valid_targets_mean": 5580.8, "valid_targets_min": 2997 }, { "epoch": 2.2536348949919223, "grad_norm": 0.46862263231029005, "learning_rate": 3.430920812346838e-05, "loss": 0.1776, "loss_nan_ranks": 0, "loss_rank_avg": 0.18197011947631836, "step": 1395, "valid_targets_mean": 5054.0, "valid_targets_min": 1102 }, { "epoch": 2.261712439418417, "grad_norm": 0.3926929669058476, "learning_rate": 3.425279864118324e-05, "loss": 0.1623, "loss_nan_ranks": 0, "loss_rank_avg": 0.1653885543346405, "step": 1400, "valid_targets_mean": 5755.1, "valid_targets_min": 3486 }, { "epoch": 2.269789983844911, "grad_norm": 0.4473829670830625, "learning_rate": 3.419615782842507e-05, "loss": 0.169, "loss_nan_ranks": 0, "loss_rank_avg": 0.17438775300979614, "step": 1405, "valid_targets_mean": 4425.4, "valid_targets_min": 2813 }, { "epoch": 2.2778675282714054, "grad_norm": 0.4497507198651243, "learning_rate": 3.413928660450427e-05, "loss": 0.1686, "loss_nan_ranks": 0, "loss_rank_avg": 0.18055163323879242, "step": 1410, "valid_targets_mean": 4834.5, "valid_targets_min": 2564 }, { "epoch": 2.2859450726979, "grad_norm": 0.3833845124298959, "learning_rate": 3.408218589247094e-05, "loss": 0.1629, "loss_nan_ranks": 0, "loss_rank_avg": 0.14256328344345093, "step": 1415, "valid_targets_mean": 5140.1, "valid_targets_min": 3313 }, { "epoch": 2.2940226171243943, "grad_norm": 0.4145273879316233, "learning_rate": 3.402485661909988e-05, "loss": 0.1704, "loss_nan_ranks": 0, "loss_rank_avg": 0.18663017451763153, "step": 1420, "valid_targets_mean": 5167.8, "valid_targets_min": 3523 }, { "epoch": 2.3021001615508885, "grad_norm": 0.3623669701914888, "learning_rate": 3.396729971487557e-05, "loss": 0.1657, "loss_nan_ranks": 0, "loss_rank_avg": 0.1587752103805542, "step": 1425, "valid_targets_mean": 5643.6, "valid_targets_min": 3462 }, { "epoch": 2.3101777059773827, "grad_norm": 0.4066395797349654, "learning_rate": 3.3909516113977073e-05, "loss": 0.1674, "loss_nan_ranks": 0, "loss_rank_avg": 0.16322427988052368, "step": 1430, "valid_targets_mean": 5590.2, "valid_targets_min": 3377 }, { "epoch": 2.3182552504038774, "grad_norm": 0.42382751521347023, "learning_rate": 3.385150675426283e-05, "loss": 0.1677, "loss_nan_ranks": 0, "loss_rank_avg": 0.16787301003932953, "step": 1435, "valid_targets_mean": 4900.2, "valid_targets_min": 2613 }, { "epoch": 2.3263327948303716, "grad_norm": 0.4268245994999202, "learning_rate": 3.37932725772555e-05, "loss": 0.1652, "loss_nan_ranks": 0, "loss_rank_avg": 0.1627117395401001, "step": 1440, "valid_targets_mean": 5724.6, "valid_targets_min": 3407 }, { "epoch": 2.334410339256866, "grad_norm": 0.43132043272994586, "learning_rate": 3.37348145281266e-05, "loss": 0.1648, "loss_nan_ranks": 0, "loss_rank_avg": 0.18179920315742493, "step": 1445, "valid_targets_mean": 5504.1, "valid_targets_min": 3547 }, { "epoch": 2.3424878836833605, "grad_norm": 0.40927578349516525, "learning_rate": 3.367613355568126e-05, "loss": 0.1741, "loss_nan_ranks": 0, "loss_rank_avg": 0.18249475955963135, "step": 1450, "valid_targets_mean": 5405.1, "valid_targets_min": 3096 }, { "epoch": 2.3505654281098547, "grad_norm": 0.37071367481289286, "learning_rate": 3.361723061234275e-05, "loss": 0.1613, "loss_nan_ranks": 0, "loss_rank_avg": 0.15142659842967987, "step": 1455, "valid_targets_mean": 5216.8, "valid_targets_min": 2946 }, { "epoch": 2.358642972536349, "grad_norm": 0.4273375833985219, "learning_rate": 3.355810665413704e-05, "loss": 0.1752, "loss_nan_ranks": 0, "loss_rank_avg": 0.16882875561714172, "step": 1460, "valid_targets_mean": 5893.2, "valid_targets_min": 4168 }, { "epoch": 2.366720516962843, "grad_norm": 0.43524365947164323, "learning_rate": 3.34987626406773e-05, "loss": 0.1615, "loss_nan_ranks": 0, "loss_rank_avg": 0.16199825704097748, "step": 1465, "valid_targets_mean": 5291.4, "valid_targets_min": 3203 }, { "epoch": 2.374798061389338, "grad_norm": 0.4326769770987258, "learning_rate": 3.343919953514831e-05, "loss": 0.1679, "loss_nan_ranks": 0, "loss_rank_avg": 0.1664809137582779, "step": 1470, "valid_targets_mean": 5582.1, "valid_targets_min": 2984 }, { "epoch": 2.382875605815832, "grad_norm": 0.4114451446619777, "learning_rate": 3.337941830429082e-05, "loss": 0.1707, "loss_nan_ranks": 0, "loss_rank_avg": 0.1652735322713852, "step": 1475, "valid_targets_mean": 5063.2, "valid_targets_min": 3032 }, { "epoch": 2.3909531502423262, "grad_norm": 0.3660040398033965, "learning_rate": 3.331941991838589e-05, "loss": 0.1754, "loss_nan_ranks": 0, "loss_rank_avg": 0.16325372457504272, "step": 1480, "valid_targets_mean": 5960.8, "valid_targets_min": 4023 }, { "epoch": 2.399030694668821, "grad_norm": 0.43398835076941117, "learning_rate": 3.32592053512391e-05, "loss": 0.1684, "loss_nan_ranks": 0, "loss_rank_avg": 0.16197870671749115, "step": 1485, "valid_targets_mean": 4514.6, "valid_targets_min": 665 }, { "epoch": 2.407108239095315, "grad_norm": 0.3909720869151018, "learning_rate": 3.319877558016478e-05, "loss": 0.1671, "loss_nan_ranks": 0, "loss_rank_avg": 0.16862240433692932, "step": 1490, "valid_targets_mean": 5479.7, "valid_targets_min": 2374 }, { "epoch": 2.4151857835218093, "grad_norm": 0.44100978004666036, "learning_rate": 3.3138131585970134e-05, "loss": 0.1723, "loss_nan_ranks": 0, "loss_rank_avg": 0.18514972925186157, "step": 1495, "valid_targets_mean": 5116.6, "valid_targets_min": 3257 }, { "epoch": 2.4232633279483036, "grad_norm": 0.3981887790759492, "learning_rate": 3.3077274352939315e-05, "loss": 0.1751, "loss_nan_ranks": 0, "loss_rank_avg": 0.15568625926971436, "step": 1500, "valid_targets_mean": 5510.9, "valid_targets_min": 3469 }, { "epoch": 2.4313408723747982, "grad_norm": 0.43017412638926306, "learning_rate": 3.301620486881746e-05, "loss": 0.1639, "loss_nan_ranks": 0, "loss_rank_avg": 0.17815840244293213, "step": 1505, "valid_targets_mean": 5197.9, "valid_targets_min": 2762 }, { "epoch": 2.4394184168012925, "grad_norm": 0.4401707898411131, "learning_rate": 3.2954924124794636e-05, "loss": 0.1695, "loss_nan_ranks": 0, "loss_rank_avg": 0.16379782557487488, "step": 1510, "valid_targets_mean": 4692.9, "valid_targets_min": 2956 }, { "epoch": 2.4474959612277867, "grad_norm": 0.3607160404524143, "learning_rate": 3.28934331154898e-05, "loss": 0.1637, "loss_nan_ranks": 0, "loss_rank_avg": 0.15107029676437378, "step": 1515, "valid_targets_mean": 5661.4, "valid_targets_min": 2921 }, { "epoch": 2.4555735056542813, "grad_norm": 0.35908930376071707, "learning_rate": 3.2831732838934615e-05, "loss": 0.167, "loss_nan_ranks": 0, "loss_rank_avg": 0.14789265394210815, "step": 1520, "valid_targets_mean": 5564.4, "valid_targets_min": 2092 }, { "epoch": 2.4636510500807756, "grad_norm": 0.44315420095764363, "learning_rate": 3.276982429655724e-05, "loss": 0.1652, "loss_nan_ranks": 0, "loss_rank_avg": 0.15249694883823395, "step": 1525, "valid_targets_mean": 4679.8, "valid_targets_min": 256 }, { "epoch": 2.47172859450727, "grad_norm": 0.3807929761670207, "learning_rate": 3.270770849316612e-05, "loss": 0.1617, "loss_nan_ranks": 0, "loss_rank_avg": 0.1659863442182541, "step": 1530, "valid_targets_mean": 5424.8, "valid_targets_min": 3098 }, { "epoch": 2.479806138933764, "grad_norm": 0.4029349113660074, "learning_rate": 3.264538643693367e-05, "loss": 0.1638, "loss_nan_ranks": 0, "loss_rank_avg": 0.14238610863685608, "step": 1535, "valid_targets_mean": 5705.2, "valid_targets_min": 3058 }, { "epoch": 2.4878836833602587, "grad_norm": 0.392438283116615, "learning_rate": 3.258285913937988e-05, "loss": 0.1574, "loss_nan_ranks": 0, "loss_rank_avg": 0.15044398605823517, "step": 1540, "valid_targets_mean": 5630.6, "valid_targets_min": 3316 }, { "epoch": 2.495961227786753, "grad_norm": 0.42696864338998214, "learning_rate": 3.2520127615355885e-05, "loss": 0.163, "loss_nan_ranks": 0, "loss_rank_avg": 0.17117537558078766, "step": 1545, "valid_targets_mean": 5718.1, "valid_targets_min": 3588 }, { "epoch": 2.504038772213247, "grad_norm": 0.4088967704654339, "learning_rate": 3.245719288302758e-05, "loss": 0.1636, "loss_nan_ranks": 0, "loss_rank_avg": 0.17196603119373322, "step": 1550, "valid_targets_mean": 5265.9, "valid_targets_min": 2815 }, { "epoch": 2.5121163166397418, "grad_norm": 0.3502253105336199, "learning_rate": 3.239405596385902e-05, "loss": 0.1583, "loss_nan_ranks": 0, "loss_rank_avg": 0.14983238279819489, "step": 1555, "valid_targets_mean": 6427.2, "valid_targets_min": 4682 }, { "epoch": 2.520193861066236, "grad_norm": 0.4183519330842782, "learning_rate": 3.233071788259582e-05, "loss": 0.1611, "loss_nan_ranks": 0, "loss_rank_avg": 0.14721640944480896, "step": 1560, "valid_targets_mean": 4815.1, "valid_targets_min": 3095 }, { "epoch": 2.52827140549273, "grad_norm": 0.4352795741458169, "learning_rate": 3.2267179667248636e-05, "loss": 0.1582, "loss_nan_ranks": 0, "loss_rank_avg": 0.15912222862243652, "step": 1565, "valid_targets_mean": 5072.4, "valid_targets_min": 3089 }, { "epoch": 2.5363489499192244, "grad_norm": 0.42056275261628046, "learning_rate": 3.220344234907634e-05, "loss": 0.1558, "loss_nan_ranks": 0, "loss_rank_avg": 0.16274453699588776, "step": 1570, "valid_targets_mean": 5461.2, "valid_targets_min": 3889 }, { "epoch": 2.5444264943457187, "grad_norm": 0.39668108670101565, "learning_rate": 3.2139506962569376e-05, "loss": 0.1609, "loss_nan_ranks": 0, "loss_rank_avg": 0.15409982204437256, "step": 1575, "valid_targets_mean": 5482.7, "valid_targets_min": 1894 }, { "epoch": 2.5525040387722133, "grad_norm": 0.39268047733866424, "learning_rate": 3.2075374545432945e-05, "loss": 0.1601, "loss_nan_ranks": 0, "loss_rank_avg": 0.15878914296627045, "step": 1580, "valid_targets_mean": 5595.6, "valid_targets_min": 2744 }, { "epoch": 2.5605815831987075, "grad_norm": 0.48291631001099655, "learning_rate": 3.201104613857015e-05, "loss": 0.1646, "loss_nan_ranks": 0, "loss_rank_avg": 0.18096968531608582, "step": 1585, "valid_targets_mean": 4983.4, "valid_targets_min": 1583 }, { "epoch": 2.568659127625202, "grad_norm": 0.4034564494750503, "learning_rate": 3.1946522786065125e-05, "loss": 0.1543, "loss_nan_ranks": 0, "loss_rank_avg": 0.14894041419029236, "step": 1590, "valid_targets_mean": 5471.7, "valid_targets_min": 2886 }, { "epoch": 2.5767366720516964, "grad_norm": 0.4119983923922993, "learning_rate": 3.188180553516606e-05, "loss": 0.1643, "loss_nan_ranks": 0, "loss_rank_avg": 0.16128647327423096, "step": 1595, "valid_targets_mean": 5662.8, "valid_targets_min": 2978 }, { "epoch": 2.5848142164781907, "grad_norm": 0.4123640591545943, "learning_rate": 3.181689543626822e-05, "loss": 0.1591, "loss_nan_ranks": 0, "loss_rank_avg": 0.18056736886501312, "step": 1600, "valid_targets_mean": 5447.2, "valid_targets_min": 3365 }, { "epoch": 2.592891760904685, "grad_norm": 0.3869046988263049, "learning_rate": 3.1751793542896895e-05, "loss": 0.1546, "loss_nan_ranks": 0, "loss_rank_avg": 0.16578814387321472, "step": 1605, "valid_targets_mean": 5747.5, "valid_targets_min": 1603 }, { "epoch": 2.600969305331179, "grad_norm": 0.4316608359130143, "learning_rate": 3.1686500911690315e-05, "loss": 0.1615, "loss_nan_ranks": 0, "loss_rank_avg": 0.1606169044971466, "step": 1610, "valid_targets_mean": 5133.5, "valid_targets_min": 906 }, { "epoch": 2.6090468497576738, "grad_norm": 0.40446250120673677, "learning_rate": 3.162101860238247e-05, "loss": 0.1637, "loss_nan_ranks": 0, "loss_rank_avg": 0.14105135202407837, "step": 1615, "valid_targets_mean": 5533.9, "valid_targets_min": 3032 }, { "epoch": 2.617124394184168, "grad_norm": 0.47625077340872074, "learning_rate": 3.155534767778594e-05, "loss": 0.1659, "loss_nan_ranks": 0, "loss_rank_avg": 0.18141523003578186, "step": 1620, "valid_targets_mean": 4673.2, "valid_targets_min": 2542 }, { "epoch": 2.625201938610662, "grad_norm": 0.4465275345328576, "learning_rate": 3.1489489203774627e-05, "loss": 0.1574, "loss_nan_ranks": 0, "loss_rank_avg": 0.1559813916683197, "step": 1625, "valid_targets_mean": 5545.8, "valid_targets_min": 3295 }, { "epoch": 2.633279483037157, "grad_norm": 0.4192958307468656, "learning_rate": 3.1423444249266436e-05, "loss": 0.1637, "loss_nan_ranks": 0, "loss_rank_avg": 0.18528008460998535, "step": 1630, "valid_targets_mean": 5995.1, "valid_targets_min": 3733 }, { "epoch": 2.641357027463651, "grad_norm": 0.4049950210554484, "learning_rate": 3.1357213886205986e-05, "loss": 0.163, "loss_nan_ranks": 0, "loss_rank_avg": 0.17278358340263367, "step": 1635, "valid_targets_mean": 5698.8, "valid_targets_min": 1120 }, { "epoch": 2.6494345718901453, "grad_norm": 0.40913206526342066, "learning_rate": 3.1290799189547155e-05, "loss": 0.1562, "loss_nan_ranks": 0, "loss_rank_avg": 0.15328720211982727, "step": 1640, "valid_targets_mean": 4910.6, "valid_targets_min": 860 }, { "epoch": 2.6575121163166395, "grad_norm": 0.4257325837836936, "learning_rate": 3.122420123723565e-05, "loss": 0.1526, "loss_nan_ranks": 0, "loss_rank_avg": 0.15455028414726257, "step": 1645, "valid_targets_mean": 5031.7, "valid_targets_min": 3529 }, { "epoch": 2.665589660743134, "grad_norm": 0.4521874347895494, "learning_rate": 3.115742111019152e-05, "loss": 0.1565, "loss_nan_ranks": 0, "loss_rank_avg": 0.14618174731731415, "step": 1650, "valid_targets_mean": 4829.0, "valid_targets_min": 2955 }, { "epoch": 2.6736672051696284, "grad_norm": 0.39499453267355306, "learning_rate": 3.1090459892291616e-05, "loss": 0.1601, "loss_nan_ranks": 0, "loss_rank_avg": 0.1510046422481537, "step": 1655, "valid_targets_mean": 5492.4, "valid_targets_min": 3011 }, { "epoch": 2.6817447495961226, "grad_norm": 0.42966057396892693, "learning_rate": 3.102331867035197e-05, "loss": 0.1573, "loss_nan_ranks": 0, "loss_rank_avg": 0.16350698471069336, "step": 1660, "valid_targets_mean": 5012.4, "valid_targets_min": 3294 }, { "epoch": 2.6898222940226173, "grad_norm": 0.4262326803802079, "learning_rate": 3.095599853411019e-05, "loss": 0.1545, "loss_nan_ranks": 0, "loss_rank_avg": 0.16098210215568542, "step": 1665, "valid_targets_mean": 5450.9, "valid_targets_min": 3548 }, { "epoch": 2.6978998384491115, "grad_norm": 0.4546118001183254, "learning_rate": 3.088850057620777e-05, "loss": 0.1557, "loss_nan_ranks": 0, "loss_rank_avg": 0.16224367916584015, "step": 1670, "valid_targets_mean": 5435.6, "valid_targets_min": 3398 }, { "epoch": 2.7059773828756057, "grad_norm": 0.40167696331255726, "learning_rate": 3.08208258921723e-05, "loss": 0.1608, "loss_nan_ranks": 0, "loss_rank_avg": 0.13801468908786774, "step": 1675, "valid_targets_mean": 5132.9, "valid_targets_min": 3184 }, { "epoch": 2.7140549273021, "grad_norm": 0.4210913248605828, "learning_rate": 3.075297558039976e-05, "loss": 0.1592, "loss_nan_ranks": 0, "loss_rank_avg": 0.14852957427501678, "step": 1680, "valid_targets_mean": 5154.9, "valid_targets_min": 2962 }, { "epoch": 2.7221324717285946, "grad_norm": 0.3743885008222628, "learning_rate": 3.068495074213667e-05, "loss": 0.1605, "loss_nan_ranks": 0, "loss_rank_avg": 0.1448890119791031, "step": 1685, "valid_targets_mean": 5794.9, "valid_targets_min": 2758 }, { "epoch": 2.730210016155089, "grad_norm": 0.40410715658459306, "learning_rate": 3.0616752481462184e-05, "loss": 0.1645, "loss_nan_ranks": 0, "loss_rank_avg": 0.15657979249954224, "step": 1690, "valid_targets_mean": 5021.4, "valid_targets_min": 3366 }, { "epoch": 2.738287560581583, "grad_norm": 0.4714995506258271, "learning_rate": 3.054838190527021e-05, "loss": 0.1536, "loss_nan_ranks": 0, "loss_rank_avg": 0.16343599557876587, "step": 1695, "valid_targets_mean": 4527.0, "valid_targets_min": 2803 }, { "epoch": 2.7463651050080777, "grad_norm": 0.43772533089432647, "learning_rate": 3.0479840123251424e-05, "loss": 0.1593, "loss_nan_ranks": 0, "loss_rank_avg": 0.17091104388237, "step": 1700, "valid_targets_mean": 5508.5, "valid_targets_min": 3143 }, { "epoch": 2.754442649434572, "grad_norm": 0.45122256716443765, "learning_rate": 3.0411128247875248e-05, "loss": 0.1637, "loss_nan_ranks": 0, "loss_rank_avg": 0.17041394114494324, "step": 1705, "valid_targets_mean": 4875.2, "valid_targets_min": 2137 }, { "epoch": 2.762520193861066, "grad_norm": 0.38714450629462066, "learning_rate": 3.0342247394371836e-05, "loss": 0.1651, "loss_nan_ranks": 0, "loss_rank_avg": 0.152548149228096, "step": 1710, "valid_targets_mean": 5843.6, "valid_targets_min": 3284 }, { "epoch": 2.7705977382875604, "grad_norm": 0.5422209052327676, "learning_rate": 3.0273198680713937e-05, "loss": 0.1635, "loss_nan_ranks": 0, "loss_rank_avg": 0.16515977680683136, "step": 1715, "valid_targets_mean": 5581.4, "valid_targets_min": 2737 }, { "epoch": 2.778675282714055, "grad_norm": 0.41258879566049084, "learning_rate": 3.0203983227598733e-05, "loss": 0.166, "loss_nan_ranks": 0, "loss_rank_avg": 0.1601826399564743, "step": 1720, "valid_targets_mean": 5942.6, "valid_targets_min": 3936 }, { "epoch": 2.7867528271405493, "grad_norm": 0.4158870047598975, "learning_rate": 3.0134602158429723e-05, "loss": 0.1614, "loss_nan_ranks": 0, "loss_rank_avg": 0.15733978152275085, "step": 1725, "valid_targets_mean": 6098.9, "valid_targets_min": 3073 }, { "epoch": 2.7948303715670435, "grad_norm": 0.43216407751154545, "learning_rate": 3.00650565992984e-05, "loss": 0.1626, "loss_nan_ranks": 0, "loss_rank_avg": 0.1826433390378952, "step": 1730, "valid_targets_mean": 5351.1, "valid_targets_min": 2817 }, { "epoch": 2.802907915993538, "grad_norm": 0.3883027870620293, "learning_rate": 2.999534767896604e-05, "loss": 0.1657, "loss_nan_ranks": 0, "loss_rank_avg": 0.14935646951198578, "step": 1735, "valid_targets_mean": 5830.9, "valid_targets_min": 4066 }, { "epoch": 2.8109854604200324, "grad_norm": 0.48044695829642137, "learning_rate": 2.992547652884536e-05, "loss": 0.1544, "loss_nan_ranks": 0, "loss_rank_avg": 0.16807019710540771, "step": 1740, "valid_targets_mean": 4481.2, "valid_targets_min": 2976 }, { "epoch": 2.8190630048465266, "grad_norm": 0.4140322247787378, "learning_rate": 2.985544428298213e-05, "loss": 0.162, "loss_nan_ranks": 0, "loss_rank_avg": 0.1593261957168579, "step": 1745, "valid_targets_mean": 5142.8, "valid_targets_min": 1294 }, { "epoch": 2.827140549273021, "grad_norm": 0.42543096236919437, "learning_rate": 2.978525207803681e-05, "loss": 0.1519, "loss_nan_ranks": 0, "loss_rank_avg": 0.1564638316631317, "step": 1750, "valid_targets_mean": 4954.4, "valid_targets_min": 3126 }, { "epoch": 2.8352180936995155, "grad_norm": 0.4694157233084932, "learning_rate": 2.9714901053266075e-05, "loss": 0.1599, "loss_nan_ranks": 0, "loss_rank_avg": 0.15422756969928741, "step": 1755, "valid_targets_mean": 4928.2, "valid_targets_min": 2928 }, { "epoch": 2.8432956381260097, "grad_norm": 0.4116696511240596, "learning_rate": 2.9644392350504322e-05, "loss": 0.1486, "loss_nan_ranks": 0, "loss_rank_avg": 0.15589065849781036, "step": 1760, "valid_targets_mean": 4785.0, "valid_targets_min": 3331 }, { "epoch": 2.851373182552504, "grad_norm": 0.41296699834187545, "learning_rate": 2.9573727114145162e-05, "loss": 0.1589, "loss_nan_ranks": 0, "loss_rank_avg": 0.18629789352416992, "step": 1765, "valid_targets_mean": 5090.4, "valid_targets_min": 3547 }, { "epoch": 2.8594507269789986, "grad_norm": 0.4347499443746334, "learning_rate": 2.9502906491122813e-05, "loss": 0.1535, "loss_nan_ranks": 0, "loss_rank_avg": 0.15154750645160675, "step": 1770, "valid_targets_mean": 5262.7, "valid_targets_min": 2874 }, { "epoch": 2.867528271405493, "grad_norm": 0.4141641791774333, "learning_rate": 2.9431931630893504e-05, "loss": 0.1654, "loss_nan_ranks": 0, "loss_rank_avg": 0.17479820549488068, "step": 1775, "valid_targets_mean": 5459.6, "valid_targets_min": 2579 }, { "epoch": 2.875605815831987, "grad_norm": 0.4638086659411083, "learning_rate": 2.9360803685416825e-05, "loss": 0.1532, "loss_nan_ranks": 0, "loss_rank_avg": 0.16348320245742798, "step": 1780, "valid_targets_mean": 5805.8, "valid_targets_min": 3612 }, { "epoch": 2.8836833602584813, "grad_norm": 0.4504562586687795, "learning_rate": 2.9289523809137016e-05, "loss": 0.1529, "loss_nan_ranks": 0, "loss_rank_avg": 0.1563473343849182, "step": 1785, "valid_targets_mean": 4970.2, "valid_targets_min": 3548 }, { "epoch": 2.891760904684976, "grad_norm": 0.38292898167329614, "learning_rate": 2.9218093158964227e-05, "loss": 0.1517, "loss_nan_ranks": 0, "loss_rank_avg": 0.15860334038734436, "step": 1790, "valid_targets_mean": 5831.6, "valid_targets_min": 3135 }, { "epoch": 2.89983844911147, "grad_norm": 0.3947814339597183, "learning_rate": 2.9146512894255755e-05, "loss": 0.1572, "loss_nan_ranks": 0, "loss_rank_avg": 0.16357748210430145, "step": 1795, "valid_targets_mean": 5600.8, "valid_targets_min": 2395 }, { "epoch": 2.9079159935379644, "grad_norm": 0.3773815244534708, "learning_rate": 2.907478417679722e-05, "loss": 0.1573, "loss_nan_ranks": 0, "loss_rank_avg": 0.15501318871974945, "step": 1800, "valid_targets_mean": 5604.1, "valid_targets_min": 3823 }, { "epoch": 2.915993537964459, "grad_norm": 0.49862612619338115, "learning_rate": 2.900290817078371e-05, "loss": 0.1569, "loss_nan_ranks": 0, "loss_rank_avg": 0.145344540476799, "step": 1805, "valid_targets_mean": 5771.7, "valid_targets_min": 2848 }, { "epoch": 2.9240710823909533, "grad_norm": 0.39778554749092054, "learning_rate": 2.893088604280088e-05, "loss": 0.1601, "loss_nan_ranks": 0, "loss_rank_avg": 0.157730370759964, "step": 1810, "valid_targets_mean": 5914.8, "valid_targets_min": 3646 }, { "epoch": 2.9321486268174475, "grad_norm": 0.3893095212067741, "learning_rate": 2.8858718961806028e-05, "loss": 0.1563, "loss_nan_ranks": 0, "loss_rank_avg": 0.17110855877399445, "step": 1815, "valid_targets_mean": 6156.4, "valid_targets_min": 3925 }, { "epoch": 2.9402261712439417, "grad_norm": 0.442018274409042, "learning_rate": 2.87864080991091e-05, "loss": 0.1571, "loss_nan_ranks": 0, "loss_rank_avg": 0.15044714510440826, "step": 1820, "valid_targets_mean": 4851.6, "valid_targets_min": 2939 }, { "epoch": 2.948303715670436, "grad_norm": 0.4241200775734895, "learning_rate": 2.8713954628353727e-05, "loss": 0.1534, "loss_nan_ranks": 0, "loss_rank_avg": 0.15260717272758484, "step": 1825, "valid_targets_mean": 4876.9, "valid_targets_min": 2759 }, { "epoch": 2.9563812600969306, "grad_norm": 0.4261849048816585, "learning_rate": 2.8641359725498106e-05, "loss": 0.1625, "loss_nan_ranks": 0, "loss_rank_avg": 0.18526265025138855, "step": 1830, "valid_targets_mean": 5735.2, "valid_targets_min": 1069 }, { "epoch": 2.964458804523425, "grad_norm": 0.4134324557091191, "learning_rate": 2.856862456879599e-05, "loss": 0.1458, "loss_nan_ranks": 0, "loss_rank_avg": 0.15292227268218994, "step": 1835, "valid_targets_mean": 4747.1, "valid_targets_min": 3410 }, { "epoch": 2.9725363489499195, "grad_norm": 0.4210915654521287, "learning_rate": 2.8495750338777487e-05, "loss": 0.1531, "loss_nan_ranks": 0, "loss_rank_avg": 0.15871697664260864, "step": 1840, "valid_targets_mean": 5455.9, "valid_targets_min": 3518 }, { "epoch": 2.9806138933764137, "grad_norm": 0.4495497695447994, "learning_rate": 2.8422738218229974e-05, "loss": 0.152, "loss_nan_ranks": 0, "loss_rank_avg": 0.16716666519641876, "step": 1845, "valid_targets_mean": 5352.4, "valid_targets_min": 3391 }, { "epoch": 2.988691437802908, "grad_norm": 1.5430872891092386, "learning_rate": 2.8349589392178843e-05, "loss": 0.1481, "loss_nan_ranks": 0, "loss_rank_avg": 0.13364684581756592, "step": 1850, "valid_targets_mean": 5169.6, "valid_targets_min": 3248 }, { "epoch": 2.996768982229402, "grad_norm": 0.385078503937771, "learning_rate": 2.827630504786829e-05, "loss": 0.1605, "loss_nan_ranks": 0, "loss_rank_avg": 0.15355360507965088, "step": 1855, "valid_targets_mean": 5491.1, "valid_targets_min": 3017 }, { "epoch": 3.004846526655897, "grad_norm": 0.3790490762550386, "learning_rate": 2.8202886374742062e-05, "loss": 0.1549, "loss_nan_ranks": 0, "loss_rank_avg": 0.17056137323379517, "step": 1860, "valid_targets_mean": 5756.8, "valid_targets_min": 2958 }, { "epoch": 3.012924071082391, "grad_norm": 0.3968150107316026, "learning_rate": 2.812933456442411e-05, "loss": 0.1541, "loss_nan_ranks": 0, "loss_rank_avg": 0.15332677960395813, "step": 1865, "valid_targets_mean": 5816.9, "valid_targets_min": 2930 }, { "epoch": 3.0210016155088852, "grad_norm": 0.4168205957829322, "learning_rate": 2.8055650810699286e-05, "loss": 0.1588, "loss_nan_ranks": 0, "loss_rank_avg": 0.17240363359451294, "step": 1870, "valid_targets_mean": 5458.4, "valid_targets_min": 1314 }, { "epoch": 3.0290791599353795, "grad_norm": 0.41901551796139186, "learning_rate": 2.7981836309493945e-05, "loss": 0.1468, "loss_nan_ranks": 0, "loss_rank_avg": 0.13956554234027863, "step": 1875, "valid_targets_mean": 5344.1, "valid_targets_min": 3291 }, { "epoch": 3.037156704361874, "grad_norm": 0.43648629037836206, "learning_rate": 2.790789225885656e-05, "loss": 0.1541, "loss_nan_ranks": 0, "loss_rank_avg": 0.1436006724834442, "step": 1880, "valid_targets_mean": 5276.2, "valid_targets_min": 256 }, { "epoch": 3.0452342487883683, "grad_norm": 0.38914872559345653, "learning_rate": 2.783381985893824e-05, "loss": 0.1487, "loss_nan_ranks": 0, "loss_rank_avg": 0.14736038446426392, "step": 1885, "valid_targets_mean": 5778.1, "valid_targets_min": 3255 }, { "epoch": 3.0533117932148626, "grad_norm": 0.371589235961242, "learning_rate": 2.775962031197328e-05, "loss": 0.1498, "loss_nan_ranks": 0, "loss_rank_avg": 0.1469155102968216, "step": 1890, "valid_targets_mean": 6252.9, "valid_targets_min": 3988 }, { "epoch": 3.0613893376413572, "grad_norm": 0.42447513418921207, "learning_rate": 2.768529482225964e-05, "loss": 0.1518, "loss_nan_ranks": 0, "loss_rank_avg": 0.1542665660381317, "step": 1895, "valid_targets_mean": 4997.4, "valid_targets_min": 3403 }, { "epoch": 3.0694668820678515, "grad_norm": 0.36654037754401236, "learning_rate": 2.761084459613939e-05, "loss": 0.1497, "loss_nan_ranks": 0, "loss_rank_avg": 0.14190000295639038, "step": 1900, "valid_targets_mean": 6075.4, "valid_targets_min": 3704 }, { "epoch": 3.0775444264943457, "grad_norm": 0.3991548440822749, "learning_rate": 2.7536270841979153e-05, "loss": 0.151, "loss_nan_ranks": 0, "loss_rank_avg": 0.14582324028015137, "step": 1905, "valid_targets_mean": 5232.4, "valid_targets_min": 3181 }, { "epoch": 3.08562197092084, "grad_norm": 0.3896275257772552, "learning_rate": 2.7461574770150457e-05, "loss": 0.152, "loss_nan_ranks": 0, "loss_rank_avg": 0.1319112479686737, "step": 1910, "valid_targets_mean": 5051.2, "valid_targets_min": 2904 }, { "epoch": 3.0936995153473346, "grad_norm": 0.40055785830035945, "learning_rate": 2.7386757593010127e-05, "loss": 0.1499, "loss_nan_ranks": 0, "loss_rank_avg": 0.14539475739002228, "step": 1915, "valid_targets_mean": 5449.8, "valid_targets_min": 2642 }, { "epoch": 3.101777059773829, "grad_norm": 0.41050944408580226, "learning_rate": 2.7311820524880584e-05, "loss": 0.1547, "loss_nan_ranks": 0, "loss_rank_avg": 0.15138906240463257, "step": 1920, "valid_targets_mean": 5428.7, "valid_targets_min": 3801 }, { "epoch": 3.109854604200323, "grad_norm": 0.414382801561421, "learning_rate": 2.7236764782030153e-05, "loss": 0.1496, "loss_nan_ranks": 0, "loss_rank_avg": 0.15684393048286438, "step": 1925, "valid_targets_mean": 5752.2, "valid_targets_min": 3445 }, { "epoch": 3.1179321486268172, "grad_norm": 0.4253007826394208, "learning_rate": 2.7161591582653293e-05, "loss": 0.1573, "loss_nan_ranks": 0, "loss_rank_avg": 0.15882694721221924, "step": 1930, "valid_targets_mean": 5576.8, "valid_targets_min": 999 }, { "epoch": 3.126009693053312, "grad_norm": 0.4116885191877429, "learning_rate": 2.708630214685086e-05, "loss": 0.1558, "loss_nan_ranks": 0, "loss_rank_avg": 0.1493636965751648, "step": 1935, "valid_targets_mean": 5349.6, "valid_targets_min": 2809 }, { "epoch": 3.134087237479806, "grad_norm": 0.3824930218093128, "learning_rate": 2.70108976966103e-05, "loss": 0.1562, "loss_nan_ranks": 0, "loss_rank_avg": 0.14908301830291748, "step": 1940, "valid_targets_mean": 5485.6, "valid_targets_min": 3274 }, { "epoch": 3.1421647819063003, "grad_norm": 0.43229853577719435, "learning_rate": 2.693537945578576e-05, "loss": 0.1515, "loss_nan_ranks": 0, "loss_rank_avg": 0.15119776129722595, "step": 1945, "valid_targets_mean": 5140.9, "valid_targets_min": 2373 }, { "epoch": 3.150242326332795, "grad_norm": 0.42884161042903884, "learning_rate": 2.6859748650078327e-05, "loss": 0.1601, "loss_nan_ranks": 0, "loss_rank_avg": 0.17630845308303833, "step": 1950, "valid_targets_mean": 5807.7, "valid_targets_min": 3410 }, { "epoch": 3.158319870759289, "grad_norm": 0.37371276792780805, "learning_rate": 2.678400650701602e-05, "loss": 0.1511, "loss_nan_ranks": 0, "loss_rank_avg": 0.1380992978811264, "step": 1955, "valid_targets_mean": 5687.8, "valid_targets_min": 2911 }, { "epoch": 3.1663974151857834, "grad_norm": 0.4145495752229891, "learning_rate": 2.6708154255933973e-05, "loss": 0.1444, "loss_nan_ranks": 0, "loss_rank_avg": 0.1371968537569046, "step": 1960, "valid_targets_mean": 4979.2, "valid_targets_min": 2518 }, { "epoch": 3.1744749596122777, "grad_norm": 0.4406884355216408, "learning_rate": 2.6632193127954393e-05, "loss": 0.1517, "loss_nan_ranks": 0, "loss_rank_avg": 0.1561473160982132, "step": 1965, "valid_targets_mean": 5259.7, "valid_targets_min": 1825 }, { "epoch": 3.1825525040387723, "grad_norm": 0.4179333160175781, "learning_rate": 2.6556124355966633e-05, "loss": 0.1575, "loss_nan_ranks": 0, "loss_rank_avg": 0.15797705948352814, "step": 1970, "valid_targets_mean": 5317.8, "valid_targets_min": 982 }, { "epoch": 3.1906300484652665, "grad_norm": 0.4068834683524423, "learning_rate": 2.6479949174607166e-05, "loss": 0.1557, "loss_nan_ranks": 0, "loss_rank_avg": 0.1401294469833374, "step": 1975, "valid_targets_mean": 6256.9, "valid_targets_min": 2170 }, { "epoch": 3.1987075928917608, "grad_norm": 0.46135880028117426, "learning_rate": 2.640366882023955e-05, "loss": 0.1549, "loss_nan_ranks": 0, "loss_rank_avg": 0.1438083052635193, "step": 1980, "valid_targets_mean": 4902.4, "valid_targets_min": 2561 }, { "epoch": 3.2067851373182554, "grad_norm": 0.3772951249061422, "learning_rate": 2.6327284530934333e-05, "loss": 0.1458, "loss_nan_ranks": 0, "loss_rank_avg": 0.13431373238563538, "step": 1985, "valid_targets_mean": 5266.6, "valid_targets_min": 3377 }, { "epoch": 3.2148626817447497, "grad_norm": 0.4365284090149285, "learning_rate": 2.625079754644901e-05, "loss": 0.1578, "loss_nan_ranks": 0, "loss_rank_avg": 0.14966890215873718, "step": 1990, "valid_targets_mean": 5547.6, "valid_targets_min": 3367 }, { "epoch": 3.222940226171244, "grad_norm": 0.4344060467491617, "learning_rate": 2.6174209108207858e-05, "loss": 0.1555, "loss_nan_ranks": 0, "loss_rank_avg": 0.15894004702568054, "step": 1995, "valid_targets_mean": 5271.2, "valid_targets_min": 2963 }, { "epoch": 3.231017770597738, "grad_norm": 0.4290654640834972, "learning_rate": 2.609752045928181e-05, "loss": 0.1502, "loss_nan_ranks": 0, "loss_rank_avg": 0.15122604370117188, "step": 2000, "valid_targets_mean": 4874.1, "valid_targets_min": 1618 }, { "epoch": 3.2390953150242328, "grad_norm": 0.40755382282044406, "learning_rate": 2.6020732844368253e-05, "loss": 0.1531, "loss_nan_ranks": 0, "loss_rank_avg": 0.15718157589435577, "step": 2005, "valid_targets_mean": 5710.7, "valid_targets_min": 3247 }, { "epoch": 3.247172859450727, "grad_norm": 0.45017496542152, "learning_rate": 2.5943847509770878e-05, "loss": 0.1635, "loss_nan_ranks": 0, "loss_rank_avg": 0.1719478964805603, "step": 2010, "valid_targets_mean": 5359.8, "valid_targets_min": 2700 }, { "epoch": 3.255250403877221, "grad_norm": 0.4623455962159807, "learning_rate": 2.586686570337939e-05, "loss": 0.1563, "loss_nan_ranks": 0, "loss_rank_avg": 0.15864837169647217, "step": 2015, "valid_targets_mean": 5411.4, "valid_targets_min": 2368 }, { "epoch": 3.263327948303716, "grad_norm": 0.3774210696224583, "learning_rate": 2.5789788674649287e-05, "loss": 0.1486, "loss_nan_ranks": 0, "loss_rank_avg": 0.15108612179756165, "step": 2020, "valid_targets_mean": 5870.5, "valid_targets_min": 3853 }, { "epoch": 3.27140549273021, "grad_norm": 0.3702630043239486, "learning_rate": 2.571261767458159e-05, "loss": 0.1539, "loss_nan_ranks": 0, "loss_rank_avg": 0.15424832701683044, "step": 2025, "valid_targets_mean": 6300.9, "valid_targets_min": 3895 }, { "epoch": 3.2794830371567043, "grad_norm": 0.42808499410597545, "learning_rate": 2.5635353955702517e-05, "loss": 0.1621, "loss_nan_ranks": 0, "loss_rank_avg": 0.15260916948318481, "step": 2030, "valid_targets_mean": 5049.5, "valid_targets_min": 3091 }, { "epoch": 3.2875605815831985, "grad_norm": 0.40554869240072816, "learning_rate": 2.5557998772043148e-05, "loss": 0.1511, "loss_nan_ranks": 0, "loss_rank_avg": 0.14066237211227417, "step": 2035, "valid_targets_mean": 4771.4, "valid_targets_min": 773 }, { "epoch": 3.295638126009693, "grad_norm": 0.4033053077584176, "learning_rate": 2.54805533791191e-05, "loss": 0.1536, "loss_nan_ranks": 0, "loss_rank_avg": 0.15944485366344452, "step": 2040, "valid_targets_mean": 5350.1, "valid_targets_min": 2479 }, { "epoch": 3.3037156704361874, "grad_norm": 0.4070671096794082, "learning_rate": 2.5403019033910137e-05, "loss": 0.152, "loss_nan_ranks": 0, "loss_rank_avg": 0.1527840942144394, "step": 2045, "valid_targets_mean": 5546.4, "valid_targets_min": 2999 }, { "epoch": 3.3117932148626816, "grad_norm": 0.40454651912809586, "learning_rate": 2.5325396994839748e-05, "loss": 0.151, "loss_nan_ranks": 0, "loss_rank_avg": 0.14618010818958282, "step": 2050, "valid_targets_mean": 4913.0, "valid_targets_min": 2799 }, { "epoch": 3.3198707592891763, "grad_norm": 0.4048992795149119, "learning_rate": 2.5247688521754758e-05, "loss": 0.1536, "loss_nan_ranks": 0, "loss_rank_avg": 0.16438153386116028, "step": 2055, "valid_targets_mean": 5300.4, "valid_targets_min": 3030 }, { "epoch": 3.3279483037156705, "grad_norm": 0.43565390906405965, "learning_rate": 2.5169894875904853e-05, "loss": 0.1489, "loss_nan_ranks": 0, "loss_rank_avg": 0.14154842495918274, "step": 2060, "valid_targets_mean": 4655.8, "valid_targets_min": 3134 }, { "epoch": 3.3360258481421647, "grad_norm": 0.400196945243683, "learning_rate": 2.509201731992212e-05, "loss": 0.1568, "loss_nan_ranks": 0, "loss_rank_avg": 0.15692731738090515, "step": 2065, "valid_targets_mean": 5103.1, "valid_targets_min": 3355 }, { "epoch": 3.344103392568659, "grad_norm": 0.3937349961185628, "learning_rate": 2.5014057117800556e-05, "loss": 0.1608, "loss_nan_ranks": 0, "loss_rank_avg": 0.14389444887638092, "step": 2070, "valid_targets_mean": 5687.6, "valid_targets_min": 2137 }, { "epoch": 3.3521809369951536, "grad_norm": 0.39353561868224096, "learning_rate": 2.4936015534875547e-05, "loss": 0.1527, "loss_nan_ranks": 0, "loss_rank_avg": 0.1426299661397934, "step": 2075, "valid_targets_mean": 4550.7, "valid_targets_min": 1747 }, { "epoch": 3.360258481421648, "grad_norm": 0.406929436006472, "learning_rate": 2.4857893837803313e-05, "loss": 0.1567, "loss_nan_ranks": 0, "loss_rank_avg": 0.15165364742279053, "step": 2080, "valid_targets_mean": 5169.2, "valid_targets_min": 3414 }, { "epoch": 3.368336025848142, "grad_norm": 0.6134118024117283, "learning_rate": 2.4779693294540407e-05, "loss": 0.1586, "loss_nan_ranks": 0, "loss_rank_avg": 0.1490992307662964, "step": 2085, "valid_targets_mean": 5403.9, "valid_targets_min": 3683 }, { "epoch": 3.3764135702746367, "grad_norm": 0.38653362977731454, "learning_rate": 2.470141517432306e-05, "loss": 0.1565, "loss_nan_ranks": 0, "loss_rank_avg": 0.13950718939304352, "step": 2090, "valid_targets_mean": 5945.8, "valid_targets_min": 3636 }, { "epoch": 3.384491114701131, "grad_norm": 0.4412013292005518, "learning_rate": 2.4623060747646643e-05, "loss": 0.1532, "loss_nan_ranks": 0, "loss_rank_avg": 0.1426210254430771, "step": 2095, "valid_targets_mean": 4918.0, "valid_targets_min": 2768 }, { "epoch": 3.392568659127625, "grad_norm": 0.4239121175423532, "learning_rate": 2.4544631286245007e-05, "loss": 0.1535, "loss_nan_ranks": 0, "loss_rank_avg": 0.16665086150169373, "step": 2100, "valid_targets_mean": 5425.8, "valid_targets_min": 2417 }, { "epoch": 3.4006462035541194, "grad_norm": 0.4186314057065351, "learning_rate": 2.4466128063069873e-05, "loss": 0.1515, "loss_nan_ranks": 0, "loss_rank_avg": 0.1559276580810547, "step": 2105, "valid_targets_mean": 5203.6, "valid_targets_min": 2440 }, { "epoch": 3.408723747980614, "grad_norm": 0.3986419672009297, "learning_rate": 2.4387552352270136e-05, "loss": 0.1522, "loss_nan_ranks": 0, "loss_rank_avg": 0.13025811314582825, "step": 2110, "valid_targets_mean": 4968.6, "valid_targets_min": 2560 }, { "epoch": 3.4168012924071083, "grad_norm": 0.38677721019528954, "learning_rate": 2.430890542917121e-05, "loss": 0.1404, "loss_nan_ranks": 0, "loss_rank_avg": 0.13195520639419556, "step": 2115, "valid_targets_mean": 6195.9, "valid_targets_min": 4188 }, { "epoch": 3.4248788368336025, "grad_norm": 0.37812614213504553, "learning_rate": 2.4230188570254328e-05, "loss": 0.1561, "loss_nan_ranks": 0, "loss_rank_avg": 0.14694543182849884, "step": 2120, "valid_targets_mean": 5629.4, "valid_targets_min": 2668 }, { "epoch": 3.432956381260097, "grad_norm": 0.3811752552651874, "learning_rate": 2.415140305313581e-05, "loss": 0.1494, "loss_nan_ranks": 0, "loss_rank_avg": 0.14528897404670715, "step": 2125, "valid_targets_mean": 6108.1, "valid_targets_min": 2661 }, { "epoch": 3.4410339256865914, "grad_norm": 0.44768742792803773, "learning_rate": 2.4072550156546343e-05, "loss": 0.1666, "loss_nan_ranks": 0, "loss_rank_avg": 0.17549705505371094, "step": 2130, "valid_targets_mean": 5012.2, "valid_targets_min": 1476 }, { "epoch": 3.4491114701130856, "grad_norm": 0.42807143683133275, "learning_rate": 2.399363116031022e-05, "loss": 0.1589, "loss_nan_ranks": 0, "loss_rank_avg": 0.15805082023143768, "step": 2135, "valid_targets_mean": 5021.9, "valid_targets_min": 3006 }, { "epoch": 3.45718901453958, "grad_norm": 0.38078146986186595, "learning_rate": 2.3914647345324543e-05, "loss": 0.1531, "loss_nan_ranks": 0, "loss_rank_avg": 0.14287428557872772, "step": 2140, "valid_targets_mean": 5498.7, "valid_targets_min": 3390 }, { "epoch": 3.4652665589660745, "grad_norm": 0.3851937956769129, "learning_rate": 2.3835599993538486e-05, "loss": 0.1531, "loss_nan_ranks": 0, "loss_rank_avg": 0.1542748063802719, "step": 2145, "valid_targets_mean": 6078.2, "valid_targets_min": 3209 }, { "epoch": 3.4733441033925687, "grad_norm": 0.43169567603841624, "learning_rate": 2.3756490387932458e-05, "loss": 0.1567, "loss_nan_ranks": 0, "loss_rank_avg": 0.15492887794971466, "step": 2150, "valid_targets_mean": 4833.4, "valid_targets_min": 3133 }, { "epoch": 3.481421647819063, "grad_norm": 0.3642965932222815, "learning_rate": 2.3677319812497252e-05, "loss": 0.1487, "loss_nan_ranks": 0, "loss_rank_avg": 0.1442583203315735, "step": 2155, "valid_targets_mean": 6142.7, "valid_targets_min": 2984 }, { "epoch": 3.489499192245557, "grad_norm": 0.366185985042951, "learning_rate": 2.359808955221326e-05, "loss": 0.1494, "loss_nan_ranks": 0, "loss_rank_avg": 0.15077048540115356, "step": 2160, "valid_targets_mean": 5692.4, "valid_targets_min": 4004 }, { "epoch": 3.497576736672052, "grad_norm": 0.399036857478809, "learning_rate": 2.351880089302958e-05, "loss": 0.1534, "loss_nan_ranks": 0, "loss_rank_avg": 0.14326925575733185, "step": 2165, "valid_targets_mean": 5415.2, "valid_targets_min": 2826 }, { "epoch": 3.505654281098546, "grad_norm": 0.4264292290712075, "learning_rate": 2.3439455121843157e-05, "loss": 0.1561, "loss_nan_ranks": 0, "loss_rank_avg": 0.16648367047309875, "step": 2170, "valid_targets_mean": 5267.7, "valid_targets_min": 2725 }, { "epoch": 3.5137318255250403, "grad_norm": 0.3993313828190049, "learning_rate": 2.33600535264779e-05, "loss": 0.1483, "loss_nan_ranks": 0, "loss_rank_avg": 0.14025278389453888, "step": 2175, "valid_targets_mean": 5846.4, "valid_targets_min": 3385 }, { "epoch": 3.5218093699515345, "grad_norm": 0.42577091740104067, "learning_rate": 2.3280597395663764e-05, "loss": 0.1549, "loss_nan_ranks": 0, "loss_rank_avg": 0.16203680634498596, "step": 2180, "valid_targets_mean": 5129.8, "valid_targets_min": 2050 }, { "epoch": 3.529886914378029, "grad_norm": 0.3971417885413414, "learning_rate": 2.3201088019015843e-05, "loss": 0.1533, "loss_nan_ranks": 0, "loss_rank_avg": 0.1632687896490097, "step": 2185, "valid_targets_mean": 5620.4, "valid_targets_min": 3488 }, { "epoch": 3.5379644588045234, "grad_norm": 0.4336661416116471, "learning_rate": 2.3121526687013448e-05, "loss": 0.1613, "loss_nan_ranks": 0, "loss_rank_avg": 0.1689453125, "step": 2190, "valid_targets_mean": 4963.4, "valid_targets_min": 2764 }, { "epoch": 3.546042003231018, "grad_norm": 0.4304892599162082, "learning_rate": 2.3041914690979157e-05, "loss": 0.1544, "loss_nan_ranks": 0, "loss_rank_avg": 0.15438434481620789, "step": 2195, "valid_targets_mean": 5219.6, "valid_targets_min": 826 }, { "epoch": 3.5541195476575123, "grad_norm": 0.44762639861098785, "learning_rate": 2.2962253323057834e-05, "loss": 0.1513, "loss_nan_ranks": 0, "loss_rank_avg": 0.15575367212295532, "step": 2200, "valid_targets_mean": 5476.6, "valid_targets_min": 2659 }, { "epoch": 3.5621970920840065, "grad_norm": 0.4112970830970271, "learning_rate": 2.288254387619568e-05, "loss": 0.16, "loss_nan_ranks": 0, "loss_rank_avg": 0.15437915921211243, "step": 2205, "valid_targets_mean": 4804.3, "valid_targets_min": 3202 }, { "epoch": 3.5702746365105007, "grad_norm": 0.4353593179660125, "learning_rate": 2.2802787644119265e-05, "loss": 0.149, "loss_nan_ranks": 0, "loss_rank_avg": 0.1426883041858673, "step": 2210, "valid_targets_mean": 4871.5, "valid_targets_min": 2812 }, { "epoch": 3.578352180936995, "grad_norm": 0.38606076115639726, "learning_rate": 2.272298592131447e-05, "loss": 0.1512, "loss_nan_ranks": 0, "loss_rank_avg": 0.14033401012420654, "step": 2215, "valid_targets_mean": 5166.7, "valid_targets_min": 1471 }, { "epoch": 3.5864297253634896, "grad_norm": 0.37884641017389226, "learning_rate": 2.264314000300555e-05, "loss": 0.1523, "loss_nan_ranks": 0, "loss_rank_avg": 0.144095778465271, "step": 2220, "valid_targets_mean": 5684.6, "valid_targets_min": 3165 }, { "epoch": 3.594507269789984, "grad_norm": 0.48067246758501286, "learning_rate": 2.2563251185134054e-05, "loss": 0.1456, "loss_nan_ranks": 0, "loss_rank_avg": 0.1463029831647873, "step": 2225, "valid_targets_mean": 5646.9, "valid_targets_min": 3291 }, { "epoch": 3.602584814216478, "grad_norm": 0.3994157579202727, "learning_rate": 2.248332076433782e-05, "loss": 0.1468, "loss_nan_ranks": 0, "loss_rank_avg": 0.13935203850269318, "step": 2230, "valid_targets_mean": 5540.3, "valid_targets_min": 2448 }, { "epoch": 3.6106623586429727, "grad_norm": 0.3991704899058015, "learning_rate": 2.2403350037929928e-05, "loss": 0.1505, "loss_nan_ranks": 0, "loss_rank_avg": 0.13998529314994812, "step": 2235, "valid_targets_mean": 5438.3, "valid_targets_min": 2712 }, { "epoch": 3.618739903069467, "grad_norm": 0.4060660237223782, "learning_rate": 2.2323340303877633e-05, "loss": 0.1588, "loss_nan_ranks": 0, "loss_rank_avg": 0.15896086394786835, "step": 2240, "valid_targets_mean": 5169.9, "valid_targets_min": 2435 }, { "epoch": 3.626817447495961, "grad_norm": 0.5493544951854048, "learning_rate": 2.224329286078131e-05, "loss": 0.1492, "loss_nan_ranks": 0, "loss_rank_avg": 0.15103283524513245, "step": 2245, "valid_targets_mean": 4844.8, "valid_targets_min": 2845 }, { "epoch": 3.6348949919224554, "grad_norm": 0.3800540098826123, "learning_rate": 2.2163209007853367e-05, "loss": 0.1494, "loss_nan_ranks": 0, "loss_rank_avg": 0.15237392485141754, "step": 2250, "valid_targets_mean": 6551.5, "valid_targets_min": 3834 }, { "epoch": 3.64297253634895, "grad_norm": 0.4234706738999503, "learning_rate": 2.2083090044897172e-05, "loss": 0.1521, "loss_nan_ranks": 0, "loss_rank_avg": 0.16106975078582764, "step": 2255, "valid_targets_mean": 5363.4, "valid_targets_min": 2606 }, { "epoch": 3.6510500807754442, "grad_norm": 0.3864243032489708, "learning_rate": 2.200293727228593e-05, "loss": 0.1543, "loss_nan_ranks": 0, "loss_rank_avg": 0.16979104280471802, "step": 2260, "valid_targets_mean": 6010.2, "valid_targets_min": 4332 }, { "epoch": 3.6591276252019385, "grad_norm": 0.4019173231742567, "learning_rate": 2.1922751990941614e-05, "loss": 0.1538, "loss_nan_ranks": 0, "loss_rank_avg": 0.15049397945404053, "step": 2265, "valid_targets_mean": 5629.3, "valid_targets_min": 3522 }, { "epoch": 3.667205169628433, "grad_norm": 0.42205042047957253, "learning_rate": 2.1842535502313816e-05, "loss": 0.1497, "loss_nan_ranks": 0, "loss_rank_avg": 0.15802344679832458, "step": 2270, "valid_targets_mean": 5414.5, "valid_targets_min": 2678 }, { "epoch": 3.6752827140549273, "grad_norm": 0.43674629248505054, "learning_rate": 2.1762289108358645e-05, "loss": 0.149, "loss_nan_ranks": 0, "loss_rank_avg": 0.1704617440700531, "step": 2275, "valid_targets_mean": 5013.8, "valid_targets_min": 2887 }, { "epoch": 3.6833602584814216, "grad_norm": 0.3875197904903836, "learning_rate": 2.1682014111517588e-05, "loss": 0.1558, "loss_nan_ranks": 0, "loss_rank_avg": 0.14359474182128906, "step": 2280, "valid_targets_mean": 5659.9, "valid_targets_min": 3261 }, { "epoch": 3.691437802907916, "grad_norm": 0.38330175090036805, "learning_rate": 2.1601711814696387e-05, "loss": 0.1534, "loss_nan_ranks": 0, "loss_rank_avg": 0.15725120902061462, "step": 2285, "valid_targets_mean": 5879.8, "valid_targets_min": 2714 }, { "epoch": 3.6995153473344105, "grad_norm": 0.4367315902170705, "learning_rate": 2.1521383521243842e-05, "loss": 0.1452, "loss_nan_ranks": 0, "loss_rank_avg": 0.13833829760551453, "step": 2290, "valid_targets_mean": 4894.6, "valid_targets_min": 3211 }, { "epoch": 3.7075928917609047, "grad_norm": 0.4581004559395213, "learning_rate": 2.1441030534930728e-05, "loss": 0.1415, "loss_nan_ranks": 0, "loss_rank_avg": 0.1371515393257141, "step": 2295, "valid_targets_mean": 5755.8, "valid_targets_min": 3641 }, { "epoch": 3.715670436187399, "grad_norm": 0.40780633076924916, "learning_rate": 2.1360654159928577e-05, "loss": 0.1505, "loss_nan_ranks": 0, "loss_rank_avg": 0.14940571784973145, "step": 2300, "valid_targets_mean": 5407.1, "valid_targets_min": 2902 }, { "epoch": 3.7237479806138936, "grad_norm": 0.4440265677355658, "learning_rate": 2.1280255700788542e-05, "loss": 0.1501, "loss_nan_ranks": 0, "loss_rank_avg": 0.15323799848556519, "step": 2305, "valid_targets_mean": 4922.2, "valid_targets_min": 2340 }, { "epoch": 3.731825525040388, "grad_norm": 0.41170826111410097, "learning_rate": 2.119983646242021e-05, "loss": 0.1494, "loss_nan_ranks": 0, "loss_rank_avg": 0.13932514190673828, "step": 2310, "valid_targets_mean": 5513.8, "valid_targets_min": 3219 }, { "epoch": 3.739903069466882, "grad_norm": 0.42184075604681603, "learning_rate": 2.1119397750070428e-05, "loss": 0.1517, "loss_nan_ranks": 0, "loss_rank_avg": 0.14799876511096954, "step": 2315, "valid_targets_mean": 5156.5, "valid_targets_min": 3263 }, { "epoch": 3.7479806138933762, "grad_norm": 0.4407278270429571, "learning_rate": 2.10389408693021e-05, "loss": 0.1465, "loss_nan_ranks": 0, "loss_rank_avg": 0.1560024917125702, "step": 2320, "valid_targets_mean": 5386.8, "valid_targets_min": 2776 }, { "epoch": 3.756058158319871, "grad_norm": 0.41160777876348226, "learning_rate": 2.095846712597304e-05, "loss": 0.1568, "loss_nan_ranks": 0, "loss_rank_avg": 0.1562466025352478, "step": 2325, "valid_targets_mean": 5080.0, "valid_targets_min": 2467 }, { "epoch": 3.764135702746365, "grad_norm": 0.46822578896832445, "learning_rate": 2.0877977826214737e-05, "loss": 0.1554, "loss_nan_ranks": 0, "loss_rank_avg": 0.16950945556163788, "step": 2330, "valid_targets_mean": 5497.2, "valid_targets_min": 3151 }, { "epoch": 3.7722132471728593, "grad_norm": 0.3987880976941857, "learning_rate": 2.079747427641116e-05, "loss": 0.1573, "loss_nan_ranks": 0, "loss_rank_avg": 0.16459164023399353, "step": 2335, "valid_targets_mean": 5201.4, "valid_targets_min": 3350 }, { "epoch": 3.780290791599354, "grad_norm": 0.4061680905283449, "learning_rate": 2.071695778317758e-05, "loss": 0.1475, "loss_nan_ranks": 0, "loss_rank_avg": 0.14735883474349976, "step": 2340, "valid_targets_mean": 5035.7, "valid_targets_min": 2845 }, { "epoch": 3.788368336025848, "grad_norm": 0.39441369050080427, "learning_rate": 2.0636429653339335e-05, "loss": 0.1491, "loss_nan_ranks": 0, "loss_rank_avg": 0.1540263593196869, "step": 2345, "valid_targets_mean": 5057.6, "valid_targets_min": 2274 }, { "epoch": 3.7964458804523424, "grad_norm": 0.416889915883133, "learning_rate": 2.0555891193910646e-05, "loss": 0.1476, "loss_nan_ranks": 0, "loss_rank_avg": 0.14710207283496857, "step": 2350, "valid_targets_mean": 4770.0, "valid_targets_min": 3236 }, { "epoch": 3.8045234248788367, "grad_norm": 0.40711401787943335, "learning_rate": 2.0475343712073363e-05, "loss": 0.1458, "loss_nan_ranks": 0, "loss_rank_avg": 0.15809385478496552, "step": 2355, "valid_targets_mean": 5591.0, "valid_targets_min": 2093 }, { "epoch": 3.8126009693053313, "grad_norm": 0.3903390563586942, "learning_rate": 2.0394788515155803e-05, "loss": 0.1444, "loss_nan_ranks": 0, "loss_rank_avg": 0.14185532927513123, "step": 2360, "valid_targets_mean": 5076.9, "valid_targets_min": 920 }, { "epoch": 3.8206785137318255, "grad_norm": 0.413416495294967, "learning_rate": 2.0314226910611478e-05, "loss": 0.1501, "loss_nan_ranks": 0, "loss_rank_avg": 0.14693567156791687, "step": 2365, "valid_targets_mean": 5353.4, "valid_targets_min": 3014 }, { "epoch": 3.8287560581583198, "grad_norm": 0.4039346596230813, "learning_rate": 2.023366020599792e-05, "loss": 0.1517, "loss_nan_ranks": 0, "loss_rank_avg": 0.1467030942440033, "step": 2370, "valid_targets_mean": 5815.2, "valid_targets_min": 2985 }, { "epoch": 3.8368336025848144, "grad_norm": 0.41298565389518715, "learning_rate": 2.0153089708955432e-05, "loss": 0.1518, "loss_nan_ranks": 0, "loss_rank_avg": 0.1566350758075714, "step": 2375, "valid_targets_mean": 5346.1, "valid_targets_min": 2150 }, { "epoch": 3.8449111470113086, "grad_norm": 0.4089974403263933, "learning_rate": 2.0072516727185854e-05, "loss": 0.1497, "loss_nan_ranks": 0, "loss_rank_avg": 0.15077462792396545, "step": 2380, "valid_targets_mean": 4935.6, "valid_targets_min": 2943 }, { "epoch": 3.852988691437803, "grad_norm": 0.42079270976668665, "learning_rate": 1.999194256843138e-05, "loss": 0.1511, "loss_nan_ranks": 0, "loss_rank_avg": 0.1612389087677002, "step": 2385, "valid_targets_mean": 5302.7, "valid_targets_min": 3147 }, { "epoch": 3.861066235864297, "grad_norm": 0.38147493590776055, "learning_rate": 1.9911368540453285e-05, "loss": 0.1433, "loss_nan_ranks": 0, "loss_rank_avg": 0.1430862843990326, "step": 2390, "valid_targets_mean": 5481.4, "valid_targets_min": 3173 }, { "epoch": 3.8691437802907918, "grad_norm": 0.41106419802822197, "learning_rate": 1.9830795951010737e-05, "loss": 0.1479, "loss_nan_ranks": 0, "loss_rank_avg": 0.15999916195869446, "step": 2395, "valid_targets_mean": 5510.4, "valid_targets_min": 3092 }, { "epoch": 3.877221324717286, "grad_norm": 0.4031529390937838, "learning_rate": 1.9750226107839546e-05, "loss": 0.15, "loss_nan_ranks": 0, "loss_rank_avg": 0.15642176568508148, "step": 2400, "valid_targets_mean": 5265.4, "valid_targets_min": 2776 }, { "epoch": 3.88529886914378, "grad_norm": 0.4187223419051394, "learning_rate": 1.966966031863096e-05, "loss": 0.1551, "loss_nan_ranks": 0, "loss_rank_avg": 0.15662488341331482, "step": 2405, "valid_targets_mean": 5388.5, "valid_targets_min": 3219 }, { "epoch": 3.893376413570275, "grad_norm": 0.42727605871459245, "learning_rate": 1.958909989101041e-05, "loss": 0.1499, "loss_nan_ranks": 0, "loss_rank_avg": 0.14462366700172424, "step": 2410, "valid_targets_mean": 5035.6, "valid_targets_min": 3184 }, { "epoch": 3.901453957996769, "grad_norm": 0.42498564523285326, "learning_rate": 1.9508546132516316e-05, "loss": 0.1516, "loss_nan_ranks": 0, "loss_rank_avg": 0.15392355620861053, "step": 2415, "valid_targets_mean": 5218.9, "valid_targets_min": 2957 }, { "epoch": 3.9095315024232633, "grad_norm": 0.3959878020726741, "learning_rate": 1.9428000350578874e-05, "loss": 0.1532, "loss_nan_ranks": 0, "loss_rank_avg": 0.14723697304725647, "step": 2420, "valid_targets_mean": 5313.4, "valid_targets_min": 3003 }, { "epoch": 3.9176090468497575, "grad_norm": 0.40065923174356644, "learning_rate": 1.9347463852498776e-05, "loss": 0.1525, "loss_nan_ranks": 0, "loss_rank_avg": 0.1575714349746704, "step": 2425, "valid_targets_mean": 5617.6, "valid_targets_min": 3985 }, { "epoch": 3.9256865912762517, "grad_norm": 0.44927439386069595, "learning_rate": 1.926693794542607e-05, "loss": 0.1514, "loss_nan_ranks": 0, "loss_rank_avg": 0.1579849123954773, "step": 2430, "valid_targets_mean": 4860.3, "valid_targets_min": 2840 }, { "epoch": 3.9337641357027464, "grad_norm": 0.3777485375355132, "learning_rate": 1.9186423936338886e-05, "loss": 0.1481, "loss_nan_ranks": 0, "loss_rank_avg": 0.13425903022289276, "step": 2435, "valid_targets_mean": 5260.8, "valid_targets_min": 1369 }, { "epoch": 3.9418416801292406, "grad_norm": 0.4350245152644942, "learning_rate": 1.9105923132022234e-05, "loss": 0.1527, "loss_nan_ranks": 0, "loss_rank_avg": 0.16233918070793152, "step": 2440, "valid_targets_mean": 4957.4, "valid_targets_min": 2768 }, { "epoch": 3.9499192245557353, "grad_norm": 0.4091057515846294, "learning_rate": 1.9025436839046834e-05, "loss": 0.1604, "loss_nan_ranks": 0, "loss_rank_avg": 0.15739592909812927, "step": 2445, "valid_targets_mean": 5077.9, "valid_targets_min": 2154 }, { "epoch": 3.9579967689822295, "grad_norm": 0.4097245633846646, "learning_rate": 1.894496636374786e-05, "loss": 0.1559, "loss_nan_ranks": 0, "loss_rank_avg": 0.1472896784543991, "step": 2450, "valid_targets_mean": 5508.9, "valid_targets_min": 1412 }, { "epoch": 3.9660743134087237, "grad_norm": 0.39627955516501584, "learning_rate": 1.8864513012203747e-05, "loss": 0.1483, "loss_nan_ranks": 0, "loss_rank_avg": 0.16468317806720734, "step": 2455, "valid_targets_mean": 6392.1, "valid_targets_min": 3349 }, { "epoch": 3.974151857835218, "grad_norm": 0.4209417514706817, "learning_rate": 1.8784078090215028e-05, "loss": 0.1509, "loss_nan_ranks": 0, "loss_rank_avg": 0.13668987154960632, "step": 2460, "valid_targets_mean": 4554.8, "valid_targets_min": 3061 }, { "epoch": 3.982229402261712, "grad_norm": 0.40708659888796483, "learning_rate": 1.8703662903283092e-05, "loss": 0.1586, "loss_nan_ranks": 0, "loss_rank_avg": 0.14635734260082245, "step": 2465, "valid_targets_mean": 5307.4, "valid_targets_min": 2869 }, { "epoch": 3.990306946688207, "grad_norm": 0.4201079145553348, "learning_rate": 1.8623268756589033e-05, "loss": 0.1519, "loss_nan_ranks": 0, "loss_rank_avg": 0.1568068265914917, "step": 2470, "valid_targets_mean": 5867.6, "valid_targets_min": 2861 }, { "epoch": 3.998384491114701, "grad_norm": 0.5636352727995623, "learning_rate": 1.8542896954972443e-05, "loss": 0.1536, "loss_nan_ranks": 0, "loss_rank_avg": 0.15685251355171204, "step": 2475, "valid_targets_mean": 4876.6, "valid_targets_min": 3117 }, { "epoch": 4.006462035541196, "grad_norm": 0.42565467595314055, "learning_rate": 1.846254880291024e-05, "loss": 0.1401, "loss_nan_ranks": 0, "loss_rank_avg": 0.12946423888206482, "step": 2480, "valid_targets_mean": 5089.5, "valid_targets_min": 3193 }, { "epoch": 4.01453957996769, "grad_norm": 0.44213909133955387, "learning_rate": 1.8382225604495505e-05, "loss": 0.1384, "loss_nan_ranks": 0, "loss_rank_avg": 0.14307674765586853, "step": 2485, "valid_targets_mean": 5329.4, "valid_targets_min": 2999 }, { "epoch": 4.022617124394184, "grad_norm": 0.43432375435262827, "learning_rate": 1.830192866341629e-05, "loss": 0.1346, "loss_nan_ranks": 0, "loss_rank_avg": 0.1415438950061798, "step": 2490, "valid_targets_mean": 5478.9, "valid_targets_min": 3263 }, { "epoch": 4.030694668820678, "grad_norm": 0.43445963751081745, "learning_rate": 1.822165928293451e-05, "loss": 0.1419, "loss_nan_ranks": 0, "loss_rank_avg": 0.15091031789779663, "step": 2495, "valid_targets_mean": 5127.4, "valid_targets_min": 906 }, { "epoch": 4.038772213247173, "grad_norm": 0.4037874438131497, "learning_rate": 1.8141418765864726e-05, "loss": 0.147, "loss_nan_ranks": 0, "loss_rank_avg": 0.14658978581428528, "step": 2500, "valid_targets_mean": 6061.2, "valid_targets_min": 2480 }, { "epoch": 4.046849757673667, "grad_norm": 0.42639107834727435, "learning_rate": 1.8061208414553033e-05, "loss": 0.1441, "loss_nan_ranks": 0, "loss_rank_avg": 0.13869735598564148, "step": 2505, "valid_targets_mean": 5297.2, "valid_targets_min": 3324 }, { "epoch": 4.054927302100162, "grad_norm": 0.4073550017785693, "learning_rate": 1.798102953085595e-05, "loss": 0.141, "loss_nan_ranks": 0, "loss_rank_avg": 0.12786024808883667, "step": 2510, "valid_targets_mean": 5235.1, "valid_targets_min": 2653 }, { "epoch": 4.063004846526656, "grad_norm": 0.41328082544496686, "learning_rate": 1.7900883416119216e-05, "loss": 0.1333, "loss_nan_ranks": 0, "loss_rank_avg": 0.12691153585910797, "step": 2515, "valid_targets_mean": 5156.7, "valid_targets_min": 1294 }, { "epoch": 4.07108239095315, "grad_norm": 0.4346008708708734, "learning_rate": 1.7820771371156737e-05, "loss": 0.1348, "loss_nan_ranks": 0, "loss_rank_avg": 0.1545967161655426, "step": 2520, "valid_targets_mean": 5345.7, "valid_targets_min": 2941 }, { "epoch": 4.079159935379645, "grad_norm": 0.47779679748632076, "learning_rate": 1.7740694696229463e-05, "loss": 0.1408, "loss_nan_ranks": 0, "loss_rank_avg": 0.15502513945102692, "step": 2525, "valid_targets_mean": 4844.4, "valid_targets_min": 3134 }, { "epoch": 4.087237479806139, "grad_norm": 0.43057242625314834, "learning_rate": 1.766065469102423e-05, "loss": 0.1434, "loss_nan_ranks": 0, "loss_rank_avg": 0.1366223692893982, "step": 2530, "valid_targets_mean": 4981.9, "valid_targets_min": 2603 }, { "epoch": 4.095315024232633, "grad_norm": 0.429086317612865, "learning_rate": 1.7580652654632745e-05, "loss": 0.14, "loss_nan_ranks": 0, "loss_rank_avg": 0.1400957852602005, "step": 2535, "valid_targets_mean": 5427.9, "valid_targets_min": 3298 }, { "epoch": 4.103392568659127, "grad_norm": 0.465331706392212, "learning_rate": 1.7500689885530435e-05, "loss": 0.1391, "loss_nan_ranks": 0, "loss_rank_avg": 0.13422629237174988, "step": 2540, "valid_targets_mean": 4903.6, "valid_targets_min": 256 }, { "epoch": 4.111470113085622, "grad_norm": 0.44363029506124135, "learning_rate": 1.7420767681555406e-05, "loss": 0.1443, "loss_nan_ranks": 0, "loss_rank_avg": 0.16646191477775574, "step": 2545, "valid_targets_mean": 5154.2, "valid_targets_min": 922 }, { "epoch": 4.119547657512117, "grad_norm": 0.43473031219865776, "learning_rate": 1.734088733988738e-05, "loss": 0.1363, "loss_nan_ranks": 0, "loss_rank_avg": 0.13686491549015045, "step": 2550, "valid_targets_mean": 5565.6, "valid_targets_min": 2904 }, { "epoch": 4.127625201938611, "grad_norm": 0.4531518269846548, "learning_rate": 1.7261050157026606e-05, "loss": 0.1313, "loss_nan_ranks": 0, "loss_rank_avg": 0.1368991732597351, "step": 2555, "valid_targets_mean": 5132.1, "valid_targets_min": 3521 }, { "epoch": 4.135702746365105, "grad_norm": 0.4536959505796717, "learning_rate": 1.7181257428772876e-05, "loss": 0.1396, "loss_nan_ranks": 0, "loss_rank_avg": 0.1559496521949768, "step": 2560, "valid_targets_mean": 5842.8, "valid_targets_min": 3620 }, { "epoch": 4.143780290791599, "grad_norm": 0.43018680374896995, "learning_rate": 1.7101510450204435e-05, "loss": 0.1355, "loss_nan_ranks": 0, "loss_rank_avg": 0.1514936238527298, "step": 2565, "valid_targets_mean": 5458.9, "valid_targets_min": 2870 }, { "epoch": 4.1518578352180935, "grad_norm": 0.45789834628046766, "learning_rate": 1.7021810515656993e-05, "loss": 0.1397, "loss_nan_ranks": 0, "loss_rank_avg": 0.14251697063446045, "step": 2570, "valid_targets_mean": 4443.4, "valid_targets_min": 2642 }, { "epoch": 4.159935379644588, "grad_norm": 0.4046050667132452, "learning_rate": 1.694215891870272e-05, "loss": 0.14, "loss_nan_ranks": 0, "loss_rank_avg": 0.1378990113735199, "step": 2575, "valid_targets_mean": 5174.7, "valid_targets_min": 3246 }, { "epoch": 4.168012924071083, "grad_norm": 0.39401964693624647, "learning_rate": 1.686255695212923e-05, "loss": 0.1475, "loss_nan_ranks": 0, "loss_rank_avg": 0.14063289761543274, "step": 2580, "valid_targets_mean": 5825.9, "valid_targets_min": 2571 }, { "epoch": 4.176090468497577, "grad_norm": 0.4149990311373484, "learning_rate": 1.678300590791861e-05, "loss": 0.1352, "loss_nan_ranks": 0, "loss_rank_avg": 0.12822958827018738, "step": 2585, "valid_targets_mean": 5082.3, "valid_targets_min": 3157 }, { "epoch": 4.184168012924071, "grad_norm": 0.4724232157465758, "learning_rate": 1.6703507077226456e-05, "loss": 0.139, "loss_nan_ranks": 0, "loss_rank_avg": 0.14374995231628418, "step": 2590, "valid_targets_mean": 5187.9, "valid_targets_min": 2995 }, { "epoch": 4.1922455573505655, "grad_norm": 0.42323445983331587, "learning_rate": 1.6624061750360903e-05, "loss": 0.1397, "loss_nan_ranks": 0, "loss_rank_avg": 0.13836079835891724, "step": 2595, "valid_targets_mean": 4957.8, "valid_targets_min": 2629 }, { "epoch": 4.20032310177706, "grad_norm": 0.4554566483557804, "learning_rate": 1.6544671216761713e-05, "loss": 0.1372, "loss_nan_ranks": 0, "loss_rank_avg": 0.14031758904457092, "step": 2600, "valid_targets_mean": 5175.9, "valid_targets_min": 2404 }, { "epoch": 4.208400646203554, "grad_norm": 0.4430945069630982, "learning_rate": 1.6465336764979292e-05, "loss": 0.1353, "loss_nan_ranks": 0, "loss_rank_avg": 0.13017365336418152, "step": 2605, "valid_targets_mean": 4475.2, "valid_targets_min": 2718 }, { "epoch": 4.216478190630048, "grad_norm": 0.4501689534740505, "learning_rate": 1.638605968265382e-05, "loss": 0.1341, "loss_nan_ranks": 0, "loss_rank_avg": 0.12520724534988403, "step": 2610, "valid_targets_mean": 5041.1, "valid_targets_min": 3294 }, { "epoch": 4.224555735056542, "grad_norm": 0.5609815427967917, "learning_rate": 1.630684125649436e-05, "loss": 0.1353, "loss_nan_ranks": 0, "loss_rank_avg": 0.136855348944664, "step": 2615, "valid_targets_mean": 5298.2, "valid_targets_min": 3349 }, { "epoch": 4.2326332794830375, "grad_norm": 0.42487595678563556, "learning_rate": 1.6227682772257917e-05, "loss": 0.1389, "loss_nan_ranks": 0, "loss_rank_avg": 0.14639994502067566, "step": 2620, "valid_targets_mean": 5180.0, "valid_targets_min": 1936 }, { "epoch": 4.240710823909532, "grad_norm": 0.49601400066615947, "learning_rate": 1.614858551472865e-05, "loss": 0.1374, "loss_nan_ranks": 0, "loss_rank_avg": 0.1491582691669464, "step": 2625, "valid_targets_mean": 4556.6, "valid_targets_min": 587 }, { "epoch": 4.248788368336026, "grad_norm": 0.4777696243054849, "learning_rate": 1.606955076769694e-05, "loss": 0.1358, "loss_nan_ranks": 0, "loss_rank_avg": 0.14732205867767334, "step": 2630, "valid_targets_mean": 4729.9, "valid_targets_min": 3100 }, { "epoch": 4.25686591276252, "grad_norm": 0.3994414220127131, "learning_rate": 1.599057981393861e-05, "loss": 0.1368, "loss_nan_ranks": 0, "loss_rank_avg": 0.13781988620758057, "step": 2635, "valid_targets_mean": 5807.2, "valid_targets_min": 3105 }, { "epoch": 4.264943457189014, "grad_norm": 0.42041612018001095, "learning_rate": 1.5911673935194076e-05, "loss": 0.1406, "loss_nan_ranks": 0, "loss_rank_avg": 0.13944032788276672, "step": 2640, "valid_targets_mean": 5278.3, "valid_targets_min": 3270 }, { "epoch": 4.273021001615509, "grad_norm": 0.45473382797456474, "learning_rate": 1.5832834412147555e-05, "loss": 0.1463, "loss_nan_ranks": 0, "loss_rank_avg": 0.1407957673072815, "step": 2645, "valid_targets_mean": 5380.7, "valid_targets_min": 3752 }, { "epoch": 4.281098546042003, "grad_norm": 0.393765619903028, "learning_rate": 1.5754062524406268e-05, "loss": 0.1414, "loss_nan_ranks": 0, "loss_rank_avg": 0.14375929534435272, "step": 2650, "valid_targets_mean": 5499.1, "valid_targets_min": 2657 }, { "epoch": 4.289176090468498, "grad_norm": 0.41567383960953874, "learning_rate": 1.56753595504797e-05, "loss": 0.1422, "loss_nan_ranks": 0, "loss_rank_avg": 0.1321938931941986, "step": 2655, "valid_targets_mean": 5447.8, "valid_targets_min": 2886 }, { "epoch": 4.297253634894992, "grad_norm": 0.3821655224339751, "learning_rate": 1.55967267677588e-05, "loss": 0.1438, "loss_nan_ranks": 0, "loss_rank_avg": 0.13490810990333557, "step": 2660, "valid_targets_mean": 5990.6, "valid_targets_min": 3450 }, { "epoch": 4.305331179321486, "grad_norm": 0.3877345295764598, "learning_rate": 1.55181654524953e-05, "loss": 0.1347, "loss_nan_ranks": 0, "loss_rank_avg": 0.12980371713638306, "step": 2665, "valid_targets_mean": 5655.2, "valid_targets_min": 3541 }, { "epoch": 4.313408723747981, "grad_norm": 0.3800794993104672, "learning_rate": 1.5439676879780967e-05, "loss": 0.143, "loss_nan_ranks": 0, "loss_rank_avg": 0.14696776866912842, "step": 2670, "valid_targets_mean": 6074.6, "valid_targets_min": 2990 }, { "epoch": 4.321486268174475, "grad_norm": 0.43433424667276765, "learning_rate": 1.536126232352691e-05, "loss": 0.1372, "loss_nan_ranks": 0, "loss_rank_avg": 0.14254535734653473, "step": 2675, "valid_targets_mean": 5378.1, "valid_targets_min": 3445 }, { "epoch": 4.329563812600969, "grad_norm": 0.4918736832136846, "learning_rate": 1.5282923056442937e-05, "loss": 0.1444, "loss_nan_ranks": 0, "loss_rank_avg": 0.12696698307991028, "step": 2680, "valid_targets_mean": 5071.9, "valid_targets_min": 3521 }, { "epoch": 4.337641357027463, "grad_norm": 0.42555336980945496, "learning_rate": 1.5204660350016837e-05, "loss": 0.1408, "loss_nan_ranks": 0, "loss_rank_avg": 0.15498827397823334, "step": 2685, "valid_targets_mean": 5173.1, "valid_targets_min": 1768 }, { "epoch": 4.345718901453958, "grad_norm": 0.4748149092313879, "learning_rate": 1.5126475474493825e-05, "loss": 0.132, "loss_nan_ranks": 0, "loss_rank_avg": 0.1370469033718109, "step": 2690, "valid_targets_mean": 5121.7, "valid_targets_min": 2159 }, { "epoch": 4.353796445880453, "grad_norm": 0.3777654185593629, "learning_rate": 1.504836969885583e-05, "loss": 0.1416, "loss_nan_ranks": 0, "loss_rank_avg": 0.1358526647090912, "step": 2695, "valid_targets_mean": 6279.1, "valid_targets_min": 3547 }, { "epoch": 4.361873990306947, "grad_norm": 0.38522738434416426, "learning_rate": 1.4970344290800971e-05, "loss": 0.1378, "loss_nan_ranks": 0, "loss_rank_avg": 0.1352044939994812, "step": 2700, "valid_targets_mean": 5467.2, "valid_targets_min": 2092 }, { "epoch": 4.369951534733441, "grad_norm": 0.4645665341976508, "learning_rate": 1.4892400516722978e-05, "loss": 0.1399, "loss_nan_ranks": 0, "loss_rank_avg": 0.14225059747695923, "step": 2705, "valid_targets_mean": 5347.4, "valid_targets_min": 2911 }, { "epoch": 4.378029079159935, "grad_norm": 0.4848170535572879, "learning_rate": 1.4814539641690574e-05, "loss": 0.1394, "loss_nan_ranks": 0, "loss_rank_avg": 0.14791812002658844, "step": 2710, "valid_targets_mean": 4669.4, "valid_targets_min": 936 }, { "epoch": 4.386106623586429, "grad_norm": 0.4151190917642315, "learning_rate": 1.4736762929427029e-05, "loss": 0.1392, "loss_nan_ranks": 0, "loss_rank_avg": 0.13626649975776672, "step": 2715, "valid_targets_mean": 4952.8, "valid_targets_min": 1603 }, { "epoch": 4.394184168012924, "grad_norm": 0.39763403121391977, "learning_rate": 1.4659071642289586e-05, "loss": 0.1378, "loss_nan_ranks": 0, "loss_rank_avg": 0.13494357466697693, "step": 2720, "valid_targets_mean": 5396.2, "valid_targets_min": 3598 }, { "epoch": 4.402261712439419, "grad_norm": 0.4411026275876086, "learning_rate": 1.4581467041248987e-05, "loss": 0.1394, "loss_nan_ranks": 0, "loss_rank_avg": 0.14752957224845886, "step": 2725, "valid_targets_mean": 5540.3, "valid_targets_min": 3036 }, { "epoch": 4.410339256865913, "grad_norm": 0.40905042976740047, "learning_rate": 1.450395038586903e-05, "loss": 0.1418, "loss_nan_ranks": 0, "loss_rank_avg": 0.13268199563026428, "step": 2730, "valid_targets_mean": 5190.2, "valid_targets_min": 3000 }, { "epoch": 4.418416801292407, "grad_norm": 0.4297968504084322, "learning_rate": 1.4426522934286101e-05, "loss": 0.1438, "loss_nan_ranks": 0, "loss_rank_avg": 0.1449374258518219, "step": 2735, "valid_targets_mean": 4803.5, "valid_targets_min": 1305 }, { "epoch": 4.426494345718901, "grad_norm": 0.412783061241555, "learning_rate": 1.4349185943188748e-05, "loss": 0.142, "loss_nan_ranks": 0, "loss_rank_avg": 0.1454753279685974, "step": 2740, "valid_targets_mean": 5826.1, "valid_targets_min": 3507 }, { "epoch": 4.434571890145396, "grad_norm": 0.41250103264883276, "learning_rate": 1.4271940667797324e-05, "loss": 0.1402, "loss_nan_ranks": 0, "loss_rank_avg": 0.13304153084754944, "step": 2745, "valid_targets_mean": 5462.4, "valid_targets_min": 2791 }, { "epoch": 4.44264943457189, "grad_norm": 0.4502312399331622, "learning_rate": 1.4194788361843563e-05, "loss": 0.1425, "loss_nan_ranks": 0, "loss_rank_avg": 0.13922573626041412, "step": 2750, "valid_targets_mean": 5384.1, "valid_targets_min": 3369 }, { "epoch": 4.450726978998384, "grad_norm": 0.41469346574409216, "learning_rate": 1.411773027755027e-05, "loss": 0.1415, "loss_nan_ranks": 0, "loss_rank_avg": 0.16563090682029724, "step": 2755, "valid_targets_mean": 5837.9, "valid_targets_min": 3309 }, { "epoch": 4.458804523424879, "grad_norm": 0.433737086009782, "learning_rate": 1.4040767665610981e-05, "loss": 0.1392, "loss_nan_ranks": 0, "loss_rank_avg": 0.14223286509513855, "step": 2760, "valid_targets_mean": 5067.8, "valid_targets_min": 3270 }, { "epoch": 4.466882067851373, "grad_norm": 0.41723969171999564, "learning_rate": 1.396390177516965e-05, "loss": 0.1312, "loss_nan_ranks": 0, "loss_rank_avg": 0.1245618462562561, "step": 2765, "valid_targets_mean": 5411.2, "valid_targets_min": 2965 }, { "epoch": 4.474959612277868, "grad_norm": 0.4127449084932179, "learning_rate": 1.3887133853800418e-05, "loss": 0.1369, "loss_nan_ranks": 0, "loss_rank_avg": 0.1349238157272339, "step": 2770, "valid_targets_mean": 5649.5, "valid_targets_min": 3148 }, { "epoch": 4.483037156704362, "grad_norm": 0.44963424947146446, "learning_rate": 1.3810465147487305e-05, "loss": 0.1425, "loss_nan_ranks": 0, "loss_rank_avg": 0.14304043352603912, "step": 2775, "valid_targets_mean": 5597.4, "valid_targets_min": 2511 }, { "epoch": 4.491114701130856, "grad_norm": 0.4019246775715318, "learning_rate": 1.373389690060405e-05, "loss": 0.1359, "loss_nan_ranks": 0, "loss_rank_avg": 0.13364571332931519, "step": 2780, "valid_targets_mean": 5670.1, "valid_targets_min": 3242 }, { "epoch": 4.49919224555735, "grad_norm": 0.4594474877153609, "learning_rate": 1.3657430355893855e-05, "loss": 0.1325, "loss_nan_ranks": 0, "loss_rank_avg": 0.12532834708690643, "step": 2785, "valid_targets_mean": 5329.9, "valid_targets_min": 2668 }, { "epoch": 4.5072697899838445, "grad_norm": 0.4134999029055612, "learning_rate": 1.3581066754449246e-05, "loss": 0.1367, "loss_nan_ranks": 0, "loss_rank_avg": 0.13771578669548035, "step": 2790, "valid_targets_mean": 5896.8, "valid_targets_min": 2730 }, { "epoch": 4.51534733441034, "grad_norm": 0.41778304086801016, "learning_rate": 1.3504807335691948e-05, "loss": 0.1462, "loss_nan_ranks": 0, "loss_rank_avg": 0.15168075263500214, "step": 2795, "valid_targets_mean": 5395.0, "valid_targets_min": 3492 }, { "epoch": 4.523424878836834, "grad_norm": 0.4403664374264896, "learning_rate": 1.3428653337352722e-05, "loss": 0.1396, "loss_nan_ranks": 0, "loss_rank_avg": 0.1525859832763672, "step": 2800, "valid_targets_mean": 5305.6, "valid_targets_min": 3771 }, { "epoch": 4.531502423263328, "grad_norm": 0.4078756485043072, "learning_rate": 1.3352605995451295e-05, "loss": 0.1421, "loss_nan_ranks": 0, "loss_rank_avg": 0.13579663634300232, "step": 2805, "valid_targets_mean": 5819.9, "valid_targets_min": 3028 }, { "epoch": 4.539579967689822, "grad_norm": 0.47241584949791804, "learning_rate": 1.3276666544276338e-05, "loss": 0.1334, "loss_nan_ranks": 0, "loss_rank_avg": 0.12606637179851532, "step": 2810, "valid_targets_mean": 5300.6, "valid_targets_min": 3032 }, { "epoch": 4.5476575121163165, "grad_norm": 0.4472552136291, "learning_rate": 1.3200836216365357e-05, "loss": 0.147, "loss_nan_ranks": 0, "loss_rank_avg": 0.16859114170074463, "step": 2815, "valid_targets_mean": 5528.4, "valid_targets_min": 3139 }, { "epoch": 4.555735056542811, "grad_norm": 0.4314047387299008, "learning_rate": 1.3125116242484761e-05, "loss": 0.1467, "loss_nan_ranks": 0, "loss_rank_avg": 0.14334100484848022, "step": 2820, "valid_targets_mean": 5568.1, "valid_targets_min": 1120 }, { "epoch": 4.563812600969305, "grad_norm": 0.4770918683992712, "learning_rate": 1.3049507851609837e-05, "loss": 0.1369, "loss_nan_ranks": 0, "loss_rank_avg": 0.1330651342868805, "step": 2825, "valid_targets_mean": 4386.8, "valid_targets_min": 2747 }, { "epoch": 4.5718901453958, "grad_norm": 0.4870368298725214, "learning_rate": 1.2974012270904824e-05, "loss": 0.1398, "loss_nan_ranks": 0, "loss_rank_avg": 0.14877751469612122, "step": 2830, "valid_targets_mean": 4765.4, "valid_targets_min": 2739 }, { "epoch": 4.579967689822294, "grad_norm": 0.44178395738617654, "learning_rate": 1.2898630725703e-05, "loss": 0.1464, "loss_nan_ranks": 0, "loss_rank_avg": 0.14977668225765228, "step": 2835, "valid_targets_mean": 5217.3, "valid_targets_min": 3492 }, { "epoch": 4.5880452342487885, "grad_norm": 0.39914740501270685, "learning_rate": 1.2823364439486775e-05, "loss": 0.1412, "loss_nan_ranks": 0, "loss_rank_avg": 0.14151275157928467, "step": 2840, "valid_targets_mean": 6049.9, "valid_targets_min": 2668 }, { "epoch": 4.596122778675283, "grad_norm": 0.43543696709388485, "learning_rate": 1.2748214633867852e-05, "loss": 0.1388, "loss_nan_ranks": 0, "loss_rank_avg": 0.1313113123178482, "step": 2845, "valid_targets_mean": 5043.1, "valid_targets_min": 665 }, { "epoch": 4.604200323101777, "grad_norm": 0.43160935343861717, "learning_rate": 1.2673182528567394e-05, "loss": 0.1408, "loss_nan_ranks": 0, "loss_rank_avg": 0.16229557991027832, "step": 2850, "valid_targets_mean": 5334.7, "valid_targets_min": 1412 }, { "epoch": 4.612277867528271, "grad_norm": 0.4112636471282577, "learning_rate": 1.2598269341396212e-05, "loss": 0.1357, "loss_nan_ranks": 0, "loss_rank_avg": 0.14326302707195282, "step": 2855, "valid_targets_mean": 5666.9, "valid_targets_min": 2840 }, { "epoch": 4.620355411954765, "grad_norm": 0.4193132603434726, "learning_rate": 1.2523476288235035e-05, "loss": 0.1336, "loss_nan_ranks": 0, "loss_rank_avg": 0.11997410655021667, "step": 2860, "valid_targets_mean": 5055.6, "valid_targets_min": 2936 }, { "epoch": 4.6284329563812605, "grad_norm": 0.40727152336695605, "learning_rate": 1.2448804583014734e-05, "loss": 0.1402, "loss_nan_ranks": 0, "loss_rank_avg": 0.14037710428237915, "step": 2865, "valid_targets_mean": 5948.5, "valid_targets_min": 3460 }, { "epoch": 4.636510500807755, "grad_norm": 0.4576903143700993, "learning_rate": 1.237425543769664e-05, "loss": 0.145, "loss_nan_ranks": 0, "loss_rank_avg": 0.1467304229736328, "step": 2870, "valid_targets_mean": 4774.2, "valid_targets_min": 3035 }, { "epoch": 4.644588045234249, "grad_norm": 0.383155018230044, "learning_rate": 1.229983006225289e-05, "loss": 0.1373, "loss_nan_ranks": 0, "loss_rank_avg": 0.12850114703178406, "step": 2875, "valid_targets_mean": 5473.4, "valid_targets_min": 2920 }, { "epoch": 4.652665589660743, "grad_norm": 0.42907692476292697, "learning_rate": 1.2225529664646743e-05, "loss": 0.1433, "loss_nan_ranks": 0, "loss_rank_avg": 0.1375298947095871, "step": 2880, "valid_targets_mean": 5756.6, "valid_targets_min": 3347 }, { "epoch": 4.660743134087237, "grad_norm": 0.45578066384811955, "learning_rate": 1.2151355450813032e-05, "loss": 0.142, "loss_nan_ranks": 0, "loss_rank_avg": 0.13910695910453796, "step": 2885, "valid_targets_mean": 5256.9, "valid_targets_min": 2607 }, { "epoch": 4.668820678513732, "grad_norm": 0.4392376613684911, "learning_rate": 1.207730862463854e-05, "loss": 0.1373, "loss_nan_ranks": 0, "loss_rank_avg": 0.1305842101573944, "step": 2890, "valid_targets_mean": 5400.7, "valid_targets_min": 3440 }, { "epoch": 4.676898222940226, "grad_norm": 0.43322009220366464, "learning_rate": 1.2003390387942472e-05, "loss": 0.1448, "loss_nan_ranks": 0, "loss_rank_avg": 0.13938024640083313, "step": 2895, "valid_targets_mean": 5202.0, "valid_targets_min": 3009 }, { "epoch": 4.684975767366721, "grad_norm": 0.42387663404361464, "learning_rate": 1.192960194045699e-05, "loss": 0.1331, "loss_nan_ranks": 0, "loss_rank_avg": 0.13488176465034485, "step": 2900, "valid_targets_mean": 5007.9, "valid_targets_min": 1583 }, { "epoch": 4.693053311793215, "grad_norm": 0.5059478326875065, "learning_rate": 1.1855944479807678e-05, "loss": 0.1459, "loss_nan_ranks": 0, "loss_rank_avg": 0.15618818998336792, "step": 2905, "valid_targets_mean": 4973.8, "valid_targets_min": 2736 }, { "epoch": 4.701130856219709, "grad_norm": 0.39919140562243194, "learning_rate": 1.1782419201494154e-05, "loss": 0.1366, "loss_nan_ranks": 0, "loss_rank_avg": 0.12572744488716125, "step": 2910, "valid_targets_mean": 5450.1, "valid_targets_min": 3087 }, { "epoch": 4.709208400646204, "grad_norm": 0.4809512538206678, "learning_rate": 1.1709027298870632e-05, "loss": 0.1372, "loss_nan_ranks": 0, "loss_rank_avg": 0.1231696754693985, "step": 2915, "valid_targets_mean": 5773.8, "valid_targets_min": 2820 }, { "epoch": 4.717285945072698, "grad_norm": 0.41574868747529725, "learning_rate": 1.1635769963126573e-05, "loss": 0.1352, "loss_nan_ranks": 0, "loss_rank_avg": 0.1308540552854538, "step": 2920, "valid_targets_mean": 5483.6, "valid_targets_min": 3132 }, { "epoch": 4.725363489499192, "grad_norm": 0.40307841075512413, "learning_rate": 1.1562648383267358e-05, "loss": 0.1384, "loss_nan_ranks": 0, "loss_rank_avg": 0.13654011487960815, "step": 2925, "valid_targets_mean": 5368.4, "valid_targets_min": 3448 }, { "epoch": 4.733441033925686, "grad_norm": 0.536090353564831, "learning_rate": 1.1489663746094953e-05, "loss": 0.1465, "loss_nan_ranks": 0, "loss_rank_avg": 0.1650780290365219, "step": 2930, "valid_targets_mean": 4809.2, "valid_targets_min": 2689 }, { "epoch": 4.741518578352181, "grad_norm": 0.4830950093812901, "learning_rate": 1.1416817236188695e-05, "loss": 0.1382, "loss_nan_ranks": 0, "loss_rank_avg": 0.14563900232315063, "step": 2935, "valid_targets_mean": 5572.7, "valid_targets_min": 3211 }, { "epoch": 4.749596122778676, "grad_norm": 0.4126946285281672, "learning_rate": 1.1344110035886038e-05, "loss": 0.1446, "loss_nan_ranks": 0, "loss_rank_avg": 0.1415388286113739, "step": 2940, "valid_targets_mean": 5840.8, "valid_targets_min": 3161 }, { "epoch": 4.75767366720517, "grad_norm": 0.4183524471538227, "learning_rate": 1.1271543325263342e-05, "loss": 0.1402, "loss_nan_ranks": 0, "loss_rank_avg": 0.14083191752433777, "step": 2945, "valid_targets_mean": 5269.1, "valid_targets_min": 1018 }, { "epoch": 4.765751211631664, "grad_norm": 0.40863305060929256, "learning_rate": 1.1199118282116797e-05, "loss": 0.14, "loss_nan_ranks": 0, "loss_rank_avg": 0.13962915539741516, "step": 2950, "valid_targets_mean": 5663.4, "valid_targets_min": 3494 }, { "epoch": 4.773828756058158, "grad_norm": 0.48244071805874694, "learning_rate": 1.1126836081943199e-05, "loss": 0.1439, "loss_nan_ranks": 0, "loss_rank_avg": 0.15097686648368835, "step": 2955, "valid_targets_mean": 4976.0, "valid_targets_min": 2044 }, { "epoch": 4.7819063004846525, "grad_norm": 0.4261822766446634, "learning_rate": 1.1054697897920963e-05, "loss": 0.1347, "loss_nan_ranks": 0, "loss_rank_avg": 0.1349121630191803, "step": 2960, "valid_targets_mean": 4968.2, "valid_targets_min": 1307 }, { "epoch": 4.789983844911147, "grad_norm": 0.5078548452558224, "learning_rate": 1.098270490089104e-05, "loss": 0.1348, "loss_nan_ranks": 0, "loss_rank_avg": 0.1354251205921173, "step": 2965, "valid_targets_mean": 5543.1, "valid_targets_min": 2942 }, { "epoch": 4.798061389337642, "grad_norm": 0.43986780155442085, "learning_rate": 1.0910858259337896e-05, "loss": 0.1374, "loss_nan_ranks": 0, "loss_rank_avg": 0.13416457176208496, "step": 2970, "valid_targets_mean": 4822.5, "valid_targets_min": 1904 }, { "epoch": 4.806138933764136, "grad_norm": 0.43214223060348766, "learning_rate": 1.0839159139370597e-05, "loss": 0.1425, "loss_nan_ranks": 0, "loss_rank_avg": 0.13904398679733276, "step": 2975, "valid_targets_mean": 5033.6, "valid_targets_min": 3069 }, { "epoch": 4.81421647819063, "grad_norm": 0.44873477765055975, "learning_rate": 1.0767608704703852e-05, "loss": 0.135, "loss_nan_ranks": 0, "loss_rank_avg": 0.14608915150165558, "step": 2980, "valid_targets_mean": 4896.9, "valid_targets_min": 3119 }, { "epoch": 4.8222940226171245, "grad_norm": 0.42963463585563594, "learning_rate": 1.0696208116639108e-05, "loss": 0.1321, "loss_nan_ranks": 0, "loss_rank_avg": 0.13478168845176697, "step": 2985, "valid_targets_mean": 5041.9, "valid_targets_min": 2861 }, { "epoch": 4.830371567043619, "grad_norm": 0.4184747605118807, "learning_rate": 1.0624958534045748e-05, "loss": 0.1362, "loss_nan_ranks": 0, "loss_rank_avg": 0.1315079629421234, "step": 2990, "valid_targets_mean": 4842.6, "valid_targets_min": 2395 }, { "epoch": 4.838449111470113, "grad_norm": 0.4507756298256187, "learning_rate": 1.055386111334225e-05, "loss": 0.1417, "loss_nan_ranks": 0, "loss_rank_avg": 0.1261076033115387, "step": 2995, "valid_targets_mean": 5323.1, "valid_targets_min": 2606 }, { "epoch": 4.846526655896607, "grad_norm": 0.4213500877752229, "learning_rate": 1.0482917008477406e-05, "loss": 0.1375, "loss_nan_ranks": 0, "loss_rank_avg": 0.1388499140739441, "step": 3000, "valid_targets_mean": 5244.6, "valid_targets_min": 2050 }, { "epoch": 4.854604200323102, "grad_norm": 0.4394120888553323, "learning_rate": 1.0412127370911627e-05, "loss": 0.1424, "loss_nan_ranks": 0, "loss_rank_avg": 0.1536855250597, "step": 3005, "valid_targets_mean": 5368.1, "valid_targets_min": 2641 }, { "epoch": 4.8626817447495965, "grad_norm": 0.4350239563816111, "learning_rate": 1.034149334959824e-05, "loss": 0.1399, "loss_nan_ranks": 0, "loss_rank_avg": 0.13980424404144287, "step": 3010, "valid_targets_mean": 5067.7, "valid_targets_min": 3414 }, { "epoch": 4.870759289176091, "grad_norm": 0.4385149359865282, "learning_rate": 1.0271016090964836e-05, "loss": 0.1415, "loss_nan_ranks": 0, "loss_rank_avg": 0.1483292281627655, "step": 3015, "valid_targets_mean": 5908.5, "valid_targets_min": 3151 }, { "epoch": 4.878836833602585, "grad_norm": 0.4021151824125644, "learning_rate": 1.0200696738894651e-05, "loss": 0.1395, "loss_nan_ranks": 0, "loss_rank_avg": 0.1273038387298584, "step": 3020, "valid_targets_mean": 5290.0, "valid_targets_min": 2564 }, { "epoch": 4.886914378029079, "grad_norm": 0.4468569200340916, "learning_rate": 1.0130536434708024e-05, "loss": 0.1388, "loss_nan_ranks": 0, "loss_rank_avg": 0.130598783493042, "step": 3025, "valid_targets_mean": 5362.9, "valid_targets_min": 4032 }, { "epoch": 4.894991922455573, "grad_norm": 0.4066728906290766, "learning_rate": 1.0060536317143877e-05, "loss": 0.1416, "loss_nan_ranks": 0, "loss_rank_avg": 0.1388537734746933, "step": 3030, "valid_targets_mean": 5224.4, "valid_targets_min": 826 }, { "epoch": 4.903069466882068, "grad_norm": 0.7116931473944323, "learning_rate": 9.990697522341179e-06, "loss": 0.1309, "loss_nan_ranks": 0, "loss_rank_avg": 0.13971570134162903, "step": 3035, "valid_targets_mean": 4791.1, "valid_targets_min": 2942 }, { "epoch": 4.911147011308563, "grad_norm": 0.4071326459613783, "learning_rate": 9.921021183820601e-06, "loss": 0.1414, "loss_nan_ranks": 0, "loss_rank_avg": 0.1335953325033188, "step": 3040, "valid_targets_mean": 5521.1, "valid_targets_min": 3073 }, { "epoch": 4.919224555735057, "grad_norm": 0.42992397938879723, "learning_rate": 9.851508432466006e-06, "loss": 0.1312, "loss_nan_ranks": 0, "loss_rank_avg": 0.13599014282226562, "step": 3045, "valid_targets_mean": 4856.4, "valid_targets_min": 1595 }, { "epoch": 4.927302100161551, "grad_norm": 0.4990884521696119, "learning_rate": 9.782160396506187e-06, "loss": 0.1422, "loss_nan_ranks": 0, "loss_rank_avg": 0.14541074633598328, "step": 3050, "valid_targets_mean": 4448.3, "valid_targets_min": 3020 }, { "epoch": 4.935379644588045, "grad_norm": 0.422162536375542, "learning_rate": 9.712978201496512e-06, "loss": 0.1375, "loss_nan_ranks": 0, "loss_rank_avg": 0.13707958161830902, "step": 3055, "valid_targets_mean": 4581.8, "valid_targets_min": 2808 }, { "epoch": 4.94345718901454, "grad_norm": 0.40274962941480746, "learning_rate": 9.643962970300646e-06, "loss": 0.1392, "loss_nan_ranks": 0, "loss_rank_avg": 0.13235828280448914, "step": 3060, "valid_targets_mean": 5385.7, "valid_targets_min": 2964 }, { "epoch": 4.951534733441034, "grad_norm": 0.41106224144589665, "learning_rate": 9.575115823072366e-06, "loss": 0.1385, "loss_nan_ranks": 0, "loss_rank_avg": 0.15319183468818665, "step": 3065, "valid_targets_mean": 5383.4, "valid_targets_min": 3733 }, { "epoch": 4.959612277867528, "grad_norm": 0.4368314776007296, "learning_rate": 9.506437877237346e-06, "loss": 0.1308, "loss_nan_ranks": 0, "loss_rank_avg": 0.13027821481227875, "step": 3070, "valid_targets_mean": 5122.1, "valid_targets_min": 3149 }, { "epoch": 4.967689822294023, "grad_norm": 0.44034403884405504, "learning_rate": 9.437930247475023e-06, "loss": 0.1411, "loss_nan_ranks": 0, "loss_rank_avg": 0.129189133644104, "step": 3075, "valid_targets_mean": 4822.6, "valid_targets_min": 3038 }, { "epoch": 4.975767366720517, "grad_norm": 0.4280324030430042, "learning_rate": 9.36959404570053e-06, "loss": 0.1328, "loss_nan_ranks": 0, "loss_rank_avg": 0.13658729195594788, "step": 3080, "valid_targets_mean": 4948.9, "valid_targets_min": 1227 }, { "epoch": 4.983844911147012, "grad_norm": 0.4238657423203, "learning_rate": 9.30143038104663e-06, "loss": 0.1362, "loss_nan_ranks": 0, "loss_rank_avg": 0.12977300584316254, "step": 3085, "valid_targets_mean": 5721.9, "valid_targets_min": 3482 }, { "epoch": 4.991922455573506, "grad_norm": 0.48199672073194927, "learning_rate": 9.233440359845703e-06, "loss": 0.1486, "loss_nan_ranks": 0, "loss_rank_avg": 0.18151067197322845, "step": 3090, "valid_targets_mean": 5081.3, "valid_targets_min": 2827 }, { "epoch": 5.0, "grad_norm": 0.44906074019942926, "learning_rate": 9.165625085611818e-06, "loss": 0.1378, "loss_nan_ranks": 0, "loss_rank_avg": 0.14372006058692932, "step": 3095, "valid_targets_mean": 4968.9, "valid_targets_min": 3162 }, { "epoch": 5.008077544426494, "grad_norm": 0.43772755900870186, "learning_rate": 9.097985659022808e-06, "loss": 0.1305, "loss_nan_ranks": 0, "loss_rank_avg": 0.1423802673816681, "step": 3100, "valid_targets_mean": 5149.9, "valid_targets_min": 2678 }, { "epoch": 5.016155088852988, "grad_norm": 0.43633990751021157, "learning_rate": 9.030523177902403e-06, "loss": 0.1288, "loss_nan_ranks": 0, "loss_rank_avg": 0.13901320099830627, "step": 3105, "valid_targets_mean": 5018.6, "valid_targets_min": 3138 }, { "epoch": 5.024232633279483, "grad_norm": 0.43155930945131143, "learning_rate": 8.963238737202405e-06, "loss": 0.1433, "loss_nan_ranks": 0, "loss_rank_avg": 0.1326574683189392, "step": 3110, "valid_targets_mean": 5598.6, "valid_targets_min": 3441 }, { "epoch": 5.032310177705978, "grad_norm": 0.44926415068891506, "learning_rate": 8.896133428984935e-06, "loss": 0.1292, "loss_nan_ranks": 0, "loss_rank_avg": 0.13450875878334045, "step": 3115, "valid_targets_mean": 5065.4, "valid_targets_min": 2402 }, { "epoch": 5.040387722132472, "grad_norm": 0.41465194337253264, "learning_rate": 8.829208342404709e-06, "loss": 0.1295, "loss_nan_ranks": 0, "loss_rank_avg": 0.11707586795091629, "step": 3120, "valid_targets_mean": 5308.8, "valid_targets_min": 3109 }, { "epoch": 5.048465266558966, "grad_norm": 0.4216992603049396, "learning_rate": 8.762464563691315e-06, "loss": 0.1316, "loss_nan_ranks": 0, "loss_rank_avg": 0.11611682176589966, "step": 3125, "valid_targets_mean": 5293.1, "valid_targets_min": 2159 }, { "epoch": 5.05654281098546, "grad_norm": 0.44501179934754415, "learning_rate": 8.695903176131671e-06, "loss": 0.1314, "loss_nan_ranks": 0, "loss_rank_avg": 0.11896132677793503, "step": 3130, "valid_targets_mean": 5573.8, "valid_targets_min": 2874 }, { "epoch": 5.064620355411955, "grad_norm": 0.3946578295576979, "learning_rate": 8.62952526005234e-06, "loss": 0.128, "loss_nan_ranks": 0, "loss_rank_avg": 0.131038099527359, "step": 3135, "valid_targets_mean": 6400.7, "valid_targets_min": 3402 }, { "epoch": 5.072697899838449, "grad_norm": 0.45436587295250586, "learning_rate": 8.563331892802076e-06, "loss": 0.1286, "loss_nan_ranks": 0, "loss_rank_avg": 0.117171511054039, "step": 3140, "valid_targets_mean": 4811.6, "valid_targets_min": 2952 }, { "epoch": 5.080775444264943, "grad_norm": 0.40209870031547296, "learning_rate": 8.497324148734301e-06, "loss": 0.1312, "loss_nan_ranks": 0, "loss_rank_avg": 0.1264287829399109, "step": 3145, "valid_targets_mean": 5566.0, "valid_targets_min": 2714 }, { "epoch": 5.088852988691438, "grad_norm": 0.45442895826783986, "learning_rate": 8.431503099189663e-06, "loss": 0.1325, "loss_nan_ranks": 0, "loss_rank_avg": 0.1307426542043686, "step": 3150, "valid_targets_mean": 4966.5, "valid_targets_min": 2668 }, { "epoch": 5.096930533117932, "grad_norm": 0.43759406598068035, "learning_rate": 8.36586981247867e-06, "loss": 0.1262, "loss_nan_ranks": 0, "loss_rank_avg": 0.12658154964447021, "step": 3155, "valid_targets_mean": 5125.0, "valid_targets_min": 3152 }, { "epoch": 5.105008077544427, "grad_norm": 0.4329307110240369, "learning_rate": 8.300425353864347e-06, "loss": 0.1315, "loss_nan_ranks": 0, "loss_rank_avg": 0.12121981382369995, "step": 3160, "valid_targets_mean": 5237.1, "valid_targets_min": 3475 }, { "epoch": 5.113085621970921, "grad_norm": 0.40729526908685826, "learning_rate": 8.235170785544915e-06, "loss": 0.1261, "loss_nan_ranks": 0, "loss_rank_avg": 0.12251444905996323, "step": 3165, "valid_targets_mean": 5824.7, "valid_targets_min": 3889 }, { "epoch": 5.121163166397415, "grad_norm": 0.4037150575762845, "learning_rate": 8.170107166636598e-06, "loss": 0.1384, "loss_nan_ranks": 0, "loss_rank_avg": 0.14814183115959167, "step": 3170, "valid_targets_mean": 6272.6, "valid_targets_min": 3781 }, { "epoch": 5.129240710823909, "grad_norm": 0.4471386441574684, "learning_rate": 8.105235553156407e-06, "loss": 0.1324, "loss_nan_ranks": 0, "loss_rank_avg": 0.13282373547554016, "step": 3175, "valid_targets_mean": 4648.6, "valid_targets_min": 2869 }, { "epoch": 5.1373182552504035, "grad_norm": 0.4227276424268678, "learning_rate": 8.040556998004983e-06, "loss": 0.1271, "loss_nan_ranks": 0, "loss_rank_avg": 0.12098711729049683, "step": 3180, "valid_targets_mean": 5430.0, "valid_targets_min": 3431 }, { "epoch": 5.145395799676899, "grad_norm": 0.4509975577793107, "learning_rate": 7.97607255094955e-06, "loss": 0.131, "loss_nan_ranks": 0, "loss_rank_avg": 0.13260114192962646, "step": 3185, "valid_targets_mean": 5342.8, "valid_targets_min": 2395 }, { "epoch": 5.153473344103393, "grad_norm": 0.4477220807877767, "learning_rate": 7.91178325860685e-06, "loss": 0.124, "loss_nan_ranks": 0, "loss_rank_avg": 0.12227153778076172, "step": 3190, "valid_targets_mean": 5051.9, "valid_targets_min": 2560 }, { "epoch": 5.161550888529887, "grad_norm": 0.4264237924218974, "learning_rate": 7.847690164426158e-06, "loss": 0.1322, "loss_nan_ranks": 0, "loss_rank_avg": 0.12720181047916412, "step": 3195, "valid_targets_mean": 5173.0, "valid_targets_min": 2556 }, { "epoch": 5.169628432956381, "grad_norm": 0.49404814187524054, "learning_rate": 7.783794308672343e-06, "loss": 0.1309, "loss_nan_ranks": 0, "loss_rank_avg": 0.13522876799106598, "step": 3200, "valid_targets_mean": 4619.8, "valid_targets_min": 935 }, { "epoch": 5.1777059773828755, "grad_norm": 0.4602724062856385, "learning_rate": 7.720096728408997e-06, "loss": 0.1261, "loss_nan_ranks": 0, "loss_rank_avg": 0.12243683636188507, "step": 3205, "valid_targets_mean": 4999.7, "valid_targets_min": 1595 }, { "epoch": 5.18578352180937, "grad_norm": 0.4411519856570941, "learning_rate": 7.656598457481605e-06, "loss": 0.138, "loss_nan_ranks": 0, "loss_rank_avg": 0.1451737880706787, "step": 3210, "valid_targets_mean": 5547.5, "valid_targets_min": 1618 }, { "epoch": 5.193861066235864, "grad_norm": 0.4378288689722619, "learning_rate": 7.593300526500729e-06, "loss": 0.1276, "loss_nan_ranks": 0, "loss_rank_avg": 0.1233760267496109, "step": 3215, "valid_targets_mean": 5512.4, "valid_targets_min": 3502 }, { "epoch": 5.201938610662358, "grad_norm": 0.47342394353383355, "learning_rate": 7.530203962825331e-06, "loss": 0.1284, "loss_nan_ranks": 0, "loss_rank_avg": 0.12568993866443634, "step": 3220, "valid_targets_mean": 4450.1, "valid_targets_min": 3026 }, { "epoch": 5.210016155088853, "grad_norm": 0.4796869582707379, "learning_rate": 7.467309790546069e-06, "loss": 0.125, "loss_nan_ranks": 0, "loss_rank_avg": 0.12920737266540527, "step": 3225, "valid_targets_mean": 5082.8, "valid_targets_min": 3288 }, { "epoch": 5.2180936995153475, "grad_norm": 0.4160624936206936, "learning_rate": 7.40461903046868e-06, "loss": 0.125, "loss_nan_ranks": 0, "loss_rank_avg": 0.1330195665359497, "step": 3230, "valid_targets_mean": 5481.2, "valid_targets_min": 2841 }, { "epoch": 5.226171243941842, "grad_norm": 0.4510127933852413, "learning_rate": 7.34213270009742e-06, "loss": 0.1308, "loss_nan_ranks": 0, "loss_rank_avg": 0.1508096605539322, "step": 3235, "valid_targets_mean": 5563.2, "valid_targets_min": 3330 }, { "epoch": 5.234248788368336, "grad_norm": 0.4432108039540858, "learning_rate": 7.2798518136185195e-06, "loss": 0.1288, "loss_nan_ranks": 0, "loss_rank_avg": 0.14449772238731384, "step": 3240, "valid_targets_mean": 5562.4, "valid_targets_min": 3147 }, { "epoch": 5.24232633279483, "grad_norm": 0.4836206888531536, "learning_rate": 7.2177773818837744e-06, "loss": 0.1416, "loss_nan_ranks": 0, "loss_rank_avg": 0.14104701578617096, "step": 3245, "valid_targets_mean": 4805.9, "valid_targets_min": 2348 }, { "epoch": 5.250403877221324, "grad_norm": 0.4230418368080128, "learning_rate": 7.1559104123941e-06, "loss": 0.1196, "loss_nan_ranks": 0, "loss_rank_avg": 0.1265610009431839, "step": 3250, "valid_targets_mean": 5207.2, "valid_targets_min": 3414 }, { "epoch": 5.258481421647819, "grad_norm": 0.44816877933584826, "learning_rate": 7.094251909283181e-06, "loss": 0.1293, "loss_nan_ranks": 0, "loss_rank_avg": 0.11602858453989029, "step": 3255, "valid_targets_mean": 4590.4, "valid_targets_min": 2297 }, { "epoch": 5.266558966074314, "grad_norm": 0.43966715189943295, "learning_rate": 7.0328028733011875e-06, "loss": 0.1277, "loss_nan_ranks": 0, "loss_rank_avg": 0.12680992484092712, "step": 3260, "valid_targets_mean": 5906.9, "valid_targets_min": 2735 }, { "epoch": 5.274636510500808, "grad_norm": 0.4378291301058054, "learning_rate": 6.971564301798543e-06, "loss": 0.1292, "loss_nan_ranks": 0, "loss_rank_avg": 0.12160511314868927, "step": 3265, "valid_targets_mean": 5089.8, "valid_targets_min": 2870 }, { "epoch": 5.282714054927302, "grad_norm": 0.4000060678767217, "learning_rate": 6.91053718870969e-06, "loss": 0.1309, "loss_nan_ranks": 0, "loss_rank_avg": 0.12655307352542877, "step": 3270, "valid_targets_mean": 5991.4, "valid_targets_min": 2731 }, { "epoch": 5.290791599353796, "grad_norm": 0.4099273992124578, "learning_rate": 6.8497225245370144e-06, "loss": 0.1257, "loss_nan_ranks": 0, "loss_rank_avg": 0.1262008100748062, "step": 3275, "valid_targets_mean": 5426.8, "valid_targets_min": 2333 }, { "epoch": 5.298869143780291, "grad_norm": 0.4364288531777203, "learning_rate": 6.78912129633474e-06, "loss": 0.1337, "loss_nan_ranks": 0, "loss_rank_avg": 0.1258752942085266, "step": 3280, "valid_targets_mean": 5990.5, "valid_targets_min": 2789 }, { "epoch": 5.306946688206785, "grad_norm": 0.4393195781993097, "learning_rate": 6.728734487692894e-06, "loss": 0.133, "loss_nan_ranks": 0, "loss_rank_avg": 0.1283208578824997, "step": 3285, "valid_targets_mean": 4943.7, "valid_targets_min": 2061 }, { "epoch": 5.315024232633279, "grad_norm": 0.4903622209303023, "learning_rate": 6.668563078721382e-06, "loss": 0.1214, "loss_nan_ranks": 0, "loss_rank_avg": 0.11967407166957855, "step": 3290, "valid_targets_mean": 4793.8, "valid_targets_min": 3392 }, { "epoch": 5.323101777059774, "grad_norm": 0.45020393410672527, "learning_rate": 6.608608046034046e-06, "loss": 0.1321, "loss_nan_ranks": 0, "loss_rank_avg": 0.13561296463012695, "step": 3295, "valid_targets_mean": 5099.8, "valid_targets_min": 2654 }, { "epoch": 5.331179321486268, "grad_norm": 0.45266802210645696, "learning_rate": 6.54887036273284e-06, "loss": 0.1282, "loss_nan_ranks": 0, "loss_rank_avg": 0.11593136191368103, "step": 3300, "valid_targets_mean": 4864.9, "valid_targets_min": 3313 }, { "epoch": 5.339256865912763, "grad_norm": 0.4377571625246567, "learning_rate": 6.489350998392001e-06, "loss": 0.1266, "loss_nan_ranks": 0, "loss_rank_avg": 0.12568038702011108, "step": 3305, "valid_targets_mean": 5153.2, "valid_targets_min": 2897 }, { "epoch": 5.347334410339257, "grad_norm": 0.43303242638782025, "learning_rate": 6.430050919042347e-06, "loss": 0.1357, "loss_nan_ranks": 0, "loss_rank_avg": 0.13954932987689972, "step": 3310, "valid_targets_mean": 6399.5, "valid_targets_min": 4216 }, { "epoch": 5.355411954765751, "grad_norm": 0.44970687075331883, "learning_rate": 6.370971087155591e-06, "loss": 0.1281, "loss_nan_ranks": 0, "loss_rank_avg": 0.13170082867145538, "step": 3315, "valid_targets_mean": 5281.7, "valid_targets_min": 3191 }, { "epoch": 5.363489499192245, "grad_norm": 0.4332525900942074, "learning_rate": 6.312112461628697e-06, "loss": 0.127, "loss_nan_ranks": 0, "loss_rank_avg": 0.12100870907306671, "step": 3320, "valid_targets_mean": 5090.7, "valid_targets_min": 2566 }, { "epoch": 5.3715670436187395, "grad_norm": 0.4382168631917469, "learning_rate": 6.253475997768348e-06, "loss": 0.1326, "loss_nan_ranks": 0, "loss_rank_avg": 0.13327665627002716, "step": 3325, "valid_targets_mean": 5236.8, "valid_targets_min": 2975 }, { "epoch": 5.379644588045235, "grad_norm": 0.42660852601181254, "learning_rate": 6.195062647275408e-06, "loss": 0.1271, "loss_nan_ranks": 0, "loss_rank_avg": 0.12060268223285675, "step": 3330, "valid_targets_mean": 5242.0, "valid_targets_min": 2180 }, { "epoch": 5.387722132471729, "grad_norm": 0.4373544379702163, "learning_rate": 6.136873358229507e-06, "loss": 0.1341, "loss_nan_ranks": 0, "loss_rank_avg": 0.11785711348056793, "step": 3335, "valid_targets_mean": 5259.1, "valid_targets_min": 2708 }, { "epoch": 5.395799676898223, "grad_norm": 0.41586955748569704, "learning_rate": 6.078909075073642e-06, "loss": 0.1323, "loss_nan_ranks": 0, "loss_rank_avg": 0.1338985115289688, "step": 3340, "valid_targets_mean": 6643.9, "valid_targets_min": 3093 }, { "epoch": 5.403877221324717, "grad_norm": 0.4180961613164803, "learning_rate": 6.021170738598827e-06, "loss": 0.1275, "loss_nan_ranks": 0, "loss_rank_avg": 0.12959451973438263, "step": 3345, "valid_targets_mean": 5452.9, "valid_targets_min": 2867 }, { "epoch": 5.4119547657512115, "grad_norm": 0.44161500993929853, "learning_rate": 5.9636592859288536e-06, "loss": 0.1308, "loss_nan_ranks": 0, "loss_rank_avg": 0.14301708340644836, "step": 3350, "valid_targets_mean": 5461.9, "valid_targets_min": 3516 }, { "epoch": 5.420032310177706, "grad_norm": 0.4327699310648836, "learning_rate": 5.906375650505078e-06, "loss": 0.1306, "loss_nan_ranks": 0, "loss_rank_avg": 0.12899701297283173, "step": 3355, "valid_targets_mean": 5683.8, "valid_targets_min": 3401 }, { "epoch": 5.4281098546042, "grad_norm": 0.4773817043534635, "learning_rate": 5.84932076207124e-06, "loss": 0.1363, "loss_nan_ranks": 0, "loss_rank_avg": 0.14128807187080383, "step": 3360, "valid_targets_mean": 5567.1, "valid_targets_min": 3045 }, { "epoch": 5.436187399030695, "grad_norm": 0.4658579711976311, "learning_rate": 5.792495546658412e-06, "loss": 0.1294, "loss_nan_ranks": 0, "loss_rank_avg": 0.1277376413345337, "step": 3365, "valid_targets_mean": 5739.8, "valid_targets_min": 3299 }, { "epoch": 5.444264943457189, "grad_norm": 0.4584917541629052, "learning_rate": 5.7359009265699504e-06, "loss": 0.1311, "loss_nan_ranks": 0, "loss_rank_avg": 0.14182579517364502, "step": 3370, "valid_targets_mean": 4920.7, "valid_targets_min": 2618 }, { "epoch": 5.4523424878836835, "grad_norm": 0.4310834601799318, "learning_rate": 5.679537820366512e-06, "loss": 0.1301, "loss_nan_ranks": 0, "loss_rank_avg": 0.12319634854793549, "step": 3375, "valid_targets_mean": 5160.1, "valid_targets_min": 2577 }, { "epoch": 5.460420032310178, "grad_norm": 0.45882510774341584, "learning_rate": 5.623407142851176e-06, "loss": 0.1296, "loss_nan_ranks": 0, "loss_rank_avg": 0.13417544960975647, "step": 3380, "valid_targets_mean": 4943.8, "valid_targets_min": 2983 }, { "epoch": 5.468497576736672, "grad_norm": 0.4706822122675181, "learning_rate": 5.567509805054578e-06, "loss": 0.1245, "loss_nan_ranks": 0, "loss_rank_avg": 0.13072508573532104, "step": 3385, "valid_targets_mean": 5548.0, "valid_targets_min": 2401 }, { "epoch": 5.476575121163166, "grad_norm": 0.4430008079811621, "learning_rate": 5.5118467142201305e-06, "loss": 0.1316, "loss_nan_ranks": 0, "loss_rank_avg": 0.1270829737186432, "step": 3390, "valid_targets_mean": 4675.6, "valid_targets_min": 2274 }, { "epoch": 5.48465266558966, "grad_norm": 0.4055283775412177, "learning_rate": 5.456418773789274e-06, "loss": 0.1282, "loss_nan_ranks": 0, "loss_rank_avg": 0.12905651330947876, "step": 3395, "valid_targets_mean": 6398.8, "valid_targets_min": 3517 }, { "epoch": 5.4927302100161555, "grad_norm": 0.4292954787037575, "learning_rate": 5.401226883386856e-06, "loss": 0.14, "loss_nan_ranks": 0, "loss_rank_avg": 0.13923311233520508, "step": 3400, "valid_targets_mean": 5949.5, "valid_targets_min": 2955 }, { "epoch": 5.50080775444265, "grad_norm": 0.4320861331630341, "learning_rate": 5.346271938806495e-06, "loss": 0.1341, "loss_nan_ranks": 0, "loss_rank_avg": 0.1434241682291031, "step": 3405, "valid_targets_mean": 5600.8, "valid_targets_min": 3004 }, { "epoch": 5.508885298869144, "grad_norm": 0.426440128757936, "learning_rate": 5.291554831996062e-06, "loss": 0.1352, "loss_nan_ranks": 0, "loss_rank_avg": 0.13731537759304047, "step": 3410, "valid_targets_mean": 5350.3, "valid_targets_min": 2603 }, { "epoch": 5.516962843295638, "grad_norm": 0.4300163801774742, "learning_rate": 5.237076451043188e-06, "loss": 0.1242, "loss_nan_ranks": 0, "loss_rank_avg": 0.130250483751297, "step": 3415, "valid_targets_mean": 5307.6, "valid_targets_min": 2725 }, { "epoch": 5.525040387722132, "grad_norm": 0.451123503977269, "learning_rate": 5.1828376801608525e-06, "loss": 0.1247, "loss_nan_ranks": 0, "loss_rank_avg": 0.11685208231210709, "step": 3420, "valid_targets_mean": 4572.0, "valid_targets_min": 494 }, { "epoch": 5.533117932148627, "grad_norm": 0.41538448653314575, "learning_rate": 5.128839399673045e-06, "loss": 0.1289, "loss_nan_ranks": 0, "loss_rank_avg": 0.13642895221710205, "step": 3425, "valid_targets_mean": 5603.0, "valid_targets_min": 3452 }, { "epoch": 5.541195476575121, "grad_norm": 0.4329784732882114, "learning_rate": 5.075082486000474e-06, "loss": 0.1266, "loss_nan_ranks": 0, "loss_rank_avg": 0.13025406002998352, "step": 3430, "valid_targets_mean": 5057.3, "valid_targets_min": 1270 }, { "epoch": 5.549273021001616, "grad_norm": 0.44960446892514844, "learning_rate": 5.021567811646313e-06, "loss": 0.1345, "loss_nan_ranks": 0, "loss_rank_avg": 0.1450745165348053, "step": 3435, "valid_targets_mean": 5347.9, "valid_targets_min": 3246 }, { "epoch": 5.55735056542811, "grad_norm": 0.41581636303296576, "learning_rate": 4.968296245182089e-06, "loss": 0.1195, "loss_nan_ranks": 0, "loss_rank_avg": 0.11230681836605072, "step": 3440, "valid_targets_mean": 5219.1, "valid_targets_min": 3596 }, { "epoch": 5.565428109854604, "grad_norm": 0.46622193654098787, "learning_rate": 4.915268651233553e-06, "loss": 0.1318, "loss_nan_ranks": 0, "loss_rank_avg": 0.1380825638771057, "step": 3445, "valid_targets_mean": 4438.7, "valid_targets_min": 2707 }, { "epoch": 5.573505654281099, "grad_norm": 0.44530442740815335, "learning_rate": 4.862485890466635e-06, "loss": 0.1377, "loss_nan_ranks": 0, "loss_rank_avg": 0.13368725776672363, "step": 3450, "valid_targets_mean": 5893.5, "valid_targets_min": 3301 }, { "epoch": 5.581583198707593, "grad_norm": 0.43374674664178625, "learning_rate": 4.8099488195735155e-06, "loss": 0.1261, "loss_nan_ranks": 0, "loss_rank_avg": 0.12141568958759308, "step": 3455, "valid_targets_mean": 6286.9, "valid_targets_min": 3189 }, { "epoch": 5.589660743134087, "grad_norm": 0.43085346625468096, "learning_rate": 4.757658291258693e-06, "loss": 0.1344, "loss_nan_ranks": 0, "loss_rank_avg": 0.12574200332164764, "step": 3460, "valid_targets_mean": 5033.8, "valid_targets_min": 3589 }, { "epoch": 5.597738287560581, "grad_norm": 0.4267327262798803, "learning_rate": 4.705615154225134e-06, "loss": 0.1254, "loss_nan_ranks": 0, "loss_rank_avg": 0.11858279258012772, "step": 3465, "valid_targets_mean": 5222.2, "valid_targets_min": 1583 }, { "epoch": 5.605815831987076, "grad_norm": 0.41479559745363154, "learning_rate": 4.6538202531605304e-06, "loss": 0.1281, "loss_nan_ranks": 0, "loss_rank_avg": 0.12612152099609375, "step": 3470, "valid_targets_mean": 5382.6, "valid_targets_min": 3126 }, { "epoch": 5.613893376413571, "grad_norm": 0.44362522228036605, "learning_rate": 4.602274428723568e-06, "loss": 0.1283, "loss_nan_ranks": 0, "loss_rank_avg": 0.13906408846378326, "step": 3475, "valid_targets_mean": 5549.4, "valid_targets_min": 2956 }, { "epoch": 5.621970920840065, "grad_norm": 0.48940058866056046, "learning_rate": 4.550978517530287e-06, "loss": 0.1323, "loss_nan_ranks": 0, "loss_rank_avg": 0.15402500331401825, "step": 3480, "valid_targets_mean": 4956.8, "valid_targets_min": 3389 }, { "epoch": 5.630048465266559, "grad_norm": 0.4380326810478009, "learning_rate": 4.499933352140504e-06, "loss": 0.1355, "loss_nan_ranks": 0, "loss_rank_avg": 0.1398143470287323, "step": 3485, "valid_targets_mean": 5444.6, "valid_targets_min": 3100 }, { "epoch": 5.638126009693053, "grad_norm": 0.42605344964709, "learning_rate": 4.44913976104429e-06, "loss": 0.1329, "loss_nan_ranks": 0, "loss_rank_avg": 0.12708860635757446, "step": 3490, "valid_targets_mean": 5242.1, "valid_targets_min": 3196 }, { "epoch": 5.646203554119547, "grad_norm": 0.48778301584741457, "learning_rate": 4.398598568648542e-06, "loss": 0.1243, "loss_nan_ranks": 0, "loss_rank_avg": 0.1347925364971161, "step": 3495, "valid_targets_mean": 4615.4, "valid_targets_min": 3110 }, { "epoch": 5.654281098546042, "grad_norm": 0.39618198656394327, "learning_rate": 4.348310595263597e-06, "loss": 0.1275, "loss_nan_ranks": 0, "loss_rank_avg": 0.13055220246315002, "step": 3500, "valid_targets_mean": 6067.0, "valid_targets_min": 3733 }, { "epoch": 5.662358642972537, "grad_norm": 0.44742584197434127, "learning_rate": 4.29827665708989e-06, "loss": 0.1248, "loss_nan_ranks": 0, "loss_rank_avg": 0.12233701348304749, "step": 3505, "valid_targets_mean": 4934.1, "valid_targets_min": 2995 }, { "epoch": 5.670436187399031, "grad_norm": 0.4462032079816014, "learning_rate": 4.248497566204755e-06, "loss": 0.1318, "loss_nan_ranks": 0, "loss_rank_avg": 0.12860026955604553, "step": 3510, "valid_targets_mean": 5250.4, "valid_targets_min": 3606 }, { "epoch": 5.678513731825525, "grad_norm": 0.43055984492150595, "learning_rate": 4.198974130549209e-06, "loss": 0.1347, "loss_nan_ranks": 0, "loss_rank_avg": 0.1282704770565033, "step": 3515, "valid_targets_mean": 5206.6, "valid_targets_min": 2518 }, { "epoch": 5.686591276252019, "grad_norm": 0.4087171428147634, "learning_rate": 4.149707153914855e-06, "loss": 0.1287, "loss_nan_ranks": 0, "loss_rank_avg": 0.12912295758724213, "step": 3520, "valid_targets_mean": 5396.3, "valid_targets_min": 2628 }, { "epoch": 5.694668820678514, "grad_norm": 0.46483924914673547, "learning_rate": 4.100697435930812e-06, "loss": 0.1356, "loss_nan_ranks": 0, "loss_rank_avg": 0.14172643423080444, "step": 3525, "valid_targets_mean": 5788.2, "valid_targets_min": 3464 }, { "epoch": 5.702746365105008, "grad_norm": 0.4632668885464545, "learning_rate": 4.0519457720507785e-06, "loss": 0.1308, "loss_nan_ranks": 0, "loss_rank_avg": 0.13240531086921692, "step": 3530, "valid_targets_mean": 5077.1, "valid_targets_min": 1471 }, { "epoch": 5.710823909531502, "grad_norm": 0.4334095684159384, "learning_rate": 4.003452953540088e-06, "loss": 0.1274, "loss_nan_ranks": 0, "loss_rank_avg": 0.131183922290802, "step": 3535, "valid_targets_mean": 5292.6, "valid_targets_min": 3034 }, { "epoch": 5.718901453957997, "grad_norm": 0.3888369802534452, "learning_rate": 3.95521976746287e-06, "loss": 0.1304, "loss_nan_ranks": 0, "loss_rank_avg": 0.13127687573432922, "step": 3540, "valid_targets_mean": 6261.8, "valid_targets_min": 2698 }, { "epoch": 5.726978998384491, "grad_norm": 0.42989158386615484, "learning_rate": 3.907246996669289e-06, "loss": 0.1312, "loss_nan_ranks": 0, "loss_rank_avg": 0.1272650510072708, "step": 3545, "valid_targets_mean": 5860.9, "valid_targets_min": 3736 }, { "epoch": 5.735056542810986, "grad_norm": 0.41599823091501176, "learning_rate": 3.8595354197828405e-06, "loss": 0.1233, "loss_nan_ranks": 0, "loss_rank_avg": 0.12474222481250763, "step": 3550, "valid_targets_mean": 5342.7, "valid_targets_min": 3059 }, { "epoch": 5.74313408723748, "grad_norm": 0.4043405806565461, "learning_rate": 3.8120858111876824e-06, "loss": 0.1282, "loss_nan_ranks": 0, "loss_rank_avg": 0.11929463595151901, "step": 3555, "valid_targets_mean": 5652.8, "valid_targets_min": 3672 }, { "epoch": 5.751211631663974, "grad_norm": 0.46661331335623885, "learning_rate": 3.7648989410161064e-06, "loss": 0.1321, "loss_nan_ranks": 0, "loss_rank_avg": 0.13622185587882996, "step": 3560, "valid_targets_mean": 4769.8, "valid_targets_min": 2370 }, { "epoch": 5.759289176090468, "grad_norm": 0.4184938336356662, "learning_rate": 3.7179755751360193e-06, "loss": 0.1331, "loss_nan_ranks": 0, "loss_rank_avg": 0.1348327100276947, "step": 3565, "valid_targets_mean": 5862.5, "valid_targets_min": 2050 }, { "epoch": 5.7673667205169625, "grad_norm": 0.4209144525581572, "learning_rate": 3.6713164751384933e-06, "loss": 0.1267, "loss_nan_ranks": 0, "loss_rank_avg": 0.12385410070419312, "step": 3570, "valid_targets_mean": 5000.0, "valid_targets_min": 875 }, { "epoch": 5.775444264943458, "grad_norm": 0.47636037540360815, "learning_rate": 3.624922398325461e-06, "loss": 0.1239, "loss_nan_ranks": 0, "loss_rank_avg": 0.1303969919681549, "step": 3575, "valid_targets_mean": 4286.1, "valid_targets_min": 860 }, { "epoch": 5.783521809369952, "grad_norm": 0.4155562167139012, "learning_rate": 3.578794097697358e-06, "loss": 0.1288, "loss_nan_ranks": 0, "loss_rank_avg": 0.13030406832695007, "step": 3580, "valid_targets_mean": 5310.9, "valid_targets_min": 3587 }, { "epoch": 5.791599353796446, "grad_norm": 0.5016412125220293, "learning_rate": 3.5329323219409404e-06, "loss": 0.128, "loss_nan_ranks": 0, "loss_rank_avg": 0.13560795783996582, "step": 3585, "valid_targets_mean": 5757.9, "valid_targets_min": 3802 }, { "epoch": 5.79967689822294, "grad_norm": 0.4287142497742641, "learning_rate": 3.4873378154171355e-06, "loss": 0.1286, "loss_nan_ranks": 0, "loss_rank_avg": 0.12317405641078949, "step": 3590, "valid_targets_mean": 5041.9, "valid_targets_min": 3316 }, { "epoch": 5.8077544426494345, "grad_norm": 0.415107501998662, "learning_rate": 3.44201131814893e-06, "loss": 0.13, "loss_nan_ranks": 0, "loss_rank_avg": 0.11532598733901978, "step": 3595, "valid_targets_mean": 5660.2, "valid_targets_min": 2571 }, { "epoch": 5.815831987075929, "grad_norm": 0.4576138982293604, "learning_rate": 3.396953565809393e-06, "loss": 0.1298, "loss_nan_ranks": 0, "loss_rank_avg": 0.12490224838256836, "step": 3600, "valid_targets_mean": 4615.6, "valid_targets_min": 3102 }, { "epoch": 5.823909531502423, "grad_norm": 0.44157735215572447, "learning_rate": 3.3521652897097145e-06, "loss": 0.1342, "loss_nan_ranks": 0, "loss_rank_avg": 0.14809024333953857, "step": 3605, "valid_targets_mean": 5332.1, "valid_targets_min": 1294 }, { "epoch": 5.831987075928918, "grad_norm": 0.44788378747331953, "learning_rate": 3.3076472167873506e-06, "loss": 0.1355, "loss_nan_ranks": 0, "loss_rank_avg": 0.14152215421199799, "step": 3610, "valid_targets_mean": 5306.1, "valid_targets_min": 3152 }, { "epoch": 5.840064620355412, "grad_norm": 0.41062346511478454, "learning_rate": 3.2634000695942005e-06, "loss": 0.1261, "loss_nan_ranks": 0, "loss_rank_avg": 0.11961716413497925, "step": 3615, "valid_targets_mean": 5562.0, "valid_targets_min": 2508 }, { "epoch": 5.8481421647819065, "grad_norm": 0.45060523033481636, "learning_rate": 3.2194245662849076e-06, "loss": 0.1264, "loss_nan_ranks": 0, "loss_rank_avg": 0.13177934288978577, "step": 3620, "valid_targets_mean": 5529.1, "valid_targets_min": 3357 }, { "epoch": 5.856219709208401, "grad_norm": 0.46069722388709394, "learning_rate": 3.175721420605198e-06, "loss": 0.1331, "loss_nan_ranks": 0, "loss_rank_avg": 0.12503468990325928, "step": 3625, "valid_targets_mean": 4698.9, "valid_targets_min": 3025 }, { "epoch": 5.864297253634895, "grad_norm": 0.42719671755097033, "learning_rate": 3.132291341880269e-06, "loss": 0.1291, "loss_nan_ranks": 0, "loss_rank_avg": 0.12041535973548889, "step": 3630, "valid_targets_mean": 5449.2, "valid_targets_min": 3499 }, { "epoch": 5.872374798061389, "grad_norm": 0.45809759944896844, "learning_rate": 3.08913503500331e-06, "loss": 0.1272, "loss_nan_ranks": 0, "loss_rank_avg": 0.12977182865142822, "step": 3635, "valid_targets_mean": 4846.6, "valid_targets_min": 1747 }, { "epoch": 5.880452342487883, "grad_norm": 0.4004710139327011, "learning_rate": 3.0462532004240497e-06, "loss": 0.1261, "loss_nan_ranks": 0, "loss_rank_avg": 0.11773309111595154, "step": 3640, "valid_targets_mean": 5603.2, "valid_targets_min": 1502 }, { "epoch": 5.8885298869143785, "grad_norm": 0.42901347254613426, "learning_rate": 3.0036465341373764e-06, "loss": 0.136, "loss_nan_ranks": 0, "loss_rank_avg": 0.15141505002975464, "step": 3645, "valid_targets_mean": 5615.2, "valid_targets_min": 1618 }, { "epoch": 5.896607431340873, "grad_norm": 0.4360637592715409, "learning_rate": 2.9613157276720604e-06, "loss": 0.1282, "loss_nan_ranks": 0, "loss_rank_avg": 0.12636485695838928, "step": 3650, "valid_targets_mean": 5416.1, "valid_targets_min": 3584 }, { "epoch": 5.904684975767367, "grad_norm": 0.40220716793314576, "learning_rate": 2.9192614680795196e-06, "loss": 0.1321, "loss_nan_ranks": 0, "loss_rank_avg": 0.12780413031578064, "step": 3655, "valid_targets_mean": 5938.9, "valid_targets_min": 3451 }, { "epoch": 5.912762520193861, "grad_norm": 0.4325378825436018, "learning_rate": 2.8774844379226554e-06, "loss": 0.128, "loss_nan_ranks": 0, "loss_rank_avg": 0.13803870975971222, "step": 3660, "valid_targets_mean": 5305.1, "valid_targets_min": 2629 }, { "epoch": 5.920840064620355, "grad_norm": 0.4414669381253834, "learning_rate": 2.8359853152648175e-06, "loss": 0.1246, "loss_nan_ranks": 0, "loss_rank_avg": 0.12497833371162415, "step": 3665, "valid_targets_mean": 5239.0, "valid_targets_min": 2990 }, { "epoch": 5.92891760904685, "grad_norm": 0.4393760609199369, "learning_rate": 2.7947647736587425e-06, "loss": 0.1333, "loss_nan_ranks": 0, "loss_rank_avg": 0.13562984764575958, "step": 3670, "valid_targets_mean": 5573.1, "valid_targets_min": 3174 }, { "epoch": 5.936995153473344, "grad_norm": 0.42547485094726206, "learning_rate": 2.753823482135658e-06, "loss": 0.128, "loss_nan_ranks": 0, "loss_rank_avg": 0.13088464736938477, "step": 3675, "valid_targets_mean": 5294.8, "valid_targets_min": 2571 }, { "epoch": 5.945072697899839, "grad_norm": 0.41839366327792726, "learning_rate": 2.713162105194427e-06, "loss": 0.1242, "loss_nan_ranks": 0, "loss_rank_avg": 0.1284753829240799, "step": 3680, "valid_targets_mean": 6062.1, "valid_targets_min": 3553 }, { "epoch": 5.953150242326333, "grad_norm": 0.44798323279186714, "learning_rate": 2.672781302790726e-06, "loss": 0.1381, "loss_nan_ranks": 0, "loss_rank_avg": 0.14375978708267212, "step": 3685, "valid_targets_mean": 5534.2, "valid_targets_min": 3805 }, { "epoch": 5.961227786752827, "grad_norm": 0.44867958556757354, "learning_rate": 2.6326817303263764e-06, "loss": 0.1305, "loss_nan_ranks": 0, "loss_rank_avg": 0.1329280585050583, "step": 3690, "valid_targets_mean": 5351.2, "valid_targets_min": 2891 }, { "epoch": 5.969305331179322, "grad_norm": 0.437445716769064, "learning_rate": 2.592864038638685e-06, "loss": 0.1314, "loss_nan_ranks": 0, "loss_rank_avg": 0.1237957552075386, "step": 3695, "valid_targets_mean": 5218.3, "valid_targets_min": 3165 }, { "epoch": 5.977382875605816, "grad_norm": 0.4171417743389424, "learning_rate": 2.5533288739898865e-06, "loss": 0.139, "loss_nan_ranks": 0, "loss_rank_avg": 0.16024985909461975, "step": 3700, "valid_targets_mean": 5685.4, "valid_targets_min": 1278 }, { "epoch": 5.98546042003231, "grad_norm": 0.42356417930931556, "learning_rate": 2.5140768780566436e-06, "loss": 0.1295, "loss_nan_ranks": 0, "loss_rank_avg": 0.1332971751689911, "step": 3705, "valid_targets_mean": 6115.1, "valid_targets_min": 4652 }, { "epoch": 5.993537964458804, "grad_norm": 0.4187791264085228, "learning_rate": 2.475108687919645e-06, "loss": 0.139, "loss_nan_ranks": 0, "loss_rank_avg": 0.12996046245098114, "step": 3710, "valid_targets_mean": 5287.6, "valid_targets_min": 2671 }, { "epoch": 6.0016155088852985, "grad_norm": 0.38042177308670916, "learning_rate": 2.43642493605327e-06, "loss": 0.1311, "loss_nan_ranks": 0, "loss_rank_avg": 0.13582850992679596, "step": 3715, "valid_targets_mean": 6274.0, "valid_targets_min": 3274 }, { "epoch": 6.009693053311794, "grad_norm": 0.3996995746582545, "learning_rate": 2.398026250315295e-06, "loss": 0.1265, "loss_nan_ranks": 0, "loss_rank_avg": 0.12647423148155212, "step": 3720, "valid_targets_mean": 5534.5, "valid_targets_min": 494 }, { "epoch": 6.017770597738288, "grad_norm": 0.40840529795994723, "learning_rate": 2.3599132539367386e-06, "loss": 0.1246, "loss_nan_ranks": 0, "loss_rank_avg": 0.12015852332115173, "step": 3725, "valid_targets_mean": 5502.9, "valid_targets_min": 2993 }, { "epoch": 6.025848142164782, "grad_norm": 0.45063017808794575, "learning_rate": 2.3220865655117274e-06, "loss": 0.126, "loss_nan_ranks": 0, "loss_rank_avg": 0.12192650139331818, "step": 3730, "valid_targets_mean": 4680.8, "valid_targets_min": 3100 }, { "epoch": 6.033925686591276, "grad_norm": 0.43630585939735095, "learning_rate": 2.284546798987448e-06, "loss": 0.1235, "loss_nan_ranks": 0, "loss_rank_avg": 0.12560415267944336, "step": 3735, "valid_targets_mean": 5294.4, "valid_targets_min": 2865 }, { "epoch": 6.0420032310177705, "grad_norm": 0.505722121935076, "learning_rate": 2.2472945636542033e-06, "loss": 0.1269, "loss_nan_ranks": 0, "loss_rank_avg": 0.13361534476280212, "step": 3740, "valid_targets_mean": 5304.9, "valid_targets_min": 920 }, { "epoch": 6.050080775444265, "grad_norm": 0.42675333406544164, "learning_rate": 2.2103304641355128e-06, "loss": 0.1281, "loss_nan_ranks": 0, "loss_rank_avg": 0.12612757086753845, "step": 3745, "valid_targets_mean": 5455.9, "valid_targets_min": 3102 }, { "epoch": 6.058158319870759, "grad_norm": 0.4264645769477084, "learning_rate": 2.17365510037828e-06, "loss": 0.1218, "loss_nan_ranks": 0, "loss_rank_avg": 0.12067071348428726, "step": 3750, "valid_targets_mean": 5514.5, "valid_targets_min": 3111 }, { "epoch": 6.066235864297254, "grad_norm": 0.3923668630594968, "learning_rate": 2.1372690676431106e-06, "loss": 0.1219, "loss_nan_ranks": 0, "loss_rank_avg": 0.12325260043144226, "step": 3755, "valid_targets_mean": 6121.4, "valid_targets_min": 4815 }, { "epoch": 6.074313408723748, "grad_norm": 0.4314493239984855, "learning_rate": 2.101172956494577e-06, "loss": 0.1205, "loss_nan_ranks": 0, "loss_rank_avg": 0.1209428682923317, "step": 3760, "valid_targets_mean": 5166.6, "valid_targets_min": 2498 }, { "epoch": 6.0823909531502425, "grad_norm": 0.4682899642080794, "learning_rate": 2.065367352791694e-06, "loss": 0.1313, "loss_nan_ranks": 0, "loss_rank_avg": 0.1530829668045044, "step": 3765, "valid_targets_mean": 5197.5, "valid_targets_min": 2402 }, { "epoch": 6.090468497576737, "grad_norm": 0.4411425846116113, "learning_rate": 2.0298528376783787e-06, "loss": 0.1152, "loss_nan_ranks": 0, "loss_rank_avg": 0.11478254199028015, "step": 3770, "valid_targets_mean": 5477.7, "valid_targets_min": 3269 }, { "epoch": 6.098546042003231, "grad_norm": 0.41948667962899977, "learning_rate": 1.9946299875740236e-06, "loss": 0.1335, "loss_nan_ranks": 0, "loss_rank_avg": 0.13149794936180115, "step": 3775, "valid_targets_mean": 5922.2, "valid_targets_min": 2735 }, { "epoch": 6.106623586429725, "grad_norm": 0.3997061769361075, "learning_rate": 1.959699374164148e-06, "loss": 0.1311, "loss_nan_ranks": 0, "loss_rank_avg": 0.12436765432357788, "step": 3780, "valid_targets_mean": 6095.8, "valid_targets_min": 3791 }, { "epoch": 6.114701130856219, "grad_norm": 0.40787813247608634, "learning_rate": 1.9250615643911195e-06, "loss": 0.1254, "loss_nan_ranks": 0, "loss_rank_avg": 0.12347099184989929, "step": 3785, "valid_targets_mean": 5512.1, "valid_targets_min": 2373 }, { "epoch": 6.1227786752827145, "grad_norm": 0.4394743128766455, "learning_rate": 1.8907171204449316e-06, "loss": 0.125, "loss_nan_ranks": 0, "loss_rank_avg": 0.11828821897506714, "step": 3790, "valid_targets_mean": 5453.8, "valid_targets_min": 3864 }, { "epoch": 6.130856219709209, "grad_norm": 0.4012592442183262, "learning_rate": 1.8566665997541111e-06, "loss": 0.1243, "loss_nan_ranks": 0, "loss_rank_avg": 0.1390397846698761, "step": 3795, "valid_targets_mean": 5487.6, "valid_targets_min": 2737 }, { "epoch": 6.138933764135703, "grad_norm": 0.462240025647866, "learning_rate": 1.8229105549766469e-06, "loss": 0.1271, "loss_nan_ranks": 0, "loss_rank_avg": 0.14077478647232056, "step": 3800, "valid_targets_mean": 5228.1, "valid_targets_min": 2965 }, { "epoch": 6.147011308562197, "grad_norm": 0.4367640979741714, "learning_rate": 1.7894495339910345e-06, "loss": 0.1275, "loss_nan_ranks": 0, "loss_rank_avg": 0.11776141822338104, "step": 3805, "valid_targets_mean": 5597.7, "valid_targets_min": 1618 }, { "epoch": 6.155088852988691, "grad_norm": 0.40903146232389964, "learning_rate": 1.7562840798873648e-06, "loss": 0.1241, "loss_nan_ranks": 0, "loss_rank_avg": 0.11086548119783401, "step": 3810, "valid_targets_mean": 5194.6, "valid_targets_min": 3095 }, { "epoch": 6.163166397415186, "grad_norm": 0.6394406603603819, "learning_rate": 1.7234147309585304e-06, "loss": 0.124, "loss_nan_ranks": 0, "loss_rank_avg": 0.13591381907463074, "step": 3815, "valid_targets_mean": 5851.1, "valid_targets_min": 3703 }, { "epoch": 6.17124394184168, "grad_norm": 0.45620403937167114, "learning_rate": 1.6908420206914854e-06, "loss": 0.1305, "loss_nan_ranks": 0, "loss_rank_avg": 0.12876799702644348, "step": 3820, "valid_targets_mean": 5486.4, "valid_targets_min": 2299 }, { "epoch": 6.179321486268175, "grad_norm": 0.4606826442584153, "learning_rate": 1.6585664777585654e-06, "loss": 0.1214, "loss_nan_ranks": 0, "loss_rank_avg": 0.13059750199317932, "step": 3825, "valid_targets_mean": 4831.5, "valid_targets_min": 2564 }, { "epoch": 6.187399030694669, "grad_norm": 0.4775624709862394, "learning_rate": 1.6265886260089337e-06, "loss": 0.1242, "loss_nan_ranks": 0, "loss_rank_avg": 0.11253519356250763, "step": 3830, "valid_targets_mean": 5556.9, "valid_targets_min": 3334 }, { "epoch": 6.195476575121163, "grad_norm": 0.5357108543862896, "learning_rate": 1.5949089844600729e-06, "loss": 0.1231, "loss_nan_ranks": 0, "loss_rank_avg": 0.11639741063117981, "step": 3835, "valid_targets_mean": 4648.2, "valid_targets_min": 2791 }, { "epoch": 6.203554119547658, "grad_norm": 1.215560948141749, "learning_rate": 1.563528067289335e-06, "loss": 0.1285, "loss_nan_ranks": 0, "loss_rank_avg": 0.1310233175754547, "step": 3840, "valid_targets_mean": 5432.3, "valid_targets_min": 2975 }, { "epoch": 6.211631663974152, "grad_norm": 0.43295667523345815, "learning_rate": 1.5324463838256476e-06, "loss": 0.1253, "loss_nan_ranks": 0, "loss_rank_avg": 0.12923157215118408, "step": 3845, "valid_targets_mean": 5914.4, "valid_targets_min": 875 }, { "epoch": 6.219709208400646, "grad_norm": 0.4313108587022746, "learning_rate": 1.5016644385411928e-06, "loss": 0.1249, "loss_nan_ranks": 0, "loss_rank_avg": 0.13349610567092896, "step": 3850, "valid_targets_mean": 5821.2, "valid_targets_min": 3989 }, { "epoch": 6.22778675282714, "grad_norm": 0.48650958615453055, "learning_rate": 1.4711827310432437e-06, "loss": 0.1355, "loss_nan_ranks": 0, "loss_rank_avg": 0.15580685436725616, "step": 3855, "valid_targets_mean": 5863.0, "valid_targets_min": 3242 }, { "epoch": 6.2358642972536344, "grad_norm": 0.40857640102352444, "learning_rate": 1.441001756066076e-06, "loss": 0.1262, "loss_nan_ranks": 0, "loss_rank_avg": 0.12889908254146576, "step": 3860, "valid_targets_mean": 5974.9, "valid_targets_min": 2904 }, { "epoch": 6.24394184168013, "grad_norm": 0.4541360947416613, "learning_rate": 1.4111220034628925e-06, "loss": 0.1277, "loss_nan_ranks": 0, "loss_rank_avg": 0.12288201600313187, "step": 3865, "valid_targets_mean": 5001.9, "valid_targets_min": 2061 }, { "epoch": 6.252019386106624, "grad_norm": 0.4507694019187057, "learning_rate": 1.3815439581979106e-06, "loss": 0.1212, "loss_nan_ranks": 0, "loss_rank_avg": 0.12719199061393738, "step": 3870, "valid_targets_mean": 4805.4, "valid_targets_min": 635 }, { "epoch": 6.260096930533118, "grad_norm": 0.43314759395541486, "learning_rate": 1.352268100338483e-06, "loss": 0.1264, "loss_nan_ranks": 0, "loss_rank_avg": 0.12478262186050415, "step": 3875, "valid_targets_mean": 5551.4, "valid_targets_min": 3299 }, { "epoch": 6.268174474959612, "grad_norm": 0.4434291666714666, "learning_rate": 1.3232949050472809e-06, "loss": 0.1225, "loss_nan_ranks": 0, "loss_rank_avg": 0.11485721915960312, "step": 3880, "valid_targets_mean": 5089.8, "valid_targets_min": 3032 }, { "epoch": 6.276252019386106, "grad_norm": 0.4269358778893437, "learning_rate": 1.2946248425746189e-06, "loss": 0.125, "loss_nan_ranks": 0, "loss_rank_avg": 0.12474660575389862, "step": 3885, "valid_targets_mean": 5354.8, "valid_targets_min": 3237 }, { "epoch": 6.284329563812601, "grad_norm": 0.4944266854838816, "learning_rate": 1.266258378250802e-06, "loss": 0.1288, "loss_nan_ranks": 0, "loss_rank_avg": 0.1357978880405426, "step": 3890, "valid_targets_mean": 4909.8, "valid_targets_min": 2240 }, { "epoch": 6.292407108239095, "grad_norm": 0.4811185167949499, "learning_rate": 1.2381959724785752e-06, "loss": 0.1246, "loss_nan_ranks": 0, "loss_rank_avg": 0.12598447501659393, "step": 3895, "valid_targets_mean": 4965.4, "valid_targets_min": 1612 }, { "epoch": 6.30048465266559, "grad_norm": 0.45350839806662147, "learning_rate": 1.2104380807256488e-06, "loss": 0.1263, "loss_nan_ranks": 0, "loss_rank_avg": 0.12420719116926193, "step": 3900, "valid_targets_mean": 5155.8, "valid_targets_min": 2456 }, { "epoch": 6.308562197092084, "grad_norm": 0.4407541653779522, "learning_rate": 1.182985153517311e-06, "loss": 0.1279, "loss_nan_ranks": 0, "loss_rank_avg": 0.12510338425636292, "step": 3905, "valid_targets_mean": 5554.1, "valid_targets_min": 1894 }, { "epoch": 6.316639741518578, "grad_norm": 0.43753400948465604, "learning_rate": 1.1558376364291202e-06, "loss": 0.1313, "loss_nan_ranks": 0, "loss_rank_avg": 0.13448363542556763, "step": 3910, "valid_targets_mean": 5597.8, "valid_targets_min": 3414 }, { "epoch": 6.324717285945073, "grad_norm": 0.4867143708533207, "learning_rate": 1.128995970079656e-06, "loss": 0.1306, "loss_nan_ranks": 0, "loss_rank_avg": 0.12516459822654724, "step": 3915, "valid_targets_mean": 4465.9, "valid_targets_min": 2876 }, { "epoch": 6.332794830371567, "grad_norm": 0.4556391374587531, "learning_rate": 1.1024605901233843e-06, "loss": 0.1267, "loss_nan_ranks": 0, "loss_rank_avg": 0.1345321536064148, "step": 3920, "valid_targets_mean": 5282.8, "valid_targets_min": 3026 }, { "epoch": 6.340872374798061, "grad_norm": 0.4901112286992194, "learning_rate": 1.0762319272435851e-06, "loss": 0.1216, "loss_nan_ranks": 0, "loss_rank_avg": 0.12185169011354446, "step": 3925, "valid_targets_mean": 5655.7, "valid_targets_min": 3168 }, { "epoch": 6.348949919224555, "grad_norm": 0.4458223827027878, "learning_rate": 1.0503104071453429e-06, "loss": 0.1273, "loss_nan_ranks": 0, "loss_rank_avg": 0.1298675388097763, "step": 3930, "valid_targets_mean": 5410.5, "valid_targets_min": 3389 }, { "epoch": 6.35702746365105, "grad_norm": 0.4251996105028484, "learning_rate": 1.0246964505486768e-06, "loss": 0.1246, "loss_nan_ranks": 0, "loss_rank_avg": 0.13420116901397705, "step": 3935, "valid_targets_mean": 5914.3, "valid_targets_min": 2609 }, { "epoch": 6.365105008077545, "grad_norm": 0.46439313311522407, "learning_rate": 9.993904731816606e-07, "loss": 0.1246, "loss_nan_ranks": 0, "loss_rank_avg": 0.1249784454703331, "step": 3940, "valid_targets_mean": 5972.4, "valid_targets_min": 2670 }, { "epoch": 6.373182552504039, "grad_norm": 0.4739447815808242, "learning_rate": 9.743928857737138e-07, "loss": 0.1263, "loss_nan_ranks": 0, "loss_rank_avg": 0.13924196362495422, "step": 3945, "valid_targets_mean": 4824.4, "valid_targets_min": 2712 }, { "epoch": 6.381260096930533, "grad_norm": 0.48654467584611094, "learning_rate": 9.497040940489332e-07, "loss": 0.1237, "loss_nan_ranks": 0, "loss_rank_avg": 0.12547633051872253, "step": 3950, "valid_targets_mean": 4858.6, "valid_targets_min": 2845 }, { "epoch": 6.389337641357027, "grad_norm": 0.4356735072665942, "learning_rate": 9.253244987194798e-07, "loss": 0.1253, "loss_nan_ranks": 0, "loss_rank_avg": 0.12728527188301086, "step": 3955, "valid_targets_mean": 5167.6, "valid_targets_min": 2985 }, { "epoch": 6.3974151857835215, "grad_norm": 0.4506609202751045, "learning_rate": 9.012544954791048e-07, "loss": 0.1283, "loss_nan_ranks": 0, "loss_rank_avg": 0.13564032316207886, "step": 3960, "valid_targets_mean": 6034.4, "valid_targets_min": 3891 }, { "epoch": 6.405492730210016, "grad_norm": 0.4608952018911762, "learning_rate": 8.774944749967162e-07, "loss": 0.1296, "loss_nan_ranks": 0, "loss_rank_avg": 0.12978151440620422, "step": 3965, "valid_targets_mean": 5206.6, "valid_targets_min": 2467 }, { "epoch": 6.413570274636511, "grad_norm": 0.46107689800024954, "learning_rate": 8.540448229100295e-07, "loss": 0.1206, "loss_nan_ranks": 0, "loss_rank_avg": 0.13031840324401855, "step": 3970, "valid_targets_mean": 5134.1, "valid_targets_min": 1820 }, { "epoch": 6.421647819063005, "grad_norm": 0.4118015091462396, "learning_rate": 8.309059198193225e-07, "loss": 0.1287, "loss_nan_ranks": 0, "loss_rank_avg": 0.13095030188560486, "step": 3975, "valid_targets_mean": 6233.5, "valid_targets_min": 2561 }, { "epoch": 6.429725363489499, "grad_norm": 0.4682974706826252, "learning_rate": 8.080781412812544e-07, "loss": 0.1276, "loss_nan_ranks": 0, "loss_rank_avg": 0.13665667176246643, "step": 3980, "valid_targets_mean": 5492.9, "valid_targets_min": 3368 }, { "epoch": 6.4378029079159935, "grad_norm": 0.5043978939772313, "learning_rate": 7.85561857802759e-07, "loss": 0.1299, "loss_nan_ranks": 0, "loss_rank_avg": 0.14872294664382935, "step": 3985, "valid_targets_mean": 5439.5, "valid_targets_min": 3211 }, { "epoch": 6.445880452342488, "grad_norm": 0.4736575403831154, "learning_rate": 7.633574348350525e-07, "loss": 0.1271, "loss_nan_ranks": 0, "loss_rank_avg": 0.1309095025062561, "step": 3990, "valid_targets_mean": 5669.1, "valid_targets_min": 3871 }, { "epoch": 6.453957996768982, "grad_norm": 0.44250125729727774, "learning_rate": 7.414652327676797e-07, "loss": 0.1194, "loss_nan_ranks": 0, "loss_rank_avg": 0.11579351127147675, "step": 3995, "valid_targets_mean": 5095.6, "valid_targets_min": 3083 }, { "epoch": 6.462035541195476, "grad_norm": 0.46412183365878834, "learning_rate": 7.198856069226834e-07, "loss": 0.1261, "loss_nan_ranks": 0, "loss_rank_avg": 0.1247982382774353, "step": 4000, "valid_targets_mean": 5121.2, "valid_targets_min": 3202 }, { "epoch": 6.470113085621971, "grad_norm": 0.42099510160073933, "learning_rate": 6.986189075488159e-07, "loss": 0.1277, "loss_nan_ranks": 0, "loss_rank_avg": 0.123319610953331, "step": 4005, "valid_targets_mean": 5561.8, "valid_targets_min": 3313 }, { "epoch": 6.4781906300484655, "grad_norm": 0.5096369000331581, "learning_rate": 6.77665479815881e-07, "loss": 0.1282, "loss_nan_ranks": 0, "loss_rank_avg": 0.1309448778629303, "step": 4010, "valid_targets_mean": 5498.9, "valid_targets_min": 2886 }, { "epoch": 6.48626817447496, "grad_norm": 0.4469201811102124, "learning_rate": 6.570256638091122e-07, "loss": 0.1199, "loss_nan_ranks": 0, "loss_rank_avg": 0.11223016679286957, "step": 4015, "valid_targets_mean": 4988.0, "valid_targets_min": 3026 }, { "epoch": 6.494345718901454, "grad_norm": 0.4204535857468685, "learning_rate": 6.366997945236519e-07, "loss": 0.1294, "loss_nan_ranks": 0, "loss_rank_avg": 0.1368045210838318, "step": 4020, "valid_targets_mean": 5391.7, "valid_targets_min": 2986 }, { "epoch": 6.502423263327948, "grad_norm": 0.43551176249044327, "learning_rate": 6.166882018591369e-07, "loss": 0.1293, "loss_nan_ranks": 0, "loss_rank_avg": 0.1250474750995636, "step": 4025, "valid_targets_mean": 5422.8, "valid_targets_min": 2538 }, { "epoch": 6.510500807754442, "grad_norm": 0.4399271110250978, "learning_rate": 5.969912106143105e-07, "loss": 0.1347, "loss_nan_ranks": 0, "loss_rank_avg": 0.13834628462791443, "step": 4030, "valid_targets_mean": 5169.5, "valid_targets_min": 2401 }, { "epoch": 6.518578352180937, "grad_norm": 0.43382150239329875, "learning_rate": 5.776091404817762e-07, "loss": 0.1204, "loss_nan_ranks": 0, "loss_rank_avg": 0.12629744410514832, "step": 4035, "valid_targets_mean": 5217.6, "valid_targets_min": 3262 }, { "epoch": 6.526655896607432, "grad_norm": 0.43276969760803347, "learning_rate": 5.585423060428064e-07, "loss": 0.1302, "loss_nan_ranks": 0, "loss_rank_avg": 0.1219807118177414, "step": 4040, "valid_targets_mean": 5053.8, "valid_targets_min": 2763 }, { "epoch": 6.534733441033926, "grad_norm": 0.4228424315263158, "learning_rate": 5.397910167622212e-07, "loss": 0.1241, "loss_nan_ranks": 0, "loss_rank_avg": 0.1212330013513565, "step": 4045, "valid_targets_mean": 5681.0, "valid_targets_min": 3393 }, { "epoch": 6.54281098546042, "grad_norm": 0.43356050429031545, "learning_rate": 5.2135557698338e-07, "loss": 0.1184, "loss_nan_ranks": 0, "loss_rank_avg": 0.11314418911933899, "step": 4050, "valid_targets_mean": 5226.2, "valid_targets_min": 862 }, { "epoch": 6.550888529886914, "grad_norm": 0.4410363384518348, "learning_rate": 5.032362859232409e-07, "loss": 0.1188, "loss_nan_ranks": 0, "loss_rank_avg": 0.11539218574762344, "step": 4055, "valid_targets_mean": 5639.7, "valid_targets_min": 2686 }, { "epoch": 6.558966074313409, "grad_norm": 0.39036790685484907, "learning_rate": 4.854334376674908e-07, "loss": 0.1254, "loss_nan_ranks": 0, "loss_rank_avg": 0.11777080595493317, "step": 4060, "valid_targets_mean": 6159.1, "valid_targets_min": 1583 }, { "epoch": 6.567043618739903, "grad_norm": 0.3970441420439976, "learning_rate": 4.679473211657959e-07, "loss": 0.1235, "loss_nan_ranks": 0, "loss_rank_avg": 0.11998297274112701, "step": 4065, "valid_targets_mean": 6206.8, "valid_targets_min": 3559 }, { "epoch": 6.575121163166397, "grad_norm": 0.4361589600653003, "learning_rate": 4.507782202270883e-07, "loss": 0.1261, "loss_nan_ranks": 0, "loss_rank_avg": 0.12242761254310608, "step": 4070, "valid_targets_mean": 5184.5, "valid_targets_min": 2942 }, { "epoch": 6.583198707592892, "grad_norm": 0.41712998221462744, "learning_rate": 4.33926413514969e-07, "loss": 0.1239, "loss_nan_ranks": 0, "loss_rank_avg": 0.12609797716140747, "step": 4075, "valid_targets_mean": 5275.7, "valid_targets_min": 3429 }, { "epoch": 6.591276252019386, "grad_norm": 0.42389981043438, "learning_rate": 4.1739217454319413e-07, "loss": 0.1224, "loss_nan_ranks": 0, "loss_rank_avg": 0.1254565268754959, "step": 4080, "valid_targets_mean": 5863.4, "valid_targets_min": 3192 }, { "epoch": 6.599353796445881, "grad_norm": 0.4415821899768825, "learning_rate": 4.0117577167121835e-07, "loss": 0.123, "loss_nan_ranks": 0, "loss_rank_avg": 0.11877983808517456, "step": 4085, "valid_targets_mean": 5662.8, "valid_targets_min": 3604 }, { "epoch": 6.607431340872375, "grad_norm": 0.4035743849460305, "learning_rate": 3.852774680998561e-07, "loss": 0.1267, "loss_nan_ranks": 0, "loss_rank_avg": 0.11850054562091827, "step": 4090, "valid_targets_mean": 5700.8, "valid_targets_min": 2739 }, { "epoch": 6.615508885298869, "grad_norm": 0.46246205856773076, "learning_rate": 3.6969752186699184e-07, "loss": 0.1253, "loss_nan_ranks": 0, "loss_rank_avg": 0.13161437213420868, "step": 4095, "valid_targets_mean": 5081.2, "valid_targets_min": 3038 }, { "epoch": 6.623586429725363, "grad_norm": 0.4273771914997136, "learning_rate": 3.544361858434098e-07, "loss": 0.1262, "loss_nan_ranks": 0, "loss_rank_avg": 0.12390320748090744, "step": 4100, "valid_targets_mean": 5140.4, "valid_targets_min": 1120 }, { "epoch": 6.6316639741518575, "grad_norm": 0.5070081607251208, "learning_rate": 3.3949370772868194e-07, "loss": 0.1293, "loss_nan_ranks": 0, "loss_rank_avg": 0.14423541724681854, "step": 4105, "valid_targets_mean": 5319.9, "valid_targets_min": 2947 }, { "epoch": 6.639741518578353, "grad_norm": 0.4555409998613445, "learning_rate": 3.2487033004713564e-07, "loss": 0.1312, "loss_nan_ranks": 0, "loss_rank_avg": 0.13123884797096252, "step": 4110, "valid_targets_mean": 5210.4, "valid_targets_min": 3311 }, { "epoch": 6.647819063004847, "grad_norm": 0.42299953702729287, "learning_rate": 3.105662901439499e-07, "loss": 0.1202, "loss_nan_ranks": 0, "loss_rank_avg": 0.1164276972413063, "step": 4115, "valid_targets_mean": 5548.9, "valid_targets_min": 3105 }, { "epoch": 6.655896607431341, "grad_norm": 0.5750357035278376, "learning_rate": 2.9658182018126316e-07, "loss": 0.121, "loss_nan_ranks": 0, "loss_rank_avg": 0.12372918426990509, "step": 4120, "valid_targets_mean": 4148.2, "valid_targets_min": 936 }, { "epoch": 6.663974151857835, "grad_norm": 0.39431612594628507, "learning_rate": 2.829171471344294e-07, "loss": 0.1249, "loss_nan_ranks": 0, "loss_rank_avg": 0.11072470247745514, "step": 4125, "valid_targets_mean": 5713.8, "valid_targets_min": 3219 }, { "epoch": 6.6720516962843295, "grad_norm": 0.41958708922647425, "learning_rate": 2.695724927883392e-07, "loss": 0.1187, "loss_nan_ranks": 0, "loss_rank_avg": 0.12350701540708542, "step": 4130, "valid_targets_mean": 5393.2, "valid_targets_min": 2541 }, { "epoch": 6.680129240710824, "grad_norm": 0.43875701635891834, "learning_rate": 2.5654807373379777e-07, "loss": 0.1224, "loss_nan_ranks": 0, "loss_rank_avg": 0.1251029372215271, "step": 4135, "valid_targets_mean": 5595.2, "valid_targets_min": 2490 }, { "epoch": 6.688206785137318, "grad_norm": 0.4338446938410848, "learning_rate": 2.438441013640258e-07, "loss": 0.123, "loss_nan_ranks": 0, "loss_rank_avg": 0.12370643019676208, "step": 4140, "valid_targets_mean": 5581.8, "valid_targets_min": 3348 }, { "epoch": 6.696284329563813, "grad_norm": 0.46482721561432655, "learning_rate": 2.314607818712311e-07, "loss": 0.123, "loss_nan_ranks": 0, "loss_rank_avg": 0.13866999745368958, "step": 4145, "valid_targets_mean": 5038.1, "valid_targets_min": 3053 }, { "epoch": 6.704361873990307, "grad_norm": 0.43402661773234946, "learning_rate": 2.1939831624324226e-07, "loss": 0.1251, "loss_nan_ranks": 0, "loss_rank_avg": 0.12082387506961823, "step": 4150, "valid_targets_mean": 5538.1, "valid_targets_min": 3741 }, { "epoch": 6.7124394184168015, "grad_norm": 0.45577974257774717, "learning_rate": 2.0765690026027353e-07, "loss": 0.129, "loss_nan_ranks": 0, "loss_rank_avg": 0.11891952157020569, "step": 4155, "valid_targets_mean": 4971.3, "valid_targets_min": 1305 }, { "epoch": 6.720516962843296, "grad_norm": 0.4053312005766982, "learning_rate": 1.9623672449172292e-07, "loss": 0.121, "loss_nan_ranks": 0, "loss_rank_avg": 0.11686712503433228, "step": 4160, "valid_targets_mean": 5524.4, "valid_targets_min": 3847 }, { "epoch": 6.72859450726979, "grad_norm": 0.4495177975522038, "learning_rate": 1.8513797429309477e-07, "loss": 0.1237, "loss_nan_ranks": 0, "loss_rank_avg": 0.13314317166805267, "step": 4165, "valid_targets_mean": 5426.2, "valid_targets_min": 3193 }, { "epoch": 6.736672051696284, "grad_norm": 0.4933174749913547, "learning_rate": 1.743608298029842e-07, "loss": 0.1267, "loss_nan_ranks": 0, "loss_rank_avg": 0.13363343477249146, "step": 4170, "valid_targets_mean": 4938.6, "valid_targets_min": 3063 }, { "epoch": 6.744749596122778, "grad_norm": 0.4442812474453568, "learning_rate": 1.6390546594015512e-07, "loss": 0.1244, "loss_nan_ranks": 0, "loss_rank_avg": 0.11812600493431091, "step": 4175, "valid_targets_mean": 5135.5, "valid_targets_min": 3018 }, { "epoch": 6.7528271405492735, "grad_norm": 0.4094154273593245, "learning_rate": 1.5377205240070692e-07, "loss": 0.1239, "loss_nan_ranks": 0, "loss_rank_avg": 0.12172652781009674, "step": 4180, "valid_targets_mean": 6441.6, "valid_targets_min": 2946 }, { "epoch": 6.760904684975768, "grad_norm": 0.4033924852108923, "learning_rate": 1.4396075365530337e-07, "loss": 0.1203, "loss_nan_ranks": 0, "loss_rank_avg": 0.11645178496837616, "step": 4185, "valid_targets_mean": 5842.5, "valid_targets_min": 3388 }, { "epoch": 6.768982229402262, "grad_norm": 0.45671966707657646, "learning_rate": 1.3447172894652582e-07, "loss": 0.1239, "loss_nan_ranks": 0, "loss_rank_avg": 0.13203783333301544, "step": 4190, "valid_targets_mean": 5126.8, "valid_targets_min": 2642 }, { "epoch": 6.777059773828756, "grad_norm": 0.4395252653404362, "learning_rate": 1.2530513228627305e-07, "loss": 0.1275, "loss_nan_ranks": 0, "loss_rank_avg": 0.12178006768226624, "step": 4195, "valid_targets_mean": 5482.8, "valid_targets_min": 3456 }, { "epoch": 6.78513731825525, "grad_norm": 0.4085031802856091, "learning_rate": 1.1646111245326108e-07, "loss": 0.1246, "loss_nan_ranks": 0, "loss_rank_avg": 0.11593121290206909, "step": 4200, "valid_targets_mean": 5370.7, "valid_targets_min": 3289 }, { "epoch": 6.793214862681745, "grad_norm": 0.4155977707068557, "learning_rate": 1.0793981299062061e-07, "loss": 0.12, "loss_nan_ranks": 0, "loss_rank_avg": 0.11050020158290863, "step": 4205, "valid_targets_mean": 6034.5, "valid_targets_min": 2639 }, { "epoch": 6.801292407108239, "grad_norm": 0.49421045013893233, "learning_rate": 9.97413722035545e-08, "loss": 0.1249, "loss_nan_ranks": 0, "loss_rank_avg": 0.12287741899490356, "step": 4210, "valid_targets_mean": 4324.1, "valid_targets_min": 3034 }, { "epoch": 6.809369951534734, "grad_norm": 0.4509493958502341, "learning_rate": 9.186592315710175e-08, "loss": 0.1256, "loss_nan_ranks": 0, "loss_rank_avg": 0.12337324023246765, "step": 4215, "valid_targets_mean": 5274.3, "valid_targets_min": 3306 }, { "epoch": 6.817447495961228, "grad_norm": 0.4824539638852361, "learning_rate": 8.431359367397251e-08, "loss": 0.1218, "loss_nan_ranks": 0, "loss_rank_avg": 0.13827504217624664, "step": 4220, "valid_targets_mean": 5677.6, "valid_targets_min": 3337 }, { "epoch": 6.825525040387722, "grad_norm": 0.4641231639078321, "learning_rate": 7.708450633247655e-08, "loss": 0.1291, "loss_nan_ranks": 0, "loss_rank_avg": 0.13125362992286682, "step": 4225, "valid_targets_mean": 4806.1, "valid_targets_min": 915 }, { "epoch": 6.833602584814217, "grad_norm": 0.43578209394600614, "learning_rate": 7.017877846452692e-08, "loss": 0.125, "loss_nan_ranks": 0, "loss_rank_avg": 0.13602393865585327, "step": 4230, "valid_targets_mean": 5431.9, "valid_targets_min": 3350 }, { "epoch": 6.841680129240711, "grad_norm": 0.4337462209646266, "learning_rate": 6.359652215375045e-08, "loss": 0.1243, "loss_nan_ranks": 0, "loss_rank_avg": 0.1291150450706482, "step": 4235, "valid_targets_mean": 5241.9, "valid_targets_min": 3324 }, { "epoch": 6.849757673667205, "grad_norm": 0.44529633508876937, "learning_rate": 5.733784423365141e-08, "loss": 0.134, "loss_nan_ranks": 0, "loss_rank_avg": 0.13770753145217896, "step": 4240, "valid_targets_mean": 5720.6, "valid_targets_min": 2434 }, { "epoch": 6.857835218093699, "grad_norm": 0.4833382892737251, "learning_rate": 5.140284628589065e-08, "loss": 0.1257, "loss_nan_ranks": 0, "loss_rank_avg": 0.1306309700012207, "step": 4245, "valid_targets_mean": 5192.2, "valid_targets_min": 3305 }, { "epoch": 6.865912762520194, "grad_norm": 0.4569082875177306, "learning_rate": 4.5791624638626966e-08, "loss": 0.1263, "loss_nan_ranks": 0, "loss_rank_avg": 0.13639846444129944, "step": 4250, "valid_targets_mean": 5091.7, "valid_targets_min": 3352 }, { "epoch": 6.8739903069466886, "grad_norm": 0.44052978535555415, "learning_rate": 4.050427036496274e-08, "loss": 0.1208, "loss_nan_ranks": 0, "loss_rank_avg": 0.12174591422080994, "step": 4255, "valid_targets_mean": 5032.0, "valid_targets_min": 3405 }, { "epoch": 6.882067851373183, "grad_norm": 0.4322882078765028, "learning_rate": 3.554086928145628e-08, "loss": 0.1233, "loss_nan_ranks": 0, "loss_rank_avg": 0.12149839103221893, "step": 4260, "valid_targets_mean": 5363.5, "valid_targets_min": 3387 }, { "epoch": 6.890145395799677, "grad_norm": 0.4059631546711396, "learning_rate": 3.090150194674069e-08, "loss": 0.1322, "loss_nan_ranks": 0, "loss_rank_avg": 0.1226094663143158, "step": 4265, "valid_targets_mean": 5866.4, "valid_targets_min": 3317 }, { "epoch": 6.898222940226171, "grad_norm": 0.42761180544079447, "learning_rate": 2.658624366020046e-08, "loss": 0.1341, "loss_nan_ranks": 0, "loss_rank_avg": 0.1262435019016266, "step": 4270, "valid_targets_mean": 5290.6, "valid_targets_min": 2684 }, { "epoch": 6.906300484652665, "grad_norm": 0.4514593673968472, "learning_rate": 2.2595164460768037e-08, "loss": 0.1224, "loss_nan_ranks": 0, "loss_rank_avg": 0.12937885522842407, "step": 4275, "valid_targets_mean": 4918.3, "valid_targets_min": 2783 }, { "epoch": 6.91437802907916, "grad_norm": 0.4155716287333983, "learning_rate": 1.892832912577136e-08, "loss": 0.1233, "loss_nan_ranks": 0, "loss_rank_avg": 0.1169050857424736, "step": 4280, "valid_targets_mean": 5553.2, "valid_targets_min": 2556 }, { "epoch": 6.922455573505655, "grad_norm": 0.468710773720154, "learning_rate": 1.55857971698925e-08, "loss": 0.1267, "loss_nan_ranks": 0, "loss_rank_avg": 0.1221599131822586, "step": 4285, "valid_targets_mean": 5412.1, "valid_targets_min": 906 }, { "epoch": 6.930533117932149, "grad_norm": 0.45936368044765435, "learning_rate": 1.2567622844192885e-08, "loss": 0.1279, "loss_nan_ranks": 0, "loss_rank_avg": 0.14119364321231842, "step": 4290, "valid_targets_mean": 5258.7, "valid_targets_min": 3509 }, { "epoch": 6.938610662358643, "grad_norm": 0.4446837612589739, "learning_rate": 9.87385513524286e-09, "loss": 0.1279, "loss_nan_ranks": 0, "loss_rank_avg": 0.1250559538602829, "step": 4295, "valid_targets_mean": 5432.3, "valid_targets_min": 1471 }, { "epoch": 6.946688206785137, "grad_norm": 0.4374289120449582, "learning_rate": 7.504537764320142e-09, "loss": 0.123, "loss_nan_ranks": 0, "loss_rank_avg": 0.11904168874025345, "step": 4300, "valid_targets_mean": 5316.8, "valid_targets_min": 2943 }, { "epoch": 6.954765751211632, "grad_norm": 0.4125254709747706, "learning_rate": 5.4597091866992465e-09, "loss": 0.1199, "loss_nan_ranks": 0, "loss_rank_avg": 0.10562781989574432, "step": 4305, "valid_targets_mean": 5005.0, "valid_targets_min": 2977 }, { "epoch": 6.962843295638126, "grad_norm": 0.4364936215987924, "learning_rate": 3.7394025910320045e-09, "loss": 0.1325, "loss_nan_ranks": 0, "loss_rank_avg": 0.14175035059452057, "step": 4310, "valid_targets_mean": 5272.9, "valid_targets_min": 3332 }, { "epoch": 6.97092084006462, "grad_norm": 0.43734639977822165, "learning_rate": 2.3436458988057574e-09, "loss": 0.1325, "loss_nan_ranks": 0, "loss_rank_avg": 0.12999486923217773, "step": 4315, "valid_targets_mean": 5339.0, "valid_targets_min": 3848 }, { "epoch": 6.978998384491114, "grad_norm": 0.4629362816601932, "learning_rate": 1.272461763890398e-09, "loss": 0.1262, "loss_nan_ranks": 0, "loss_rank_avg": 0.13342653214931488, "step": 4320, "valid_targets_mean": 5303.4, "valid_targets_min": 1747 }, { "epoch": 6.987075928917609, "grad_norm": 0.41405175355515794, "learning_rate": 5.258675721742101e-10, "loss": 0.119, "loss_nan_ranks": 0, "loss_rank_avg": 0.11401565372943878, "step": 4325, "valid_targets_mean": 5648.8, "valid_targets_min": 2634 }, { "epoch": 6.995153473344104, "grad_norm": 0.4428591581295041, "learning_rate": 1.038754412752141e-10, "loss": 0.1164, "loss_nan_ranks": 0, "loss_rank_avg": 0.13264863193035126, "step": 4330, "valid_targets_mean": 5337.8, "valid_targets_min": 2983 }, { "epoch": 7.0, "loss_nan_ranks": 0, "loss_rank_avg": 0.13213281333446503, "step": 4333, "total_flos": 1596873627009024.0, "train_loss": 0.09127889497572297, "train_runtime": 13176.1283, "train_samples_per_second": 5.26, "train_steps_per_second": 0.329, "valid_targets_mean": 5086.1, "valid_targets_min": 2015 } ], "logging_steps": 5, "max_steps": 4333, "num_input_tokens_seen": 0, "num_train_epochs": 7, "save_steps": 1500, "stateful_callbacks": { "TrainerControl": { "args": { "should_epoch_stop": false, "should_evaluate": false, "should_log": false, "should_save": true, "should_training_stop": true }, "attributes": {} } }, "total_flos": 1596873627009024.0, "train_batch_size": 1, "trial_name": null, "trial_params": null }