{ "best_global_step": null, "best_metric": null, "best_model_checkpoint": null, "epoch": 7.0, "eval_steps": 500, "global_step": 4571, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.007656967840735069, "grad_norm": 13.997882752776386, "learning_rate": 3.4934497816593887e-07, "loss": 0.6676, "loss_nan_ranks": 0, "loss_rank_avg": 0.6494572758674622, "step": 5, "valid_targets_mean": 5030.6, "valid_targets_min": 868 }, { "epoch": 0.015313935681470138, "grad_norm": 16.042150352702777, "learning_rate": 7.860262008733626e-07, "loss": 0.6736, "loss_nan_ranks": 0, "loss_rank_avg": 0.6432679295539856, "step": 10, "valid_targets_mean": 5537.1, "valid_targets_min": 972 }, { "epoch": 0.022970903522205207, "grad_norm": 13.768207464178623, "learning_rate": 1.222707423580786e-06, "loss": 0.657, "loss_nan_ranks": 0, "loss_rank_avg": 0.5933096408843994, "step": 15, "valid_targets_mean": 5550.1, "valid_targets_min": 622 }, { "epoch": 0.030627871362940276, "grad_norm": 11.169416861656957, "learning_rate": 1.6593886462882098e-06, "loss": 0.6091, "loss_nan_ranks": 0, "loss_rank_avg": 0.5853960514068604, "step": 20, "valid_targets_mean": 4935.4, "valid_targets_min": 885 }, { "epoch": 0.03828483920367534, "grad_norm": 7.70196829557587, "learning_rate": 2.096069868995633e-06, "loss": 0.5846, "loss_nan_ranks": 0, "loss_rank_avg": 0.5225365161895752, "step": 25, "valid_targets_mean": 4887.4, "valid_targets_min": 281 }, { "epoch": 0.045941807044410414, "grad_norm": 4.492171953461492, "learning_rate": 2.5327510917030567e-06, "loss": 0.5128, "loss_nan_ranks": 0, "loss_rank_avg": 0.5070335268974304, "step": 30, "valid_targets_mean": 5811.4, "valid_targets_min": 885 }, { "epoch": 0.05359877488514548, "grad_norm": 2.953910981015742, "learning_rate": 2.9694323144104806e-06, "loss": 0.4624, "loss_nan_ranks": 0, "loss_rank_avg": 0.46929267048835754, "step": 35, "valid_targets_mean": 4496.3, "valid_targets_min": 578 }, { "epoch": 0.06125574272588055, "grad_norm": 1.7185069687468981, "learning_rate": 3.406113537117904e-06, "loss": 0.4371, "loss_nan_ranks": 0, "loss_rank_avg": 0.45726278424263, "step": 40, "valid_targets_mean": 4568.8, "valid_targets_min": 588 }, { "epoch": 0.06891271056661562, "grad_norm": 1.2031548219005852, "learning_rate": 3.842794759825328e-06, "loss": 0.4393, "loss_nan_ranks": 0, "loss_rank_avg": 0.40769797563552856, "step": 45, "valid_targets_mean": 5177.7, "valid_targets_min": 660 }, { "epoch": 0.07656967840735068, "grad_norm": 1.0641842496634077, "learning_rate": 4.279475982532751e-06, "loss": 0.4176, "loss_nan_ranks": 0, "loss_rank_avg": 0.4184693992137909, "step": 50, "valid_targets_mean": 4836.5, "valid_targets_min": 461 }, { "epoch": 0.08422664624808576, "grad_norm": 0.828475734146539, "learning_rate": 4.716157205240175e-06, "loss": 0.3962, "loss_nan_ranks": 0, "loss_rank_avg": 0.39677250385284424, "step": 55, "valid_targets_mean": 5396.1, "valid_targets_min": 1014 }, { "epoch": 0.09188361408882083, "grad_norm": 0.7394723747598436, "learning_rate": 5.152838427947598e-06, "loss": 0.3992, "loss_nan_ranks": 0, "loss_rank_avg": 0.4369763731956482, "step": 60, "valid_targets_mean": 5712.2, "valid_targets_min": 701 }, { "epoch": 0.0995405819295559, "grad_norm": 0.7090139134911532, "learning_rate": 5.589519650655022e-06, "loss": 0.3872, "loss_nan_ranks": 0, "loss_rank_avg": 0.3982025682926178, "step": 65, "valid_targets_mean": 5389.4, "valid_targets_min": 2834 }, { "epoch": 0.10719754977029096, "grad_norm": 0.593009086861499, "learning_rate": 6.0262008733624455e-06, "loss": 0.3983, "loss_nan_ranks": 0, "loss_rank_avg": 0.3946113586425781, "step": 70, "valid_targets_mean": 5376.4, "valid_targets_min": 2715 }, { "epoch": 0.11485451761102604, "grad_norm": 0.636095693800591, "learning_rate": 6.462882096069869e-06, "loss": 0.3619, "loss_nan_ranks": 0, "loss_rank_avg": 0.32831794023513794, "step": 75, "valid_targets_mean": 5254.6, "valid_targets_min": 966 }, { "epoch": 0.1225114854517611, "grad_norm": 0.6038700595775229, "learning_rate": 6.8995633187772934e-06, "loss": 0.354, "loss_nan_ranks": 0, "loss_rank_avg": 0.3565768003463745, "step": 80, "valid_targets_mean": 4155.2, "valid_targets_min": 629 }, { "epoch": 0.13016845329249618, "grad_norm": 0.9336428663228459, "learning_rate": 7.336244541484717e-06, "loss": 0.3673, "loss_nan_ranks": 0, "loss_rank_avg": 0.34234848618507385, "step": 85, "valid_targets_mean": 4569.0, "valid_targets_min": 750 }, { "epoch": 0.13782542113323124, "grad_norm": 0.4930514762752864, "learning_rate": 7.77292576419214e-06, "loss": 0.326, "loss_nan_ranks": 0, "loss_rank_avg": 0.29909199476242065, "step": 90, "valid_targets_mean": 5865.1, "valid_targets_min": 731 }, { "epoch": 0.14548238897396631, "grad_norm": 0.5516406220071951, "learning_rate": 8.209606986899564e-06, "loss": 0.3488, "loss_nan_ranks": 0, "loss_rank_avg": 0.35991543531417847, "step": 95, "valid_targets_mean": 4539.4, "valid_targets_min": 718 }, { "epoch": 0.15313935681470137, "grad_norm": 0.512386584582494, "learning_rate": 8.646288209606988e-06, "loss": 0.3378, "loss_nan_ranks": 0, "loss_rank_avg": 0.31739532947540283, "step": 100, "valid_targets_mean": 5295.0, "valid_targets_min": 358 }, { "epoch": 0.16079632465543645, "grad_norm": 0.5553107691519705, "learning_rate": 9.082969432314411e-06, "loss": 0.3145, "loss_nan_ranks": 0, "loss_rank_avg": 0.34066033363342285, "step": 105, "valid_targets_mean": 4267.7, "valid_targets_min": 671 }, { "epoch": 0.16845329249617153, "grad_norm": 0.5564940658094145, "learning_rate": 9.519650655021835e-06, "loss": 0.3333, "loss_nan_ranks": 0, "loss_rank_avg": 0.3298887014389038, "step": 110, "valid_targets_mean": 4755.4, "valid_targets_min": 862 }, { "epoch": 0.17611026033690658, "grad_norm": 0.5091671224165091, "learning_rate": 9.956331877729258e-06, "loss": 0.3392, "loss_nan_ranks": 0, "loss_rank_avg": 0.32190486788749695, "step": 115, "valid_targets_mean": 4750.4, "valid_targets_min": 971 }, { "epoch": 0.18376722817764166, "grad_norm": 0.4905326318477757, "learning_rate": 1.0393013100436682e-05, "loss": 0.3471, "loss_nan_ranks": 0, "loss_rank_avg": 0.3529035151004791, "step": 120, "valid_targets_mean": 5538.1, "valid_targets_min": 935 }, { "epoch": 0.19142419601837674, "grad_norm": 0.5048261747177855, "learning_rate": 1.0829694323144107e-05, "loss": 0.3196, "loss_nan_ranks": 0, "loss_rank_avg": 0.30244866013526917, "step": 125, "valid_targets_mean": 4734.5, "valid_targets_min": 638 }, { "epoch": 0.1990811638591118, "grad_norm": 0.5361239607380978, "learning_rate": 1.1266375545851529e-05, "loss": 0.3294, "loss_nan_ranks": 0, "loss_rank_avg": 0.308383584022522, "step": 130, "valid_targets_mean": 4705.6, "valid_targets_min": 873 }, { "epoch": 0.20673813169984687, "grad_norm": 0.46801822029453244, "learning_rate": 1.1703056768558954e-05, "loss": 0.2881, "loss_nan_ranks": 0, "loss_rank_avg": 0.29804354906082153, "step": 135, "valid_targets_mean": 5411.8, "valid_targets_min": 2391 }, { "epoch": 0.21439509954058192, "grad_norm": 0.47487492624683453, "learning_rate": 1.2139737991266376e-05, "loss": 0.3113, "loss_nan_ranks": 0, "loss_rank_avg": 0.26761284470558167, "step": 140, "valid_targets_mean": 4593.1, "valid_targets_min": 564 }, { "epoch": 0.222052067381317, "grad_norm": 0.4825202183874898, "learning_rate": 1.2576419213973801e-05, "loss": 0.3008, "loss_nan_ranks": 0, "loss_rank_avg": 0.27101266384124756, "step": 145, "valid_targets_mean": 4800.3, "valid_targets_min": 720 }, { "epoch": 0.22970903522205208, "grad_norm": 0.5108014073726733, "learning_rate": 1.3013100436681223e-05, "loss": 0.3192, "loss_nan_ranks": 0, "loss_rank_avg": 0.32333505153656006, "step": 150, "valid_targets_mean": 4791.2, "valid_targets_min": 832 }, { "epoch": 0.23736600306278713, "grad_norm": 0.516438690481993, "learning_rate": 1.3449781659388648e-05, "loss": 0.3057, "loss_nan_ranks": 0, "loss_rank_avg": 0.3009350001811981, "step": 155, "valid_targets_mean": 5810.0, "valid_targets_min": 412 }, { "epoch": 0.2450229709035222, "grad_norm": 0.5405272774787385, "learning_rate": 1.388646288209607e-05, "loss": 0.2992, "loss_nan_ranks": 0, "loss_rank_avg": 0.2833111882209778, "step": 160, "valid_targets_mean": 4378.3, "valid_targets_min": 700 }, { "epoch": 0.25267993874425726, "grad_norm": 0.48541608893286375, "learning_rate": 1.4323144104803495e-05, "loss": 0.3087, "loss_nan_ranks": 0, "loss_rank_avg": 0.2991043031215668, "step": 165, "valid_targets_mean": 5449.2, "valid_targets_min": 854 }, { "epoch": 0.26033690658499237, "grad_norm": 0.4369414808456571, "learning_rate": 1.4759825327510919e-05, "loss": 0.3029, "loss_nan_ranks": 0, "loss_rank_avg": 0.29198282957077026, "step": 170, "valid_targets_mean": 5611.1, "valid_targets_min": 470 }, { "epoch": 0.2679938744257274, "grad_norm": 0.4650699347244396, "learning_rate": 1.5196506550218343e-05, "loss": 0.2759, "loss_nan_ranks": 0, "loss_rank_avg": 0.2635342478752136, "step": 175, "valid_targets_mean": 5909.5, "valid_targets_min": 904 }, { "epoch": 0.27565084226646247, "grad_norm": 0.38904002970727797, "learning_rate": 1.5633187772925766e-05, "loss": 0.28, "loss_nan_ranks": 0, "loss_rank_avg": 0.23884126543998718, "step": 180, "valid_targets_mean": 6394.3, "valid_targets_min": 2659 }, { "epoch": 0.2833078101071976, "grad_norm": 0.4430505165500373, "learning_rate": 1.6069868995633188e-05, "loss": 0.2997, "loss_nan_ranks": 0, "loss_rank_avg": 0.2831938862800598, "step": 185, "valid_targets_mean": 6014.1, "valid_targets_min": 2080 }, { "epoch": 0.29096477794793263, "grad_norm": 0.5388790759052032, "learning_rate": 1.6506550218340613e-05, "loss": 0.2739, "loss_nan_ranks": 0, "loss_rank_avg": 0.2641902565956116, "step": 190, "valid_targets_mean": 5561.6, "valid_targets_min": 2686 }, { "epoch": 0.2986217457886677, "grad_norm": 0.42663945124008945, "learning_rate": 1.6943231441048035e-05, "loss": 0.2874, "loss_nan_ranks": 0, "loss_rank_avg": 0.2681276798248291, "step": 195, "valid_targets_mean": 5588.3, "valid_targets_min": 814 }, { "epoch": 0.30627871362940273, "grad_norm": 0.4943538108066963, "learning_rate": 1.737991266375546e-05, "loss": 0.3049, "loss_nan_ranks": 0, "loss_rank_avg": 0.2886020839214325, "step": 200, "valid_targets_mean": 4703.8, "valid_targets_min": 837 }, { "epoch": 0.31393568147013784, "grad_norm": 0.5295715062499827, "learning_rate": 1.7816593886462882e-05, "loss": 0.2966, "loss_nan_ranks": 0, "loss_rank_avg": 0.28761541843414307, "step": 205, "valid_targets_mean": 4730.3, "valid_targets_min": 648 }, { "epoch": 0.3215926493108729, "grad_norm": 0.5017011172561703, "learning_rate": 1.8253275109170307e-05, "loss": 0.2838, "loss_nan_ranks": 0, "loss_rank_avg": 0.292784184217453, "step": 210, "valid_targets_mean": 5370.1, "valid_targets_min": 1679 }, { "epoch": 0.32924961715160794, "grad_norm": 0.5384473207239906, "learning_rate": 1.868995633187773e-05, "loss": 0.2944, "loss_nan_ranks": 0, "loss_rank_avg": 0.2923944890499115, "step": 215, "valid_targets_mean": 4821.5, "valid_targets_min": 561 }, { "epoch": 0.33690658499234305, "grad_norm": 0.54252385993879, "learning_rate": 1.9126637554585155e-05, "loss": 0.2731, "loss_nan_ranks": 0, "loss_rank_avg": 0.25203627347946167, "step": 220, "valid_targets_mean": 4703.9, "valid_targets_min": 862 }, { "epoch": 0.3445635528330781, "grad_norm": 0.4590346647689083, "learning_rate": 1.9563318777292576e-05, "loss": 0.2939, "loss_nan_ranks": 0, "loss_rank_avg": 0.26956477761268616, "step": 225, "valid_targets_mean": 5403.2, "valid_targets_min": 292 }, { "epoch": 0.35222052067381315, "grad_norm": 0.591472293986723, "learning_rate": 2e-05, "loss": 0.2893, "loss_nan_ranks": 0, "loss_rank_avg": 0.2686610817909241, "step": 230, "valid_targets_mean": 5279.8, "valid_targets_min": 312 }, { "epoch": 0.35987748851454826, "grad_norm": 0.5351371337014471, "learning_rate": 2.0436681222707423e-05, "loss": 0.2962, "loss_nan_ranks": 0, "loss_rank_avg": 0.302329421043396, "step": 235, "valid_targets_mean": 4985.8, "valid_targets_min": 585 }, { "epoch": 0.3675344563552833, "grad_norm": 0.50551102825952, "learning_rate": 2.0873362445414852e-05, "loss": 0.2767, "loss_nan_ranks": 0, "loss_rank_avg": 0.26980355381965637, "step": 240, "valid_targets_mean": 4849.7, "valid_targets_min": 512 }, { "epoch": 0.37519142419601836, "grad_norm": 0.5476580929537973, "learning_rate": 2.1310043668122274e-05, "loss": 0.2783, "loss_nan_ranks": 0, "loss_rank_avg": 0.30016613006591797, "step": 245, "valid_targets_mean": 4602.2, "valid_targets_min": 611 }, { "epoch": 0.38284839203675347, "grad_norm": 0.538603533015244, "learning_rate": 2.1746724890829696e-05, "loss": 0.2917, "loss_nan_ranks": 0, "loss_rank_avg": 0.2950373888015747, "step": 250, "valid_targets_mean": 4244.2, "valid_targets_min": 614 }, { "epoch": 0.3905053598774885, "grad_norm": 0.5405956170504431, "learning_rate": 2.2183406113537118e-05, "loss": 0.2691, "loss_nan_ranks": 0, "loss_rank_avg": 0.28181028366088867, "step": 255, "valid_targets_mean": 4765.5, "valid_targets_min": 625 }, { "epoch": 0.3981623277182236, "grad_norm": 0.4349349330799182, "learning_rate": 2.2620087336244546e-05, "loss": 0.2767, "loss_nan_ranks": 0, "loss_rank_avg": 0.23736879229545593, "step": 260, "valid_targets_mean": 5519.2, "valid_targets_min": 829 }, { "epoch": 0.4058192955589586, "grad_norm": 0.479699481190532, "learning_rate": 2.3056768558951968e-05, "loss": 0.2741, "loss_nan_ranks": 0, "loss_rank_avg": 0.250985324382782, "step": 265, "valid_targets_mean": 4890.2, "valid_targets_min": 267 }, { "epoch": 0.41347626339969373, "grad_norm": 0.48110082764216044, "learning_rate": 2.349344978165939e-05, "loss": 0.2735, "loss_nan_ranks": 0, "loss_rank_avg": 0.2574954926967621, "step": 270, "valid_targets_mean": 5548.7, "valid_targets_min": 1079 }, { "epoch": 0.4211332312404288, "grad_norm": 0.5259890409455534, "learning_rate": 2.3930131004366812e-05, "loss": 0.2685, "loss_nan_ranks": 0, "loss_rank_avg": 0.2683018445968628, "step": 275, "valid_targets_mean": 5199.2, "valid_targets_min": 764 }, { "epoch": 0.42879019908116384, "grad_norm": 0.4872321788705009, "learning_rate": 2.436681222707424e-05, "loss": 0.2817, "loss_nan_ranks": 0, "loss_rank_avg": 0.2631978988647461, "step": 280, "valid_targets_mean": 5506.2, "valid_targets_min": 2013 }, { "epoch": 0.43644716692189894, "grad_norm": 0.49171872502106884, "learning_rate": 2.4803493449781662e-05, "loss": 0.2738, "loss_nan_ranks": 0, "loss_rank_avg": 0.2735797166824341, "step": 285, "valid_targets_mean": 5573.5, "valid_targets_min": 701 }, { "epoch": 0.444104134762634, "grad_norm": 0.5457671973926761, "learning_rate": 2.5240174672489084e-05, "loss": 0.2705, "loss_nan_ranks": 0, "loss_rank_avg": 0.272636353969574, "step": 290, "valid_targets_mean": 4353.8, "valid_targets_min": 851 }, { "epoch": 0.45176110260336905, "grad_norm": 0.6850256638019349, "learning_rate": 2.567685589519651e-05, "loss": 0.2741, "loss_nan_ranks": 0, "loss_rank_avg": 0.25342246890068054, "step": 295, "valid_targets_mean": 5045.3, "valid_targets_min": 585 }, { "epoch": 0.45941807044410415, "grad_norm": 0.5394245332540767, "learning_rate": 2.6113537117903935e-05, "loss": 0.2751, "loss_nan_ranks": 0, "loss_rank_avg": 0.2724701166152954, "step": 300, "valid_targets_mean": 4828.3, "valid_targets_min": 875 }, { "epoch": 0.4670750382848392, "grad_norm": 0.5175333803982558, "learning_rate": 2.6550218340611357e-05, "loss": 0.2564, "loss_nan_ranks": 0, "loss_rank_avg": 0.2658703625202179, "step": 305, "valid_targets_mean": 5024.8, "valid_targets_min": 301 }, { "epoch": 0.47473200612557426, "grad_norm": 0.4885980644156084, "learning_rate": 2.698689956331878e-05, "loss": 0.2811, "loss_nan_ranks": 0, "loss_rank_avg": 0.27572572231292725, "step": 310, "valid_targets_mean": 4917.0, "valid_targets_min": 993 }, { "epoch": 0.48238897396630936, "grad_norm": 0.9846395603780147, "learning_rate": 2.7423580786026204e-05, "loss": 0.2814, "loss_nan_ranks": 0, "loss_rank_avg": 0.2755519151687622, "step": 315, "valid_targets_mean": 4701.9, "valid_targets_min": 802 }, { "epoch": 0.4900459418070444, "grad_norm": 0.5476680571665029, "learning_rate": 2.786026200873363e-05, "loss": 0.2835, "loss_nan_ranks": 0, "loss_rank_avg": 0.31073257327079773, "step": 320, "valid_targets_mean": 5116.8, "valid_targets_min": 806 }, { "epoch": 0.49770290964777947, "grad_norm": 0.48787777876251054, "learning_rate": 2.829694323144105e-05, "loss": 0.2691, "loss_nan_ranks": 0, "loss_rank_avg": 0.24321046471595764, "step": 325, "valid_targets_mean": 4564.9, "valid_targets_min": 591 }, { "epoch": 0.5053598774885145, "grad_norm": 0.581959700960055, "learning_rate": 2.8733624454148473e-05, "loss": 0.2604, "loss_nan_ranks": 0, "loss_rank_avg": 0.2841954827308655, "step": 330, "valid_targets_mean": 5433.1, "valid_targets_min": 538 }, { "epoch": 0.5130168453292496, "grad_norm": 0.5197427771747507, "learning_rate": 2.9170305676855898e-05, "loss": 0.2606, "loss_nan_ranks": 0, "loss_rank_avg": 0.24852226674556732, "step": 335, "valid_targets_mean": 5383.6, "valid_targets_min": 2532 }, { "epoch": 0.5206738131699847, "grad_norm": 0.5832961166696086, "learning_rate": 2.960698689956332e-05, "loss": 0.2628, "loss_nan_ranks": 0, "loss_rank_avg": 0.283719003200531, "step": 340, "valid_targets_mean": 4863.8, "valid_targets_min": 809 }, { "epoch": 0.5283307810107197, "grad_norm": 0.5190165410837098, "learning_rate": 3.0043668122270745e-05, "loss": 0.2647, "loss_nan_ranks": 0, "loss_rank_avg": 0.2984423041343689, "step": 345, "valid_targets_mean": 5248.1, "valid_targets_min": 472 }, { "epoch": 0.5359877488514548, "grad_norm": 0.5424715125473839, "learning_rate": 3.0480349344978167e-05, "loss": 0.2731, "loss_nan_ranks": 0, "loss_rank_avg": 0.27597424387931824, "step": 350, "valid_targets_mean": 4519.0, "valid_targets_min": 645 }, { "epoch": 0.5436447166921899, "grad_norm": 0.5792391186945091, "learning_rate": 3.091703056768559e-05, "loss": 0.27, "loss_nan_ranks": 0, "loss_rank_avg": 0.26070481538772583, "step": 355, "valid_targets_mean": 4367.1, "valid_targets_min": 625 }, { "epoch": 0.5513016845329249, "grad_norm": 0.61377111290995, "learning_rate": 3.1353711790393014e-05, "loss": 0.2653, "loss_nan_ranks": 0, "loss_rank_avg": 0.30032479763031006, "step": 360, "valid_targets_mean": 4076.1, "valid_targets_min": 655 }, { "epoch": 0.55895865237366, "grad_norm": 0.4499780741388462, "learning_rate": 3.1790393013100436e-05, "loss": 0.2696, "loss_nan_ranks": 0, "loss_rank_avg": 0.26613035798072815, "step": 365, "valid_targets_mean": 5930.6, "valid_targets_min": 2546 }, { "epoch": 0.5666156202143952, "grad_norm": 0.6040296111678708, "learning_rate": 3.2227074235807864e-05, "loss": 0.2621, "loss_nan_ranks": 0, "loss_rank_avg": 0.26369449496269226, "step": 370, "valid_targets_mean": 4356.6, "valid_targets_min": 767 }, { "epoch": 0.5742725880551302, "grad_norm": 0.5341830406768366, "learning_rate": 3.2663755458515286e-05, "loss": 0.2657, "loss_nan_ranks": 0, "loss_rank_avg": 0.30968743562698364, "step": 375, "valid_targets_mean": 5326.2, "valid_targets_min": 924 }, { "epoch": 0.5819295558958653, "grad_norm": 0.6231930070736144, "learning_rate": 3.310043668122271e-05, "loss": 0.267, "loss_nan_ranks": 0, "loss_rank_avg": 0.29652100801467896, "step": 380, "valid_targets_mean": 4574.1, "valid_targets_min": 313 }, { "epoch": 0.5895865237366003, "grad_norm": 0.575410318717094, "learning_rate": 3.353711790393013e-05, "loss": 0.2579, "loss_nan_ranks": 0, "loss_rank_avg": 0.2684730589389801, "step": 385, "valid_targets_mean": 4358.5, "valid_targets_min": 308 }, { "epoch": 0.5972434915773354, "grad_norm": 0.4673654478032364, "learning_rate": 3.397379912663756e-05, "loss": 0.2557, "loss_nan_ranks": 0, "loss_rank_avg": 0.2228243201971054, "step": 390, "valid_targets_mean": 5666.8, "valid_targets_min": 625 }, { "epoch": 0.6049004594180705, "grad_norm": 0.48675286049843114, "learning_rate": 3.441048034934498e-05, "loss": 0.2616, "loss_nan_ranks": 0, "loss_rank_avg": 0.23089733719825745, "step": 395, "valid_targets_mean": 5237.9, "valid_targets_min": 379 }, { "epoch": 0.6125574272588055, "grad_norm": 0.560591662575993, "learning_rate": 3.48471615720524e-05, "loss": 0.2688, "loss_nan_ranks": 0, "loss_rank_avg": 0.2665928602218628, "step": 400, "valid_targets_mean": 4672.1, "valid_targets_min": 645 }, { "epoch": 0.6202143950995406, "grad_norm": 0.42731570802442403, "learning_rate": 3.5283842794759824e-05, "loss": 0.2403, "loss_nan_ranks": 0, "loss_rank_avg": 0.22624076902866364, "step": 405, "valid_targets_mean": 5482.8, "valid_targets_min": 592 }, { "epoch": 0.6278713629402757, "grad_norm": 0.5347556972076133, "learning_rate": 3.572052401746725e-05, "loss": 0.2643, "loss_nan_ranks": 0, "loss_rank_avg": 0.23603232204914093, "step": 410, "valid_targets_mean": 5739.4, "valid_targets_min": 743 }, { "epoch": 0.6355283307810107, "grad_norm": 0.5325226811766738, "learning_rate": 3.6157205240174675e-05, "loss": 0.2515, "loss_nan_ranks": 0, "loss_rank_avg": 0.2480698823928833, "step": 415, "valid_targets_mean": 4790.4, "valid_targets_min": 1224 }, { "epoch": 0.6431852986217458, "grad_norm": 0.48048305351290477, "learning_rate": 3.6593886462882097e-05, "loss": 0.2573, "loss_nan_ranks": 0, "loss_rank_avg": 0.24673986434936523, "step": 420, "valid_targets_mean": 5280.0, "valid_targets_min": 949 }, { "epoch": 0.6508422664624809, "grad_norm": 0.5456250025761155, "learning_rate": 3.7030567685589525e-05, "loss": 0.2501, "loss_nan_ranks": 0, "loss_rank_avg": 0.2480792999267578, "step": 425, "valid_targets_mean": 5479.8, "valid_targets_min": 1915 }, { "epoch": 0.6584992343032159, "grad_norm": 0.564296936232767, "learning_rate": 3.746724890829695e-05, "loss": 0.2549, "loss_nan_ranks": 0, "loss_rank_avg": 0.2615630030632019, "step": 430, "valid_targets_mean": 5361.0, "valid_targets_min": 877 }, { "epoch": 0.666156202143951, "grad_norm": 0.48996027764636907, "learning_rate": 3.790393013100437e-05, "loss": 0.2639, "loss_nan_ranks": 0, "loss_rank_avg": 0.24756395816802979, "step": 435, "valid_targets_mean": 4916.1, "valid_targets_min": 326 }, { "epoch": 0.6738131699846861, "grad_norm": 0.44623955424804534, "learning_rate": 3.834061135371179e-05, "loss": 0.2372, "loss_nan_ranks": 0, "loss_rank_avg": 0.23491841554641724, "step": 440, "valid_targets_mean": 5672.4, "valid_targets_min": 429 }, { "epoch": 0.6814701378254211, "grad_norm": 0.45284851458486386, "learning_rate": 3.877729257641922e-05, "loss": 0.2497, "loss_nan_ranks": 0, "loss_rank_avg": 0.2342417687177658, "step": 445, "valid_targets_mean": 5099.3, "valid_targets_min": 687 }, { "epoch": 0.6891271056661562, "grad_norm": 0.5324943693738649, "learning_rate": 3.921397379912664e-05, "loss": 0.2514, "loss_nan_ranks": 0, "loss_rank_avg": 0.27402836084365845, "step": 450, "valid_targets_mean": 4484.3, "valid_targets_min": 580 }, { "epoch": 0.6967840735068913, "grad_norm": 0.4646196239617948, "learning_rate": 3.965065502183406e-05, "loss": 0.2696, "loss_nan_ranks": 0, "loss_rank_avg": 0.24006010591983795, "step": 455, "valid_targets_mean": 4958.8, "valid_targets_min": 911 }, { "epoch": 0.7044410413476263, "grad_norm": 0.4405348727571011, "learning_rate": 3.9999994165786676e-05, "loss": 0.2406, "loss_nan_ranks": 0, "loss_rank_avg": 0.22806835174560547, "step": 460, "valid_targets_mean": 5592.2, "valid_targets_min": 2673 }, { "epoch": 0.7120980091883614, "grad_norm": 0.5562861867740798, "learning_rate": 3.9999789968677496e-05, "loss": 0.2741, "loss_nan_ranks": 0, "loss_rank_avg": 0.2417786568403244, "step": 465, "valid_targets_mean": 4365.9, "valid_targets_min": 566 }, { "epoch": 0.7197549770290965, "grad_norm": 0.5080252815095521, "learning_rate": 3.999929406430558e-05, "loss": 0.2568, "loss_nan_ranks": 0, "loss_rank_avg": 0.2633582651615143, "step": 470, "valid_targets_mean": 4811.5, "valid_targets_min": 530 }, { "epoch": 0.7274119448698315, "grad_norm": 0.5272035775867764, "learning_rate": 3.999850645990394e-05, "loss": 0.2524, "loss_nan_ranks": 0, "loss_rank_avg": 0.24008730053901672, "step": 475, "valid_targets_mean": 4771.0, "valid_targets_min": 686 }, { "epoch": 0.7350689127105666, "grad_norm": 0.4754003904766261, "learning_rate": 3.999742716696021e-05, "loss": 0.2617, "loss_nan_ranks": 0, "loss_rank_avg": 0.23725548386573792, "step": 480, "valid_targets_mean": 5124.4, "valid_targets_min": 464 }, { "epoch": 0.7427258805513017, "grad_norm": 0.6101466292156634, "learning_rate": 3.999605620121641e-05, "loss": 0.2598, "loss_nan_ranks": 0, "loss_rank_avg": 0.24445194005966187, "step": 485, "valid_targets_mean": 5324.8, "valid_targets_min": 660 }, { "epoch": 0.7503828483920367, "grad_norm": 0.4637006971657633, "learning_rate": 3.9994393582668806e-05, "loss": 0.2527, "loss_nan_ranks": 0, "loss_rank_avg": 0.2397041618824005, "step": 490, "valid_targets_mean": 5648.9, "valid_targets_min": 777 }, { "epoch": 0.7580398162327718, "grad_norm": 0.5016071627691048, "learning_rate": 3.999243933556753e-05, "loss": 0.2535, "loss_nan_ranks": 0, "loss_rank_avg": 0.2539515197277069, "step": 495, "valid_targets_mean": 4441.4, "valid_targets_min": 321 }, { "epoch": 0.7656967840735069, "grad_norm": 0.4754215254300854, "learning_rate": 3.9990193488416304e-05, "loss": 0.2622, "loss_nan_ranks": 0, "loss_rank_avg": 0.2377694994211197, "step": 500, "valid_targets_mean": 5602.7, "valid_targets_min": 674 }, { "epoch": 0.7733537519142419, "grad_norm": 0.4442741247780648, "learning_rate": 3.9987656073971946e-05, "loss": 0.2403, "loss_nan_ranks": 0, "loss_rank_avg": 0.2323368787765503, "step": 505, "valid_targets_mean": 5325.0, "valid_targets_min": 841 }, { "epoch": 0.781010719754977, "grad_norm": 0.499596334503463, "learning_rate": 3.998482712924397e-05, "loss": 0.2368, "loss_nan_ranks": 0, "loss_rank_avg": 0.2620323896408081, "step": 510, "valid_targets_mean": 4717.8, "valid_targets_min": 740 }, { "epoch": 0.7886676875957122, "grad_norm": 0.4715666857814281, "learning_rate": 3.9981706695493996e-05, "loss": 0.2432, "loss_nan_ranks": 0, "loss_rank_avg": 0.27169761061668396, "step": 515, "valid_targets_mean": 5186.8, "valid_targets_min": 2363 }, { "epoch": 0.7963246554364471, "grad_norm": 0.5743001328378289, "learning_rate": 3.997829481823515e-05, "loss": 0.2699, "loss_nan_ranks": 0, "loss_rank_avg": 0.27855122089385986, "step": 520, "valid_targets_mean": 4762.1, "valid_targets_min": 593 }, { "epoch": 0.8039816232771823, "grad_norm": 0.47759303305733847, "learning_rate": 3.997459154723144e-05, "loss": 0.2535, "loss_nan_ranks": 0, "loss_rank_avg": 0.2423936426639557, "step": 525, "valid_targets_mean": 5297.0, "valid_targets_min": 854 }, { "epoch": 0.8116385911179173, "grad_norm": 0.46683109553118957, "learning_rate": 3.9970596936496976e-05, "loss": 0.2477, "loss_nan_ranks": 0, "loss_rank_avg": 0.2846606373786926, "step": 530, "valid_targets_mean": 6037.3, "valid_targets_min": 691 }, { "epoch": 0.8192955589586524, "grad_norm": 0.4707779779562285, "learning_rate": 3.996631104429521e-05, "loss": 0.2614, "loss_nan_ranks": 0, "loss_rank_avg": 0.22087471187114716, "step": 535, "valid_targets_mean": 5019.9, "valid_targets_min": 876 }, { "epoch": 0.8269525267993875, "grad_norm": 0.5479924065007178, "learning_rate": 3.9961733933138106e-05, "loss": 0.2394, "loss_nan_ranks": 0, "loss_rank_avg": 0.23031362891197205, "step": 540, "valid_targets_mean": 4613.0, "valid_targets_min": 2571 }, { "epoch": 0.8346094946401225, "grad_norm": 0.5706626665016054, "learning_rate": 3.9956865669785185e-05, "loss": 0.2591, "loss_nan_ranks": 0, "loss_rank_avg": 0.2653731405735016, "step": 545, "valid_targets_mean": 4250.2, "valid_targets_min": 499 }, { "epoch": 0.8422664624808576, "grad_norm": 0.45823962344649066, "learning_rate": 3.9951706325242595e-05, "loss": 0.2598, "loss_nan_ranks": 0, "loss_rank_avg": 0.214570090174675, "step": 550, "valid_targets_mean": 5601.8, "valid_targets_min": 1935 }, { "epoch": 0.8499234303215927, "grad_norm": 0.4798067262429478, "learning_rate": 3.9946255974762023e-05, "loss": 0.2574, "loss_nan_ranks": 0, "loss_rank_avg": 0.22499428689479828, "step": 555, "valid_targets_mean": 4887.4, "valid_targets_min": 559 }, { "epoch": 0.8575803981623277, "grad_norm": 0.5354869537077036, "learning_rate": 3.9940514697839654e-05, "loss": 0.2707, "loss_nan_ranks": 0, "loss_rank_avg": 0.2552046775817871, "step": 560, "valid_targets_mean": 4646.8, "valid_targets_min": 584 }, { "epoch": 0.8652373660030628, "grad_norm": 0.404422046345916, "learning_rate": 3.993448257821498e-05, "loss": 0.2363, "loss_nan_ranks": 0, "loss_rank_avg": 0.2055911421775818, "step": 565, "valid_targets_mean": 5405.6, "valid_targets_min": 2000 }, { "epoch": 0.8728943338437979, "grad_norm": 0.9512439674975726, "learning_rate": 3.992815970386956e-05, "loss": 0.2309, "loss_nan_ranks": 0, "loss_rank_avg": 0.22652213275432587, "step": 570, "valid_targets_mean": 5747.8, "valid_targets_min": 731 }, { "epoch": 0.8805513016845329, "grad_norm": 0.49581746326271475, "learning_rate": 3.99215461670258e-05, "loss": 0.2564, "loss_nan_ranks": 0, "loss_rank_avg": 0.25263649225234985, "step": 575, "valid_targets_mean": 4818.8, "valid_targets_min": 636 }, { "epoch": 0.888208269525268, "grad_norm": 0.5193294216924808, "learning_rate": 3.9914642064145555e-05, "loss": 0.2306, "loss_nan_ranks": 0, "loss_rank_avg": 0.24224933981895447, "step": 580, "valid_targets_mean": 4697.4, "valid_targets_min": 768 }, { "epoch": 0.8958652373660031, "grad_norm": 0.5081023804449541, "learning_rate": 3.990744749592871e-05, "loss": 0.2514, "loss_nan_ranks": 0, "loss_rank_avg": 0.25167709589004517, "step": 585, "valid_targets_mean": 5235.0, "valid_targets_min": 447 }, { "epoch": 0.9035222052067381, "grad_norm": 0.43150283564796665, "learning_rate": 3.989996256731178e-05, "loss": 0.2655, "loss_nan_ranks": 0, "loss_rank_avg": 0.24848490953445435, "step": 590, "valid_targets_mean": 5873.1, "valid_targets_min": 631 }, { "epoch": 0.9111791730474732, "grad_norm": 0.490082147198131, "learning_rate": 3.9892187387466286e-05, "loss": 0.2498, "loss_nan_ranks": 0, "loss_rank_avg": 0.2544364631175995, "step": 595, "valid_targets_mean": 5240.1, "valid_targets_min": 776 }, { "epoch": 0.9188361408882083, "grad_norm": 0.47301661085243424, "learning_rate": 3.9884122069797256e-05, "loss": 0.2388, "loss_nan_ranks": 0, "loss_rank_avg": 0.23627778887748718, "step": 600, "valid_targets_mean": 4547.9, "valid_targets_min": 1232 }, { "epoch": 0.9264931087289433, "grad_norm": 0.6020593350379793, "learning_rate": 3.9875766731941514e-05, "loss": 0.244, "loss_nan_ranks": 0, "loss_rank_avg": 0.25998401641845703, "step": 605, "valid_targets_mean": 5206.4, "valid_targets_min": 1670 }, { "epoch": 0.9341500765696784, "grad_norm": 0.4343199562247558, "learning_rate": 3.986712149576597e-05, "loss": 0.2343, "loss_nan_ranks": 0, "loss_rank_avg": 0.21079614758491516, "step": 610, "valid_targets_mean": 5721.4, "valid_targets_min": 661 }, { "epoch": 0.9418070444104135, "grad_norm": 0.4959240813023885, "learning_rate": 3.985818648736588e-05, "loss": 0.2437, "loss_nan_ranks": 0, "loss_rank_avg": 0.2344963252544403, "step": 615, "valid_targets_mean": 5268.9, "valid_targets_min": 645 }, { "epoch": 0.9494640122511485, "grad_norm": 0.44727712842280476, "learning_rate": 3.984896183706291e-05, "loss": 0.2273, "loss_nan_ranks": 0, "loss_rank_avg": 0.21470850706100464, "step": 620, "valid_targets_mean": 4735.4, "valid_targets_min": 727 }, { "epoch": 0.9571209800918836, "grad_norm": 0.4770114196646438, "learning_rate": 3.983944767940339e-05, "loss": 0.2428, "loss_nan_ranks": 0, "loss_rank_avg": 0.251364529132843, "step": 625, "valid_targets_mean": 5323.6, "valid_targets_min": 1961 }, { "epoch": 0.9647779479326187, "grad_norm": 0.5049867980521303, "learning_rate": 3.98296441531562e-05, "loss": 0.2433, "loss_nan_ranks": 0, "loss_rank_avg": 0.2861921489238739, "step": 630, "valid_targets_mean": 4449.9, "valid_targets_min": 357 }, { "epoch": 0.9724349157733537, "grad_norm": 0.4585093358813056, "learning_rate": 3.9819551401310834e-05, "loss": 0.2386, "loss_nan_ranks": 0, "loss_rank_avg": 0.2122216820716858, "step": 635, "valid_targets_mean": 5522.1, "valid_targets_min": 886 }, { "epoch": 0.9800918836140888, "grad_norm": 0.5195599231781355, "learning_rate": 3.980916957107529e-05, "loss": 0.2456, "loss_nan_ranks": 0, "loss_rank_avg": 0.2382555454969406, "step": 640, "valid_targets_mean": 4636.5, "valid_targets_min": 365 }, { "epoch": 0.9877488514548239, "grad_norm": 0.5243648163119432, "learning_rate": 3.979849881387393e-05, "loss": 0.2617, "loss_nan_ranks": 0, "loss_rank_avg": 0.2904030680656433, "step": 645, "valid_targets_mean": 4576.8, "valid_targets_min": 664 }, { "epoch": 0.9954058192955589, "grad_norm": 0.5320338443965096, "learning_rate": 3.9787539285345245e-05, "loss": 0.2519, "loss_nan_ranks": 0, "loss_rank_avg": 0.2518049478530884, "step": 650, "valid_targets_mean": 3986.9, "valid_targets_min": 582 }, { "epoch": 1.003062787136294, "grad_norm": 0.4543275980951745, "learning_rate": 3.977629114533963e-05, "loss": 0.2389, "loss_nan_ranks": 0, "loss_rank_avg": 0.21149328351020813, "step": 655, "valid_targets_mean": 4705.1, "valid_targets_min": 596 }, { "epoch": 1.010719754977029, "grad_norm": 0.4610185176199923, "learning_rate": 3.9764754557917e-05, "loss": 0.2355, "loss_nan_ranks": 0, "loss_rank_avg": 0.2165687382221222, "step": 660, "valid_targets_mean": 4701.8, "valid_targets_min": 757 }, { "epoch": 1.0183767228177643, "grad_norm": 0.3938486079154482, "learning_rate": 3.975292969134445e-05, "loss": 0.2124, "loss_nan_ranks": 0, "loss_rank_avg": 0.19741511344909668, "step": 665, "valid_targets_mean": 5695.2, "valid_targets_min": 763 }, { "epoch": 1.0260336906584993, "grad_norm": 0.4323156308860325, "learning_rate": 3.974081671809376e-05, "loss": 0.2386, "loss_nan_ranks": 0, "loss_rank_avg": 0.22385263442993164, "step": 670, "valid_targets_mean": 5580.4, "valid_targets_min": 3056 }, { "epoch": 1.0336906584992342, "grad_norm": 0.47472316536136555, "learning_rate": 3.97284158148389e-05, "loss": 0.2539, "loss_nan_ranks": 0, "loss_rank_avg": 0.2535420060157776, "step": 675, "valid_targets_mean": 5442.3, "valid_targets_min": 382 }, { "epoch": 1.0413476263399695, "grad_norm": 0.462265375894869, "learning_rate": 3.971572716245344e-05, "loss": 0.2286, "loss_nan_ranks": 0, "loss_rank_avg": 0.21901056170463562, "step": 680, "valid_targets_mean": 5023.1, "valid_targets_min": 741 }, { "epoch": 1.0490045941807045, "grad_norm": 0.48248662335215253, "learning_rate": 3.970275094600794e-05, "loss": 0.2398, "loss_nan_ranks": 0, "loss_rank_avg": 0.24081990122795105, "step": 685, "valid_targets_mean": 4785.9, "valid_targets_min": 665 }, { "epoch": 1.0566615620214395, "grad_norm": 0.4832238002221963, "learning_rate": 3.968948735476721e-05, "loss": 0.222, "loss_nan_ranks": 0, "loss_rank_avg": 0.2480914294719696, "step": 690, "valid_targets_mean": 4995.2, "valid_targets_min": 307 }, { "epoch": 1.0643185298621747, "grad_norm": 0.49185121927326225, "learning_rate": 3.9675936582187574e-05, "loss": 0.2286, "loss_nan_ranks": 0, "loss_rank_avg": 0.22463348507881165, "step": 695, "valid_targets_mean": 4966.1, "valid_targets_min": 571 }, { "epoch": 1.0719754977029097, "grad_norm": 0.4852510851215775, "learning_rate": 3.966209882591404e-05, "loss": 0.2413, "loss_nan_ranks": 0, "loss_rank_avg": 0.23765654861927032, "step": 700, "valid_targets_mean": 4573.9, "valid_targets_min": 1632 }, { "epoch": 1.0796324655436447, "grad_norm": 0.7554692659763621, "learning_rate": 3.9647974287777444e-05, "loss": 0.2311, "loss_nan_ranks": 0, "loss_rank_avg": 0.21256719529628754, "step": 705, "valid_targets_mean": 5479.7, "valid_targets_min": 1174 }, { "epoch": 1.0872894333843799, "grad_norm": 0.5138481666787079, "learning_rate": 3.9633563173791454e-05, "loss": 0.2352, "loss_nan_ranks": 0, "loss_rank_avg": 0.24174924194812775, "step": 710, "valid_targets_mean": 4438.2, "valid_targets_min": 709 }, { "epoch": 1.0949464012251149, "grad_norm": 0.5480222726912267, "learning_rate": 3.961886569414962e-05, "loss": 0.2251, "loss_nan_ranks": 0, "loss_rank_avg": 0.23572365939617157, "step": 715, "valid_targets_mean": 4192.2, "valid_targets_min": 393 }, { "epoch": 1.1026033690658499, "grad_norm": 0.4970895044179645, "learning_rate": 3.9603882063222254e-05, "loss": 0.2157, "loss_nan_ranks": 0, "loss_rank_avg": 0.2110937386751175, "step": 720, "valid_targets_mean": 4099.9, "valid_targets_min": 610 }, { "epoch": 1.110260336906585, "grad_norm": 0.3803758195568299, "learning_rate": 3.958861249955336e-05, "loss": 0.2162, "loss_nan_ranks": 0, "loss_rank_avg": 0.19598951935768127, "step": 725, "valid_targets_mean": 5967.6, "valid_targets_min": 319 }, { "epoch": 1.11791730474732, "grad_norm": 0.44999478220240136, "learning_rate": 3.957305722585742e-05, "loss": 0.2272, "loss_nan_ranks": 0, "loss_rank_avg": 0.24348898231983185, "step": 730, "valid_targets_mean": 5976.7, "valid_targets_min": 3547 }, { "epoch": 1.125574272588055, "grad_norm": 0.6543210798518898, "learning_rate": 3.955721646901611e-05, "loss": 0.2363, "loss_nan_ranks": 0, "loss_rank_avg": 0.2491251528263092, "step": 735, "valid_targets_mean": 4430.6, "valid_targets_min": 655 }, { "epoch": 1.13323124042879, "grad_norm": 0.5116096170224053, "learning_rate": 3.954109046007506e-05, "loss": 0.2448, "loss_nan_ranks": 0, "loss_rank_avg": 0.24491837620735168, "step": 740, "valid_targets_mean": 5439.1, "valid_targets_min": 3023 }, { "epoch": 1.1408882082695253, "grad_norm": 0.4657142210971288, "learning_rate": 3.9524679434240426e-05, "loss": 0.2492, "loss_nan_ranks": 0, "loss_rank_avg": 0.2513515055179596, "step": 745, "valid_targets_mean": 5713.0, "valid_targets_min": 953 }, { "epoch": 1.1485451761102603, "grad_norm": 0.47461273340221555, "learning_rate": 3.95079836308755e-05, "loss": 0.2442, "loss_nan_ranks": 0, "loss_rank_avg": 0.22947482764720917, "step": 750, "valid_targets_mean": 4901.0, "valid_targets_min": 637 }, { "epoch": 1.1562021439509955, "grad_norm": 0.5357763463044893, "learning_rate": 3.94910032934972e-05, "loss": 0.2455, "loss_nan_ranks": 0, "loss_rank_avg": 0.31903350353240967, "step": 755, "valid_targets_mean": 4305.5, "valid_targets_min": 601 }, { "epoch": 1.1638591117917305, "grad_norm": 0.44975376536296746, "learning_rate": 3.947373866977251e-05, "loss": 0.2417, "loss_nan_ranks": 0, "loss_rank_avg": 0.2732940912246704, "step": 760, "valid_targets_mean": 5532.4, "valid_targets_min": 864 }, { "epoch": 1.1715160796324655, "grad_norm": 0.5172389291640855, "learning_rate": 3.945619001151487e-05, "loss": 0.241, "loss_nan_ranks": 0, "loss_rank_avg": 0.2661622166633606, "step": 765, "valid_targets_mean": 4083.5, "valid_targets_min": 316 }, { "epoch": 1.1791730474732005, "grad_norm": 0.5218749820672336, "learning_rate": 3.9438357574680536e-05, "loss": 0.2267, "loss_nan_ranks": 0, "loss_rank_avg": 0.2443704754114151, "step": 770, "valid_targets_mean": 4730.9, "valid_targets_min": 324 }, { "epoch": 1.1868300153139357, "grad_norm": 0.5132882152134416, "learning_rate": 3.9420241619364794e-05, "loss": 0.2348, "loss_nan_ranks": 0, "loss_rank_avg": 0.23841838538646698, "step": 775, "valid_targets_mean": 4711.1, "valid_targets_min": 761 }, { "epoch": 1.1944869831546707, "grad_norm": 0.4750023702302424, "learning_rate": 3.940184240979822e-05, "loss": 0.2236, "loss_nan_ranks": 0, "loss_rank_avg": 0.20796674489974976, "step": 780, "valid_targets_mean": 4511.1, "valid_targets_min": 635 }, { "epoch": 1.202143950995406, "grad_norm": 0.4336368898063612, "learning_rate": 3.9383160214342775e-05, "loss": 0.214, "loss_nan_ranks": 0, "loss_rank_avg": 0.22842389345169067, "step": 785, "valid_targets_mean": 5245.5, "valid_targets_min": 1511 }, { "epoch": 1.209800918836141, "grad_norm": 0.461955332746975, "learning_rate": 3.9364195305487926e-05, "loss": 0.2162, "loss_nan_ranks": 0, "loss_rank_avg": 0.19852107763290405, "step": 790, "valid_targets_mean": 4429.8, "valid_targets_min": 274 }, { "epoch": 1.217457886676876, "grad_norm": 0.44263849837581704, "learning_rate": 3.934494795984666e-05, "loss": 0.2424, "loss_nan_ranks": 0, "loss_rank_avg": 0.2133197784423828, "step": 795, "valid_targets_mean": 6112.6, "valid_targets_min": 2092 }, { "epoch": 1.225114854517611, "grad_norm": 0.46310194439122904, "learning_rate": 3.932541845815145e-05, "loss": 0.2452, "loss_nan_ranks": 0, "loss_rank_avg": 0.2494787722826004, "step": 800, "valid_targets_mean": 5680.5, "valid_targets_min": 797 }, { "epoch": 1.2327718223583461, "grad_norm": 0.534237892887851, "learning_rate": 3.930560708525018e-05, "loss": 0.2285, "loss_nan_ranks": 0, "loss_rank_avg": 0.2164071798324585, "step": 805, "valid_targets_mean": 4722.7, "valid_targets_min": 844 }, { "epoch": 1.2404287901990811, "grad_norm": 0.5447789231267499, "learning_rate": 3.9285514130101916e-05, "loss": 0.2291, "loss_nan_ranks": 0, "loss_rank_avg": 0.2128959447145462, "step": 810, "valid_targets_mean": 5702.2, "valid_targets_min": 2581 }, { "epoch": 1.2480857580398161, "grad_norm": 0.4541670432548241, "learning_rate": 3.926513988577282e-05, "loss": 0.23, "loss_nan_ranks": 0, "loss_rank_avg": 0.24208541214466095, "step": 815, "valid_targets_mean": 5627.6, "valid_targets_min": 756 }, { "epoch": 1.2557427258805514, "grad_norm": 0.5066058652602967, "learning_rate": 3.924448464943174e-05, "loss": 0.2214, "loss_nan_ranks": 0, "loss_rank_avg": 0.20324429869651794, "step": 820, "valid_targets_mean": 5178.3, "valid_targets_min": 590 }, { "epoch": 1.2633996937212864, "grad_norm": 0.4824685977219757, "learning_rate": 3.922354872234596e-05, "loss": 0.2196, "loss_nan_ranks": 0, "loss_rank_avg": 0.21685411036014557, "step": 825, "valid_targets_mean": 5625.1, "valid_targets_min": 2583 }, { "epoch": 1.2710566615620214, "grad_norm": 0.5000431811675772, "learning_rate": 3.9202332409876814e-05, "loss": 0.231, "loss_nan_ranks": 0, "loss_rank_avg": 0.22782090306282043, "step": 830, "valid_targets_mean": 4467.5, "valid_targets_min": 357 }, { "epoch": 1.2787136294027566, "grad_norm": 0.46323331152102815, "learning_rate": 3.918083602147515e-05, "loss": 0.248, "loss_nan_ranks": 0, "loss_rank_avg": 0.2275102138519287, "step": 835, "valid_targets_mean": 5634.8, "valid_targets_min": 867 }, { "epoch": 1.2863705972434916, "grad_norm": 0.4773797488887894, "learning_rate": 3.91590598706769e-05, "loss": 0.2345, "loss_nan_ranks": 0, "loss_rank_avg": 0.24412119388580322, "step": 840, "valid_targets_mean": 4812.3, "valid_targets_min": 622 }, { "epoch": 1.2940275650842268, "grad_norm": 0.5076582879336042, "learning_rate": 3.913700427509847e-05, "loss": 0.251, "loss_nan_ranks": 0, "loss_rank_avg": 0.2958303689956665, "step": 845, "valid_targets_mean": 5836.1, "valid_targets_min": 727 }, { "epoch": 1.3016845329249618, "grad_norm": 0.5949340076342235, "learning_rate": 3.911466955643209e-05, "loss": 0.2284, "loss_nan_ranks": 0, "loss_rank_avg": 0.23251014947891235, "step": 850, "valid_targets_mean": 5130.4, "valid_targets_min": 230 }, { "epoch": 1.3093415007656968, "grad_norm": 0.4670023051943422, "learning_rate": 3.909205604044119e-05, "loss": 0.2309, "loss_nan_ranks": 0, "loss_rank_avg": 0.2273961305618286, "step": 855, "valid_targets_mean": 5627.8, "valid_targets_min": 649 }, { "epoch": 1.3169984686064318, "grad_norm": 0.4559961360039699, "learning_rate": 3.9069164056955556e-05, "loss": 0.2226, "loss_nan_ranks": 0, "loss_rank_avg": 0.20973217487335205, "step": 860, "valid_targets_mean": 5071.0, "valid_targets_min": 453 }, { "epoch": 1.324655436447167, "grad_norm": 1.055965972410453, "learning_rate": 3.90459939398666e-05, "loss": 0.2236, "loss_nan_ranks": 0, "loss_rank_avg": 0.2360004484653473, "step": 865, "valid_targets_mean": 4669.8, "valid_targets_min": 709 }, { "epoch": 1.332312404287902, "grad_norm": 0.4403899930388177, "learning_rate": 3.902254602712242e-05, "loss": 0.2311, "loss_nan_ranks": 0, "loss_rank_avg": 0.21914419531822205, "step": 870, "valid_targets_mean": 5948.8, "valid_targets_min": 755 }, { "epoch": 1.339969372128637, "grad_norm": 0.49919259365975516, "learning_rate": 3.899882066072296e-05, "loss": 0.2289, "loss_nan_ranks": 0, "loss_rank_avg": 0.2369828075170517, "step": 875, "valid_targets_mean": 4776.4, "valid_targets_min": 294 }, { "epoch": 1.3476263399693722, "grad_norm": 0.465536683491622, "learning_rate": 3.897481818671493e-05, "loss": 0.2346, "loss_nan_ranks": 0, "loss_rank_avg": 0.21700987219810486, "step": 880, "valid_targets_mean": 5091.3, "valid_targets_min": 536 }, { "epoch": 1.3552833078101072, "grad_norm": 0.38610096562448637, "learning_rate": 3.895053895518679e-05, "loss": 0.2316, "loss_nan_ranks": 0, "loss_rank_avg": 0.20991790294647217, "step": 885, "valid_targets_mean": 6598.3, "valid_targets_min": 3662 }, { "epoch": 1.3629402756508422, "grad_norm": 0.3931810607665223, "learning_rate": 3.892598332026368e-05, "loss": 0.2151, "loss_nan_ranks": 0, "loss_rank_avg": 0.20161226391792297, "step": 890, "valid_targets_mean": 5230.8, "valid_targets_min": 874 }, { "epoch": 1.3705972434915774, "grad_norm": 0.46758214305344503, "learning_rate": 3.8901151640102214e-05, "loss": 0.2393, "loss_nan_ranks": 0, "loss_rank_avg": 0.2412872463464737, "step": 895, "valid_targets_mean": 5018.2, "valid_targets_min": 597 }, { "epoch": 1.3782542113323124, "grad_norm": 0.47535688154677647, "learning_rate": 3.8876044276885264e-05, "loss": 0.2195, "loss_nan_ranks": 0, "loss_rank_avg": 0.20891433954238892, "step": 900, "valid_targets_mean": 4952.4, "valid_targets_min": 426 }, { "epoch": 1.3859111791730474, "grad_norm": 0.3800112743149217, "learning_rate": 3.885066159681668e-05, "loss": 0.2212, "loss_nan_ranks": 0, "loss_rank_avg": 0.20787039399147034, "step": 905, "valid_targets_mean": 5950.2, "valid_targets_min": 872 }, { "epoch": 1.3935681470137826, "grad_norm": 0.5717375079447776, "learning_rate": 3.882500397011597e-05, "loss": 0.2334, "loss_nan_ranks": 0, "loss_rank_avg": 0.2375756800174713, "step": 910, "valid_targets_mean": 4286.0, "valid_targets_min": 648 }, { "epoch": 1.4012251148545176, "grad_norm": 0.4423799703448592, "learning_rate": 3.8799071771012865e-05, "loss": 0.2355, "loss_nan_ranks": 0, "loss_rank_avg": 0.2233145534992218, "step": 915, "valid_targets_mean": 5010.4, "valid_targets_min": 826 }, { "epoch": 1.4088820826952526, "grad_norm": 0.7674568548996449, "learning_rate": 3.877286537774187e-05, "loss": 0.2399, "loss_nan_ranks": 0, "loss_rank_avg": 0.25533410906791687, "step": 920, "valid_targets_mean": 5108.3, "valid_targets_min": 758 }, { "epoch": 1.4165390505359878, "grad_norm": 0.4672643825009114, "learning_rate": 3.874638517253676e-05, "loss": 0.2481, "loss_nan_ranks": 0, "loss_rank_avg": 0.24158219993114471, "step": 925, "valid_targets_mean": 4805.2, "valid_targets_min": 2561 }, { "epoch": 1.4241960183767228, "grad_norm": 0.4803000711402261, "learning_rate": 3.871963154162501e-05, "loss": 0.2359, "loss_nan_ranks": 0, "loss_rank_avg": 0.2522413730621338, "step": 930, "valid_targets_mean": 4650.3, "valid_targets_min": 895 }, { "epoch": 1.4318529862174578, "grad_norm": 0.4622132223927811, "learning_rate": 3.869260487522213e-05, "loss": 0.2223, "loss_nan_ranks": 0, "loss_rank_avg": 0.2327278107404709, "step": 935, "valid_targets_mean": 4991.4, "valid_targets_min": 754 }, { "epoch": 1.439509954058193, "grad_norm": 0.4466120611595715, "learning_rate": 3.866530556752601e-05, "loss": 0.2374, "loss_nan_ranks": 0, "loss_rank_avg": 0.2425045520067215, "step": 940, "valid_targets_mean": 4719.2, "valid_targets_min": 734 }, { "epoch": 1.447166921898928, "grad_norm": 0.4573816713524243, "learning_rate": 3.8637734016711144e-05, "loss": 0.2347, "loss_nan_ranks": 0, "loss_rank_avg": 0.2244962453842163, "step": 945, "valid_targets_mean": 4643.3, "valid_targets_min": 702 }, { "epoch": 1.454823889739663, "grad_norm": 0.458299903716274, "learning_rate": 3.860989062492284e-05, "loss": 0.2369, "loss_nan_ranks": 0, "loss_rank_avg": 0.2286277562379837, "step": 950, "valid_targets_mean": 4489.7, "valid_targets_min": 692 }, { "epoch": 1.462480857580398, "grad_norm": 0.5032857134165045, "learning_rate": 3.858177579827133e-05, "loss": 0.257, "loss_nan_ranks": 0, "loss_rank_avg": 0.26451292634010315, "step": 955, "valid_targets_mean": 6107.7, "valid_targets_min": 926 }, { "epoch": 1.4701378254211332, "grad_norm": 0.4842909516880842, "learning_rate": 3.8553389946825896e-05, "loss": 0.2147, "loss_nan_ranks": 0, "loss_rank_avg": 0.24591636657714844, "step": 960, "valid_targets_mean": 4898.8, "valid_targets_min": 911 }, { "epoch": 1.4777947932618682, "grad_norm": 0.4073502413011468, "learning_rate": 3.8524733484608824e-05, "loss": 0.2195, "loss_nan_ranks": 0, "loss_rank_avg": 0.20459729433059692, "step": 965, "valid_targets_mean": 6015.3, "valid_targets_min": 1521 }, { "epoch": 1.4854517611026035, "grad_norm": 0.40576274013727376, "learning_rate": 3.8495806829589416e-05, "loss": 0.2258, "loss_nan_ranks": 0, "loss_rank_avg": 0.21941059827804565, "step": 970, "valid_targets_mean": 5581.0, "valid_targets_min": 2235 }, { "epoch": 1.4931087289433385, "grad_norm": 0.6974578241353532, "learning_rate": 3.8466610403677874e-05, "loss": 0.2222, "loss_nan_ranks": 0, "loss_rank_avg": 0.19623053073883057, "step": 975, "valid_targets_mean": 5069.4, "valid_targets_min": 313 }, { "epoch": 1.5007656967840735, "grad_norm": 0.45967960346904296, "learning_rate": 3.8437144632719136e-05, "loss": 0.2415, "loss_nan_ranks": 0, "loss_rank_avg": 0.2094549983739853, "step": 980, "valid_targets_mean": 4371.3, "valid_targets_min": 732 }, { "epoch": 1.5084226646248085, "grad_norm": 0.42898168106530515, "learning_rate": 3.840740994648669e-05, "loss": 0.2163, "loss_nan_ranks": 0, "loss_rank_avg": 0.20533907413482666, "step": 985, "valid_targets_mean": 4905.2, "valid_targets_min": 1112 }, { "epoch": 1.5160796324655437, "grad_norm": 0.5771406355795161, "learning_rate": 3.837740677867628e-05, "loss": 0.241, "loss_nan_ranks": 0, "loss_rank_avg": 0.26875361800193787, "step": 990, "valid_targets_mean": 4721.5, "valid_targets_min": 845 }, { "epoch": 1.5237366003062787, "grad_norm": 0.4902824785618498, "learning_rate": 3.8347135566899616e-05, "loss": 0.2474, "loss_nan_ranks": 0, "loss_rank_avg": 0.2583337128162384, "step": 995, "valid_targets_mean": 4502.8, "valid_targets_min": 618 }, { "epoch": 1.5313935681470139, "grad_norm": 0.44320917141796234, "learning_rate": 3.831659675267793e-05, "loss": 0.2282, "loss_nan_ranks": 0, "loss_rank_avg": 0.20274272561073303, "step": 1000, "valid_targets_mean": 4891.5, "valid_targets_min": 686 }, { "epoch": 1.5390505359877489, "grad_norm": 0.44737506920889025, "learning_rate": 3.828579078143561e-05, "loss": 0.2247, "loss_nan_ranks": 0, "loss_rank_avg": 0.24201388657093048, "step": 1005, "valid_targets_mean": 5657.9, "valid_targets_min": 3308 }, { "epoch": 1.5467075038284839, "grad_norm": 0.4987453352941786, "learning_rate": 3.825471810249365e-05, "loss": 0.2264, "loss_nan_ranks": 0, "loss_rank_avg": 0.23472508788108826, "step": 1010, "valid_targets_mean": 5547.6, "valid_targets_min": 1485 }, { "epoch": 1.5543644716692189, "grad_norm": 0.48227849169472226, "learning_rate": 3.822337916906311e-05, "loss": 0.2288, "loss_nan_ranks": 0, "loss_rank_avg": 0.2520979642868042, "step": 1015, "valid_targets_mean": 4113.2, "valid_targets_min": 629 }, { "epoch": 1.562021439509954, "grad_norm": 0.40392077613965266, "learning_rate": 3.8191774438238514e-05, "loss": 0.2278, "loss_nan_ranks": 0, "loss_rank_avg": 0.21043488383293152, "step": 1020, "valid_targets_mean": 5685.4, "valid_targets_min": 1845 }, { "epoch": 1.569678407350689, "grad_norm": 0.4284123643349941, "learning_rate": 3.815990437099118e-05, "loss": 0.2188, "loss_nan_ranks": 0, "loss_rank_avg": 0.21044665575027466, "step": 1025, "valid_targets_mean": 5459.0, "valid_targets_min": 720 }, { "epoch": 1.5773353751914243, "grad_norm": 0.4674790436901617, "learning_rate": 3.81277694321625e-05, "loss": 0.241, "loss_nan_ranks": 0, "loss_rank_avg": 0.23535355925559998, "step": 1030, "valid_targets_mean": 4770.8, "valid_targets_min": 714 }, { "epoch": 1.5849923430321593, "grad_norm": 0.3788371319532689, "learning_rate": 3.809537009045714e-05, "loss": 0.2226, "loss_nan_ranks": 0, "loss_rank_avg": 0.20070108771324158, "step": 1035, "valid_targets_mean": 5832.2, "valid_targets_min": 318 }, { "epoch": 1.5926493108728943, "grad_norm": 0.5196182043035402, "learning_rate": 3.8062706818436234e-05, "loss": 0.2395, "loss_nan_ranks": 0, "loss_rank_avg": 0.26477953791618347, "step": 1040, "valid_targets_mean": 3962.2, "valid_targets_min": 410 }, { "epoch": 1.6003062787136293, "grad_norm": 0.48358135151926473, "learning_rate": 3.802978009251046e-05, "loss": 0.2416, "loss_nan_ranks": 0, "loss_rank_avg": 0.25546973943710327, "step": 1045, "valid_targets_mean": 4565.6, "valid_targets_min": 940 }, { "epoch": 1.6079632465543645, "grad_norm": 0.4289401594279837, "learning_rate": 3.799659039293312e-05, "loss": 0.2357, "loss_nan_ranks": 0, "loss_rank_avg": 0.2194889783859253, "step": 1050, "valid_targets_mean": 5301.4, "valid_targets_min": 582 }, { "epoch": 1.6156202143950995, "grad_norm": 0.451232811004955, "learning_rate": 3.796313820379313e-05, "loss": 0.2202, "loss_nan_ranks": 0, "loss_rank_avg": 0.2255152463912964, "step": 1055, "valid_targets_mean": 5610.7, "valid_targets_min": 596 }, { "epoch": 1.6232771822358347, "grad_norm": 0.4193660210903287, "learning_rate": 3.792942401300792e-05, "loss": 0.2254, "loss_nan_ranks": 0, "loss_rank_avg": 0.20200134813785553, "step": 1060, "valid_targets_mean": 5545.6, "valid_targets_min": 528 }, { "epoch": 1.6309341500765697, "grad_norm": 0.4869469520460917, "learning_rate": 3.789544831231639e-05, "loss": 0.219, "loss_nan_ranks": 0, "loss_rank_avg": 0.2149246633052826, "step": 1065, "valid_targets_mean": 3840.6, "valid_targets_min": 294 }, { "epoch": 1.6385911179173047, "grad_norm": 0.8289501528499609, "learning_rate": 3.7861211597271655e-05, "loss": 0.2436, "loss_nan_ranks": 0, "loss_rank_avg": 0.23823891580104828, "step": 1070, "valid_targets_mean": 5751.8, "valid_targets_min": 3017 }, { "epoch": 1.6462480857580397, "grad_norm": 0.3834423104766572, "learning_rate": 3.782671436723389e-05, "loss": 0.2078, "loss_nan_ranks": 0, "loss_rank_avg": 0.19142815470695496, "step": 1075, "valid_targets_mean": 6619.1, "valid_targets_min": 3373 }, { "epoch": 1.653905053598775, "grad_norm": 0.48705512770145654, "learning_rate": 3.779195712536301e-05, "loss": 0.2383, "loss_nan_ranks": 0, "loss_rank_avg": 0.23004969954490662, "step": 1080, "valid_targets_mean": 4073.9, "valid_targets_min": 294 }, { "epoch": 1.66156202143951, "grad_norm": 0.4542717256577794, "learning_rate": 3.775694037861134e-05, "loss": 0.2153, "loss_nan_ranks": 0, "loss_rank_avg": 0.2153184711933136, "step": 1085, "valid_targets_mean": 5164.8, "valid_targets_min": 661 }, { "epoch": 1.6692189892802451, "grad_norm": 0.45851010452010027, "learning_rate": 3.772166463771619e-05, "loss": 0.2273, "loss_nan_ranks": 0, "loss_rank_avg": 0.2138391137123108, "step": 1090, "valid_targets_mean": 5276.1, "valid_targets_min": 1501 }, { "epoch": 1.6768759571209801, "grad_norm": 0.5506935584762426, "learning_rate": 3.768613041719247e-05, "loss": 0.231, "loss_nan_ranks": 0, "loss_rank_avg": 0.22046592831611633, "step": 1095, "valid_targets_mean": 4694.3, "valid_targets_min": 899 }, { "epoch": 1.6845329249617151, "grad_norm": 0.46507047548755864, "learning_rate": 3.765033823532514e-05, "loss": 0.2245, "loss_nan_ranks": 0, "loss_rank_avg": 0.22383110225200653, "step": 1100, "valid_targets_mean": 4433.4, "valid_targets_min": 788 }, { "epoch": 1.6921898928024501, "grad_norm": 0.5379797863275028, "learning_rate": 3.7614288614161625e-05, "loss": 0.2493, "loss_nan_ranks": 0, "loss_rank_avg": 0.27269816398620605, "step": 1105, "valid_targets_mean": 3752.3, "valid_targets_min": 530 }, { "epoch": 1.6998468606431854, "grad_norm": 0.43058162892643365, "learning_rate": 3.7577982079504284e-05, "loss": 0.2123, "loss_nan_ranks": 0, "loss_rank_avg": 0.2153037041425705, "step": 1110, "valid_targets_mean": 5146.8, "valid_targets_min": 706 }, { "epoch": 1.7075038284839203, "grad_norm": 0.44249590505034403, "learning_rate": 3.754141916090266e-05, "loss": 0.2118, "loss_nan_ranks": 0, "loss_rank_avg": 0.20741818845272064, "step": 1115, "valid_targets_mean": 5802.1, "valid_targets_min": 679 }, { "epoch": 1.7151607963246556, "grad_norm": 0.458772872006437, "learning_rate": 3.750460039164581e-05, "loss": 0.2336, "loss_nan_ranks": 0, "loss_rank_avg": 0.24594131112098694, "step": 1120, "valid_targets_mean": 4699.8, "valid_targets_min": 184 }, { "epoch": 1.7228177641653906, "grad_norm": 0.7672926531697714, "learning_rate": 3.746752630875448e-05, "loss": 0.2302, "loss_nan_ranks": 0, "loss_rank_avg": 0.24634478986263275, "step": 1125, "valid_targets_mean": 3561.6, "valid_targets_min": 663 }, { "epoch": 1.7304747320061256, "grad_norm": 0.43972274729807126, "learning_rate": 3.743019745297332e-05, "loss": 0.2311, "loss_nan_ranks": 0, "loss_rank_avg": 0.22277215123176575, "step": 1130, "valid_targets_mean": 5361.2, "valid_targets_min": 1695 }, { "epoch": 1.7381316998468606, "grad_norm": 0.4516327506576068, "learning_rate": 3.739261436876296e-05, "loss": 0.2254, "loss_nan_ranks": 0, "loss_rank_avg": 0.23480652272701263, "step": 1135, "valid_targets_mean": 4729.9, "valid_targets_min": 635 }, { "epoch": 1.7457886676875956, "grad_norm": 0.4949615258488163, "learning_rate": 3.73547776042921e-05, "loss": 0.2365, "loss_nan_ranks": 0, "loss_rank_avg": 0.2477773129940033, "step": 1140, "valid_targets_mean": 4868.1, "valid_targets_min": 380 }, { "epoch": 1.7534456355283308, "grad_norm": 0.4717486814671122, "learning_rate": 3.731668771142946e-05, "loss": 0.2329, "loss_nan_ranks": 0, "loss_rank_avg": 0.20434430241584778, "step": 1145, "valid_targets_mean": 4753.1, "valid_targets_min": 661 }, { "epoch": 1.761102603369066, "grad_norm": 0.43298582473400343, "learning_rate": 3.727834524573582e-05, "loss": 0.2248, "loss_nan_ranks": 0, "loss_rank_avg": 0.23231241106987, "step": 1150, "valid_targets_mean": 5028.3, "valid_targets_min": 680 }, { "epoch": 1.768759571209801, "grad_norm": 0.4520348267564731, "learning_rate": 3.7239750766455826e-05, "loss": 0.2288, "loss_nan_ranks": 0, "loss_rank_avg": 0.22502996027469635, "step": 1155, "valid_targets_mean": 4861.9, "valid_targets_min": 571 }, { "epoch": 1.776416539050536, "grad_norm": 0.5150942320605032, "learning_rate": 3.720090483650988e-05, "loss": 0.2385, "loss_nan_ranks": 0, "loss_rank_avg": 0.2381991147994995, "step": 1160, "valid_targets_mean": 4304.5, "valid_targets_min": 880 }, { "epoch": 1.784073506891271, "grad_norm": 0.5161348929268305, "learning_rate": 3.7161808022485935e-05, "loss": 0.2207, "loss_nan_ranks": 0, "loss_rank_avg": 0.21709483861923218, "step": 1165, "valid_targets_mean": 4438.7, "valid_targets_min": 601 }, { "epoch": 1.791730474732006, "grad_norm": 0.49665971280240234, "learning_rate": 3.7122460894631204e-05, "loss": 0.2245, "loss_nan_ranks": 0, "loss_rank_avg": 0.24442270398139954, "step": 1170, "valid_targets_mean": 4556.2, "valid_targets_min": 594 }, { "epoch": 1.7993874425727412, "grad_norm": 0.8745968372963754, "learning_rate": 3.708286402684387e-05, "loss": 0.227, "loss_nan_ranks": 0, "loss_rank_avg": 0.23762422800064087, "step": 1175, "valid_targets_mean": 4245.6, "valid_targets_min": 739 }, { "epoch": 1.8070444104134764, "grad_norm": 0.41278379589280434, "learning_rate": 3.704301799666469e-05, "loss": 0.2495, "loss_nan_ranks": 0, "loss_rank_avg": 0.20009422302246094, "step": 1180, "valid_targets_mean": 5268.8, "valid_targets_min": 876 }, { "epoch": 1.8147013782542114, "grad_norm": 0.48742732045154236, "learning_rate": 3.700292338526858e-05, "loss": 0.2343, "loss_nan_ranks": 0, "loss_rank_avg": 0.24549022316932678, "step": 1185, "valid_targets_mean": 4213.9, "valid_targets_min": 544 }, { "epoch": 1.8223583460949464, "grad_norm": 0.4712771047324667, "learning_rate": 3.696258077745616e-05, "loss": 0.2226, "loss_nan_ranks": 0, "loss_rank_avg": 0.24899449944496155, "step": 1190, "valid_targets_mean": 4609.4, "valid_targets_min": 566 }, { "epoch": 1.8300153139356814, "grad_norm": 0.44975298875115, "learning_rate": 3.6921990761645185e-05, "loss": 0.2287, "loss_nan_ranks": 0, "loss_rank_avg": 0.21963663399219513, "step": 1195, "valid_targets_mean": 4574.2, "valid_targets_min": 534 }, { "epoch": 1.8376722817764164, "grad_norm": 0.3951327552159224, "learning_rate": 3.6881153929861995e-05, "loss": 0.2211, "loss_nan_ranks": 0, "loss_rank_avg": 0.2228214144706726, "step": 1200, "valid_targets_mean": 6362.1, "valid_targets_min": 762 }, { "epoch": 1.8453292496171516, "grad_norm": 0.42372166371340003, "learning_rate": 3.684007087773287e-05, "loss": 0.2252, "loss_nan_ranks": 0, "loss_rank_avg": 0.21967345476150513, "step": 1205, "valid_targets_mean": 5326.0, "valid_targets_min": 998 }, { "epoch": 1.8529862174578868, "grad_norm": 0.5177828906855314, "learning_rate": 3.679874220447533e-05, "loss": 0.2311, "loss_nan_ranks": 0, "loss_rank_avg": 0.23139753937721252, "step": 1210, "valid_targets_mean": 3876.4, "valid_targets_min": 661 }, { "epoch": 1.8606431852986218, "grad_norm": 0.4257753688447525, "learning_rate": 3.675716851288942e-05, "loss": 0.2101, "loss_nan_ranks": 0, "loss_rank_avg": 0.21256472170352936, "step": 1215, "valid_targets_mean": 5345.1, "valid_targets_min": 743 }, { "epoch": 1.8683001531393568, "grad_norm": 0.41030398631754234, "learning_rate": 3.671535040934889e-05, "loss": 0.2182, "loss_nan_ranks": 0, "loss_rank_avg": 0.21335265040397644, "step": 1220, "valid_targets_mean": 4680.1, "valid_targets_min": 664 }, { "epoch": 1.8759571209800918, "grad_norm": 0.430169115187478, "learning_rate": 3.667328850379238e-05, "loss": 0.2066, "loss_nan_ranks": 0, "loss_rank_avg": 0.20409463346004486, "step": 1225, "valid_targets_mean": 5608.6, "valid_targets_min": 2533 }, { "epoch": 1.8836140888208268, "grad_norm": 0.42025014500169766, "learning_rate": 3.6630983409714494e-05, "loss": 0.2257, "loss_nan_ranks": 0, "loss_rank_avg": 0.21930241584777832, "step": 1230, "valid_targets_mean": 5487.7, "valid_targets_min": 1754 }, { "epoch": 1.891271056661562, "grad_norm": 0.5021327369610216, "learning_rate": 3.6588435744156865e-05, "loss": 0.2206, "loss_nan_ranks": 0, "loss_rank_avg": 0.19022399187088013, "step": 1235, "valid_targets_mean": 5496.7, "valid_targets_min": 938 }, { "epoch": 1.8989280245022973, "grad_norm": 0.540321749042443, "learning_rate": 3.654564612769917e-05, "loss": 0.2479, "loss_nan_ranks": 0, "loss_rank_avg": 0.2716904878616333, "step": 1240, "valid_targets_mean": 3926.7, "valid_targets_min": 693 }, { "epoch": 1.9065849923430322, "grad_norm": 0.4729363531042848, "learning_rate": 3.650261518445006e-05, "loss": 0.2127, "loss_nan_ranks": 0, "loss_rank_avg": 0.21322724223136902, "step": 1245, "valid_targets_mean": 5020.2, "valid_targets_min": 654 }, { "epoch": 1.9142419601837672, "grad_norm": 0.4446714421133037, "learning_rate": 3.6459343542038056e-05, "loss": 0.2233, "loss_nan_ranks": 0, "loss_rank_avg": 0.20671671628952026, "step": 1250, "valid_targets_mean": 5615.5, "valid_targets_min": 2404 }, { "epoch": 1.9218989280245022, "grad_norm": 0.3944661996414203, "learning_rate": 3.64158318316024e-05, "loss": 0.2179, "loss_nan_ranks": 0, "loss_rank_avg": 0.21900799870491028, "step": 1255, "valid_targets_mean": 6057.3, "valid_targets_min": 3739 }, { "epoch": 1.9295558958652372, "grad_norm": 0.4723508700169769, "learning_rate": 3.6372080687783864e-05, "loss": 0.2149, "loss_nan_ranks": 0, "loss_rank_avg": 0.22037751972675323, "step": 1260, "valid_targets_mean": 4365.8, "valid_targets_min": 478 }, { "epoch": 1.9372128637059725, "grad_norm": 0.45131110819991693, "learning_rate": 3.632809074871546e-05, "loss": 0.21, "loss_nan_ranks": 0, "loss_rank_avg": 0.20661242306232452, "step": 1265, "valid_targets_mean": 4677.1, "valid_targets_min": 494 }, { "epoch": 1.9448698315467075, "grad_norm": 0.5463896519037112, "learning_rate": 3.628386265601317e-05, "loss": 0.2103, "loss_nan_ranks": 0, "loss_rank_avg": 0.21639251708984375, "step": 1270, "valid_targets_mean": 5609.1, "valid_targets_min": 292 }, { "epoch": 1.9525267993874427, "grad_norm": 0.47101652563636187, "learning_rate": 3.623939705476655e-05, "loss": 0.2423, "loss_nan_ranks": 0, "loss_rank_avg": 0.2689882516860962, "step": 1275, "valid_targets_mean": 4807.4, "valid_targets_min": 941 }, { "epoch": 1.9601837672281777, "grad_norm": 0.5829538504135483, "learning_rate": 3.619469459352937e-05, "loss": 0.2184, "loss_nan_ranks": 0, "loss_rank_avg": 0.19414472579956055, "step": 1280, "valid_targets_mean": 5776.8, "valid_targets_min": 1769 }, { "epoch": 1.9678407350689127, "grad_norm": 0.47130592895075707, "learning_rate": 3.614975592431009e-05, "loss": 0.2167, "loss_nan_ranks": 0, "loss_rank_avg": 0.2240133434534073, "step": 1285, "valid_targets_mean": 4178.6, "valid_targets_min": 393 }, { "epoch": 1.9754977029096477, "grad_norm": 0.41933414032795246, "learning_rate": 3.6104581702562406e-05, "loss": 0.2223, "loss_nan_ranks": 0, "loss_rank_avg": 0.2266603261232376, "step": 1290, "valid_targets_mean": 5151.5, "valid_targets_min": 643 }, { "epoch": 1.9831546707503829, "grad_norm": 0.4099884275428022, "learning_rate": 3.605917258717567e-05, "loss": 0.2189, "loss_nan_ranks": 0, "loss_rank_avg": 0.2012246549129486, "step": 1295, "valid_targets_mean": 5393.4, "valid_targets_min": 2048 }, { "epoch": 1.9908116385911179, "grad_norm": 0.3989801489279899, "learning_rate": 3.6013529240465284e-05, "loss": 0.2089, "loss_nan_ranks": 0, "loss_rank_avg": 0.19280970096588135, "step": 1300, "valid_targets_mean": 5744.2, "valid_targets_min": 904 }, { "epoch": 1.998468606431853, "grad_norm": 0.402617048006408, "learning_rate": 3.596765232816301e-05, "loss": 0.2278, "loss_nan_ranks": 0, "loss_rank_avg": 0.2282564640045166, "step": 1305, "valid_targets_mean": 5270.4, "valid_targets_min": 962 }, { "epoch": 2.006125574272588, "grad_norm": 0.4373173508442768, "learning_rate": 3.5921542519407305e-05, "loss": 0.212, "loss_nan_ranks": 0, "loss_rank_avg": 0.20129822194576263, "step": 1310, "valid_targets_mean": 5563.7, "valid_targets_min": 1904 }, { "epoch": 2.013782542113323, "grad_norm": 0.40992921140400285, "learning_rate": 3.587520048673354e-05, "loss": 0.206, "loss_nan_ranks": 0, "loss_rank_avg": 0.1945541501045227, "step": 1315, "valid_targets_mean": 5979.3, "valid_targets_min": 3547 }, { "epoch": 2.021439509954058, "grad_norm": 0.4970730710034263, "learning_rate": 3.582862690606419e-05, "loss": 0.2077, "loss_nan_ranks": 0, "loss_rank_avg": 0.19818368554115295, "step": 1320, "valid_targets_mean": 4507.1, "valid_targets_min": 723 }, { "epoch": 2.029096477794793, "grad_norm": 0.475172498602143, "learning_rate": 3.578182245669896e-05, "loss": 0.2034, "loss_nan_ranks": 0, "loss_rank_avg": 0.19407986104488373, "step": 1325, "valid_targets_mean": 4450.6, "valid_targets_min": 584 }, { "epoch": 2.0367534456355285, "grad_norm": 0.47059170257977145, "learning_rate": 3.573478782130494e-05, "loss": 0.2033, "loss_nan_ranks": 0, "loss_rank_avg": 0.2392202615737915, "step": 1330, "valid_targets_mean": 4831.3, "valid_targets_min": 1514 }, { "epoch": 2.0444104134762635, "grad_norm": 0.528011468967076, "learning_rate": 3.5687523685906535e-05, "loss": 0.2094, "loss_nan_ranks": 0, "loss_rank_avg": 0.22966377437114716, "step": 1335, "valid_targets_mean": 3790.3, "valid_targets_min": 753 }, { "epoch": 2.0520673813169985, "grad_norm": 0.5074078705476603, "learning_rate": 3.564003073987559e-05, "loss": 0.2244, "loss_nan_ranks": 0, "loss_rank_avg": 0.24435581266880035, "step": 1340, "valid_targets_mean": 4693.4, "valid_targets_min": 721 }, { "epoch": 2.0597243491577335, "grad_norm": 0.3844129003728788, "learning_rate": 3.559230967592123e-05, "loss": 0.2125, "loss_nan_ranks": 0, "loss_rank_avg": 0.17261341214179993, "step": 1345, "valid_targets_mean": 5297.9, "valid_targets_min": 321 }, { "epoch": 2.0673813169984685, "grad_norm": 0.4224982802578748, "learning_rate": 3.554436119007982e-05, "loss": 0.2004, "loss_nan_ranks": 0, "loss_rank_avg": 0.2082083821296692, "step": 1350, "valid_targets_mean": 4975.2, "valid_targets_min": 621 }, { "epoch": 2.0750382848392035, "grad_norm": 0.437850384380176, "learning_rate": 3.5496185981704775e-05, "loss": 0.2206, "loss_nan_ranks": 0, "loss_rank_avg": 0.20134752988815308, "step": 1355, "valid_targets_mean": 5147.9, "valid_targets_min": 390 }, { "epoch": 2.082695252679939, "grad_norm": 0.4207133103422171, "learning_rate": 3.544778475345639e-05, "loss": 0.2132, "loss_nan_ranks": 0, "loss_rank_avg": 0.2060418426990509, "step": 1360, "valid_targets_mean": 5071.6, "valid_targets_min": 752 }, { "epoch": 2.090352220520674, "grad_norm": 1.3112730233999392, "learning_rate": 3.539915821129156e-05, "loss": 0.2027, "loss_nan_ranks": 0, "loss_rank_avg": 0.2119438499212265, "step": 1365, "valid_targets_mean": 5674.6, "valid_targets_min": 797 }, { "epoch": 2.098009188361409, "grad_norm": 0.5554558757769965, "learning_rate": 3.535030706445352e-05, "loss": 0.2227, "loss_nan_ranks": 0, "loss_rank_avg": 0.21164335310459137, "step": 1370, "valid_targets_mean": 4558.6, "valid_targets_min": 301 }, { "epoch": 2.105666156202144, "grad_norm": 0.4420544764278569, "learning_rate": 3.530123202546146e-05, "loss": 0.2047, "loss_nan_ranks": 0, "loss_rank_avg": 0.2061401605606079, "step": 1375, "valid_targets_mean": 5457.4, "valid_targets_min": 661 }, { "epoch": 2.113323124042879, "grad_norm": 0.46858657202849646, "learning_rate": 3.525193381010015e-05, "loss": 0.2015, "loss_nan_ranks": 0, "loss_rank_avg": 0.17351192235946655, "step": 1380, "valid_targets_mean": 4331.8, "valid_targets_min": 747 }, { "epoch": 2.120980091883614, "grad_norm": 0.4114806177904376, "learning_rate": 3.520241313740954e-05, "loss": 0.1985, "loss_nan_ranks": 0, "loss_rank_avg": 0.18135160207748413, "step": 1385, "valid_targets_mean": 5179.8, "valid_targets_min": 788 }, { "epoch": 2.1286370597243494, "grad_norm": 0.4150389909635014, "learning_rate": 3.51526707296742e-05, "loss": 0.2062, "loss_nan_ranks": 0, "loss_rank_avg": 0.21126386523246765, "step": 1390, "valid_targets_mean": 5510.6, "valid_targets_min": 2213 }, { "epoch": 2.1362940275650844, "grad_norm": 0.4189310905969695, "learning_rate": 3.510270731241282e-05, "loss": 0.1986, "loss_nan_ranks": 0, "loss_rank_avg": 0.2002798169851303, "step": 1395, "valid_targets_mean": 6350.9, "valid_targets_min": 873 }, { "epoch": 2.1439509954058193, "grad_norm": 0.41400366324510934, "learning_rate": 3.505252361436765e-05, "loss": 0.2166, "loss_nan_ranks": 0, "loss_rank_avg": 0.1952013075351715, "step": 1400, "valid_targets_mean": 5682.1, "valid_targets_min": 905 }, { "epoch": 2.1516079632465543, "grad_norm": 0.49444430141106194, "learning_rate": 3.500212036749382e-05, "loss": 0.2159, "loss_nan_ranks": 0, "loss_rank_avg": 0.22853989899158478, "step": 1405, "valid_targets_mean": 4394.3, "valid_targets_min": 693 }, { "epoch": 2.1592649310872893, "grad_norm": 0.4644344666905227, "learning_rate": 3.495149830694872e-05, "loss": 0.202, "loss_nan_ranks": 0, "loss_rank_avg": 0.1914132535457611, "step": 1410, "valid_targets_mean": 5267.1, "valid_targets_min": 583 }, { "epoch": 2.1669218989280243, "grad_norm": 0.45615206271339814, "learning_rate": 3.490065817108124e-05, "loss": 0.1936, "loss_nan_ranks": 0, "loss_rank_avg": 0.20476290583610535, "step": 1415, "valid_targets_mean": 4469.4, "valid_targets_min": 614 }, { "epoch": 2.1745788667687598, "grad_norm": 0.47393370598028417, "learning_rate": 3.484960070142102e-05, "loss": 0.2204, "loss_nan_ranks": 0, "loss_rank_avg": 0.22236575186252594, "step": 1420, "valid_targets_mean": 4936.5, "valid_targets_min": 268 }, { "epoch": 2.1822358346094948, "grad_norm": 0.4253170924277631, "learning_rate": 3.4798326642667587e-05, "loss": 0.2047, "loss_nan_ranks": 0, "loss_rank_avg": 0.18139034509658813, "step": 1425, "valid_targets_mean": 4734.9, "valid_targets_min": 794 }, { "epoch": 2.1898928024502298, "grad_norm": 0.49911646366760776, "learning_rate": 3.474683674267959e-05, "loss": 0.1984, "loss_nan_ranks": 0, "loss_rank_avg": 0.20690619945526123, "step": 1430, "valid_targets_mean": 5103.0, "valid_targets_min": 889 }, { "epoch": 2.1975497702909648, "grad_norm": 0.49119882276790566, "learning_rate": 3.469513175246379e-05, "loss": 0.1907, "loss_nan_ranks": 0, "loss_rank_avg": 0.1835339367389679, "step": 1435, "valid_targets_mean": 4820.6, "valid_targets_min": 301 }, { "epoch": 2.2052067381316998, "grad_norm": 0.5154475611308721, "learning_rate": 3.464321242616418e-05, "loss": 0.2189, "loss_nan_ranks": 0, "loss_rank_avg": 0.19209043681621552, "step": 1440, "valid_targets_mean": 4761.6, "valid_targets_min": 357 }, { "epoch": 2.2128637059724348, "grad_norm": 0.45164627691834747, "learning_rate": 3.459107952105091e-05, "loss": 0.2153, "loss_nan_ranks": 0, "loss_rank_avg": 0.1891171634197235, "step": 1445, "valid_targets_mean": 5681.1, "valid_targets_min": 251 }, { "epoch": 2.22052067381317, "grad_norm": 0.5335767275763915, "learning_rate": 3.4538733797509355e-05, "loss": 0.2146, "loss_nan_ranks": 0, "loss_rank_avg": 0.2298070639371872, "step": 1450, "valid_targets_mean": 4577.5, "valid_targets_min": 884 }, { "epoch": 2.228177641653905, "grad_norm": 0.4679949420186815, "learning_rate": 3.44861760190289e-05, "loss": 0.208, "loss_nan_ranks": 0, "loss_rank_avg": 0.19955570995807648, "step": 1455, "valid_targets_mean": 4832.8, "valid_targets_min": 240 }, { "epoch": 2.23583460949464, "grad_norm": 0.42095307623333295, "learning_rate": 3.443340695219188e-05, "loss": 0.1979, "loss_nan_ranks": 0, "loss_rank_avg": 0.1974397748708725, "step": 1460, "valid_targets_mean": 5598.1, "valid_targets_min": 877 }, { "epoch": 2.243491577335375, "grad_norm": 0.4745463301945368, "learning_rate": 3.4380427366662376e-05, "loss": 0.1934, "loss_nan_ranks": 0, "loss_rank_avg": 0.1813713014125824, "step": 1465, "valid_targets_mean": 5202.5, "valid_targets_min": 727 }, { "epoch": 2.25114854517611, "grad_norm": 0.39487703795653906, "learning_rate": 3.432723803517501e-05, "loss": 0.2099, "loss_nan_ranks": 0, "loss_rank_avg": 0.1820264607667923, "step": 1470, "valid_targets_mean": 6077.2, "valid_targets_min": 3521 }, { "epoch": 2.258805513016845, "grad_norm": 0.5769539475945872, "learning_rate": 3.427383973352363e-05, "loss": 0.2001, "loss_nan_ranks": 0, "loss_rank_avg": 0.2072950303554535, "step": 1475, "valid_targets_mean": 3227.7, "valid_targets_min": 559 }, { "epoch": 2.26646248085758, "grad_norm": 0.4288473452558018, "learning_rate": 3.422023324055005e-05, "loss": 0.195, "loss_nan_ranks": 0, "loss_rank_avg": 0.17287051677703857, "step": 1480, "valid_targets_mean": 5125.8, "valid_targets_min": 2542 }, { "epoch": 2.2741194486983156, "grad_norm": 0.4123498873195868, "learning_rate": 3.4166419338132636e-05, "loss": 0.2029, "loss_nan_ranks": 0, "loss_rank_avg": 0.2294299602508545, "step": 1485, "valid_targets_mean": 5843.1, "valid_targets_min": 719 }, { "epoch": 2.2817764165390506, "grad_norm": 0.4730663649794135, "learning_rate": 3.411239881117494e-05, "loss": 0.2045, "loss_nan_ranks": 0, "loss_rank_avg": 0.22474753856658936, "step": 1490, "valid_targets_mean": 4959.0, "valid_targets_min": 1705 }, { "epoch": 2.2894333843797856, "grad_norm": 0.3875549685911907, "learning_rate": 3.4058172447594255e-05, "loss": 0.1889, "loss_nan_ranks": 0, "loss_rank_avg": 0.1825382262468338, "step": 1495, "valid_targets_mean": 6264.6, "valid_targets_min": 580 }, { "epoch": 2.2970903522205206, "grad_norm": 0.4656618705136615, "learning_rate": 3.400374103831007e-05, "loss": 0.216, "loss_nan_ranks": 0, "loss_rank_avg": 0.21203726530075073, "step": 1500, "valid_targets_mean": 4578.1, "valid_targets_min": 871 }, { "epoch": 2.3047473200612556, "grad_norm": 0.5002570246078484, "learning_rate": 3.394910537723259e-05, "loss": 0.215, "loss_nan_ranks": 0, "loss_rank_avg": 0.21089878678321838, "step": 1505, "valid_targets_mean": 4343.4, "valid_targets_min": 962 }, { "epoch": 2.312404287901991, "grad_norm": 0.452438730699335, "learning_rate": 3.3894266261251163e-05, "loss": 0.1995, "loss_nan_ranks": 0, "loss_rank_avg": 0.18554329872131348, "step": 1510, "valid_targets_mean": 4893.6, "valid_targets_min": 872 }, { "epoch": 2.320061255742726, "grad_norm": 0.45774747263893145, "learning_rate": 3.3839224490222594e-05, "loss": 0.1945, "loss_nan_ranks": 0, "loss_rank_avg": 0.18411816656589508, "step": 1515, "valid_targets_mean": 4389.2, "valid_targets_min": 292 }, { "epoch": 2.327718223583461, "grad_norm": 0.4396767692269071, "learning_rate": 3.378398086695954e-05, "loss": 0.1967, "loss_nan_ranks": 0, "loss_rank_avg": 0.19679993391036987, "step": 1520, "valid_targets_mean": 4803.2, "valid_targets_min": 1214 }, { "epoch": 2.335375191424196, "grad_norm": 0.49013046313660535, "learning_rate": 3.372853619721876e-05, "loss": 0.2095, "loss_nan_ranks": 0, "loss_rank_avg": 0.20178654789924622, "step": 1525, "valid_targets_mean": 4873.6, "valid_targets_min": 591 }, { "epoch": 2.343032159264931, "grad_norm": 0.3922824720718304, "learning_rate": 3.367289128968939e-05, "loss": 0.1947, "loss_nan_ranks": 0, "loss_rank_avg": 0.16767504811286926, "step": 1530, "valid_targets_mean": 6036.3, "valid_targets_min": 1865 }, { "epoch": 2.350689127105666, "grad_norm": 0.5498579719590082, "learning_rate": 3.361704695598115e-05, "loss": 0.2136, "loss_nan_ranks": 0, "loss_rank_avg": 0.22038382291793823, "step": 1535, "valid_targets_mean": 5159.2, "valid_targets_min": 968 }, { "epoch": 2.358346094946401, "grad_norm": 0.4055300698729176, "learning_rate": 3.3561004010612466e-05, "loss": 0.2244, "loss_nan_ranks": 0, "loss_rank_avg": 0.19593411684036255, "step": 1540, "valid_targets_mean": 5894.4, "valid_targets_min": 303 }, { "epoch": 2.3660030627871365, "grad_norm": 0.3932581284453595, "learning_rate": 3.3504763270998634e-05, "loss": 0.2148, "loss_nan_ranks": 0, "loss_rank_avg": 0.20369234681129456, "step": 1545, "valid_targets_mean": 6333.2, "valid_targets_min": 2885 }, { "epoch": 2.3736600306278715, "grad_norm": 0.47076653510770716, "learning_rate": 3.344832555743988e-05, "loss": 0.1924, "loss_nan_ranks": 0, "loss_rank_avg": 0.21554359793663025, "step": 1550, "valid_targets_mean": 4756.6, "valid_targets_min": 315 }, { "epoch": 2.3813169984686064, "grad_norm": 0.48873017026939236, "learning_rate": 3.33916916931094e-05, "loss": 0.2117, "loss_nan_ranks": 0, "loss_rank_avg": 0.22236159443855286, "step": 1555, "valid_targets_mean": 4995.3, "valid_targets_min": 587 }, { "epoch": 2.3889739663093414, "grad_norm": 0.4125303912579736, "learning_rate": 3.3334862504041336e-05, "loss": 0.1906, "loss_nan_ranks": 0, "loss_rank_avg": 0.20083507895469666, "step": 1560, "valid_targets_mean": 5715.2, "valid_targets_min": 313 }, { "epoch": 2.3966309341500764, "grad_norm": 0.3853433874516468, "learning_rate": 3.327783881911876e-05, "loss": 0.1948, "loss_nan_ranks": 0, "loss_rank_avg": 0.17324942350387573, "step": 1565, "valid_targets_mean": 6147.9, "valid_targets_min": 4254 }, { "epoch": 2.404287901990812, "grad_norm": 0.4211655279711124, "learning_rate": 3.322062147006156e-05, "loss": 0.193, "loss_nan_ranks": 0, "loss_rank_avg": 0.18347764015197754, "step": 1570, "valid_targets_mean": 5185.8, "valid_targets_min": 281 }, { "epoch": 2.411944869831547, "grad_norm": 0.648964580388655, "learning_rate": 3.3163211291414304e-05, "loss": 0.1974, "loss_nan_ranks": 0, "loss_rank_avg": 0.19629991054534912, "step": 1575, "valid_targets_mean": 4286.4, "valid_targets_min": 858 }, { "epoch": 2.419601837672282, "grad_norm": 0.4962453331492355, "learning_rate": 3.310560912053409e-05, "loss": 0.1945, "loss_nan_ranks": 0, "loss_rank_avg": 0.2081303745508194, "step": 1580, "valid_targets_mean": 4552.9, "valid_targets_min": 825 }, { "epoch": 2.427258805513017, "grad_norm": 0.4555354604900568, "learning_rate": 3.304781579757833e-05, "loss": 0.2094, "loss_nan_ranks": 0, "loss_rank_avg": 0.17186057567596436, "step": 1585, "valid_targets_mean": 5026.6, "valid_targets_min": 308 }, { "epoch": 2.434915773353752, "grad_norm": 0.4285448366359402, "learning_rate": 3.298983216549248e-05, "loss": 0.2224, "loss_nan_ranks": 0, "loss_rank_avg": 0.2216184288263321, "step": 1590, "valid_targets_mean": 5668.2, "valid_targets_min": 912 }, { "epoch": 2.442572741194487, "grad_norm": 0.5893928303619657, "learning_rate": 3.2931659069997735e-05, "loss": 0.2046, "loss_nan_ranks": 0, "loss_rank_avg": 0.21629182994365692, "step": 1595, "valid_targets_mean": 3893.3, "valid_targets_min": 304 }, { "epoch": 2.450229709035222, "grad_norm": 0.48884082069491913, "learning_rate": 3.287329735957874e-05, "loss": 0.215, "loss_nan_ranks": 0, "loss_rank_avg": 0.2368190437555313, "step": 1600, "valid_targets_mean": 4901.4, "valid_targets_min": 1007 }, { "epoch": 2.4578866768759573, "grad_norm": 0.52785052949108, "learning_rate": 3.281474788547118e-05, "loss": 0.2159, "loss_nan_ranks": 0, "loss_rank_avg": 0.22330242395401, "step": 1605, "valid_targets_mean": 4853.1, "valid_targets_min": 648 }, { "epoch": 2.4655436447166923, "grad_norm": 0.3987288953747758, "learning_rate": 3.275601150164935e-05, "loss": 0.206, "loss_nan_ranks": 0, "loss_rank_avg": 0.2003602832555771, "step": 1610, "valid_targets_mean": 5620.3, "valid_targets_min": 2039 }, { "epoch": 2.4732006125574273, "grad_norm": 0.47491465305943875, "learning_rate": 3.269708906481374e-05, "loss": 0.1866, "loss_nan_ranks": 0, "loss_rank_avg": 0.1774139255285263, "step": 1615, "valid_targets_mean": 4716.2, "valid_targets_min": 713 }, { "epoch": 2.4808575803981623, "grad_norm": 0.44594046656836617, "learning_rate": 3.263798143437851e-05, "loss": 0.2193, "loss_nan_ranks": 0, "loss_rank_avg": 0.20561468601226807, "step": 1620, "valid_targets_mean": 5183.3, "valid_targets_min": 794 }, { "epoch": 2.4885145482388973, "grad_norm": 0.42727062717581415, "learning_rate": 3.2578689472458976e-05, "loss": 0.1963, "loss_nan_ranks": 0, "loss_rank_avg": 0.18722905218601227, "step": 1625, "valid_targets_mean": 5382.0, "valid_targets_min": 553 }, { "epoch": 2.4961715160796323, "grad_norm": 0.5834450873795829, "learning_rate": 3.251921404385901e-05, "loss": 0.2102, "loss_nan_ranks": 0, "loss_rank_avg": 0.2354370504617691, "step": 1630, "valid_targets_mean": 4581.8, "valid_targets_min": 678 }, { "epoch": 2.5038284839203673, "grad_norm": 0.5345211557255457, "learning_rate": 3.245955601605845e-05, "loss": 0.2198, "loss_nan_ranks": 0, "loss_rank_avg": 0.2337321937084198, "step": 1635, "valid_targets_mean": 4913.5, "valid_targets_min": 728 }, { "epoch": 2.5114854517611027, "grad_norm": 0.37333243741751854, "learning_rate": 3.239971625920043e-05, "loss": 0.208, "loss_nan_ranks": 0, "loss_rank_avg": 0.19104315340518951, "step": 1640, "valid_targets_mean": 5793.1, "valid_targets_min": 2257 }, { "epoch": 2.5191424196018377, "grad_norm": 0.5550955042373348, "learning_rate": 3.23396956460787e-05, "loss": 0.2156, "loss_nan_ranks": 0, "loss_rank_avg": 0.21975022554397583, "step": 1645, "valid_targets_mean": 3863.6, "valid_targets_min": 293 }, { "epoch": 2.5267993874425727, "grad_norm": 0.4228650870100245, "learning_rate": 3.2279495052124884e-05, "loss": 0.1913, "loss_nan_ranks": 0, "loss_rank_avg": 0.1825849711894989, "step": 1650, "valid_targets_mean": 5644.5, "valid_targets_min": 2558 }, { "epoch": 2.5344563552833077, "grad_norm": 0.46523951256002843, "learning_rate": 3.2219115355395745e-05, "loss": 0.2126, "loss_nan_ranks": 0, "loss_rank_avg": 0.20776934921741486, "step": 1655, "valid_targets_mean": 4995.9, "valid_targets_min": 573 }, { "epoch": 2.5421133231240427, "grad_norm": 0.4225684699080134, "learning_rate": 3.2158557436560317e-05, "loss": 0.1996, "loss_nan_ranks": 0, "loss_rank_avg": 0.19467893242835999, "step": 1660, "valid_targets_mean": 4794.1, "valid_targets_min": 671 }, { "epoch": 2.549770290964778, "grad_norm": 0.4533547241905163, "learning_rate": 3.2097822178887114e-05, "loss": 0.2058, "loss_nan_ranks": 0, "loss_rank_avg": 0.20666176080703735, "step": 1665, "valid_targets_mean": 5426.8, "valid_targets_min": 3917 }, { "epoch": 2.557427258805513, "grad_norm": 0.7691377736423072, "learning_rate": 3.203691046823124e-05, "loss": 0.228, "loss_nan_ranks": 0, "loss_rank_avg": 0.2768425941467285, "step": 1670, "valid_targets_mean": 4918.1, "valid_targets_min": 660 }, { "epoch": 2.565084226646248, "grad_norm": 0.4647968234361939, "learning_rate": 3.197582319302143e-05, "loss": 0.2048, "loss_nan_ranks": 0, "loss_rank_avg": 0.2030567228794098, "step": 1675, "valid_targets_mean": 4793.9, "valid_targets_min": 898 }, { "epoch": 2.572741194486983, "grad_norm": 0.47503096589440647, "learning_rate": 3.191456124424715e-05, "loss": 0.2104, "loss_nan_ranks": 0, "loss_rank_avg": 0.20649227499961853, "step": 1680, "valid_targets_mean": 4376.4, "valid_targets_min": 627 }, { "epoch": 2.580398162327718, "grad_norm": 0.38967161506770254, "learning_rate": 3.185312551544553e-05, "loss": 0.2027, "loss_nan_ranks": 0, "loss_rank_avg": 0.16294370591640472, "step": 1685, "valid_targets_mean": 5400.3, "valid_targets_min": 306 }, { "epoch": 2.5880551301684536, "grad_norm": 0.4137207933362876, "learning_rate": 3.179151690268842e-05, "loss": 0.2182, "loss_nan_ranks": 0, "loss_rank_avg": 0.20800091326236725, "step": 1690, "valid_targets_mean": 5615.9, "valid_targets_min": 1817 }, { "epoch": 2.595712098009188, "grad_norm": 0.43845263427784364, "learning_rate": 3.1729736304569216e-05, "loss": 0.1951, "loss_nan_ranks": 0, "loss_rank_avg": 0.1801062524318695, "step": 1695, "valid_targets_mean": 5320.6, "valid_targets_min": 494 }, { "epoch": 2.6033690658499236, "grad_norm": 0.4583531820739542, "learning_rate": 3.1667784622189866e-05, "loss": 0.201, "loss_nan_ranks": 0, "loss_rank_avg": 0.2043706327676773, "step": 1700, "valid_targets_mean": 4630.8, "valid_targets_min": 625 }, { "epoch": 2.6110260336906586, "grad_norm": 0.5834610593137702, "learning_rate": 3.160566275914763e-05, "loss": 0.2091, "loss_nan_ranks": 0, "loss_rank_avg": 0.1968202143907547, "step": 1705, "valid_targets_mean": 4307.7, "valid_targets_min": 328 }, { "epoch": 2.6186830015313936, "grad_norm": 0.5472036514053488, "learning_rate": 3.154337162152196e-05, "loss": 0.2111, "loss_nan_ranks": 0, "loss_rank_avg": 0.23707276582717896, "step": 1710, "valid_targets_mean": 3378.8, "valid_targets_min": 593 }, { "epoch": 2.6263399693721285, "grad_norm": 0.44150272015060515, "learning_rate": 3.148091211786126e-05, "loss": 0.208, "loss_nan_ranks": 0, "loss_rank_avg": 0.21165896952152252, "step": 1715, "valid_targets_mean": 5223.7, "valid_targets_min": 365 }, { "epoch": 2.6339969372128635, "grad_norm": 0.5441798770208954, "learning_rate": 3.141828515916963e-05, "loss": 0.1955, "loss_nan_ranks": 0, "loss_rank_avg": 0.19593748450279236, "step": 1720, "valid_targets_mean": 5229.9, "valid_targets_min": 928 }, { "epoch": 2.641653905053599, "grad_norm": 0.49587618350763246, "learning_rate": 3.135549165889361e-05, "loss": 0.2112, "loss_nan_ranks": 0, "loss_rank_avg": 0.22288836538791656, "step": 1725, "valid_targets_mean": 4101.1, "valid_targets_min": 274 }, { "epoch": 2.649310872894334, "grad_norm": 0.4169833894502891, "learning_rate": 3.1292532532908814e-05, "loss": 0.1954, "loss_nan_ranks": 0, "loss_rank_avg": 0.19745498895645142, "step": 1730, "valid_targets_mean": 5347.1, "valid_targets_min": 288 }, { "epoch": 2.656967840735069, "grad_norm": 0.4322133840167338, "learning_rate": 3.12294086995066e-05, "loss": 0.1932, "loss_nan_ranks": 0, "loss_rank_avg": 0.17262643575668335, "step": 1735, "valid_targets_mean": 4846.4, "valid_targets_min": 2380 }, { "epoch": 2.664624808575804, "grad_norm": 0.5366545162742864, "learning_rate": 3.116612107938068e-05, "loss": 0.2199, "loss_nan_ranks": 0, "loss_rank_avg": 0.22421014308929443, "step": 1740, "valid_targets_mean": 4210.1, "valid_targets_min": 594 }, { "epoch": 2.672281776416539, "grad_norm": 0.45585126107024354, "learning_rate": 3.1102670595613654e-05, "loss": 0.2011, "loss_nan_ranks": 0, "loss_rank_avg": 0.19032257795333862, "step": 1745, "valid_targets_mean": 4588.5, "valid_targets_min": 713 }, { "epoch": 2.679938744257274, "grad_norm": 0.5669095838367388, "learning_rate": 3.10390581736636e-05, "loss": 0.1995, "loss_nan_ranks": 0, "loss_rank_avg": 0.20808973908424377, "step": 1750, "valid_targets_mean": 4542.7, "valid_targets_min": 637 }, { "epoch": 2.687595712098009, "grad_norm": 0.42969387483485466, "learning_rate": 3.0975284741350535e-05, "loss": 0.2043, "loss_nan_ranks": 0, "loss_rank_avg": 0.184463769197464, "step": 1755, "valid_targets_mean": 5571.9, "valid_targets_min": 899 }, { "epoch": 2.6952526799387444, "grad_norm": 0.4688512511006581, "learning_rate": 3.091135122884289e-05, "loss": 0.2072, "loss_nan_ranks": 0, "loss_rank_avg": 0.21699786186218262, "step": 1760, "valid_targets_mean": 5923.4, "valid_targets_min": 851 }, { "epoch": 2.7029096477794794, "grad_norm": 0.48031854884765524, "learning_rate": 3.084725856864395e-05, "loss": 0.2133, "loss_nan_ranks": 0, "loss_rank_avg": 0.21168527007102966, "step": 1765, "valid_targets_mean": 5652.4, "valid_targets_min": 996 }, { "epoch": 2.7105666156202144, "grad_norm": 0.3909694462296888, "learning_rate": 3.078300769557827e-05, "loss": 0.2139, "loss_nan_ranks": 0, "loss_rank_avg": 0.16804447770118713, "step": 1770, "valid_targets_mean": 5812.6, "valid_targets_min": 669 }, { "epoch": 2.7182235834609494, "grad_norm": 0.44319625905779303, "learning_rate": 3.0718599546778e-05, "loss": 0.2029, "loss_nan_ranks": 0, "loss_rank_avg": 0.21331599354743958, "step": 1775, "valid_targets_mean": 4729.1, "valid_targets_min": 706 }, { "epoch": 2.7258805513016844, "grad_norm": 0.4495408359076918, "learning_rate": 3.065403506166925e-05, "loss": 0.2083, "loss_nan_ranks": 0, "loss_rank_avg": 0.20311203598976135, "step": 1780, "valid_targets_mean": 5382.8, "valid_targets_min": 2506 }, { "epoch": 2.73353751914242, "grad_norm": 0.46444461555955624, "learning_rate": 3.058931518195834e-05, "loss": 0.207, "loss_nan_ranks": 0, "loss_rank_avg": 0.21994590759277344, "step": 1785, "valid_targets_mean": 4179.7, "valid_targets_min": 685 }, { "epoch": 2.741194486983155, "grad_norm": 0.591047392543951, "learning_rate": 3.052444085161818e-05, "loss": 0.2112, "loss_nan_ranks": 0, "loss_rank_avg": 0.20447468757629395, "step": 1790, "valid_targets_mean": 5012.3, "valid_targets_min": 685 }, { "epoch": 2.74885145482389, "grad_norm": 0.46171591187608774, "learning_rate": 3.0459413016874334e-05, "loss": 0.2035, "loss_nan_ranks": 0, "loss_rank_avg": 0.22244763374328613, "step": 1795, "valid_targets_mean": 4043.6, "valid_targets_min": 747 }, { "epoch": 2.756508422664625, "grad_norm": 0.4755204959145075, "learning_rate": 3.039423262619137e-05, "loss": 0.2217, "loss_nan_ranks": 0, "loss_rank_avg": 0.23722028732299805, "step": 1800, "valid_targets_mean": 4548.3, "valid_targets_min": 1499 }, { "epoch": 2.76416539050536, "grad_norm": 0.43118554325602115, "learning_rate": 3.0328900630258924e-05, "loss": 0.2163, "loss_nan_ranks": 0, "loss_rank_avg": 0.20272132754325867, "step": 1805, "valid_targets_mean": 5041.2, "valid_targets_min": 940 }, { "epoch": 2.771822358346095, "grad_norm": 0.40532349261110173, "learning_rate": 3.02634179819779e-05, "loss": 0.2001, "loss_nan_ranks": 0, "loss_rank_avg": 0.18425460159778595, "step": 1810, "valid_targets_mean": 5047.2, "valid_targets_min": 635 }, { "epoch": 2.77947932618683, "grad_norm": 0.40870340425176643, "learning_rate": 3.0197785636446516e-05, "loss": 0.1994, "loss_nan_ranks": 0, "loss_rank_avg": 0.19097676873207092, "step": 1815, "valid_targets_mean": 5106.1, "valid_targets_min": 360 }, { "epoch": 2.7871362940275652, "grad_norm": 0.4466837704739254, "learning_rate": 3.0132004550946438e-05, "loss": 0.2052, "loss_nan_ranks": 0, "loss_rank_avg": 0.24000149965286255, "step": 1820, "valid_targets_mean": 5685.8, "valid_targets_min": 603 }, { "epoch": 2.7947932618683002, "grad_norm": 0.4157130523321726, "learning_rate": 3.006607568492875e-05, "loss": 0.2277, "loss_nan_ranks": 0, "loss_rank_avg": 0.20618754625320435, "step": 1825, "valid_targets_mean": 5365.9, "valid_targets_min": 344 }, { "epoch": 2.8024502297090352, "grad_norm": 0.45846280599364925, "learning_rate": 3.0000000000000004e-05, "loss": 0.1982, "loss_nan_ranks": 0, "loss_rank_avg": 0.20795312523841858, "step": 1830, "valid_targets_mean": 5361.0, "valid_targets_min": 975 }, { "epoch": 2.8101071975497702, "grad_norm": 0.42423011488107815, "learning_rate": 2.9933778459908178e-05, "loss": 0.1997, "loss_nan_ranks": 0, "loss_rank_avg": 0.2021748125553131, "step": 1835, "valid_targets_mean": 5163.9, "valid_targets_min": 846 }, { "epoch": 2.8177641653905052, "grad_norm": 0.5922093821939035, "learning_rate": 2.986741203052863e-05, "loss": 0.2007, "loss_nan_ranks": 0, "loss_rank_avg": 0.2244371771812439, "step": 1840, "valid_targets_mean": 5787.4, "valid_targets_min": 732 }, { "epoch": 2.8254211332312407, "grad_norm": 0.41160121668642163, "learning_rate": 2.9800901679849993e-05, "loss": 0.1953, "loss_nan_ranks": 0, "loss_rank_avg": 0.20778921246528625, "step": 1845, "valid_targets_mean": 5501.7, "valid_targets_min": 663 }, { "epoch": 2.8330781010719757, "grad_norm": 0.4427215800064586, "learning_rate": 2.9734248377960072e-05, "loss": 0.2139, "loss_nan_ranks": 0, "loss_rank_avg": 0.19352000951766968, "step": 1850, "valid_targets_mean": 5902.9, "valid_targets_min": 478 }, { "epoch": 2.8407350689127107, "grad_norm": 0.4807115826614534, "learning_rate": 2.9667453097031695e-05, "loss": 0.211, "loss_nan_ranks": 0, "loss_rank_avg": 0.24455857276916504, "step": 1855, "valid_targets_mean": 4574.5, "valid_targets_min": 774 }, { "epoch": 2.8483920367534457, "grad_norm": 0.5374002834819784, "learning_rate": 2.9600516811308516e-05, "loss": 0.2138, "loss_nan_ranks": 0, "loss_rank_avg": 0.22875338792800903, "step": 1860, "valid_targets_mean": 4644.6, "valid_targets_min": 659 }, { "epoch": 2.8560490045941807, "grad_norm": 0.5090559947438412, "learning_rate": 2.953344049709082e-05, "loss": 0.1961, "loss_nan_ranks": 0, "loss_rank_avg": 0.19830799102783203, "step": 1865, "valid_targets_mean": 4229.7, "valid_targets_min": 827 }, { "epoch": 2.8637059724349156, "grad_norm": 0.45737005237173484, "learning_rate": 2.9466225132721285e-05, "loss": 0.2102, "loss_nan_ranks": 0, "loss_rank_avg": 0.20132991671562195, "step": 1870, "valid_targets_mean": 4853.1, "valid_targets_min": 792 }, { "epoch": 2.8713629402756506, "grad_norm": 0.40896772467478815, "learning_rate": 2.9398871698570706e-05, "loss": 0.2006, "loss_nan_ranks": 0, "loss_rank_avg": 0.20456016063690186, "step": 1875, "valid_targets_mean": 5263.5, "valid_targets_min": 364 }, { "epoch": 2.879019908116386, "grad_norm": 0.46658454506306835, "learning_rate": 2.9331381177023685e-05, "loss": 0.1953, "loss_nan_ranks": 0, "loss_rank_avg": 0.20330816507339478, "step": 1880, "valid_targets_mean": 4714.1, "valid_targets_min": 1107 }, { "epoch": 2.886676875957121, "grad_norm": 0.45821454150634894, "learning_rate": 2.9263754552464338e-05, "loss": 0.2046, "loss_nan_ranks": 0, "loss_rank_avg": 0.19405120611190796, "step": 1885, "valid_targets_mean": 4531.8, "valid_targets_min": 353 }, { "epoch": 2.894333843797856, "grad_norm": 0.5547254247208179, "learning_rate": 2.9195992811261897e-05, "loss": 0.2065, "loss_nan_ranks": 0, "loss_rank_avg": 0.23308220505714417, "step": 1890, "valid_targets_mean": 3445.6, "valid_targets_min": 270 }, { "epoch": 2.901990811638591, "grad_norm": 0.45421334304878075, "learning_rate": 2.912809694175634e-05, "loss": 0.2187, "loss_nan_ranks": 0, "loss_rank_avg": 0.2073233723640442, "step": 1895, "valid_targets_mean": 4847.8, "valid_targets_min": 610 }, { "epoch": 2.909647779479326, "grad_norm": 0.528454036702243, "learning_rate": 2.906006793424398e-05, "loss": 0.2079, "loss_nan_ranks": 0, "loss_rank_avg": 0.21321921050548553, "step": 1900, "valid_targets_mean": 3648.8, "valid_targets_min": 680 }, { "epoch": 2.9173047473200615, "grad_norm": 0.41825864046575006, "learning_rate": 2.8991906780963014e-05, "loss": 0.194, "loss_nan_ranks": 0, "loss_rank_avg": 0.19795027375221252, "step": 1905, "valid_targets_mean": 5839.6, "valid_targets_min": 2864 }, { "epoch": 2.924961715160796, "grad_norm": 0.41700524250275683, "learning_rate": 2.8923614476079053e-05, "loss": 0.2008, "loss_nan_ranks": 0, "loss_rank_avg": 0.20309601724147797, "step": 1910, "valid_targets_mean": 5556.4, "valid_targets_min": 1212 }, { "epoch": 2.9326186830015315, "grad_norm": 0.41390443168776353, "learning_rate": 2.885519201567063e-05, "loss": 0.2072, "loss_nan_ranks": 0, "loss_rank_avg": 0.19842462241649628, "step": 1915, "valid_targets_mean": 5288.7, "valid_targets_min": 966 }, { "epoch": 2.9402756508422665, "grad_norm": 0.44113143651113673, "learning_rate": 2.878664039771466e-05, "loss": 0.2055, "loss_nan_ranks": 0, "loss_rank_avg": 0.1972970962524414, "step": 1920, "valid_targets_mean": 4468.6, "valid_targets_min": 724 }, { "epoch": 2.9479326186830015, "grad_norm": 0.42348693430683976, "learning_rate": 2.8717960622071875e-05, "loss": 0.1982, "loss_nan_ranks": 0, "loss_rank_avg": 0.2290765643119812, "step": 1925, "valid_targets_mean": 5191.4, "valid_targets_min": 1011 }, { "epoch": 2.9555895865237365, "grad_norm": 0.40281713608998554, "learning_rate": 2.8649153690472258e-05, "loss": 0.1955, "loss_nan_ranks": 0, "loss_rank_avg": 0.18338808417320251, "step": 1930, "valid_targets_mean": 5284.5, "valid_targets_min": 734 }, { "epoch": 2.9632465543644715, "grad_norm": 0.4313394629221367, "learning_rate": 2.858022060650045e-05, "loss": 0.2046, "loss_nan_ranks": 0, "loss_rank_avg": 0.20001380145549774, "step": 1935, "valid_targets_mean": 4850.2, "valid_targets_min": 294 }, { "epoch": 2.970903522205207, "grad_norm": 0.4330030636250435, "learning_rate": 2.851116237558106e-05, "loss": 0.2071, "loss_nan_ranks": 0, "loss_rank_avg": 0.19025284051895142, "step": 1940, "valid_targets_mean": 4625.9, "valid_targets_min": 313 }, { "epoch": 2.978560490045942, "grad_norm": 0.4537727728009908, "learning_rate": 2.8441980004964035e-05, "loss": 0.2165, "loss_nan_ranks": 0, "loss_rank_avg": 0.22758567333221436, "step": 1945, "valid_targets_mean": 5108.7, "valid_targets_min": 908 }, { "epoch": 2.986217457886677, "grad_norm": 0.5070336992907599, "learning_rate": 2.8372674503709988e-05, "loss": 0.2076, "loss_nan_ranks": 0, "loss_rank_avg": 0.22816471755504608, "step": 1950, "valid_targets_mean": 4112.2, "valid_targets_min": 731 }, { "epoch": 2.993874425727412, "grad_norm": 0.5222307071784804, "learning_rate": 2.8303246882675422e-05, "loss": 0.2063, "loss_nan_ranks": 0, "loss_rank_avg": 0.230756014585495, "step": 1955, "valid_targets_mean": 4718.6, "valid_targets_min": 822 }, { "epoch": 3.001531393568147, "grad_norm": 0.44388401663627725, "learning_rate": 2.8233698154498042e-05, "loss": 0.2, "loss_nan_ranks": 0, "loss_rank_avg": 0.21255435049533844, "step": 1960, "valid_targets_mean": 5199.9, "valid_targets_min": 538 }, { "epoch": 3.009188361408882, "grad_norm": 0.49805799320752814, "learning_rate": 2.8164029333581964e-05, "loss": 0.1928, "loss_nan_ranks": 0, "loss_rank_avg": 0.17959743738174438, "step": 1965, "valid_targets_mean": 4954.9, "valid_targets_min": 685 }, { "epoch": 3.0168453292496173, "grad_norm": 0.451755079299758, "learning_rate": 2.809424143608289e-05, "loss": 0.2047, "loss_nan_ranks": 0, "loss_rank_avg": 0.1869395226240158, "step": 1970, "valid_targets_mean": 5274.4, "valid_targets_min": 538 }, { "epoch": 3.0245022970903523, "grad_norm": 0.4237197860277832, "learning_rate": 2.802433547989336e-05, "loss": 0.1855, "loss_nan_ranks": 0, "loss_rank_avg": 0.1696140170097351, "step": 1975, "valid_targets_mean": 5256.1, "valid_targets_min": 869 }, { "epoch": 3.0321592649310873, "grad_norm": 0.48674324881062975, "learning_rate": 2.7954312484627824e-05, "loss": 0.1877, "loss_nan_ranks": 0, "loss_rank_avg": 0.1883959323167801, "step": 1980, "valid_targets_mean": 5084.5, "valid_targets_min": 702 }, { "epoch": 3.0398162327718223, "grad_norm": 0.49321268064240037, "learning_rate": 2.788417347160783e-05, "loss": 0.1898, "loss_nan_ranks": 0, "loss_rank_avg": 0.20648150146007538, "step": 1985, "valid_targets_mean": 4628.4, "valid_targets_min": 682 }, { "epoch": 3.0474732006125573, "grad_norm": 0.541476424950113, "learning_rate": 2.7813919463847094e-05, "loss": 0.1906, "loss_nan_ranks": 0, "loss_rank_avg": 0.19818390905857086, "step": 1990, "valid_targets_mean": 4582.2, "valid_targets_min": 680 }, { "epoch": 3.0551301684532923, "grad_norm": 0.4501064317153738, "learning_rate": 2.7743551486036588e-05, "loss": 0.1948, "loss_nan_ranks": 0, "loss_rank_avg": 0.18310943245887756, "step": 1995, "valid_targets_mean": 5253.2, "valid_targets_min": 846 }, { "epoch": 3.0627871362940278, "grad_norm": 0.47833852227635554, "learning_rate": 2.7673070564529606e-05, "loss": 0.1746, "loss_nan_ranks": 0, "loss_rank_avg": 0.1747608482837677, "step": 2000, "valid_targets_mean": 5987.4, "valid_targets_min": 661 }, { "epoch": 3.0704441041347628, "grad_norm": 0.44582266307962753, "learning_rate": 2.7602477727326764e-05, "loss": 0.1831, "loss_nan_ranks": 0, "loss_rank_avg": 0.20294205844402313, "step": 2005, "valid_targets_mean": 5650.4, "valid_targets_min": 345 }, { "epoch": 3.0781010719754978, "grad_norm": 0.4439541326450507, "learning_rate": 2.7531774004061057e-05, "loss": 0.1956, "loss_nan_ranks": 0, "loss_rank_avg": 0.18605002760887146, "step": 2010, "valid_targets_mean": 5244.9, "valid_targets_min": 736 }, { "epoch": 3.0857580398162328, "grad_norm": 0.8975814777494563, "learning_rate": 2.746096042598279e-05, "loss": 0.1872, "loss_nan_ranks": 0, "loss_rank_avg": 0.1635829508304596, "step": 2015, "valid_targets_mean": 4843.5, "valid_targets_min": 776 }, { "epoch": 3.0934150076569678, "grad_norm": 0.4399161374325912, "learning_rate": 2.739003802594456e-05, "loss": 0.179, "loss_nan_ranks": 0, "loss_rank_avg": 0.19688273966312408, "step": 2020, "valid_targets_mean": 5672.7, "valid_targets_min": 580 }, { "epoch": 3.1010719754977027, "grad_norm": 0.4325179298872115, "learning_rate": 2.7319007838386177e-05, "loss": 0.1818, "loss_nan_ranks": 0, "loss_rank_avg": 0.1865837574005127, "step": 2025, "valid_targets_mean": 5061.4, "valid_targets_min": 1569 }, { "epoch": 3.108728943338438, "grad_norm": 0.5041193832066779, "learning_rate": 2.724787089931962e-05, "loss": 0.1907, "loss_nan_ranks": 0, "loss_rank_avg": 0.17695216834545135, "step": 2030, "valid_targets_mean": 4700.2, "valid_targets_min": 635 }, { "epoch": 3.116385911179173, "grad_norm": 0.6636882689104748, "learning_rate": 2.7176628246313864e-05, "loss": 0.1833, "loss_nan_ranks": 0, "loss_rank_avg": 0.17805099487304688, "step": 2035, "valid_targets_mean": 5752.7, "valid_targets_min": 274 }, { "epoch": 3.124042879019908, "grad_norm": 0.4991191331475684, "learning_rate": 2.7105280918479775e-05, "loss": 0.1787, "loss_nan_ranks": 0, "loss_rank_avg": 0.18973186612129211, "step": 2040, "valid_targets_mean": 5067.0, "valid_targets_min": 706 }, { "epoch": 3.131699846860643, "grad_norm": 0.4629329569115915, "learning_rate": 2.7033829956454992e-05, "loss": 0.193, "loss_nan_ranks": 0, "loss_rank_avg": 0.22558261454105377, "step": 2045, "valid_targets_mean": 4791.7, "valid_targets_min": 880 }, { "epoch": 3.139356814701378, "grad_norm": 0.4955623156729709, "learning_rate": 2.696227640238867e-05, "loss": 0.1806, "loss_nan_ranks": 0, "loss_rank_avg": 0.18404105305671692, "step": 2050, "valid_targets_mean": 4818.3, "valid_targets_min": 294 }, { "epoch": 3.147013782542113, "grad_norm": 0.40572235426798386, "learning_rate": 2.6890621299926337e-05, "loss": 0.1846, "loss_nan_ranks": 0, "loss_rank_avg": 0.16386070847511292, "step": 2055, "valid_targets_mean": 5887.9, "valid_targets_min": 854 }, { "epoch": 3.1546707503828486, "grad_norm": 0.4822367465005572, "learning_rate": 2.681886569419467e-05, "loss": 0.1872, "loss_nan_ranks": 0, "loss_rank_avg": 0.1752379685640335, "step": 2060, "valid_targets_mean": 4959.8, "valid_targets_min": 559 }, { "epoch": 3.1623277182235836, "grad_norm": 0.42573426451272567, "learning_rate": 2.674701063178621e-05, "loss": 0.1962, "loss_nan_ranks": 0, "loss_rank_avg": 0.1862529069185257, "step": 2065, "valid_targets_mean": 5424.7, "valid_targets_min": 924 }, { "epoch": 3.1699846860643186, "grad_norm": 0.555365775012984, "learning_rate": 2.6675057160744157e-05, "loss": 0.1824, "loss_nan_ranks": 0, "loss_rank_avg": 0.2169274091720581, "step": 2070, "valid_targets_mean": 4135.9, "valid_targets_min": 665 }, { "epoch": 3.1776416539050536, "grad_norm": 0.49960455879913235, "learning_rate": 2.660300633054703e-05, "loss": 0.1881, "loss_nan_ranks": 0, "loss_rank_avg": 0.19349941611289978, "step": 2075, "valid_targets_mean": 4799.2, "valid_targets_min": 692 }, { "epoch": 3.1852986217457886, "grad_norm": 0.4401708479718189, "learning_rate": 2.653085919209339e-05, "loss": 0.1859, "loss_nan_ranks": 0, "loss_rank_avg": 0.19372834265232086, "step": 2080, "valid_targets_mean": 5538.8, "valid_targets_min": 2930 }, { "epoch": 3.1929555895865236, "grad_norm": 0.40630670332354507, "learning_rate": 2.64586167976865e-05, "loss": 0.1785, "loss_nan_ranks": 0, "loss_rank_avg": 0.18609587848186493, "step": 2085, "valid_targets_mean": 5602.0, "valid_targets_min": 1947 }, { "epoch": 3.2006125574272586, "grad_norm": 0.4486946026376343, "learning_rate": 2.6386280201018978e-05, "loss": 0.1776, "loss_nan_ranks": 0, "loss_rank_avg": 0.19235703349113464, "step": 2090, "valid_targets_mean": 5800.1, "valid_targets_min": 834 }, { "epoch": 3.208269525267994, "grad_norm": 0.43778644558935853, "learning_rate": 2.6313850457157446e-05, "loss": 0.2011, "loss_nan_ranks": 0, "loss_rank_avg": 0.18642935156822205, "step": 2095, "valid_targets_mean": 5270.8, "valid_targets_min": 2460 }, { "epoch": 3.215926493108729, "grad_norm": 0.4771876713178929, "learning_rate": 2.6241328622527097e-05, "loss": 0.1865, "loss_nan_ranks": 0, "loss_rank_avg": 0.20062386989593506, "step": 2100, "valid_targets_mean": 5161.2, "valid_targets_min": 2477 }, { "epoch": 3.223583460949464, "grad_norm": 0.46215779428957415, "learning_rate": 2.6168715754896346e-05, "loss": 0.1972, "loss_nan_ranks": 0, "loss_rank_avg": 0.19280359148979187, "step": 2105, "valid_targets_mean": 5252.8, "valid_targets_min": 965 }, { "epoch": 3.231240428790199, "grad_norm": 0.445313686278001, "learning_rate": 2.6096012913361355e-05, "loss": 0.1722, "loss_nan_ranks": 0, "loss_rank_avg": 0.17572081089019775, "step": 2110, "valid_targets_mean": 5731.9, "valid_targets_min": 1637 }, { "epoch": 3.238897396630934, "grad_norm": 0.5062526832195221, "learning_rate": 2.60232211583306e-05, "loss": 0.1885, "loss_nan_ranks": 0, "loss_rank_avg": 0.18368211388587952, "step": 2115, "valid_targets_mean": 4119.7, "valid_targets_min": 889 }, { "epoch": 3.2465543644716695, "grad_norm": 0.5086260485057701, "learning_rate": 2.5950341551509417e-05, "loss": 0.185, "loss_nan_ranks": 0, "loss_rank_avg": 0.16073405742645264, "step": 2120, "valid_targets_mean": 5029.1, "valid_targets_min": 801 }, { "epoch": 3.2542113323124044, "grad_norm": 0.4553370142955746, "learning_rate": 2.58773751558845e-05, "loss": 0.1741, "loss_nan_ranks": 0, "loss_rank_avg": 0.1590225100517273, "step": 2125, "valid_targets_mean": 5276.3, "valid_targets_min": 645 }, { "epoch": 3.2618683001531394, "grad_norm": 0.5007894833828535, "learning_rate": 2.5804323035708398e-05, "loss": 0.1764, "loss_nan_ranks": 0, "loss_rank_avg": 0.17388451099395752, "step": 2130, "valid_targets_mean": 4547.9, "valid_targets_min": 294 }, { "epoch": 3.2695252679938744, "grad_norm": 0.4373602866755202, "learning_rate": 2.5731186256484e-05, "loss": 0.2035, "loss_nan_ranks": 0, "loss_rank_avg": 0.18840092420578003, "step": 2135, "valid_targets_mean": 4721.8, "valid_targets_min": 546 }, { "epoch": 3.2771822358346094, "grad_norm": 0.6742452779283673, "learning_rate": 2.5657965884949e-05, "loss": 0.1971, "loss_nan_ranks": 0, "loss_rank_avg": 0.2183414101600647, "step": 2140, "valid_targets_mean": 4429.9, "valid_targets_min": 860 }, { "epoch": 3.2848392036753444, "grad_norm": 0.45898450490614895, "learning_rate": 2.5584662989060317e-05, "loss": 0.1904, "loss_nan_ranks": 0, "loss_rank_avg": 0.17275741696357727, "step": 2145, "valid_targets_mean": 5442.9, "valid_targets_min": 743 }, { "epoch": 3.2924961715160794, "grad_norm": 0.44882146875151396, "learning_rate": 2.5511278637978532e-05, "loss": 0.1879, "loss_nan_ranks": 0, "loss_rank_avg": 0.15515941381454468, "step": 2150, "valid_targets_mean": 5243.6, "valid_targets_min": 682 }, { "epoch": 3.300153139356815, "grad_norm": 0.4467734518319107, "learning_rate": 2.5437813902052292e-05, "loss": 0.1774, "loss_nan_ranks": 0, "loss_rank_avg": 0.18329621851444244, "step": 2155, "valid_targets_mean": 5117.8, "valid_targets_min": 616 }, { "epoch": 3.30781010719755, "grad_norm": 0.4152520371866648, "learning_rate": 2.536426985280271e-05, "loss": 0.2025, "loss_nan_ranks": 0, "loss_rank_avg": 0.1850317418575287, "step": 2160, "valid_targets_mean": 5134.1, "valid_targets_min": 662 }, { "epoch": 3.315467075038285, "grad_norm": 0.44998774771356215, "learning_rate": 2.5290647562907705e-05, "loss": 0.1929, "loss_nan_ranks": 0, "loss_rank_avg": 0.21751946210861206, "step": 2165, "valid_targets_mean": 5467.7, "valid_targets_min": 2622 }, { "epoch": 3.32312404287902, "grad_norm": 0.4019431753462474, "learning_rate": 2.5216948106186395e-05, "loss": 0.1782, "loss_nan_ranks": 0, "loss_rank_avg": 0.1585729718208313, "step": 2170, "valid_targets_mean": 5651.1, "valid_targets_min": 789 }, { "epoch": 3.330781010719755, "grad_norm": 0.5618290697674159, "learning_rate": 2.5143172557583412e-05, "loss": 0.1885, "loss_nan_ranks": 0, "loss_rank_avg": 0.21604791283607483, "step": 2175, "valid_targets_mean": 3703.8, "valid_targets_min": 748 }, { "epoch": 3.3384379785604903, "grad_norm": 0.43902097786183897, "learning_rate": 2.506932199315321e-05, "loss": 0.1921, "loss_nan_ranks": 0, "loss_rank_avg": 0.19183912873268127, "step": 2180, "valid_targets_mean": 4844.0, "valid_targets_min": 744 }, { "epoch": 3.3460949464012253, "grad_norm": 0.45644637337033184, "learning_rate": 2.499539749004441e-05, "loss": 0.2002, "loss_nan_ranks": 0, "loss_rank_avg": 0.20222628116607666, "step": 2185, "valid_targets_mean": 5212.4, "valid_targets_min": 773 }, { "epoch": 3.3537519142419603, "grad_norm": 0.4393001352247523, "learning_rate": 2.4921400126484057e-05, "loss": 0.1925, "loss_nan_ranks": 0, "loss_rank_avg": 0.20443087816238403, "step": 2190, "valid_targets_mean": 5666.1, "valid_targets_min": 1784 }, { "epoch": 3.3614088820826953, "grad_norm": 0.5628152912241892, "learning_rate": 2.4847330981761893e-05, "loss": 0.1818, "loss_nan_ranks": 0, "loss_rank_avg": 0.18845781683921814, "step": 2195, "valid_targets_mean": 3962.0, "valid_targets_min": 610 }, { "epoch": 3.3690658499234303, "grad_norm": 0.4499446422169732, "learning_rate": 2.4773191136214655e-05, "loss": 0.1951, "loss_nan_ranks": 0, "loss_rank_avg": 0.1923513114452362, "step": 2200, "valid_targets_mean": 4977.8, "valid_targets_min": 830 }, { "epoch": 3.3767228177641653, "grad_norm": 0.4645104369113949, "learning_rate": 2.4698981671210253e-05, "loss": 0.1809, "loss_nan_ranks": 0, "loss_rank_avg": 0.1823941171169281, "step": 2205, "valid_targets_mean": 4065.4, "valid_targets_min": 358 }, { "epoch": 3.3843797856049003, "grad_norm": 0.46636495279671436, "learning_rate": 2.462470366913206e-05, "loss": 0.1882, "loss_nan_ranks": 0, "loss_rank_avg": 0.18425936996936798, "step": 2210, "valid_targets_mean": 4618.2, "valid_targets_min": 601 }, { "epoch": 3.3920367534456357, "grad_norm": 0.5055126421992738, "learning_rate": 2.4550358213363083e-05, "loss": 0.1874, "loss_nan_ranks": 0, "loss_rank_avg": 0.19574221968650818, "step": 2215, "valid_targets_mean": 3900.2, "valid_targets_min": 591 }, { "epoch": 3.3996937212863707, "grad_norm": 0.5503070083738346, "learning_rate": 2.4475946388270172e-05, "loss": 0.1848, "loss_nan_ranks": 0, "loss_rank_avg": 0.17538341879844666, "step": 2220, "valid_targets_mean": 3802.2, "valid_targets_min": 255 }, { "epoch": 3.4073506891271057, "grad_norm": 0.47088674144945025, "learning_rate": 2.440146927918823e-05, "loss": 0.1889, "loss_nan_ranks": 0, "loss_rank_avg": 0.2073318362236023, "step": 2225, "valid_targets_mean": 4473.6, "valid_targets_min": 421 }, { "epoch": 3.4150076569678407, "grad_norm": 0.4740661356667313, "learning_rate": 2.4326927972404333e-05, "loss": 0.1995, "loss_nan_ranks": 0, "loss_rank_avg": 0.20011824369430542, "step": 2230, "valid_targets_mean": 4605.9, "valid_targets_min": 626 }, { "epoch": 3.4226646248085757, "grad_norm": 0.4165429827415794, "learning_rate": 2.4252323555141935e-05, "loss": 0.1817, "loss_nan_ranks": 0, "loss_rank_avg": 0.17027318477630615, "step": 2235, "valid_targets_mean": 5750.4, "valid_targets_min": 2722 }, { "epoch": 3.4303215926493107, "grad_norm": 0.4794637308355578, "learning_rate": 2.417765711554498e-05, "loss": 0.1843, "loss_nan_ranks": 0, "loss_rank_avg": 0.16433902084827423, "step": 2240, "valid_targets_mean": 4362.0, "valid_targets_min": 621 }, { "epoch": 3.437978560490046, "grad_norm": 0.5136159685801481, "learning_rate": 2.410292974266203e-05, "loss": 0.1972, "loss_nan_ranks": 0, "loss_rank_avg": 0.20960760116577148, "step": 2245, "valid_targets_mean": 3976.4, "valid_targets_min": 758 }, { "epoch": 3.445635528330781, "grad_norm": 0.5270719518942621, "learning_rate": 2.402814252643042e-05, "loss": 0.1958, "loss_nan_ranks": 0, "loss_rank_avg": 0.20371288061141968, "step": 2250, "valid_targets_mean": 4996.0, "valid_targets_min": 1014 }, { "epoch": 3.453292496171516, "grad_norm": 0.48963006601475756, "learning_rate": 2.3953296557660288e-05, "loss": 0.1925, "loss_nan_ranks": 0, "loss_rank_avg": 0.18395353853702545, "step": 2255, "valid_targets_mean": 5188.1, "valid_targets_min": 827 }, { "epoch": 3.460949464012251, "grad_norm": 0.4145211188615159, "learning_rate": 2.387839292801875e-05, "loss": 0.1779, "loss_nan_ranks": 0, "loss_rank_avg": 0.1779845654964447, "step": 2260, "valid_targets_mean": 5619.1, "valid_targets_min": 663 }, { "epoch": 3.468606431852986, "grad_norm": 0.4701954182659396, "learning_rate": 2.3803432730013913e-05, "loss": 0.1833, "loss_nan_ranks": 0, "loss_rank_avg": 0.18874239921569824, "step": 2265, "valid_targets_mean": 4970.4, "valid_targets_min": 854 }, { "epoch": 3.476263399693721, "grad_norm": 0.5084547938774928, "learning_rate": 2.372841705697897e-05, "loss": 0.1884, "loss_nan_ranks": 0, "loss_rank_avg": 0.19924131035804749, "step": 2270, "valid_targets_mean": 4273.2, "valid_targets_min": 525 }, { "epoch": 3.4839203675344566, "grad_norm": 0.42346772066137994, "learning_rate": 2.365334700305624e-05, "loss": 0.1857, "loss_nan_ranks": 0, "loss_rank_avg": 0.18509188294410706, "step": 2275, "valid_targets_mean": 5318.5, "valid_targets_min": 593 }, { "epoch": 3.4915773353751915, "grad_norm": 0.43876011826770084, "learning_rate": 2.3578223663181214e-05, "loss": 0.1868, "loss_nan_ranks": 0, "loss_rank_avg": 0.19643978774547577, "step": 2280, "valid_targets_mean": 4982.8, "valid_targets_min": 744 }, { "epoch": 3.4992343032159265, "grad_norm": 0.4259076717957742, "learning_rate": 2.35030481330666e-05, "loss": 0.1914, "loss_nan_ranks": 0, "loss_rank_avg": 0.17723461985588074, "step": 2285, "valid_targets_mean": 5322.2, "valid_targets_min": 1669 }, { "epoch": 3.5068912710566615, "grad_norm": 0.40790611814620886, "learning_rate": 2.3427821509186308e-05, "loss": 0.1914, "loss_nan_ranks": 0, "loss_rank_avg": 0.16672778129577637, "step": 2290, "valid_targets_mean": 5282.6, "valid_targets_min": 1002 }, { "epoch": 3.5145482388973965, "grad_norm": 0.43724973404898343, "learning_rate": 2.3352544888759495e-05, "loss": 0.1775, "loss_nan_ranks": 0, "loss_rank_avg": 0.17628073692321777, "step": 2295, "valid_targets_mean": 5093.2, "valid_targets_min": 732 }, { "epoch": 3.522205206738132, "grad_norm": 0.4419945752454893, "learning_rate": 2.3277219369734537e-05, "loss": 0.2059, "loss_nan_ranks": 0, "loss_rank_avg": 0.17800669372081757, "step": 2300, "valid_targets_mean": 5829.1, "valid_targets_min": 464 }, { "epoch": 3.5298621745788665, "grad_norm": 0.40029502890365776, "learning_rate": 2.320184605077302e-05, "loss": 0.1806, "loss_nan_ranks": 0, "loss_rank_avg": 0.1498422920703888, "step": 2305, "valid_targets_mean": 6132.4, "valid_targets_min": 3259 }, { "epoch": 3.537519142419602, "grad_norm": 0.4317895472992919, "learning_rate": 2.3126426031233714e-05, "loss": 0.1799, "loss_nan_ranks": 0, "loss_rank_avg": 0.20129495859146118, "step": 2310, "valid_targets_mean": 5208.1, "valid_targets_min": 901 }, { "epoch": 3.545176110260337, "grad_norm": 0.40601945027019737, "learning_rate": 2.3050960411156546e-05, "loss": 0.1767, "loss_nan_ranks": 0, "loss_rank_avg": 0.18385669589042664, "step": 2315, "valid_targets_mean": 6188.5, "valid_targets_min": 3363 }, { "epoch": 3.552833078101072, "grad_norm": 0.4955956305407851, "learning_rate": 2.2975450291246536e-05, "loss": 0.1815, "loss_nan_ranks": 0, "loss_rank_avg": 0.16455523669719696, "step": 2320, "valid_targets_mean": 5401.9, "valid_targets_min": 434 }, { "epoch": 3.560490045941807, "grad_norm": 0.4775531036710853, "learning_rate": 2.289989677285779e-05, "loss": 0.1904, "loss_nan_ranks": 0, "loss_rank_avg": 0.20387563109397888, "step": 2325, "valid_targets_mean": 5242.1, "valid_targets_min": 680 }, { "epoch": 3.568147013782542, "grad_norm": 0.42783431960706375, "learning_rate": 2.282430095797737e-05, "loss": 0.1916, "loss_nan_ranks": 0, "loss_rank_avg": 0.17975592613220215, "step": 2330, "valid_targets_mean": 5704.2, "valid_targets_min": 792 }, { "epoch": 3.5758039816232774, "grad_norm": 0.4653094697113535, "learning_rate": 2.274866394920927e-05, "loss": 0.184, "loss_nan_ranks": 0, "loss_rank_avg": 0.19249895215034485, "step": 2335, "valid_targets_mean": 5539.1, "valid_targets_min": 916 }, { "epoch": 3.5834609494640124, "grad_norm": 0.42954428223445007, "learning_rate": 2.2672986849758316e-05, "loss": 0.1834, "loss_nan_ranks": 0, "loss_rank_avg": 0.17228573560714722, "step": 2340, "valid_targets_mean": 5570.5, "valid_targets_min": 2379 }, { "epoch": 3.5911179173047474, "grad_norm": 0.8433824524079548, "learning_rate": 2.259727076341407e-05, "loss": 0.1891, "loss_nan_ranks": 0, "loss_rank_avg": 0.15344902873039246, "step": 2345, "valid_targets_mean": 5395.2, "valid_targets_min": 1700 }, { "epoch": 3.5987748851454824, "grad_norm": 0.43204330288459675, "learning_rate": 2.252151679453475e-05, "loss": 0.1856, "loss_nan_ranks": 0, "loss_rank_avg": 0.1977773904800415, "step": 2350, "valid_targets_mean": 4850.1, "valid_targets_min": 794 }, { "epoch": 3.6064318529862174, "grad_norm": 0.3957799588447967, "learning_rate": 2.2445726048031104e-05, "loss": 0.1802, "loss_nan_ranks": 0, "loss_rank_avg": 0.18701013922691345, "step": 2355, "valid_targets_mean": 6515.1, "valid_targets_min": 1939 }, { "epoch": 3.6140888208269524, "grad_norm": 0.46060379254586875, "learning_rate": 2.23698996293503e-05, "loss": 0.2011, "loss_nan_ranks": 0, "loss_rank_avg": 0.19811898469924927, "step": 2360, "valid_targets_mean": 5086.2, "valid_targets_min": 1335 }, { "epoch": 3.6217457886676874, "grad_norm": 0.4761035270932635, "learning_rate": 2.2294038644459805e-05, "loss": 0.1966, "loss_nan_ranks": 0, "loss_rank_avg": 0.18033194541931152, "step": 2365, "valid_targets_mean": 4584.5, "valid_targets_min": 607 }, { "epoch": 3.629402756508423, "grad_norm": 0.4869396442286812, "learning_rate": 2.221814419983125e-05, "loss": 0.195, "loss_nan_ranks": 0, "loss_rank_avg": 0.20814746618270874, "step": 2370, "valid_targets_mean": 5545.9, "valid_targets_min": 2727 }, { "epoch": 3.637059724349158, "grad_norm": 0.46298467756924694, "learning_rate": 2.2142217402424296e-05, "loss": 0.1854, "loss_nan_ranks": 0, "loss_rank_avg": 0.176169753074646, "step": 2375, "valid_targets_mean": 4827.2, "valid_targets_min": 581 }, { "epoch": 3.644716692189893, "grad_norm": 0.4195617237812523, "learning_rate": 2.2066259359670485e-05, "loss": 0.1936, "loss_nan_ranks": 0, "loss_rank_avg": 0.17234407365322113, "step": 2380, "valid_targets_mean": 5661.3, "valid_targets_min": 814 }, { "epoch": 3.652373660030628, "grad_norm": 0.43491867592878586, "learning_rate": 2.1990271179457082e-05, "loss": 0.1858, "loss_nan_ranks": 0, "loss_rank_avg": 0.17926275730133057, "step": 2385, "valid_targets_mean": 5154.2, "valid_targets_min": 1010 }, { "epoch": 3.660030627871363, "grad_norm": 0.5808883209817489, "learning_rate": 2.1914253970110937e-05, "loss": 0.2006, "loss_nan_ranks": 0, "loss_rank_avg": 0.22726327180862427, "step": 2390, "valid_targets_mean": 3341.1, "valid_targets_min": 582 }, { "epoch": 3.6676875957120982, "grad_norm": 0.39616224115059184, "learning_rate": 2.1838208840382294e-05, "loss": 0.1836, "loss_nan_ranks": 0, "loss_rank_avg": 0.17501763999462128, "step": 2395, "valid_targets_mean": 5985.6, "valid_targets_min": 1035 }, { "epoch": 3.6753445635528332, "grad_norm": 0.5537720074927155, "learning_rate": 2.176213689942863e-05, "loss": 0.1896, "loss_nan_ranks": 0, "loss_rank_avg": 0.2179131954908371, "step": 2400, "valid_targets_mean": 3625.4, "valid_targets_min": 364 }, { "epoch": 3.6830015313935682, "grad_norm": 0.43256442597937816, "learning_rate": 2.168603925679849e-05, "loss": 0.1609, "loss_nan_ranks": 0, "loss_rank_avg": 0.14384448528289795, "step": 2405, "valid_targets_mean": 4353.9, "valid_targets_min": 335 }, { "epoch": 3.6906584992343032, "grad_norm": 0.4852843793132942, "learning_rate": 2.160991702241527e-05, "loss": 0.1968, "loss_nan_ranks": 0, "loss_rank_avg": 0.20300811529159546, "step": 2410, "valid_targets_mean": 4493.1, "valid_targets_min": 591 }, { "epoch": 3.698315467075038, "grad_norm": 0.4046986527750801, "learning_rate": 2.1533771306561066e-05, "loss": 0.1897, "loss_nan_ranks": 0, "loss_rank_avg": 0.17245183885097504, "step": 2415, "valid_targets_mean": 6083.0, "valid_targets_min": 837 }, { "epoch": 3.705972434915773, "grad_norm": 0.4681618550416894, "learning_rate": 2.1457603219860457e-05, "loss": 0.1894, "loss_nan_ranks": 0, "loss_rank_avg": 0.20374765992164612, "step": 2420, "valid_targets_mean": 4759.5, "valid_targets_min": 492 }, { "epoch": 3.713629402756508, "grad_norm": 0.35609101937418786, "learning_rate": 2.1381413873264315e-05, "loss": 0.1729, "loss_nan_ranks": 0, "loss_rank_avg": 0.16857865452766418, "step": 2425, "valid_targets_mean": 6080.7, "valid_targets_min": 3141 }, { "epoch": 3.7212863705972437, "grad_norm": 0.39199321408980886, "learning_rate": 2.1305204378033598e-05, "loss": 0.1798, "loss_nan_ranks": 0, "loss_rank_avg": 0.17050239443778992, "step": 2430, "valid_targets_mean": 6238.8, "valid_targets_min": 2991 }, { "epoch": 3.7289433384379786, "grad_norm": 0.5289287346109518, "learning_rate": 2.1228975845723137e-05, "loss": 0.1837, "loss_nan_ranks": 0, "loss_rank_avg": 0.18746045231819153, "step": 2435, "valid_targets_mean": 3991.0, "valid_targets_min": 251 }, { "epoch": 3.7366003062787136, "grad_norm": 0.4065373365511912, "learning_rate": 2.115272938816544e-05, "loss": 0.1844, "loss_nan_ranks": 0, "loss_rank_avg": 0.14783808588981628, "step": 2440, "valid_targets_mean": 4898.0, "valid_targets_min": 661 }, { "epoch": 3.7442572741194486, "grad_norm": 0.465243722366574, "learning_rate": 2.107646611745445e-05, "loss": 0.1912, "loss_nan_ranks": 0, "loss_rank_avg": 0.2061719298362732, "step": 2445, "valid_targets_mean": 5343.1, "valid_targets_min": 720 }, { "epoch": 3.7519142419601836, "grad_norm": 0.5540659684720433, "learning_rate": 2.1000187145929347e-05, "loss": 0.1931, "loss_nan_ranks": 0, "loss_rank_avg": 0.20314675569534302, "step": 2450, "valid_targets_mean": 3803.7, "valid_targets_min": 490 }, { "epoch": 3.759571209800919, "grad_norm": 0.5243985701272287, "learning_rate": 2.092389358615832e-05, "loss": 0.2083, "loss_nan_ranks": 0, "loss_rank_avg": 0.2511424124240875, "step": 2455, "valid_targets_mean": 4707.7, "valid_targets_min": 611 }, { "epoch": 3.7672281776416536, "grad_norm": 0.42664805575678655, "learning_rate": 2.0847586550922326e-05, "loss": 0.1889, "loss_nan_ranks": 0, "loss_rank_avg": 0.2017786204814911, "step": 2460, "valid_targets_mean": 5301.8, "valid_targets_min": 918 }, { "epoch": 3.774885145482389, "grad_norm": 0.4453346796586349, "learning_rate": 2.0771267153198873e-05, "loss": 0.1919, "loss_nan_ranks": 0, "loss_rank_avg": 0.17807403206825256, "step": 2465, "valid_targets_mean": 5417.9, "valid_targets_min": 928 }, { "epoch": 3.782542113323124, "grad_norm": 0.4219997971711044, "learning_rate": 2.069493650614578e-05, "loss": 0.1863, "loss_nan_ranks": 0, "loss_rank_avg": 0.1867009550333023, "step": 2470, "valid_targets_mean": 5047.1, "valid_targets_min": 616 }, { "epoch": 3.790199081163859, "grad_norm": 0.3945998573310309, "learning_rate": 2.0618595723084938e-05, "loss": 0.1803, "loss_nan_ranks": 0, "loss_rank_avg": 0.16966620087623596, "step": 2475, "valid_targets_mean": 5595.2, "valid_targets_min": 727 }, { "epoch": 3.797856049004594, "grad_norm": 0.3896927875127744, "learning_rate": 2.054224591748609e-05, "loss": 0.1828, "loss_nan_ranks": 0, "loss_rank_avg": 0.17560520768165588, "step": 2480, "valid_targets_mean": 5799.6, "valid_targets_min": 1214 }, { "epoch": 3.805513016845329, "grad_norm": 0.4767292234124444, "learning_rate": 2.046588820295057e-05, "loss": 0.1881, "loss_nan_ranks": 0, "loss_rank_avg": 0.2139269858598709, "step": 2485, "valid_targets_mean": 5065.8, "valid_targets_min": 499 }, { "epoch": 3.8131699846860645, "grad_norm": 0.48305615805465524, "learning_rate": 2.038952369319507e-05, "loss": 0.1901, "loss_nan_ranks": 0, "loss_rank_avg": 0.1714230179786682, "step": 2490, "valid_targets_mean": 5173.9, "valid_targets_min": 1005 }, { "epoch": 3.8208269525267995, "grad_norm": 0.4591287515515576, "learning_rate": 2.031315350203539e-05, "loss": 0.1907, "loss_nan_ranks": 0, "loss_rank_avg": 0.20354583859443665, "step": 2495, "valid_targets_mean": 5899.7, "valid_targets_min": 1542 }, { "epoch": 3.8284839203675345, "grad_norm": 0.405791559738873, "learning_rate": 2.02367787433702e-05, "loss": 0.172, "loss_nan_ranks": 0, "loss_rank_avg": 0.1725158542394638, "step": 2500, "valid_targets_mean": 5390.0, "valid_targets_min": 639 }, { "epoch": 3.8361408882082695, "grad_norm": 0.4497822748514485, "learning_rate": 2.0160400531164787e-05, "loss": 0.1729, "loss_nan_ranks": 0, "loss_rank_avg": 0.15819357335567474, "step": 2505, "valid_targets_mean": 5183.4, "valid_targets_min": 813 }, { "epoch": 3.8437978560490045, "grad_norm": 0.38677614976809455, "learning_rate": 2.008401997943481e-05, "loss": 0.1955, "loss_nan_ranks": 0, "loss_rank_avg": 0.19747616350650787, "step": 2510, "valid_targets_mean": 6532.3, "valid_targets_min": 875 }, { "epoch": 3.85145482388974, "grad_norm": 0.4278038294940775, "learning_rate": 2.0007638202230053e-05, "loss": 0.1814, "loss_nan_ranks": 0, "loss_rank_avg": 0.1896567940711975, "step": 2515, "valid_targets_mean": 5536.9, "valid_targets_min": 838 }, { "epoch": 3.8591117917304745, "grad_norm": 0.5403737252126551, "learning_rate": 1.9931256313618173e-05, "loss": 0.185, "loss_nan_ranks": 0, "loss_rank_avg": 0.19202588498592377, "step": 2520, "valid_targets_mean": 4081.1, "valid_targets_min": 352 }, { "epoch": 3.86676875957121, "grad_norm": 0.44283695481669993, "learning_rate": 1.9854875427668453e-05, "loss": 0.183, "loss_nan_ranks": 0, "loss_rank_avg": 0.1849876344203949, "step": 2525, "valid_targets_mean": 5332.9, "valid_targets_min": 1213 }, { "epoch": 3.874425727411945, "grad_norm": 0.45612268357938296, "learning_rate": 1.9778496658435552e-05, "loss": 0.1864, "loss_nan_ranks": 0, "loss_rank_avg": 0.2018076777458191, "step": 2530, "valid_targets_mean": 4947.2, "valid_targets_min": 713 }, { "epoch": 3.88208269525268, "grad_norm": 0.4511802661455763, "learning_rate": 1.970212111994325e-05, "loss": 0.1776, "loss_nan_ranks": 0, "loss_rank_avg": 0.1800006926059723, "step": 2535, "valid_targets_mean": 5933.2, "valid_targets_min": 1511 }, { "epoch": 3.889739663093415, "grad_norm": 0.4550636487612721, "learning_rate": 1.9625749926168205e-05, "loss": 0.2011, "loss_nan_ranks": 0, "loss_rank_avg": 0.19659721851348877, "step": 2540, "valid_targets_mean": 5744.1, "valid_targets_min": 2064 }, { "epoch": 3.89739663093415, "grad_norm": 0.45143924481673986, "learning_rate": 1.954938419102372e-05, "loss": 0.1906, "loss_nan_ranks": 0, "loss_rank_avg": 0.17691466212272644, "step": 2545, "valid_targets_mean": 4654.2, "valid_targets_min": 892 }, { "epoch": 3.9050535987748853, "grad_norm": 0.4108146672941242, "learning_rate": 1.9473025028343464e-05, "loss": 0.1859, "loss_nan_ranks": 0, "loss_rank_avg": 0.1811871975660324, "step": 2550, "valid_targets_mean": 5904.1, "valid_targets_min": 2536 }, { "epoch": 3.9127105666156203, "grad_norm": 0.39297017745981955, "learning_rate": 1.9396673551865245e-05, "loss": 0.1808, "loss_nan_ranks": 0, "loss_rank_avg": 0.16155928373336792, "step": 2555, "valid_targets_mean": 5933.3, "valid_targets_min": 1125 }, { "epoch": 3.9203675344563553, "grad_norm": 0.4647337901010682, "learning_rate": 1.932033087521478e-05, "loss": 0.1824, "loss_nan_ranks": 0, "loss_rank_avg": 0.20087887346744537, "step": 2560, "valid_targets_mean": 5496.6, "valid_targets_min": 672 }, { "epoch": 3.9280245022970903, "grad_norm": 0.51196014419268, "learning_rate": 1.9243998111889422e-05, "loss": 0.1855, "loss_nan_ranks": 0, "loss_rank_avg": 0.18994739651679993, "step": 2565, "valid_targets_mean": 4321.1, "valid_targets_min": 768 }, { "epoch": 3.9356814701378253, "grad_norm": 0.486482225957426, "learning_rate": 1.916767637524193e-05, "loss": 0.1867, "loss_nan_ranks": 0, "loss_rank_avg": 0.20536579191684723, "step": 2570, "valid_targets_mean": 4581.4, "valid_targets_min": 574 }, { "epoch": 3.9433384379785608, "grad_norm": 0.5397289328340875, "learning_rate": 1.9091366778464236e-05, "loss": 0.1935, "loss_nan_ranks": 0, "loss_rank_avg": 0.1987244337797165, "step": 2575, "valid_targets_mean": 4776.2, "valid_targets_min": 822 }, { "epoch": 3.9509954058192953, "grad_norm": 0.39898386260649726, "learning_rate": 1.9015070434571214e-05, "loss": 0.18, "loss_nan_ranks": 0, "loss_rank_avg": 0.15328550338745117, "step": 2580, "valid_targets_mean": 5600.8, "valid_targets_min": 247 }, { "epoch": 3.9586523736600308, "grad_norm": 0.4317711975925466, "learning_rate": 1.8938788456384435e-05, "loss": 0.1925, "loss_nan_ranks": 0, "loss_rank_avg": 0.19141104817390442, "step": 2585, "valid_targets_mean": 5771.4, "valid_targets_min": 266 }, { "epoch": 3.9663093415007658, "grad_norm": 0.471345314428317, "learning_rate": 1.886252195651593e-05, "loss": 0.1945, "loss_nan_ranks": 0, "loss_rank_avg": 0.18774153292179108, "step": 2590, "valid_targets_mean": 5299.0, "valid_targets_min": 654 }, { "epoch": 3.9739663093415007, "grad_norm": 0.48013416700446687, "learning_rate": 1.8786272047351974e-05, "loss": 0.1983, "loss_nan_ranks": 0, "loss_rank_avg": 0.20652708411216736, "step": 2595, "valid_targets_mean": 5300.6, "valid_targets_min": 1524 }, { "epoch": 3.9816232771822357, "grad_norm": 0.4624682372289305, "learning_rate": 1.8710039841036868e-05, "loss": 0.1848, "loss_nan_ranks": 0, "loss_rank_avg": 0.17302487790584564, "step": 2600, "valid_targets_mean": 4120.8, "valid_targets_min": 390 }, { "epoch": 3.9892802450229707, "grad_norm": 0.4168745532084026, "learning_rate": 1.8633826449456694e-05, "loss": 0.192, "loss_nan_ranks": 0, "loss_rank_avg": 0.17362730205059052, "step": 2605, "valid_targets_mean": 5236.6, "valid_targets_min": 625 }, { "epoch": 3.996937212863706, "grad_norm": 0.4932527691180615, "learning_rate": 1.8557632984223124e-05, "loss": 0.1946, "loss_nan_ranks": 0, "loss_rank_avg": 0.1852743923664093, "step": 2610, "valid_targets_mean": 5870.2, "valid_targets_min": 3261 }, { "epoch": 4.004594180704441, "grad_norm": 0.4117858119372678, "learning_rate": 1.848146055665718e-05, "loss": 0.1845, "loss_nan_ranks": 0, "loss_rank_avg": 0.16399316489696503, "step": 2615, "valid_targets_mean": 5134.5, "valid_targets_min": 742 }, { "epoch": 4.012251148545176, "grad_norm": 0.4808770384706559, "learning_rate": 1.840531027777306e-05, "loss": 0.1696, "loss_nan_ranks": 0, "loss_rank_avg": 0.1545652449131012, "step": 2620, "valid_targets_mean": 5073.8, "valid_targets_min": 291 }, { "epoch": 4.019908116385912, "grad_norm": 0.4716619083630413, "learning_rate": 1.832918325826188e-05, "loss": 0.1668, "loss_nan_ranks": 0, "loss_rank_avg": 0.1703418791294098, "step": 2625, "valid_targets_mean": 4764.6, "valid_targets_min": 274 }, { "epoch": 4.027565084226646, "grad_norm": 0.4838374411041368, "learning_rate": 1.825308060847554e-05, "loss": 0.1755, "loss_nan_ranks": 0, "loss_rank_avg": 0.17043305933475494, "step": 2630, "valid_targets_mean": 4994.8, "valid_targets_min": 626 }, { "epoch": 4.035222052067382, "grad_norm": 0.4840997051081212, "learning_rate": 1.8177003438410468e-05, "loss": 0.1712, "loss_nan_ranks": 0, "loss_rank_avg": 0.16094501316547394, "step": 2635, "valid_targets_mean": 5405.5, "valid_targets_min": 429 }, { "epoch": 4.042879019908116, "grad_norm": 0.4485354827030893, "learning_rate": 1.8100952857691478e-05, "loss": 0.1778, "loss_nan_ranks": 0, "loss_rank_avg": 0.16980960965156555, "step": 2640, "valid_targets_mean": 5238.2, "valid_targets_min": 2252 }, { "epoch": 4.050535987748852, "grad_norm": 0.5691308127289896, "learning_rate": 1.802492997555554e-05, "loss": 0.1872, "loss_nan_ranks": 0, "loss_rank_avg": 0.18940171599388123, "step": 2645, "valid_targets_mean": 3804.6, "valid_targets_min": 529 }, { "epoch": 4.058192955589586, "grad_norm": 0.5431514385919676, "learning_rate": 1.7948935900835666e-05, "loss": 0.1798, "loss_nan_ranks": 0, "loss_rank_avg": 0.17891111969947815, "step": 2650, "valid_targets_mean": 4574.4, "valid_targets_min": 727 }, { "epoch": 4.065849923430322, "grad_norm": 0.5041080458794216, "learning_rate": 1.7872971741944657e-05, "loss": 0.1807, "loss_nan_ranks": 0, "loss_rank_avg": 0.20006835460662842, "step": 2655, "valid_targets_mean": 4423.0, "valid_targets_min": 587 }, { "epoch": 4.073506891271057, "grad_norm": 0.48183764813968805, "learning_rate": 1.779703860685899e-05, "loss": 0.1838, "loss_nan_ranks": 0, "loss_rank_avg": 0.16695404052734375, "step": 2660, "valid_targets_mean": 4707.2, "valid_targets_min": 593 }, { "epoch": 4.081163859111792, "grad_norm": 0.44635472401034965, "learning_rate": 1.772113760310265e-05, "loss": 0.1759, "loss_nan_ranks": 0, "loss_rank_avg": 0.16373205184936523, "step": 2665, "valid_targets_mean": 5316.4, "valid_targets_min": 2045 }, { "epoch": 4.088820826952527, "grad_norm": 0.5341676996658703, "learning_rate": 1.7645269837730964e-05, "loss": 0.1661, "loss_nan_ranks": 0, "loss_rank_avg": 0.18219105899333954, "step": 2670, "valid_targets_mean": 4616.1, "valid_targets_min": 801 }, { "epoch": 4.096477794793262, "grad_norm": 0.5082489734934296, "learning_rate": 1.7569436417314454e-05, "loss": 0.1654, "loss_nan_ranks": 0, "loss_rank_avg": 0.15915320813655853, "step": 2675, "valid_targets_mean": 5307.9, "valid_targets_min": 1855 }, { "epoch": 4.104134762633997, "grad_norm": 0.48315077118735306, "learning_rate": 1.7493638447922724e-05, "loss": 0.1763, "loss_nan_ranks": 0, "loss_rank_avg": 0.17643246054649353, "step": 2680, "valid_targets_mean": 4735.8, "valid_targets_min": 603 }, { "epoch": 4.111791730474732, "grad_norm": 0.4158258538790409, "learning_rate": 1.741787703510828e-05, "loss": 0.1648, "loss_nan_ranks": 0, "loss_rank_avg": 0.14290867745876312, "step": 2685, "valid_targets_mean": 5752.9, "valid_targets_min": 801 }, { "epoch": 4.119448698315467, "grad_norm": 0.4464039644440533, "learning_rate": 1.7342153283890454e-05, "loss": 0.1889, "loss_nan_ranks": 0, "loss_rank_avg": 0.16524581611156464, "step": 2690, "valid_targets_mean": 4866.8, "valid_targets_min": 273 }, { "epoch": 4.1271056661562024, "grad_norm": 0.4276684308904948, "learning_rate": 1.7266468298739248e-05, "loss": 0.1706, "loss_nan_ranks": 0, "loss_rank_avg": 0.17335769534111023, "step": 2695, "valid_targets_mean": 5832.6, "valid_targets_min": 972 }, { "epoch": 4.134762633996937, "grad_norm": 0.4728772362847781, "learning_rate": 1.719082318355924e-05, "loss": 0.1559, "loss_nan_ranks": 0, "loss_rank_avg": 0.1612071692943573, "step": 2700, "valid_targets_mean": 5342.1, "valid_targets_min": 2692 }, { "epoch": 4.142419601837672, "grad_norm": 0.4765083268369304, "learning_rate": 1.7115219041673513e-05, "loss": 0.1869, "loss_nan_ranks": 0, "loss_rank_avg": 0.16713187098503113, "step": 2705, "valid_targets_mean": 4761.3, "valid_targets_min": 669 }, { "epoch": 4.150076569678407, "grad_norm": 0.4842020502823108, "learning_rate": 1.703965697580749e-05, "loss": 0.1722, "loss_nan_ranks": 0, "loss_rank_avg": 0.1749369502067566, "step": 2710, "valid_targets_mean": 4355.8, "valid_targets_min": 638 }, { "epoch": 4.157733537519142, "grad_norm": 0.49332601951947624, "learning_rate": 1.6964138088072927e-05, "loss": 0.1844, "loss_nan_ranks": 0, "loss_rank_avg": 0.20040933787822723, "step": 2715, "valid_targets_mean": 4893.5, "valid_targets_min": 767 }, { "epoch": 4.165390505359878, "grad_norm": 0.4114065993741536, "learning_rate": 1.6888663479951787e-05, "loss": 0.1836, "loss_nan_ranks": 0, "loss_rank_avg": 0.15738333761692047, "step": 2720, "valid_targets_mean": 5901.4, "valid_targets_min": 615 }, { "epoch": 4.173047473200612, "grad_norm": 0.49020449855560566, "learning_rate": 1.6813234252280198e-05, "loss": 0.1675, "loss_nan_ranks": 0, "loss_rank_avg": 0.17966817319393158, "step": 2725, "valid_targets_mean": 4505.4, "valid_targets_min": 393 }, { "epoch": 4.180704441041348, "grad_norm": 0.467609857800558, "learning_rate": 1.673785150523239e-05, "loss": 0.1642, "loss_nan_ranks": 0, "loss_rank_avg": 0.1697966456413269, "step": 2730, "valid_targets_mean": 4822.9, "valid_targets_min": 624 }, { "epoch": 4.188361408882082, "grad_norm": 0.405164834964215, "learning_rate": 1.6662516338304653e-05, "loss": 0.1745, "loss_nan_ranks": 0, "loss_rank_avg": 0.15354806184768677, "step": 2735, "valid_targets_mean": 5354.1, "valid_targets_min": 649 }, { "epoch": 4.196018376722818, "grad_norm": 0.4338536588919433, "learning_rate": 1.658722985029928e-05, "loss": 0.1864, "loss_nan_ranks": 0, "loss_rank_avg": 0.17717352509498596, "step": 2740, "valid_targets_mean": 5779.4, "valid_targets_min": 2130 }, { "epoch": 4.203675344563552, "grad_norm": 0.5850087613394777, "learning_rate": 1.6511993139308593e-05, "loss": 0.1675, "loss_nan_ranks": 0, "loss_rank_avg": 0.15216293931007385, "step": 2745, "valid_targets_mean": 4756.1, "valid_targets_min": 737 }, { "epoch": 4.211332312404288, "grad_norm": 0.4176714174791368, "learning_rate": 1.6436807302698853e-05, "loss": 0.1523, "loss_nan_ranks": 0, "loss_rank_avg": 0.15484420955181122, "step": 2750, "valid_targets_mean": 5400.6, "valid_targets_min": 692 }, { "epoch": 4.218989280245023, "grad_norm": 0.5045586445327894, "learning_rate": 1.6361673437094306e-05, "loss": 0.1671, "loss_nan_ranks": 0, "loss_rank_avg": 0.18908411264419556, "step": 2755, "valid_targets_mean": 4536.8, "valid_targets_min": 559 }, { "epoch": 4.226646248085758, "grad_norm": 0.47376908314362176, "learning_rate": 1.6286592638361176e-05, "loss": 0.1526, "loss_nan_ranks": 0, "loss_rank_avg": 0.16104529798030853, "step": 2760, "valid_targets_mean": 5460.4, "valid_targets_min": 912 }, { "epoch": 4.234303215926493, "grad_norm": 0.4804874523270708, "learning_rate": 1.6211566001591673e-05, "loss": 0.1719, "loss_nan_ranks": 0, "loss_rank_avg": 0.16267931461334229, "step": 2765, "valid_targets_mean": 4827.1, "valid_targets_min": 720 }, { "epoch": 4.241960183767228, "grad_norm": 0.5114521946324453, "learning_rate": 1.6136594621088038e-05, "loss": 0.1882, "loss_nan_ranks": 0, "loss_rank_avg": 0.19819220900535583, "step": 2770, "valid_targets_mean": 4684.1, "valid_targets_min": 567 }, { "epoch": 4.249617151607963, "grad_norm": 0.5128617395395278, "learning_rate": 1.606167959034656e-05, "loss": 0.156, "loss_nan_ranks": 0, "loss_rank_avg": 0.1607045829296112, "step": 2775, "valid_targets_mean": 4665.6, "valid_targets_min": 625 }, { "epoch": 4.257274119448699, "grad_norm": 0.5017550199119629, "learning_rate": 1.5986822002041645e-05, "loss": 0.1663, "loss_nan_ranks": 0, "loss_rank_avg": 0.167169451713562, "step": 2780, "valid_targets_mean": 4271.9, "valid_targets_min": 792 }, { "epoch": 4.264931087289433, "grad_norm": 0.44395083608432084, "learning_rate": 1.5912022948009862e-05, "loss": 0.1695, "loss_nan_ranks": 0, "loss_rank_avg": 0.15831434726715088, "step": 2785, "valid_targets_mean": 5820.2, "valid_targets_min": 2996 }, { "epoch": 4.272588055130169, "grad_norm": 0.4722239671745089, "learning_rate": 1.5837283519234038e-05, "loss": 0.172, "loss_nan_ranks": 0, "loss_rank_avg": 0.1687237173318863, "step": 2790, "valid_targets_mean": 5822.8, "valid_targets_min": 842 }, { "epoch": 4.280245022970903, "grad_norm": 0.45638928620066843, "learning_rate": 1.5762604805827323e-05, "loss": 0.1746, "loss_nan_ranks": 0, "loss_rank_avg": 0.1702617108821869, "step": 2795, "valid_targets_mean": 5522.4, "valid_targets_min": 625 }, { "epoch": 4.287901990811639, "grad_norm": 0.4756632270967452, "learning_rate": 1.5687987897017324e-05, "loss": 0.1732, "loss_nan_ranks": 0, "loss_rank_avg": 0.21105210483074188, "step": 2800, "valid_targets_mean": 5453.9, "valid_targets_min": 553 }, { "epoch": 4.295558958652373, "grad_norm": 0.4018470816825365, "learning_rate": 1.561343388113017e-05, "loss": 0.1633, "loss_nan_ranks": 0, "loss_rank_avg": 0.1360223889350891, "step": 2805, "valid_targets_mean": 6373.5, "valid_targets_min": 2733 }, { "epoch": 4.303215926493109, "grad_norm": 0.4931211767025457, "learning_rate": 1.5538943845574674e-05, "loss": 0.1698, "loss_nan_ranks": 0, "loss_rank_avg": 0.15920180082321167, "step": 2810, "valid_targets_mean": 6204.0, "valid_targets_min": 2948 }, { "epoch": 4.310872894333844, "grad_norm": 0.5467551374335786, "learning_rate": 1.5464518876826474e-05, "loss": 0.1841, "loss_nan_ranks": 0, "loss_rank_avg": 0.2006562054157257, "step": 2815, "valid_targets_mean": 4931.8, "valid_targets_min": 2745 }, { "epoch": 4.318529862174579, "grad_norm": 0.42757772305840064, "learning_rate": 1.5390160060412153e-05, "loss": 0.1633, "loss_nan_ranks": 0, "loss_rank_avg": 0.15964971482753754, "step": 2820, "valid_targets_mean": 6229.6, "valid_targets_min": 667 }, { "epoch": 4.326186830015314, "grad_norm": 0.4781249802666833, "learning_rate": 1.531586848089345e-05, "loss": 0.1753, "loss_nan_ranks": 0, "loss_rank_avg": 0.1797013282775879, "step": 2825, "valid_targets_mean": 5788.6, "valid_targets_min": 2048 }, { "epoch": 4.333843797856049, "grad_norm": 0.4881439374190577, "learning_rate": 1.5241645221851405e-05, "loss": 0.1806, "loss_nan_ranks": 0, "loss_rank_avg": 0.18294446170330048, "step": 2830, "valid_targets_mean": 5210.4, "valid_targets_min": 672 }, { "epoch": 4.341500765696784, "grad_norm": 0.40894754528830446, "learning_rate": 1.5167491365870573e-05, "loss": 0.1632, "loss_nan_ranks": 0, "loss_rank_avg": 0.14472708106040955, "step": 2835, "valid_targets_mean": 5870.3, "valid_targets_min": 3287 }, { "epoch": 4.3491577335375196, "grad_norm": 0.49768141849572484, "learning_rate": 1.5093407994523234e-05, "loss": 0.1647, "loss_nan_ranks": 0, "loss_rank_avg": 0.178148090839386, "step": 2840, "valid_targets_mean": 5438.2, "valid_targets_min": 1641 }, { "epoch": 4.356814701378254, "grad_norm": 0.428585898075749, "learning_rate": 1.501939618835361e-05, "loss": 0.1833, "loss_nan_ranks": 0, "loss_rank_avg": 0.15074047446250916, "step": 2845, "valid_targets_mean": 4899.4, "valid_targets_min": 557 }, { "epoch": 4.3644716692189895, "grad_norm": 0.5203366302958021, "learning_rate": 1.4945457026862102e-05, "loss": 0.1756, "loss_nan_ranks": 0, "loss_rank_avg": 0.18068398535251617, "step": 2850, "valid_targets_mean": 5078.4, "valid_targets_min": 591 }, { "epoch": 4.372128637059724, "grad_norm": 0.42841342187225284, "learning_rate": 1.4871591588489558e-05, "loss": 0.1764, "loss_nan_ranks": 0, "loss_rank_avg": 0.15299955010414124, "step": 2855, "valid_targets_mean": 5253.9, "valid_targets_min": 393 }, { "epoch": 4.3797856049004595, "grad_norm": 0.4510836298560107, "learning_rate": 1.4797800950601527e-05, "loss": 0.1753, "loss_nan_ranks": 0, "loss_rank_avg": 0.195342555642128, "step": 2860, "valid_targets_mean": 6093.7, "valid_targets_min": 611 }, { "epoch": 4.387442572741194, "grad_norm": 0.5035923423896532, "learning_rate": 1.4724086189472573e-05, "loss": 0.1698, "loss_nan_ranks": 0, "loss_rank_avg": 0.18418394029140472, "step": 2865, "valid_targets_mean": 5024.9, "valid_targets_min": 824 }, { "epoch": 4.3950995405819295, "grad_norm": 0.511919119688101, "learning_rate": 1.4650448380270542e-05, "loss": 0.182, "loss_nan_ranks": 0, "loss_rank_avg": 0.18659475445747375, "step": 2870, "valid_targets_mean": 4247.2, "valid_targets_min": 654 }, { "epoch": 4.402756508422665, "grad_norm": 0.49765259928346983, "learning_rate": 1.4576888597040897e-05, "loss": 0.1823, "loss_nan_ranks": 0, "loss_rank_avg": 0.1821971833705902, "step": 2875, "valid_targets_mean": 4381.1, "valid_targets_min": 379 }, { "epoch": 4.4104134762633995, "grad_norm": 0.4844340089149697, "learning_rate": 1.450340791269106e-05, "loss": 0.1648, "loss_nan_ranks": 0, "loss_rank_avg": 0.16185416281223297, "step": 2880, "valid_targets_mean": 4287.1, "valid_targets_min": 258 }, { "epoch": 4.418070444104135, "grad_norm": 0.4422597910254744, "learning_rate": 1.4430007398974751e-05, "loss": 0.1772, "loss_nan_ranks": 0, "loss_rank_avg": 0.15629816055297852, "step": 2885, "valid_targets_mean": 5202.2, "valid_targets_min": 571 }, { "epoch": 4.4257274119448695, "grad_norm": 0.448577660568666, "learning_rate": 1.4356688126476352e-05, "loss": 0.1667, "loss_nan_ranks": 0, "loss_rank_avg": 0.15885485708713531, "step": 2890, "valid_targets_mean": 4905.8, "valid_targets_min": 255 }, { "epoch": 4.433384379785605, "grad_norm": 0.5127193213614976, "learning_rate": 1.428345116459532e-05, "loss": 0.1787, "loss_nan_ranks": 0, "loss_rank_avg": 0.1999489665031433, "step": 2895, "valid_targets_mean": 5543.8, "valid_targets_min": 942 }, { "epoch": 4.44104134762634, "grad_norm": 0.3696874292839933, "learning_rate": 1.421029758153055e-05, "loss": 0.1613, "loss_nan_ranks": 0, "loss_rank_avg": 0.13624325394630432, "step": 2900, "valid_targets_mean": 6215.7, "valid_targets_min": 2870 }, { "epoch": 4.448698315467075, "grad_norm": 0.47165957515150697, "learning_rate": 1.413722844426482e-05, "loss": 0.1755, "loss_nan_ranks": 0, "loss_rank_avg": 0.17101368308067322, "step": 2905, "valid_targets_mean": 5829.2, "valid_targets_min": 3825 }, { "epoch": 4.45635528330781, "grad_norm": 0.529309619643836, "learning_rate": 1.4064244818549227e-05, "loss": 0.1673, "loss_nan_ranks": 0, "loss_rank_avg": 0.20200702548027039, "step": 2910, "valid_targets_mean": 5083.9, "valid_targets_min": 1085 }, { "epoch": 4.464012251148545, "grad_norm": 0.4583986271288342, "learning_rate": 1.3991347768887629e-05, "loss": 0.1673, "loss_nan_ranks": 0, "loss_rank_avg": 0.15790319442749023, "step": 2915, "valid_targets_mean": 5490.7, "valid_targets_min": 2776 }, { "epoch": 4.47166921898928, "grad_norm": 0.4672454081699034, "learning_rate": 1.3918538358521136e-05, "loss": 0.1696, "loss_nan_ranks": 0, "loss_rank_avg": 0.1702156662940979, "step": 2920, "valid_targets_mean": 6327.2, "valid_targets_min": 3255 }, { "epoch": 4.479326186830015, "grad_norm": 0.5413334749004304, "learning_rate": 1.384581764941259e-05, "loss": 0.1813, "loss_nan_ranks": 0, "loss_rank_avg": 0.18624061346054077, "step": 2925, "valid_targets_mean": 3659.4, "valid_targets_min": 276 }, { "epoch": 4.48698315467075, "grad_norm": 0.4203208806439039, "learning_rate": 1.3773186702231076e-05, "loss": 0.1713, "loss_nan_ranks": 0, "loss_rank_avg": 0.18235370516777039, "step": 2930, "valid_targets_mean": 6541.8, "valid_targets_min": 2382 }, { "epoch": 4.494640122511486, "grad_norm": 0.49042923690230983, "learning_rate": 1.3700646576336469e-05, "loss": 0.1598, "loss_nan_ranks": 0, "loss_rank_avg": 0.16061678528785706, "step": 2935, "valid_targets_mean": 4792.9, "valid_targets_min": 733 }, { "epoch": 4.50229709035222, "grad_norm": 0.4834191846877714, "learning_rate": 1.362819832976395e-05, "loss": 0.1752, "loss_nan_ranks": 0, "loss_rank_avg": 0.187465101480484, "step": 2940, "valid_targets_mean": 4979.9, "valid_targets_min": 553 }, { "epoch": 4.509954058192956, "grad_norm": 0.5358280569932836, "learning_rate": 1.3555843019208604e-05, "loss": 0.1775, "loss_nan_ranks": 0, "loss_rank_avg": 0.16426986455917358, "step": 2945, "valid_targets_mean": 5311.7, "valid_targets_min": 745 }, { "epoch": 4.51761102603369, "grad_norm": 0.5228285623940019, "learning_rate": 1.3483581700009988e-05, "loss": 0.1704, "loss_nan_ranks": 0, "loss_rank_avg": 0.2028902769088745, "step": 2950, "valid_targets_mean": 4474.3, "valid_targets_min": 600 }, { "epoch": 4.525267993874426, "grad_norm": 0.4362550606192867, "learning_rate": 1.3411415426136754e-05, "loss": 0.1662, "loss_nan_ranks": 0, "loss_rank_avg": 0.18145951628684998, "step": 2955, "valid_targets_mean": 5741.4, "valid_targets_min": 3720 }, { "epoch": 4.53292496171516, "grad_norm": 0.5334592365964695, "learning_rate": 1.333934525017127e-05, "loss": 0.1779, "loss_nan_ranks": 0, "loss_rank_avg": 0.19370566308498383, "step": 2960, "valid_targets_mean": 4627.0, "valid_targets_min": 687 }, { "epoch": 4.540581929555896, "grad_norm": 0.5166440369660882, "learning_rate": 1.3267372223294258e-05, "loss": 0.18, "loss_nan_ranks": 0, "loss_rank_avg": 0.1994536966085434, "step": 2965, "valid_targets_mean": 4718.9, "valid_targets_min": 600 }, { "epoch": 4.548238897396631, "grad_norm": 0.5598640848233768, "learning_rate": 1.319549739526948e-05, "loss": 0.1672, "loss_nan_ranks": 0, "loss_rank_avg": 0.22695991396903992, "step": 2970, "valid_targets_mean": 4743.5, "valid_targets_min": 439 }, { "epoch": 4.555895865237366, "grad_norm": 0.4771347776369329, "learning_rate": 1.3123721814428408e-05, "loss": 0.1759, "loss_nan_ranks": 0, "loss_rank_avg": 0.18281838297843933, "step": 2975, "valid_targets_mean": 4889.7, "valid_targets_min": 918 }, { "epoch": 4.563552833078101, "grad_norm": 0.42341232828878017, "learning_rate": 1.3052046527654948e-05, "loss": 0.1783, "loss_nan_ranks": 0, "loss_rank_avg": 0.16951890289783478, "step": 2980, "valid_targets_mean": 5872.5, "valid_targets_min": 357 }, { "epoch": 4.571209800918836, "grad_norm": 0.4384091653374271, "learning_rate": 1.2980472580370162e-05, "loss": 0.1669, "loss_nan_ranks": 0, "loss_rank_avg": 0.16993127763271332, "step": 2985, "valid_targets_mean": 5593.4, "valid_targets_min": 990 }, { "epoch": 4.578866768759571, "grad_norm": 0.4736958546897791, "learning_rate": 1.2909001016517031e-05, "loss": 0.1655, "loss_nan_ranks": 0, "loss_rank_avg": 0.15475991368293762, "step": 2990, "valid_targets_mean": 5100.8, "valid_targets_min": 812 }, { "epoch": 4.586523736600307, "grad_norm": 0.4500490682468214, "learning_rate": 1.2837632878545212e-05, "loss": 0.1607, "loss_nan_ranks": 0, "loss_rank_avg": 0.17424660921096802, "step": 2995, "valid_targets_mean": 5034.8, "valid_targets_min": 2439 }, { "epoch": 4.594180704441041, "grad_norm": 0.4982990021173331, "learning_rate": 1.2766369207395845e-05, "loss": 0.1796, "loss_nan_ranks": 0, "loss_rank_avg": 0.15128692984580994, "step": 3000, "valid_targets_mean": 4580.6, "valid_targets_min": 655 }, { "epoch": 4.601837672281777, "grad_norm": 0.5411255865457929, "learning_rate": 1.269521104248637e-05, "loss": 0.1759, "loss_nan_ranks": 0, "loss_rank_avg": 0.19686409831047058, "step": 3005, "valid_targets_mean": 3894.5, "valid_targets_min": 412 }, { "epoch": 4.609494640122511, "grad_norm": 0.46544029566434875, "learning_rate": 1.2624159421695354e-05, "loss": 0.1704, "loss_nan_ranks": 0, "loss_rank_avg": 0.17594610154628754, "step": 3010, "valid_targets_mean": 5448.4, "valid_targets_min": 2259 }, { "epoch": 4.617151607963247, "grad_norm": 0.5041573873911557, "learning_rate": 1.2553215381347377e-05, "loss": 0.1788, "loss_nan_ranks": 0, "loss_rank_avg": 0.17713363468647003, "step": 3015, "valid_targets_mean": 3941.9, "valid_targets_min": 294 }, { "epoch": 4.624808575803982, "grad_norm": 0.4460422876457042, "learning_rate": 1.2482379956197898e-05, "loss": 0.1617, "loss_nan_ranks": 0, "loss_rank_avg": 0.1611134260892868, "step": 3020, "valid_targets_mean": 5502.9, "valid_targets_min": 649 }, { "epoch": 4.632465543644717, "grad_norm": 0.5123541360019072, "learning_rate": 1.2411654179418162e-05, "loss": 0.1817, "loss_nan_ranks": 0, "loss_rank_avg": 0.15525534749031067, "step": 3025, "valid_targets_mean": 4013.7, "valid_targets_min": 666 }, { "epoch": 4.640122511485452, "grad_norm": 0.5056279153295342, "learning_rate": 1.2341039082580143e-05, "loss": 0.1839, "loss_nan_ranks": 0, "loss_rank_avg": 0.20131169259548187, "step": 3030, "valid_targets_mean": 4715.8, "valid_targets_min": 453 }, { "epoch": 4.647779479326187, "grad_norm": 0.4963953600906092, "learning_rate": 1.2270535695641488e-05, "loss": 0.1702, "loss_nan_ranks": 0, "loss_rank_avg": 0.1591898500919342, "step": 3035, "valid_targets_mean": 4588.5, "valid_targets_min": 875 }, { "epoch": 4.655436447166922, "grad_norm": 0.4787452476331541, "learning_rate": 1.2200145046930494e-05, "loss": 0.1863, "loss_nan_ranks": 0, "loss_rank_avg": 0.18031710386276245, "step": 3040, "valid_targets_mean": 4756.6, "valid_targets_min": 619 }, { "epoch": 4.663093415007657, "grad_norm": 0.4353032563440157, "learning_rate": 1.2129868163131115e-05, "loss": 0.1612, "loss_nan_ranks": 0, "loss_rank_avg": 0.15741820633411407, "step": 3045, "valid_targets_mean": 5642.2, "valid_targets_min": 781 }, { "epoch": 4.670750382848392, "grad_norm": 0.4956709263367504, "learning_rate": 1.2059706069267985e-05, "loss": 0.1987, "loss_nan_ranks": 0, "loss_rank_avg": 0.20289403200149536, "step": 3050, "valid_targets_mean": 4478.3, "valid_targets_min": 654 }, { "epoch": 4.6784073506891275, "grad_norm": 0.4374701574959408, "learning_rate": 1.1989659788691472e-05, "loss": 0.1723, "loss_nan_ranks": 0, "loss_rank_avg": 0.15316550433635712, "step": 3055, "valid_targets_mean": 5378.1, "valid_targets_min": 326 }, { "epoch": 4.686064318529862, "grad_norm": 0.4312228148138217, "learning_rate": 1.1919730343062742e-05, "loss": 0.182, "loss_nan_ranks": 0, "loss_rank_avg": 0.1685815006494522, "step": 3060, "valid_targets_mean": 5913.8, "valid_targets_min": 2858 }, { "epoch": 4.6937212863705975, "grad_norm": 0.6788655954584126, "learning_rate": 1.1849918752338864e-05, "loss": 0.1591, "loss_nan_ranks": 0, "loss_rank_avg": 0.1469895839691162, "step": 3065, "valid_targets_mean": 5040.0, "valid_targets_min": 876 }, { "epoch": 4.701378254211332, "grad_norm": 0.5027169074416509, "learning_rate": 1.1780226034757938e-05, "loss": 0.1785, "loss_nan_ranks": 0, "loss_rank_avg": 0.15269100666046143, "step": 3070, "valid_targets_mean": 3950.4, "valid_targets_min": 714 }, { "epoch": 4.7090352220520675, "grad_norm": 0.45849599624176834, "learning_rate": 1.1710653206824225e-05, "loss": 0.1806, "loss_nan_ranks": 0, "loss_rank_avg": 0.1836073398590088, "step": 3075, "valid_targets_mean": 5161.0, "valid_targets_min": 617 }, { "epoch": 4.716692189892802, "grad_norm": 0.463224080205975, "learning_rate": 1.164120128329334e-05, "loss": 0.1693, "loss_nan_ranks": 0, "loss_rank_avg": 0.1551927775144577, "step": 3080, "valid_targets_mean": 4956.4, "valid_targets_min": 421 }, { "epoch": 4.7243491577335375, "grad_norm": 0.6749074626071137, "learning_rate": 1.1571871277157458e-05, "loss": 0.1748, "loss_nan_ranks": 0, "loss_rank_avg": 0.1819312572479248, "step": 3085, "valid_targets_mean": 3737.6, "valid_targets_min": 721 }, { "epoch": 4.732006125574273, "grad_norm": 0.4507533807504539, "learning_rate": 1.15026641996305e-05, "loss": 0.161, "loss_nan_ranks": 0, "loss_rank_avg": 0.1480093002319336, "step": 3090, "valid_targets_mean": 5161.5, "valid_targets_min": 270 }, { "epoch": 4.7396630934150075, "grad_norm": 0.5183685281293393, "learning_rate": 1.1433581060133432e-05, "loss": 0.178, "loss_nan_ranks": 0, "loss_rank_avg": 0.1799740195274353, "step": 3095, "valid_targets_mean": 5317.7, "valid_targets_min": 801 }, { "epoch": 4.747320061255743, "grad_norm": 0.5028716072176976, "learning_rate": 1.136462286627952e-05, "loss": 0.1671, "loss_nan_ranks": 0, "loss_rank_avg": 0.17748679220676422, "step": 3100, "valid_targets_mean": 4244.8, "valid_targets_min": 726 }, { "epoch": 4.7549770290964775, "grad_norm": 0.7306366733577314, "learning_rate": 1.1295790623859605e-05, "loss": 0.175, "loss_nan_ranks": 0, "loss_rank_avg": 0.16387039422988892, "step": 3105, "valid_targets_mean": 6011.9, "valid_targets_min": 1828 }, { "epoch": 4.762633996937213, "grad_norm": 0.4663498360213423, "learning_rate": 1.1227085336827492e-05, "loss": 0.1662, "loss_nan_ranks": 0, "loss_rank_avg": 0.18103697896003723, "step": 3110, "valid_targets_mean": 5026.4, "valid_targets_min": 410 }, { "epoch": 4.7702909647779475, "grad_norm": 0.483563480045064, "learning_rate": 1.1158508007285266e-05, "loss": 0.17, "loss_nan_ranks": 0, "loss_rank_avg": 0.16695986688137054, "step": 3115, "valid_targets_mean": 5319.2, "valid_targets_min": 707 }, { "epoch": 4.777947932618683, "grad_norm": 0.4827606579725246, "learning_rate": 1.1090059635468693e-05, "loss": 0.1762, "loss_nan_ranks": 0, "loss_rank_avg": 0.167944997549057, "step": 3120, "valid_targets_mean": 4909.1, "valid_targets_min": 667 }, { "epoch": 4.785604900459418, "grad_norm": 0.43356790112848625, "learning_rate": 1.1021741219732602e-05, "loss": 0.1575, "loss_nan_ranks": 0, "loss_rank_avg": 0.1488049477338791, "step": 3125, "valid_targets_mean": 4725.1, "valid_targets_min": 1542 }, { "epoch": 4.793261868300153, "grad_norm": 0.4798237312494164, "learning_rate": 1.0953553756536363e-05, "loss": 0.1785, "loss_nan_ranks": 0, "loss_rank_avg": 0.202002614736557, "step": 3130, "valid_targets_mean": 5125.2, "valid_targets_min": 588 }, { "epoch": 4.800918836140888, "grad_norm": 0.4223262568134376, "learning_rate": 1.0885498240429344e-05, "loss": 0.1835, "loss_nan_ranks": 0, "loss_rank_avg": 0.16876980662345886, "step": 3135, "valid_targets_mean": 5708.7, "valid_targets_min": 1016 }, { "epoch": 4.808575803981624, "grad_norm": 0.4239980387727623, "learning_rate": 1.0817575664036371e-05, "loss": 0.1688, "loss_nan_ranks": 0, "loss_rank_avg": 0.1675986349582672, "step": 3140, "valid_targets_mean": 4858.1, "valid_targets_min": 2378 }, { "epoch": 4.816232771822358, "grad_norm": 0.4847147778344571, "learning_rate": 1.07497870180433e-05, "loss": 0.1829, "loss_nan_ranks": 0, "loss_rank_avg": 0.16506324708461761, "step": 3145, "valid_targets_mean": 5388.0, "valid_targets_min": 2902 }, { "epoch": 4.823889739663094, "grad_norm": 0.5548302078937414, "learning_rate": 1.0682133291182522e-05, "loss": 0.1713, "loss_nan_ranks": 0, "loss_rank_avg": 0.14651057124137878, "step": 3150, "valid_targets_mean": 5324.9, "valid_targets_min": 671 }, { "epoch": 4.831546707503828, "grad_norm": 0.5265431034812131, "learning_rate": 1.0614615470218585e-05, "loss": 0.1808, "loss_nan_ranks": 0, "loss_rank_avg": 0.19283831119537354, "step": 3155, "valid_targets_mean": 4184.3, "valid_targets_min": 777 }, { "epoch": 4.839203675344564, "grad_norm": 0.4752269724565345, "learning_rate": 1.0547234539933755e-05, "loss": 0.1766, "loss_nan_ranks": 0, "loss_rank_avg": 0.17586413025856018, "step": 3160, "valid_targets_mean": 4714.7, "valid_targets_min": 949 }, { "epoch": 4.846860643185298, "grad_norm": 1.169559990539335, "learning_rate": 1.0479991483113697e-05, "loss": 0.1805, "loss_nan_ranks": 0, "loss_rank_avg": 0.17083494365215302, "step": 3165, "valid_targets_mean": 4708.2, "valid_targets_min": 812 }, { "epoch": 4.854517611026034, "grad_norm": 0.4368959854231952, "learning_rate": 1.0412887280533117e-05, "loss": 0.1786, "loss_nan_ranks": 0, "loss_rank_avg": 0.1704709231853485, "step": 3170, "valid_targets_mean": 5273.7, "valid_targets_min": 1007 }, { "epoch": 4.862174578866769, "grad_norm": 0.4944289144103065, "learning_rate": 1.0345922910941448e-05, "loss": 0.1695, "loss_nan_ranks": 0, "loss_rank_avg": 0.14916256070137024, "step": 3175, "valid_targets_mean": 6193.1, "valid_targets_min": 3214 }, { "epoch": 4.869831546707504, "grad_norm": 0.46502943737171365, "learning_rate": 1.0279099351048602e-05, "loss": 0.169, "loss_nan_ranks": 0, "loss_rank_avg": 0.17156018316745758, "step": 3180, "valid_targets_mean": 5356.7, "valid_targets_min": 670 }, { "epoch": 4.877488514548239, "grad_norm": 0.5097200882162136, "learning_rate": 1.0212417575510694e-05, "loss": 0.1712, "loss_nan_ranks": 0, "loss_rank_avg": 0.1614779531955719, "step": 3185, "valid_targets_mean": 5069.6, "valid_targets_min": 591 }, { "epoch": 4.885145482388974, "grad_norm": 0.47471570009753655, "learning_rate": 1.0145878556915849e-05, "loss": 0.1734, "loss_nan_ranks": 0, "loss_rank_avg": 0.1738322228193283, "step": 3190, "valid_targets_mean": 4969.6, "valid_targets_min": 680 }, { "epoch": 4.892802450229709, "grad_norm": 0.4998838240469851, "learning_rate": 1.0079483265770019e-05, "loss": 0.1626, "loss_nan_ranks": 0, "loss_rank_avg": 0.17251190543174744, "step": 3195, "valid_targets_mean": 4337.6, "valid_targets_min": 953 }, { "epoch": 4.900459418070444, "grad_norm": 0.531925874666518, "learning_rate": 1.001323267048278e-05, "loss": 0.1702, "loss_nan_ranks": 0, "loss_rank_avg": 0.1674518585205078, "step": 3200, "valid_targets_mean": 4905.7, "valid_targets_min": 646 }, { "epoch": 4.908116385911179, "grad_norm": 0.5453180840806279, "learning_rate": 9.947127737353306e-06, "loss": 0.1853, "loss_nan_ranks": 0, "loss_rank_avg": 0.17539682984352112, "step": 3205, "valid_targets_mean": 5963.2, "valid_targets_min": 788 }, { "epoch": 4.915773353751915, "grad_norm": 0.4250839312770307, "learning_rate": 9.88116943055615e-06, "loss": 0.1715, "loss_nan_ranks": 0, "loss_rank_avg": 0.16129732131958008, "step": 3210, "valid_targets_mean": 5374.8, "valid_targets_min": 1861 }, { "epoch": 4.923430321592649, "grad_norm": 0.5076367049894257, "learning_rate": 9.81535871212729e-06, "loss": 0.176, "loss_nan_ranks": 0, "loss_rank_avg": 0.18412069976329803, "step": 3215, "valid_targets_mean": 4940.6, "valid_targets_min": 763 }, { "epoch": 4.931087289433385, "grad_norm": 0.46983192162441934, "learning_rate": 9.749696541950013e-06, "loss": 0.1682, "loss_nan_ranks": 0, "loss_rank_avg": 0.18911156058311462, "step": 3220, "valid_targets_mean": 5087.8, "valid_targets_min": 494 }, { "epoch": 4.938744257274119, "grad_norm": 0.43659187427488777, "learning_rate": 9.684183877740985e-06, "loss": 0.1618, "loss_nan_ranks": 0, "loss_rank_avg": 0.17905791103839874, "step": 3225, "valid_targets_mean": 6008.7, "valid_targets_min": 3603 }, { "epoch": 4.946401225114855, "grad_norm": 0.4841288841367283, "learning_rate": 9.61882167503624e-06, "loss": 0.193, "loss_nan_ranks": 0, "loss_rank_avg": 0.20017869770526886, "step": 3230, "valid_targets_mean": 5367.9, "valid_targets_min": 878 }, { "epoch": 4.954058192955589, "grad_norm": 0.512592936573579, "learning_rate": 9.553610887177246e-06, "loss": 0.1716, "loss_nan_ranks": 0, "loss_rank_avg": 0.19410035014152527, "step": 3235, "valid_targets_mean": 4450.0, "valid_targets_min": 544 }, { "epoch": 4.961715160796325, "grad_norm": 0.5188515954114221, "learning_rate": 9.488552465297015e-06, "loss": 0.168, "loss_nan_ranks": 0, "loss_rank_avg": 0.1623811423778534, "step": 3240, "valid_targets_mean": 4658.7, "valid_targets_min": 591 }, { "epoch": 4.96937212863706, "grad_norm": 0.476731013903736, "learning_rate": 9.423647358306218e-06, "loss": 0.1726, "loss_nan_ranks": 0, "loss_rank_avg": 0.1714991182088852, "step": 3245, "valid_targets_mean": 4713.1, "valid_targets_min": 789 }, { "epoch": 4.977029096477795, "grad_norm": 0.5546365002101505, "learning_rate": 9.358896512879358e-06, "loss": 0.17, "loss_nan_ranks": 0, "loss_rank_avg": 0.15670126676559448, "step": 3250, "valid_targets_mean": 5500.0, "valid_targets_min": 2235 }, { "epoch": 4.98468606431853, "grad_norm": 0.4853561972328554, "learning_rate": 9.294300873440936e-06, "loss": 0.1673, "loss_nan_ranks": 0, "loss_rank_avg": 0.17436271905899048, "step": 3255, "valid_targets_mean": 4673.0, "valid_targets_min": 908 }, { "epoch": 4.992343032159265, "grad_norm": 0.5222923370657017, "learning_rate": 9.22986138215171e-06, "loss": 0.1898, "loss_nan_ranks": 0, "loss_rank_avg": 0.2152424305677414, "step": 3260, "valid_targets_mean": 5085.4, "valid_targets_min": 743 }, { "epoch": 5.0, "grad_norm": 0.6441979554730815, "learning_rate": 9.165578978894937e-06, "loss": 0.1734, "loss_nan_ranks": 0, "loss_rank_avg": 0.17200767993927002, "step": 3265, "valid_targets_mean": 3869.9, "valid_targets_min": 351 }, { "epoch": 5.007656967840735, "grad_norm": 0.4220356269014037, "learning_rate": 9.10145460126265e-06, "loss": 0.1668, "loss_nan_ranks": 0, "loss_rank_avg": 0.17021849751472473, "step": 3270, "valid_targets_mean": 5500.6, "valid_targets_min": 667 }, { "epoch": 5.01531393568147, "grad_norm": 0.4289204570010935, "learning_rate": 9.03748918454201e-06, "loss": 0.1649, "loss_nan_ranks": 0, "loss_rank_avg": 0.16679969429969788, "step": 3275, "valid_targets_mean": 6136.5, "valid_targets_min": 3099 }, { "epoch": 5.022970903522205, "grad_norm": 0.4712426003028533, "learning_rate": 8.973683661701637e-06, "loss": 0.1524, "loss_nan_ranks": 0, "loss_rank_avg": 0.1566212773323059, "step": 3280, "valid_targets_mean": 5120.7, "valid_targets_min": 851 }, { "epoch": 5.03062787136294, "grad_norm": 0.4518245512255529, "learning_rate": 8.910038963378032e-06, "loss": 0.1627, "loss_nan_ranks": 0, "loss_rank_avg": 0.14622384309768677, "step": 3285, "valid_targets_mean": 4985.9, "valid_targets_min": 1493 }, { "epoch": 5.038284839203675, "grad_norm": 0.4982253074593932, "learning_rate": 8.846556017861987e-06, "loss": 0.1669, "loss_nan_ranks": 0, "loss_rank_avg": 0.15284357964992523, "step": 3290, "valid_targets_mean": 4108.5, "valid_targets_min": 593 }, { "epoch": 5.04594180704441, "grad_norm": 0.5111382953009579, "learning_rate": 8.783235751085016e-06, "loss": 0.1613, "loss_nan_ranks": 0, "loss_rank_avg": 0.16670887172222137, "step": 3295, "valid_targets_mean": 5229.1, "valid_targets_min": 1762 }, { "epoch": 5.053598774885145, "grad_norm": 0.508139696790504, "learning_rate": 8.72007908660593e-06, "loss": 0.1588, "loss_nan_ranks": 0, "loss_rank_avg": 0.17335477471351624, "step": 3300, "valid_targets_mean": 4433.8, "valid_targets_min": 324 }, { "epoch": 5.061255742725881, "grad_norm": 0.4971355581613195, "learning_rate": 8.657086945597273e-06, "loss": 0.1555, "loss_nan_ranks": 0, "loss_rank_avg": 0.1560318022966385, "step": 3305, "valid_targets_mean": 4618.1, "valid_targets_min": 709 }, { "epoch": 5.068912710566615, "grad_norm": 0.519951349237222, "learning_rate": 8.594260246831954e-06, "loss": 0.1624, "loss_nan_ranks": 0, "loss_rank_avg": 0.17906685173511505, "step": 3310, "valid_targets_mean": 4824.6, "valid_targets_min": 727 }, { "epoch": 5.076569678407351, "grad_norm": 0.48195723569060445, "learning_rate": 8.531599906669802e-06, "loss": 0.1699, "loss_nan_ranks": 0, "loss_rank_avg": 0.17248311638832092, "step": 3315, "valid_targets_mean": 5084.2, "valid_targets_min": 559 }, { "epoch": 5.084226646248085, "grad_norm": 0.5032723828958181, "learning_rate": 8.469106839044232e-06, "loss": 0.1708, "loss_nan_ranks": 0, "loss_rank_avg": 0.18109896779060364, "step": 3320, "valid_targets_mean": 4405.3, "valid_targets_min": 276 }, { "epoch": 5.091883614088821, "grad_norm": 0.45559814554047867, "learning_rate": 8.406781955448913e-06, "loss": 0.1537, "loss_nan_ranks": 0, "loss_rank_avg": 0.16298320889472961, "step": 3325, "valid_targets_mean": 5751.0, "valid_targets_min": 428 }, { "epoch": 5.099540581929556, "grad_norm": 0.4939004046341742, "learning_rate": 8.344626164924436e-06, "loss": 0.1698, "loss_nan_ranks": 0, "loss_rank_avg": 0.1718837022781372, "step": 3330, "valid_targets_mean": 5382.8, "valid_targets_min": 2252 }, { "epoch": 5.107197549770291, "grad_norm": 0.5085695929621461, "learning_rate": 8.28264037404511e-06, "loss": 0.1509, "loss_nan_ranks": 0, "loss_rank_avg": 0.1606028974056244, "step": 3335, "valid_targets_mean": 4314.8, "valid_targets_min": 535 }, { "epoch": 5.114854517611026, "grad_norm": 0.5096351984468025, "learning_rate": 8.220825486905686e-06, "loss": 0.1482, "loss_nan_ranks": 0, "loss_rank_avg": 0.14969605207443237, "step": 3340, "valid_targets_mean": 4719.4, "valid_targets_min": 839 }, { "epoch": 5.122511485451761, "grad_norm": 0.47515607105527047, "learning_rate": 8.159182405108222e-06, "loss": 0.1571, "loss_nan_ranks": 0, "loss_rank_avg": 0.1551935225725174, "step": 3345, "valid_targets_mean": 5535.8, "valid_targets_min": 2886 }, { "epoch": 5.130168453292496, "grad_norm": 0.4465656432414435, "learning_rate": 8.097712027748879e-06, "loss": 0.1585, "loss_nan_ranks": 0, "loss_rank_avg": 0.1423056423664093, "step": 3350, "valid_targets_mean": 4984.5, "valid_targets_min": 980 }, { "epoch": 5.137825421133231, "grad_norm": 0.5427524948981346, "learning_rate": 8.036415251404855e-06, "loss": 0.1622, "loss_nan_ranks": 0, "loss_rank_avg": 0.1889774203300476, "step": 3355, "valid_targets_mean": 5009.1, "valid_targets_min": 819 }, { "epoch": 5.145482388973966, "grad_norm": 0.4892462664411317, "learning_rate": 7.975292970121286e-06, "loss": 0.152, "loss_nan_ranks": 0, "loss_rank_avg": 0.15726116299629211, "step": 3360, "valid_targets_mean": 5218.2, "valid_targets_min": 268 }, { "epoch": 5.153139356814702, "grad_norm": 0.4770823262528399, "learning_rate": 7.914346075398191e-06, "loss": 0.1634, "loss_nan_ranks": 0, "loss_rank_avg": 0.16496963798999786, "step": 3365, "valid_targets_mean": 4660.6, "valid_targets_min": 696 }, { "epoch": 5.160796324655436, "grad_norm": 0.8056092258122578, "learning_rate": 7.85357545617751e-06, "loss": 0.1651, "loss_nan_ranks": 0, "loss_rank_avg": 0.13913197815418243, "step": 3370, "valid_targets_mean": 4270.4, "valid_targets_min": 379 }, { "epoch": 5.168453292496172, "grad_norm": 0.5061408770101286, "learning_rate": 7.792981998830092e-06, "loss": 0.1589, "loss_nan_ranks": 0, "loss_rank_avg": 0.16775824129581451, "step": 3375, "valid_targets_mean": 5022.6, "valid_targets_min": 574 }, { "epoch": 5.176110260336906, "grad_norm": 0.6037385627128377, "learning_rate": 7.732566587142793e-06, "loss": 0.1548, "loss_nan_ranks": 0, "loss_rank_avg": 0.17123952507972717, "step": 3380, "valid_targets_mean": 4231.1, "valid_targets_min": 626 }, { "epoch": 5.183767228177642, "grad_norm": 0.5311926260698461, "learning_rate": 7.672330102305596e-06, "loss": 0.1713, "loss_nan_ranks": 0, "loss_rank_avg": 0.19350102543830872, "step": 3385, "valid_targets_mean": 4315.9, "valid_targets_min": 292 }, { "epoch": 5.191424196018377, "grad_norm": 0.5044523176604377, "learning_rate": 7.612273422898726e-06, "loss": 0.1562, "loss_nan_ranks": 0, "loss_rank_avg": 0.19003711640834808, "step": 3390, "valid_targets_mean": 4566.2, "valid_targets_min": 457 }, { "epoch": 5.199081163859112, "grad_norm": 0.6176433774855741, "learning_rate": 7.5523974248798714e-06, "loss": 0.1582, "loss_nan_ranks": 0, "loss_rank_avg": 0.16127054393291473, "step": 3395, "valid_targets_mean": 5243.8, "valid_targets_min": 936 }, { "epoch": 5.206738131699847, "grad_norm": 0.5162091315973347, "learning_rate": 7.492702981571363e-06, "loss": 0.1535, "loss_nan_ranks": 0, "loss_rank_avg": 0.1597318947315216, "step": 3400, "valid_targets_mean": 4938.6, "valid_targets_min": 814 }, { "epoch": 5.214395099540582, "grad_norm": 0.8676299780329471, "learning_rate": 7.433190963647488e-06, "loss": 0.1611, "loss_nan_ranks": 0, "loss_rank_avg": 0.14614874124526978, "step": 3405, "valid_targets_mean": 4358.2, "valid_targets_min": 840 }, { "epoch": 5.222052067381317, "grad_norm": 0.4774915723911, "learning_rate": 7.373862239121743e-06, "loss": 0.1612, "loss_nan_ranks": 0, "loss_rank_avg": 0.16033905744552612, "step": 3410, "valid_targets_mean": 4894.8, "valid_targets_min": 648 }, { "epoch": 5.229709035222052, "grad_norm": 0.5040954116535451, "learning_rate": 7.314717673334213e-06, "loss": 0.1672, "loss_nan_ranks": 0, "loss_rank_avg": 0.16919949650764465, "step": 3415, "valid_targets_mean": 6000.2, "valid_targets_min": 3105 }, { "epoch": 5.237366003062787, "grad_norm": 0.4912501104493769, "learning_rate": 7.255758128938934e-06, "loss": 0.1678, "loss_nan_ranks": 0, "loss_rank_avg": 0.20043662190437317, "step": 3420, "valid_targets_mean": 6128.0, "valid_targets_min": 804 }, { "epoch": 5.2450229709035225, "grad_norm": 0.530597468241474, "learning_rate": 7.196984465891288e-06, "loss": 0.1666, "loss_nan_ranks": 0, "loss_rank_avg": 0.16545242071151733, "step": 3425, "valid_targets_mean": 4632.1, "valid_targets_min": 792 }, { "epoch": 5.252679938744257, "grad_norm": 0.4704553688188211, "learning_rate": 7.138397541435513e-06, "loss": 0.1751, "loss_nan_ranks": 0, "loss_rank_avg": 0.16121527552604675, "step": 3430, "valid_targets_mean": 5139.7, "valid_targets_min": 1540 }, { "epoch": 5.2603369065849925, "grad_norm": 0.5036246695889622, "learning_rate": 7.079998210092132e-06, "loss": 0.1535, "loss_nan_ranks": 0, "loss_rank_avg": 0.18528419733047485, "step": 3435, "valid_targets_mean": 4868.1, "valid_targets_min": 727 }, { "epoch": 5.267993874425727, "grad_norm": 0.5946952911939519, "learning_rate": 7.021787323645557e-06, "loss": 0.1583, "loss_nan_ranks": 0, "loss_rank_avg": 0.1626713126897812, "step": 3440, "valid_targets_mean": 5682.8, "valid_targets_min": 776 }, { "epoch": 5.2756508422664625, "grad_norm": 0.44380451085617817, "learning_rate": 6.963765731131622e-06, "loss": 0.1619, "loss_nan_ranks": 0, "loss_rank_avg": 0.13598023355007172, "step": 3445, "valid_targets_mean": 5084.1, "valid_targets_min": 372 }, { "epoch": 5.283307810107198, "grad_norm": 0.44937678766204686, "learning_rate": 6.9059342788252035e-06, "loss": 0.1656, "loss_nan_ranks": 0, "loss_rank_avg": 0.15446916222572327, "step": 3450, "valid_targets_mean": 5280.4, "valid_targets_min": 743 }, { "epoch": 5.2909647779479325, "grad_norm": 0.5423325722642703, "learning_rate": 6.848293810227901e-06, "loss": 0.1598, "loss_nan_ranks": 0, "loss_rank_avg": 0.16436201333999634, "step": 3455, "valid_targets_mean": 3904.1, "valid_targets_min": 709 }, { "epoch": 5.298621745788668, "grad_norm": 0.5230875510151383, "learning_rate": 6.790845166055699e-06, "loss": 0.1737, "loss_nan_ranks": 0, "loss_rank_avg": 0.1833193153142929, "step": 3460, "valid_targets_mean": 4362.5, "valid_targets_min": 633 }, { "epoch": 5.3062787136294025, "grad_norm": 0.47630676748649625, "learning_rate": 6.733589184226747e-06, "loss": 0.1593, "loss_nan_ranks": 0, "loss_rank_avg": 0.14603200554847717, "step": 3465, "valid_targets_mean": 5092.8, "valid_targets_min": 636 }, { "epoch": 5.313935681470138, "grad_norm": 0.47996042244501036, "learning_rate": 6.676526699849086e-06, "loss": 0.1627, "loss_nan_ranks": 0, "loss_rank_avg": 0.17878413200378418, "step": 3470, "valid_targets_mean": 5376.2, "valid_targets_min": 2328 }, { "epoch": 5.3215926493108725, "grad_norm": 0.49793974395131096, "learning_rate": 6.619658545208523e-06, "loss": 0.164, "loss_nan_ranks": 0, "loss_rank_avg": 0.17316502332687378, "step": 3475, "valid_targets_mean": 4947.2, "valid_targets_min": 490 }, { "epoch": 5.329249617151608, "grad_norm": 0.5080242803851914, "learning_rate": 6.562985549756448e-06, "loss": 0.1518, "loss_nan_ranks": 0, "loss_rank_avg": 0.14953093230724335, "step": 3480, "valid_targets_mean": 4898.6, "valid_targets_min": 643 }, { "epoch": 5.336906584992343, "grad_norm": 0.514443547063424, "learning_rate": 6.506508540097769e-06, "loss": 0.1659, "loss_nan_ranks": 0, "loss_rank_avg": 0.16423040628433228, "step": 3485, "valid_targets_mean": 5819.7, "valid_targets_min": 1855 }, { "epoch": 5.344563552833078, "grad_norm": 0.4584620928236497, "learning_rate": 6.450228339978832e-06, "loss": 0.1637, "loss_nan_ranks": 0, "loss_rank_avg": 0.17829495668411255, "step": 3490, "valid_targets_mean": 5519.6, "valid_targets_min": 478 }, { "epoch": 5.352220520673813, "grad_norm": 0.47394337082009697, "learning_rate": 6.394145770275402e-06, "loss": 0.1545, "loss_nan_ranks": 0, "loss_rank_avg": 0.1514066755771637, "step": 3495, "valid_targets_mean": 5396.5, "valid_targets_min": 566 }, { "epoch": 5.359877488514548, "grad_norm": 0.4729834195916555, "learning_rate": 6.338261648980728e-06, "loss": 0.1559, "loss_nan_ranks": 0, "loss_rank_avg": 0.16408702731132507, "step": 3500, "valid_targets_mean": 4929.8, "valid_targets_min": 593 }, { "epoch": 5.367534456355283, "grad_norm": 0.4695111134489663, "learning_rate": 6.282576791193557e-06, "loss": 0.157, "loss_nan_ranks": 0, "loss_rank_avg": 0.14791680872440338, "step": 3505, "valid_targets_mean": 4815.1, "valid_targets_min": 274 }, { "epoch": 5.375191424196018, "grad_norm": 0.6948673104574568, "learning_rate": 6.227092009106301e-06, "loss": 0.1622, "loss_nan_ranks": 0, "loss_rank_avg": 0.1767755150794983, "step": 3510, "valid_targets_mean": 3131.2, "valid_targets_min": 566 }, { "epoch": 5.382848392036753, "grad_norm": 0.5735437955530691, "learning_rate": 6.171808111993158e-06, "loss": 0.1752, "loss_nan_ranks": 0, "loss_rank_avg": 0.17738190293312073, "step": 3515, "valid_targets_mean": 4039.9, "valid_targets_min": 591 }, { "epoch": 5.390505359877489, "grad_norm": 0.4761051088696013, "learning_rate": 6.116725906198297e-06, "loss": 0.1558, "loss_nan_ranks": 0, "loss_rank_avg": 0.1486128270626068, "step": 3520, "valid_targets_mean": 4567.4, "valid_targets_min": 847 }, { "epoch": 5.398162327718223, "grad_norm": 0.4579204274900233, "learning_rate": 6.061846195124144e-06, "loss": 0.1677, "loss_nan_ranks": 0, "loss_rank_avg": 0.18317697942256927, "step": 3525, "valid_targets_mean": 5270.5, "valid_targets_min": 888 }, { "epoch": 5.405819295558959, "grad_norm": 0.41159114268724806, "learning_rate": 6.007169779219606e-06, "loss": 0.1648, "loss_nan_ranks": 0, "loss_rank_avg": 0.1442817747592926, "step": 3530, "valid_targets_mean": 5373.3, "valid_targets_min": 291 }, { "epoch": 5.413476263399693, "grad_norm": 0.665150948244762, "learning_rate": 5.952697455968444e-06, "loss": 0.1674, "loss_nan_ranks": 0, "loss_rank_avg": 0.17882975935935974, "step": 3535, "valid_targets_mean": 3959.0, "valid_targets_min": 326 }, { "epoch": 5.421133231240429, "grad_norm": 0.5112194729196444, "learning_rate": 5.898430019877626e-06, "loss": 0.1609, "loss_nan_ranks": 0, "loss_rank_avg": 0.1770792305469513, "step": 3540, "valid_targets_mean": 4908.1, "valid_targets_min": 1011 }, { "epoch": 5.428790199081164, "grad_norm": 0.49899364818543357, "learning_rate": 5.8443682624657095e-06, "loss": 0.1502, "loss_nan_ranks": 0, "loss_rank_avg": 0.14375297725200653, "step": 3545, "valid_targets_mean": 4505.1, "valid_targets_min": 582 }, { "epoch": 5.436447166921899, "grad_norm": 0.5057554070553661, "learning_rate": 5.790512972251356e-06, "loss": 0.1581, "loss_nan_ranks": 0, "loss_rank_avg": 0.14775539934635162, "step": 3550, "valid_targets_mean": 5433.1, "valid_targets_min": 767 }, { "epoch": 5.444104134762634, "grad_norm": 0.4379349439343321, "learning_rate": 5.736864934741764e-06, "loss": 0.1621, "loss_nan_ranks": 0, "loss_rank_avg": 0.14294332265853882, "step": 3555, "valid_targets_mean": 5075.1, "valid_targets_min": 615 }, { "epoch": 5.451761102603369, "grad_norm": 0.46265699177561026, "learning_rate": 5.683424932421273e-06, "loss": 0.1556, "loss_nan_ranks": 0, "loss_rank_avg": 0.15184825658798218, "step": 3560, "valid_targets_mean": 5332.7, "valid_targets_min": 611 }, { "epoch": 5.459418070444104, "grad_norm": 0.5952621899721654, "learning_rate": 5.630193744739896e-06, "loss": 0.172, "loss_nan_ranks": 0, "loss_rank_avg": 0.19496630132198334, "step": 3565, "valid_targets_mean": 4201.9, "valid_targets_min": 704 }, { "epoch": 5.46707503828484, "grad_norm": 0.48070697420874536, "learning_rate": 5.577172148101993e-06, "loss": 0.1682, "loss_nan_ranks": 0, "loss_rank_avg": 0.16540558636188507, "step": 3570, "valid_targets_mean": 4890.1, "valid_targets_min": 803 }, { "epoch": 5.474732006125574, "grad_norm": 0.6848512357907565, "learning_rate": 5.52436091585493e-06, "loss": 0.1602, "loss_nan_ranks": 0, "loss_rank_avg": 0.17848747968673706, "step": 3575, "valid_targets_mean": 4479.4, "valid_targets_min": 675 }, { "epoch": 5.48238897396631, "grad_norm": 0.47722149531129565, "learning_rate": 5.471760818277792e-06, "loss": 0.172, "loss_nan_ranks": 0, "loss_rank_avg": 0.17572689056396484, "step": 3580, "valid_targets_mean": 5303.5, "valid_targets_min": 378 }, { "epoch": 5.490045941807044, "grad_norm": 0.5271976003353499, "learning_rate": 5.419372622570169e-06, "loss": 0.1557, "loss_nan_ranks": 0, "loss_rank_avg": 0.15122967958450317, "step": 3585, "valid_targets_mean": 4763.6, "valid_targets_min": 597 }, { "epoch": 5.49770290964778, "grad_norm": 0.7659869620019119, "learning_rate": 5.367197092840932e-06, "loss": 0.1642, "loss_nan_ranks": 0, "loss_rank_avg": 0.17659571766853333, "step": 3590, "valid_targets_mean": 4276.9, "valid_targets_min": 756 }, { "epoch": 5.505359877488514, "grad_norm": 0.5759762429875664, "learning_rate": 5.315234990097131e-06, "loss": 0.1569, "loss_nan_ranks": 0, "loss_rank_avg": 0.14629271626472473, "step": 3595, "valid_targets_mean": 5444.4, "valid_targets_min": 686 }, { "epoch": 5.51301684532925, "grad_norm": 0.4702162740174821, "learning_rate": 5.263487072232851e-06, "loss": 0.1652, "loss_nan_ranks": 0, "loss_rank_avg": 0.15715420246124268, "step": 3600, "valid_targets_mean": 5552.1, "valid_targets_min": 464 }, { "epoch": 5.520673813169985, "grad_norm": 0.5664693454943723, "learning_rate": 5.211954094018201e-06, "loss": 0.1737, "loss_nan_ranks": 0, "loss_rank_avg": 0.2129855751991272, "step": 3605, "valid_targets_mean": 4471.0, "valid_targets_min": 669 }, { "epoch": 5.52833078101072, "grad_norm": 0.439009368809084, "learning_rate": 5.160636807088277e-06, "loss": 0.1594, "loss_nan_ranks": 0, "loss_rank_avg": 0.1415124386548996, "step": 3610, "valid_targets_mean": 4938.8, "valid_targets_min": 837 }, { "epoch": 5.535987748851455, "grad_norm": 0.4784953299934146, "learning_rate": 5.109535959932195e-06, "loss": 0.1552, "loss_nan_ranks": 0, "loss_rank_avg": 0.16233739256858826, "step": 3615, "valid_targets_mean": 4896.0, "valid_targets_min": 445 }, { "epoch": 5.54364471669219, "grad_norm": 0.48393748501482625, "learning_rate": 5.058652297882205e-06, "loss": 0.164, "loss_nan_ranks": 0, "loss_rank_avg": 0.16299815475940704, "step": 3620, "valid_targets_mean": 4792.2, "valid_targets_min": 578 }, { "epoch": 5.551301684532925, "grad_norm": 0.4788193457811368, "learning_rate": 5.007986563102778e-06, "loss": 0.1612, "loss_nan_ranks": 0, "loss_rank_avg": 0.13831590116024017, "step": 3625, "valid_targets_mean": 5167.0, "valid_targets_min": 565 }, { "epoch": 5.55895865237366, "grad_norm": 0.5713684082322842, "learning_rate": 4.9575394945798236e-06, "loss": 0.1612, "loss_nan_ranks": 0, "loss_rank_avg": 0.15097324550151825, "step": 3630, "valid_targets_mean": 4927.1, "valid_targets_min": 434 }, { "epoch": 5.566615620214395, "grad_norm": 0.5133104989832143, "learning_rate": 4.9073118281098845e-06, "loss": 0.1882, "loss_nan_ranks": 0, "loss_rank_avg": 0.19625042378902435, "step": 3635, "valid_targets_mean": 5513.1, "valid_targets_min": 2604 }, { "epoch": 5.5742725880551305, "grad_norm": 0.454081092007902, "learning_rate": 4.857304296289398e-06, "loss": 0.1598, "loss_nan_ranks": 0, "loss_rank_avg": 0.15363352000713348, "step": 3640, "valid_targets_mean": 5523.7, "valid_targets_min": 600 }, { "epoch": 5.581929555895865, "grad_norm": 0.46884469793283995, "learning_rate": 4.807517628504048e-06, "loss": 0.1727, "loss_nan_ranks": 0, "loss_rank_avg": 0.17339780926704407, "step": 3645, "valid_targets_mean": 5304.4, "valid_targets_min": 1990 }, { "epoch": 5.5895865237366005, "grad_norm": 0.45801637501032694, "learning_rate": 4.757952550918077e-06, "loss": 0.1632, "loss_nan_ranks": 0, "loss_rank_avg": 0.14689268171787262, "step": 3650, "valid_targets_mean": 5640.2, "valid_targets_min": 576 }, { "epoch": 5.597243491577335, "grad_norm": 0.5120675322489687, "learning_rate": 4.7086097864637444e-06, "loss": 0.1574, "loss_nan_ranks": 0, "loss_rank_avg": 0.1544780433177948, "step": 3655, "valid_targets_mean": 5030.8, "valid_targets_min": 610 }, { "epoch": 5.6049004594180705, "grad_norm": 0.567671223880722, "learning_rate": 4.659490054830729e-06, "loss": 0.1689, "loss_nan_ranks": 0, "loss_rank_avg": 0.1720244139432907, "step": 3660, "valid_targets_mean": 4914.8, "valid_targets_min": 724 }, { "epoch": 5.612557427258805, "grad_norm": 0.43509274496020417, "learning_rate": 4.6105940724557e-06, "loss": 0.1625, "loss_nan_ranks": 0, "loss_rank_avg": 0.15081757307052612, "step": 3665, "valid_targets_mean": 6018.0, "valid_targets_min": 805 }, { "epoch": 5.6202143950995405, "grad_norm": 0.5912507132310114, "learning_rate": 4.561922552511788e-06, "loss": 0.1624, "loss_nan_ranks": 0, "loss_rank_avg": 0.17240439355373383, "step": 3670, "valid_targets_mean": 3949.9, "valid_targets_min": 240 }, { "epoch": 5.627871362940276, "grad_norm": 0.4793859887692694, "learning_rate": 4.5134762048982485e-06, "loss": 0.1606, "loss_nan_ranks": 0, "loss_rank_avg": 0.1666552871465683, "step": 3675, "valid_targets_mean": 5170.1, "valid_targets_min": 319 }, { "epoch": 5.6355283307810105, "grad_norm": 0.45725888831198136, "learning_rate": 4.465255736230076e-06, "loss": 0.1575, "loss_nan_ranks": 0, "loss_rank_avg": 0.15449725091457367, "step": 3680, "valid_targets_mean": 5772.3, "valid_targets_min": 726 }, { "epoch": 5.643185298621746, "grad_norm": 0.4785523703342554, "learning_rate": 4.417261849827696e-06, "loss": 0.1753, "loss_nan_ranks": 0, "loss_rank_avg": 0.19263219833374023, "step": 3685, "valid_targets_mean": 5215.2, "valid_targets_min": 689 }, { "epoch": 5.650842266462481, "grad_norm": 0.4757831273839956, "learning_rate": 4.369495245706729e-06, "loss": 0.1618, "loss_nan_ranks": 0, "loss_rank_avg": 0.1494811326265335, "step": 3690, "valid_targets_mean": 5826.9, "valid_targets_min": 583 }, { "epoch": 5.658499234303216, "grad_norm": 0.4702461000587345, "learning_rate": 4.321956620567751e-06, "loss": 0.1739, "loss_nan_ranks": 0, "loss_rank_avg": 0.1776936650276184, "step": 3695, "valid_targets_mean": 5043.8, "valid_targets_min": 871 }, { "epoch": 5.666156202143951, "grad_norm": 0.46987683467332103, "learning_rate": 4.274646667786157e-06, "loss": 0.1557, "loss_nan_ranks": 0, "loss_rank_avg": 0.15853236615657806, "step": 3700, "valid_targets_mean": 4678.7, "valid_targets_min": 592 }, { "epoch": 5.673813169984686, "grad_norm": 0.4680178929081938, "learning_rate": 4.227566077402041e-06, "loss": 0.1647, "loss_nan_ranks": 0, "loss_rank_avg": 0.1535928100347519, "step": 3705, "valid_targets_mean": 4963.2, "valid_targets_min": 261 }, { "epoch": 5.681470137825421, "grad_norm": 0.44046042021206055, "learning_rate": 4.180715536110112e-06, "loss": 0.1614, "loss_nan_ranks": 0, "loss_rank_avg": 0.13984829187393188, "step": 3710, "valid_targets_mean": 5743.1, "valid_targets_min": 588 }, { "epoch": 5.689127105666156, "grad_norm": 0.5050717822406969, "learning_rate": 4.1340957272497115e-06, "loss": 0.1557, "loss_nan_ranks": 0, "loss_rank_avg": 0.14051397144794464, "step": 3715, "valid_targets_mean": 4413.8, "valid_targets_min": 663 }, { "epoch": 5.696784073506891, "grad_norm": 0.609576054055646, "learning_rate": 4.087707330794814e-06, "loss": 0.1745, "loss_nan_ranks": 0, "loss_rank_avg": 0.14713960886001587, "step": 3720, "valid_targets_mean": 5758.8, "valid_targets_min": 1866 }, { "epoch": 5.704441041347627, "grad_norm": 0.5071420592448429, "learning_rate": 4.041551023344139e-06, "loss": 0.17, "loss_nan_ranks": 0, "loss_rank_avg": 0.17213720083236694, "step": 3725, "valid_targets_mean": 5253.4, "valid_targets_min": 301 }, { "epoch": 5.712098009188361, "grad_norm": 0.46046580007849597, "learning_rate": 3.995627478111264e-06, "loss": 0.1682, "loss_nan_ranks": 0, "loss_rank_avg": 0.1543341875076294, "step": 3730, "valid_targets_mean": 5808.6, "valid_targets_min": 606 }, { "epoch": 5.719754977029097, "grad_norm": 0.4717948081992276, "learning_rate": 3.949937364914798e-06, "loss": 0.158, "loss_nan_ranks": 0, "loss_rank_avg": 0.14789888262748718, "step": 3735, "valid_targets_mean": 5842.7, "valid_targets_min": 913 }, { "epoch": 5.727411944869831, "grad_norm": 0.472692526766977, "learning_rate": 3.904481350168641e-06, "loss": 0.1733, "loss_nan_ranks": 0, "loss_rank_avg": 0.18231379985809326, "step": 3740, "valid_targets_mean": 5480.3, "valid_targets_min": 582 }, { "epoch": 5.735068912710567, "grad_norm": 0.4774164157350961, "learning_rate": 3.8592600968722285e-06, "loss": 0.1641, "loss_nan_ranks": 0, "loss_rank_avg": 0.17668023705482483, "step": 3745, "valid_targets_mean": 5286.9, "valid_targets_min": 806 }, { "epoch": 5.742725880551301, "grad_norm": 0.5089014992120109, "learning_rate": 3.814274264600899e-06, "loss": 0.1612, "loss_nan_ranks": 0, "loss_rank_avg": 0.15314318239688873, "step": 3750, "valid_targets_mean": 4953.4, "valid_targets_min": 747 }, { "epoch": 5.750382848392037, "grad_norm": 0.5179707303157852, "learning_rate": 3.7695245094962228e-06, "loss": 0.1756, "loss_nan_ranks": 0, "loss_rank_avg": 0.16455323994159698, "step": 3755, "valid_targets_mean": 5168.4, "valid_targets_min": 840 }, { "epoch": 5.758039816232772, "grad_norm": 0.49543638175235816, "learning_rate": 3.7250114842565087e-06, "loss": 0.1613, "loss_nan_ranks": 0, "loss_rank_avg": 0.15587033331394196, "step": 3760, "valid_targets_mean": 4512.6, "valid_targets_min": 679 }, { "epoch": 5.765696784073507, "grad_norm": 0.5025738435987257, "learning_rate": 3.6807358381271963e-06, "loss": 0.1806, "loss_nan_ranks": 0, "loss_rank_avg": 0.2389712631702423, "step": 3765, "valid_targets_mean": 5495.2, "valid_targets_min": 294 }, { "epoch": 5.773353751914242, "grad_norm": 0.44563197876271343, "learning_rate": 3.6366982168914456e-06, "loss": 0.1625, "loss_nan_ranks": 0, "loss_rank_avg": 0.14085888862609863, "step": 3770, "valid_targets_mean": 5305.1, "valid_targets_min": 1943 }, { "epoch": 5.781010719754977, "grad_norm": 0.4711699929533897, "learning_rate": 3.5928992628607075e-06, "loss": 0.1561, "loss_nan_ranks": 0, "loss_rank_avg": 0.14801645278930664, "step": 3775, "valid_targets_mean": 5146.2, "valid_targets_min": 1545 }, { "epoch": 5.788667687595712, "grad_norm": 0.45863808724665833, "learning_rate": 3.549339614865328e-06, "loss": 0.1628, "loss_nan_ranks": 0, "loss_rank_avg": 0.17908339202404022, "step": 3780, "valid_targets_mean": 5437.6, "valid_targets_min": 1859 }, { "epoch": 5.796324655436447, "grad_norm": 0.5602836811382915, "learning_rate": 3.506019908245275e-06, "loss": 0.1479, "loss_nan_ranks": 0, "loss_rank_avg": 0.15862153470516205, "step": 3785, "valid_targets_mean": 4928.1, "valid_targets_min": 593 }, { "epoch": 5.803981623277182, "grad_norm": 0.5625845577017787, "learning_rate": 3.462940774840826e-06, "loss": 0.1696, "loss_nan_ranks": 0, "loss_rank_avg": 0.18470574915409088, "step": 3790, "valid_targets_mean": 4665.9, "valid_targets_min": 933 }, { "epoch": 5.811638591117918, "grad_norm": 0.5156477028052144, "learning_rate": 3.4201028429833883e-06, "loss": 0.1529, "loss_nan_ranks": 0, "loss_rank_avg": 0.14838847517967224, "step": 3795, "valid_targets_mean": 5494.6, "valid_targets_min": 661 }, { "epoch": 5.819295558958652, "grad_norm": 0.4397002728342675, "learning_rate": 3.37750673748632e-06, "loss": 0.1651, "loss_nan_ranks": 0, "loss_rank_avg": 0.14019045233726501, "step": 3800, "valid_targets_mean": 5286.6, "valid_targets_min": 983 }, { "epoch": 5.826952526799388, "grad_norm": 0.48750838244321903, "learning_rate": 3.3351530796358024e-06, "loss": 0.1572, "loss_nan_ranks": 0, "loss_rank_avg": 0.1837264895439148, "step": 3805, "valid_targets_mean": 5369.9, "valid_targets_min": 2433 }, { "epoch": 5.834609494640122, "grad_norm": 0.575464842240813, "learning_rate": 3.2930424871818145e-06, "loss": 0.1565, "loss_nan_ranks": 0, "loss_rank_avg": 0.1724276840686798, "step": 3810, "valid_targets_mean": 5045.8, "valid_targets_min": 380 }, { "epoch": 5.842266462480858, "grad_norm": 0.5014265385817863, "learning_rate": 3.2511755743290774e-06, "loss": 0.1676, "loss_nan_ranks": 0, "loss_rank_avg": 0.16347980499267578, "step": 3815, "valid_targets_mean": 5700.8, "valid_targets_min": 1001 }, { "epoch": 5.849923430321593, "grad_norm": 0.4971195883757721, "learning_rate": 3.2095529517281365e-06, "loss": 0.1817, "loss_nan_ranks": 0, "loss_rank_avg": 0.15201014280319214, "step": 3820, "valid_targets_mean": 4555.1, "valid_targets_min": 251 }, { "epoch": 5.857580398162328, "grad_norm": 0.5008524466215926, "learning_rate": 3.1681752264664387e-06, "loss": 0.1526, "loss_nan_ranks": 0, "loss_rank_avg": 0.15063107013702393, "step": 3825, "valid_targets_mean": 4804.3, "valid_targets_min": 903 }, { "epoch": 5.865237366003063, "grad_norm": 0.5064320357447261, "learning_rate": 3.12704300205946e-06, "loss": 0.1565, "loss_nan_ranks": 0, "loss_rank_avg": 0.16848312318325043, "step": 3830, "valid_targets_mean": 4334.7, "valid_targets_min": 249 }, { "epoch": 5.8728943338437976, "grad_norm": 0.5582372456603737, "learning_rate": 3.0861568784419393e-06, "loss": 0.1543, "loss_nan_ranks": 0, "loss_rank_avg": 0.15561410784721375, "step": 3835, "valid_targets_mean": 4067.6, "valid_targets_min": 762 }, { "epoch": 5.880551301684533, "grad_norm": 0.48015271820719657, "learning_rate": 3.0455174519590926e-06, "loss": 0.1655, "loss_nan_ranks": 0, "loss_rank_avg": 0.17181405425071716, "step": 3840, "valid_targets_mean": 5108.1, "valid_targets_min": 800 }, { "epoch": 5.888208269525268, "grad_norm": 0.5032917025542417, "learning_rate": 3.0051253153579373e-06, "loss": 0.1554, "loss_nan_ranks": 0, "loss_rank_avg": 0.15245842933654785, "step": 3845, "valid_targets_mean": 4856.6, "valid_targets_min": 591 }, { "epoch": 5.895865237366003, "grad_norm": 0.4568927865552627, "learning_rate": 2.964981057778644e-06, "loss": 0.1717, "loss_nan_ranks": 0, "loss_rank_avg": 0.15734651684761047, "step": 3850, "valid_targets_mean": 5474.4, "valid_targets_min": 1911 }, { "epoch": 5.903522205206738, "grad_norm": 0.5333563811950146, "learning_rate": 2.9250852647459418e-06, "loss": 0.1591, "loss_nan_ranks": 0, "loss_rank_avg": 0.14090844988822937, "step": 3855, "valid_targets_mean": 4721.5, "valid_targets_min": 553 }, { "epoch": 5.911179173047473, "grad_norm": 0.4809515679578391, "learning_rate": 2.8854385181605594e-06, "loss": 0.1684, "loss_nan_ranks": 0, "loss_rank_avg": 0.1540873646736145, "step": 3860, "valid_targets_mean": 5109.4, "valid_targets_min": 1901 }, { "epoch": 5.918836140888208, "grad_norm": 0.48239544970207976, "learning_rate": 2.8460413962907705e-06, "loss": 0.1544, "loss_nan_ranks": 0, "loss_rank_avg": 0.17352712154388428, "step": 3865, "valid_targets_mean": 4727.1, "valid_targets_min": 847 }, { "epoch": 5.926493108728943, "grad_norm": 0.5337046272163664, "learning_rate": 2.8068944737639436e-06, "loss": 0.1675, "loss_nan_ranks": 0, "loss_rank_avg": 0.16555720567703247, "step": 3870, "valid_targets_mean": 4828.6, "valid_targets_min": 586 }, { "epoch": 5.934150076569678, "grad_norm": 0.475103452331955, "learning_rate": 2.7679983215581474e-06, "loss": 0.1585, "loss_nan_ranks": 0, "loss_rank_avg": 0.19165559113025665, "step": 3875, "valid_targets_mean": 6190.2, "valid_targets_min": 816 }, { "epoch": 5.941807044410414, "grad_norm": 0.5134784747632062, "learning_rate": 2.72935350699385e-06, "loss": 0.1575, "loss_nan_ranks": 0, "loss_rank_avg": 0.15154170989990234, "step": 3880, "valid_targets_mean": 4244.9, "valid_targets_min": 812 }, { "epoch": 5.949464012251148, "grad_norm": 0.43408459090260726, "learning_rate": 2.69096059372562e-06, "loss": 0.1677, "loss_nan_ranks": 0, "loss_rank_avg": 0.1547510176897049, "step": 3885, "valid_targets_mean": 5395.6, "valid_targets_min": 717 }, { "epoch": 5.957120980091884, "grad_norm": 0.6503354175258022, "learning_rate": 2.6528201417339205e-06, "loss": 0.1794, "loss_nan_ranks": 0, "loss_rank_avg": 0.1949981451034546, "step": 3890, "valid_targets_mean": 3938.8, "valid_targets_min": 612 }, { "epoch": 5.964777947932618, "grad_norm": 0.5246115940102106, "learning_rate": 2.614932707316942e-06, "loss": 0.1604, "loss_nan_ranks": 0, "loss_rank_avg": 0.17228254675865173, "step": 3895, "valid_targets_mean": 4690.4, "valid_targets_min": 1224 }, { "epoch": 5.972434915773354, "grad_norm": 0.4986410635561786, "learning_rate": 2.5772988430824697e-06, "loss": 0.1512, "loss_nan_ranks": 0, "loss_rank_avg": 0.16765034198760986, "step": 3900, "valid_targets_mean": 5091.7, "valid_targets_min": 587 }, { "epoch": 5.980091883614088, "grad_norm": 0.41080740486480766, "learning_rate": 2.5399190979398493e-06, "loss": 0.1605, "loss_nan_ranks": 0, "loss_rank_avg": 0.1336369514465332, "step": 3905, "valid_targets_mean": 6159.9, "valid_targets_min": 941 }, { "epoch": 5.987748851454824, "grad_norm": 0.42306492813111624, "learning_rate": 2.5027940170919583e-06, "loss": 0.1454, "loss_nan_ranks": 0, "loss_rank_avg": 0.14831745624542236, "step": 3910, "valid_targets_mean": 6090.9, "valid_targets_min": 2635 }, { "epoch": 5.995405819295559, "grad_norm": 0.4748890363586371, "learning_rate": 2.4659241420272716e-06, "loss": 0.16, "loss_nan_ranks": 0, "loss_rank_avg": 0.1577981561422348, "step": 3915, "valid_targets_mean": 5881.8, "valid_targets_min": 697 }, { "epoch": 6.003062787136294, "grad_norm": 0.46055683667700925, "learning_rate": 2.429310010511956e-06, "loss": 0.1633, "loss_nan_ranks": 0, "loss_rank_avg": 0.16992008686065674, "step": 3920, "valid_targets_mean": 5102.2, "valid_targets_min": 1521 }, { "epoch": 6.010719754977029, "grad_norm": 0.42406910050920277, "learning_rate": 2.392952156582018e-06, "loss": 0.1566, "loss_nan_ranks": 0, "loss_rank_avg": 0.13615508377552032, "step": 3925, "valid_targets_mean": 5358.2, "valid_targets_min": 693 }, { "epoch": 6.018376722817764, "grad_norm": 0.4799597914576974, "learning_rate": 2.3568511105355363e-06, "loss": 0.1502, "loss_nan_ranks": 0, "loss_rank_avg": 0.1690567135810852, "step": 3930, "valid_targets_mean": 4816.2, "valid_targets_min": 663 }, { "epoch": 6.026033690658499, "grad_norm": 0.4808874892486829, "learning_rate": 2.321007398924897e-06, "loss": 0.1569, "loss_nan_ranks": 0, "loss_rank_avg": 0.14551788568496704, "step": 3935, "valid_targets_mean": 4578.4, "valid_targets_min": 430 }, { "epoch": 6.033690658499235, "grad_norm": 0.44957556088245915, "learning_rate": 2.2854215445491467e-06, "loss": 0.1656, "loss_nan_ranks": 0, "loss_rank_avg": 0.15582698583602905, "step": 3940, "valid_targets_mean": 5508.3, "valid_targets_min": 1228 }, { "epoch": 6.041347626339969, "grad_norm": 0.5135673979652564, "learning_rate": 2.250094066446342e-06, "loss": 0.1561, "loss_nan_ranks": 0, "loss_rank_avg": 0.1671498417854309, "step": 3945, "valid_targets_mean": 4560.2, "valid_targets_min": 742 }, { "epoch": 6.049004594180705, "grad_norm": 0.5547826648523004, "learning_rate": 2.215025479885999e-06, "loss": 0.1617, "loss_nan_ranks": 0, "loss_rank_avg": 0.16672340035438538, "step": 3950, "valid_targets_mean": 4601.8, "valid_targets_min": 737 }, { "epoch": 6.056661562021439, "grad_norm": 0.4009473872690044, "learning_rate": 2.180216296361548e-06, "loss": 0.155, "loss_nan_ranks": 0, "loss_rank_avg": 0.12265469133853912, "step": 3955, "valid_targets_mean": 6534.8, "valid_targets_min": 1368 }, { "epoch": 6.064318529862175, "grad_norm": 0.4564705546836802, "learning_rate": 2.145667023582907e-06, "loss": 0.1611, "loss_nan_ranks": 0, "loss_rank_avg": 0.144794762134552, "step": 3960, "valid_targets_mean": 5498.0, "valid_targets_min": 276 }, { "epoch": 6.071975497702909, "grad_norm": 0.5051561406739382, "learning_rate": 2.1113781654690624e-06, "loss": 0.1574, "loss_nan_ranks": 0, "loss_rank_avg": 0.1356779932975769, "step": 3965, "valid_targets_mean": 4497.1, "valid_targets_min": 566 }, { "epoch": 6.079632465543645, "grad_norm": 0.47564995155516737, "learning_rate": 2.077350222140704e-06, "loss": 0.1448, "loss_nan_ranks": 0, "loss_rank_avg": 0.1437039077281952, "step": 3970, "valid_targets_mean": 5306.3, "valid_targets_min": 560 }, { "epoch": 6.08728943338438, "grad_norm": 0.5940128337403686, "learning_rate": 2.0435836899129624e-06, "loss": 0.1696, "loss_nan_ranks": 0, "loss_rank_avg": 0.19864995777606964, "step": 3975, "valid_targets_mean": 4722.4, "valid_targets_min": 1353 }, { "epoch": 6.094946401225115, "grad_norm": 0.49070285695934485, "learning_rate": 2.0100790612881392e-06, "loss": 0.1555, "loss_nan_ranks": 0, "loss_rank_avg": 0.19582757353782654, "step": 3980, "valid_targets_mean": 5257.1, "valid_targets_min": 272 }, { "epoch": 6.10260336906585, "grad_norm": 0.46266996157161816, "learning_rate": 1.9768368249485427e-06, "loss": 0.1526, "loss_nan_ranks": 0, "loss_rank_avg": 0.16311945021152496, "step": 3985, "valid_targets_mean": 5434.1, "valid_targets_min": 472 }, { "epoch": 6.110260336906585, "grad_norm": 0.46875844903787695, "learning_rate": 1.9438574657493547e-06, "loss": 0.1492, "loss_nan_ranks": 0, "loss_rank_avg": 0.148982971906662, "step": 3990, "valid_targets_mean": 5669.6, "valid_targets_min": 3120 }, { "epoch": 6.11791730474732, "grad_norm": 0.4856031191051758, "learning_rate": 1.9111414647115545e-06, "loss": 0.1582, "loss_nan_ranks": 0, "loss_rank_avg": 0.14689423143863678, "step": 3995, "valid_targets_mean": 5054.9, "valid_targets_min": 2586 }, { "epoch": 6.1255742725880555, "grad_norm": 0.6163929918826091, "learning_rate": 1.878689299014913e-06, "loss": 0.1644, "loss_nan_ranks": 0, "loss_rank_avg": 0.15235333144664764, "step": 4000, "valid_targets_mean": 4759.5, "valid_targets_min": 1983 }, { "epoch": 6.13323124042879, "grad_norm": 0.429934054934571, "learning_rate": 1.8465014419910155e-06, "loss": 0.1377, "loss_nan_ranks": 0, "loss_rank_avg": 0.1379457414150238, "step": 4005, "valid_targets_mean": 6366.9, "valid_targets_min": 3204 }, { "epoch": 6.1408882082695255, "grad_norm": 0.7233086750971975, "learning_rate": 1.8145783631163772e-06, "loss": 0.1685, "loss_nan_ranks": 0, "loss_rank_avg": 0.18254977464675903, "step": 4010, "valid_targets_mean": 3828.1, "valid_targets_min": 434 }, { "epoch": 6.14854517611026, "grad_norm": 0.5027392672006016, "learning_rate": 1.7829205280055938e-06, "loss": 0.1504, "loss_nan_ranks": 0, "loss_rank_avg": 0.1422107219696045, "step": 4015, "valid_targets_mean": 4783.3, "valid_targets_min": 661 }, { "epoch": 6.1562021439509955, "grad_norm": 0.5617038740562822, "learning_rate": 1.7515283984045228e-06, "loss": 0.1608, "loss_nan_ranks": 0, "loss_rank_avg": 0.1379905641078949, "step": 4020, "valid_targets_mean": 3973.9, "valid_targets_min": 240 }, { "epoch": 6.16385911179173, "grad_norm": 0.48304445431238197, "learning_rate": 1.7204024321835944e-06, "loss": 0.1608, "loss_nan_ranks": 0, "loss_rank_avg": 0.14369803667068481, "step": 4025, "valid_targets_mean": 5558.6, "valid_targets_min": 1845 }, { "epoch": 6.1715160796324655, "grad_norm": 0.5855970422459711, "learning_rate": 1.6895430833310844e-06, "loss": 0.1454, "loss_nan_ranks": 0, "loss_rank_avg": 0.1536564975976944, "step": 4030, "valid_targets_mean": 3549.4, "valid_targets_min": 767 }, { "epoch": 6.179173047473201, "grad_norm": 0.48239528326391967, "learning_rate": 1.6589508019465395e-06, "loss": 0.1548, "loss_nan_ranks": 0, "loss_rank_avg": 0.16883978247642517, "step": 4035, "valid_targets_mean": 5138.6, "valid_targets_min": 1466 }, { "epoch": 6.1868300153139355, "grad_norm": 0.5343661046550146, "learning_rate": 1.628626034234173e-06, "loss": 0.1648, "loss_nan_ranks": 0, "loss_rank_avg": 0.16661593317985535, "step": 4040, "valid_targets_mean": 5237.5, "valid_targets_min": 758 }, { "epoch": 6.194486983154671, "grad_norm": 0.42129658187000146, "learning_rate": 1.5985692224963844e-06, "loss": 0.1571, "loss_nan_ranks": 0, "loss_rank_avg": 0.12375140190124512, "step": 4045, "valid_targets_mean": 6090.9, "valid_targets_min": 787 }, { "epoch": 6.2021439509954055, "grad_norm": 0.4842019759636806, "learning_rate": 1.5687808051272835e-06, "loss": 0.1607, "loss_nan_ranks": 0, "loss_rank_avg": 0.18923643231391907, "step": 4050, "valid_targets_mean": 5465.9, "valid_targets_min": 357 }, { "epoch": 6.209800918836141, "grad_norm": 1.005454460289286, "learning_rate": 1.5392612166063203e-06, "loss": 0.1691, "loss_nan_ranks": 0, "loss_rank_avg": 0.18108555674552917, "step": 4055, "valid_targets_mean": 3432.4, "valid_targets_min": 666 }, { "epoch": 6.217457886676876, "grad_norm": 0.5016868489631979, "learning_rate": 1.5100108874919395e-06, "loss": 0.1471, "loss_nan_ranks": 0, "loss_rank_avg": 0.12715457379817963, "step": 4060, "valid_targets_mean": 4946.0, "valid_targets_min": 563 }, { "epoch": 6.225114854517611, "grad_norm": 0.49871078521671197, "learning_rate": 1.4810302444152868e-06, "loss": 0.1659, "loss_nan_ranks": 0, "loss_rank_avg": 0.17101529240608215, "step": 4065, "valid_targets_mean": 5428.0, "valid_targets_min": 533 }, { "epoch": 6.232771822358346, "grad_norm": 0.44896200586577506, "learning_rate": 1.4523197100740127e-06, "loss": 0.1538, "loss_nan_ranks": 0, "loss_rank_avg": 0.14551226794719696, "step": 4070, "valid_targets_mean": 5273.6, "valid_targets_min": 1350 }, { "epoch": 6.240428790199081, "grad_norm": 0.5369466730400164, "learning_rate": 1.423879703226072e-06, "loss": 0.1595, "loss_nan_ranks": 0, "loss_rank_avg": 0.18292181193828583, "step": 4075, "valid_targets_mean": 4546.9, "valid_targets_min": 429 }, { "epoch": 6.248085758039816, "grad_norm": 0.4534004010866802, "learning_rate": 1.3957106386836584e-06, "loss": 0.1553, "loss_nan_ranks": 0, "loss_rank_avg": 0.14585313200950623, "step": 4080, "valid_targets_mean": 5585.4, "valid_targets_min": 353 }, { "epoch": 6.255742725880551, "grad_norm": 0.4562447826282773, "learning_rate": 1.3678129273071194e-06, "loss": 0.1642, "loss_nan_ranks": 0, "loss_rank_avg": 0.18082283437252045, "step": 4085, "valid_targets_mean": 5402.2, "valid_targets_min": 822 }, { "epoch": 6.263399693721286, "grad_norm": 0.5446884739075963, "learning_rate": 1.340186975998976e-06, "loss": 0.1621, "loss_nan_ranks": 0, "loss_rank_avg": 0.15701700747013092, "step": 4090, "valid_targets_mean": 4313.9, "valid_targets_min": 724 }, { "epoch": 6.271056661562022, "grad_norm": 0.5562186277826435, "learning_rate": 1.3128331876979994e-06, "loss": 0.1523, "loss_nan_ranks": 0, "loss_rank_avg": 0.1641978621482849, "step": 4095, "valid_targets_mean": 4410.6, "valid_targets_min": 858 }, { "epoch": 6.278713629402756, "grad_norm": 0.4458800063927126, "learning_rate": 1.285751961373305e-06, "loss": 0.1594, "loss_nan_ranks": 0, "loss_rank_avg": 0.14536157250404358, "step": 4100, "valid_targets_mean": 5645.1, "valid_targets_min": 700 }, { "epoch": 6.286370597243492, "grad_norm": 0.5283911789373491, "learning_rate": 1.2589436920185661e-06, "loss": 0.1575, "loss_nan_ranks": 0, "loss_rank_avg": 0.16219042241573334, "step": 4105, "valid_targets_mean": 4158.7, "valid_targets_min": 542 }, { "epoch": 6.294027565084226, "grad_norm": 0.5094779670955533, "learning_rate": 1.232408770646234e-06, "loss": 0.166, "loss_nan_ranks": 0, "loss_rank_avg": 0.17320656776428223, "step": 4110, "valid_targets_mean": 4912.1, "valid_targets_min": 621 }, { "epoch": 6.301684532924962, "grad_norm": 0.5719763141764206, "learning_rate": 1.2061475842818337e-06, "loss": 0.1647, "loss_nan_ranks": 0, "loss_rank_avg": 0.17003297805786133, "step": 4115, "valid_targets_mean": 4195.1, "valid_targets_min": 326 }, { "epoch": 6.309341500765697, "grad_norm": 0.5256383923265986, "learning_rate": 1.1801605159583307e-06, "loss": 0.1599, "loss_nan_ranks": 0, "loss_rank_avg": 0.1623782217502594, "step": 4120, "valid_targets_mean": 4425.1, "valid_targets_min": 728 }, { "epoch": 6.316998468606432, "grad_norm": 0.48481180094784476, "learning_rate": 1.1544479447105261e-06, "loss": 0.1576, "loss_nan_ranks": 0, "loss_rank_avg": 0.16785955429077148, "step": 4125, "valid_targets_mean": 5730.3, "valid_targets_min": 511 }, { "epoch": 6.324655436447167, "grad_norm": 0.4572254396324727, "learning_rate": 1.1290102455695595e-06, "loss": 0.1585, "loss_nan_ranks": 0, "loss_rank_avg": 0.16064852476119995, "step": 4130, "valid_targets_mean": 5513.2, "valid_targets_min": 1849 }, { "epoch": 6.332312404287902, "grad_norm": 0.4530850293667914, "learning_rate": 1.1038477895573974e-06, "loss": 0.1612, "loss_nan_ranks": 0, "loss_rank_avg": 0.16299015283584595, "step": 4135, "valid_targets_mean": 5793.6, "valid_targets_min": 880 }, { "epoch": 6.339969372128637, "grad_norm": 0.48028598319389537, "learning_rate": 1.0789609436814552e-06, "loss": 0.1521, "loss_nan_ranks": 0, "loss_rank_avg": 0.14780756831169128, "step": 4140, "valid_targets_mean": 5281.0, "valid_targets_min": 773 }, { "epoch": 6.347626339969372, "grad_norm": 0.4496051344582939, "learning_rate": 1.0543500709292309e-06, "loss": 0.1613, "loss_nan_ranks": 0, "loss_rank_avg": 0.17510706186294556, "step": 4145, "valid_targets_mean": 6073.4, "valid_targets_min": 762 }, { "epoch": 6.355283307810107, "grad_norm": 0.509916750158182, "learning_rate": 1.0300155302630045e-06, "loss": 0.172, "loss_nan_ranks": 0, "loss_rank_avg": 0.18384206295013428, "step": 4150, "valid_targets_mean": 4543.0, "valid_targets_min": 312 }, { "epoch": 6.362940275650843, "grad_norm": 0.4914861553380316, "learning_rate": 1.005957676614624e-06, "loss": 0.1632, "loss_nan_ranks": 0, "loss_rank_avg": 0.15742814540863037, "step": 4155, "valid_targets_mean": 5673.4, "valid_targets_min": 730 }, { "epoch": 6.370597243491577, "grad_norm": 0.44389672499265986, "learning_rate": 9.821768608802995e-07, "loss": 0.1483, "loss_nan_ranks": 0, "loss_rank_avg": 0.12984803318977356, "step": 4160, "valid_targets_mean": 5247.4, "valid_targets_min": 313 }, { "epoch": 6.378254211332313, "grad_norm": 0.5068179023268576, "learning_rate": 9.58673429915511e-07, "loss": 0.1578, "loss_nan_ranks": 0, "loss_rank_avg": 0.18095433712005615, "step": 4165, "valid_targets_mean": 4936.8, "valid_targets_min": 493 }, { "epoch": 6.385911179173047, "grad_norm": 0.6110721344279758, "learning_rate": 9.354477265299277e-07, "loss": 0.157, "loss_nan_ranks": 0, "loss_rank_avg": 0.14109715819358826, "step": 4170, "valid_targets_mean": 4727.2, "valid_targets_min": 844 }, { "epoch": 6.393568147013783, "grad_norm": 0.4593471805913175, "learning_rate": 9.125000894824332e-07, "loss": 0.1568, "loss_nan_ranks": 0, "loss_rank_avg": 0.15586645901203156, "step": 4175, "valid_targets_mean": 5135.5, "valid_targets_min": 779 }, { "epoch": 6.401225114854517, "grad_norm": 0.5144834066021605, "learning_rate": 8.898308534761591e-07, "loss": 0.164, "loss_nan_ranks": 0, "loss_rank_avg": 0.15124112367630005, "step": 4180, "valid_targets_mean": 4934.0, "valid_targets_min": 616 }, { "epoch": 6.408882082695253, "grad_norm": 0.4240329535706579, "learning_rate": 8.674403491536121e-07, "loss": 0.162, "loss_nan_ranks": 0, "loss_rank_avg": 0.1325221210718155, "step": 4185, "valid_targets_mean": 6155.0, "valid_targets_min": 2846 }, { "epoch": 6.416539050535988, "grad_norm": 0.4349870239932218, "learning_rate": 8.453289030918643e-07, "loss": 0.153, "loss_nan_ranks": 0, "loss_rank_avg": 0.13124766945838928, "step": 4190, "valid_targets_mean": 5847.3, "valid_targets_min": 594 }, { "epoch": 6.424196018376723, "grad_norm": 0.4258108290720063, "learning_rate": 8.234968377977704e-07, "loss": 0.1502, "loss_nan_ranks": 0, "loss_rank_avg": 0.13588905334472656, "step": 4195, "valid_targets_mean": 5795.6, "valid_targets_min": 2571 }, { "epoch": 6.431852986217458, "grad_norm": 0.4823382335960822, "learning_rate": 8.019444717032732e-07, "loss": 0.146, "loss_nan_ranks": 0, "loss_rank_avg": 0.14344608783721924, "step": 4200, "valid_targets_mean": 5538.8, "valid_targets_min": 801 }, { "epoch": 6.439509954058193, "grad_norm": 0.5440916742867541, "learning_rate": 7.806721191607658e-07, "loss": 0.1533, "loss_nan_ranks": 0, "loss_rank_avg": 0.14522123336791992, "step": 4205, "valid_targets_mean": 4628.5, "valid_targets_min": 840 }, { "epoch": 6.447166921898928, "grad_norm": 0.47576315988744305, "learning_rate": 7.596800904384838e-07, "loss": 0.1389, "loss_nan_ranks": 0, "loss_rank_avg": 0.14390070736408234, "step": 4210, "valid_targets_mean": 5652.9, "valid_targets_min": 966 }, { "epoch": 6.4548238897396635, "grad_norm": 0.5218061277679277, "learning_rate": 7.38968691716011e-07, "loss": 0.1641, "loss_nan_ranks": 0, "loss_rank_avg": 0.18774065375328064, "step": 4215, "valid_targets_mean": 4977.1, "valid_targets_min": 723 }, { "epoch": 6.462480857580398, "grad_norm": 0.4286228931036304, "learning_rate": 7.185382250797901e-07, "loss": 0.1528, "loss_nan_ranks": 0, "loss_rank_avg": 0.1377241015434265, "step": 4220, "valid_targets_mean": 5731.1, "valid_targets_min": 615 }, { "epoch": 6.4701378254211335, "grad_norm": 0.47837224891886565, "learning_rate": 6.983889885187279e-07, "loss": 0.1578, "loss_nan_ranks": 0, "loss_rank_avg": 0.15443077683448792, "step": 4225, "valid_targets_mean": 5042.2, "valid_targets_min": 2433 }, { "epoch": 6.477794793261868, "grad_norm": 0.49422631910990883, "learning_rate": 6.785212759198345e-07, "loss": 0.1649, "loss_nan_ranks": 0, "loss_rank_avg": 0.15702563524246216, "step": 4230, "valid_targets_mean": 4542.4, "valid_targets_min": 379 }, { "epoch": 6.4854517611026035, "grad_norm": 0.477290567718433, "learning_rate": 6.58935377063965e-07, "loss": 0.1629, "loss_nan_ranks": 0, "loss_rank_avg": 0.1609748899936676, "step": 4235, "valid_targets_mean": 5713.4, "valid_targets_min": 538 }, { "epoch": 6.493108728943339, "grad_norm": 0.4756474679960268, "learning_rate": 6.396315776215645e-07, "loss": 0.1662, "loss_nan_ranks": 0, "loss_rank_avg": 0.16133789718151093, "step": 4240, "valid_targets_mean": 5269.2, "valid_targets_min": 685 }, { "epoch": 6.5007656967840735, "grad_norm": 0.4929632772608458, "learning_rate": 6.206101591485092e-07, "loss": 0.1612, "loss_nan_ranks": 0, "loss_rank_avg": 0.14727333188056946, "step": 4245, "valid_targets_mean": 5250.6, "valid_targets_min": 686 }, { "epoch": 6.508422664624809, "grad_norm": 0.5014543137245218, "learning_rate": 6.018713990820168e-07, "loss": 0.1592, "loss_nan_ranks": 0, "loss_rank_avg": 0.18269553780555725, "step": 4250, "valid_targets_mean": 4937.0, "valid_targets_min": 1441 }, { "epoch": 6.5160796324655434, "grad_norm": 0.5773327888472211, "learning_rate": 5.834155707365696e-07, "loss": 0.1672, "loss_nan_ranks": 0, "loss_rank_avg": 0.16463427245616913, "step": 4255, "valid_targets_mean": 4428.4, "valid_targets_min": 750 }, { "epoch": 6.523736600306279, "grad_norm": 0.5158369739919062, "learning_rate": 5.652429432999596e-07, "loss": 0.1744, "loss_nan_ranks": 0, "loss_rank_avg": 0.20093436539173126, "step": 4260, "valid_targets_mean": 5806.6, "valid_targets_min": 816 }, { "epoch": 6.531393568147013, "grad_norm": 0.5089399556927194, "learning_rate": 5.47353781829334e-07, "loss": 0.1534, "loss_nan_ranks": 0, "loss_rank_avg": 0.14460662007331848, "step": 4265, "valid_targets_mean": 4637.4, "valid_targets_min": 426 }, { "epoch": 6.539050535987749, "grad_norm": 0.5388069418287857, "learning_rate": 5.297483472473541e-07, "loss": 0.1538, "loss_nan_ranks": 0, "loss_rank_avg": 0.15606024861335754, "step": 4270, "valid_targets_mean": 4018.7, "valid_targets_min": 534 }, { "epoch": 6.546707503828484, "grad_norm": 0.47769896995919425, "learning_rate": 5.12426896338376e-07, "loss": 0.1542, "loss_nan_ranks": 0, "loss_rank_avg": 0.12930753827095032, "step": 4275, "valid_targets_mean": 5469.5, "valid_targets_min": 1085 }, { "epoch": 6.554364471669219, "grad_norm": 0.5133848406051136, "learning_rate": 4.953896817446957e-07, "loss": 0.1558, "loss_nan_ranks": 0, "loss_rank_avg": 0.14288434386253357, "step": 4280, "valid_targets_mean": 4725.6, "valid_targets_min": 618 }, { "epoch": 6.562021439509954, "grad_norm": 0.5203682808767163, "learning_rate": 4.78636951962892e-07, "loss": 0.1652, "loss_nan_ranks": 0, "loss_rank_avg": 0.18543046712875366, "step": 4285, "valid_targets_mean": 5126.2, "valid_targets_min": 685 }, { "epoch": 6.569678407350689, "grad_norm": 0.46911153856516075, "learning_rate": 4.621689513401739e-07, "loss": 0.1566, "loss_nan_ranks": 0, "loss_rank_avg": 0.14522890746593475, "step": 4290, "valid_targets_mean": 5616.9, "valid_targets_min": 736 }, { "epoch": 6.577335375191424, "grad_norm": 0.49903648422517666, "learning_rate": 4.4598592007083277e-07, "loss": 0.1468, "loss_nan_ranks": 0, "loss_rank_avg": 0.15592968463897705, "step": 4295, "valid_targets_mean": 4984.1, "valid_targets_min": 751 }, { "epoch": 6.584992343032159, "grad_norm": 0.562087312070281, "learning_rate": 4.300880941927399e-07, "loss": 0.1584, "loss_nan_ranks": 0, "loss_rank_avg": 0.15358403325080872, "step": 4300, "valid_targets_mean": 5085.4, "valid_targets_min": 1655 }, { "epoch": 6.592649310872894, "grad_norm": 0.47791617240764883, "learning_rate": 4.1447570558388774e-07, "loss": 0.1532, "loss_nan_ranks": 0, "loss_rank_avg": 0.1530168354511261, "step": 4305, "valid_targets_mean": 5281.8, "valid_targets_min": 854 }, { "epoch": 6.60030627871363, "grad_norm": 0.45343705198477624, "learning_rate": 3.991489819590322e-07, "loss": 0.1468, "loss_nan_ranks": 0, "loss_rank_avg": 0.15143750607967377, "step": 4310, "valid_targets_mean": 5688.8, "valid_targets_min": 717 }, { "epoch": 6.607963246554364, "grad_norm": 0.6088682794383126, "learning_rate": 3.8410814686634214e-07, "loss": 0.1557, "loss_nan_ranks": 0, "loss_rank_avg": 0.1674603819847107, "step": 4315, "valid_targets_mean": 4535.4, "valid_targets_min": 712 }, { "epoch": 6.6156202143951, "grad_norm": 0.5417614540657483, "learning_rate": 3.6935341968417305e-07, "loss": 0.1538, "loss_nan_ranks": 0, "loss_rank_avg": 0.1633644849061966, "step": 4320, "valid_targets_mean": 4694.1, "valid_targets_min": 310 }, { "epoch": 6.623277182235834, "grad_norm": 0.5680715181021335, "learning_rate": 3.548850156178274e-07, "loss": 0.161, "loss_nan_ranks": 0, "loss_rank_avg": 0.15728434920310974, "step": 4325, "valid_targets_mean": 5259.0, "valid_targets_min": 478 }, { "epoch": 6.63093415007657, "grad_norm": 0.4664775223352316, "learning_rate": 3.407031456964571e-07, "loss": 0.156, "loss_nan_ranks": 0, "loss_rank_avg": 0.1763657182455063, "step": 4330, "valid_targets_mean": 5762.2, "valid_targets_min": 490 }, { "epoch": 6.638591117917304, "grad_norm": 0.6365218167161506, "learning_rate": 3.2680801676995724e-07, "loss": 0.1682, "loss_nan_ranks": 0, "loss_rank_avg": 0.19776296615600586, "step": 4335, "valid_targets_mean": 4274.9, "valid_targets_min": 466 }, { "epoch": 6.64624808575804, "grad_norm": 0.4910720869258167, "learning_rate": 3.1319983150595035e-07, "loss": 0.1412, "loss_nan_ranks": 0, "loss_rank_avg": 0.1406899392604828, "step": 4340, "valid_targets_mean": 5006.8, "valid_targets_min": 1618 }, { "epoch": 6.653905053598775, "grad_norm": 0.569329802811622, "learning_rate": 2.998787883868537e-07, "loss": 0.1539, "loss_nan_ranks": 0, "loss_rank_avg": 0.16043078899383545, "step": 4345, "valid_targets_mean": 3629.7, "valid_targets_min": 599 }, { "epoch": 6.66156202143951, "grad_norm": 0.5169327909748895, "learning_rate": 2.868450817069501e-07, "loss": 0.1523, "loss_nan_ranks": 0, "loss_rank_avg": 0.18156372010707855, "step": 4350, "valid_targets_mean": 5023.1, "valid_targets_min": 1035 }, { "epoch": 6.669218989280245, "grad_norm": 0.5620209579007543, "learning_rate": 2.7409890156958607e-07, "loss": 0.1576, "loss_nan_ranks": 0, "loss_rank_avg": 0.16176734864711761, "step": 4355, "valid_targets_mean": 4832.9, "valid_targets_min": 1225 }, { "epoch": 6.676875957120981, "grad_norm": 0.4949524076974463, "learning_rate": 2.616404338843803e-07, "loss": 0.1547, "loss_nan_ranks": 0, "loss_rank_avg": 0.16081801056861877, "step": 4360, "valid_targets_mean": 5138.5, "valid_targets_min": 850 }, { "epoch": 6.684532924961715, "grad_norm": 0.4562359420788241, "learning_rate": 2.4946986036451294e-07, "loss": 0.1536, "loss_nan_ranks": 0, "loss_rank_avg": 0.16743341088294983, "step": 4365, "valid_targets_mean": 5915.8, "valid_targets_min": 805 }, { "epoch": 6.692189892802451, "grad_norm": 0.4911008520965554, "learning_rate": 2.375873585240851e-07, "loss": 0.1629, "loss_nan_ranks": 0, "loss_rank_avg": 0.14914241433143616, "step": 4370, "valid_targets_mean": 4897.8, "valid_targets_min": 321 }, { "epoch": 6.699846860643185, "grad_norm": 0.5140272838780794, "learning_rate": 2.2599310167551902e-07, "loss": 0.1585, "loss_nan_ranks": 0, "loss_rank_avg": 0.15968918800354004, "step": 4375, "valid_targets_mean": 4938.5, "valid_targets_min": 453 }, { "epoch": 6.707503828483921, "grad_norm": 0.5219624600556243, "learning_rate": 2.1468725892704212e-07, "loss": 0.161, "loss_nan_ranks": 0, "loss_rank_avg": 0.15002906322479248, "step": 4380, "valid_targets_mean": 5464.5, "valid_targets_min": 360 }, { "epoch": 6.715160796324655, "grad_norm": 0.5319553307201998, "learning_rate": 2.0366999518020015e-07, "loss": 0.1516, "loss_nan_ranks": 0, "loss_rank_avg": 0.15449857711791992, "step": 4385, "valid_targets_mean": 4223.0, "valid_targets_min": 313 }, { "epoch": 6.722817764165391, "grad_norm": 0.6335557414758894, "learning_rate": 1.9294147112748129e-07, "loss": 0.1673, "loss_nan_ranks": 0, "loss_rank_avg": 0.18669471144676208, "step": 4390, "valid_targets_mean": 3495.2, "valid_targets_min": 382 }, { "epoch": 6.730474732006126, "grad_norm": 0.5264194401944684, "learning_rate": 1.8250184324994258e-07, "loss": 0.172, "loss_nan_ranks": 0, "loss_rank_avg": 0.15428876876831055, "step": 4395, "valid_targets_mean": 4849.3, "valid_targets_min": 635 }, { "epoch": 6.738131699846861, "grad_norm": 0.5483060983513385, "learning_rate": 1.7235126381494716e-07, "loss": 0.1608, "loss_nan_ranks": 0, "loss_rank_avg": 0.15400370955467224, "step": 4400, "valid_targets_mean": 3996.1, "valid_targets_min": 763 }, { "epoch": 6.745788667687596, "grad_norm": 0.484798407756023, "learning_rate": 1.6248988087393946e-07, "loss": 0.1649, "loss_nan_ranks": 0, "loss_rank_avg": 0.18481765687465668, "step": 4405, "valid_targets_mean": 5657.8, "valid_targets_min": 625 }, { "epoch": 6.7534456355283305, "grad_norm": 0.4730938326668684, "learning_rate": 1.529178382602803e-07, "loss": 0.149, "loss_nan_ranks": 0, "loss_rank_avg": 0.15649360418319702, "step": 4410, "valid_targets_mean": 5236.0, "valid_targets_min": 559 }, { "epoch": 6.761102603369066, "grad_norm": 0.5092523070882127, "learning_rate": 1.4363527558715286e-07, "loss": 0.1685, "loss_nan_ranks": 0, "loss_rank_avg": 0.1409115046262741, "step": 4415, "valid_targets_mean": 5457.8, "valid_targets_min": 874 }, { "epoch": 6.7687595712098005, "grad_norm": 0.524901721297739, "learning_rate": 1.346423282455267e-07, "loss": 0.1477, "loss_nan_ranks": 0, "loss_rank_avg": 0.1688336730003357, "step": 4420, "valid_targets_mean": 4615.9, "valid_targets_min": 713 }, { "epoch": 6.776416539050536, "grad_norm": 0.5105117143096871, "learning_rate": 1.259391274021815e-07, "loss": 0.1609, "loss_nan_ranks": 0, "loss_rank_avg": 0.1753007471561432, "step": 4425, "valid_targets_mean": 4862.4, "valid_targets_min": 594 }, { "epoch": 6.784073506891271, "grad_norm": 0.5143595147260921, "learning_rate": 1.1752579999779523e-07, "loss": 0.1497, "loss_nan_ranks": 0, "loss_rank_avg": 0.18723537027835846, "step": 4430, "valid_targets_mean": 5300.6, "valid_targets_min": 602 }, { "epoch": 6.791730474732006, "grad_norm": 0.47454601556028797, "learning_rate": 1.094024687450923e-07, "loss": 0.1543, "loss_nan_ranks": 0, "loss_rank_avg": 0.13127397000789642, "step": 4435, "valid_targets_mean": 4709.1, "valid_targets_min": 614 }, { "epoch": 6.799387442572741, "grad_norm": 0.520781711890744, "learning_rate": 1.0156925212705171e-07, "loss": 0.1466, "loss_nan_ranks": 0, "loss_rank_avg": 0.1573190838098526, "step": 4440, "valid_targets_mean": 4981.8, "valid_targets_min": 929 }, { "epoch": 6.807044410413476, "grad_norm": 0.4496519457965003, "learning_rate": 9.402626439518393e-08, "loss": 0.1629, "loss_nan_ranks": 0, "loss_rank_avg": 0.14165663719177246, "step": 4445, "valid_targets_mean": 5795.9, "valid_targets_min": 3105 }, { "epoch": 6.814701378254211, "grad_norm": 0.6215392778464087, "learning_rate": 8.677361556786113e-08, "loss": 0.1545, "loss_nan_ranks": 0, "loss_rank_avg": 0.18268686532974243, "step": 4450, "valid_targets_mean": 6543.2, "valid_targets_min": 535 }, { "epoch": 6.822358346094946, "grad_norm": 0.49471966346976204, "learning_rate": 7.98114114287052e-08, "loss": 0.1512, "loss_nan_ranks": 0, "loss_rank_avg": 0.15616750717163086, "step": 4455, "valid_targets_mean": 4753.4, "valid_targets_min": 910 }, { "epoch": 6.830015313935681, "grad_norm": 0.4930676116391729, "learning_rate": 7.313975352506442e-08, "loss": 0.1605, "loss_nan_ranks": 0, "loss_rank_avg": 0.18801480531692505, "step": 4460, "valid_targets_mean": 4775.8, "valid_targets_min": 581 }, { "epoch": 6.837672281776417, "grad_norm": 0.52961697008991, "learning_rate": 6.675873916651032e-08, "loss": 0.1587, "loss_nan_ranks": 0, "loss_rank_avg": 0.17023101449012756, "step": 4465, "valid_targets_mean": 4687.8, "valid_targets_min": 619 }, { "epoch": 6.845329249617151, "grad_norm": 0.49808821468991554, "learning_rate": 6.066846142343208e-08, "loss": 0.1562, "loss_nan_ranks": 0, "loss_rank_avg": 0.15167677402496338, "step": 4470, "valid_targets_mean": 4647.4, "valid_targets_min": 689 }, { "epoch": 6.852986217457887, "grad_norm": 0.5002402449999928, "learning_rate": 5.4869009125677606e-08, "loss": 0.1577, "loss_nan_ranks": 0, "loss_rank_avg": 0.16921664774417877, "step": 4475, "valid_targets_mean": 5446.4, "valid_targets_min": 801 }, { "epoch": 6.860643185298621, "grad_norm": 0.49397088265179795, "learning_rate": 4.936046686125018e-08, "loss": 0.1558, "loss_nan_ranks": 0, "loss_rank_avg": 0.18386386334896088, "step": 4480, "valid_targets_mean": 5190.6, "valid_targets_min": 1004 }, { "epoch": 6.868300153139357, "grad_norm": 0.4374868435323064, "learning_rate": 4.414291497508494e-08, "loss": 0.1614, "loss_nan_ranks": 0, "loss_rank_avg": 0.12061470746994019, "step": 4485, "valid_targets_mean": 5660.0, "valid_targets_min": 747 }, { "epoch": 6.875957120980092, "grad_norm": 0.46344991151869086, "learning_rate": 3.921642956786764e-08, "loss": 0.1526, "loss_nan_ranks": 0, "loss_rank_avg": 0.15344613790512085, "step": 4490, "valid_targets_mean": 5533.7, "valid_targets_min": 1023 }, { "epoch": 6.883614088820827, "grad_norm": 0.5499673381962632, "learning_rate": 3.4581082494933306e-08, "loss": 0.1378, "loss_nan_ranks": 0, "loss_rank_avg": 0.1682521402835846, "step": 4495, "valid_targets_mean": 5424.2, "valid_targets_min": 680 }, { "epoch": 6.891271056661562, "grad_norm": 0.5661611699091585, "learning_rate": 3.023694136521149e-08, "loss": 0.1537, "loss_nan_ranks": 0, "loss_rank_avg": 0.19145449995994568, "step": 4500, "valid_targets_mean": 5180.9, "valid_targets_min": 901 }, { "epoch": 6.898928024502297, "grad_norm": 0.5138739009042879, "learning_rate": 2.6184069540244883e-08, "loss": 0.1493, "loss_nan_ranks": 0, "loss_rank_avg": 0.1396559178829193, "step": 4505, "valid_targets_mean": 4953.2, "valid_targets_min": 571 }, { "epoch": 6.906584992343032, "grad_norm": 0.4734940775508067, "learning_rate": 2.2422526133258905e-08, "loss": 0.1566, "loss_nan_ranks": 0, "loss_rank_avg": 0.1580895334482193, "step": 4510, "valid_targets_mean": 5021.9, "valid_targets_min": 576 }, { "epoch": 6.914241960183768, "grad_norm": 0.4706534435530353, "learning_rate": 1.8952366008309076e-08, "loss": 0.1721, "loss_nan_ranks": 0, "loss_rank_avg": 0.1342153698205948, "step": 4515, "valid_targets_mean": 5286.7, "valid_targets_min": 2509 }, { "epoch": 6.921898928024502, "grad_norm": 0.48739925177110227, "learning_rate": 1.5773639779470552e-08, "loss": 0.1599, "loss_nan_ranks": 0, "loss_rank_avg": 0.1816117912530899, "step": 4520, "valid_targets_mean": 5406.6, "valid_targets_min": 975 }, { "epoch": 6.929555895865238, "grad_norm": 0.5208874030422277, "learning_rate": 1.288639381010759e-08, "loss": 0.1542, "loss_nan_ranks": 0, "loss_rank_avg": 0.15851663053035736, "step": 4525, "valid_targets_mean": 4442.0, "valid_targets_min": 763 }, { "epoch": 6.937212863705972, "grad_norm": 0.48457417601240316, "learning_rate": 1.0290670212191878e-08, "loss": 0.152, "loss_nan_ranks": 0, "loss_rank_avg": 0.165914848446846, "step": 4530, "valid_targets_mean": 4708.8, "valid_targets_min": 345 }, { "epoch": 6.944869831546708, "grad_norm": 0.4583395498556372, "learning_rate": 7.986506845696351e-09, "loss": 0.1599, "loss_nan_ranks": 0, "loss_rank_avg": 0.13576406240463257, "step": 4535, "valid_targets_mean": 4882.4, "valid_targets_min": 495 }, { "epoch": 6.952526799387442, "grad_norm": 0.5546301713936433, "learning_rate": 5.973937318028977e-09, "loss": 0.1567, "loss_nan_ranks": 0, "loss_rank_avg": 0.17114219069480896, "step": 4540, "valid_targets_mean": 4222.1, "valid_targets_min": 291 }, { "epoch": 6.960183767228178, "grad_norm": 0.4983059823209655, "learning_rate": 4.2529909835553604e-09, "loss": 0.1405, "loss_nan_ranks": 0, "loss_rank_avg": 0.13904789090156555, "step": 4545, "valid_targets_mean": 4797.2, "valid_targets_min": 803 }, { "epoch": 6.967840735068913, "grad_norm": 0.45715360287978724, "learning_rate": 2.8236929431701975e-09, "loss": 0.1495, "loss_nan_ranks": 0, "loss_rank_avg": 0.15358659625053406, "step": 4550, "valid_targets_mean": 6263.0, "valid_targets_min": 3534 }, { "epoch": 6.975497702909648, "grad_norm": 0.48704332473921397, "learning_rate": 1.6860640439197995e-09, "loss": 0.1583, "loss_nan_ranks": 0, "loss_rank_avg": 0.14753298461437225, "step": 4555, "valid_targets_mean": 4750.9, "valid_targets_min": 792 }, { "epoch": 6.983154670750383, "grad_norm": 0.6282723983499863, "learning_rate": 8.401208787112147e-10, "loss": 0.1647, "loss_nan_ranks": 0, "loss_rank_avg": 0.16771043837070465, "step": 4560, "valid_targets_mean": 4766.7, "valid_targets_min": 680 }, { "epoch": 6.990811638591118, "grad_norm": 0.49667792484401724, "learning_rate": 2.858757860590977e-10, "loss": 0.1633, "loss_nan_ranks": 0, "loss_rank_avg": 0.1469840109348297, "step": 4565, "valid_targets_mean": 4585.7, "valid_targets_min": 648 }, { "epoch": 6.998468606431853, "grad_norm": 0.5186330018791039, "learning_rate": 2.3336849919175508e-11, "loss": 0.1821, "loss_nan_ranks": 0, "loss_rank_avg": 0.18415594100952148, "step": 4570, "valid_targets_mean": 5133.5, "valid_targets_min": 1042 }, { "epoch": 7.0, "loss_nan_ranks": 0, "loss_rank_avg": 0.15374836325645447, "step": 4571, "total_flos": 2281086641373184.0, "train_loss": 0.20197117474362877, "train_runtime": 35007.247, "train_samples_per_second": 2.086, "train_steps_per_second": 0.131, "valid_targets_mean": 5963.9, "valid_targets_min": 640 } ], "logging_steps": 5, "max_steps": 4571, "num_input_tokens_seen": 0, "num_train_epochs": 7, "save_steps": 1500, "stateful_callbacks": { "TrainerControl": { "args": { "should_epoch_stop": false, "should_evaluate": false, "should_log": false, "should_save": true, "should_training_stop": true }, "attributes": {} } }, "total_flos": 2281086641373184.0, "train_batch_size": 1, "trial_name": null, "trial_params": null }