{ "best_global_step": null, "best_metric": null, "best_model_checkpoint": null, "epoch": 7.0, "eval_steps": 500, "global_step": 4872, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.007189072609633357, "grad_norm": 20.573642478850733, "learning_rate": 3.278688524590164e-07, "loss": 0.8805, "loss_nan_ranks": 0, "loss_rank_avg": 0.3877447843551636, "step": 5, "valid_targets_mean": 3123.6, "valid_targets_min": 486 }, { "epoch": 0.014378145219266714, "grad_norm": 23.534982518621135, "learning_rate": 7.377049180327869e-07, "loss": 0.8809, "loss_nan_ranks": 0, "loss_rank_avg": 0.46912896633148193, "step": 10, "valid_targets_mean": 3414.8, "valid_targets_min": 528 }, { "epoch": 0.021567217828900073, "grad_norm": 24.164733243587904, "learning_rate": 1.1475409836065575e-06, "loss": 0.87, "loss_nan_ranks": 0, "loss_rank_avg": 0.39718469977378845, "step": 15, "valid_targets_mean": 4687.1, "valid_targets_min": 572 }, { "epoch": 0.02875629043853343, "grad_norm": 15.447184493591537, "learning_rate": 1.557377049180328e-06, "loss": 0.8027, "loss_nan_ranks": 0, "loss_rank_avg": 0.35776641964912415, "step": 20, "valid_targets_mean": 3202.1, "valid_targets_min": 616 }, { "epoch": 0.035945363048166784, "grad_norm": 9.664768453884538, "learning_rate": 1.9672131147540985e-06, "loss": 0.7594, "loss_nan_ranks": 0, "loss_rank_avg": 0.41083261370658875, "step": 25, "valid_targets_mean": 3431.6, "valid_targets_min": 640 }, { "epoch": 0.043134435657800146, "grad_norm": 5.254693135892583, "learning_rate": 2.377049180327869e-06, "loss": 0.6731, "loss_nan_ranks": 0, "loss_rank_avg": 0.23213350772857666, "step": 30, "valid_targets_mean": 3386.2, "valid_targets_min": 711 }, { "epoch": 0.0503235082674335, "grad_norm": 3.298015416368021, "learning_rate": 2.786885245901639e-06, "loss": 0.6337, "loss_nan_ranks": 0, "loss_rank_avg": 0.3576735854148865, "step": 35, "valid_targets_mean": 3571.2, "valid_targets_min": 867 }, { "epoch": 0.05751258087706686, "grad_norm": 2.2393410140351944, "learning_rate": 3.1967213114754105e-06, "loss": 0.6398, "loss_nan_ranks": 0, "loss_rank_avg": 0.3916738033294678, "step": 40, "valid_targets_mean": 3223.5, "valid_targets_min": 604 }, { "epoch": 0.06470165348670022, "grad_norm": 1.5520759530652233, "learning_rate": 3.6065573770491806e-06, "loss": 0.5755, "loss_nan_ranks": 0, "loss_rank_avg": 0.267872154712677, "step": 45, "valid_targets_mean": 3251.4, "valid_targets_min": 735 }, { "epoch": 0.07189072609633357, "grad_norm": 1.5311865640065894, "learning_rate": 4.016393442622951e-06, "loss": 0.5943, "loss_nan_ranks": 0, "loss_rank_avg": 0.32756370306015015, "step": 50, "valid_targets_mean": 4207.4, "valid_targets_min": 566 }, { "epoch": 0.07907979870596693, "grad_norm": 1.0685857284108062, "learning_rate": 4.426229508196722e-06, "loss": 0.562, "loss_nan_ranks": 0, "loss_rank_avg": 0.24649468064308167, "step": 55, "valid_targets_mean": 3997.9, "valid_targets_min": 557 }, { "epoch": 0.08626887131560029, "grad_norm": 0.9461006126567058, "learning_rate": 4.836065573770492e-06, "loss": 0.5413, "loss_nan_ranks": 0, "loss_rank_avg": 0.2554165720939636, "step": 60, "valid_targets_mean": 4351.4, "valid_targets_min": 974 }, { "epoch": 0.09345794392523364, "grad_norm": 0.8074203824966353, "learning_rate": 5.245901639344263e-06, "loss": 0.5373, "loss_nan_ranks": 0, "loss_rank_avg": 0.20570573210716248, "step": 65, "valid_targets_mean": 3216.0, "valid_targets_min": 569 }, { "epoch": 0.100647016534867, "grad_norm": 0.864406247661593, "learning_rate": 5.655737704918033e-06, "loss": 0.5013, "loss_nan_ranks": 0, "loss_rank_avg": 0.26434096693992615, "step": 70, "valid_targets_mean": 3315.5, "valid_targets_min": 466 }, { "epoch": 0.10783608914450037, "grad_norm": 0.8551627943262912, "learning_rate": 6.065573770491804e-06, "loss": 0.4944, "loss_nan_ranks": 0, "loss_rank_avg": 0.24443431198596954, "step": 75, "valid_targets_mean": 2707.8, "valid_targets_min": 580 }, { "epoch": 0.11502516175413371, "grad_norm": 0.8588233832507804, "learning_rate": 6.475409836065575e-06, "loss": 0.4966, "loss_nan_ranks": 0, "loss_rank_avg": 0.24194490909576416, "step": 80, "valid_targets_mean": 2786.4, "valid_targets_min": 653 }, { "epoch": 0.12221423436376708, "grad_norm": 0.6257850424268222, "learning_rate": 6.885245901639345e-06, "loss": 0.4667, "loss_nan_ranks": 0, "loss_rank_avg": 0.21724802255630493, "step": 85, "valid_targets_mean": 4494.2, "valid_targets_min": 773 }, { "epoch": 0.12940330697340044, "grad_norm": 0.8358272469336914, "learning_rate": 7.295081967213115e-06, "loss": 0.4568, "loss_nan_ranks": 0, "loss_rank_avg": 0.27527081966400146, "step": 90, "valid_targets_mean": 2980.9, "valid_targets_min": 639 }, { "epoch": 0.1365923795830338, "grad_norm": 0.65329510451641, "learning_rate": 7.704918032786886e-06, "loss": 0.4659, "loss_nan_ranks": 0, "loss_rank_avg": 0.2408151626586914, "step": 95, "valid_targets_mean": 4151.5, "valid_targets_min": 777 }, { "epoch": 0.14378145219266714, "grad_norm": 0.7011088331824381, "learning_rate": 8.114754098360657e-06, "loss": 0.4525, "loss_nan_ranks": 0, "loss_rank_avg": 0.20888058841228485, "step": 100, "valid_targets_mean": 3260.6, "valid_targets_min": 509 }, { "epoch": 0.1509705248023005, "grad_norm": 0.6314975069994072, "learning_rate": 8.524590163934427e-06, "loss": 0.431, "loss_nan_ranks": 0, "loss_rank_avg": 0.18482504785060883, "step": 105, "valid_targets_mean": 3340.9, "valid_targets_min": 286 }, { "epoch": 0.15815959741193386, "grad_norm": 0.6827616460242438, "learning_rate": 8.934426229508197e-06, "loss": 0.4346, "loss_nan_ranks": 0, "loss_rank_avg": 0.2140287458896637, "step": 110, "valid_targets_mean": 3119.0, "valid_targets_min": 621 }, { "epoch": 0.16534867002156722, "grad_norm": 0.6892155095210419, "learning_rate": 9.344262295081968e-06, "loss": 0.4294, "loss_nan_ranks": 0, "loss_rank_avg": 0.17718997597694397, "step": 115, "valid_targets_mean": 2981.2, "valid_targets_min": 359 }, { "epoch": 0.17253774263120059, "grad_norm": 0.6184317431223036, "learning_rate": 9.754098360655738e-06, "loss": 0.4188, "loss_nan_ranks": 0, "loss_rank_avg": 0.19387683272361755, "step": 120, "valid_targets_mean": 3474.8, "valid_targets_min": 368 }, { "epoch": 0.17972681524083392, "grad_norm": 0.713134279760954, "learning_rate": 1.0163934426229509e-05, "loss": 0.4329, "loss_nan_ranks": 0, "loss_rank_avg": 0.26430848240852356, "step": 125, "valid_targets_mean": 3852.6, "valid_targets_min": 597 }, { "epoch": 0.18691588785046728, "grad_norm": 0.6130847433392762, "learning_rate": 1.0573770491803279e-05, "loss": 0.4123, "loss_nan_ranks": 0, "loss_rank_avg": 0.211105078458786, "step": 130, "valid_targets_mean": 4527.5, "valid_targets_min": 985 }, { "epoch": 0.19410496046010065, "grad_norm": 0.6406368473479827, "learning_rate": 1.0983606557377052e-05, "loss": 0.4021, "loss_nan_ranks": 0, "loss_rank_avg": 0.1940620243549347, "step": 135, "valid_targets_mean": 3756.5, "valid_targets_min": 779 }, { "epoch": 0.201294033069734, "grad_norm": 0.6589114143141694, "learning_rate": 1.1393442622950821e-05, "loss": 0.3855, "loss_nan_ranks": 0, "loss_rank_avg": 0.18273743987083435, "step": 140, "valid_targets_mean": 4232.9, "valid_targets_min": 3231 }, { "epoch": 0.20848310567936737, "grad_norm": 0.7140798654127781, "learning_rate": 1.1803278688524591e-05, "loss": 0.399, "loss_nan_ranks": 0, "loss_rank_avg": 0.22288499772548676, "step": 145, "valid_targets_mean": 4247.5, "valid_targets_min": 805 }, { "epoch": 0.21567217828900073, "grad_norm": 0.6264015086815747, "learning_rate": 1.221311475409836e-05, "loss": 0.4161, "loss_nan_ranks": 0, "loss_rank_avg": 0.2211969941854477, "step": 150, "valid_targets_mean": 4673.0, "valid_targets_min": 1091 }, { "epoch": 0.22286125089863407, "grad_norm": 0.6162894585137502, "learning_rate": 1.2622950819672132e-05, "loss": 0.3902, "loss_nan_ranks": 0, "loss_rank_avg": 0.20758062601089478, "step": 155, "valid_targets_mean": 4587.4, "valid_targets_min": 4059 }, { "epoch": 0.23005032350826743, "grad_norm": 0.7212307073246284, "learning_rate": 1.3032786885245904e-05, "loss": 0.3889, "loss_nan_ranks": 0, "loss_rank_avg": 0.1758236587047577, "step": 160, "valid_targets_mean": 3042.4, "valid_targets_min": 761 }, { "epoch": 0.2372393961179008, "grad_norm": 0.680625458237956, "learning_rate": 1.3442622950819673e-05, "loss": 0.3782, "loss_nan_ranks": 0, "loss_rank_avg": 0.18720507621765137, "step": 165, "valid_targets_mean": 3616.2, "valid_targets_min": 509 }, { "epoch": 0.24442846872753415, "grad_norm": 0.7144132390270651, "learning_rate": 1.3852459016393445e-05, "loss": 0.3709, "loss_nan_ranks": 0, "loss_rank_avg": 0.16533072292804718, "step": 170, "valid_targets_mean": 2691.1, "valid_targets_min": 489 }, { "epoch": 0.2516175413371675, "grad_norm": 0.7023635269438706, "learning_rate": 1.4262295081967214e-05, "loss": 0.3832, "loss_nan_ranks": 0, "loss_rank_avg": 0.2062736600637436, "step": 175, "valid_targets_mean": 4041.8, "valid_targets_min": 523 }, { "epoch": 0.2588066139468009, "grad_norm": 0.6519958114973764, "learning_rate": 1.4672131147540984e-05, "loss": 0.3795, "loss_nan_ranks": 0, "loss_rank_avg": 0.1904088258743286, "step": 180, "valid_targets_mean": 4690.5, "valid_targets_min": 642 }, { "epoch": 0.26599568655643424, "grad_norm": 0.803127069107535, "learning_rate": 1.5081967213114754e-05, "loss": 0.3747, "loss_nan_ranks": 0, "loss_rank_avg": 0.19250091910362244, "step": 185, "valid_targets_mean": 3694.6, "valid_targets_min": 622 }, { "epoch": 0.2731847591660676, "grad_norm": 0.6524842255260931, "learning_rate": 1.5491803278688525e-05, "loss": 0.3738, "loss_nan_ranks": 0, "loss_rank_avg": 0.14555513858795166, "step": 190, "valid_targets_mean": 3740.8, "valid_targets_min": 556 }, { "epoch": 0.2803738317757009, "grad_norm": 0.7353147851076066, "learning_rate": 1.5901639344262295e-05, "loss": 0.3709, "loss_nan_ranks": 0, "loss_rank_avg": 0.18715769052505493, "step": 195, "valid_targets_mean": 3398.0, "valid_targets_min": 545 }, { "epoch": 0.2875629043853343, "grad_norm": 0.699110190722482, "learning_rate": 1.6311475409836068e-05, "loss": 0.3718, "loss_nan_ranks": 0, "loss_rank_avg": 0.19545572996139526, "step": 200, "valid_targets_mean": 3607.5, "valid_targets_min": 568 }, { "epoch": 0.29475197699496763, "grad_norm": 1.1808205066742428, "learning_rate": 1.6721311475409837e-05, "loss": 0.3679, "loss_nan_ranks": 0, "loss_rank_avg": 0.16610263288021088, "step": 205, "valid_targets_mean": 3263.6, "valid_targets_min": 636 }, { "epoch": 0.301941049604601, "grad_norm": 0.6397168520175814, "learning_rate": 1.7131147540983607e-05, "loss": 0.3627, "loss_nan_ranks": 0, "loss_rank_avg": 0.19341236352920532, "step": 210, "valid_targets_mean": 3819.5, "valid_targets_min": 852 }, { "epoch": 0.30913012221423436, "grad_norm": 0.6379639056463705, "learning_rate": 1.7540983606557377e-05, "loss": 0.3826, "loss_nan_ranks": 0, "loss_rank_avg": 0.17195996642112732, "step": 215, "valid_targets_mean": 3233.1, "valid_targets_min": 500 }, { "epoch": 0.3163191948238677, "grad_norm": 0.5942179551543917, "learning_rate": 1.795081967213115e-05, "loss": 0.3577, "loss_nan_ranks": 0, "loss_rank_avg": 0.16106751561164856, "step": 220, "valid_targets_mean": 4271.6, "valid_targets_min": 601 }, { "epoch": 0.3235082674335011, "grad_norm": 0.826034647461399, "learning_rate": 1.836065573770492e-05, "loss": 0.3718, "loss_nan_ranks": 0, "loss_rank_avg": 0.17342892289161682, "step": 225, "valid_targets_mean": 3681.0, "valid_targets_min": 813 }, { "epoch": 0.33069734004313445, "grad_norm": 0.8058653706281842, "learning_rate": 1.877049180327869e-05, "loss": 0.3666, "loss_nan_ranks": 0, "loss_rank_avg": 0.1488562822341919, "step": 230, "valid_targets_mean": 3804.8, "valid_targets_min": 648 }, { "epoch": 0.3378864126527678, "grad_norm": 0.6344857788769837, "learning_rate": 1.918032786885246e-05, "loss": 0.3629, "loss_nan_ranks": 0, "loss_rank_avg": 0.1404256522655487, "step": 235, "valid_targets_mean": 3125.4, "valid_targets_min": 617 }, { "epoch": 0.34507548526240117, "grad_norm": 0.6434328742127456, "learning_rate": 1.9590163934426232e-05, "loss": 0.3646, "loss_nan_ranks": 0, "loss_rank_avg": 0.13383261859416962, "step": 240, "valid_targets_mean": 2855.4, "valid_targets_min": 630 }, { "epoch": 0.35226455787203453, "grad_norm": 0.7064545774971568, "learning_rate": 2e-05, "loss": 0.3478, "loss_nan_ranks": 0, "loss_rank_avg": 0.14416509866714478, "step": 245, "valid_targets_mean": 2471.6, "valid_targets_min": 556 }, { "epoch": 0.35945363048166784, "grad_norm": 0.6931492333324353, "learning_rate": 2.040983606557377e-05, "loss": 0.3472, "loss_nan_ranks": 0, "loss_rank_avg": 0.1825331151485443, "step": 250, "valid_targets_mean": 4504.8, "valid_targets_min": 3506 }, { "epoch": 0.3666427030913012, "grad_norm": 0.657195768961274, "learning_rate": 2.081967213114754e-05, "loss": 0.3502, "loss_nan_ranks": 0, "loss_rank_avg": 0.2167544960975647, "step": 255, "valid_targets_mean": 4500.5, "valid_targets_min": 894 }, { "epoch": 0.37383177570093457, "grad_norm": 0.6384973135842494, "learning_rate": 2.122950819672131e-05, "loss": 0.3417, "loss_nan_ranks": 0, "loss_rank_avg": 0.17248007655143738, "step": 260, "valid_targets_mean": 4212.5, "valid_targets_min": 829 }, { "epoch": 0.38102084831056793, "grad_norm": 0.7144789700157379, "learning_rate": 2.1639344262295087e-05, "loss": 0.3607, "loss_nan_ranks": 0, "loss_rank_avg": 0.16193635761737823, "step": 265, "valid_targets_mean": 2716.9, "valid_targets_min": 593 }, { "epoch": 0.3882099209202013, "grad_norm": 0.598654567786524, "learning_rate": 2.2049180327868857e-05, "loss": 0.3483, "loss_nan_ranks": 0, "loss_rank_avg": 0.1530938744544983, "step": 270, "valid_targets_mean": 4164.4, "valid_targets_min": 865 }, { "epoch": 0.39539899352983465, "grad_norm": 0.6904258025944402, "learning_rate": 2.2459016393442626e-05, "loss": 0.3401, "loss_nan_ranks": 0, "loss_rank_avg": 0.17960868775844574, "step": 275, "valid_targets_mean": 4070.1, "valid_targets_min": 740 }, { "epoch": 0.402588066139468, "grad_norm": 0.6894409028737439, "learning_rate": 2.2868852459016396e-05, "loss": 0.359, "loss_nan_ranks": 0, "loss_rank_avg": 0.1807325780391693, "step": 280, "valid_targets_mean": 4034.6, "valid_targets_min": 845 }, { "epoch": 0.4097771387491014, "grad_norm": 0.6802842259041161, "learning_rate": 2.3278688524590166e-05, "loss": 0.3517, "loss_nan_ranks": 0, "loss_rank_avg": 0.1755760908126831, "step": 285, "valid_targets_mean": 4237.8, "valid_targets_min": 462 }, { "epoch": 0.41696621135873474, "grad_norm": 0.7153194015500277, "learning_rate": 2.3688524590163936e-05, "loss": 0.3377, "loss_nan_ranks": 0, "loss_rank_avg": 0.14597834646701813, "step": 290, "valid_targets_mean": 3897.8, "valid_targets_min": 762 }, { "epoch": 0.4241552839683681, "grad_norm": 0.626280930870836, "learning_rate": 2.4098360655737705e-05, "loss": 0.3368, "loss_nan_ranks": 0, "loss_rank_avg": 0.1872946321964264, "step": 295, "valid_targets_mean": 4110.1, "valid_targets_min": 723 }, { "epoch": 0.43134435657800146, "grad_norm": 0.6413132226933951, "learning_rate": 2.4508196721311478e-05, "loss": 0.3494, "loss_nan_ranks": 0, "loss_rank_avg": 0.21533772349357605, "step": 300, "valid_targets_mean": 4881.5, "valid_targets_min": 3844 }, { "epoch": 0.43853342918763477, "grad_norm": 0.6984612265778307, "learning_rate": 2.4918032786885248e-05, "loss": 0.3395, "loss_nan_ranks": 0, "loss_rank_avg": 0.20868580043315887, "step": 305, "valid_targets_mean": 3898.6, "valid_targets_min": 769 }, { "epoch": 0.44572250179726813, "grad_norm": 0.6522216187873998, "learning_rate": 2.5327868852459018e-05, "loss": 0.3455, "loss_nan_ranks": 0, "loss_rank_avg": 0.19474999606609344, "step": 310, "valid_targets_mean": 4632.5, "valid_targets_min": 450 }, { "epoch": 0.4529115744069015, "grad_norm": 0.7149143783713475, "learning_rate": 2.5737704918032787e-05, "loss": 0.3323, "loss_nan_ranks": 0, "loss_rank_avg": 0.14127987623214722, "step": 315, "valid_targets_mean": 3658.1, "valid_targets_min": 760 }, { "epoch": 0.46010064701653486, "grad_norm": 0.7290870789351198, "learning_rate": 2.6147540983606557e-05, "loss": 0.363, "loss_nan_ranks": 0, "loss_rank_avg": 0.2236519455909729, "step": 320, "valid_targets_mean": 3496.0, "valid_targets_min": 764 }, { "epoch": 0.4672897196261682, "grad_norm": 0.8173532165490279, "learning_rate": 2.655737704918033e-05, "loss": 0.3511, "loss_nan_ranks": 0, "loss_rank_avg": 0.22370921075344086, "step": 325, "valid_targets_mean": 2928.8, "valid_targets_min": 587 }, { "epoch": 0.4744787922358016, "grad_norm": 0.6390755149026872, "learning_rate": 2.6967213114754103e-05, "loss": 0.3314, "loss_nan_ranks": 0, "loss_rank_avg": 0.17742975056171417, "step": 330, "valid_targets_mean": 4116.4, "valid_targets_min": 744 }, { "epoch": 0.48166786484543495, "grad_norm": 0.7504325873347869, "learning_rate": 2.7377049180327873e-05, "loss": 0.3504, "loss_nan_ranks": 0, "loss_rank_avg": 0.19246351718902588, "step": 335, "valid_targets_mean": 4115.6, "valid_targets_min": 504 }, { "epoch": 0.4888569374550683, "grad_norm": 0.6918553039170531, "learning_rate": 2.7786885245901642e-05, "loss": 0.3402, "loss_nan_ranks": 0, "loss_rank_avg": 0.16972219944000244, "step": 340, "valid_targets_mean": 4123.5, "valid_targets_min": 647 }, { "epoch": 0.49604601006470167, "grad_norm": 0.8450381784807004, "learning_rate": 2.8196721311475412e-05, "loss": 0.3433, "loss_nan_ranks": 0, "loss_rank_avg": 0.13487985730171204, "step": 345, "valid_targets_mean": 2433.0, "valid_targets_min": 307 }, { "epoch": 0.503235082674335, "grad_norm": 0.6459380214431669, "learning_rate": 2.8606557377049182e-05, "loss": 0.3689, "loss_nan_ranks": 0, "loss_rank_avg": 0.15826758742332458, "step": 350, "valid_targets_mean": 4429.6, "valid_targets_min": 542 }, { "epoch": 0.5104241552839683, "grad_norm": 0.6500752629382867, "learning_rate": 2.901639344262295e-05, "loss": 0.3305, "loss_nan_ranks": 0, "loss_rank_avg": 0.1564514935016632, "step": 355, "valid_targets_mean": 4117.2, "valid_targets_min": 520 }, { "epoch": 0.5176132278936018, "grad_norm": 0.599014418508955, "learning_rate": 2.942622950819672e-05, "loss": 0.339, "loss_nan_ranks": 0, "loss_rank_avg": 0.1816200613975525, "step": 360, "valid_targets_mean": 4451.4, "valid_targets_min": 238 }, { "epoch": 0.5248023005032351, "grad_norm": 0.7406430431356334, "learning_rate": 2.9836065573770498e-05, "loss": 0.3437, "loss_nan_ranks": 0, "loss_rank_avg": 0.23748645186424255, "step": 365, "valid_targets_mean": 4112.0, "valid_targets_min": 624 }, { "epoch": 0.5319913731128685, "grad_norm": 0.7126978990023, "learning_rate": 3.0245901639344267e-05, "loss": 0.3289, "loss_nan_ranks": 0, "loss_rank_avg": 0.1286466419696808, "step": 370, "valid_targets_mean": 3026.0, "valid_targets_min": 524 }, { "epoch": 0.5391804457225018, "grad_norm": 0.6742826194350676, "learning_rate": 3.065573770491804e-05, "loss": 0.3315, "loss_nan_ranks": 0, "loss_rank_avg": 0.14347417652606964, "step": 375, "valid_targets_mean": 3989.8, "valid_targets_min": 767 }, { "epoch": 0.5463695183321352, "grad_norm": 0.6286067545561252, "learning_rate": 3.106557377049181e-05, "loss": 0.3468, "loss_nan_ranks": 0, "loss_rank_avg": 0.17555642127990723, "step": 380, "valid_targets_mean": 4182.5, "valid_targets_min": 878 }, { "epoch": 0.5535585909417685, "grad_norm": 0.6903987730789588, "learning_rate": 3.1475409836065576e-05, "loss": 0.3449, "loss_nan_ranks": 0, "loss_rank_avg": 0.19024711847305298, "step": 385, "valid_targets_mean": 3651.9, "valid_targets_min": 709 }, { "epoch": 0.5607476635514018, "grad_norm": 0.6375843615935716, "learning_rate": 3.1885245901639346e-05, "loss": 0.3275, "loss_nan_ranks": 0, "loss_rank_avg": 0.14437010884284973, "step": 390, "valid_targets_mean": 3916.0, "valid_targets_min": 572 }, { "epoch": 0.5679367361610352, "grad_norm": 0.7053727765954131, "learning_rate": 3.2295081967213116e-05, "loss": 0.3426, "loss_nan_ranks": 0, "loss_rank_avg": 0.1976805031299591, "step": 395, "valid_targets_mean": 4752.4, "valid_targets_min": 652 }, { "epoch": 0.5751258087706685, "grad_norm": 0.8072569984620446, "learning_rate": 3.270491803278689e-05, "loss": 0.3325, "loss_nan_ranks": 0, "loss_rank_avg": 0.19607961177825928, "step": 400, "valid_targets_mean": 3763.6, "valid_targets_min": 828 }, { "epoch": 0.582314881380302, "grad_norm": 0.6106476152608095, "learning_rate": 3.311475409836066e-05, "loss": 0.333, "loss_nan_ranks": 0, "loss_rank_avg": 0.13127343356609344, "step": 405, "valid_targets_mean": 3272.8, "valid_targets_min": 377 }, { "epoch": 0.5895039539899353, "grad_norm": 0.6482116985826718, "learning_rate": 3.352459016393443e-05, "loss": 0.3308, "loss_nan_ranks": 0, "loss_rank_avg": 0.12706303596496582, "step": 410, "valid_targets_mean": 3338.0, "valid_targets_min": 742 }, { "epoch": 0.5966930265995687, "grad_norm": 0.6632153860197335, "learning_rate": 3.39344262295082e-05, "loss": 0.33, "loss_nan_ranks": 0, "loss_rank_avg": 0.21092239022254944, "step": 415, "valid_targets_mean": 4265.2, "valid_targets_min": 405 }, { "epoch": 0.603882099209202, "grad_norm": 0.7713246956378941, "learning_rate": 3.434426229508197e-05, "loss": 0.3262, "loss_nan_ranks": 0, "loss_rank_avg": 0.19024214148521423, "step": 420, "valid_targets_mean": 3687.9, "valid_targets_min": 314 }, { "epoch": 0.6110711718188354, "grad_norm": 0.6573267560100432, "learning_rate": 3.475409836065574e-05, "loss": 0.3263, "loss_nan_ranks": 0, "loss_rank_avg": 0.21130415797233582, "step": 425, "valid_targets_mean": 4377.6, "valid_targets_min": 879 }, { "epoch": 0.6182602444284687, "grad_norm": 0.7418379210193793, "learning_rate": 3.516393442622951e-05, "loss": 0.3249, "loss_nan_ranks": 0, "loss_rank_avg": 0.14313599467277527, "step": 430, "valid_targets_mean": 2593.2, "valid_targets_min": 499 }, { "epoch": 0.6254493170381021, "grad_norm": 0.7328316064174966, "learning_rate": 3.557377049180329e-05, "loss": 0.3475, "loss_nan_ranks": 0, "loss_rank_avg": 0.20951959490776062, "step": 435, "valid_targets_mean": 3922.9, "valid_targets_min": 599 }, { "epoch": 0.6326383896477354, "grad_norm": 0.6249361811748065, "learning_rate": 3.5983606557377056e-05, "loss": 0.3352, "loss_nan_ranks": 0, "loss_rank_avg": 0.14408886432647705, "step": 440, "valid_targets_mean": 3574.6, "valid_targets_min": 221 }, { "epoch": 0.6398274622573688, "grad_norm": 0.570165396935894, "learning_rate": 3.6393442622950826e-05, "loss": 0.3395, "loss_nan_ranks": 0, "loss_rank_avg": 0.18353965878486633, "step": 445, "valid_targets_mean": 4853.2, "valid_targets_min": 1054 }, { "epoch": 0.6470165348670022, "grad_norm": 0.6538256952663059, "learning_rate": 3.6803278688524596e-05, "loss": 0.3163, "loss_nan_ranks": 0, "loss_rank_avg": 0.1699550598859787, "step": 450, "valid_targets_mean": 4320.8, "valid_targets_min": 2765 }, { "epoch": 0.6542056074766355, "grad_norm": 0.7548701580728006, "learning_rate": 3.7213114754098365e-05, "loss": 0.3269, "loss_nan_ranks": 0, "loss_rank_avg": 0.1741151511669159, "step": 455, "valid_targets_mean": 3483.0, "valid_targets_min": 674 }, { "epoch": 0.6613946800862689, "grad_norm": 0.6187130203116966, "learning_rate": 3.7622950819672135e-05, "loss": 0.3281, "loss_nan_ranks": 0, "loss_rank_avg": 0.1886174976825714, "step": 460, "valid_targets_mean": 4379.4, "valid_targets_min": 3644 }, { "epoch": 0.6685837526959022, "grad_norm": 0.6026210220029745, "learning_rate": 3.8032786885245905e-05, "loss": 0.321, "loss_nan_ranks": 0, "loss_rank_avg": 0.16248294711112976, "step": 465, "valid_targets_mean": 3981.2, "valid_targets_min": 768 }, { "epoch": 0.6757728253055356, "grad_norm": 0.5738755197300025, "learning_rate": 3.8442622950819674e-05, "loss": 0.3266, "loss_nan_ranks": 0, "loss_rank_avg": 0.1635032296180725, "step": 470, "valid_targets_mean": 3884.6, "valid_targets_min": 634 }, { "epoch": 0.6829618979151689, "grad_norm": 0.541333478441975, "learning_rate": 3.8852459016393444e-05, "loss": 0.3311, "loss_nan_ranks": 0, "loss_rank_avg": 0.1343890130519867, "step": 475, "valid_targets_mean": 3901.5, "valid_targets_min": 671 }, { "epoch": 0.6901509705248023, "grad_norm": 0.6297950944669213, "learning_rate": 3.9262295081967214e-05, "loss": 0.3312, "loss_nan_ranks": 0, "loss_rank_avg": 0.1319078505039215, "step": 480, "valid_targets_mean": 2984.2, "valid_targets_min": 421 }, { "epoch": 0.6973400431344356, "grad_norm": 0.6442069487231398, "learning_rate": 3.9672131147540983e-05, "loss": 0.316, "loss_nan_ranks": 0, "loss_rank_avg": 0.16742603480815887, "step": 485, "valid_targets_mean": 3123.9, "valid_targets_min": 601 }, { "epoch": 0.7045291157440691, "grad_norm": 0.5828680764992784, "learning_rate": 3.999999486478495e-05, "loss": 0.3384, "loss_nan_ranks": 0, "loss_rank_avg": 0.16095879673957825, "step": 490, "valid_targets_mean": 3849.0, "valid_targets_min": 911 }, { "epoch": 0.7117181883537024, "grad_norm": 0.727100638844294, "learning_rate": 3.999981513253493e-05, "loss": 0.3158, "loss_nan_ranks": 0, "loss_rank_avg": 0.1447129249572754, "step": 495, "valid_targets_mean": 2987.5, "valid_targets_min": 549 }, { "epoch": 0.7189072609633357, "grad_norm": 0.66368309677484, "learning_rate": 3.999937864216924e-05, "loss": 0.3161, "loss_nan_ranks": 0, "loss_rank_avg": 0.2023858278989792, "step": 500, "valid_targets_mean": 4051.2, "valid_targets_min": 862 }, { "epoch": 0.7260963335729691, "grad_norm": 0.6046587260631622, "learning_rate": 3.999868539929155e-05, "loss": 0.3126, "loss_nan_ranks": 0, "loss_rank_avg": 0.15529820322990417, "step": 505, "valid_targets_mean": 4291.5, "valid_targets_min": 735 }, { "epoch": 0.7332854061826024, "grad_norm": 0.6538819878012135, "learning_rate": 3.999773541280172e-05, "loss": 0.3166, "loss_nan_ranks": 0, "loss_rank_avg": 0.1858222782611847, "step": 510, "valid_targets_mean": 3583.4, "valid_targets_min": 785 }, { "epoch": 0.7404744787922358, "grad_norm": 0.5785423134923583, "learning_rate": 3.999652869489569e-05, "loss": 0.3046, "loss_nan_ranks": 0, "loss_rank_avg": 0.16107608377933502, "step": 515, "valid_targets_mean": 4236.2, "valid_targets_min": 838 }, { "epoch": 0.7476635514018691, "grad_norm": 0.6661760659117584, "learning_rate": 3.9995065261065356e-05, "loss": 0.3146, "loss_nan_ranks": 0, "loss_rank_avg": 0.17083489894866943, "step": 520, "valid_targets_mean": 3330.0, "valid_targets_min": 582 }, { "epoch": 0.7548526240115025, "grad_norm": 0.5814852024495063, "learning_rate": 3.9993345130098316e-05, "loss": 0.3134, "loss_nan_ranks": 0, "loss_rank_avg": 0.17902444303035736, "step": 525, "valid_targets_mean": 4703.5, "valid_targets_min": 575 }, { "epoch": 0.7620416966211359, "grad_norm": 0.7517015730135961, "learning_rate": 3.9991368324077635e-05, "loss": 0.3168, "loss_nan_ranks": 0, "loss_rank_avg": 0.15405789017677307, "step": 530, "valid_targets_mean": 2682.0, "valid_targets_min": 737 }, { "epoch": 0.7692307692307693, "grad_norm": 0.5665123479287115, "learning_rate": 3.998913486838161e-05, "loss": 0.32, "loss_nan_ranks": 0, "loss_rank_avg": 0.16368168592453003, "step": 535, "valid_targets_mean": 4069.4, "valid_targets_min": 736 }, { "epoch": 0.7764198418404026, "grad_norm": 0.6136339063989368, "learning_rate": 3.9986644791683404e-05, "loss": 0.3164, "loss_nan_ranks": 0, "loss_rank_avg": 0.1443198025226593, "step": 540, "valid_targets_mean": 3335.1, "valid_targets_min": 552 }, { "epoch": 0.783608914450036, "grad_norm": 0.5666189504479666, "learning_rate": 3.998389812595067e-05, "loss": 0.3161, "loss_nan_ranks": 0, "loss_rank_avg": 0.1655181646347046, "step": 545, "valid_targets_mean": 4019.6, "valid_targets_min": 691 }, { "epoch": 0.7907979870596693, "grad_norm": 0.6059954759818537, "learning_rate": 3.998089490644518e-05, "loss": 0.3115, "loss_nan_ranks": 0, "loss_rank_avg": 0.14678184688091278, "step": 550, "valid_targets_mean": 4046.4, "valid_targets_min": 965 }, { "epoch": 0.7979870596693026, "grad_norm": 0.6997466690052564, "learning_rate": 3.9977635171722334e-05, "loss": 0.3077, "loss_nan_ranks": 0, "loss_rank_avg": 0.18480221927165985, "step": 555, "valid_targets_mean": 3190.5, "valid_targets_min": 521 }, { "epoch": 0.805176132278936, "grad_norm": 0.6538968759183521, "learning_rate": 3.997411896363069e-05, "loss": 0.3133, "loss_nan_ranks": 0, "loss_rank_avg": 0.14448435604572296, "step": 560, "valid_targets_mean": 2742.0, "valid_targets_min": 577 }, { "epoch": 0.8123652048885693, "grad_norm": 0.6256037112502639, "learning_rate": 3.997034632731141e-05, "loss": 0.308, "loss_nan_ranks": 0, "loss_rank_avg": 0.16057893633842468, "step": 565, "valid_targets_mean": 3521.4, "valid_targets_min": 767 }, { "epoch": 0.8195542774982028, "grad_norm": 0.5840588259185012, "learning_rate": 3.9966317311197686e-05, "loss": 0.3129, "loss_nan_ranks": 0, "loss_rank_avg": 0.12496450543403625, "step": 570, "valid_targets_mean": 3774.1, "valid_targets_min": 939 }, { "epoch": 0.8267433501078361, "grad_norm": 0.5874137343327693, "learning_rate": 3.996203196701414e-05, "loss": 0.3174, "loss_nan_ranks": 0, "loss_rank_avg": 0.1374460607767105, "step": 575, "valid_targets_mean": 2572.0, "valid_targets_min": 582 }, { "epoch": 0.8339324227174695, "grad_norm": 0.5907503480926745, "learning_rate": 3.9957490349776114e-05, "loss": 0.3023, "loss_nan_ranks": 0, "loss_rank_avg": 0.14356018602848053, "step": 580, "valid_targets_mean": 3366.4, "valid_targets_min": 675 }, { "epoch": 0.8411214953271028, "grad_norm": 0.6733516990659187, "learning_rate": 3.9952692517789004e-05, "loss": 0.3111, "loss_nan_ranks": 0, "loss_rank_avg": 0.11857141554355621, "step": 585, "valid_targets_mean": 2340.8, "valid_targets_min": 528 }, { "epoch": 0.8483105679367362, "grad_norm": 0.5327001453074538, "learning_rate": 3.9947638532647495e-05, "loss": 0.3232, "loss_nan_ranks": 0, "loss_rank_avg": 0.09966681897640228, "step": 590, "valid_targets_mean": 2746.8, "valid_targets_min": 551 }, { "epoch": 0.8554996405463695, "grad_norm": 0.5572753499291244, "learning_rate": 3.994232845923477e-05, "loss": 0.3128, "loss_nan_ranks": 0, "loss_rank_avg": 0.21287260949611664, "step": 595, "valid_targets_mean": 5236.8, "valid_targets_min": 3550 }, { "epoch": 0.8626887131560029, "grad_norm": 0.6260309292514555, "learning_rate": 3.993676236572169e-05, "loss": 0.31, "loss_nan_ranks": 0, "loss_rank_avg": 0.1779523491859436, "step": 600, "valid_targets_mean": 3889.1, "valid_targets_min": 638 }, { "epoch": 0.8698777857656362, "grad_norm": 0.7575276187630292, "learning_rate": 3.9930940323565885e-05, "loss": 0.3329, "loss_nan_ranks": 0, "loss_rank_avg": 0.13865935802459717, "step": 605, "valid_targets_mean": 1711.0, "valid_targets_min": 468 }, { "epoch": 0.8770668583752695, "grad_norm": 0.5771116052061334, "learning_rate": 3.992486240751088e-05, "loss": 0.3137, "loss_nan_ranks": 0, "loss_rank_avg": 0.1751812994480133, "step": 610, "valid_targets_mean": 4495.6, "valid_targets_min": 859 }, { "epoch": 0.884255930984903, "grad_norm": 0.569118648358242, "learning_rate": 3.991852869558512e-05, "loss": 0.3095, "loss_nan_ranks": 0, "loss_rank_avg": 0.15517261624336243, "step": 615, "valid_targets_mean": 3612.4, "valid_targets_min": 766 }, { "epoch": 0.8914450035945363, "grad_norm": 0.5972077897181785, "learning_rate": 3.9911939269100944e-05, "loss": 0.3149, "loss_nan_ranks": 0, "loss_rank_avg": 0.150088369846344, "step": 620, "valid_targets_mean": 3230.4, "valid_targets_min": 1066 }, { "epoch": 0.8986340762041697, "grad_norm": 0.5925744591529776, "learning_rate": 3.990509421265357e-05, "loss": 0.3135, "loss_nan_ranks": 0, "loss_rank_avg": 0.1893511861562729, "step": 625, "valid_targets_mean": 4402.9, "valid_targets_min": 577 }, { "epoch": 0.905823148813803, "grad_norm": 0.5548472057370831, "learning_rate": 3.9897993614120006e-05, "loss": 0.2979, "loss_nan_ranks": 0, "loss_rank_avg": 0.14507707953453064, "step": 630, "valid_targets_mean": 3072.5, "valid_targets_min": 651 }, { "epoch": 0.9130122214234364, "grad_norm": 0.7175648198925466, "learning_rate": 3.9890637564657894e-05, "loss": 0.3123, "loss_nan_ranks": 0, "loss_rank_avg": 0.17302565276622772, "step": 635, "valid_targets_mean": 2339.6, "valid_targets_min": 586 }, { "epoch": 0.9202012940330697, "grad_norm": 0.584831764924473, "learning_rate": 3.98830261587044e-05, "loss": 0.3011, "loss_nan_ranks": 0, "loss_rank_avg": 0.14775174856185913, "step": 640, "valid_targets_mean": 2893.2, "valid_targets_min": 550 }, { "epoch": 0.9273903666427031, "grad_norm": 0.5577687168235862, "learning_rate": 3.987515949397492e-05, "loss": 0.3065, "loss_nan_ranks": 0, "loss_rank_avg": 0.15221062302589417, "step": 645, "valid_targets_mean": 3455.2, "valid_targets_min": 656 }, { "epoch": 0.9345794392523364, "grad_norm": 0.6171762638763584, "learning_rate": 3.98670376714619e-05, "loss": 0.302, "loss_nan_ranks": 0, "loss_rank_avg": 0.1562863290309906, "step": 650, "valid_targets_mean": 3444.6, "valid_targets_min": 382 }, { "epoch": 0.9417685118619699, "grad_norm": 0.5304534943571708, "learning_rate": 3.98586607954335e-05, "loss": 0.3042, "loss_nan_ranks": 0, "loss_rank_avg": 0.1725115031003952, "step": 655, "valid_targets_mean": 4867.2, "valid_targets_min": 3896 }, { "epoch": 0.9489575844716032, "grad_norm": 0.6458847453284171, "learning_rate": 3.9850028973432235e-05, "loss": 0.3123, "loss_nan_ranks": 0, "loss_rank_avg": 0.1688905954360962, "step": 660, "valid_targets_mean": 2693.9, "valid_targets_min": 607 }, { "epoch": 0.9561466570812365, "grad_norm": 0.6039242605720511, "learning_rate": 3.9841142316273675e-05, "loss": 0.3167, "loss_nan_ranks": 0, "loss_rank_avg": 0.14590154588222504, "step": 665, "valid_targets_mean": 2759.8, "valid_targets_min": 477 }, { "epoch": 0.9633357296908699, "grad_norm": 0.5542962369979113, "learning_rate": 3.983200093804493e-05, "loss": 0.3079, "loss_nan_ranks": 0, "loss_rank_avg": 0.1160636693239212, "step": 670, "valid_targets_mean": 3096.2, "valid_targets_min": 319 }, { "epoch": 0.9705248023005032, "grad_norm": 0.5550120004817779, "learning_rate": 3.982260495610324e-05, "loss": 0.2997, "loss_nan_ranks": 0, "loss_rank_avg": 0.12880077958106995, "step": 675, "valid_targets_mean": 3627.6, "valid_targets_min": 807 }, { "epoch": 0.9777138749101366, "grad_norm": 0.6372929298938798, "learning_rate": 3.981295449107444e-05, "loss": 0.3079, "loss_nan_ranks": 0, "loss_rank_avg": 0.17799600958824158, "step": 680, "valid_targets_mean": 3177.5, "valid_targets_min": 490 }, { "epoch": 0.9849029475197699, "grad_norm": 0.6615093926941519, "learning_rate": 3.980304966685145e-05, "loss": 0.311, "loss_nan_ranks": 0, "loss_rank_avg": 0.17152747511863708, "step": 685, "valid_targets_mean": 2525.2, "valid_targets_min": 552 }, { "epoch": 0.9920920201294033, "grad_norm": 0.5636978041977779, "learning_rate": 3.9792890610592634e-05, "loss": 0.3323, "loss_nan_ranks": 0, "loss_rank_avg": 0.13472625613212585, "step": 690, "valid_targets_mean": 3632.8, "valid_targets_min": 643 }, { "epoch": 0.9992810927390366, "grad_norm": 0.581225709789264, "learning_rate": 3.9782477452720216e-05, "loss": 0.3064, "loss_nan_ranks": 0, "loss_rank_avg": 0.12449763715267181, "step": 695, "valid_targets_mean": 2487.5, "valid_targets_min": 669 }, { "epoch": 1.0057512580877066, "grad_norm": 0.5553439973715237, "learning_rate": 3.9771810326918565e-05, "loss": 0.3132, "loss_nan_ranks": 0, "loss_rank_avg": 0.13287323713302612, "step": 700, "valid_targets_mean": 3585.4, "valid_targets_min": 614 }, { "epoch": 1.0129403306973401, "grad_norm": 0.5197160209197271, "learning_rate": 3.9760889370132504e-05, "loss": 0.298, "loss_nan_ranks": 0, "loss_rank_avg": 0.12326624989509583, "step": 705, "valid_targets_mean": 4040.6, "valid_targets_min": 761 }, { "epoch": 1.0201294033069734, "grad_norm": 0.5196009784810837, "learning_rate": 3.9749714722565537e-05, "loss": 0.3259, "loss_nan_ranks": 0, "loss_rank_avg": 0.1603870689868927, "step": 710, "valid_targets_mean": 4360.2, "valid_targets_min": 724 }, { "epoch": 1.0273184759166067, "grad_norm": 0.6261659804356468, "learning_rate": 3.9738286527678074e-05, "loss": 0.2851, "loss_nan_ranks": 0, "loss_rank_avg": 0.1782304346561432, "step": 715, "valid_targets_mean": 4026.9, "valid_targets_min": 854 }, { "epoch": 1.03450754852624, "grad_norm": 0.49968328840683635, "learning_rate": 3.972660493218555e-05, "loss": 0.2851, "loss_nan_ranks": 0, "loss_rank_avg": 0.1302112638950348, "step": 720, "valid_targets_mean": 4280.0, "valid_targets_min": 693 }, { "epoch": 1.0416966211358736, "grad_norm": 0.5850771062290935, "learning_rate": 3.9714670086056595e-05, "loss": 0.2933, "loss_nan_ranks": 0, "loss_rank_avg": 0.1399659812450409, "step": 725, "valid_targets_mean": 3400.4, "valid_targets_min": 853 }, { "epoch": 1.0488856937455069, "grad_norm": 0.5603228569463079, "learning_rate": 3.970248214251102e-05, "loss": 0.3001, "loss_nan_ranks": 0, "loss_rank_avg": 0.19615839421749115, "step": 730, "valid_targets_mean": 4814.4, "valid_targets_min": 542 }, { "epoch": 1.0560747663551402, "grad_norm": 0.5648677645837813, "learning_rate": 3.969004125801797e-05, "loss": 0.3068, "loss_nan_ranks": 0, "loss_rank_avg": 0.1610637754201889, "step": 735, "valid_targets_mean": 3886.6, "valid_targets_min": 446 }, { "epoch": 1.0632638389647735, "grad_norm": 0.5661342249379625, "learning_rate": 3.967734759229382e-05, "loss": 0.3061, "loss_nan_ranks": 0, "loss_rank_avg": 0.11380840837955475, "step": 740, "valid_targets_mean": 2696.4, "valid_targets_min": 563 }, { "epoch": 1.0704529115744068, "grad_norm": 0.5656284137955258, "learning_rate": 3.9664401308300154e-05, "loss": 0.2847, "loss_nan_ranks": 0, "loss_rank_avg": 0.1349925696849823, "step": 745, "valid_targets_mean": 3692.1, "valid_targets_min": 577 }, { "epoch": 1.0776419841840403, "grad_norm": 0.5463550825307542, "learning_rate": 3.9651202572241686e-05, "loss": 0.2936, "loss_nan_ranks": 0, "loss_rank_avg": 0.1740422248840332, "step": 750, "valid_targets_mean": 4041.4, "valid_targets_min": 1094 }, { "epoch": 1.0848310567936736, "grad_norm": 0.5384229571092451, "learning_rate": 3.96377515535641e-05, "loss": 0.3018, "loss_nan_ranks": 0, "loss_rank_avg": 0.1499461531639099, "step": 755, "valid_targets_mean": 4691.0, "valid_targets_min": 678 }, { "epoch": 1.092020129403307, "grad_norm": 0.633330557474276, "learning_rate": 3.962404842495193e-05, "loss": 0.2905, "loss_nan_ranks": 0, "loss_rank_avg": 0.1790314018726349, "step": 760, "valid_targets_mean": 4441.2, "valid_targets_min": 3412 }, { "epoch": 1.0992092020129403, "grad_norm": 0.5429522369804931, "learning_rate": 3.961009336232625e-05, "loss": 0.296, "loss_nan_ranks": 0, "loss_rank_avg": 0.13355664908885956, "step": 765, "valid_targets_mean": 3497.9, "valid_targets_min": 525 }, { "epoch": 1.1063982746225738, "grad_norm": 0.5462783839750516, "learning_rate": 3.9595886544842505e-05, "loss": 0.2948, "loss_nan_ranks": 0, "loss_rank_avg": 0.13674771785736084, "step": 770, "valid_targets_mean": 3951.1, "valid_targets_min": 824 }, { "epoch": 1.113587347232207, "grad_norm": 0.5817114409791175, "learning_rate": 3.958142815488817e-05, "loss": 0.2915, "loss_nan_ranks": 0, "loss_rank_avg": 0.17169195413589478, "step": 775, "valid_targets_mean": 4445.0, "valid_targets_min": 691 }, { "epoch": 1.1207764198418404, "grad_norm": 0.5648447798317549, "learning_rate": 3.9566718378080404e-05, "loss": 0.2822, "loss_nan_ranks": 0, "loss_rank_avg": 0.19211627542972565, "step": 780, "valid_targets_mean": 5507.4, "valid_targets_min": 4306 }, { "epoch": 1.1279654924514737, "grad_norm": 0.49341847979292497, "learning_rate": 3.955175740326368e-05, "loss": 0.2979, "loss_nan_ranks": 0, "loss_rank_avg": 0.11916790157556534, "step": 785, "valid_targets_mean": 3905.2, "valid_targets_min": 915 }, { "epoch": 1.1351545650611072, "grad_norm": 0.5330042034626139, "learning_rate": 3.953654542250735e-05, "loss": 0.2939, "loss_nan_ranks": 0, "loss_rank_avg": 0.1617271602153778, "step": 790, "valid_targets_mean": 4198.2, "valid_targets_min": 638 }, { "epoch": 1.1423436376707405, "grad_norm": 0.5544000058211358, "learning_rate": 3.952108263110322e-05, "loss": 0.2873, "loss_nan_ranks": 0, "loss_rank_avg": 0.18863481283187866, "step": 795, "valid_targets_mean": 4211.5, "valid_targets_min": 678 }, { "epoch": 1.1495327102803738, "grad_norm": 0.5235489672450487, "learning_rate": 3.950536922756297e-05, "loss": 0.305, "loss_nan_ranks": 0, "loss_rank_avg": 0.14819476008415222, "step": 800, "valid_targets_mean": 4272.1, "valid_targets_min": 919 }, { "epoch": 1.1567217828900072, "grad_norm": 0.5772533147962314, "learning_rate": 3.948940541361565e-05, "loss": 0.3059, "loss_nan_ranks": 0, "loss_rank_avg": 0.17812474071979523, "step": 805, "valid_targets_mean": 4165.8, "valid_targets_min": 498 }, { "epoch": 1.1639108554996405, "grad_norm": 0.5665999962700897, "learning_rate": 3.9473191394205104e-05, "loss": 0.2952, "loss_nan_ranks": 0, "loss_rank_avg": 0.22693896293640137, "step": 810, "valid_targets_mean": 4864.1, "valid_targets_min": 918 }, { "epoch": 1.171099928109274, "grad_norm": 0.5703615550122877, "learning_rate": 3.945672737748731e-05, "loss": 0.3011, "loss_nan_ranks": 0, "loss_rank_avg": 0.13685652613639832, "step": 815, "valid_targets_mean": 3327.9, "valid_targets_min": 632 }, { "epoch": 1.1782890007189073, "grad_norm": 0.5198138670541621, "learning_rate": 3.9440013574827706e-05, "loss": 0.2793, "loss_nan_ranks": 0, "loss_rank_avg": 0.14325293898582458, "step": 820, "valid_targets_mean": 4258.8, "valid_targets_min": 643 }, { "epoch": 1.1854780733285406, "grad_norm": 0.5606799589906808, "learning_rate": 3.942305020079852e-05, "loss": 0.2939, "loss_nan_ranks": 0, "loss_rank_avg": 0.12138460576534271, "step": 825, "valid_targets_mean": 3280.8, "valid_targets_min": 704 }, { "epoch": 1.192667145938174, "grad_norm": 0.530676980031532, "learning_rate": 3.9405837473175944e-05, "loss": 0.3156, "loss_nan_ranks": 0, "loss_rank_avg": 0.1585422158241272, "step": 830, "valid_targets_mean": 4695.2, "valid_targets_min": 649 }, { "epoch": 1.1998562185478074, "grad_norm": 0.6260228453322427, "learning_rate": 3.9388375612937403e-05, "loss": 0.2913, "loss_nan_ranks": 0, "loss_rank_avg": 0.139860600233078, "step": 835, "valid_targets_mean": 3119.8, "valid_targets_min": 620 }, { "epoch": 1.2070452911574407, "grad_norm": 0.5979955679371329, "learning_rate": 3.9370664844258684e-05, "loss": 0.3082, "loss_nan_ranks": 0, "loss_rank_avg": 0.2046428620815277, "step": 840, "valid_targets_mean": 4263.0, "valid_targets_min": 811 }, { "epoch": 1.214234363767074, "grad_norm": 0.5717668797739937, "learning_rate": 3.935270539451107e-05, "loss": 0.2894, "loss_nan_ranks": 0, "loss_rank_avg": 0.10338851064443588, "step": 845, "valid_targets_mean": 2618.5, "valid_targets_min": 640 }, { "epoch": 1.2214234363767074, "grad_norm": 0.6324183749578863, "learning_rate": 3.933449749425842e-05, "loss": 0.3097, "loss_nan_ranks": 0, "loss_rank_avg": 0.18412905931472778, "step": 850, "valid_targets_mean": 3746.4, "valid_targets_min": 704 }, { "epoch": 1.2286125089863407, "grad_norm": 0.5586992298582395, "learning_rate": 3.931604137725419e-05, "loss": 0.2943, "loss_nan_ranks": 0, "loss_rank_avg": 0.14152535796165466, "step": 855, "valid_targets_mean": 3474.4, "valid_targets_min": 631 }, { "epoch": 1.2358015815959742, "grad_norm": 0.5379461460790473, "learning_rate": 3.9297337280438475e-05, "loss": 0.2874, "loss_nan_ranks": 0, "loss_rank_avg": 0.19222573935985565, "step": 860, "valid_targets_mean": 4866.8, "valid_targets_min": 1089 }, { "epoch": 1.2429906542056075, "grad_norm": 0.5721426437343275, "learning_rate": 3.927838544393492e-05, "loss": 0.2842, "loss_nan_ranks": 0, "loss_rank_avg": 0.1283596009016037, "step": 865, "valid_targets_mean": 2917.4, "valid_targets_min": 567 }, { "epoch": 1.2501797268152408, "grad_norm": 0.5517369618312897, "learning_rate": 3.925918611104767e-05, "loss": 0.2864, "loss_nan_ranks": 0, "loss_rank_avg": 0.15437334775924683, "step": 870, "valid_targets_mean": 2915.2, "valid_targets_min": 598 }, { "epoch": 1.2573687994248741, "grad_norm": 0.48267731416875964, "learning_rate": 3.923973952825822e-05, "loss": 0.287, "loss_nan_ranks": 0, "loss_rank_avg": 0.15360784530639648, "step": 875, "valid_targets_mean": 4809.2, "valid_targets_min": 766 }, { "epoch": 1.2645578720345076, "grad_norm": 0.6005327005122898, "learning_rate": 3.922004594522229e-05, "loss": 0.2951, "loss_nan_ranks": 0, "loss_rank_avg": 0.168386310338974, "step": 880, "valid_targets_mean": 3697.8, "valid_targets_min": 759 }, { "epoch": 1.271746944644141, "grad_norm": 0.5900526270016355, "learning_rate": 3.920010561476657e-05, "loss": 0.3137, "loss_nan_ranks": 0, "loss_rank_avg": 0.1541575938463211, "step": 885, "valid_targets_mean": 3725.8, "valid_targets_min": 739 }, { "epoch": 1.2789360172537743, "grad_norm": 0.5424428958428384, "learning_rate": 3.9179918792885516e-05, "loss": 0.2974, "loss_nan_ranks": 0, "loss_rank_avg": 0.1631605625152588, "step": 890, "valid_targets_mean": 5033.8, "valid_targets_min": 3917 }, { "epoch": 1.2861250898634076, "grad_norm": 0.562110119178797, "learning_rate": 3.915948573873804e-05, "loss": 0.2972, "loss_nan_ranks": 0, "loss_rank_avg": 0.13708816468715668, "step": 895, "valid_targets_mean": 2972.0, "valid_targets_min": 533 }, { "epoch": 1.2933141624730409, "grad_norm": 0.5251225453501762, "learning_rate": 3.913880671464418e-05, "loss": 0.2803, "loss_nan_ranks": 0, "loss_rank_avg": 0.10703599452972412, "step": 900, "valid_targets_mean": 3083.0, "valid_targets_min": 531 }, { "epoch": 1.3005032350826744, "grad_norm": 0.527255808693065, "learning_rate": 3.911788198608177e-05, "loss": 0.2923, "loss_nan_ranks": 0, "loss_rank_avg": 0.12984885275363922, "step": 905, "valid_targets_mean": 3227.2, "valid_targets_min": 633 }, { "epoch": 1.3076923076923077, "grad_norm": 0.5523871978932965, "learning_rate": 3.909671182168297e-05, "loss": 0.2942, "loss_nan_ranks": 0, "loss_rank_avg": 0.1515636146068573, "step": 910, "valid_targets_mean": 3423.0, "valid_targets_min": 567 }, { "epoch": 1.314881380301941, "grad_norm": 0.5458514275613986, "learning_rate": 3.907529649323088e-05, "loss": 0.295, "loss_nan_ranks": 0, "loss_rank_avg": 0.18874332308769226, "step": 915, "valid_targets_mean": 4317.4, "valid_targets_min": 1326 }, { "epoch": 1.3220704529115745, "grad_norm": 0.5171016490633233, "learning_rate": 3.905363627565601e-05, "loss": 0.2932, "loss_nan_ranks": 0, "loss_rank_avg": 0.13986511528491974, "step": 920, "valid_targets_mean": 4300.5, "valid_targets_min": 655 }, { "epoch": 1.3292595255212079, "grad_norm": 0.5446205102221678, "learning_rate": 3.903173144703275e-05, "loss": 0.291, "loss_nan_ranks": 0, "loss_rank_avg": 0.12331528216600418, "step": 925, "valid_targets_mean": 3761.5, "valid_targets_min": 650 }, { "epoch": 1.3364485981308412, "grad_norm": 0.5666138697419204, "learning_rate": 3.900958228857585e-05, "loss": 0.3061, "loss_nan_ranks": 0, "loss_rank_avg": 0.16033025085926056, "step": 930, "valid_targets_mean": 4147.9, "valid_targets_min": 625 }, { "epoch": 1.3436376707404745, "grad_norm": 0.6532210361778743, "learning_rate": 3.898718908463672e-05, "loss": 0.2933, "loss_nan_ranks": 0, "loss_rank_avg": 0.1362089365720749, "step": 935, "valid_targets_mean": 2751.1, "valid_targets_min": 593 }, { "epoch": 1.3508267433501078, "grad_norm": 0.5051696538336935, "learning_rate": 3.896455212269988e-05, "loss": 0.2863, "loss_nan_ranks": 0, "loss_rank_avg": 0.12954682111740112, "step": 940, "valid_targets_mean": 3428.1, "valid_targets_min": 846 }, { "epoch": 1.358015815959741, "grad_norm": 0.5736534132040085, "learning_rate": 3.894167169337919e-05, "loss": 0.2836, "loss_nan_ranks": 0, "loss_rank_avg": 0.1548313945531845, "step": 945, "valid_targets_mean": 3938.4, "valid_targets_min": 675 }, { "epoch": 1.3652048885693746, "grad_norm": 0.4938670698885232, "learning_rate": 3.891854809041417e-05, "loss": 0.2917, "loss_nan_ranks": 0, "loss_rank_avg": 0.12290967255830765, "step": 950, "valid_targets_mean": 4109.2, "valid_targets_min": 800 }, { "epoch": 1.372393961179008, "grad_norm": 0.5938911117965663, "learning_rate": 3.8895181610666196e-05, "loss": 0.3, "loss_nan_ranks": 0, "loss_rank_avg": 0.14941787719726562, "step": 955, "valid_targets_mean": 3038.4, "valid_targets_min": 545 }, { "epoch": 1.3795830337886412, "grad_norm": 0.521484016781839, "learning_rate": 3.8871572554114696e-05, "loss": 0.2873, "loss_nan_ranks": 0, "loss_rank_avg": 0.1749972552061081, "step": 960, "valid_targets_mean": 4396.4, "valid_targets_min": 608 }, { "epoch": 1.3867721063982748, "grad_norm": 0.5176443132865125, "learning_rate": 3.8847721223853334e-05, "loss": 0.2911, "loss_nan_ranks": 0, "loss_rank_avg": 0.1388823539018631, "step": 965, "valid_targets_mean": 4115.0, "valid_targets_min": 753 }, { "epoch": 1.393961179007908, "grad_norm": 0.5872567204224207, "learning_rate": 3.882362792608606e-05, "loss": 0.3076, "loss_nan_ranks": 0, "loss_rank_avg": 0.21744276583194733, "step": 970, "valid_targets_mean": 4367.5, "valid_targets_min": 655 }, { "epoch": 1.4011502516175414, "grad_norm": 0.56539435990809, "learning_rate": 3.879929297012321e-05, "loss": 0.2952, "loss_nan_ranks": 0, "loss_rank_avg": 0.14727197587490082, "step": 975, "valid_targets_mean": 3567.1, "valid_targets_min": 516 }, { "epoch": 1.4083393242271747, "grad_norm": 0.5059918570200229, "learning_rate": 3.877471666837756e-05, "loss": 0.2853, "loss_nan_ranks": 0, "loss_rank_avg": 0.14970964193344116, "step": 980, "valid_targets_mean": 4185.9, "valid_targets_min": 3115 }, { "epoch": 1.415528396836808, "grad_norm": 0.5163164050679078, "learning_rate": 3.874989933636028e-05, "loss": 0.2818, "loss_nan_ranks": 0, "loss_rank_avg": 0.12308366596698761, "step": 985, "valid_targets_mean": 3170.4, "valid_targets_min": 566 }, { "epoch": 1.4227174694464413, "grad_norm": 0.5522952793806271, "learning_rate": 3.872484129267686e-05, "loss": 0.2779, "loss_nan_ranks": 0, "loss_rank_avg": 0.17238599061965942, "step": 990, "valid_targets_mean": 3889.1, "valid_targets_min": 588 }, { "epoch": 1.4299065420560748, "grad_norm": 0.5961879603097092, "learning_rate": 3.869954285902309e-05, "loss": 0.3008, "loss_nan_ranks": 0, "loss_rank_avg": 0.15300405025482178, "step": 995, "valid_targets_mean": 3697.9, "valid_targets_min": 592 }, { "epoch": 1.4370956146657081, "grad_norm": 0.47392520471736505, "learning_rate": 3.8674004360180886e-05, "loss": 0.2825, "loss_nan_ranks": 0, "loss_rank_avg": 0.14228011667728424, "step": 1000, "valid_targets_mean": 4135.2, "valid_targets_min": 516 }, { "epoch": 1.4442846872753414, "grad_norm": 0.59329784213223, "learning_rate": 3.864822612401411e-05, "loss": 0.2922, "loss_nan_ranks": 0, "loss_rank_avg": 0.12148600816726685, "step": 1005, "valid_targets_mean": 2810.2, "valid_targets_min": 415 }, { "epoch": 1.451473759884975, "grad_norm": 0.5156223018651376, "learning_rate": 3.86222084814644e-05, "loss": 0.2945, "loss_nan_ranks": 0, "loss_rank_avg": 0.2099960893392563, "step": 1010, "valid_targets_mean": 4676.2, "valid_targets_min": 954 }, { "epoch": 1.4586628324946083, "grad_norm": 0.5929213995699328, "learning_rate": 3.8595951766546874e-05, "loss": 0.2963, "loss_nan_ranks": 0, "loss_rank_avg": 0.18259933590888977, "step": 1015, "valid_targets_mean": 3383.6, "valid_targets_min": 589 }, { "epoch": 1.4658519051042416, "grad_norm": 0.44437186370848597, "learning_rate": 3.856945631634589e-05, "loss": 0.2859, "loss_nan_ranks": 0, "loss_rank_avg": 0.11551199853420258, "step": 1020, "valid_targets_mean": 3701.6, "valid_targets_min": 524 }, { "epoch": 1.4730409777138749, "grad_norm": 0.5072064763974775, "learning_rate": 3.854272247101068e-05, "loss": 0.2897, "loss_nan_ranks": 0, "loss_rank_avg": 0.14987875521183014, "step": 1025, "valid_targets_mean": 4569.1, "valid_targets_min": 612 }, { "epoch": 1.4802300503235082, "grad_norm": 0.4655200344372254, "learning_rate": 3.851575057375101e-05, "loss": 0.2812, "loss_nan_ranks": 0, "loss_rank_avg": 0.1204090267419815, "step": 1030, "valid_targets_mean": 3899.2, "valid_targets_min": 617 }, { "epoch": 1.4874191229331415, "grad_norm": 0.5728562126071537, "learning_rate": 3.8488540970832754e-05, "loss": 0.2824, "loss_nan_ranks": 0, "loss_rank_avg": 0.1308048665523529, "step": 1035, "valid_targets_mean": 2915.0, "valid_targets_min": 477 }, { "epoch": 1.494608195542775, "grad_norm": 0.5511649364727081, "learning_rate": 3.846109401157345e-05, "loss": 0.2851, "loss_nan_ranks": 0, "loss_rank_avg": 0.09357282519340515, "step": 1040, "valid_targets_mean": 1808.2, "valid_targets_min": 486 }, { "epoch": 1.5017972681524083, "grad_norm": 0.5296838223120048, "learning_rate": 3.843341004833784e-05, "loss": 0.293, "loss_nan_ranks": 0, "loss_rank_avg": 0.15539321303367615, "step": 1045, "valid_targets_mean": 4149.1, "valid_targets_min": 861 }, { "epoch": 1.5089863407620419, "grad_norm": 0.5461095453788049, "learning_rate": 3.840548943653333e-05, "loss": 0.2966, "loss_nan_ranks": 0, "loss_rank_avg": 0.12287761270999908, "step": 1050, "valid_targets_mean": 2310.9, "valid_targets_min": 730 }, { "epoch": 1.5161754133716752, "grad_norm": 0.5100354908552306, "learning_rate": 3.83773325346054e-05, "loss": 0.2996, "loss_nan_ranks": 0, "loss_rank_avg": 0.14473143219947815, "step": 1055, "valid_targets_mean": 4014.5, "valid_targets_min": 887 }, { "epoch": 1.5233644859813085, "grad_norm": 0.5226379950787434, "learning_rate": 3.834893970403306e-05, "loss": 0.2933, "loss_nan_ranks": 0, "loss_rank_avg": 0.13530033826828003, "step": 1060, "valid_targets_mean": 2959.1, "valid_targets_min": 653 }, { "epoch": 1.5305535585909418, "grad_norm": 0.5566617697030245, "learning_rate": 3.832031130932415e-05, "loss": 0.2894, "loss_nan_ranks": 0, "loss_rank_avg": 0.12731043994426727, "step": 1065, "valid_targets_mean": 3113.8, "valid_targets_min": 660 }, { "epoch": 1.537742631200575, "grad_norm": 0.4513676317081486, "learning_rate": 3.8291447718010706e-05, "loss": 0.2776, "loss_nan_ranks": 0, "loss_rank_avg": 0.11857186257839203, "step": 1070, "valid_targets_mean": 4130.1, "valid_targets_min": 581 }, { "epoch": 1.5449317038102084, "grad_norm": 0.5703581165114259, "learning_rate": 3.826234930064422e-05, "loss": 0.3016, "loss_nan_ranks": 0, "loss_rank_avg": 0.13232873380184174, "step": 1075, "valid_targets_mean": 3404.8, "valid_targets_min": 888 }, { "epoch": 1.5521207764198417, "grad_norm": 0.5209632185141453, "learning_rate": 3.82330164307909e-05, "loss": 0.2906, "loss_nan_ranks": 0, "loss_rank_avg": 0.12993882596492767, "step": 1080, "valid_targets_mean": 3908.0, "valid_targets_min": 535 }, { "epoch": 1.5593098490294752, "grad_norm": 0.5068701501791201, "learning_rate": 3.820344948502682e-05, "loss": 0.2868, "loss_nan_ranks": 0, "loss_rank_avg": 0.20242813229560852, "step": 1085, "valid_targets_mean": 4670.1, "valid_targets_min": 1088 }, { "epoch": 1.5664989216391085, "grad_norm": 0.5323592122608582, "learning_rate": 3.8173648842933173e-05, "loss": 0.2867, "loss_nan_ranks": 0, "loss_rank_avg": 0.1509951651096344, "step": 1090, "valid_targets_mean": 5006.2, "valid_targets_min": 3176 }, { "epoch": 1.573687994248742, "grad_norm": 0.6152354366056297, "learning_rate": 3.814361488709132e-05, "loss": 0.3059, "loss_nan_ranks": 0, "loss_rank_avg": 0.16126582026481628, "step": 1095, "valid_targets_mean": 3042.6, "valid_targets_min": 673 }, { "epoch": 1.5808770668583754, "grad_norm": 0.5961551035844662, "learning_rate": 3.8113348003077926e-05, "loss": 0.2991, "loss_nan_ranks": 0, "loss_rank_avg": 0.12394510954618454, "step": 1100, "valid_targets_mean": 3242.1, "valid_targets_min": 573 }, { "epoch": 1.5880661394680087, "grad_norm": 0.47980821001671486, "learning_rate": 3.808284857945999e-05, "loss": 0.2841, "loss_nan_ranks": 0, "loss_rank_avg": 0.1280575692653656, "step": 1105, "valid_targets_mean": 4582.2, "valid_targets_min": 607 }, { "epoch": 1.595255212077642, "grad_norm": 0.507500812907104, "learning_rate": 3.805211700778984e-05, "loss": 0.2955, "loss_nan_ranks": 0, "loss_rank_avg": 0.13678506016731262, "step": 1110, "valid_targets_mean": 3753.8, "valid_targets_min": 720 }, { "epoch": 1.6024442846872753, "grad_norm": 0.49705689698484373, "learning_rate": 3.802115368260016e-05, "loss": 0.2846, "loss_nan_ranks": 0, "loss_rank_avg": 0.15146461129188538, "step": 1115, "valid_targets_mean": 3863.8, "valid_targets_min": 770 }, { "epoch": 1.6096333572969086, "grad_norm": 0.43272714289145614, "learning_rate": 3.798995900139889e-05, "loss": 0.2855, "loss_nan_ranks": 0, "loss_rank_avg": 0.11581413447856903, "step": 1120, "valid_targets_mean": 4227.2, "valid_targets_min": 905 }, { "epoch": 1.616822429906542, "grad_norm": 0.6434087265414399, "learning_rate": 3.795853336466408e-05, "loss": 0.3003, "loss_nan_ranks": 0, "loss_rank_avg": 0.1903274953365326, "step": 1125, "valid_targets_mean": 3343.6, "valid_targets_min": 708 }, { "epoch": 1.6240115025161754, "grad_norm": 0.5786733657323256, "learning_rate": 3.7926877175838844e-05, "loss": 0.2922, "loss_nan_ranks": 0, "loss_rank_avg": 0.2227598875761032, "step": 1130, "valid_targets_mean": 3601.8, "valid_targets_min": 706 }, { "epoch": 1.6312005751258087, "grad_norm": 0.5216255139577858, "learning_rate": 3.7894990841326095e-05, "loss": 0.292, "loss_nan_ranks": 0, "loss_rank_avg": 0.19719943404197693, "step": 1135, "valid_targets_mean": 4424.4, "valid_targets_min": 1563 }, { "epoch": 1.6383896477354423, "grad_norm": 0.47385348746292455, "learning_rate": 3.786287477048338e-05, "loss": 0.2873, "loss_nan_ranks": 0, "loss_rank_avg": 0.14471015334129333, "step": 1140, "valid_targets_mean": 4585.0, "valid_targets_min": 758 }, { "epoch": 1.6455787203450756, "grad_norm": 0.496509144966886, "learning_rate": 3.783052937561762e-05, "loss": 0.271, "loss_nan_ranks": 0, "loss_rank_avg": 0.12411241978406906, "step": 1145, "valid_targets_mean": 3547.8, "valid_targets_min": 727 }, { "epoch": 1.6527677929547089, "grad_norm": 0.5337477757052604, "learning_rate": 3.779795507197975e-05, "loss": 0.2936, "loss_nan_ranks": 0, "loss_rank_avg": 0.12069012969732285, "step": 1150, "valid_targets_mean": 2619.9, "valid_targets_min": 630 }, { "epoch": 1.6599568655643422, "grad_norm": 0.555030233675228, "learning_rate": 3.77651522777595e-05, "loss": 0.2846, "loss_nan_ranks": 0, "loss_rank_avg": 0.1416761577129364, "step": 1155, "valid_targets_mean": 2981.6, "valid_targets_min": 543 }, { "epoch": 1.6671459381739755, "grad_norm": 0.5314725659453191, "learning_rate": 3.773212141407994e-05, "loss": 0.2819, "loss_nan_ranks": 0, "loss_rank_avg": 0.1304677575826645, "step": 1160, "valid_targets_mean": 3663.9, "valid_targets_min": 661 }, { "epoch": 1.6743350107836088, "grad_norm": 0.557105621995766, "learning_rate": 3.769886290499211e-05, "loss": 0.3171, "loss_nan_ranks": 0, "loss_rank_avg": 0.14408347010612488, "step": 1165, "valid_targets_mean": 3259.2, "valid_targets_min": 670 }, { "epoch": 1.681524083393242, "grad_norm": 0.5236188088487769, "learning_rate": 3.766537717746955e-05, "loss": 0.3001, "loss_nan_ranks": 0, "loss_rank_avg": 0.13859708607196808, "step": 1170, "valid_targets_mean": 3392.2, "valid_targets_min": 491 }, { "epoch": 1.6887131560028756, "grad_norm": 0.47979346096235626, "learning_rate": 3.7631664661402854e-05, "loss": 0.3015, "loss_nan_ranks": 0, "loss_rank_avg": 0.1257590651512146, "step": 1175, "valid_targets_mean": 4215.4, "valid_targets_min": 964 }, { "epoch": 1.695902228612509, "grad_norm": 0.5549812009815447, "learning_rate": 3.759772578959413e-05, "loss": 0.2801, "loss_nan_ranks": 0, "loss_rank_avg": 0.14304929971694946, "step": 1180, "valid_targets_mean": 2919.5, "valid_targets_min": 635 }, { "epoch": 1.7030913012221425, "grad_norm": 0.5100981619143163, "learning_rate": 3.7563560997751453e-05, "loss": 0.2847, "loss_nan_ranks": 0, "loss_rank_avg": 0.12205301225185394, "step": 1185, "valid_targets_mean": 3287.5, "valid_targets_min": 297 }, { "epoch": 1.7102803738317758, "grad_norm": 0.5542814369344694, "learning_rate": 3.752917072448324e-05, "loss": 0.2715, "loss_nan_ranks": 0, "loss_rank_avg": 0.1393413543701172, "step": 1190, "valid_targets_mean": 3343.5, "valid_targets_min": 532 }, { "epoch": 1.717469446441409, "grad_norm": 0.5004127002541743, "learning_rate": 3.7494555411292665e-05, "loss": 0.2913, "loss_nan_ranks": 0, "loss_rank_avg": 0.14154654741287231, "step": 1195, "valid_targets_mean": 3552.9, "valid_targets_min": 882 }, { "epoch": 1.7246585190510424, "grad_norm": 0.5369377603113736, "learning_rate": 3.7459715502571974e-05, "loss": 0.2824, "loss_nan_ranks": 0, "loss_rank_avg": 0.14404495060443878, "step": 1200, "valid_targets_mean": 3497.0, "valid_targets_min": 732 }, { "epoch": 1.7318475916606757, "grad_norm": 0.5692617287750511, "learning_rate": 3.742465144559675e-05, "loss": 0.292, "loss_nan_ranks": 0, "loss_rank_avg": 0.14669956266880035, "step": 1205, "valid_targets_mean": 2881.1, "valid_targets_min": 617 }, { "epoch": 1.739036664270309, "grad_norm": 0.5065041606981532, "learning_rate": 3.7389363690520236e-05, "loss": 0.2944, "loss_nan_ranks": 0, "loss_rank_avg": 0.10892973095178604, "step": 1210, "valid_targets_mean": 3190.4, "valid_targets_min": 861 }, { "epoch": 1.7462257368799425, "grad_norm": 0.5083030454665067, "learning_rate": 3.735385269036747e-05, "loss": 0.2842, "loss_nan_ranks": 0, "loss_rank_avg": 0.15521150827407837, "step": 1215, "valid_targets_mean": 3963.9, "valid_targets_min": 663 }, { "epoch": 1.7534148094895758, "grad_norm": 0.44482574218300447, "learning_rate": 3.731811890102956e-05, "loss": 0.2768, "loss_nan_ranks": 0, "loss_rank_avg": 0.1155744269490242, "step": 1220, "valid_targets_mean": 3604.9, "valid_targets_min": 770 }, { "epoch": 1.7606038820992091, "grad_norm": 0.539860187359408, "learning_rate": 3.728216278125776e-05, "loss": 0.3029, "loss_nan_ranks": 0, "loss_rank_avg": 0.15875539183616638, "step": 1225, "valid_targets_mean": 3555.1, "valid_targets_min": 745 }, { "epoch": 1.7677929547088427, "grad_norm": 0.4410205993807063, "learning_rate": 3.724598479265761e-05, "loss": 0.2843, "loss_nan_ranks": 0, "loss_rank_avg": 0.12200931459665298, "step": 1230, "valid_targets_mean": 4136.0, "valid_targets_min": 583 }, { "epoch": 1.774982027318476, "grad_norm": 0.49605181628499445, "learning_rate": 3.720958539968302e-05, "loss": 0.2878, "loss_nan_ranks": 0, "loss_rank_avg": 0.15854984521865845, "step": 1235, "valid_targets_mean": 3980.0, "valid_targets_min": 412 }, { "epoch": 1.7821710999281093, "grad_norm": 0.5097674785148915, "learning_rate": 3.7172965069630285e-05, "loss": 0.2894, "loss_nan_ranks": 0, "loss_rank_avg": 0.12535299360752106, "step": 1240, "valid_targets_mean": 3590.9, "valid_targets_min": 555 }, { "epoch": 1.7893601725377426, "grad_norm": 0.530740961884203, "learning_rate": 3.713612427263209e-05, "loss": 0.2814, "loss_nan_ranks": 0, "loss_rank_avg": 0.17841705679893494, "step": 1245, "valid_targets_mean": 4256.5, "valid_targets_min": 785 }, { "epoch": 1.796549245147376, "grad_norm": 0.525125717742193, "learning_rate": 3.70990634816515e-05, "loss": 0.2918, "loss_nan_ranks": 0, "loss_rank_avg": 0.14326494932174683, "step": 1250, "valid_targets_mean": 2654.0, "valid_targets_min": 567 }, { "epoch": 1.8037383177570092, "grad_norm": 0.47882978123124514, "learning_rate": 3.706178317247585e-05, "loss": 0.2751, "loss_nan_ranks": 0, "loss_rank_avg": 0.1471397876739502, "step": 1255, "valid_targets_mean": 4397.4, "valid_targets_min": 593 }, { "epoch": 1.8109273903666427, "grad_norm": 0.5886031941773199, "learning_rate": 3.702428382371066e-05, "loss": 0.2959, "loss_nan_ranks": 0, "loss_rank_avg": 0.15693509578704834, "step": 1260, "valid_targets_mean": 2723.0, "valid_targets_min": 448 }, { "epoch": 1.818116462976276, "grad_norm": 0.5664729440418096, "learning_rate": 3.698656591677348e-05, "loss": 0.2936, "loss_nan_ranks": 0, "loss_rank_avg": 0.09844028949737549, "step": 1265, "valid_targets_mean": 2811.0, "valid_targets_min": 275 }, { "epoch": 1.8253055355859096, "grad_norm": 0.498049887694824, "learning_rate": 3.694862993588774e-05, "loss": 0.2793, "loss_nan_ranks": 0, "loss_rank_avg": 0.1390022337436676, "step": 1270, "valid_targets_mean": 4099.2, "valid_targets_min": 3258 }, { "epoch": 1.8324946081955429, "grad_norm": 0.6036330907468369, "learning_rate": 3.6910476368076466e-05, "loss": 0.2896, "loss_nan_ranks": 0, "loss_rank_avg": 0.16148319840431213, "step": 1275, "valid_targets_mean": 3122.1, "valid_targets_min": 648 }, { "epoch": 1.8396836808051762, "grad_norm": 0.5012127171683514, "learning_rate": 3.6872105703156116e-05, "loss": 0.2771, "loss_nan_ranks": 0, "loss_rank_avg": 0.11360730975866318, "step": 1280, "valid_targets_mean": 3105.0, "valid_targets_min": 422 }, { "epoch": 1.8468727534148095, "grad_norm": 0.5151919144409882, "learning_rate": 3.683351843373021e-05, "loss": 0.281, "loss_nan_ranks": 0, "loss_rank_avg": 0.16393089294433594, "step": 1285, "valid_targets_mean": 4949.4, "valid_targets_min": 4000 }, { "epoch": 1.8540618260244428, "grad_norm": 0.5266250897243666, "learning_rate": 3.679471505518306e-05, "loss": 0.2711, "loss_nan_ranks": 0, "loss_rank_avg": 0.13978716731071472, "step": 1290, "valid_targets_mean": 3342.1, "valid_targets_min": 767 }, { "epoch": 1.8612508986340761, "grad_norm": 0.49171130776521615, "learning_rate": 3.67556960656734e-05, "loss": 0.2796, "loss_nan_ranks": 0, "loss_rank_avg": 0.14079241454601288, "step": 1295, "valid_targets_mean": 3342.5, "valid_targets_min": 726 }, { "epoch": 1.8684399712437094, "grad_norm": 0.49843468685276926, "learning_rate": 3.6716461966127955e-05, "loss": 0.2916, "loss_nan_ranks": 0, "loss_rank_avg": 0.14257866144180298, "step": 1300, "valid_targets_mean": 3800.0, "valid_targets_min": 640 }, { "epoch": 1.875629043853343, "grad_norm": 0.5496180609804349, "learning_rate": 3.6677013260235054e-05, "loss": 0.3048, "loss_nan_ranks": 0, "loss_rank_avg": 0.16164788603782654, "step": 1305, "valid_targets_mean": 3051.6, "valid_targets_min": 671 }, { "epoch": 1.8828181164629763, "grad_norm": 0.5170287488041243, "learning_rate": 3.663735045443816e-05, "loss": 0.2995, "loss_nan_ranks": 0, "loss_rank_avg": 0.16715139150619507, "step": 1310, "valid_targets_mean": 3631.0, "valid_targets_min": 665 }, { "epoch": 1.8900071890726098, "grad_norm": 0.5086856038225003, "learning_rate": 3.659747405792935e-05, "loss": 0.2745, "loss_nan_ranks": 0, "loss_rank_avg": 0.1597132831811905, "step": 1315, "valid_targets_mean": 3384.6, "valid_targets_min": 720 }, { "epoch": 1.897196261682243, "grad_norm": 0.5276886812025636, "learning_rate": 3.655738458264275e-05, "loss": 0.293, "loss_nan_ranks": 0, "loss_rank_avg": 0.12705910205841064, "step": 1320, "valid_targets_mean": 3736.5, "valid_targets_min": 593 }, { "epoch": 1.9043853342918764, "grad_norm": 0.47184848582856675, "learning_rate": 3.651708254324805e-05, "loss": 0.2802, "loss_nan_ranks": 0, "loss_rank_avg": 0.14923986792564392, "step": 1325, "valid_targets_mean": 4219.8, "valid_targets_min": 505 }, { "epoch": 1.9115744069015097, "grad_norm": 0.5095295218556172, "learning_rate": 3.64765684571438e-05, "loss": 0.2935, "loss_nan_ranks": 0, "loss_rank_avg": 0.1307600885629654, "step": 1330, "valid_targets_mean": 3621.0, "valid_targets_min": 977 }, { "epoch": 1.918763479511143, "grad_norm": 0.4994876634935122, "learning_rate": 3.6435842844450834e-05, "loss": 0.2895, "loss_nan_ranks": 0, "loss_rank_avg": 0.14474749565124512, "step": 1335, "valid_targets_mean": 3611.5, "valid_targets_min": 678 }, { "epoch": 1.9259525521207763, "grad_norm": 0.8084296900592843, "learning_rate": 3.639490622800557e-05, "loss": 0.2815, "loss_nan_ranks": 0, "loss_rank_avg": 0.15133309364318848, "step": 1340, "valid_targets_mean": 3889.6, "valid_targets_min": 903 }, { "epoch": 1.9331416247304096, "grad_norm": 0.47612540531078573, "learning_rate": 3.635375913335328e-05, "loss": 0.2971, "loss_nan_ranks": 0, "loss_rank_avg": 0.11670131981372833, "step": 1345, "valid_targets_mean": 3428.1, "valid_targets_min": 620 }, { "epoch": 1.9403306973400432, "grad_norm": 0.5201381114302891, "learning_rate": 3.631240208874138e-05, "loss": 0.2955, "loss_nan_ranks": 0, "loss_rank_avg": 0.17568343877792358, "step": 1350, "valid_targets_mean": 4018.5, "valid_targets_min": 771 }, { "epoch": 1.9475197699496765, "grad_norm": 0.5684687696419027, "learning_rate": 3.627083562511262e-05, "loss": 0.2797, "loss_nan_ranks": 0, "loss_rank_avg": 0.15264779329299927, "step": 1355, "valid_targets_mean": 4340.8, "valid_targets_min": 502 }, { "epoch": 1.95470884255931, "grad_norm": 0.505802871570166, "learning_rate": 3.622906027609826e-05, "loss": 0.2779, "loss_nan_ranks": 0, "loss_rank_avg": 0.14337629079818726, "step": 1360, "valid_targets_mean": 3748.8, "valid_targets_min": 482 }, { "epoch": 1.9618979151689433, "grad_norm": 0.5332734023712747, "learning_rate": 3.618707657801127e-05, "loss": 0.2882, "loss_nan_ranks": 0, "loss_rank_avg": 0.12836483120918274, "step": 1365, "valid_targets_mean": 3103.9, "valid_targets_min": 596 }, { "epoch": 1.9690869877785766, "grad_norm": 0.5021612024263556, "learning_rate": 3.614488506983939e-05, "loss": 0.2717, "loss_nan_ranks": 0, "loss_rank_avg": 0.14348819851875305, "step": 1370, "valid_targets_mean": 4130.9, "valid_targets_min": 851 }, { "epoch": 1.97627606038821, "grad_norm": 0.610411285067793, "learning_rate": 3.6102486293238236e-05, "loss": 0.2889, "loss_nan_ranks": 0, "loss_rank_avg": 0.15583057701587677, "step": 1375, "valid_targets_mean": 3433.0, "valid_targets_min": 538 }, { "epoch": 1.9834651329978432, "grad_norm": 0.49020599604774884, "learning_rate": 3.6059880792524326e-05, "loss": 0.2852, "loss_nan_ranks": 0, "loss_rank_avg": 0.10183790326118469, "step": 1380, "valid_targets_mean": 2611.9, "valid_targets_min": 712 }, { "epoch": 1.9906542056074765, "grad_norm": 0.4649398951912101, "learning_rate": 3.601706911466813e-05, "loss": 0.2743, "loss_nan_ranks": 0, "loss_rank_avg": 0.11849203705787659, "step": 1385, "valid_targets_mean": 4027.6, "valid_targets_min": 918 }, { "epoch": 1.9978432782171098, "grad_norm": 0.5652715236268022, "learning_rate": 3.597405180928701e-05, "loss": 0.2804, "loss_nan_ranks": 0, "loss_rank_avg": 0.16841626167297363, "step": 1390, "valid_targets_mean": 4007.5, "valid_targets_min": 821 }, { "epoch": 2.00431344356578, "grad_norm": 0.44042475910319384, "learning_rate": 3.5930829428638195e-05, "loss": 0.2818, "loss_nan_ranks": 0, "loss_rank_avg": 0.12045784294605255, "step": 1395, "valid_targets_mean": 3999.5, "valid_targets_min": 286 }, { "epoch": 2.011502516175413, "grad_norm": 0.46014945634483034, "learning_rate": 3.588740252761165e-05, "loss": 0.2818, "loss_nan_ranks": 0, "loss_rank_avg": 0.15798038244247437, "step": 1400, "valid_targets_mean": 5402.1, "valid_targets_min": 3999 }, { "epoch": 2.0186915887850465, "grad_norm": 0.5864474166210711, "learning_rate": 3.5843771663722994e-05, "loss": 0.2798, "loss_nan_ranks": 0, "loss_rank_avg": 0.14607274532318115, "step": 1405, "valid_targets_mean": 2451.4, "valid_targets_min": 606 }, { "epoch": 2.0258806613946803, "grad_norm": 0.5922859588085109, "learning_rate": 3.5799937397106336e-05, "loss": 0.2645, "loss_nan_ranks": 0, "loss_rank_avg": 0.149421826004982, "step": 1410, "valid_targets_mean": 3078.4, "valid_targets_min": 615 }, { "epoch": 2.0330697340043136, "grad_norm": 0.576123978661105, "learning_rate": 3.575590029050705e-05, "loss": 0.2646, "loss_nan_ranks": 0, "loss_rank_avg": 0.1341801881790161, "step": 1415, "valid_targets_mean": 2612.0, "valid_targets_min": 694 }, { "epoch": 2.040258806613947, "grad_norm": 0.5001343696732509, "learning_rate": 3.57116609092746e-05, "loss": 0.2639, "loss_nan_ranks": 0, "loss_rank_avg": 0.16290068626403809, "step": 1420, "valid_targets_mean": 4209.9, "valid_targets_min": 783 }, { "epoch": 2.04744787922358, "grad_norm": 0.47175040208647506, "learning_rate": 3.5667219821355226e-05, "loss": 0.2738, "loss_nan_ranks": 0, "loss_rank_avg": 0.12168647348880768, "step": 1425, "valid_targets_mean": 4308.9, "valid_targets_min": 721 }, { "epoch": 2.0546369518332135, "grad_norm": 0.5196704922805649, "learning_rate": 3.5622577597284724e-05, "loss": 0.2657, "loss_nan_ranks": 0, "loss_rank_avg": 0.13878659904003143, "step": 1430, "valid_targets_mean": 4093.0, "valid_targets_min": 882 }, { "epoch": 2.061826024442847, "grad_norm": 0.5477085097658387, "learning_rate": 3.557773481018104e-05, "loss": 0.2634, "loss_nan_ranks": 0, "loss_rank_avg": 0.11407799273729324, "step": 1435, "valid_targets_mean": 2638.8, "valid_targets_min": 551 }, { "epoch": 2.06901509705248, "grad_norm": 0.47586536612060937, "learning_rate": 3.5532692035736975e-05, "loss": 0.2714, "loss_nan_ranks": 0, "loss_rank_avg": 0.11465832591056824, "step": 1440, "valid_targets_mean": 3847.8, "valid_targets_min": 671 }, { "epoch": 2.0762041696621134, "grad_norm": 0.6396794264804806, "learning_rate": 3.548744985221277e-05, "loss": 0.2675, "loss_nan_ranks": 0, "loss_rank_avg": 0.09672622382640839, "step": 1445, "valid_targets_mean": 2118.6, "valid_targets_min": 706 }, { "epoch": 2.083393242271747, "grad_norm": 0.5908485673059465, "learning_rate": 3.544200884042869e-05, "loss": 0.2738, "loss_nan_ranks": 0, "loss_rank_avg": 0.11773449927568436, "step": 1450, "valid_targets_mean": 2278.6, "valid_targets_min": 606 }, { "epoch": 2.0905823148813805, "grad_norm": 0.9011502937614828, "learning_rate": 3.539636958375755e-05, "loss": 0.2972, "loss_nan_ranks": 0, "loss_rank_avg": 0.1216643825173378, "step": 1455, "valid_targets_mean": 2758.0, "valid_targets_min": 652 }, { "epoch": 2.0977713874910138, "grad_norm": 0.5586718911086384, "learning_rate": 3.535053266811725e-05, "loss": 0.269, "loss_nan_ranks": 0, "loss_rank_avg": 0.1211056336760521, "step": 1460, "valid_targets_mean": 2683.1, "valid_targets_min": 586 }, { "epoch": 2.104960460100647, "grad_norm": 0.49054572735296403, "learning_rate": 3.5304498681963216e-05, "loss": 0.2608, "loss_nan_ranks": 0, "loss_rank_avg": 0.12743888795375824, "step": 1465, "valid_targets_mean": 3772.6, "valid_targets_min": 916 }, { "epoch": 2.1121495327102804, "grad_norm": 0.5650208920966238, "learning_rate": 3.52582682162809e-05, "loss": 0.2836, "loss_nan_ranks": 0, "loss_rank_avg": 0.14947383105754852, "step": 1470, "valid_targets_mean": 2826.8, "valid_targets_min": 499 }, { "epoch": 2.1193386053199137, "grad_norm": 0.45465073195112815, "learning_rate": 3.521184186457815e-05, "loss": 0.2667, "loss_nan_ranks": 0, "loss_rank_avg": 0.13897745311260223, "step": 1475, "valid_targets_mean": 4228.9, "valid_targets_min": 575 }, { "epoch": 2.126527677929547, "grad_norm": 0.5735246322929461, "learning_rate": 3.51652202228776e-05, "loss": 0.2617, "loss_nan_ranks": 0, "loss_rank_avg": 0.17849652469158173, "step": 1480, "valid_targets_mean": 4539.4, "valid_targets_min": 734 }, { "epoch": 2.1337167505391803, "grad_norm": 0.6091822343999242, "learning_rate": 3.511840388970903e-05, "loss": 0.2754, "loss_nan_ranks": 0, "loss_rank_avg": 0.145311176776886, "step": 1485, "valid_targets_mean": 2660.6, "valid_targets_min": 206 }, { "epoch": 2.1409058231488136, "grad_norm": 0.5177727754454414, "learning_rate": 3.507139346610167e-05, "loss": 0.2776, "loss_nan_ranks": 0, "loss_rank_avg": 0.13099326193332672, "step": 1490, "valid_targets_mean": 3336.1, "valid_targets_min": 500 }, { "epoch": 2.1480948957584474, "grad_norm": 0.47860594671573575, "learning_rate": 3.502418955557649e-05, "loss": 0.2554, "loss_nan_ranks": 0, "loss_rank_avg": 0.10694457590579987, "step": 1495, "valid_targets_mean": 3990.4, "valid_targets_min": 616 }, { "epoch": 2.1552839683680807, "grad_norm": 0.5251786287771435, "learning_rate": 3.4976792764138446e-05, "loss": 0.279, "loss_nan_ranks": 0, "loss_rank_avg": 0.09503109753131866, "step": 1500, "valid_targets_mean": 2990.2, "valid_targets_min": 670 }, { "epoch": 2.162473040977714, "grad_norm": 0.4993754918391816, "learning_rate": 3.4929203700268706e-05, "loss": 0.272, "loss_nan_ranks": 0, "loss_rank_avg": 0.11814264208078384, "step": 1505, "valid_targets_mean": 3831.6, "valid_targets_min": 802 }, { "epoch": 2.1696621135873473, "grad_norm": 0.5661575463954994, "learning_rate": 3.488142297491683e-05, "loss": 0.2669, "loss_nan_ranks": 0, "loss_rank_avg": 0.11874938011169434, "step": 1510, "valid_targets_mean": 3086.4, "valid_targets_min": 599 }, { "epoch": 2.1768511861969806, "grad_norm": 0.5826772519983847, "learning_rate": 3.483345120149294e-05, "loss": 0.2607, "loss_nan_ranks": 0, "loss_rank_avg": 0.15646061301231384, "step": 1515, "valid_targets_mean": 3559.1, "valid_targets_min": 242 }, { "epoch": 2.184040258806614, "grad_norm": 0.5139252289446473, "learning_rate": 3.4785288995859835e-05, "loss": 0.2628, "loss_nan_ranks": 0, "loss_rank_avg": 0.13239224255084991, "step": 1520, "valid_targets_mean": 3718.9, "valid_targets_min": 503 }, { "epoch": 2.191229331416247, "grad_norm": 0.4982519981602888, "learning_rate": 3.4736936976325094e-05, "loss": 0.2843, "loss_nan_ranks": 0, "loss_rank_avg": 0.15333423018455505, "step": 1525, "valid_targets_mean": 4679.8, "valid_targets_min": 693 }, { "epoch": 2.1984184040258805, "grad_norm": 0.48520099933200456, "learning_rate": 3.468839576363313e-05, "loss": 0.2674, "loss_nan_ranks": 0, "loss_rank_avg": 0.15786109864711761, "step": 1530, "valid_targets_mean": 4654.2, "valid_targets_min": 3386 }, { "epoch": 2.205607476635514, "grad_norm": 0.5104245415475017, "learning_rate": 3.463966598095721e-05, "loss": 0.276, "loss_nan_ranks": 0, "loss_rank_avg": 0.12429475039243698, "step": 1535, "valid_targets_mean": 3454.0, "valid_targets_min": 694 }, { "epoch": 2.2127965492451476, "grad_norm": 0.5657497859202579, "learning_rate": 3.459074825389147e-05, "loss": 0.2677, "loss_nan_ranks": 0, "loss_rank_avg": 0.141516774892807, "step": 1540, "valid_targets_mean": 3773.1, "valid_targets_min": 647 }, { "epoch": 2.219985621854781, "grad_norm": 0.5163287527650611, "learning_rate": 3.4541643210442895e-05, "loss": 0.2726, "loss_nan_ranks": 0, "loss_rank_avg": 0.17117419838905334, "step": 1545, "valid_targets_mean": 5093.4, "valid_targets_min": 745 }, { "epoch": 2.227174694464414, "grad_norm": 0.5564079368258821, "learning_rate": 3.4492351481023236e-05, "loss": 0.2669, "loss_nan_ranks": 0, "loss_rank_avg": 0.19022008776664734, "step": 1550, "valid_targets_mean": 4066.0, "valid_targets_min": 635 }, { "epoch": 2.2343637670740475, "grad_norm": 0.5397979967201494, "learning_rate": 3.444287369844092e-05, "loss": 0.2751, "loss_nan_ranks": 0, "loss_rank_avg": 0.09026080369949341, "step": 1555, "valid_targets_mean": 1724.5, "valid_targets_min": 221 }, { "epoch": 2.241552839683681, "grad_norm": 0.4815453466365358, "learning_rate": 3.439321049789292e-05, "loss": 0.2684, "loss_nan_ranks": 0, "loss_rank_avg": 0.11930803209543228, "step": 1560, "valid_targets_mean": 3645.6, "valid_targets_min": 619 }, { "epoch": 2.248741912293314, "grad_norm": 0.5625767162580588, "learning_rate": 3.434336251695663e-05, "loss": 0.2525, "loss_nan_ranks": 0, "loss_rank_avg": 0.10417810082435608, "step": 1565, "valid_targets_mean": 2749.9, "valid_targets_min": 578 }, { "epoch": 2.2559309849029474, "grad_norm": 0.5803374667156413, "learning_rate": 3.429333039558164e-05, "loss": 0.2701, "loss_nan_ranks": 0, "loss_rank_avg": 0.1408432126045227, "step": 1570, "valid_targets_mean": 3556.9, "valid_targets_min": 769 }, { "epoch": 2.2631200575125807, "grad_norm": 0.5223520497569117, "learning_rate": 3.424311477608155e-05, "loss": 0.2623, "loss_nan_ranks": 0, "loss_rank_avg": 0.14780449867248535, "step": 1575, "valid_targets_mean": 4020.1, "valid_targets_min": 629 }, { "epoch": 2.2703091301222145, "grad_norm": 0.5120310717401553, "learning_rate": 3.419271630312571e-05, "loss": 0.2713, "loss_nan_ranks": 0, "loss_rank_avg": 0.09790432453155518, "step": 1580, "valid_targets_mean": 3122.2, "valid_targets_min": 474 }, { "epoch": 2.2774982027318478, "grad_norm": 0.5335207312364842, "learning_rate": 3.4142135623730954e-05, "loss": 0.2803, "loss_nan_ranks": 0, "loss_rank_avg": 0.15345562994480133, "step": 1585, "valid_targets_mean": 3602.5, "valid_targets_min": 925 }, { "epoch": 2.284687275341481, "grad_norm": 0.5126000830068731, "learning_rate": 3.4091373387253275e-05, "loss": 0.2713, "loss_nan_ranks": 0, "loss_rank_avg": 0.1684829741716385, "step": 1590, "valid_targets_mean": 4178.2, "valid_targets_min": 516 }, { "epoch": 2.2918763479511144, "grad_norm": 0.48256289234266836, "learning_rate": 3.4040430245379504e-05, "loss": 0.2691, "loss_nan_ranks": 0, "loss_rank_avg": 0.11229759454727173, "step": 1595, "valid_targets_mean": 3424.4, "valid_targets_min": 605 }, { "epoch": 2.2990654205607477, "grad_norm": 0.55020456280713, "learning_rate": 3.398930685211895e-05, "loss": 0.2696, "loss_nan_ranks": 0, "loss_rank_avg": 0.11756587028503418, "step": 1600, "valid_targets_mean": 3094.5, "valid_targets_min": 497 }, { "epoch": 2.306254493170381, "grad_norm": 0.441903715964592, "learning_rate": 3.3938003863794985e-05, "loss": 0.2574, "loss_nan_ranks": 0, "loss_rank_avg": 0.11097332835197449, "step": 1605, "valid_targets_mean": 3508.8, "valid_targets_min": 613 }, { "epoch": 2.3134435657800143, "grad_norm": 0.5014046749229496, "learning_rate": 3.3886521939036615e-05, "loss": 0.2728, "loss_nan_ranks": 0, "loss_rank_avg": 0.1317036747932434, "step": 1610, "valid_targets_mean": 3808.2, "valid_targets_min": 755 }, { "epoch": 2.3206326383896476, "grad_norm": 0.5329301293062252, "learning_rate": 3.383486173877006e-05, "loss": 0.2739, "loss_nan_ranks": 0, "loss_rank_avg": 0.12639915943145752, "step": 1615, "valid_targets_mean": 3335.2, "valid_targets_min": 804 }, { "epoch": 2.327821710999281, "grad_norm": 0.5057564917431732, "learning_rate": 3.378302392621023e-05, "loss": 0.2823, "loss_nan_ranks": 0, "loss_rank_avg": 0.15294601023197174, "step": 1620, "valid_targets_mean": 3938.2, "valid_targets_min": 612 }, { "epoch": 2.3350107836089142, "grad_norm": 0.5552358600783263, "learning_rate": 3.3731009166852234e-05, "loss": 0.2702, "loss_nan_ranks": 0, "loss_rank_avg": 0.16431793570518494, "step": 1625, "valid_targets_mean": 4337.2, "valid_targets_min": 1382 }, { "epoch": 2.342199856218548, "grad_norm": 0.4430784978799377, "learning_rate": 3.367881812846282e-05, "loss": 0.2669, "loss_nan_ranks": 0, "loss_rank_avg": 0.118332639336586, "step": 1630, "valid_targets_mean": 3640.8, "valid_targets_min": 470 }, { "epoch": 2.3493889288281813, "grad_norm": 0.492835719915706, "learning_rate": 3.362645148107183e-05, "loss": 0.2555, "loss_nan_ranks": 0, "loss_rank_avg": 0.13531847298145294, "step": 1635, "valid_targets_mean": 3750.9, "valid_targets_min": 586 }, { "epoch": 2.3565780014378146, "grad_norm": 0.49387897152804017, "learning_rate": 3.357390989696353e-05, "loss": 0.2577, "loss_nan_ranks": 0, "loss_rank_avg": 0.12371513247489929, "step": 1640, "valid_targets_mean": 3756.9, "valid_targets_min": 723 }, { "epoch": 2.363767074047448, "grad_norm": 0.5292204315605716, "learning_rate": 3.352119405066809e-05, "loss": 0.2802, "loss_nan_ranks": 0, "loss_rank_avg": 0.1294528990983963, "step": 1645, "valid_targets_mean": 3740.4, "valid_targets_min": 726 }, { "epoch": 2.370956146657081, "grad_norm": 0.5482500192647483, "learning_rate": 3.346830461895283e-05, "loss": 0.2668, "loss_nan_ranks": 0, "loss_rank_avg": 0.11841487884521484, "step": 1650, "valid_targets_mean": 3236.2, "valid_targets_min": 617 }, { "epoch": 2.3781452192667145, "grad_norm": 0.5569155952182551, "learning_rate": 3.3415242280813567e-05, "loss": 0.268, "loss_nan_ranks": 0, "loss_rank_avg": 0.16182178258895874, "step": 1655, "valid_targets_mean": 3206.0, "valid_targets_min": 643 }, { "epoch": 2.385334291876348, "grad_norm": 0.4187873978975146, "learning_rate": 3.3362007717465884e-05, "loss": 0.259, "loss_nan_ranks": 0, "loss_rank_avg": 0.12652206420898438, "step": 1660, "valid_targets_mean": 4757.6, "valid_targets_min": 995 }, { "epoch": 2.392523364485981, "grad_norm": 0.48405464845552704, "learning_rate": 3.330860161233642e-05, "loss": 0.2722, "loss_nan_ranks": 0, "loss_rank_avg": 0.13703463971614838, "step": 1665, "valid_targets_mean": 3936.0, "valid_targets_min": 779 }, { "epoch": 2.399712437095615, "grad_norm": 0.525936038970634, "learning_rate": 3.3255024651054045e-05, "loss": 0.2868, "loss_nan_ranks": 0, "loss_rank_avg": 0.1976655125617981, "step": 1670, "valid_targets_mean": 4660.8, "valid_targets_min": 2417 }, { "epoch": 2.406901509705248, "grad_norm": 0.48342772806241563, "learning_rate": 3.320127752144111e-05, "loss": 0.2653, "loss_nan_ranks": 0, "loss_rank_avg": 0.18336616456508636, "step": 1675, "valid_targets_mean": 5358.4, "valid_targets_min": 895 }, { "epoch": 2.4140905823148815, "grad_norm": 0.5414300080613395, "learning_rate": 3.314736091350458e-05, "loss": 0.2696, "loss_nan_ranks": 0, "loss_rank_avg": 0.16382211446762085, "step": 1680, "valid_targets_mean": 4076.9, "valid_targets_min": 950 }, { "epoch": 2.421279654924515, "grad_norm": 0.5247367013493369, "learning_rate": 3.3093275519427175e-05, "loss": 0.2769, "loss_nan_ranks": 0, "loss_rank_avg": 0.1400073617696762, "step": 1685, "valid_targets_mean": 3772.5, "valid_targets_min": 913 }, { "epoch": 2.428468727534148, "grad_norm": 0.5038530432636198, "learning_rate": 3.303902203355852e-05, "loss": 0.2691, "loss_nan_ranks": 0, "loss_rank_avg": 0.08247102051973343, "step": 1690, "valid_targets_mean": 2354.1, "valid_targets_min": 480 }, { "epoch": 2.4356578001437814, "grad_norm": 0.47032603091705133, "learning_rate": 3.2984601152406176e-05, "loss": 0.2538, "loss_nan_ranks": 0, "loss_rank_avg": 0.12384230643510818, "step": 1695, "valid_targets_mean": 3688.6, "valid_targets_min": 554 }, { "epoch": 2.4428468727534147, "grad_norm": 0.6205205557490409, "learning_rate": 3.293001357462676e-05, "loss": 0.2814, "loss_nan_ranks": 0, "loss_rank_avg": 0.11945857107639313, "step": 1700, "valid_targets_mean": 2112.8, "valid_targets_min": 489 }, { "epoch": 2.450035945363048, "grad_norm": 0.58735452653188, "learning_rate": 3.287526000101693e-05, "loss": 0.2828, "loss_nan_ranks": 0, "loss_rank_avg": 0.14614614844322205, "step": 1705, "valid_targets_mean": 2608.5, "valid_targets_min": 638 }, { "epoch": 2.4572250179726813, "grad_norm": 0.5529963455269361, "learning_rate": 3.28203411345044e-05, "loss": 0.2651, "loss_nan_ranks": 0, "loss_rank_avg": 0.15596972405910492, "step": 1710, "valid_targets_mean": 3632.6, "valid_targets_min": 789 }, { "epoch": 2.4644140905823146, "grad_norm": 0.46547199433659353, "learning_rate": 3.2765257680138914e-05, "loss": 0.259, "loss_nan_ranks": 0, "loss_rank_avg": 0.12506428360939026, "step": 1715, "valid_targets_mean": 4817.8, "valid_targets_min": 3107 }, { "epoch": 2.4716031631919484, "grad_norm": 0.4630677382270778, "learning_rate": 3.271001034508321e-05, "loss": 0.2755, "loss_nan_ranks": 0, "loss_rank_avg": 0.15703052282333374, "step": 1720, "valid_targets_mean": 4160.2, "valid_targets_min": 847 }, { "epoch": 2.4787922358015817, "grad_norm": 0.537284473855485, "learning_rate": 3.2654599838603934e-05, "loss": 0.2644, "loss_nan_ranks": 0, "loss_rank_avg": 0.11568139493465424, "step": 1725, "valid_targets_mean": 2814.8, "valid_targets_min": 615 }, { "epoch": 2.485981308411215, "grad_norm": 0.5363135175126315, "learning_rate": 3.259902687206251e-05, "loss": 0.2717, "loss_nan_ranks": 0, "loss_rank_avg": 0.10325951129198074, "step": 1730, "valid_targets_mean": 2743.4, "valid_targets_min": 604 }, { "epoch": 2.4931703810208483, "grad_norm": 0.49958194974316356, "learning_rate": 3.254329215890605e-05, "loss": 0.2891, "loss_nan_ranks": 0, "loss_rank_avg": 0.14953942596912384, "step": 1735, "valid_targets_mean": 4127.9, "valid_targets_min": 792 }, { "epoch": 2.5003594536304816, "grad_norm": 0.47782238311011827, "learning_rate": 3.2487396414658175e-05, "loss": 0.2583, "loss_nan_ranks": 0, "loss_rank_avg": 0.093122698366642, "step": 1740, "valid_targets_mean": 2792.6, "valid_targets_min": 766 }, { "epoch": 2.507548526240115, "grad_norm": 0.49969197033552243, "learning_rate": 3.2431340356909785e-05, "loss": 0.2698, "loss_nan_ranks": 0, "loss_rank_avg": 0.13741299510002136, "step": 1745, "valid_targets_mean": 3782.9, "valid_targets_min": 978 }, { "epoch": 2.5147375988497482, "grad_norm": 0.48532507278419035, "learning_rate": 3.2375124705309956e-05, "loss": 0.2583, "loss_nan_ranks": 0, "loss_rank_avg": 0.1263132393360138, "step": 1750, "valid_targets_mean": 3629.0, "valid_targets_min": 706 }, { "epoch": 2.521926671459382, "grad_norm": 0.4891347428964143, "learning_rate": 3.2318750181556575e-05, "loss": 0.2694, "loss_nan_ranks": 0, "loss_rank_avg": 0.13069723546504974, "step": 1755, "valid_targets_mean": 3528.9, "valid_targets_min": 708 }, { "epoch": 2.5291157440690153, "grad_norm": 0.5186284903213042, "learning_rate": 3.226221750938716e-05, "loss": 0.2768, "loss_nan_ranks": 0, "loss_rank_avg": 0.1595681756734848, "step": 1760, "valid_targets_mean": 3760.9, "valid_targets_min": 832 }, { "epoch": 2.5363048166786486, "grad_norm": 0.48093912887760065, "learning_rate": 3.220552741456954e-05, "loss": 0.2911, "loss_nan_ranks": 0, "loss_rank_avg": 0.15026655793190002, "step": 1765, "valid_targets_mean": 4527.4, "valid_targets_min": 934 }, { "epoch": 2.543493889288282, "grad_norm": 0.4814466453376168, "learning_rate": 3.214868062489254e-05, "loss": 0.2777, "loss_nan_ranks": 0, "loss_rank_avg": 0.13298210501670837, "step": 1770, "valid_targets_mean": 3778.2, "valid_targets_min": 675 }, { "epoch": 2.550682961897915, "grad_norm": 0.4969943214307037, "learning_rate": 3.209167787015663e-05, "loss": 0.2716, "loss_nan_ranks": 0, "loss_rank_avg": 0.15883077681064606, "step": 1775, "valid_targets_mean": 4380.6, "valid_targets_min": 647 }, { "epoch": 2.5578720345075485, "grad_norm": 0.4560608460390592, "learning_rate": 3.203451988216458e-05, "loss": 0.2545, "loss_nan_ranks": 0, "loss_rank_avg": 0.11129967868328094, "step": 1780, "valid_targets_mean": 3518.4, "valid_targets_min": 577 }, { "epoch": 2.565061107117182, "grad_norm": 0.5037014636875286, "learning_rate": 3.197720739471202e-05, "loss": 0.2753, "loss_nan_ranks": 0, "loss_rank_avg": 0.15875720977783203, "step": 1785, "valid_targets_mean": 4701.8, "valid_targets_min": 753 }, { "epoch": 2.572250179726815, "grad_norm": 0.472938402206803, "learning_rate": 3.1919741143578086e-05, "loss": 0.2735, "loss_nan_ranks": 0, "loss_rank_avg": 0.12956391274929047, "step": 1790, "valid_targets_mean": 4941.9, "valid_targets_min": 3822 }, { "epoch": 2.5794392523364484, "grad_norm": 0.4832272367661924, "learning_rate": 3.186212186651591e-05, "loss": 0.2772, "loss_nan_ranks": 0, "loss_rank_avg": 0.1389496773481369, "step": 1795, "valid_targets_mean": 4036.4, "valid_targets_min": 861 }, { "epoch": 2.5866283249460817, "grad_norm": 0.48575809575681733, "learning_rate": 3.1804350303243175e-05, "loss": 0.2777, "loss_nan_ranks": 0, "loss_rank_avg": 0.145027756690979, "step": 1800, "valid_targets_mean": 4709.1, "valid_targets_min": 993 }, { "epoch": 2.593817397555715, "grad_norm": 0.5342164381090817, "learning_rate": 3.174642719543262e-05, "loss": 0.2868, "loss_nan_ranks": 0, "loss_rank_avg": 0.14232099056243896, "step": 1805, "valid_targets_mean": 4011.2, "valid_targets_min": 785 }, { "epoch": 2.601006470165349, "grad_norm": 0.5409491251603485, "learning_rate": 3.168835328670252e-05, "loss": 0.2652, "loss_nan_ranks": 0, "loss_rank_avg": 0.15404319763183594, "step": 1810, "valid_targets_mean": 4418.6, "valid_targets_min": 906 }, { "epoch": 2.608195542774982, "grad_norm": 0.5368817093148895, "learning_rate": 3.1630129322607135e-05, "loss": 0.2716, "loss_nan_ranks": 0, "loss_rank_avg": 0.15413588285446167, "step": 1815, "valid_targets_mean": 3734.1, "valid_targets_min": 567 }, { "epoch": 2.6153846153846154, "grad_norm": 0.4908534227910792, "learning_rate": 3.157175605062715e-05, "loss": 0.2633, "loss_nan_ranks": 0, "loss_rank_avg": 0.11011715233325958, "step": 1820, "valid_targets_mean": 3284.6, "valid_targets_min": 545 }, { "epoch": 2.6225736879942487, "grad_norm": 0.6400744445531912, "learning_rate": 3.1513234220160046e-05, "loss": 0.2743, "loss_nan_ranks": 0, "loss_rank_avg": 0.18450883030891418, "step": 1825, "valid_targets_mean": 2911.4, "valid_targets_min": 467 }, { "epoch": 2.629762760603882, "grad_norm": 0.47741062151662667, "learning_rate": 3.145456458251052e-05, "loss": 0.2692, "loss_nan_ranks": 0, "loss_rank_avg": 0.1267721801996231, "step": 1830, "valid_targets_mean": 3127.4, "valid_targets_min": 875 }, { "epoch": 2.6369518332135153, "grad_norm": 0.5287490483158872, "learning_rate": 3.139574789088081e-05, "loss": 0.263, "loss_nan_ranks": 0, "loss_rank_avg": 0.11356522142887115, "step": 1835, "valid_targets_mean": 2696.1, "valid_targets_min": 661 }, { "epoch": 2.644140905823149, "grad_norm": 0.5207652535003496, "learning_rate": 3.133678490036105e-05, "loss": 0.2665, "loss_nan_ranks": 0, "loss_rank_avg": 0.11317160725593567, "step": 1840, "valid_targets_mean": 2998.9, "valid_targets_min": 551 }, { "epoch": 2.6513299784327824, "grad_norm": 0.49826783220149434, "learning_rate": 3.1277676367919536e-05, "loss": 0.2667, "loss_nan_ranks": 0, "loss_rank_avg": 0.12781062722206116, "step": 1845, "valid_targets_mean": 3907.8, "valid_targets_min": 804 }, { "epoch": 2.6585190510424157, "grad_norm": 0.49684271540043673, "learning_rate": 3.121842305239307e-05, "loss": 0.2546, "loss_nan_ranks": 0, "loss_rank_avg": 0.15386344492435455, "step": 1850, "valid_targets_mean": 4322.5, "valid_targets_min": 515 }, { "epoch": 2.665708123652049, "grad_norm": 0.42219428290284244, "learning_rate": 3.115902571447716e-05, "loss": 0.2651, "loss_nan_ranks": 0, "loss_rank_avg": 0.11060372740030289, "step": 1855, "valid_targets_mean": 4049.8, "valid_targets_min": 790 }, { "epoch": 2.6728971962616823, "grad_norm": 0.5333465277393413, "learning_rate": 3.109948511671628e-05, "loss": 0.2591, "loss_nan_ranks": 0, "loss_rank_avg": 0.15619201958179474, "step": 1860, "valid_targets_mean": 3500.9, "valid_targets_min": 956 }, { "epoch": 2.6800862688713156, "grad_norm": 0.5898901842447883, "learning_rate": 3.103980202349409e-05, "loss": 0.2684, "loss_nan_ranks": 0, "loss_rank_avg": 0.14231330156326294, "step": 1865, "valid_targets_mean": 4065.4, "valid_targets_min": 937 }, { "epoch": 2.687275341480949, "grad_norm": 0.5275929648717342, "learning_rate": 3.097997720102359e-05, "loss": 0.2742, "loss_nan_ranks": 0, "loss_rank_avg": 0.11855625361204147, "step": 1870, "valid_targets_mean": 2870.2, "valid_targets_min": 906 }, { "epoch": 2.6944644140905822, "grad_norm": 0.5322646973037383, "learning_rate": 3.092001141733731e-05, "loss": 0.2726, "loss_nan_ranks": 0, "loss_rank_avg": 0.1415766030550003, "step": 1875, "valid_targets_mean": 3502.4, "valid_targets_min": 551 }, { "epoch": 2.7016534867002155, "grad_norm": 0.4532218793273748, "learning_rate": 3.085990544227745e-05, "loss": 0.2762, "loss_nan_ranks": 0, "loss_rank_avg": 0.1096867173910141, "step": 1880, "valid_targets_mean": 4147.9, "valid_targets_min": 422 }, { "epoch": 2.708842559309849, "grad_norm": 0.49742211703854067, "learning_rate": 3.079966004748601e-05, "loss": 0.2722, "loss_nan_ranks": 0, "loss_rank_avg": 0.12179790437221527, "step": 1885, "valid_targets_mean": 3049.1, "valid_targets_min": 663 }, { "epoch": 2.716031631919482, "grad_norm": 0.5312740695729437, "learning_rate": 3.073927600639481e-05, "loss": 0.2619, "loss_nan_ranks": 0, "loss_rank_avg": 0.18648596107959747, "step": 1890, "valid_targets_mean": 4425.0, "valid_targets_min": 3644 }, { "epoch": 2.723220704529116, "grad_norm": 0.45492540963452555, "learning_rate": 3.0678754094215654e-05, "loss": 0.2639, "loss_nan_ranks": 0, "loss_rank_avg": 0.12681034207344055, "step": 1895, "valid_targets_mean": 4011.2, "valid_targets_min": 1087 }, { "epoch": 2.730409777138749, "grad_norm": 0.5324709930689125, "learning_rate": 3.061809508793033e-05, "loss": 0.2643, "loss_nan_ranks": 0, "loss_rank_avg": 0.1529749035835266, "step": 1900, "valid_targets_mean": 4182.0, "valid_targets_min": 969 }, { "epoch": 2.7375988497483825, "grad_norm": 0.5282988045210955, "learning_rate": 3.055729976628066e-05, "loss": 0.2582, "loss_nan_ranks": 0, "loss_rank_avg": 0.11237910389900208, "step": 1905, "valid_targets_mean": 2708.0, "valid_targets_min": 600 }, { "epoch": 2.744787922358016, "grad_norm": 0.4592623854572585, "learning_rate": 3.0496368909758448e-05, "loss": 0.2678, "loss_nan_ranks": 0, "loss_rank_avg": 0.14295190572738647, "step": 1910, "valid_targets_mean": 4066.2, "valid_targets_min": 440 }, { "epoch": 2.751976994967649, "grad_norm": 0.4288185851911634, "learning_rate": 3.0435303300595538e-05, "loss": 0.2513, "loss_nan_ranks": 0, "loss_rank_avg": 0.14109700918197632, "step": 1915, "valid_targets_mean": 4810.4, "valid_targets_min": 624 }, { "epoch": 2.7591660675772824, "grad_norm": 0.4511482248881237, "learning_rate": 3.0374103722753704e-05, "loss": 0.262, "loss_nan_ranks": 0, "loss_rank_avg": 0.11241908371448517, "step": 1920, "valid_targets_mean": 3693.0, "valid_targets_min": 833 }, { "epoch": 2.7663551401869158, "grad_norm": 0.4413291911556102, "learning_rate": 3.0312770961914623e-05, "loss": 0.2736, "loss_nan_ranks": 0, "loss_rank_avg": 0.12785547971725464, "step": 1925, "valid_targets_mean": 4205.5, "valid_targets_min": 615 }, { "epoch": 2.7735442127965495, "grad_norm": 0.44230100469185457, "learning_rate": 3.0251305805469776e-05, "loss": 0.2628, "loss_nan_ranks": 0, "loss_rank_avg": 0.13793818652629852, "step": 1930, "valid_targets_mean": 4618.0, "valid_targets_min": 3914 }, { "epoch": 2.780733285406183, "grad_norm": 0.5078636318952374, "learning_rate": 3.0189709042510345e-05, "loss": 0.2631, "loss_nan_ranks": 0, "loss_rank_avg": 0.1292886734008789, "step": 1935, "valid_targets_mean": 2961.2, "valid_targets_min": 427 }, { "epoch": 2.787922358015816, "grad_norm": 0.5115324989698494, "learning_rate": 3.012798146381709e-05, "loss": 0.2719, "loss_nan_ranks": 0, "loss_rank_avg": 0.15270881354808807, "step": 1940, "valid_targets_mean": 3834.8, "valid_targets_min": 522 }, { "epoch": 2.7951114306254494, "grad_norm": 0.4648202628041615, "learning_rate": 3.0066123861850162e-05, "loss": 0.2657, "loss_nan_ranks": 0, "loss_rank_avg": 0.10922946035861969, "step": 1945, "valid_targets_mean": 3411.1, "valid_targets_min": 858 }, { "epoch": 2.8023005032350827, "grad_norm": 0.5272395212940438, "learning_rate": 3.000413703073898e-05, "loss": 0.2664, "loss_nan_ranks": 0, "loss_rank_avg": 0.12008656561374664, "step": 1950, "valid_targets_mean": 2605.2, "valid_targets_min": 772 }, { "epoch": 2.809489575844716, "grad_norm": 0.524615079864663, "learning_rate": 2.994202176627198e-05, "loss": 0.2602, "loss_nan_ranks": 0, "loss_rank_avg": 0.134141206741333, "step": 1955, "valid_targets_mean": 3072.1, "valid_targets_min": 707 }, { "epoch": 2.8166786484543493, "grad_norm": 0.5277222260085981, "learning_rate": 2.987977886588646e-05, "loss": 0.2533, "loss_nan_ranks": 0, "loss_rank_avg": 0.11295173317193985, "step": 1960, "valid_targets_mean": 2585.8, "valid_targets_min": 456 }, { "epoch": 2.8238677210639826, "grad_norm": 0.5327387085151372, "learning_rate": 2.981740912865829e-05, "loss": 0.2709, "loss_nan_ranks": 0, "loss_rank_avg": 0.11163774132728577, "step": 1965, "valid_targets_mean": 2804.4, "valid_targets_min": 680 }, { "epoch": 2.831056793673616, "grad_norm": 0.5286702950441636, "learning_rate": 2.9754913355291687e-05, "loss": 0.2691, "loss_nan_ranks": 0, "loss_rank_avg": 0.11060294508934021, "step": 1970, "valid_targets_mean": 3187.1, "valid_targets_min": 596 }, { "epoch": 2.8382458662832493, "grad_norm": 0.48936639413972866, "learning_rate": 2.9692292348108913e-05, "loss": 0.279, "loss_nan_ranks": 0, "loss_rank_avg": 0.14475484192371368, "step": 1975, "valid_targets_mean": 3586.5, "valid_targets_min": 701 }, { "epoch": 2.8454349388928826, "grad_norm": 0.41895977374703486, "learning_rate": 2.9629546911039995e-05, "loss": 0.27, "loss_nan_ranks": 0, "loss_rank_avg": 0.1372557133436203, "step": 1980, "valid_targets_mean": 5150.8, "valid_targets_min": 4277 }, { "epoch": 2.8526240115025163, "grad_norm": 0.4623645207037126, "learning_rate": 2.9566677849612383e-05, "loss": 0.2711, "loss_nan_ranks": 0, "loss_rank_avg": 0.12075348943471909, "step": 1985, "valid_targets_mean": 2770.5, "valid_targets_min": 531 }, { "epoch": 2.8598130841121496, "grad_norm": 0.4547471741235561, "learning_rate": 2.950368597094063e-05, "loss": 0.265, "loss_nan_ranks": 0, "loss_rank_avg": 0.12804922461509705, "step": 1990, "valid_targets_mean": 4452.6, "valid_targets_min": 3473 }, { "epoch": 2.867002156721783, "grad_norm": 0.5716261379564964, "learning_rate": 2.9440572083716e-05, "loss": 0.256, "loss_nan_ranks": 0, "loss_rank_avg": 0.13049060106277466, "step": 1995, "valid_targets_mean": 3718.5, "valid_targets_min": 949 }, { "epoch": 2.8741912293314162, "grad_norm": 0.4523003790407094, "learning_rate": 2.9377336998196147e-05, "loss": 0.2638, "loss_nan_ranks": 0, "loss_rank_avg": 0.13575586676597595, "step": 2000, "valid_targets_mean": 3801.2, "valid_targets_min": 535 }, { "epoch": 2.8813803019410495, "grad_norm": 0.5916418462296764, "learning_rate": 2.931398152619462e-05, "loss": 0.2727, "loss_nan_ranks": 0, "loss_rank_avg": 0.10240516811609268, "step": 2005, "valid_targets_mean": 1806.5, "valid_targets_min": 471 }, { "epoch": 2.888569374550683, "grad_norm": 0.5087183669235579, "learning_rate": 2.925050648107053e-05, "loss": 0.2812, "loss_nan_ranks": 0, "loss_rank_avg": 0.1419801115989685, "step": 2010, "valid_targets_mean": 3731.9, "valid_targets_min": 610 }, { "epoch": 2.895758447160316, "grad_norm": 0.5450170825216338, "learning_rate": 2.9186912677718044e-05, "loss": 0.2687, "loss_nan_ranks": 0, "loss_rank_avg": 0.15140527486801147, "step": 2015, "valid_targets_mean": 3016.1, "valid_targets_min": 581 }, { "epoch": 2.90294751976995, "grad_norm": 0.5243099796515388, "learning_rate": 2.912320093255599e-05, "loss": 0.2641, "loss_nan_ranks": 0, "loss_rank_avg": 0.09774617850780487, "step": 2020, "valid_targets_mean": 2224.4, "valid_targets_min": 493 }, { "epoch": 2.910136592379583, "grad_norm": 0.4918756856019155, "learning_rate": 2.9059372063517285e-05, "loss": 0.251, "loss_nan_ranks": 0, "loss_rank_avg": 0.10992417484521866, "step": 2025, "valid_targets_mean": 3224.4, "valid_targets_min": 594 }, { "epoch": 2.9173256649892165, "grad_norm": 0.5043736261289858, "learning_rate": 2.8995426890038533e-05, "loss": 0.2732, "loss_nan_ranks": 0, "loss_rank_avg": 0.19480252265930176, "step": 2030, "valid_targets_mean": 5160.0, "valid_targets_min": 573 }, { "epoch": 2.92451473759885, "grad_norm": 0.4624647860625992, "learning_rate": 2.8931366233049415e-05, "loss": 0.2604, "loss_nan_ranks": 0, "loss_rank_avg": 0.1291601061820984, "step": 2035, "valid_targets_mean": 3699.6, "valid_targets_min": 758 }, { "epoch": 2.931703810208483, "grad_norm": 0.4567936051912573, "learning_rate": 2.8867190914962228e-05, "loss": 0.2764, "loss_nan_ranks": 0, "loss_rank_avg": 0.1221659928560257, "step": 2040, "valid_targets_mean": 3541.9, "valid_targets_min": 989 }, { "epoch": 2.9388928828181164, "grad_norm": 0.5108265761866421, "learning_rate": 2.8802901759661256e-05, "loss": 0.2693, "loss_nan_ranks": 0, "loss_rank_avg": 0.11455883830785751, "step": 2045, "valid_targets_mean": 2693.2, "valid_targets_min": 574 }, { "epoch": 2.9460819554277498, "grad_norm": 0.462539235433949, "learning_rate": 2.873849959249226e-05, "loss": 0.2688, "loss_nan_ranks": 0, "loss_rank_avg": 0.12773972749710083, "step": 2050, "valid_targets_mean": 3324.9, "valid_targets_min": 688 }, { "epoch": 2.953271028037383, "grad_norm": 0.4922307858611935, "learning_rate": 2.8673985240251835e-05, "loss": 0.2579, "loss_nan_ranks": 0, "loss_rank_avg": 0.15249422192573547, "step": 2055, "valid_targets_mean": 4484.2, "valid_targets_min": 685 }, { "epoch": 2.9604601006470164, "grad_norm": 0.5119981885399685, "learning_rate": 2.860935953117681e-05, "loss": 0.2471, "loss_nan_ranks": 0, "loss_rank_avg": 0.13160674273967743, "step": 2060, "valid_targets_mean": 3732.1, "valid_targets_min": 680 }, { "epoch": 2.9676491732566497, "grad_norm": 0.5867234583593739, "learning_rate": 2.854462329493362e-05, "loss": 0.2733, "loss_nan_ranks": 0, "loss_rank_avg": 0.13651028275489807, "step": 2065, "valid_targets_mean": 2434.2, "valid_targets_min": 840 }, { "epoch": 2.974838245866283, "grad_norm": 0.4906003413994672, "learning_rate": 2.8479777362607647e-05, "loss": 0.2633, "loss_nan_ranks": 0, "loss_rank_avg": 0.14013247191905975, "step": 2070, "valid_targets_mean": 3921.0, "valid_targets_min": 557 }, { "epoch": 2.9820273184759167, "grad_norm": 0.5123460997995863, "learning_rate": 2.8414822566692558e-05, "loss": 0.26, "loss_nan_ranks": 0, "loss_rank_avg": 0.14255797863006592, "step": 2075, "valid_targets_mean": 3564.1, "valid_targets_min": 751 }, { "epoch": 2.98921639108555, "grad_norm": 0.43494582159562417, "learning_rate": 2.8349759741079607e-05, "loss": 0.2624, "loss_nan_ranks": 0, "loss_rank_avg": 0.11678533256053925, "step": 2080, "valid_targets_mean": 4366.4, "valid_targets_min": 3042 }, { "epoch": 2.9964054636951833, "grad_norm": 0.45854822797123423, "learning_rate": 2.828458972104695e-05, "loss": 0.2528, "loss_nan_ranks": 0, "loss_rank_avg": 0.12588660418987274, "step": 2085, "valid_targets_mean": 3966.5, "valid_targets_min": 595 }, { "epoch": 3.0028756290438534, "grad_norm": 0.7069079359730072, "learning_rate": 2.8219313343248885e-05, "loss": 0.285, "loss_nan_ranks": 0, "loss_rank_avg": 0.16991043090820312, "step": 2090, "valid_targets_mean": 4596.9, "valid_targets_min": 1041 }, { "epoch": 3.0100647016534867, "grad_norm": 0.5545887030564403, "learning_rate": 2.8153931445705162e-05, "loss": 0.2568, "loss_nan_ranks": 0, "loss_rank_avg": 0.15513832867145538, "step": 2095, "valid_targets_mean": 3631.5, "valid_targets_min": 615 }, { "epoch": 3.01725377426312, "grad_norm": 0.508386475491845, "learning_rate": 2.808844486779016e-05, "loss": 0.2391, "loss_nan_ranks": 0, "loss_rank_avg": 0.13907843828201294, "step": 2100, "valid_targets_mean": 3614.2, "valid_targets_min": 315 }, { "epoch": 3.0244428468727533, "grad_norm": 0.5044166011046787, "learning_rate": 2.8022854450222182e-05, "loss": 0.2564, "loss_nan_ranks": 0, "loss_rank_avg": 0.12767350673675537, "step": 2105, "valid_targets_mean": 3602.5, "valid_targets_min": 690 }, { "epoch": 3.0316319194823866, "grad_norm": 0.4597303620877388, "learning_rate": 2.7957161035052606e-05, "loss": 0.2371, "loss_nan_ranks": 0, "loss_rank_avg": 0.1011454239487648, "step": 2110, "valid_targets_mean": 3388.5, "valid_targets_min": 693 }, { "epoch": 3.03882099209202, "grad_norm": 0.5324995493873002, "learning_rate": 2.789136546565511e-05, "loss": 0.2648, "loss_nan_ranks": 0, "loss_rank_avg": 0.15829084813594818, "step": 2115, "valid_targets_mean": 3950.1, "valid_targets_min": 641 }, { "epoch": 3.0460100647016537, "grad_norm": 0.4661168596192042, "learning_rate": 2.782546858671481e-05, "loss": 0.2447, "loss_nan_ranks": 0, "loss_rank_avg": 0.10927501320838928, "step": 2120, "valid_targets_mean": 3423.1, "valid_targets_min": 830 }, { "epoch": 3.053199137311287, "grad_norm": 0.5030757007783364, "learning_rate": 2.775947124421746e-05, "loss": 0.2555, "loss_nan_ranks": 0, "loss_rank_avg": 0.12120012938976288, "step": 2125, "valid_targets_mean": 3486.4, "valid_targets_min": 730 }, { "epoch": 3.0603882099209203, "grad_norm": 0.5093743527850355, "learning_rate": 2.7693374285438547e-05, "loss": 0.2551, "loss_nan_ranks": 0, "loss_rank_avg": 0.12037092447280884, "step": 2130, "valid_targets_mean": 3773.8, "valid_targets_min": 701 }, { "epoch": 3.0675772825305536, "grad_norm": 0.5318422279637071, "learning_rate": 2.7627178558932456e-05, "loss": 0.255, "loss_nan_ranks": 0, "loss_rank_avg": 0.12518146634101868, "step": 2135, "valid_targets_mean": 2867.9, "valid_targets_min": 736 }, { "epoch": 3.074766355140187, "grad_norm": 0.5495389139214483, "learning_rate": 2.756088491452153e-05, "loss": 0.2664, "loss_nan_ranks": 0, "loss_rank_avg": 0.17592960596084595, "step": 2140, "valid_targets_mean": 5162.5, "valid_targets_min": 617 }, { "epoch": 3.0819554277498202, "grad_norm": 0.5080084657969545, "learning_rate": 2.749449420328521e-05, "loss": 0.2489, "loss_nan_ranks": 0, "loss_rank_avg": 0.12165935337543488, "step": 2145, "valid_targets_mean": 3485.5, "valid_targets_min": 603 }, { "epoch": 3.0891445003594535, "grad_norm": 0.4581974538526893, "learning_rate": 2.742800727754906e-05, "loss": 0.2457, "loss_nan_ranks": 0, "loss_rank_avg": 0.13358767330646515, "step": 2150, "valid_targets_mean": 4797.4, "valid_targets_min": 629 }, { "epoch": 3.096333572969087, "grad_norm": 0.5293145081012333, "learning_rate": 2.7361424990873864e-05, "loss": 0.2406, "loss_nan_ranks": 0, "loss_rank_avg": 0.12826603651046753, "step": 2155, "valid_targets_mean": 3203.6, "valid_targets_min": 609 }, { "epoch": 3.10352264557872, "grad_norm": 0.5045238984815654, "learning_rate": 2.7294748198044637e-05, "loss": 0.242, "loss_nan_ranks": 0, "loss_rank_avg": 0.1334061473608017, "step": 2160, "valid_targets_mean": 3690.8, "valid_targets_min": 611 }, { "epoch": 3.110711718188354, "grad_norm": 0.5944184962075417, "learning_rate": 2.722797775505969e-05, "loss": 0.2441, "loss_nan_ranks": 0, "loss_rank_avg": 0.12685522437095642, "step": 2165, "valid_targets_mean": 3470.2, "valid_targets_min": 862 }, { "epoch": 3.117900790797987, "grad_norm": 0.5242002429250229, "learning_rate": 2.7161114519119593e-05, "loss": 0.2564, "loss_nan_ranks": 0, "loss_rank_avg": 0.18032889068126678, "step": 2170, "valid_targets_mean": 4346.6, "valid_targets_min": 567 }, { "epoch": 3.1250898634076205, "grad_norm": 0.47519017295660587, "learning_rate": 2.7094159348616203e-05, "loss": 0.2461, "loss_nan_ranks": 0, "loss_rank_avg": 0.11818739026784897, "step": 2175, "valid_targets_mean": 3679.6, "valid_targets_min": 620 }, { "epoch": 3.132278936017254, "grad_norm": 0.5510983437184556, "learning_rate": 2.702711310312164e-05, "loss": 0.2685, "loss_nan_ranks": 0, "loss_rank_avg": 0.11581596732139587, "step": 2180, "valid_targets_mean": 3518.8, "valid_targets_min": 653 }, { "epoch": 3.139468008626887, "grad_norm": 0.46201415582633937, "learning_rate": 2.6959976643377238e-05, "loss": 0.2388, "loss_nan_ranks": 0, "loss_rank_avg": 0.1287374198436737, "step": 2185, "valid_targets_mean": 4390.4, "valid_targets_min": 854 }, { "epoch": 3.1466570812365204, "grad_norm": 0.49096146703639676, "learning_rate": 2.689275083128252e-05, "loss": 0.2679, "loss_nan_ranks": 0, "loss_rank_avg": 0.12094248831272125, "step": 2190, "valid_targets_mean": 3696.8, "valid_targets_min": 368 }, { "epoch": 3.1538461538461537, "grad_norm": 0.4994916178852232, "learning_rate": 2.6825436529884094e-05, "loss": 0.2436, "loss_nan_ranks": 0, "loss_rank_avg": 0.11061419546604156, "step": 2195, "valid_targets_mean": 3000.4, "valid_targets_min": 514 }, { "epoch": 3.161035226455787, "grad_norm": 0.5036089659495702, "learning_rate": 2.6758034603364608e-05, "loss": 0.2642, "loss_nan_ranks": 0, "loss_rank_avg": 0.11006475985050201, "step": 2200, "valid_targets_mean": 3325.2, "valid_targets_min": 723 }, { "epoch": 3.1682242990654204, "grad_norm": 0.47055905502722695, "learning_rate": 2.669054591703165e-05, "loss": 0.2488, "loss_nan_ranks": 0, "loss_rank_avg": 0.12930098176002502, "step": 2205, "valid_targets_mean": 4341.8, "valid_targets_min": 938 }, { "epoch": 3.175413371675054, "grad_norm": 0.608692174157198, "learning_rate": 2.6622971337306625e-05, "loss": 0.263, "loss_nan_ranks": 0, "loss_rank_avg": 0.09900519251823425, "step": 2210, "valid_targets_mean": 1953.5, "valid_targets_min": 484 }, { "epoch": 3.1826024442846874, "grad_norm": 0.47784907638231894, "learning_rate": 2.6555311731713626e-05, "loss": 0.2501, "loss_nan_ranks": 0, "loss_rank_avg": 0.12810474634170532, "step": 2215, "valid_targets_mean": 3757.8, "valid_targets_min": 758 }, { "epoch": 3.1897915168943207, "grad_norm": 0.5130577267818007, "learning_rate": 2.6487567968868347e-05, "loss": 0.2478, "loss_nan_ranks": 0, "loss_rank_avg": 0.12371031194925308, "step": 2220, "valid_targets_mean": 3631.8, "valid_targets_min": 504 }, { "epoch": 3.196980589503954, "grad_norm": 0.4808527638754144, "learning_rate": 2.6419740918466844e-05, "loss": 0.2494, "loss_nan_ranks": 0, "loss_rank_avg": 0.09714284539222717, "step": 2225, "valid_targets_mean": 3717.6, "valid_targets_min": 586 }, { "epoch": 3.2041696621135873, "grad_norm": 0.5518930760729734, "learning_rate": 2.6351831451274477e-05, "loss": 0.2417, "loss_nan_ranks": 0, "loss_rank_avg": 0.11862578988075256, "step": 2230, "valid_targets_mean": 2508.8, "valid_targets_min": 468 }, { "epoch": 3.2113587347232206, "grad_norm": 0.4940521060256115, "learning_rate": 2.628384043911462e-05, "loss": 0.2516, "loss_nan_ranks": 0, "loss_rank_avg": 0.13668888807296753, "step": 2235, "valid_targets_mean": 4032.0, "valid_targets_min": 891 }, { "epoch": 3.218547807332854, "grad_norm": 0.5034504739886473, "learning_rate": 2.621576875485757e-05, "loss": 0.2415, "loss_nan_ranks": 0, "loss_rank_avg": 0.1095261424779892, "step": 2240, "valid_targets_mean": 3305.0, "valid_targets_min": 573 }, { "epoch": 3.2257368799424873, "grad_norm": 0.43830856076779845, "learning_rate": 2.6147617272409255e-05, "loss": 0.2542, "loss_nan_ranks": 0, "loss_rank_avg": 0.12325970083475113, "step": 2245, "valid_targets_mean": 4494.5, "valid_targets_min": 916 }, { "epoch": 3.2329259525521206, "grad_norm": 0.47839573422386605, "learning_rate": 2.6079386866700095e-05, "loss": 0.2403, "loss_nan_ranks": 0, "loss_rank_avg": 0.1166163831949234, "step": 2250, "valid_targets_mean": 3777.6, "valid_targets_min": 580 }, { "epoch": 3.2401150251617543, "grad_norm": 0.4602584782158853, "learning_rate": 2.6011078413673692e-05, "loss": 0.2531, "loss_nan_ranks": 0, "loss_rank_avg": 0.12046687304973602, "step": 2255, "valid_targets_mean": 4617.8, "valid_targets_min": 3984 }, { "epoch": 3.2473040977713876, "grad_norm": 0.4655312917452448, "learning_rate": 2.594269279027564e-05, "loss": 0.2562, "loss_nan_ranks": 0, "loss_rank_avg": 0.12522590160369873, "step": 2260, "valid_targets_mean": 4336.1, "valid_targets_min": 762 }, { "epoch": 3.254493170381021, "grad_norm": 0.48726149453285067, "learning_rate": 2.5874230874442238e-05, "loss": 0.2559, "loss_nan_ranks": 0, "loss_rank_avg": 0.15026704967021942, "step": 2265, "valid_targets_mean": 4303.4, "valid_targets_min": 895 }, { "epoch": 3.2616822429906542, "grad_norm": 0.6304249424929381, "learning_rate": 2.580569354508925e-05, "loss": 0.258, "loss_nan_ranks": 0, "loss_rank_avg": 0.13789577782154083, "step": 2270, "valid_targets_mean": 2981.5, "valid_targets_min": 639 }, { "epoch": 3.2688713156002875, "grad_norm": 0.6086760431353105, "learning_rate": 2.5737081682100575e-05, "loss": 0.2497, "loss_nan_ranks": 0, "loss_rank_avg": 0.10886932909488678, "step": 2275, "valid_targets_mean": 1702.2, "valid_targets_min": 579 }, { "epoch": 3.276060388209921, "grad_norm": 0.45586872184556493, "learning_rate": 2.5668396166316988e-05, "loss": 0.2488, "loss_nan_ranks": 0, "loss_rank_avg": 0.1350633203983307, "step": 2280, "valid_targets_mean": 5057.0, "valid_targets_min": 3466 }, { "epoch": 3.283249460819554, "grad_norm": 0.461465009195521, "learning_rate": 2.5599637879524822e-05, "loss": 0.2476, "loss_nan_ranks": 0, "loss_rank_avg": 0.12891460955142975, "step": 2285, "valid_targets_mean": 3825.4, "valid_targets_min": 636 }, { "epoch": 3.2904385334291875, "grad_norm": 0.4806164913168704, "learning_rate": 2.5530807704444646e-05, "loss": 0.2654, "loss_nan_ranks": 0, "loss_rank_avg": 0.10771054029464722, "step": 2290, "valid_targets_mean": 4006.0, "valid_targets_min": 665 }, { "epoch": 3.297627606038821, "grad_norm": 0.5441576056359098, "learning_rate": 2.5461906524719927e-05, "loss": 0.2569, "loss_nan_ranks": 0, "loss_rank_avg": 0.12522868812084198, "step": 2295, "valid_targets_mean": 3343.1, "valid_targets_min": 705 }, { "epoch": 3.3048166786484545, "grad_norm": 0.5946930017526083, "learning_rate": 2.539293522490569e-05, "loss": 0.2556, "loss_nan_ranks": 0, "loss_rank_avg": 0.1276351809501648, "step": 2300, "valid_targets_mean": 2709.4, "valid_targets_min": 639 }, { "epoch": 3.312005751258088, "grad_norm": 0.4879292674456743, "learning_rate": 2.5323894690457186e-05, "loss": 0.2501, "loss_nan_ranks": 0, "loss_rank_avg": 0.12799575924873352, "step": 2305, "valid_targets_mean": 3353.2, "valid_targets_min": 609 }, { "epoch": 3.319194823867721, "grad_norm": 0.42910242310010305, "learning_rate": 2.525478580771847e-05, "loss": 0.2388, "loss_nan_ranks": 0, "loss_rank_avg": 0.10297475755214691, "step": 2310, "valid_targets_mean": 4044.0, "valid_targets_min": 258 }, { "epoch": 3.3263838964773544, "grad_norm": 0.5347387405067475, "learning_rate": 2.5185609463911068e-05, "loss": 0.2416, "loss_nan_ranks": 0, "loss_rank_avg": 0.12474454939365387, "step": 2315, "valid_targets_mean": 4503.6, "valid_targets_min": 3153 }, { "epoch": 3.3335729690869877, "grad_norm": 0.4700670848022084, "learning_rate": 2.511636654712258e-05, "loss": 0.256, "loss_nan_ranks": 0, "loss_rank_avg": 0.10849539190530777, "step": 2320, "valid_targets_mean": 3746.0, "valid_targets_min": 684 }, { "epoch": 3.340762041696621, "grad_norm": 0.4835583524848898, "learning_rate": 2.5047057946295263e-05, "loss": 0.2557, "loss_nan_ranks": 0, "loss_rank_avg": 0.1440524011850357, "step": 2325, "valid_targets_mean": 4286.1, "valid_targets_min": 451 }, { "epoch": 3.3479511143062544, "grad_norm": 0.6506238528935938, "learning_rate": 2.4977684551214628e-05, "loss": 0.261, "loss_nan_ranks": 0, "loss_rank_avg": 0.1264440417289734, "step": 2330, "valid_targets_mean": 3910.2, "valid_targets_min": 551 }, { "epoch": 3.3551401869158877, "grad_norm": 0.5480561132118623, "learning_rate": 2.4908247252498016e-05, "loss": 0.2475, "loss_nan_ranks": 0, "loss_rank_avg": 0.12950649857521057, "step": 2335, "valid_targets_mean": 2837.0, "valid_targets_min": 724 }, { "epoch": 3.362329259525521, "grad_norm": 0.447018910737458, "learning_rate": 2.4838746941583165e-05, "loss": 0.2468, "loss_nan_ranks": 0, "loss_rank_avg": 0.10450244694948196, "step": 2340, "valid_targets_mean": 3569.1, "valid_targets_min": 791 }, { "epoch": 3.3695183321351547, "grad_norm": 0.5293944991502482, "learning_rate": 2.476918451071677e-05, "loss": 0.2584, "loss_nan_ranks": 0, "loss_rank_avg": 0.15744715929031372, "step": 2345, "valid_targets_mean": 4600.1, "valid_targets_min": 827 }, { "epoch": 3.376707404744788, "grad_norm": 0.5794346987479623, "learning_rate": 2.4699560852943015e-05, "loss": 0.2573, "loss_nan_ranks": 0, "loss_rank_avg": 0.10630621761083603, "step": 2350, "valid_targets_mean": 2537.6, "valid_targets_min": 591 }, { "epoch": 3.3838964773544213, "grad_norm": 0.567018449508628, "learning_rate": 2.4629876862092123e-05, "loss": 0.2544, "loss_nan_ranks": 0, "loss_rank_avg": 0.13535767793655396, "step": 2355, "valid_targets_mean": 3689.2, "valid_targets_min": 646 }, { "epoch": 3.3910855499640546, "grad_norm": 0.49820742830571135, "learning_rate": 2.4560133432768868e-05, "loss": 0.2567, "loss_nan_ranks": 0, "loss_rank_avg": 0.11119614541530609, "step": 2360, "valid_targets_mean": 3304.4, "valid_targets_min": 594 }, { "epoch": 3.398274622573688, "grad_norm": 0.4797249357815499, "learning_rate": 2.4490331460341112e-05, "loss": 0.2384, "loss_nan_ranks": 0, "loss_rank_avg": 0.10317108780145645, "step": 2365, "valid_targets_mean": 3439.0, "valid_targets_min": 619 }, { "epoch": 3.4054636951833213, "grad_norm": 0.5444831821184157, "learning_rate": 2.442047184092827e-05, "loss": 0.2493, "loss_nan_ranks": 0, "loss_rank_avg": 0.11617874354124069, "step": 2370, "valid_targets_mean": 3076.0, "valid_targets_min": 492 }, { "epoch": 3.4126527677929546, "grad_norm": 0.5107430646256917, "learning_rate": 2.435055547138986e-05, "loss": 0.2506, "loss_nan_ranks": 0, "loss_rank_avg": 0.124700166285038, "step": 2375, "valid_targets_mean": 3625.1, "valid_targets_min": 598 }, { "epoch": 3.419841840402588, "grad_norm": 0.5189568720557954, "learning_rate": 2.4280583249313925e-05, "loss": 0.2477, "loss_nan_ranks": 0, "loss_rank_avg": 0.14366132020950317, "step": 2380, "valid_targets_mean": 4110.0, "valid_targets_min": 610 }, { "epoch": 3.4270309130122216, "grad_norm": 0.5341482929308659, "learning_rate": 2.4210556073005574e-05, "loss": 0.2419, "loss_nan_ranks": 0, "loss_rank_avg": 0.141306534409523, "step": 2385, "valid_targets_mean": 3757.0, "valid_targets_min": 628 }, { "epoch": 3.434219985621855, "grad_norm": 0.48115635467476825, "learning_rate": 2.4140474841475414e-05, "loss": 0.2569, "loss_nan_ranks": 0, "loss_rank_avg": 0.12492194771766663, "step": 2390, "valid_targets_mean": 4349.9, "valid_targets_min": 3705 }, { "epoch": 3.4414090582314882, "grad_norm": 0.48336377937661607, "learning_rate": 2.4070340454427997e-05, "loss": 0.2635, "loss_nan_ranks": 0, "loss_rank_avg": 0.1366448700428009, "step": 2395, "valid_targets_mean": 3848.9, "valid_targets_min": 634 }, { "epoch": 3.4485981308411215, "grad_norm": 0.5304216588904245, "learning_rate": 2.4000153812250307e-05, "loss": 0.2471, "loss_nan_ranks": 0, "loss_rank_avg": 0.11717712134122849, "step": 2400, "valid_targets_mean": 2570.8, "valid_targets_min": 647 }, { "epoch": 3.455787203450755, "grad_norm": 0.6855077706341426, "learning_rate": 2.3929915816000168e-05, "loss": 0.2552, "loss_nan_ranks": 0, "loss_rank_avg": 0.15973010659217834, "step": 2405, "valid_targets_mean": 3849.2, "valid_targets_min": 810 }, { "epoch": 3.462976276060388, "grad_norm": 0.540313346399356, "learning_rate": 2.3859627367394688e-05, "loss": 0.2536, "loss_nan_ranks": 0, "loss_rank_avg": 0.1391582190990448, "step": 2410, "valid_targets_mean": 3065.8, "valid_targets_min": 635 }, { "epoch": 3.4701653486700215, "grad_norm": 0.49233214084773025, "learning_rate": 2.3789289368798697e-05, "loss": 0.2532, "loss_nan_ranks": 0, "loss_rank_avg": 0.14611698687076569, "step": 2415, "valid_targets_mean": 4553.0, "valid_targets_min": 978 }, { "epoch": 3.4773544212796548, "grad_norm": 0.4898159022933566, "learning_rate": 2.3718902723213142e-05, "loss": 0.2565, "loss_nan_ranks": 0, "loss_rank_avg": 0.13121764361858368, "step": 2420, "valid_targets_mean": 4073.2, "valid_targets_min": 632 }, { "epoch": 3.484543493889288, "grad_norm": 0.5398527086062614, "learning_rate": 2.3648468334263495e-05, "loss": 0.2531, "loss_nan_ranks": 0, "loss_rank_avg": 0.1375160962343216, "step": 2425, "valid_targets_mean": 3811.4, "valid_targets_min": 765 }, { "epoch": 3.491732566498922, "grad_norm": 0.4501147730461357, "learning_rate": 2.357798710618817e-05, "loss": 0.2526, "loss_nan_ranks": 0, "loss_rank_avg": 0.1265125274658203, "step": 2430, "valid_targets_mean": 4631.2, "valid_targets_min": 3903 }, { "epoch": 3.498921639108555, "grad_norm": 0.4518210089516425, "learning_rate": 2.3507459943826888e-05, "loss": 0.2508, "loss_nan_ranks": 0, "loss_rank_avg": 0.13443484902381897, "step": 2435, "valid_targets_mean": 4459.2, "valid_targets_min": 920 }, { "epoch": 3.5061107117181884, "grad_norm": 0.46454350403949213, "learning_rate": 2.343688775260909e-05, "loss": 0.2488, "loss_nan_ranks": 0, "loss_rank_avg": 0.10301059484481812, "step": 2440, "valid_targets_mean": 3593.6, "valid_targets_min": 615 }, { "epoch": 3.5132997843278218, "grad_norm": 0.49423402003357275, "learning_rate": 2.3366271438542287e-05, "loss": 0.2458, "loss_nan_ranks": 0, "loss_rank_avg": 0.09725943207740784, "step": 2445, "valid_targets_mean": 3318.4, "valid_targets_min": 649 }, { "epoch": 3.520488856937455, "grad_norm": 0.47637389226364873, "learning_rate": 2.3295611908200454e-05, "loss": 0.2473, "loss_nan_ranks": 0, "loss_rank_avg": 0.10003632307052612, "step": 2450, "valid_targets_mean": 3680.4, "valid_targets_min": 709 }, { "epoch": 3.5276779295470884, "grad_norm": 0.4918339024950877, "learning_rate": 2.3224910068712355e-05, "loss": 0.2521, "loss_nan_ranks": 0, "loss_rank_avg": 0.126363143324852, "step": 2455, "valid_targets_mean": 3840.5, "valid_targets_min": 576 }, { "epoch": 3.5348670021567217, "grad_norm": 0.5921138868050676, "learning_rate": 2.3154166827749947e-05, "loss": 0.2516, "loss_nan_ranks": 0, "loss_rank_avg": 0.11931576579809189, "step": 2460, "valid_targets_mean": 2681.2, "valid_targets_min": 732 }, { "epoch": 3.542056074766355, "grad_norm": 0.6086195584987955, "learning_rate": 2.3083383093516686e-05, "loss": 0.2539, "loss_nan_ranks": 0, "loss_rank_avg": 0.12224029749631882, "step": 2465, "valid_targets_mean": 3808.8, "valid_targets_min": 787 }, { "epoch": 3.5492451473759887, "grad_norm": 0.5021142253817824, "learning_rate": 2.301255977473587e-05, "loss": 0.2623, "loss_nan_ranks": 0, "loss_rank_avg": 0.11519993841648102, "step": 2470, "valid_targets_mean": 3547.0, "valid_targets_min": 693 }, { "epoch": 3.556434219985622, "grad_norm": 0.504249898299747, "learning_rate": 2.2941697780639018e-05, "loss": 0.2642, "loss_nan_ranks": 0, "loss_rank_avg": 0.11413753032684326, "step": 2475, "valid_targets_mean": 3386.0, "valid_targets_min": 713 }, { "epoch": 3.5636232925952553, "grad_norm": 0.5258515811866988, "learning_rate": 2.2870798020954127e-05, "loss": 0.2464, "loss_nan_ranks": 0, "loss_rank_avg": 0.09162728488445282, "step": 2480, "valid_targets_mean": 2764.0, "valid_targets_min": 563 }, { "epoch": 3.5708123652048886, "grad_norm": 0.45667405800785726, "learning_rate": 2.279986140589405e-05, "loss": 0.2503, "loss_nan_ranks": 0, "loss_rank_avg": 0.14917941391468048, "step": 2485, "valid_targets_mean": 4933.5, "valid_targets_min": 693 }, { "epoch": 3.578001437814522, "grad_norm": 0.47014637028947304, "learning_rate": 2.2728888846144788e-05, "loss": 0.2556, "loss_nan_ranks": 0, "loss_rank_avg": 0.12864919006824493, "step": 2490, "valid_targets_mean": 4165.1, "valid_targets_min": 752 }, { "epoch": 3.5851905104241553, "grad_norm": 0.5232237334052633, "learning_rate": 2.2657881252853792e-05, "loss": 0.2508, "loss_nan_ranks": 0, "loss_rank_avg": 0.11721894145011902, "step": 2495, "valid_targets_mean": 3049.2, "valid_targets_min": 618 }, { "epoch": 3.5923795830337886, "grad_norm": 0.48021599807423754, "learning_rate": 2.2586839537618285e-05, "loss": 0.2535, "loss_nan_ranks": 0, "loss_rank_avg": 0.10148143023252487, "step": 2500, "valid_targets_mean": 3688.9, "valid_targets_min": 525 }, { "epoch": 3.599568655643422, "grad_norm": 0.4923060580408922, "learning_rate": 2.2515764612473553e-05, "loss": 0.2422, "loss_nan_ranks": 0, "loss_rank_avg": 0.10971393436193466, "step": 2505, "valid_targets_mean": 3988.9, "valid_targets_min": 634 }, { "epoch": 3.606757728253055, "grad_norm": 0.6862438146632643, "learning_rate": 2.2444657389881203e-05, "loss": 0.263, "loss_nan_ranks": 0, "loss_rank_avg": 0.11502759903669357, "step": 2510, "valid_targets_mean": 2437.4, "valid_targets_min": 502 }, { "epoch": 3.6139468008626885, "grad_norm": 0.57899984231831, "learning_rate": 2.2373518782717513e-05, "loss": 0.2527, "loss_nan_ranks": 0, "loss_rank_avg": 0.13824304938316345, "step": 2515, "valid_targets_mean": 4252.1, "valid_targets_min": 611 }, { "epoch": 3.621135873472322, "grad_norm": 0.47585894131516004, "learning_rate": 2.2302349704261657e-05, "loss": 0.2471, "loss_nan_ranks": 0, "loss_rank_avg": 0.1324179470539093, "step": 2520, "valid_targets_mean": 4517.6, "valid_targets_min": 601 }, { "epoch": 3.6283249460819555, "grad_norm": 0.41528620994981147, "learning_rate": 2.2231151068184005e-05, "loss": 0.2408, "loss_nan_ranks": 0, "loss_rank_avg": 0.1042901873588562, "step": 2525, "valid_targets_mean": 4695.5, "valid_targets_min": 3257 }, { "epoch": 3.635514018691589, "grad_norm": 0.5069891883936893, "learning_rate": 2.2159923788534383e-05, "loss": 0.2469, "loss_nan_ranks": 0, "loss_rank_avg": 0.1232769638299942, "step": 2530, "valid_targets_mean": 3207.2, "valid_targets_min": 652 }, { "epoch": 3.642703091301222, "grad_norm": 0.43169111980404523, "learning_rate": 2.2088668779730352e-05, "loss": 0.2624, "loss_nan_ranks": 0, "loss_rank_avg": 0.11891108006238937, "step": 2535, "valid_targets_mean": 4488.8, "valid_targets_min": 933 }, { "epoch": 3.6498921639108555, "grad_norm": 0.53035855657901, "learning_rate": 2.201738695654546e-05, "loss": 0.2462, "loss_nan_ranks": 0, "loss_rank_avg": 0.12702947854995728, "step": 2540, "valid_targets_mean": 3401.8, "valid_targets_min": 1101 }, { "epoch": 3.6570812365204888, "grad_norm": 0.8015662534418149, "learning_rate": 2.1946079234097497e-05, "loss": 0.2539, "loss_nan_ranks": 0, "loss_rank_avg": 0.13921813666820526, "step": 2545, "valid_targets_mean": 4335.4, "valid_targets_min": 769 }, { "epoch": 3.664270309130122, "grad_norm": 0.529734503659625, "learning_rate": 2.1874746527836738e-05, "loss": 0.2512, "loss_nan_ranks": 0, "loss_rank_avg": 0.11016402393579483, "step": 2550, "valid_targets_mean": 2528.5, "valid_targets_min": 759 }, { "epoch": 3.671459381739756, "grad_norm": 0.6001197865922718, "learning_rate": 2.180338975353422e-05, "loss": 0.2544, "loss_nan_ranks": 0, "loss_rank_avg": 0.12066247314214706, "step": 2555, "valid_targets_mean": 2506.1, "valid_targets_min": 542 }, { "epoch": 3.678648454349389, "grad_norm": 0.46689109296603837, "learning_rate": 2.1732009827269947e-05, "loss": 0.2522, "loss_nan_ranks": 0, "loss_rank_avg": 0.11004269123077393, "step": 2560, "valid_targets_mean": 3788.0, "valid_targets_min": 833 }, { "epoch": 3.6858375269590224, "grad_norm": 0.46412325094131973, "learning_rate": 2.166060766542117e-05, "loss": 0.2399, "loss_nan_ranks": 0, "loss_rank_avg": 0.13252490758895874, "step": 2565, "valid_targets_mean": 4282.9, "valid_targets_min": 965 }, { "epoch": 3.6930265995686558, "grad_norm": 0.5207990273092182, "learning_rate": 2.1589184184650573e-05, "loss": 0.2454, "loss_nan_ranks": 0, "loss_rank_avg": 0.0916057825088501, "step": 2570, "valid_targets_mean": 2747.2, "valid_targets_min": 344 }, { "epoch": 3.700215672178289, "grad_norm": 0.5296101459863599, "learning_rate": 2.1517740301894565e-05, "loss": 0.241, "loss_nan_ranks": 0, "loss_rank_avg": 0.09578610211610794, "step": 2575, "valid_targets_mean": 2223.9, "valid_targets_min": 421 }, { "epoch": 3.7074047447879224, "grad_norm": 0.5337544782692388, "learning_rate": 2.144627693435145e-05, "loss": 0.2604, "loss_nan_ranks": 0, "loss_rank_avg": 0.1551215648651123, "step": 2580, "valid_targets_mean": 3619.0, "valid_targets_min": 630 }, { "epoch": 3.7145938173975557, "grad_norm": 0.46977810033457923, "learning_rate": 2.1374794999469683e-05, "loss": 0.2389, "loss_nan_ranks": 0, "loss_rank_avg": 0.11778691411018372, "step": 2585, "valid_targets_mean": 4017.2, "valid_targets_min": 569 }, { "epoch": 3.721782890007189, "grad_norm": 0.5369932341533742, "learning_rate": 2.1303295414936104e-05, "loss": 0.263, "loss_nan_ranks": 0, "loss_rank_avg": 0.18012884259223938, "step": 2590, "valid_targets_mean": 4391.9, "valid_targets_min": 743 }, { "epoch": 3.7289719626168223, "grad_norm": 0.5299860172850779, "learning_rate": 2.1231779098664117e-05, "loss": 0.2498, "loss_nan_ranks": 0, "loss_rank_avg": 0.13819974660873413, "step": 2595, "valid_targets_mean": 3378.9, "valid_targets_min": 652 }, { "epoch": 3.7361610352264556, "grad_norm": 0.5258708261765481, "learning_rate": 2.1160246968781946e-05, "loss": 0.2663, "loss_nan_ranks": 0, "loss_rank_avg": 0.1301390379667282, "step": 2600, "valid_targets_mean": 3329.5, "valid_targets_min": 678 }, { "epoch": 3.743350107836089, "grad_norm": 0.4743676812927684, "learning_rate": 2.1088699943620827e-05, "loss": 0.2421, "loss_nan_ranks": 0, "loss_rank_avg": 0.1157599464058876, "step": 2605, "valid_targets_mean": 3933.9, "valid_targets_min": 621 }, { "epoch": 3.7505391804457227, "grad_norm": 0.5364161202382962, "learning_rate": 2.1017138941703204e-05, "loss": 0.2744, "loss_nan_ranks": 0, "loss_rank_avg": 0.12845493853092194, "step": 2610, "valid_targets_mean": 3678.6, "valid_targets_min": 405 }, { "epoch": 3.757728253055356, "grad_norm": 0.46482943852345554, "learning_rate": 2.094556488173098e-05, "loss": 0.2514, "loss_nan_ranks": 0, "loss_rank_avg": 0.1247505247592926, "step": 2615, "valid_targets_mean": 3829.6, "valid_targets_min": 812 }, { "epoch": 3.7649173256649893, "grad_norm": 0.508770935066309, "learning_rate": 2.0873978682573684e-05, "loss": 0.2466, "loss_nan_ranks": 0, "loss_rank_avg": 0.15090303122997284, "step": 2620, "valid_targets_mean": 4160.5, "valid_targets_min": 686 }, { "epoch": 3.7721063982746226, "grad_norm": 0.493041194796532, "learning_rate": 2.0802381263256695e-05, "loss": 0.2575, "loss_nan_ranks": 0, "loss_rank_avg": 0.14253270626068115, "step": 2625, "valid_targets_mean": 3882.0, "valid_targets_min": 882 }, { "epoch": 3.779295470884256, "grad_norm": 0.4917977926190101, "learning_rate": 2.0730773542949428e-05, "loss": 0.2528, "loss_nan_ranks": 0, "loss_rank_avg": 0.1122705489397049, "step": 2630, "valid_targets_mean": 3226.6, "valid_targets_min": 540 }, { "epoch": 3.786484543493889, "grad_norm": 0.4820507926987514, "learning_rate": 2.0659156440953548e-05, "loss": 0.236, "loss_nan_ranks": 0, "loss_rank_avg": 0.09798593819141388, "step": 2635, "valid_targets_mean": 2979.9, "valid_targets_min": 700 }, { "epoch": 3.7936736161035225, "grad_norm": 0.5465128709652923, "learning_rate": 2.058753087669117e-05, "loss": 0.2699, "loss_nan_ranks": 0, "loss_rank_avg": 0.12692230939865112, "step": 2640, "valid_targets_mean": 3353.5, "valid_targets_min": 643 }, { "epoch": 3.8008626887131562, "grad_norm": 0.47851627989550993, "learning_rate": 2.0515897769693015e-05, "loss": 0.2472, "loss_nan_ranks": 0, "loss_rank_avg": 0.14869645237922668, "step": 2645, "valid_targets_mean": 4664.6, "valid_targets_min": 757 }, { "epoch": 3.8080517613227896, "grad_norm": 0.42380667956671314, "learning_rate": 2.044425803958669e-05, "loss": 0.2518, "loss_nan_ranks": 0, "loss_rank_avg": 0.11933261156082153, "step": 2650, "valid_targets_mean": 4663.6, "valid_targets_min": 3223 }, { "epoch": 3.815240833932423, "grad_norm": 0.4795587784552931, "learning_rate": 2.0372612606084784e-05, "loss": 0.2504, "loss_nan_ranks": 0, "loss_rank_avg": 0.1432308852672577, "step": 2655, "valid_targets_mean": 3894.0, "valid_targets_min": 812 }, { "epoch": 3.822429906542056, "grad_norm": 0.5626384295877633, "learning_rate": 2.030096238897314e-05, "loss": 0.2579, "loss_nan_ranks": 0, "loss_rank_avg": 0.16091012954711914, "step": 2660, "valid_targets_mean": 3704.8, "valid_targets_min": 533 }, { "epoch": 3.8296189791516895, "grad_norm": 0.8151561380660051, "learning_rate": 2.022930830809898e-05, "loss": 0.2542, "loss_nan_ranks": 0, "loss_rank_avg": 0.18149186670780182, "step": 2665, "valid_targets_mean": 4656.2, "valid_targets_min": 821 }, { "epoch": 3.836808051761323, "grad_norm": 0.4453347518556729, "learning_rate": 2.015765128335916e-05, "loss": 0.2388, "loss_nan_ranks": 0, "loss_rank_avg": 0.12284523248672485, "step": 2670, "valid_targets_mean": 4547.9, "valid_targets_min": 565 }, { "epoch": 3.843997124370956, "grad_norm": 0.43116833253695513, "learning_rate": 2.0085992234688305e-05, "loss": 0.2505, "loss_nan_ranks": 0, "loss_rank_avg": 0.14145714044570923, "step": 2675, "valid_targets_mean": 4979.5, "valid_targets_min": 3802 }, { "epoch": 3.8511861969805894, "grad_norm": 0.5595435853648367, "learning_rate": 2.0014332082047043e-05, "loss": 0.2649, "loss_nan_ranks": 0, "loss_rank_avg": 0.10264123976230621, "step": 2680, "valid_targets_mean": 2736.0, "valid_targets_min": 690 }, { "epoch": 3.8583752695902227, "grad_norm": 0.48529338510837766, "learning_rate": 1.994267174541015e-05, "loss": 0.2704, "loss_nan_ranks": 0, "loss_rank_avg": 0.1485181450843811, "step": 2685, "valid_targets_mean": 3982.6, "valid_targets_min": 579 }, { "epoch": 3.865564342199856, "grad_norm": 0.549946831719716, "learning_rate": 1.9871012144754803e-05, "loss": 0.2545, "loss_nan_ranks": 0, "loss_rank_avg": 0.11590389907360077, "step": 2690, "valid_targets_mean": 3149.9, "valid_targets_min": 576 }, { "epoch": 3.8727534148094893, "grad_norm": 0.5228093621705135, "learning_rate": 1.9799354200048687e-05, "loss": 0.2486, "loss_nan_ranks": 0, "loss_rank_avg": 0.08893737196922302, "step": 2695, "valid_targets_mean": 3057.0, "valid_targets_min": 730 }, { "epoch": 3.879942487419123, "grad_norm": 0.530256928414435, "learning_rate": 1.9727698831238265e-05, "loss": 0.2595, "loss_nan_ranks": 0, "loss_rank_avg": 0.14026793837547302, "step": 2700, "valid_targets_mean": 3831.9, "valid_targets_min": 648 }, { "epoch": 3.8871315600287564, "grad_norm": 0.4793247139706527, "learning_rate": 1.96560469582369e-05, "loss": 0.2552, "loss_nan_ranks": 0, "loss_rank_avg": 0.12756478786468506, "step": 2705, "valid_targets_mean": 4601.4, "valid_targets_min": 666 }, { "epoch": 3.8943206326383897, "grad_norm": 0.5375220032845645, "learning_rate": 1.9584399500913102e-05, "loss": 0.254, "loss_nan_ranks": 0, "loss_rank_avg": 0.13013246655464172, "step": 2710, "valid_targets_mean": 2996.8, "valid_targets_min": 485 }, { "epoch": 3.901509705248023, "grad_norm": 0.5200980131239384, "learning_rate": 1.9512757379078665e-05, "loss": 0.2426, "loss_nan_ranks": 0, "loss_rank_avg": 0.1247069388628006, "step": 2715, "valid_targets_mean": 3445.8, "valid_targets_min": 618 }, { "epoch": 3.9086987778576563, "grad_norm": 0.4778551860033752, "learning_rate": 1.9441121512476912e-05, "loss": 0.2507, "loss_nan_ranks": 0, "loss_rank_avg": 0.1516200453042984, "step": 2720, "valid_targets_mean": 4454.6, "valid_targets_min": 551 }, { "epoch": 3.9158878504672896, "grad_norm": 0.5198990277474976, "learning_rate": 1.9369492820770846e-05, "loss": 0.2534, "loss_nan_ranks": 0, "loss_rank_avg": 0.12661394476890564, "step": 2725, "valid_targets_mean": 3578.6, "valid_targets_min": 910 }, { "epoch": 3.9230769230769234, "grad_norm": 1.2379830764042923, "learning_rate": 1.9297872223531358e-05, "loss": 0.2536, "loss_nan_ranks": 0, "loss_rank_avg": 0.10750366747379303, "step": 2730, "valid_targets_mean": 2653.1, "valid_targets_min": 503 }, { "epoch": 3.9302659956865567, "grad_norm": 0.45535127246041973, "learning_rate": 1.922626064022544e-05, "loss": 0.2419, "loss_nan_ranks": 0, "loss_rank_avg": 0.12956029176712036, "step": 2735, "valid_targets_mean": 5278.4, "valid_targets_min": 998 }, { "epoch": 3.93745506829619, "grad_norm": 0.5503012132360744, "learning_rate": 1.9154658990204338e-05, "loss": 0.2485, "loss_nan_ranks": 0, "loss_rank_avg": 0.14677077531814575, "step": 2740, "valid_targets_mean": 2994.5, "valid_targets_min": 635 }, { "epoch": 3.9446441409058233, "grad_norm": 0.521779712095191, "learning_rate": 1.9083068192691792e-05, "loss": 0.2448, "loss_nan_ranks": 0, "loss_rank_avg": 0.10208123177289963, "step": 2745, "valid_targets_mean": 2528.6, "valid_targets_min": 767 }, { "epoch": 3.9518332135154566, "grad_norm": 0.5576470665601292, "learning_rate": 1.9011489166772204e-05, "loss": 0.2599, "loss_nan_ranks": 0, "loss_rank_avg": 0.1775783747434616, "step": 2750, "valid_targets_mean": 4281.1, "valid_targets_min": 656 }, { "epoch": 3.95902228612509, "grad_norm": 0.5764471708270146, "learning_rate": 1.8939922831378865e-05, "loss": 0.2532, "loss_nan_ranks": 0, "loss_rank_avg": 0.09720412641763687, "step": 2755, "valid_targets_mean": 2658.6, "valid_targets_min": 721 }, { "epoch": 3.966211358734723, "grad_norm": 0.4811282846227278, "learning_rate": 1.8868370105282135e-05, "loss": 0.2533, "loss_nan_ranks": 0, "loss_rank_avg": 0.10778206586837769, "step": 2760, "valid_targets_mean": 3013.0, "valid_targets_min": 735 }, { "epoch": 3.9734004313443565, "grad_norm": 0.4976074155858476, "learning_rate": 1.8796831907077664e-05, "loss": 0.2583, "loss_nan_ranks": 0, "loss_rank_avg": 0.1072898805141449, "step": 2765, "valid_targets_mean": 2946.6, "valid_targets_min": 596 }, { "epoch": 3.98058950395399, "grad_norm": 0.46716125855521695, "learning_rate": 1.8725309155174586e-05, "loss": 0.2481, "loss_nan_ranks": 0, "loss_rank_avg": 0.1110248863697052, "step": 2770, "valid_targets_mean": 3359.4, "valid_targets_min": 876 }, { "epoch": 3.987778576563623, "grad_norm": 0.4514491824659271, "learning_rate": 1.8653802767783745e-05, "loss": 0.2456, "loss_nan_ranks": 0, "loss_rank_avg": 0.11654454469680786, "step": 2775, "valid_targets_mean": 4018.5, "valid_targets_min": 2968 }, { "epoch": 3.9949676491732564, "grad_norm": 0.5225982018438619, "learning_rate": 1.858231366290588e-05, "loss": 0.254, "loss_nan_ranks": 0, "loss_rank_avg": 0.0763361006975174, "step": 2780, "valid_targets_mean": 2114.1, "valid_targets_min": 756 }, { "epoch": 4.0014378145219265, "grad_norm": 0.45800317656753836, "learning_rate": 1.851084275831987e-05, "loss": 0.2363, "loss_nan_ranks": 0, "loss_rank_avg": 0.12621906399726868, "step": 2785, "valid_targets_mean": 3660.4, "valid_targets_min": 715 }, { "epoch": 4.00862688713156, "grad_norm": 0.4664591476372027, "learning_rate": 1.8439390971570945e-05, "loss": 0.2395, "loss_nan_ranks": 0, "loss_rank_avg": 0.13776497542858124, "step": 2790, "valid_targets_mean": 4713.0, "valid_targets_min": 601 }, { "epoch": 4.015815959741193, "grad_norm": 0.4389595253807518, "learning_rate": 1.836795921995889e-05, "loss": 0.2271, "loss_nan_ranks": 0, "loss_rank_avg": 0.08556051552295685, "step": 2795, "valid_targets_mean": 4176.5, "valid_targets_min": 3879 }, { "epoch": 4.023005032350826, "grad_norm": 0.5259882713055396, "learning_rate": 1.829654842052627e-05, "loss": 0.2338, "loss_nan_ranks": 0, "loss_rank_avg": 0.10955113172531128, "step": 2800, "valid_targets_mean": 3373.2, "valid_targets_min": 587 }, { "epoch": 4.03019410496046, "grad_norm": 0.4907017624215909, "learning_rate": 1.8225159490046677e-05, "loss": 0.229, "loss_nan_ranks": 0, "loss_rank_avg": 0.09427815675735474, "step": 2805, "valid_targets_mean": 2864.4, "valid_targets_min": 473 }, { "epoch": 4.037383177570093, "grad_norm": 0.5215374767845408, "learning_rate": 1.8153793345012948e-05, "loss": 0.2346, "loss_nan_ranks": 0, "loss_rank_avg": 0.15280203521251678, "step": 2810, "valid_targets_mean": 4268.6, "valid_targets_min": 761 }, { "epoch": 4.044572250179727, "grad_norm": 0.5415288675373113, "learning_rate": 1.8082450901625398e-05, "loss": 0.2354, "loss_nan_ranks": 0, "loss_rank_avg": 0.1138095110654831, "step": 2815, "valid_targets_mean": 2448.5, "valid_targets_min": 556 }, { "epoch": 4.0517613227893605, "grad_norm": 0.5781808878438677, "learning_rate": 1.8011133075780055e-05, "loss": 0.2371, "loss_nan_ranks": 0, "loss_rank_avg": 0.13912703096866608, "step": 2820, "valid_targets_mean": 3542.9, "valid_targets_min": 639 }, { "epoch": 4.058950395398994, "grad_norm": 0.5703158966366867, "learning_rate": 1.7939840783056918e-05, "loss": 0.2548, "loss_nan_ranks": 0, "loss_rank_avg": 0.1219850406050682, "step": 2825, "valid_targets_mean": 3617.2, "valid_targets_min": 597 }, { "epoch": 4.066139468008627, "grad_norm": 0.47744619786924974, "learning_rate": 1.7868574938708173e-05, "loss": 0.2378, "loss_nan_ranks": 0, "loss_rank_avg": 0.13453617691993713, "step": 2830, "valid_targets_mean": 4905.6, "valid_targets_min": 4107 }, { "epoch": 4.07332854061826, "grad_norm": 0.5329830970965606, "learning_rate": 1.779733645764649e-05, "loss": 0.2418, "loss_nan_ranks": 0, "loss_rank_avg": 0.14756852388381958, "step": 2835, "valid_targets_mean": 3957.4, "valid_targets_min": 682 }, { "epoch": 4.080517613227894, "grad_norm": 0.5576027992717706, "learning_rate": 1.772612625443321e-05, "loss": 0.2386, "loss_nan_ranks": 0, "loss_rank_avg": 0.1192103773355484, "step": 2840, "valid_targets_mean": 2559.9, "valid_targets_min": 759 }, { "epoch": 4.087706685837527, "grad_norm": 0.5100156431566057, "learning_rate": 1.7654945243266676e-05, "loss": 0.2386, "loss_nan_ranks": 0, "loss_rank_avg": 0.08618389070034027, "step": 2845, "valid_targets_mean": 3077.9, "valid_targets_min": 568 }, { "epoch": 4.09489575844716, "grad_norm": 0.5340345118577982, "learning_rate": 1.7583794337970452e-05, "loss": 0.2376, "loss_nan_ranks": 0, "loss_rank_avg": 0.14345303177833557, "step": 2850, "valid_targets_mean": 4346.1, "valid_targets_min": 1311 }, { "epoch": 4.102084831056794, "grad_norm": 0.4751066918549571, "learning_rate": 1.751267445198159e-05, "loss": 0.221, "loss_nan_ranks": 0, "loss_rank_avg": 0.11668483912944794, "step": 2855, "valid_targets_mean": 4779.1, "valid_targets_min": 3563 }, { "epoch": 4.109273903666427, "grad_norm": 0.5336703193480168, "learning_rate": 1.7441586498338933e-05, "loss": 0.2331, "loss_nan_ranks": 0, "loss_rank_avg": 0.12484841048717499, "step": 2860, "valid_targets_mean": 3494.9, "valid_targets_min": 640 }, { "epoch": 4.11646297627606, "grad_norm": 0.5501336623672213, "learning_rate": 1.7370531389671362e-05, "loss": 0.2436, "loss_nan_ranks": 0, "loss_rank_avg": 0.14683029055595398, "step": 2865, "valid_targets_mean": 3951.5, "valid_targets_min": 1163 }, { "epoch": 4.123652048885694, "grad_norm": 0.4575645222074036, "learning_rate": 1.7299510038186105e-05, "loss": 0.2362, "loss_nan_ranks": 0, "loss_rank_avg": 0.12655046582221985, "step": 2870, "valid_targets_mean": 4511.2, "valid_targets_min": 664 }, { "epoch": 4.130841121495327, "grad_norm": 0.4774593976400927, "learning_rate": 1.7228523355657007e-05, "loss": 0.234, "loss_nan_ranks": 0, "loss_rank_avg": 0.09447678923606873, "step": 2875, "valid_targets_mean": 3125.4, "valid_targets_min": 681 }, { "epoch": 4.13803019410496, "grad_norm": 0.5194608985400685, "learning_rate": 1.7157572253412837e-05, "loss": 0.2343, "loss_nan_ranks": 0, "loss_rank_avg": 0.12980666756629944, "step": 2880, "valid_targets_mean": 3581.4, "valid_targets_min": 742 }, { "epoch": 4.1452192667145935, "grad_norm": 0.509774077422665, "learning_rate": 1.7086657642325568e-05, "loss": 0.2298, "loss_nan_ranks": 0, "loss_rank_avg": 0.13197895884513855, "step": 2885, "valid_targets_mean": 4029.1, "valid_targets_min": 861 }, { "epoch": 4.152408339324227, "grad_norm": 0.5297749408912853, "learning_rate": 1.7015780432798727e-05, "loss": 0.2416, "loss_nan_ranks": 0, "loss_rank_avg": 0.09195668995380402, "step": 2890, "valid_targets_mean": 2926.8, "valid_targets_min": 664 }, { "epoch": 4.15959741193386, "grad_norm": 0.5090609267845478, "learning_rate": 1.694494153475565e-05, "loss": 0.2388, "loss_nan_ranks": 0, "loss_rank_avg": 0.09950702637434006, "step": 2895, "valid_targets_mean": 3153.4, "valid_targets_min": 257 }, { "epoch": 4.166786484543494, "grad_norm": 0.5818668202631337, "learning_rate": 1.6874141857627846e-05, "loss": 0.2379, "loss_nan_ranks": 0, "loss_rank_avg": 0.1345033049583435, "step": 2900, "valid_targets_mean": 3743.4, "valid_targets_min": 651 }, { "epoch": 4.173975557153128, "grad_norm": 0.5817354875875417, "learning_rate": 1.6803382310343307e-05, "loss": 0.2395, "loss_nan_ranks": 0, "loss_rank_avg": 0.12657590210437775, "step": 2905, "valid_targets_mean": 2877.4, "valid_targets_min": 537 }, { "epoch": 4.181164629762761, "grad_norm": 0.5317207649090678, "learning_rate": 1.6732663801314827e-05, "loss": 0.2396, "loss_nan_ranks": 0, "loss_rank_avg": 0.10397838056087494, "step": 2910, "valid_targets_mean": 2906.8, "valid_targets_min": 683 }, { "epoch": 4.188353702372394, "grad_norm": 0.535580648009678, "learning_rate": 1.6661987238428355e-05, "loss": 0.2441, "loss_nan_ranks": 0, "loss_rank_avg": 0.1221417486667633, "step": 2915, "valid_targets_mean": 3189.6, "valid_targets_min": 670 }, { "epoch": 4.1955427749820275, "grad_norm": 0.5363296910044444, "learning_rate": 1.6591353529031334e-05, "loss": 0.2421, "loss_nan_ranks": 0, "loss_rank_avg": 0.11720272898674011, "step": 2920, "valid_targets_mean": 3409.9, "valid_targets_min": 647 }, { "epoch": 4.202731847591661, "grad_norm": 0.5406261463557596, "learning_rate": 1.6520763579921048e-05, "loss": 0.2418, "loss_nan_ranks": 0, "loss_rank_avg": 0.11183007061481476, "step": 2925, "valid_targets_mean": 3812.8, "valid_targets_min": 518 }, { "epoch": 4.209920920201294, "grad_norm": 0.48867123793633094, "learning_rate": 1.6450218297333e-05, "loss": 0.2324, "loss_nan_ranks": 0, "loss_rank_avg": 0.09008172154426575, "step": 2930, "valid_targets_mean": 2935.0, "valid_targets_min": 621 }, { "epoch": 4.2171099928109275, "grad_norm": 0.5048761048747257, "learning_rate": 1.6379718586929235e-05, "loss": 0.2349, "loss_nan_ranks": 0, "loss_rank_avg": 0.13712650537490845, "step": 2935, "valid_targets_mean": 4341.1, "valid_targets_min": 564 }, { "epoch": 4.224299065420561, "grad_norm": 0.4903661529952285, "learning_rate": 1.6309265353786777e-05, "loss": 0.2429, "loss_nan_ranks": 0, "loss_rank_avg": 0.12769557535648346, "step": 2940, "valid_targets_mean": 4333.5, "valid_targets_min": 548 }, { "epoch": 4.231488138030194, "grad_norm": 0.5150498165284755, "learning_rate": 1.6238859502385943e-05, "loss": 0.2445, "loss_nan_ranks": 0, "loss_rank_avg": 0.07896912097930908, "step": 2945, "valid_targets_mean": 2458.0, "valid_targets_min": 230 }, { "epoch": 4.238677210639827, "grad_norm": 0.5953862527405311, "learning_rate": 1.6168501936598783e-05, "loss": 0.2439, "loss_nan_ranks": 0, "loss_rank_avg": 0.12767180800437927, "step": 2950, "valid_targets_mean": 3435.4, "valid_targets_min": 711 }, { "epoch": 4.245866283249461, "grad_norm": 0.5210564257953418, "learning_rate": 1.609819355967744e-05, "loss": 0.2522, "loss_nan_ranks": 0, "loss_rank_avg": 0.1351774036884308, "step": 2955, "valid_targets_mean": 4328.6, "valid_targets_min": 582 }, { "epoch": 4.253055355859094, "grad_norm": 0.5229807638300585, "learning_rate": 1.6027935274242575e-05, "loss": 0.236, "loss_nan_ranks": 0, "loss_rank_avg": 0.09753084182739258, "step": 2960, "valid_targets_mean": 2665.4, "valid_targets_min": 528 }, { "epoch": 4.260244428468727, "grad_norm": 0.4864103710763143, "learning_rate": 1.5957727982271788e-05, "loss": 0.2331, "loss_nan_ranks": 0, "loss_rank_avg": 0.10253024846315384, "step": 2965, "valid_targets_mean": 3451.0, "valid_targets_min": 720 }, { "epoch": 4.267433501078361, "grad_norm": 0.5549949272831466, "learning_rate": 1.5887572585087995e-05, "loss": 0.243, "loss_nan_ranks": 0, "loss_rank_avg": 0.08487284183502197, "step": 2970, "valid_targets_mean": 2780.6, "valid_targets_min": 542 }, { "epoch": 4.274622573687994, "grad_norm": 0.45558638561523057, "learning_rate": 1.5817469983347912e-05, "loss": 0.2374, "loss_nan_ranks": 0, "loss_rank_avg": 0.12247081845998764, "step": 2975, "valid_targets_mean": 4601.6, "valid_targets_min": 1034 }, { "epoch": 4.281811646297627, "grad_norm": 0.5024007698937418, "learning_rate": 1.5747421077030442e-05, "loss": 0.2412, "loss_nan_ranks": 0, "loss_rank_avg": 0.10787507891654968, "step": 2980, "valid_targets_mean": 3700.0, "valid_targets_min": 606 }, { "epoch": 4.2890007189072605, "grad_norm": 0.5082106914176634, "learning_rate": 1.5677426765425166e-05, "loss": 0.2354, "loss_nan_ranks": 0, "loss_rank_avg": 0.11795713007450104, "step": 2985, "valid_targets_mean": 3604.4, "valid_targets_min": 731 }, { "epoch": 4.296189791516895, "grad_norm": 0.4499094022949875, "learning_rate": 1.5607487947120766e-05, "loss": 0.2334, "loss_nan_ranks": 0, "loss_rank_avg": 0.1429499387741089, "step": 2990, "valid_targets_mean": 5784.1, "valid_targets_min": 3691 }, { "epoch": 4.303378864126528, "grad_norm": 0.43554600462791326, "learning_rate": 1.55376055199935e-05, "loss": 0.2356, "loss_nan_ranks": 0, "loss_rank_avg": 0.13606850802898407, "step": 2995, "valid_targets_mean": 5484.5, "valid_targets_min": 4161 }, { "epoch": 4.310567936736161, "grad_norm": 0.48479942765593714, "learning_rate": 1.5467780381195675e-05, "loss": 0.2388, "loss_nan_ranks": 0, "loss_rank_avg": 0.09615229070186615, "step": 3000, "valid_targets_mean": 3328.8, "valid_targets_min": 546 }, { "epoch": 4.317757009345795, "grad_norm": 0.5483839501262737, "learning_rate": 1.5398013427144136e-05, "loss": 0.2413, "loss_nan_ranks": 0, "loss_rank_avg": 0.13533805310726166, "step": 3005, "valid_targets_mean": 3739.2, "valid_targets_min": 528 }, { "epoch": 4.324946081955428, "grad_norm": 0.5325384384939251, "learning_rate": 1.5328305553508737e-05, "loss": 0.2354, "loss_nan_ranks": 0, "loss_rank_avg": 0.10858841985464096, "step": 3010, "valid_targets_mean": 3556.6, "valid_targets_min": 867 }, { "epoch": 4.332135154565061, "grad_norm": 0.488394898199471, "learning_rate": 1.5258657655200862e-05, "loss": 0.244, "loss_nan_ranks": 0, "loss_rank_avg": 0.11653181165456772, "step": 3015, "valid_targets_mean": 3955.2, "valid_targets_min": 557 }, { "epoch": 4.339324227174695, "grad_norm": 0.5105599359428391, "learning_rate": 1.5189070626361941e-05, "loss": 0.2349, "loss_nan_ranks": 0, "loss_rank_avg": 0.12870097160339355, "step": 3020, "valid_targets_mean": 4240.0, "valid_targets_min": 702 }, { "epoch": 4.346513299784328, "grad_norm": 0.5715965859853566, "learning_rate": 1.5119545360351957e-05, "loss": 0.2403, "loss_nan_ranks": 0, "loss_rank_avg": 0.15724487602710724, "step": 3025, "valid_targets_mean": 3764.2, "valid_targets_min": 566 }, { "epoch": 4.353702372393961, "grad_norm": 0.5896736194868126, "learning_rate": 1.505008274973796e-05, "loss": 0.234, "loss_nan_ranks": 0, "loss_rank_avg": 0.13168630003929138, "step": 3030, "valid_targets_mean": 3176.2, "valid_targets_min": 633 }, { "epoch": 4.3608914450035945, "grad_norm": 0.5156466323454092, "learning_rate": 1.4980683686282657e-05, "loss": 0.2363, "loss_nan_ranks": 0, "loss_rank_avg": 0.12574413418769836, "step": 3035, "valid_targets_mean": 3254.2, "valid_targets_min": 645 }, { "epoch": 4.368080517613228, "grad_norm": 0.47988451535887794, "learning_rate": 1.4911349060932909e-05, "loss": 0.2285, "loss_nan_ranks": 0, "loss_rank_avg": 0.11421344429254532, "step": 3040, "valid_targets_mean": 4213.0, "valid_targets_min": 732 }, { "epoch": 4.375269590222861, "grad_norm": 0.5042870458706878, "learning_rate": 1.484207976380834e-05, "loss": 0.2482, "loss_nan_ranks": 0, "loss_rank_avg": 0.1530284583568573, "step": 3045, "valid_targets_mean": 4835.0, "valid_targets_min": 918 }, { "epoch": 4.382458662832494, "grad_norm": 0.536704227286159, "learning_rate": 1.4772876684189879e-05, "loss": 0.234, "loss_nan_ranks": 0, "loss_rank_avg": 0.13965827226638794, "step": 3050, "valid_targets_mean": 3876.8, "valid_targets_min": 423 }, { "epoch": 4.389647735442128, "grad_norm": 0.46602382013395727, "learning_rate": 1.4703740710508352e-05, "loss": 0.2346, "loss_nan_ranks": 0, "loss_rank_avg": 0.12959733605384827, "step": 3055, "valid_targets_mean": 5016.6, "valid_targets_min": 4090 }, { "epoch": 4.396836808051761, "grad_norm": 0.5514211790349896, "learning_rate": 1.4634672730333079e-05, "loss": 0.2308, "loss_nan_ranks": 0, "loss_rank_avg": 0.125798761844635, "step": 3060, "valid_targets_mean": 3335.4, "valid_targets_min": 727 }, { "epoch": 4.404025880661394, "grad_norm": 0.5827049576069567, "learning_rate": 1.4565673630360482e-05, "loss": 0.2392, "loss_nan_ranks": 0, "loss_rank_avg": 0.09962286055088043, "step": 3065, "valid_targets_mean": 2581.2, "valid_targets_min": 580 }, { "epoch": 4.411214953271028, "grad_norm": 0.47939759496807005, "learning_rate": 1.4496744296402686e-05, "loss": 0.2365, "loss_nan_ranks": 0, "loss_rank_avg": 0.0976216048002243, "step": 3070, "valid_targets_mean": 3415.2, "valid_targets_min": 691 }, { "epoch": 4.418404025880662, "grad_norm": 0.502919510044186, "learning_rate": 1.4427885613376176e-05, "loss": 0.2404, "loss_nan_ranks": 0, "loss_rank_avg": 0.10967571288347244, "step": 3075, "valid_targets_mean": 3390.2, "valid_targets_min": 559 }, { "epoch": 4.425593098490295, "grad_norm": 0.6305898129788904, "learning_rate": 1.4359098465290401e-05, "loss": 0.2399, "loss_nan_ranks": 0, "loss_rank_avg": 0.10862769186496735, "step": 3080, "valid_targets_mean": 2415.8, "valid_targets_min": 786 }, { "epoch": 4.4327821710999284, "grad_norm": 0.5575222975267811, "learning_rate": 1.4290383735236453e-05, "loss": 0.2287, "loss_nan_ranks": 0, "loss_rank_avg": 0.10775524377822876, "step": 3085, "valid_targets_mean": 3085.9, "valid_targets_min": 611 }, { "epoch": 4.439971243709562, "grad_norm": 0.49802953687828977, "learning_rate": 1.4221742305375716e-05, "loss": 0.2307, "loss_nan_ranks": 0, "loss_rank_avg": 0.0978183001279831, "step": 3090, "valid_targets_mean": 2689.6, "valid_targets_min": 538 }, { "epoch": 4.447160316319195, "grad_norm": 0.5756490270686243, "learning_rate": 1.4153175056928543e-05, "loss": 0.2356, "loss_nan_ranks": 0, "loss_rank_avg": 0.09058581292629242, "step": 3095, "valid_targets_mean": 2022.0, "valid_targets_min": 522 }, { "epoch": 4.454349388928828, "grad_norm": 0.5208077664252705, "learning_rate": 1.408468287016295e-05, "loss": 0.2396, "loss_nan_ranks": 0, "loss_rank_avg": 0.12745115160942078, "step": 3100, "valid_targets_mean": 3539.4, "valid_targets_min": 602 }, { "epoch": 4.461538461538462, "grad_norm": 0.4377191730808559, "learning_rate": 1.4016266624383299e-05, "loss": 0.2311, "loss_nan_ranks": 0, "loss_rank_avg": 0.11340028047561646, "step": 3105, "valid_targets_mean": 4446.4, "valid_targets_min": 680 }, { "epoch": 4.468727534148095, "grad_norm": 0.7054657373358831, "learning_rate": 1.3947927197919038e-05, "loss": 0.2476, "loss_nan_ranks": 0, "loss_rank_avg": 0.14070342481136322, "step": 3110, "valid_targets_mean": 2662.5, "valid_targets_min": 507 }, { "epoch": 4.475916606757728, "grad_norm": 0.518522447767955, "learning_rate": 1.387966546811338e-05, "loss": 0.2415, "loss_nan_ranks": 0, "loss_rank_avg": 0.14628420770168304, "step": 3115, "valid_targets_mean": 4294.0, "valid_targets_min": 675 }, { "epoch": 4.483105679367362, "grad_norm": 0.45175962309797224, "learning_rate": 1.3811482311312092e-05, "loss": 0.2308, "loss_nan_ranks": 0, "loss_rank_avg": 0.1265779733657837, "step": 3120, "valid_targets_mean": 4493.6, "valid_targets_min": 3468 }, { "epoch": 4.490294751976995, "grad_norm": 0.5802694137312429, "learning_rate": 1.3743378602852201e-05, "loss": 0.2391, "loss_nan_ranks": 0, "loss_rank_avg": 0.10025407373905182, "step": 3125, "valid_targets_mean": 2324.8, "valid_targets_min": 722 }, { "epoch": 4.497483824586628, "grad_norm": 0.5255053806019105, "learning_rate": 1.3675355217050781e-05, "loss": 0.2338, "loss_nan_ranks": 0, "loss_rank_avg": 0.1405080258846283, "step": 3130, "valid_targets_mean": 4538.6, "valid_targets_min": 814 }, { "epoch": 4.5046728971962615, "grad_norm": 0.5595718040895143, "learning_rate": 1.360741302719373e-05, "loss": 0.2333, "loss_nan_ranks": 0, "loss_rank_avg": 0.13758280873298645, "step": 3135, "valid_targets_mean": 3494.5, "valid_targets_min": 627 }, { "epoch": 4.511861969805895, "grad_norm": 0.49673632869856904, "learning_rate": 1.3539552905524542e-05, "loss": 0.2347, "loss_nan_ranks": 0, "loss_rank_avg": 0.12679347395896912, "step": 3140, "valid_targets_mean": 4069.8, "valid_targets_min": 455 }, { "epoch": 4.519051042415528, "grad_norm": 0.4796342803182259, "learning_rate": 1.347177572323311e-05, "loss": 0.2279, "loss_nan_ranks": 0, "loss_rank_avg": 0.11640562862157822, "step": 3145, "valid_targets_mean": 3925.0, "valid_targets_min": 954 }, { "epoch": 4.526240115025161, "grad_norm": 0.49543130568416427, "learning_rate": 1.340408235044457e-05, "loss": 0.2416, "loss_nan_ranks": 0, "loss_rank_avg": 0.1236979067325592, "step": 3150, "valid_targets_mean": 3800.5, "valid_targets_min": 791 }, { "epoch": 4.533429187634795, "grad_norm": 0.45765247970692274, "learning_rate": 1.3336473656208084e-05, "loss": 0.2324, "loss_nan_ranks": 0, "loss_rank_avg": 0.12283189594745636, "step": 3155, "valid_targets_mean": 4273.1, "valid_targets_min": 877 }, { "epoch": 4.540618260244429, "grad_norm": 0.5129923770235678, "learning_rate": 1.326895050848573e-05, "loss": 0.2357, "loss_nan_ranks": 0, "loss_rank_avg": 0.13487502932548523, "step": 3160, "valid_targets_mean": 4268.9, "valid_targets_min": 3321 }, { "epoch": 4.547807332854061, "grad_norm": 0.44141191686175985, "learning_rate": 1.3201513774141321e-05, "loss": 0.2438, "loss_nan_ranks": 0, "loss_rank_avg": 0.12209541350603104, "step": 3165, "valid_targets_mean": 4852.6, "valid_targets_min": 1859 }, { "epoch": 4.5549964054636956, "grad_norm": 0.4942636534490483, "learning_rate": 1.3134164318929314e-05, "loss": 0.2361, "loss_nan_ranks": 0, "loss_rank_avg": 0.09581250697374344, "step": 3170, "valid_targets_mean": 3307.5, "valid_targets_min": 689 }, { "epoch": 4.562185478073329, "grad_norm": 0.47384730378168516, "learning_rate": 1.306690300748365e-05, "loss": 0.234, "loss_nan_ranks": 0, "loss_rank_avg": 0.13601398468017578, "step": 3175, "valid_targets_mean": 4708.5, "valid_targets_min": 3342 }, { "epoch": 4.569374550682962, "grad_norm": 0.5943206386606482, "learning_rate": 1.2999730703306697e-05, "loss": 0.2379, "loss_nan_ranks": 0, "loss_rank_avg": 0.12636137008666992, "step": 3180, "valid_targets_mean": 3298.8, "valid_targets_min": 552 }, { "epoch": 4.5765636232925955, "grad_norm": 0.5239127580206798, "learning_rate": 1.2932648268758132e-05, "loss": 0.2399, "loss_nan_ranks": 0, "loss_rank_avg": 0.16251717507839203, "step": 3185, "valid_targets_mean": 5176.2, "valid_targets_min": 859 }, { "epoch": 4.583752695902229, "grad_norm": 0.4661488811609455, "learning_rate": 1.2865656565043896e-05, "loss": 0.2413, "loss_nan_ranks": 0, "loss_rank_avg": 0.11450262367725372, "step": 3190, "valid_targets_mean": 4073.1, "valid_targets_min": 1440 }, { "epoch": 4.590941768511862, "grad_norm": 0.509066791632617, "learning_rate": 1.2798756452205119e-05, "loss": 0.2517, "loss_nan_ranks": 0, "loss_rank_avg": 0.104307621717453, "step": 3195, "valid_targets_mean": 3497.1, "valid_targets_min": 651 }, { "epoch": 4.598130841121495, "grad_norm": 0.4906266924266068, "learning_rate": 1.273194878910708e-05, "loss": 0.2346, "loss_nan_ranks": 0, "loss_rank_avg": 0.1050233393907547, "step": 3200, "valid_targets_mean": 3821.8, "valid_targets_min": 987 }, { "epoch": 4.605319913731129, "grad_norm": 0.5811645770283341, "learning_rate": 1.2665234433428197e-05, "loss": 0.2382, "loss_nan_ranks": 0, "loss_rank_avg": 0.10122254490852356, "step": 3205, "valid_targets_mean": 2902.4, "valid_targets_min": 620 }, { "epoch": 4.612508986340762, "grad_norm": 0.4816881331945686, "learning_rate": 1.2598614241648996e-05, "loss": 0.2344, "loss_nan_ranks": 0, "loss_rank_avg": 0.12213660031557083, "step": 3210, "valid_targets_mean": 3917.1, "valid_targets_min": 821 }, { "epoch": 4.619698058950395, "grad_norm": 0.610812993328097, "learning_rate": 1.2532089069041132e-05, "loss": 0.2359, "loss_nan_ranks": 0, "loss_rank_avg": 0.1288452297449112, "step": 3215, "valid_targets_mean": 3823.6, "valid_targets_min": 794 }, { "epoch": 4.626887131560029, "grad_norm": 0.44024322286663997, "learning_rate": 1.246565976965639e-05, "loss": 0.2382, "loss_nan_ranks": 0, "loss_rank_avg": 0.1286042183637619, "step": 3220, "valid_targets_mean": 5272.4, "valid_targets_min": 4339 }, { "epoch": 4.634076204169662, "grad_norm": 0.5473777106333456, "learning_rate": 1.2399327196315751e-05, "loss": 0.2505, "loss_nan_ranks": 0, "loss_rank_avg": 0.18179279565811157, "step": 3225, "valid_targets_mean": 4101.0, "valid_targets_min": 700 }, { "epoch": 4.641265276779295, "grad_norm": 0.4742924751198838, "learning_rate": 1.2333092200598402e-05, "loss": 0.2373, "loss_nan_ranks": 0, "loss_rank_avg": 0.11457015573978424, "step": 3230, "valid_targets_mean": 4462.1, "valid_targets_min": 748 }, { "epoch": 4.6484543493889285, "grad_norm": 0.48078713086524894, "learning_rate": 1.2266955632830846e-05, "loss": 0.2329, "loss_nan_ranks": 0, "loss_rank_avg": 0.1189941018819809, "step": 3235, "valid_targets_mean": 3519.9, "valid_targets_min": 620 }, { "epoch": 4.655643421998562, "grad_norm": 0.5044909830237237, "learning_rate": 1.220091834207595e-05, "loss": 0.2297, "loss_nan_ranks": 0, "loss_rank_avg": 0.13733816146850586, "step": 3240, "valid_targets_mean": 4848.1, "valid_targets_min": 885 }, { "epoch": 4.662832494608195, "grad_norm": 0.6257029056964695, "learning_rate": 1.2134981176122068e-05, "loss": 0.2433, "loss_nan_ranks": 0, "loss_rank_avg": 0.12326426804065704, "step": 3245, "valid_targets_mean": 2731.6, "valid_targets_min": 521 }, { "epoch": 4.6700215672178285, "grad_norm": 0.49878248364441824, "learning_rate": 1.2069144981472151e-05, "loss": 0.2372, "loss_nan_ranks": 0, "loss_rank_avg": 0.11302924901247025, "step": 3250, "valid_targets_mean": 3593.5, "valid_targets_min": 584 }, { "epoch": 4.677210639827463, "grad_norm": 0.5530561603271289, "learning_rate": 1.2003410603332886e-05, "loss": 0.236, "loss_nan_ranks": 0, "loss_rank_avg": 0.09142284095287323, "step": 3255, "valid_targets_mean": 2795.4, "valid_targets_min": 644 }, { "epoch": 4.684399712437096, "grad_norm": 0.4944302859327403, "learning_rate": 1.1937778885603808e-05, "loss": 0.2403, "loss_nan_ranks": 0, "loss_rank_avg": 0.12129175662994385, "step": 3260, "valid_targets_mean": 3967.4, "valid_targets_min": 817 }, { "epoch": 4.691588785046729, "grad_norm": 0.4862312666118715, "learning_rate": 1.187225067086653e-05, "loss": 0.2392, "loss_nan_ranks": 0, "loss_rank_avg": 0.10455331951379776, "step": 3265, "valid_targets_mean": 3429.9, "valid_targets_min": 602 }, { "epoch": 4.698777857656363, "grad_norm": 0.4994833360624931, "learning_rate": 1.1806826800373863e-05, "loss": 0.2316, "loss_nan_ranks": 0, "loss_rank_avg": 0.12258949130773544, "step": 3270, "valid_targets_mean": 3713.8, "valid_targets_min": 774 }, { "epoch": 4.705966930265996, "grad_norm": 0.49940999662894353, "learning_rate": 1.1741508114039064e-05, "loss": 0.2462, "loss_nan_ranks": 0, "loss_rank_avg": 0.12433376908302307, "step": 3275, "valid_targets_mean": 4469.5, "valid_targets_min": 583 }, { "epoch": 4.713156002875629, "grad_norm": 0.5623276876572705, "learning_rate": 1.1676295450425026e-05, "loss": 0.2379, "loss_nan_ranks": 0, "loss_rank_avg": 0.1007264107465744, "step": 3280, "valid_targets_mean": 2477.0, "valid_targets_min": 727 }, { "epoch": 4.7203450754852625, "grad_norm": 0.555739824339317, "learning_rate": 1.1611189646733502e-05, "loss": 0.2371, "loss_nan_ranks": 0, "loss_rank_avg": 0.12210990488529205, "step": 3285, "valid_targets_mean": 3138.5, "valid_targets_min": 651 }, { "epoch": 4.727534148094896, "grad_norm": 0.4994433206664333, "learning_rate": 1.1546191538794417e-05, "loss": 0.238, "loss_nan_ranks": 0, "loss_rank_avg": 0.0810234323143959, "step": 3290, "valid_targets_mean": 3035.2, "valid_targets_min": 555 }, { "epoch": 4.734723220704529, "grad_norm": 0.4854393794231303, "learning_rate": 1.1481301961055058e-05, "loss": 0.2403, "loss_nan_ranks": 0, "loss_rank_avg": 0.10804124176502228, "step": 3295, "valid_targets_mean": 3984.9, "valid_targets_min": 411 }, { "epoch": 4.741912293314162, "grad_norm": 0.5717087891184073, "learning_rate": 1.14165217465694e-05, "loss": 0.2359, "loss_nan_ranks": 0, "loss_rank_avg": 0.11047998070716858, "step": 3300, "valid_targets_mean": 2894.4, "valid_targets_min": 761 }, { "epoch": 4.749101365923796, "grad_norm": 0.5418658879133041, "learning_rate": 1.1351851726987441e-05, "loss": 0.2391, "loss_nan_ranks": 0, "loss_rank_avg": 0.14435940980911255, "step": 3305, "valid_targets_mean": 3214.9, "valid_targets_min": 604 }, { "epoch": 4.756290438533429, "grad_norm": 0.44613577875582505, "learning_rate": 1.1287292732544462e-05, "loss": 0.231, "loss_nan_ranks": 0, "loss_rank_avg": 0.11927706003189087, "step": 3310, "valid_targets_mean": 3904.1, "valid_targets_min": 708 }, { "epoch": 4.763479511143062, "grad_norm": 0.49545137174974385, "learning_rate": 1.1222845592050416e-05, "loss": 0.2386, "loss_nan_ranks": 0, "loss_rank_avg": 0.1117856502532959, "step": 3315, "valid_targets_mean": 4137.6, "valid_targets_min": 926 }, { "epoch": 4.770668583752696, "grad_norm": 0.44613604063424483, "learning_rate": 1.1158511132879254e-05, "loss": 0.2341, "loss_nan_ranks": 0, "loss_rank_avg": 0.08571384847164154, "step": 3320, "valid_targets_mean": 3550.2, "valid_targets_min": 524 }, { "epoch": 4.777857656362329, "grad_norm": 0.5561329176868874, "learning_rate": 1.109429018095836e-05, "loss": 0.2566, "loss_nan_ranks": 0, "loss_rank_avg": 0.174579918384552, "step": 3325, "valid_targets_mean": 3782.0, "valid_targets_min": 632 }, { "epoch": 4.785046728971962, "grad_norm": 0.5036404755895384, "learning_rate": 1.1030183560757873e-05, "loss": 0.2264, "loss_nan_ranks": 0, "loss_rank_avg": 0.10416017472743988, "step": 3330, "valid_targets_mean": 3204.6, "valid_targets_min": 801 }, { "epoch": 4.792235801581596, "grad_norm": 0.5301785485503443, "learning_rate": 1.0966192095280148e-05, "loss": 0.2381, "loss_nan_ranks": 0, "loss_rank_avg": 0.1077873557806015, "step": 3335, "valid_targets_mean": 3394.2, "valid_targets_min": 493 }, { "epoch": 4.79942487419123, "grad_norm": 0.5472468768495766, "learning_rate": 1.090231660604918e-05, "loss": 0.2369, "loss_nan_ranks": 0, "loss_rank_avg": 0.10582281649112701, "step": 3340, "valid_targets_mean": 2981.2, "valid_targets_min": 715 }, { "epoch": 4.806613946800863, "grad_norm": 0.5841063617132195, "learning_rate": 1.0838557913100074e-05, "loss": 0.2427, "loss_nan_ranks": 0, "loss_rank_avg": 0.08225120604038239, "step": 3345, "valid_targets_mean": 2107.0, "valid_targets_min": 456 }, { "epoch": 4.813803019410496, "grad_norm": 0.5072600809639856, "learning_rate": 1.0774916834968484e-05, "loss": 0.2362, "loss_nan_ranks": 0, "loss_rank_avg": 0.10606703162193298, "step": 3350, "valid_targets_mean": 3230.5, "valid_targets_min": 655 }, { "epoch": 4.82099209202013, "grad_norm": 0.5454695842764663, "learning_rate": 1.0711394188680117e-05, "loss": 0.246, "loss_nan_ranks": 0, "loss_rank_avg": 0.09919101744890213, "step": 3355, "valid_targets_mean": 2742.1, "valid_targets_min": 614 }, { "epoch": 4.828181164629763, "grad_norm": 0.577090532210789, "learning_rate": 1.0647990789740269e-05, "loss": 0.2447, "loss_nan_ranks": 0, "loss_rank_avg": 0.14345696568489075, "step": 3360, "valid_targets_mean": 3700.5, "valid_targets_min": 614 }, { "epoch": 4.835370237239396, "grad_norm": 0.599439746241527, "learning_rate": 1.058470745212333e-05, "loss": 0.2335, "loss_nan_ranks": 0, "loss_rank_avg": 0.1152365431189537, "step": 3365, "valid_targets_mean": 3038.6, "valid_targets_min": 637 }, { "epoch": 4.84255930984903, "grad_norm": 0.4796989899141097, "learning_rate": 1.0521544988262335e-05, "loss": 0.2353, "loss_nan_ranks": 0, "loss_rank_avg": 0.08579153567552567, "step": 3370, "valid_targets_mean": 3213.6, "valid_targets_min": 609 }, { "epoch": 4.849748382458663, "grad_norm": 0.6490810772399019, "learning_rate": 1.0458504209038533e-05, "loss": 0.248, "loss_nan_ranks": 0, "loss_rank_avg": 0.14216336607933044, "step": 3375, "valid_targets_mean": 2942.9, "valid_targets_min": 557 }, { "epoch": 4.856937455068296, "grad_norm": 0.4870269459652767, "learning_rate": 1.0395585923770981e-05, "loss": 0.2499, "loss_nan_ranks": 0, "loss_rank_avg": 0.09269210696220398, "step": 3380, "valid_targets_mean": 3761.9, "valid_targets_min": 629 }, { "epoch": 4.8641265276779295, "grad_norm": 0.46747238467905033, "learning_rate": 1.0332790940206183e-05, "loss": 0.2318, "loss_nan_ranks": 0, "loss_rank_avg": 0.1230100691318512, "step": 3385, "valid_targets_mean": 4636.8, "valid_targets_min": 2480 }, { "epoch": 4.871315600287563, "grad_norm": 0.6495857497948903, "learning_rate": 1.0270120064507664e-05, "loss": 0.2396, "loss_nan_ranks": 0, "loss_rank_avg": 0.1402766853570938, "step": 3390, "valid_targets_mean": 4321.4, "valid_targets_min": 1066 }, { "epoch": 4.878504672897196, "grad_norm": 0.47843085114562955, "learning_rate": 1.0207574101245661e-05, "loss": 0.2317, "loss_nan_ranks": 0, "loss_rank_avg": 0.09787297248840332, "step": 3395, "valid_targets_mean": 3257.5, "valid_targets_min": 860 }, { "epoch": 4.885693745506829, "grad_norm": 0.4826999323999703, "learning_rate": 1.0145153853386764e-05, "loss": 0.2448, "loss_nan_ranks": 0, "loss_rank_avg": 0.08830671012401581, "step": 3400, "valid_targets_mean": 2271.1, "valid_targets_min": 582 }, { "epoch": 4.892882818116463, "grad_norm": 0.4933668590281263, "learning_rate": 1.0082860122283667e-05, "loss": 0.2362, "loss_nan_ranks": 0, "loss_rank_avg": 0.14057773351669312, "step": 3405, "valid_targets_mean": 4368.4, "valid_targets_min": 775 }, { "epoch": 4.900071890726096, "grad_norm": 0.5820889582759022, "learning_rate": 1.0020693707664799e-05, "loss": 0.255, "loss_nan_ranks": 0, "loss_rank_avg": 0.11664923280477524, "step": 3410, "valid_targets_mean": 3539.9, "valid_targets_min": 670 }, { "epoch": 4.907260963335729, "grad_norm": 0.48946946217080056, "learning_rate": 9.958655407624103e-06, "loss": 0.2438, "loss_nan_ranks": 0, "loss_rank_avg": 0.09979799389839172, "step": 3415, "valid_targets_mean": 3043.6, "valid_targets_min": 688 }, { "epoch": 4.914450035945363, "grad_norm": 0.5073233040403398, "learning_rate": 9.89674601861081e-06, "loss": 0.2378, "loss_nan_ranks": 0, "loss_rank_avg": 0.11947494745254517, "step": 3420, "valid_targets_mean": 4196.5, "valid_targets_min": 1035 }, { "epoch": 4.921639108554997, "grad_norm": 0.7177282984792761, "learning_rate": 9.83496633541916e-06, "loss": 0.2398, "loss_nan_ranks": 0, "loss_rank_avg": 0.12936556339263916, "step": 3425, "valid_targets_mean": 3776.4, "valid_targets_min": 842 }, { "epoch": 4.928828181164629, "grad_norm": 0.5118285957400573, "learning_rate": 9.773317151178239e-06, "loss": 0.2351, "loss_nan_ranks": 0, "loss_rank_avg": 0.13362133502960205, "step": 3430, "valid_targets_mean": 4502.4, "valid_targets_min": 779 }, { "epoch": 4.9360172537742635, "grad_norm": 0.5443810213820736, "learning_rate": 9.711799257341772e-06, "loss": 0.2419, "loss_nan_ranks": 0, "loss_rank_avg": 0.10535494983196259, "step": 3435, "valid_targets_mean": 3771.1, "valid_targets_min": 673 }, { "epoch": 4.943206326383897, "grad_norm": 0.5591247338648125, "learning_rate": 9.650413443678e-06, "loss": 0.2324, "loss_nan_ranks": 0, "loss_rank_avg": 0.13685429096221924, "step": 3440, "valid_targets_mean": 3843.8, "valid_targets_min": 979 }, { "epoch": 4.95039539899353, "grad_norm": 0.4678569233701499, "learning_rate": 9.58916049825949e-06, "loss": 0.2227, "loss_nan_ranks": 0, "loss_rank_avg": 0.1224527508020401, "step": 3445, "valid_targets_mean": 4677.8, "valid_targets_min": 3661 }, { "epoch": 4.957584471603163, "grad_norm": 0.5440934246700909, "learning_rate": 9.528041207453056e-06, "loss": 0.2513, "loss_nan_ranks": 0, "loss_rank_avg": 0.15713685750961304, "step": 3450, "valid_targets_mean": 5048.0, "valid_targets_min": 965 }, { "epoch": 4.964773544212797, "grad_norm": 0.49743408684165086, "learning_rate": 9.467056355909639e-06, "loss": 0.255, "loss_nan_ranks": 0, "loss_rank_avg": 0.08757054060697556, "step": 3455, "valid_targets_mean": 3058.4, "valid_targets_min": 412 }, { "epoch": 4.97196261682243, "grad_norm": 0.48083670685811697, "learning_rate": 9.40620672655427e-06, "loss": 0.2324, "loss_nan_ranks": 0, "loss_rank_avg": 0.10417330265045166, "step": 3460, "valid_targets_mean": 3597.5, "valid_targets_min": 682 }, { "epoch": 4.979151689432063, "grad_norm": 0.5179283083362081, "learning_rate": 9.34549310057597e-06, "loss": 0.2301, "loss_nan_ranks": 0, "loss_rank_avg": 0.11766026169061661, "step": 3465, "valid_targets_mean": 3463.0, "valid_targets_min": 675 }, { "epoch": 4.986340762041697, "grad_norm": 0.4837812594204367, "learning_rate": 9.284916257417746e-06, "loss": 0.2413, "loss_nan_ranks": 0, "loss_rank_avg": 0.18496853113174438, "step": 3470, "valid_targets_mean": 5729.2, "valid_targets_min": 950 }, { "epoch": 4.99352983465133, "grad_norm": 0.4904953793566584, "learning_rate": 9.2244769747666e-06, "loss": 0.2311, "loss_nan_ranks": 0, "loss_rank_avg": 0.135883167386055, "step": 3475, "valid_targets_mean": 4532.1, "valid_targets_min": 761 }, { "epoch": 5.0, "grad_norm": 0.7004899366166182, "learning_rate": 9.16417602854353e-06, "loss": 0.2355, "loss_nan_ranks": 0, "loss_rank_avg": 0.21526622772216797, "step": 3480, "valid_targets_mean": 3061.6, "valid_targets_min": 677 }, { "epoch": 5.007189072609633, "grad_norm": 0.5375983632773035, "learning_rate": 9.104014192893547e-06, "loss": 0.2368, "loss_nan_ranks": 0, "loss_rank_avg": 0.13673044741153717, "step": 3485, "valid_targets_mean": 3982.0, "valid_targets_min": 862 }, { "epoch": 5.014378145219267, "grad_norm": 0.5074525307969784, "learning_rate": 9.04399224017577e-06, "loss": 0.2235, "loss_nan_ranks": 0, "loss_rank_avg": 0.08781856298446655, "step": 3490, "valid_targets_mean": 2563.9, "valid_targets_min": 565 }, { "epoch": 5.0215672178289, "grad_norm": 0.5226625346422593, "learning_rate": 8.984110940953485e-06, "loss": 0.2242, "loss_nan_ranks": 0, "loss_rank_avg": 0.11326141655445099, "step": 3495, "valid_targets_mean": 4074.4, "valid_targets_min": 662 }, { "epoch": 5.028756290438533, "grad_norm": 0.5085797015984954, "learning_rate": 8.924371063984294e-06, "loss": 0.2147, "loss_nan_ranks": 0, "loss_rank_avg": 0.11057010293006897, "step": 3500, "valid_targets_mean": 4120.9, "valid_targets_min": 455 }, { "epoch": 5.0359453630481665, "grad_norm": 0.4769148575385776, "learning_rate": 8.86477337621019e-06, "loss": 0.2151, "loss_nan_ranks": 0, "loss_rank_avg": 0.12291170656681061, "step": 3505, "valid_targets_mean": 4678.4, "valid_targets_min": 3405 }, { "epoch": 5.0431344356578, "grad_norm": 0.5564512722540663, "learning_rate": 8.805318642747746e-06, "loss": 0.2339, "loss_nan_ranks": 0, "loss_rank_avg": 0.11856968700885773, "step": 3510, "valid_targets_mean": 3500.5, "valid_targets_min": 624 }, { "epoch": 5.050323508267433, "grad_norm": 0.5566437898397325, "learning_rate": 8.746007626878274e-06, "loss": 0.2425, "loss_nan_ranks": 0, "loss_rank_avg": 0.10583490133285522, "step": 3515, "valid_targets_mean": 3376.5, "valid_targets_min": 747 }, { "epoch": 5.0575125808770665, "grad_norm": 0.6086364544635542, "learning_rate": 8.686841090038066e-06, "loss": 0.2325, "loss_nan_ranks": 0, "loss_rank_avg": 0.12775224447250366, "step": 3520, "valid_targets_mean": 3280.1, "valid_targets_min": 551 }, { "epoch": 5.064701653486701, "grad_norm": 0.5185408192200104, "learning_rate": 8.627819791808557e-06, "loss": 0.2315, "loss_nan_ranks": 0, "loss_rank_avg": 0.1279093325138092, "step": 3525, "valid_targets_mean": 4133.9, "valid_targets_min": 487 }, { "epoch": 5.071890726096334, "grad_norm": 0.5301333550786779, "learning_rate": 8.568944489906608e-06, "loss": 0.2409, "loss_nan_ranks": 0, "loss_rank_avg": 0.13012029230594635, "step": 3530, "valid_targets_mean": 4145.6, "valid_targets_min": 893 }, { "epoch": 5.079079798705967, "grad_norm": 0.5183690582049101, "learning_rate": 8.510215940174802e-06, "loss": 0.228, "loss_nan_ranks": 0, "loss_rank_avg": 0.13085518777370453, "step": 3535, "valid_targets_mean": 5321.9, "valid_targets_min": 597 }, { "epoch": 5.086268871315601, "grad_norm": 0.4579516502915308, "learning_rate": 8.45163489657169e-06, "loss": 0.2168, "loss_nan_ranks": 0, "loss_rank_avg": 0.11568126827478409, "step": 3540, "valid_targets_mean": 3944.9, "valid_targets_min": 731 }, { "epoch": 5.093457943925234, "grad_norm": 0.5507002546950306, "learning_rate": 8.393202111162139e-06, "loss": 0.2257, "loss_nan_ranks": 0, "loss_rank_avg": 0.09243332594633102, "step": 3545, "valid_targets_mean": 3075.0, "valid_targets_min": 591 }, { "epoch": 5.100647016534867, "grad_norm": 0.5383009778697873, "learning_rate": 8.334918334107673e-06, "loss": 0.2229, "loss_nan_ranks": 0, "loss_rank_avg": 0.1040419340133667, "step": 3550, "valid_targets_mean": 3633.8, "valid_targets_min": 711 }, { "epoch": 5.1078360891445005, "grad_norm": 0.5757360955048402, "learning_rate": 8.276784313656857e-06, "loss": 0.2266, "loss_nan_ranks": 0, "loss_rank_avg": 0.11551609635353088, "step": 3555, "valid_targets_mean": 3326.9, "valid_targets_min": 601 }, { "epoch": 5.115025161754134, "grad_norm": 0.5291511551810913, "learning_rate": 8.218800796135666e-06, "loss": 0.2415, "loss_nan_ranks": 0, "loss_rank_avg": 0.1199103370308876, "step": 3560, "valid_targets_mean": 3476.9, "valid_targets_min": 635 }, { "epoch": 5.122214234363767, "grad_norm": 0.5415093823430597, "learning_rate": 8.16096852593791e-06, "loss": 0.2292, "loss_nan_ranks": 0, "loss_rank_avg": 0.1012372300028801, "step": 3565, "valid_targets_mean": 3252.1, "valid_targets_min": 616 }, { "epoch": 5.1294033069734, "grad_norm": 0.5573860753092026, "learning_rate": 8.103288245515681e-06, "loss": 0.2188, "loss_nan_ranks": 0, "loss_rank_avg": 0.1514764130115509, "step": 3570, "valid_targets_mean": 5006.4, "valid_targets_min": 879 }, { "epoch": 5.136592379583034, "grad_norm": 0.5223848215183271, "learning_rate": 8.045760695369847e-06, "loss": 0.2436, "loss_nan_ranks": 0, "loss_rank_avg": 0.12808704376220703, "step": 3575, "valid_targets_mean": 4967.6, "valid_targets_min": 471 }, { "epoch": 5.143781452192667, "grad_norm": 0.5143444928109423, "learning_rate": 7.988386614040494e-06, "loss": 0.2233, "loss_nan_ranks": 0, "loss_rank_avg": 0.1381615698337555, "step": 3580, "valid_targets_mean": 4538.1, "valid_targets_min": 849 }, { "epoch": 5.1509705248023, "grad_norm": 0.5182514437257415, "learning_rate": 7.931166738097475e-06, "loss": 0.2274, "loss_nan_ranks": 0, "loss_rank_avg": 0.09853020310401917, "step": 3585, "valid_targets_mean": 2926.4, "valid_targets_min": 568 }, { "epoch": 5.158159597411934, "grad_norm": 0.5520568816361435, "learning_rate": 7.874101802130962e-06, "loss": 0.2257, "loss_nan_ranks": 0, "loss_rank_avg": 0.1408407986164093, "step": 3590, "valid_targets_mean": 4108.1, "valid_targets_min": 572 }, { "epoch": 5.165348670021567, "grad_norm": 0.5558116754962581, "learning_rate": 7.817192538742006e-06, "loss": 0.233, "loss_nan_ranks": 0, "loss_rank_avg": 0.14348295331001282, "step": 3595, "valid_targets_mean": 4215.8, "valid_targets_min": 581 }, { "epoch": 5.1725377426312, "grad_norm": 0.4732036564036685, "learning_rate": 7.760439678533116e-06, "loss": 0.228, "loss_nan_ranks": 0, "loss_rank_avg": 0.10638897120952606, "step": 3600, "valid_targets_mean": 4069.9, "valid_targets_min": 655 }, { "epoch": 5.179726815240834, "grad_norm": 0.46187611868482703, "learning_rate": 7.703843950098896e-06, "loss": 0.2335, "loss_nan_ranks": 0, "loss_rank_avg": 0.12339513003826141, "step": 3605, "valid_targets_mean": 4986.5, "valid_targets_min": 3772 }, { "epoch": 5.186915887850467, "grad_norm": 0.47709162253072873, "learning_rate": 7.647406080016689e-06, "loss": 0.2196, "loss_nan_ranks": 0, "loss_rank_avg": 0.10468283295631409, "step": 3610, "valid_targets_mean": 4060.6, "valid_targets_min": 516 }, { "epoch": 5.194104960460101, "grad_norm": 0.4666448228118238, "learning_rate": 7.59112679283726e-06, "loss": 0.2173, "loss_nan_ranks": 0, "loss_rank_avg": 0.10728386789560318, "step": 3615, "valid_targets_mean": 4606.5, "valid_targets_min": 689 }, { "epoch": 5.201294033069734, "grad_norm": 0.47925545974428047, "learning_rate": 7.535006811075472e-06, "loss": 0.223, "loss_nan_ranks": 0, "loss_rank_avg": 0.14180710911750793, "step": 3620, "valid_targets_mean": 5071.1, "valid_targets_min": 572 }, { "epoch": 5.208483105679368, "grad_norm": 0.580957255481736, "learning_rate": 7.479046855201018e-06, "loss": 0.2353, "loss_nan_ranks": 0, "loss_rank_avg": 0.17155005037784576, "step": 3625, "valid_targets_mean": 4656.0, "valid_targets_min": 604 }, { "epoch": 5.215672178289001, "grad_norm": 0.5079874024744255, "learning_rate": 7.4232476436291766e-06, "loss": 0.2267, "loss_nan_ranks": 0, "loss_rank_avg": 0.1037202775478363, "step": 3630, "valid_targets_mean": 3508.1, "valid_targets_min": 818 }, { "epoch": 5.222861250898634, "grad_norm": 0.5341354860008051, "learning_rate": 7.3676098927116e-06, "loss": 0.2247, "loss_nan_ranks": 0, "loss_rank_avg": 0.12585100531578064, "step": 3635, "valid_targets_mean": 3564.9, "valid_targets_min": 802 }, { "epoch": 5.230050323508268, "grad_norm": 0.654732208865685, "learning_rate": 7.312134316727093e-06, "loss": 0.2392, "loss_nan_ranks": 0, "loss_rank_avg": 0.1112690344452858, "step": 3640, "valid_targets_mean": 4563.2, "valid_targets_min": 897 }, { "epoch": 5.237239396117901, "grad_norm": 0.627062993991902, "learning_rate": 7.256821627872448e-06, "loss": 0.2247, "loss_nan_ranks": 0, "loss_rank_avg": 0.12680819630622864, "step": 3645, "valid_targets_mean": 3043.4, "valid_targets_min": 493 }, { "epoch": 5.244428468727534, "grad_norm": 0.4696774303220318, "learning_rate": 7.2016725362533276e-06, "loss": 0.2213, "loss_nan_ranks": 0, "loss_rank_avg": 0.09891338646411896, "step": 3650, "valid_targets_mean": 3879.6, "valid_targets_min": 661 }, { "epoch": 5.2516175413371675, "grad_norm": 0.5242072466435919, "learning_rate": 7.146687749875116e-06, "loss": 0.2287, "loss_nan_ranks": 0, "loss_rank_avg": 0.13201574981212616, "step": 3655, "valid_targets_mean": 5096.6, "valid_targets_min": 693 }, { "epoch": 5.258806613946801, "grad_norm": 0.5949854365395237, "learning_rate": 7.091867974633841e-06, "loss": 0.2456, "loss_nan_ranks": 0, "loss_rank_avg": 0.10788040608167648, "step": 3660, "valid_targets_mean": 2561.8, "valid_targets_min": 558 }, { "epoch": 5.265995686556434, "grad_norm": 0.5240634062040213, "learning_rate": 7.037213914307115e-06, "loss": 0.2244, "loss_nan_ranks": 0, "loss_rank_avg": 0.10503746569156647, "step": 3665, "valid_targets_mean": 3181.1, "valid_targets_min": 523 }, { "epoch": 5.273184759166067, "grad_norm": 0.5267318614037361, "learning_rate": 6.9827262705451105e-06, "loss": 0.2194, "loss_nan_ranks": 0, "loss_rank_avg": 0.1396285593509674, "step": 3670, "valid_targets_mean": 4749.4, "valid_targets_min": 656 }, { "epoch": 5.280373831775701, "grad_norm": 0.47731072982521167, "learning_rate": 6.928405742861526e-06, "loss": 0.2229, "loss_nan_ranks": 0, "loss_rank_avg": 0.1177634596824646, "step": 3675, "valid_targets_mean": 4171.5, "valid_targets_min": 464 }, { "epoch": 5.287562904385334, "grad_norm": 0.5068202864119911, "learning_rate": 6.874253028624625e-06, "loss": 0.2189, "loss_nan_ranks": 0, "loss_rank_avg": 0.10211893916130066, "step": 3680, "valid_targets_mean": 3619.4, "valid_targets_min": 902 }, { "epoch": 5.294751976994967, "grad_norm": 0.5016652817729716, "learning_rate": 6.820268823048266e-06, "loss": 0.2283, "loss_nan_ranks": 0, "loss_rank_avg": 0.13110285997390747, "step": 3685, "valid_targets_mean": 4559.0, "valid_targets_min": 739 }, { "epoch": 5.301941049604601, "grad_norm": 0.5322028847511757, "learning_rate": 6.7664538191830165e-06, "loss": 0.2291, "loss_nan_ranks": 0, "loss_rank_avg": 0.1111895740032196, "step": 3690, "valid_targets_mean": 3257.4, "valid_targets_min": 746 }, { "epoch": 5.309130122214234, "grad_norm": 0.5242815050747506, "learning_rate": 6.712808707907206e-06, "loss": 0.2382, "loss_nan_ranks": 0, "loss_rank_avg": 0.09911448508501053, "step": 3695, "valid_targets_mean": 3859.8, "valid_targets_min": 855 }, { "epoch": 5.316319194823867, "grad_norm": 0.5274184494318976, "learning_rate": 6.659334177918075e-06, "loss": 0.2251, "loss_nan_ranks": 0, "loss_rank_avg": 0.10168007016181946, "step": 3700, "valid_targets_mean": 2894.0, "valid_targets_min": 649 }, { "epoch": 5.3235082674335015, "grad_norm": 0.5580532302216001, "learning_rate": 6.6060309157229566e-06, "loss": 0.2344, "loss_nan_ranks": 0, "loss_rank_avg": 0.12171245366334915, "step": 3705, "valid_targets_mean": 3291.8, "valid_targets_min": 532 }, { "epoch": 5.330697340043135, "grad_norm": 0.5325308799675936, "learning_rate": 6.55289960563044e-06, "loss": 0.2222, "loss_nan_ranks": 0, "loss_rank_avg": 0.10376730561256409, "step": 3710, "valid_targets_mean": 3438.8, "valid_targets_min": 604 }, { "epoch": 5.337886412652768, "grad_norm": 0.5586213161057807, "learning_rate": 6.499940929741577e-06, "loss": 0.2319, "loss_nan_ranks": 0, "loss_rank_avg": 0.09677755832672119, "step": 3715, "valid_targets_mean": 2735.0, "valid_targets_min": 620 }, { "epoch": 5.345075485262401, "grad_norm": 0.5663803576851734, "learning_rate": 6.447155567941141e-06, "loss": 0.2254, "loss_nan_ranks": 0, "loss_rank_avg": 0.11576307564973831, "step": 3720, "valid_targets_mean": 3961.1, "valid_targets_min": 645 }, { "epoch": 5.352264557872035, "grad_norm": 0.47758908764240937, "learning_rate": 6.394544197888895e-06, "loss": 0.2346, "loss_nan_ranks": 0, "loss_rank_avg": 0.08779515326023102, "step": 3725, "valid_targets_mean": 3460.2, "valid_targets_min": 666 }, { "epoch": 5.359453630481668, "grad_norm": 0.5371407252655028, "learning_rate": 6.342107495010903e-06, "loss": 0.2229, "loss_nan_ranks": 0, "loss_rank_avg": 0.1303025633096695, "step": 3730, "valid_targets_mean": 3453.9, "valid_targets_min": 582 }, { "epoch": 5.366642703091301, "grad_norm": 0.5433261944894747, "learning_rate": 6.289846132490836e-06, "loss": 0.2322, "loss_nan_ranks": 0, "loss_rank_avg": 0.10139200091362, "step": 3735, "valid_targets_mean": 3614.2, "valid_targets_min": 485 }, { "epoch": 5.373831775700935, "grad_norm": 0.4892527224392483, "learning_rate": 6.237760781261339e-06, "loss": 0.2356, "loss_nan_ranks": 0, "loss_rank_avg": 0.12653936445713043, "step": 3740, "valid_targets_mean": 4815.8, "valid_targets_min": 3923 }, { "epoch": 5.381020848310568, "grad_norm": 0.6281676767553033, "learning_rate": 6.185852109995423e-06, "loss": 0.2336, "loss_nan_ranks": 0, "loss_rank_avg": 0.14503289759159088, "step": 3745, "valid_targets_mean": 4049.6, "valid_targets_min": 577 }, { "epoch": 5.388209920920201, "grad_norm": 0.5139220394937787, "learning_rate": 6.1341207850978905e-06, "loss": 0.2322, "loss_nan_ranks": 0, "loss_rank_avg": 0.09314952790737152, "step": 3750, "valid_targets_mean": 3192.6, "valid_targets_min": 647 }, { "epoch": 5.3953989935298345, "grad_norm": 0.5836967326755717, "learning_rate": 6.082567470696747e-06, "loss": 0.2263, "loss_nan_ranks": 0, "loss_rank_avg": 0.11038590967655182, "step": 3755, "valid_targets_mean": 3321.2, "valid_targets_min": 691 }, { "epoch": 5.402588066139468, "grad_norm": 0.5862170542230964, "learning_rate": 6.0311928286347e-06, "loss": 0.2306, "loss_nan_ranks": 0, "loss_rank_avg": 0.150666743516922, "step": 3760, "valid_targets_mean": 4635.4, "valid_targets_min": 4223 }, { "epoch": 5.409777138749101, "grad_norm": 0.5619243601117232, "learning_rate": 5.97999751846067e-06, "loss": 0.2194, "loss_nan_ranks": 0, "loss_rank_avg": 0.11010795086622238, "step": 3765, "valid_targets_mean": 3656.0, "valid_targets_min": 830 }, { "epoch": 5.4169662113587345, "grad_norm": 0.4793247356400887, "learning_rate": 5.9289821974212956e-06, "loss": 0.2246, "loss_nan_ranks": 0, "loss_rank_avg": 0.0704135149717331, "step": 3770, "valid_targets_mean": 2109.9, "valid_targets_min": 330 }, { "epoch": 5.424155283968368, "grad_norm": 0.517481898207876, "learning_rate": 5.878147520452517e-06, "loss": 0.2107, "loss_nan_ranks": 0, "loss_rank_avg": 0.10165617614984512, "step": 3775, "valid_targets_mean": 3652.1, "valid_targets_min": 567 }, { "epoch": 5.431344356578001, "grad_norm": 0.6135944967500202, "learning_rate": 5.827494140171152e-06, "loss": 0.2185, "loss_nan_ranks": 0, "loss_rank_avg": 0.09592735767364502, "step": 3780, "valid_targets_mean": 2568.6, "valid_targets_min": 486 }, { "epoch": 5.438533429187634, "grad_norm": 0.49746523639145324, "learning_rate": 5.7770227068665485e-06, "loss": 0.232, "loss_nan_ranks": 0, "loss_rank_avg": 0.0968160480260849, "step": 3785, "valid_targets_mean": 3214.0, "valid_targets_min": 699 }, { "epoch": 5.445722501797269, "grad_norm": 0.6088131457344995, "learning_rate": 5.726733868492196e-06, "loss": 0.2429, "loss_nan_ranks": 0, "loss_rank_avg": 0.12237273901700974, "step": 3790, "valid_targets_mean": 2801.8, "valid_targets_min": 704 }, { "epoch": 5.452911574406902, "grad_norm": 0.4755640662150841, "learning_rate": 5.676628270657429e-06, "loss": 0.2244, "loss_nan_ranks": 0, "loss_rank_avg": 0.10788771510124207, "step": 3795, "valid_targets_mean": 3890.1, "valid_targets_min": 767 }, { "epoch": 5.460100647016535, "grad_norm": 0.5564304734402853, "learning_rate": 5.626706556619132e-06, "loss": 0.2279, "loss_nan_ranks": 0, "loss_rank_avg": 0.11956202983856201, "step": 3800, "valid_targets_mean": 3888.9, "valid_targets_min": 828 }, { "epoch": 5.4672897196261685, "grad_norm": 0.5718654277621241, "learning_rate": 5.576969367273506e-06, "loss": 0.2322, "loss_nan_ranks": 0, "loss_rank_avg": 0.13896629214286804, "step": 3805, "valid_targets_mean": 4125.5, "valid_targets_min": 710 }, { "epoch": 5.474478792235802, "grad_norm": 0.5032497846155108, "learning_rate": 5.527417341147794e-06, "loss": 0.2267, "loss_nan_ranks": 0, "loss_rank_avg": 0.09287270903587341, "step": 3810, "valid_targets_mean": 3537.1, "valid_targets_min": 686 }, { "epoch": 5.481667864845435, "grad_norm": 0.4915204373542724, "learning_rate": 5.4780511143921115e-06, "loss": 0.23, "loss_nan_ranks": 0, "loss_rank_avg": 0.1148151308298111, "step": 3815, "valid_targets_mean": 4444.5, "valid_targets_min": 617 }, { "epoch": 5.488856937455068, "grad_norm": 0.6047640594429146, "learning_rate": 5.428871320771296e-06, "loss": 0.233, "loss_nan_ranks": 0, "loss_rank_avg": 0.1029304563999176, "step": 3820, "valid_targets_mean": 2823.0, "valid_targets_min": 772 }, { "epoch": 5.496046010064702, "grad_norm": 0.510548508866447, "learning_rate": 5.379878591656742e-06, "loss": 0.2237, "loss_nan_ranks": 0, "loss_rank_avg": 0.1139189675450325, "step": 3825, "valid_targets_mean": 3634.5, "valid_targets_min": 534 }, { "epoch": 5.503235082674335, "grad_norm": 0.5003942789953372, "learning_rate": 5.3310735560183e-06, "loss": 0.2354, "loss_nan_ranks": 0, "loss_rank_avg": 0.11003319919109344, "step": 3830, "valid_targets_mean": 4281.6, "valid_targets_min": 949 }, { "epoch": 5.510424155283968, "grad_norm": 0.6576710045774764, "learning_rate": 5.28245684041621e-06, "loss": 0.2374, "loss_nan_ranks": 0, "loss_rank_avg": 0.1553100049495697, "step": 3835, "valid_targets_mean": 3864.1, "valid_targets_min": 718 }, { "epoch": 5.517613227893602, "grad_norm": 0.47410941520350275, "learning_rate": 5.2340290689930515e-06, "loss": 0.2304, "loss_nan_ranks": 0, "loss_rank_avg": 0.11888614296913147, "step": 3840, "valid_targets_mean": 3732.5, "valid_targets_min": 732 }, { "epoch": 5.524802300503235, "grad_norm": 0.5085462942465262, "learning_rate": 5.185790863465747e-06, "loss": 0.2408, "loss_nan_ranks": 0, "loss_rank_avg": 0.10465127229690552, "step": 3845, "valid_targets_mean": 3367.5, "valid_targets_min": 685 }, { "epoch": 5.531991373112868, "grad_norm": 0.4801234294164676, "learning_rate": 5.137742843117555e-06, "loss": 0.2205, "loss_nan_ranks": 0, "loss_rank_avg": 0.09817088395357132, "step": 3850, "valid_targets_mean": 3293.4, "valid_targets_min": 564 }, { "epoch": 5.539180445722502, "grad_norm": 0.5305608181594179, "learning_rate": 5.089885624790134e-06, "loss": 0.2248, "loss_nan_ranks": 0, "loss_rank_avg": 0.09850573539733887, "step": 3855, "valid_targets_mean": 3317.8, "valid_targets_min": 679 }, { "epoch": 5.546369518332135, "grad_norm": 0.6077286044826221, "learning_rate": 5.042219822875618e-06, "loss": 0.2306, "loss_nan_ranks": 0, "loss_rank_avg": 0.10427510738372803, "step": 3860, "valid_targets_mean": 3405.0, "valid_targets_min": 655 }, { "epoch": 5.553558590941768, "grad_norm": 0.5246120803533588, "learning_rate": 4.994746049308747e-06, "loss": 0.2234, "loss_nan_ranks": 0, "loss_rank_avg": 0.11735428869724274, "step": 3865, "valid_targets_mean": 3809.6, "valid_targets_min": 878 }, { "epoch": 5.5607476635514015, "grad_norm": 0.605950559060801, "learning_rate": 4.947464913558986e-06, "loss": 0.2333, "loss_nan_ranks": 0, "loss_rank_avg": 0.11098338663578033, "step": 3870, "valid_targets_mean": 4339.1, "valid_targets_min": 751 }, { "epoch": 5.567936736161036, "grad_norm": 0.580577525790607, "learning_rate": 4.900377022622702e-06, "loss": 0.227, "loss_nan_ranks": 0, "loss_rank_avg": 0.15154002606868744, "step": 3875, "valid_targets_mean": 3963.5, "valid_targets_min": 916 }, { "epoch": 5.575125808770668, "grad_norm": 0.5518840282788854, "learning_rate": 4.8534829810154e-06, "loss": 0.2235, "loss_nan_ranks": 0, "loss_rank_avg": 0.12235703319311142, "step": 3880, "valid_targets_mean": 4262.4, "valid_targets_min": 411 }, { "epoch": 5.582314881380302, "grad_norm": 0.555269161273212, "learning_rate": 4.806783390763932e-06, "loss": 0.2296, "loss_nan_ranks": 0, "loss_rank_avg": 0.09165024757385254, "step": 3885, "valid_targets_mean": 3564.1, "valid_targets_min": 615 }, { "epoch": 5.589503953989936, "grad_norm": 0.47658903316409296, "learning_rate": 4.760278851398776e-06, "loss": 0.2295, "loss_nan_ranks": 0, "loss_rank_avg": 0.0927685797214508, "step": 3890, "valid_targets_mean": 3430.5, "valid_targets_min": 756 }, { "epoch": 5.596693026599569, "grad_norm": 0.5813698001221245, "learning_rate": 4.7139699599463426e-06, "loss": 0.2368, "loss_nan_ranks": 0, "loss_rank_avg": 0.1289849877357483, "step": 3895, "valid_targets_mean": 3189.4, "valid_targets_min": 593 }, { "epoch": 5.603882099209202, "grad_norm": 0.5485491518781684, "learning_rate": 4.66785731092132e-06, "loss": 0.2303, "loss_nan_ranks": 0, "loss_rank_avg": 0.10561780631542206, "step": 3900, "valid_targets_mean": 3082.2, "valid_targets_min": 624 }, { "epoch": 5.6110711718188355, "grad_norm": 0.6088578449194925, "learning_rate": 4.621941496319023e-06, "loss": 0.2314, "loss_nan_ranks": 0, "loss_rank_avg": 0.12965992093086243, "step": 3905, "valid_targets_mean": 3030.9, "valid_targets_min": 539 }, { "epoch": 5.618260244428469, "grad_norm": 0.5743980711000396, "learning_rate": 4.5762231056077976e-06, "loss": 0.2188, "loss_nan_ranks": 0, "loss_rank_avg": 0.11457179486751556, "step": 3910, "valid_targets_mean": 3469.0, "valid_targets_min": 613 }, { "epoch": 5.625449317038102, "grad_norm": 0.5735979192233173, "learning_rate": 4.530702725721456e-06, "loss": 0.2334, "loss_nan_ranks": 0, "loss_rank_avg": 0.16201013326644897, "step": 3915, "valid_targets_mean": 4685.4, "valid_targets_min": 716 }, { "epoch": 5.632638389647735, "grad_norm": 0.5314576556957686, "learning_rate": 4.485380941051764e-06, "loss": 0.2326, "loss_nan_ranks": 0, "loss_rank_avg": 0.13539963960647583, "step": 3920, "valid_targets_mean": 4214.4, "valid_targets_min": 2348 }, { "epoch": 5.639827462257369, "grad_norm": 0.4962243478682359, "learning_rate": 4.4402583334408925e-06, "loss": 0.2292, "loss_nan_ranks": 0, "loss_rank_avg": 0.1239946112036705, "step": 3925, "valid_targets_mean": 4401.9, "valid_targets_min": 772 }, { "epoch": 5.647016534867002, "grad_norm": 0.5608654561683951, "learning_rate": 4.3953354821739745e-06, "loss": 0.2297, "loss_nan_ranks": 0, "loss_rank_avg": 0.10213188081979752, "step": 3930, "valid_targets_mean": 3199.0, "valid_targets_min": 595 }, { "epoch": 5.654205607476635, "grad_norm": 0.4264040054006142, "learning_rate": 4.350612963971683e-06, "loss": 0.2266, "loss_nan_ranks": 0, "loss_rank_avg": 0.11011867970228195, "step": 3935, "valid_targets_mean": 5150.9, "valid_targets_min": 4219 }, { "epoch": 5.661394680086269, "grad_norm": 0.7527457817817157, "learning_rate": 4.3060913529828e-06, "loss": 0.2173, "loss_nan_ranks": 0, "loss_rank_avg": 0.13459980487823486, "step": 3940, "valid_targets_mean": 4806.9, "valid_targets_min": 4005 }, { "epoch": 5.668583752695902, "grad_norm": 0.5037853732946838, "learning_rate": 4.261771220776856e-06, "loss": 0.2174, "loss_nan_ranks": 0, "loss_rank_avg": 0.10649976134300232, "step": 3945, "valid_targets_mean": 4182.1, "valid_targets_min": 939 }, { "epoch": 5.675772825305535, "grad_norm": 0.49120828952402623, "learning_rate": 4.217653136336788e-06, "loss": 0.234, "loss_nan_ranks": 0, "loss_rank_avg": 0.10088129341602325, "step": 3950, "valid_targets_mean": 3940.2, "valid_targets_min": 612 }, { "epoch": 5.682961897915169, "grad_norm": 0.5345061789069356, "learning_rate": 4.173737666051638e-06, "loss": 0.2285, "loss_nan_ranks": 0, "loss_rank_avg": 0.11330173909664154, "step": 3955, "valid_targets_mean": 3495.2, "valid_targets_min": 634 }, { "epoch": 5.690150970524803, "grad_norm": 0.5495034857434233, "learning_rate": 4.1300253737092985e-06, "loss": 0.2195, "loss_nan_ranks": 0, "loss_rank_avg": 0.08555985987186432, "step": 3960, "valid_targets_mean": 2754.5, "valid_targets_min": 558 }, { "epoch": 5.697340043134435, "grad_norm": 0.5504471166752093, "learning_rate": 4.086516820489244e-06, "loss": 0.2221, "loss_nan_ranks": 0, "loss_rank_avg": 0.11938584595918655, "step": 3965, "valid_targets_mean": 4737.6, "valid_targets_min": 818 }, { "epoch": 5.704529115744069, "grad_norm": 0.7024099146976166, "learning_rate": 4.043212564955341e-06, "loss": 0.2256, "loss_nan_ranks": 0, "loss_rank_avg": 0.11366365849971771, "step": 3970, "valid_targets_mean": 3613.2, "valid_targets_min": 769 }, { "epoch": 5.711718188353703, "grad_norm": 0.5567797213556551, "learning_rate": 4.000113163048678e-06, "loss": 0.2182, "loss_nan_ranks": 0, "loss_rank_avg": 0.12813721597194672, "step": 3975, "valid_targets_mean": 3827.0, "valid_targets_min": 753 }, { "epoch": 5.718907260963336, "grad_norm": 0.4820690425614344, "learning_rate": 3.957219168080439e-06, "loss": 0.2257, "loss_nan_ranks": 0, "loss_rank_avg": 0.08902594447135925, "step": 3980, "valid_targets_mean": 3253.6, "valid_targets_min": 629 }, { "epoch": 5.726096333572969, "grad_norm": 0.5241838560174583, "learning_rate": 3.914531130724777e-06, "loss": 0.2521, "loss_nan_ranks": 0, "loss_rank_avg": 0.10416141152381897, "step": 3985, "valid_targets_mean": 3481.9, "valid_targets_min": 673 }, { "epoch": 5.733285406182603, "grad_norm": 0.55638613732615, "learning_rate": 3.872049599011754e-06, "loss": 0.2245, "loss_nan_ranks": 0, "loss_rank_avg": 0.087767094373703, "step": 3990, "valid_targets_mean": 2224.9, "valid_targets_min": 611 }, { "epoch": 5.740474478792236, "grad_norm": 0.5096808510890435, "learning_rate": 3.829775118320322e-06, "loss": 0.2203, "loss_nan_ranks": 0, "loss_rank_avg": 0.12581051886081696, "step": 3995, "valid_targets_mean": 4320.4, "valid_targets_min": 991 }, { "epoch": 5.747663551401869, "grad_norm": 0.5525616374673865, "learning_rate": 3.7877082313712944e-06, "loss": 0.2287, "loss_nan_ranks": 0, "loss_rank_avg": 0.11794079840183258, "step": 4000, "valid_targets_mean": 3695.4, "valid_targets_min": 877 }, { "epoch": 5.7548526240115025, "grad_norm": 0.5443711074253681, "learning_rate": 3.7458494782203915e-06, "loss": 0.2219, "loss_nan_ranks": 0, "loss_rank_avg": 0.13976985216140747, "step": 4005, "valid_targets_mean": 4345.1, "valid_targets_min": 702 }, { "epoch": 5.762041696621136, "grad_norm": 0.5340557650606426, "learning_rate": 3.7041993962513066e-06, "loss": 0.2222, "loss_nan_ranks": 0, "loss_rank_avg": 0.10117100179195404, "step": 4010, "valid_targets_mean": 3320.6, "valid_targets_min": 743 }, { "epoch": 5.769230769230769, "grad_norm": 0.4803688175797287, "learning_rate": 3.662758520168821e-06, "loss": 0.2222, "loss_nan_ranks": 0, "loss_rank_avg": 0.08951431512832642, "step": 4015, "valid_targets_mean": 3885.5, "valid_targets_min": 705 }, { "epoch": 5.7764198418404025, "grad_norm": 0.48476516277316617, "learning_rate": 3.6215273819919095e-06, "loss": 0.2234, "loss_nan_ranks": 0, "loss_rank_avg": 0.12080979347229004, "step": 4020, "valid_targets_mean": 4147.9, "valid_targets_min": 489 }, { "epoch": 5.783608914450036, "grad_norm": 0.6249752714144173, "learning_rate": 3.5805065110469306e-06, "loss": 0.2367, "loss_nan_ranks": 0, "loss_rank_avg": 0.13403496146202087, "step": 4025, "valid_targets_mean": 3137.0, "valid_targets_min": 864 }, { "epoch": 5.790797987059669, "grad_norm": 0.5364924278381279, "learning_rate": 3.5396964339608266e-06, "loss": 0.2371, "loss_nan_ranks": 0, "loss_rank_avg": 0.11756608635187149, "step": 4030, "valid_targets_mean": 4123.2, "valid_targets_min": 635 }, { "epoch": 5.797987059669302, "grad_norm": 0.5109349298834557, "learning_rate": 3.4990976746543727e-06, "loss": 0.2206, "loss_nan_ranks": 0, "loss_rank_avg": 0.10641781985759735, "step": 4035, "valid_targets_mean": 3795.5, "valid_targets_min": 865 }, { "epoch": 5.805176132278936, "grad_norm": 0.5425174482086091, "learning_rate": 3.4587107543354236e-06, "loss": 0.236, "loss_nan_ranks": 0, "loss_rank_avg": 0.10321540385484695, "step": 4040, "valid_targets_mean": 3321.0, "valid_targets_min": 507 }, { "epoch": 5.812365204888569, "grad_norm": 0.4547290274337963, "learning_rate": 3.4185361914922588e-06, "loss": 0.2259, "loss_nan_ranks": 0, "loss_rank_avg": 0.10309769958257675, "step": 4045, "valid_targets_mean": 4833.1, "valid_targets_min": 762 }, { "epoch": 5.819554277498202, "grad_norm": 0.6674311050708079, "learning_rate": 3.378574501886891e-06, "loss": 0.2347, "loss_nan_ranks": 0, "loss_rank_avg": 0.14393368363380432, "step": 4050, "valid_targets_mean": 3134.4, "valid_targets_min": 683 }, { "epoch": 5.8267433501078365, "grad_norm": 0.5103372393228983, "learning_rate": 3.338826198548477e-06, "loss": 0.2348, "loss_nan_ranks": 0, "loss_rank_avg": 0.09888037294149399, "step": 4055, "valid_targets_mean": 4051.0, "valid_targets_min": 844 }, { "epoch": 5.83393242271747, "grad_norm": 0.5656063140256278, "learning_rate": 3.299291791766703e-06, "loss": 0.2205, "loss_nan_ranks": 0, "loss_rank_avg": 0.09367987513542175, "step": 4060, "valid_targets_mean": 2694.8, "valid_targets_min": 482 }, { "epoch": 5.841121495327103, "grad_norm": 0.8203760991873118, "learning_rate": 3.2599717890852502e-06, "loss": 0.2417, "loss_nan_ranks": 0, "loss_rank_avg": 0.13091842830181122, "step": 4065, "valid_targets_mean": 3690.6, "valid_targets_min": 592 }, { "epoch": 5.848310567936736, "grad_norm": 1.1540642624867812, "learning_rate": 3.220866695295266e-06, "loss": 0.2299, "loss_nan_ranks": 0, "loss_rank_avg": 0.09300343692302704, "step": 4070, "valid_targets_mean": 2594.1, "valid_targets_min": 606 }, { "epoch": 5.85549964054637, "grad_norm": 0.5416675522579539, "learning_rate": 3.181977012428914e-06, "loss": 0.2268, "loss_nan_ranks": 0, "loss_rank_avg": 0.09534624218940735, "step": 4075, "valid_targets_mean": 3515.5, "valid_targets_min": 659 }, { "epoch": 5.862688713156003, "grad_norm": 0.5680889544101823, "learning_rate": 3.143303239752886e-06, "loss": 0.2224, "loss_nan_ranks": 0, "loss_rank_avg": 0.10078851878643036, "step": 4080, "valid_targets_mean": 3410.9, "valid_targets_min": 839 }, { "epoch": 5.869877785765636, "grad_norm": 0.48763425732795723, "learning_rate": 3.1048458737620258e-06, "loss": 0.22, "loss_nan_ranks": 0, "loss_rank_avg": 0.12355795502662659, "step": 4085, "valid_targets_mean": 4751.1, "valid_targets_min": 3760 }, { "epoch": 5.87706685837527, "grad_norm": 0.5255237214520677, "learning_rate": 3.066605408172929e-06, "loss": 0.228, "loss_nan_ranks": 0, "loss_rank_avg": 0.09903688728809357, "step": 4090, "valid_targets_mean": 3674.5, "valid_targets_min": 948 }, { "epoch": 5.884255930984903, "grad_norm": 0.6092363999584978, "learning_rate": 3.028582333917638e-06, "loss": 0.2239, "loss_nan_ranks": 0, "loss_rank_avg": 0.10750824213027954, "step": 4095, "valid_targets_mean": 3747.6, "valid_targets_min": 940 }, { "epoch": 5.891445003594536, "grad_norm": 0.46322807716375014, "learning_rate": 2.9907771391373087e-06, "loss": 0.228, "loss_nan_ranks": 0, "loss_rank_avg": 0.110776387155056, "step": 4100, "valid_targets_mean": 4066.8, "valid_targets_min": 633 }, { "epoch": 5.89863407620417, "grad_norm": 0.5530260841245102, "learning_rate": 2.9531903091759464e-06, "loss": 0.2307, "loss_nan_ranks": 0, "loss_rank_avg": 0.11539137363433838, "step": 4105, "valid_targets_mean": 3571.0, "valid_targets_min": 667 }, { "epoch": 5.905823148813803, "grad_norm": 0.49404735005998257, "learning_rate": 2.915822326574205e-06, "loss": 0.2121, "loss_nan_ranks": 0, "loss_rank_avg": 0.09268874675035477, "step": 4110, "valid_targets_mean": 3558.6, "valid_targets_min": 814 }, { "epoch": 5.913012221423436, "grad_norm": 0.5418163287700767, "learning_rate": 2.8786736710631547e-06, "loss": 0.234, "loss_nan_ranks": 0, "loss_rank_avg": 0.08183282613754272, "step": 4115, "valid_targets_mean": 2856.6, "valid_targets_min": 529 }, { "epoch": 5.9202012940330695, "grad_norm": 0.5829105600425594, "learning_rate": 2.841744819558141e-06, "loss": 0.2218, "loss_nan_ranks": 0, "loss_rank_avg": 0.1069040447473526, "step": 4120, "valid_targets_mean": 3141.1, "valid_targets_min": 467 }, { "epoch": 5.927390366642703, "grad_norm": 0.5522333370692242, "learning_rate": 2.8050362461526614e-06, "loss": 0.2301, "loss_nan_ranks": 0, "loss_rank_avg": 0.10800863802433014, "step": 4125, "valid_targets_mean": 3894.9, "valid_targets_min": 797 }, { "epoch": 5.934579439252336, "grad_norm": 0.5126538599484419, "learning_rate": 2.7685484221122847e-06, "loss": 0.2216, "loss_nan_ranks": 0, "loss_rank_avg": 0.1306709349155426, "step": 4130, "valid_targets_mean": 4314.8, "valid_targets_min": 840 }, { "epoch": 5.941768511861969, "grad_norm": 0.5394517626708155, "learning_rate": 2.7322818158685847e-06, "loss": 0.2195, "loss_nan_ranks": 0, "loss_rank_avg": 0.13361993432044983, "step": 4135, "valid_targets_mean": 3994.2, "valid_targets_min": 853 }, { "epoch": 5.948957584471604, "grad_norm": 0.5359612939529111, "learning_rate": 2.696236893013138e-06, "loss": 0.2171, "loss_nan_ranks": 0, "loss_rank_avg": 0.10245585441589355, "step": 4140, "valid_targets_mean": 3500.2, "valid_targets_min": 649 }, { "epoch": 5.956146657081236, "grad_norm": 0.5688862266244793, "learning_rate": 2.660414116291543e-06, "loss": 0.2222, "loss_nan_ranks": 0, "loss_rank_avg": 0.09202219545841217, "step": 4145, "valid_targets_mean": 2825.6, "valid_targets_min": 611 }, { "epoch": 5.96333572969087, "grad_norm": 0.5610739413081085, "learning_rate": 2.624813945597493e-06, "loss": 0.234, "loss_nan_ranks": 0, "loss_rank_avg": 0.12422355264425278, "step": 4150, "valid_targets_mean": 4198.4, "valid_targets_min": 700 }, { "epoch": 5.9705248023005035, "grad_norm": 0.5885410928110363, "learning_rate": 2.5894368379668367e-06, "loss": 0.2247, "loss_nan_ranks": 0, "loss_rank_avg": 0.09310132265090942, "step": 4155, "valid_targets_mean": 2653.9, "valid_targets_min": 691 }, { "epoch": 5.977713874910137, "grad_norm": 0.5635217064321498, "learning_rate": 2.5542832475717605e-06, "loss": 0.2286, "loss_nan_ranks": 0, "loss_rank_avg": 0.13913258910179138, "step": 4160, "valid_targets_mean": 4385.0, "valid_targets_min": 867 }, { "epoch": 5.98490294751977, "grad_norm": 0.48587755558221085, "learning_rate": 2.5193536257149045e-06, "loss": 0.2257, "loss_nan_ranks": 0, "loss_rank_avg": 0.0926017239689827, "step": 4165, "valid_targets_mean": 3001.0, "valid_targets_min": 889 }, { "epoch": 5.9920920201294035, "grad_norm": 0.5248853589772831, "learning_rate": 2.484648420823621e-06, "loss": 0.2301, "loss_nan_ranks": 0, "loss_rank_avg": 0.11225050687789917, "step": 4170, "valid_targets_mean": 3894.8, "valid_targets_min": 785 }, { "epoch": 5.999281092739037, "grad_norm": 0.49185549380354215, "learning_rate": 2.4501680784441704e-06, "loss": 0.2275, "loss_nan_ranks": 0, "loss_rank_avg": 0.12695342302322388, "step": 4175, "valid_targets_mean": 4756.8, "valid_targets_min": 851 }, { "epoch": 6.005751258087707, "grad_norm": 0.5895294664188037, "learning_rate": 2.415913041236033e-06, "loss": 0.231, "loss_nan_ranks": 0, "loss_rank_avg": 0.1118449717760086, "step": 4180, "valid_targets_mean": 4720.0, "valid_targets_min": 3732 }, { "epoch": 6.01294033069734, "grad_norm": 0.6638987983800019, "learning_rate": 2.3818837489662096e-06, "loss": 0.2356, "loss_nan_ranks": 0, "loss_rank_avg": 0.10860610008239746, "step": 4185, "valid_targets_mean": 2938.6, "valid_targets_min": 773 }, { "epoch": 6.020129403306973, "grad_norm": 0.47545987837037096, "learning_rate": 2.348080638503596e-06, "loss": 0.2199, "loss_nan_ranks": 0, "loss_rank_avg": 0.12051060050725937, "step": 4190, "valid_targets_mean": 4825.9, "valid_targets_min": 702 }, { "epoch": 6.027318475916607, "grad_norm": 0.511588230010411, "learning_rate": 2.3145041438133476e-06, "loss": 0.2224, "loss_nan_ranks": 0, "loss_rank_avg": 0.11961148679256439, "step": 4195, "valid_targets_mean": 4777.9, "valid_targets_min": 3944 }, { "epoch": 6.03450754852624, "grad_norm": 0.553898288205841, "learning_rate": 2.2811546959513196e-06, "loss": 0.2147, "loss_nan_ranks": 0, "loss_rank_avg": 0.13163530826568604, "step": 4200, "valid_targets_mean": 4873.9, "valid_targets_min": 3944 }, { "epoch": 6.041696621135873, "grad_norm": 0.5899270631407394, "learning_rate": 2.24803272305854e-06, "loss": 0.2179, "loss_nan_ranks": 0, "loss_rank_avg": 0.1202486902475357, "step": 4205, "valid_targets_mean": 3210.9, "valid_targets_min": 597 }, { "epoch": 6.048885693745507, "grad_norm": 0.5810648705314886, "learning_rate": 2.21513865035571e-06, "loss": 0.227, "loss_nan_ranks": 0, "loss_rank_avg": 0.10933034867048264, "step": 4210, "valid_targets_mean": 3725.1, "valid_targets_min": 601 }, { "epoch": 6.05607476635514, "grad_norm": 0.449972261249417, "learning_rate": 2.1824729001377396e-06, "loss": 0.22, "loss_nan_ranks": 0, "loss_rank_avg": 0.10579677671194077, "step": 4215, "valid_targets_mean": 4484.1, "valid_targets_min": 3859 }, { "epoch": 6.063263838964773, "grad_norm": 0.4943133972872266, "learning_rate": 2.150035891768323e-06, "loss": 0.2236, "loss_nan_ranks": 0, "loss_rank_avg": 0.13363003730773926, "step": 4220, "valid_targets_mean": 4613.4, "valid_targets_min": 678 }, { "epoch": 6.070452911574407, "grad_norm": 0.5929568384137042, "learning_rate": 2.1178280416745743e-06, "loss": 0.2279, "loss_nan_ranks": 0, "loss_rank_avg": 0.06701067090034485, "step": 4225, "valid_targets_mean": 1870.5, "valid_targets_min": 446 }, { "epoch": 6.07764198418404, "grad_norm": 0.4803255814125173, "learning_rate": 2.0858497633416565e-06, "loss": 0.2182, "loss_nan_ranks": 0, "loss_rank_avg": 0.09893548488616943, "step": 4230, "valid_targets_mean": 3892.6, "valid_targets_min": 670 }, { "epoch": 6.084831056793673, "grad_norm": 0.6263462306661182, "learning_rate": 2.0541014673074898e-06, "loss": 0.2352, "loss_nan_ranks": 0, "loss_rank_avg": 0.13514085114002228, "step": 4235, "valid_targets_mean": 4169.0, "valid_targets_min": 728 }, { "epoch": 6.092020129403307, "grad_norm": 0.5421931016830664, "learning_rate": 2.0225835611574697e-06, "loss": 0.2139, "loss_nan_ranks": 0, "loss_rank_avg": 0.11666776239871979, "step": 4240, "valid_targets_mean": 3620.8, "valid_targets_min": 915 }, { "epoch": 6.099209202012941, "grad_norm": 0.4857697103944299, "learning_rate": 1.9912964495192533e-06, "loss": 0.2179, "loss_nan_ranks": 0, "loss_rank_avg": 0.11697093397378922, "step": 4245, "valid_targets_mean": 5469.8, "valid_targets_min": 640 }, { "epoch": 6.106398274622574, "grad_norm": 0.5323926029594881, "learning_rate": 1.9602405340575446e-06, "loss": 0.217, "loss_nan_ranks": 0, "loss_rank_avg": 0.10784275829792023, "step": 4250, "valid_targets_mean": 3823.8, "valid_targets_min": 825 }, { "epoch": 6.113587347232207, "grad_norm": 0.5447888444803873, "learning_rate": 1.929416213468942e-06, "loss": 0.2174, "loss_nan_ranks": 0, "loss_rank_avg": 0.10931412875652313, "step": 4255, "valid_targets_mean": 3607.9, "valid_targets_min": 609 }, { "epoch": 6.120776419841841, "grad_norm": 0.6144296819100742, "learning_rate": 1.8988238834768235e-06, "loss": 0.2229, "loss_nan_ranks": 0, "loss_rank_avg": 0.12556231021881104, "step": 4260, "valid_targets_mean": 3070.2, "valid_targets_min": 534 }, { "epoch": 6.127965492451474, "grad_norm": 0.49482382131724245, "learning_rate": 1.8684639368262792e-06, "loss": 0.2164, "loss_nan_ranks": 0, "loss_rank_avg": 0.1340388059616089, "step": 4265, "valid_targets_mean": 5229.5, "valid_targets_min": 4362 }, { "epoch": 6.135154565061107, "grad_norm": 0.5827050871510197, "learning_rate": 1.8383367632790384e-06, "loss": 0.2232, "loss_nan_ranks": 0, "loss_rank_avg": 0.12392894178628922, "step": 4270, "valid_targets_mean": 3390.2, "valid_targets_min": 565 }, { "epoch": 6.1423436376707405, "grad_norm": 0.5131318427074524, "learning_rate": 1.8084427496084967e-06, "loss": 0.2156, "loss_nan_ranks": 0, "loss_rank_avg": 0.1041579395532608, "step": 4275, "valid_targets_mean": 3940.1, "valid_targets_min": 742 }, { "epoch": 6.149532710280374, "grad_norm": 0.5963777062849123, "learning_rate": 1.7787822795947262e-06, "loss": 0.2014, "loss_nan_ranks": 0, "loss_rank_avg": 0.09274083375930786, "step": 4280, "valid_targets_mean": 2919.9, "valid_targets_min": 717 }, { "epoch": 6.156721782890007, "grad_norm": 0.49582307100103684, "learning_rate": 1.7493557340195754e-06, "loss": 0.2141, "loss_nan_ranks": 0, "loss_rank_avg": 0.09546741843223572, "step": 4285, "valid_targets_mean": 4019.0, "valid_targets_min": 934 }, { "epoch": 6.1639108554996405, "grad_norm": 0.4871415848643614, "learning_rate": 1.7201634906617504e-06, "loss": 0.2151, "loss_nan_ranks": 0, "loss_rank_avg": 0.10446576774120331, "step": 4290, "valid_targets_mean": 4068.0, "valid_targets_min": 649 }, { "epoch": 6.171099928109274, "grad_norm": 0.47120731528371945, "learning_rate": 1.6912059242919853e-06, "loss": 0.2078, "loss_nan_ranks": 0, "loss_rank_avg": 0.11221934854984283, "step": 4295, "valid_targets_mean": 4832.8, "valid_targets_min": 895 }, { "epoch": 6.178289000718907, "grad_norm": 0.4965531368094695, "learning_rate": 1.6624834066682248e-06, "loss": 0.2176, "loss_nan_ranks": 0, "loss_rank_avg": 0.09528857469558716, "step": 4300, "valid_targets_mean": 3653.1, "valid_targets_min": 748 }, { "epoch": 6.18547807332854, "grad_norm": 0.5756851241381141, "learning_rate": 1.6339963065308539e-06, "loss": 0.2212, "loss_nan_ranks": 0, "loss_rank_avg": 0.08201570063829422, "step": 4305, "valid_targets_mean": 2631.0, "valid_targets_min": 710 }, { "epoch": 6.192667145938174, "grad_norm": 0.5002106473544778, "learning_rate": 1.6057449895979616e-06, "loss": 0.2211, "loss_nan_ranks": 0, "loss_rank_avg": 0.09970113635063171, "step": 4310, "valid_targets_mean": 3362.1, "valid_targets_min": 691 }, { "epoch": 6.199856218547807, "grad_norm": 0.596931111317232, "learning_rate": 1.5777298185606428e-06, "loss": 0.2282, "loss_nan_ranks": 0, "loss_rank_avg": 0.14602990448474884, "step": 4315, "valid_targets_mean": 4108.9, "valid_targets_min": 1363 }, { "epoch": 6.20704529115744, "grad_norm": 0.538595523809706, "learning_rate": 1.5499511530783462e-06, "loss": 0.2209, "loss_nan_ranks": 0, "loss_rank_avg": 0.12626773118972778, "step": 4320, "valid_targets_mean": 3403.0, "valid_targets_min": 601 }, { "epoch": 6.2142343637670745, "grad_norm": 0.5490331377416214, "learning_rate": 1.5224093497742654e-06, "loss": 0.224, "loss_nan_ranks": 0, "loss_rank_avg": 0.11536562442779541, "step": 4325, "valid_targets_mean": 3286.5, "valid_targets_min": 732 }, { "epoch": 6.221423436376708, "grad_norm": 0.539453466902596, "learning_rate": 1.4951047622307413e-06, "loss": 0.226, "loss_nan_ranks": 0, "loss_rank_avg": 0.15311205387115479, "step": 4330, "valid_targets_mean": 4828.9, "valid_targets_min": 685 }, { "epoch": 6.228612508986341, "grad_norm": 0.5966313956547638, "learning_rate": 1.4680377409847314e-06, "loss": 0.2217, "loss_nan_ranks": 0, "loss_rank_avg": 0.12395937740802765, "step": 4335, "valid_targets_mean": 3536.1, "valid_targets_min": 713 }, { "epoch": 6.235801581595974, "grad_norm": 0.6171088156882476, "learning_rate": 1.4412086335233255e-06, "loss": 0.2194, "loss_nan_ranks": 0, "loss_rank_avg": 0.13875176012516022, "step": 4340, "valid_targets_mean": 3610.2, "valid_targets_min": 595 }, { "epoch": 6.242990654205608, "grad_norm": 0.5098548922882871, "learning_rate": 1.4146177842792573e-06, "loss": 0.2254, "loss_nan_ranks": 0, "loss_rank_avg": 0.10508402436971664, "step": 4345, "valid_targets_mean": 3578.6, "valid_targets_min": 753 }, { "epoch": 6.250179726815241, "grad_norm": 0.5567296804680034, "learning_rate": 1.388265534626496e-06, "loss": 0.2217, "loss_nan_ranks": 0, "loss_rank_avg": 0.11976335197687149, "step": 4350, "valid_targets_mean": 4137.0, "valid_targets_min": 558 }, { "epoch": 6.257368799424874, "grad_norm": 0.5039084294745627, "learning_rate": 1.3621522228758676e-06, "loss": 0.2243, "loss_nan_ranks": 0, "loss_rank_avg": 0.09727634489536285, "step": 4355, "valid_targets_mean": 3437.0, "valid_targets_min": 521 }, { "epoch": 6.264557872034508, "grad_norm": 0.5493758228180413, "learning_rate": 1.336278184270714e-06, "loss": 0.2217, "loss_nan_ranks": 0, "loss_rank_avg": 0.13206574320793152, "step": 4360, "valid_targets_mean": 4421.5, "valid_targets_min": 3544 }, { "epoch": 6.271746944644141, "grad_norm": 0.5749472389885733, "learning_rate": 1.3106437509825676e-06, "loss": 0.2218, "loss_nan_ranks": 0, "loss_rank_avg": 0.11927582323551178, "step": 4365, "valid_targets_mean": 3679.4, "valid_targets_min": 591 }, { "epoch": 6.278936017253774, "grad_norm": 0.5863167521975554, "learning_rate": 1.285249252106915e-06, "loss": 0.2119, "loss_nan_ranks": 0, "loss_rank_avg": 0.09201674908399582, "step": 4370, "valid_targets_mean": 2855.1, "valid_targets_min": 620 }, { "epoch": 6.286125089863408, "grad_norm": 0.5928713895291766, "learning_rate": 1.2600950136589463e-06, "loss": 0.2263, "loss_nan_ranks": 0, "loss_rank_avg": 0.11213717609643936, "step": 4375, "valid_targets_mean": 3264.9, "valid_targets_min": 582 }, { "epoch": 6.293314162473041, "grad_norm": 0.7070213599440965, "learning_rate": 1.2351813585693995e-06, "loss": 0.235, "loss_nan_ranks": 0, "loss_rank_avg": 0.07634206861257553, "step": 4380, "valid_targets_mean": 1711.0, "valid_targets_min": 619 }, { "epoch": 6.300503235082674, "grad_norm": 0.6228414357157461, "learning_rate": 1.2105086066803783e-06, "loss": 0.2269, "loss_nan_ranks": 0, "loss_rank_avg": 0.11248739063739777, "step": 4385, "valid_targets_mean": 3012.6, "valid_targets_min": 685 }, { "epoch": 6.3076923076923075, "grad_norm": 0.5643565877084489, "learning_rate": 1.1860770747412853e-06, "loss": 0.2322, "loss_nan_ranks": 0, "loss_rank_avg": 0.113135427236557, "step": 4390, "valid_targets_mean": 2834.9, "valid_targets_min": 603 }, { "epoch": 6.314881380301941, "grad_norm": 0.6000792505033019, "learning_rate": 1.161887076404713e-06, "loss": 0.224, "loss_nan_ranks": 0, "loss_rank_avg": 0.1297518014907837, "step": 4395, "valid_targets_mean": 3398.4, "valid_targets_min": 721 }, { "epoch": 6.322070452911574, "grad_norm": 0.5197738471357597, "learning_rate": 1.1379389222224612e-06, "loss": 0.2318, "loss_nan_ranks": 0, "loss_rank_avg": 0.12117072939872742, "step": 4400, "valid_targets_mean": 3815.1, "valid_targets_min": 588 }, { "epoch": 6.329259525521207, "grad_norm": 0.6157655100543539, "learning_rate": 1.1142329196415158e-06, "loss": 0.2194, "loss_nan_ranks": 0, "loss_rank_avg": 0.11843574792146683, "step": 4405, "valid_targets_mean": 3207.4, "valid_targets_min": 736 }, { "epoch": 6.336448598130841, "grad_norm": 0.6007875421280104, "learning_rate": 1.0907693730001156e-06, "loss": 0.2102, "loss_nan_ranks": 0, "loss_rank_avg": 0.11485160887241364, "step": 4410, "valid_targets_mean": 3385.8, "valid_targets_min": 544 }, { "epoch": 6.343637670740474, "grad_norm": 0.5909221142624015, "learning_rate": 1.0675485835238453e-06, "loss": 0.2239, "loss_nan_ranks": 0, "loss_rank_avg": 0.11618539690971375, "step": 4415, "valid_targets_mean": 3535.8, "valid_targets_min": 656 }, { "epoch": 6.350826743350108, "grad_norm": 0.5883536230905861, "learning_rate": 1.0445708493217732e-06, "loss": 0.2357, "loss_nan_ranks": 0, "loss_rank_avg": 0.16777461767196655, "step": 4420, "valid_targets_mean": 3526.5, "valid_targets_min": 604 }, { "epoch": 6.3580158159597415, "grad_norm": 0.491586006809235, "learning_rate": 1.0218364653826106e-06, "loss": 0.2259, "loss_nan_ranks": 0, "loss_rank_avg": 0.12006094306707382, "step": 4425, "valid_targets_mean": 4281.6, "valid_targets_min": 1431 }, { "epoch": 6.365204888569375, "grad_norm": 0.4767502238781207, "learning_rate": 9.993457235709325e-07, "loss": 0.2205, "loss_nan_ranks": 0, "loss_rank_avg": 0.10189913213253021, "step": 4430, "valid_targets_mean": 3844.6, "valid_targets_min": 915 }, { "epoch": 6.372393961179008, "grad_norm": 0.5371473156112417, "learning_rate": 9.770989126234287e-07, "loss": 0.2239, "loss_nan_ranks": 0, "loss_rank_avg": 0.11209119856357574, "step": 4435, "valid_targets_mean": 3499.1, "valid_targets_min": 615 }, { "epoch": 6.379583033788641, "grad_norm": 0.6149664809993349, "learning_rate": 9.550963181452121e-07, "loss": 0.2238, "loss_nan_ranks": 0, "loss_rank_avg": 0.10318882018327713, "step": 4440, "valid_targets_mean": 3142.6, "valid_targets_min": 663 }, { "epoch": 6.386772106398275, "grad_norm": 0.5234090608011976, "learning_rate": 9.333382226061216e-07, "loss": 0.2204, "loss_nan_ranks": 0, "loss_rank_avg": 0.11103767156600952, "step": 4445, "valid_targets_mean": 3792.0, "valid_targets_min": 545 }, { "epoch": 6.393961179007908, "grad_norm": 0.5832363451984859, "learning_rate": 9.118249053371176e-07, "loss": 0.2197, "loss_nan_ranks": 0, "loss_rank_avg": 0.12992234528064728, "step": 4450, "valid_targets_mean": 3576.0, "valid_targets_min": 578 }, { "epoch": 6.401150251617541, "grad_norm": 0.4971374707007291, "learning_rate": 8.905566425267009e-07, "loss": 0.2182, "loss_nan_ranks": 0, "loss_rank_avg": 0.11479949951171875, "step": 4455, "valid_targets_mean": 4383.1, "valid_targets_min": 640 }, { "epoch": 6.408339324227175, "grad_norm": 0.5060142693629047, "learning_rate": 8.695337072173448e-07, "loss": 0.2187, "loss_nan_ranks": 0, "loss_rank_avg": 0.10227428376674652, "step": 4460, "valid_targets_mean": 3275.5, "valid_targets_min": 714 }, { "epoch": 6.415528396836808, "grad_norm": 0.5977172657593309, "learning_rate": 8.487563693020063e-07, "loss": 0.2175, "loss_nan_ranks": 0, "loss_rank_avg": 0.10205759108066559, "step": 4465, "valid_targets_mean": 2500.6, "valid_targets_min": 655 }, { "epoch": 6.422717469446441, "grad_norm": 0.5650433111300472, "learning_rate": 8.282248955206573e-07, "loss": 0.2314, "loss_nan_ranks": 0, "loss_rank_avg": 0.11529181152582169, "step": 4470, "valid_targets_mean": 3392.5, "valid_targets_min": 618 }, { "epoch": 6.429906542056075, "grad_norm": 0.5347555795795468, "learning_rate": 8.079395494568643e-07, "loss": 0.2239, "loss_nan_ranks": 0, "loss_rank_avg": 0.10156741738319397, "step": 4475, "valid_targets_mean": 3383.0, "valid_targets_min": 872 }, { "epoch": 6.437095614665708, "grad_norm": 0.4365670326267589, "learning_rate": 7.879005915343918e-07, "loss": 0.2146, "loss_nan_ranks": 0, "loss_rank_avg": 0.1043374314904213, "step": 4480, "valid_targets_mean": 4653.4, "valid_targets_min": 3482 }, { "epoch": 6.444284687275341, "grad_norm": 0.6426365264377848, "learning_rate": 7.68108279013875e-07, "loss": 0.2212, "loss_nan_ranks": 0, "loss_rank_avg": 0.0819304957985878, "step": 4485, "valid_targets_mean": 2075.1, "valid_targets_min": 552 }, { "epoch": 6.4514737598849745, "grad_norm": 0.5102964897343093, "learning_rate": 7.485628659894994e-07, "loss": 0.2234, "loss_nan_ranks": 0, "loss_rank_avg": 0.11622590571641922, "step": 4490, "valid_targets_mean": 3854.1, "valid_targets_min": 798 }, { "epoch": 6.458662832494608, "grad_norm": 0.8896510887896947, "learning_rate": 7.292646033857642e-07, "loss": 0.2263, "loss_nan_ranks": 0, "loss_rank_avg": 0.12156560271978378, "step": 4495, "valid_targets_mean": 3445.5, "valid_targets_min": 689 }, { "epoch": 6.465851905104241, "grad_norm": 0.5066774432966253, "learning_rate": 7.102137389542285e-07, "loss": 0.2249, "loss_nan_ranks": 0, "loss_rank_avg": 0.09936122596263885, "step": 4500, "valid_targets_mean": 3640.1, "valid_targets_min": 556 }, { "epoch": 6.473040977713875, "grad_norm": 0.48580434445087983, "learning_rate": 6.914105172703634e-07, "loss": 0.2235, "loss_nan_ranks": 0, "loss_rank_avg": 0.10198426246643066, "step": 4505, "valid_targets_mean": 4095.1, "valid_targets_min": 981 }, { "epoch": 6.480230050323509, "grad_norm": 0.5480915043210962, "learning_rate": 6.728551797303806e-07, "loss": 0.2128, "loss_nan_ranks": 0, "loss_rank_avg": 0.11724647879600525, "step": 4510, "valid_targets_mean": 3779.5, "valid_targets_min": 686 }, { "epoch": 6.487419122933142, "grad_norm": 0.4917565970472607, "learning_rate": 6.545479645481668e-07, "loss": 0.2257, "loss_nan_ranks": 0, "loss_rank_avg": 0.09854386746883392, "step": 4515, "valid_targets_mean": 3022.0, "valid_targets_min": 534 }, { "epoch": 6.494608195542775, "grad_norm": 0.5955056659476884, "learning_rate": 6.364891067521894e-07, "loss": 0.2363, "loss_nan_ranks": 0, "loss_rank_avg": 0.14446298778057098, "step": 4520, "valid_targets_mean": 3898.5, "valid_targets_min": 520 }, { "epoch": 6.5017972681524085, "grad_norm": 0.531573239442214, "learning_rate": 6.186788381825115e-07, "loss": 0.229, "loss_nan_ranks": 0, "loss_rank_avg": 0.10202017426490784, "step": 4525, "valid_targets_mean": 3164.8, "valid_targets_min": 607 }, { "epoch": 6.508986340762042, "grad_norm": 0.5236595235106791, "learning_rate": 6.011173874877907e-07, "loss": 0.2256, "loss_nan_ranks": 0, "loss_rank_avg": 0.0913836658000946, "step": 4530, "valid_targets_mean": 3510.1, "valid_targets_min": 758 }, { "epoch": 6.516175413371675, "grad_norm": 0.5100939636244546, "learning_rate": 5.838049801223666e-07, "loss": 0.2274, "loss_nan_ranks": 0, "loss_rank_avg": 0.12276538461446762, "step": 4535, "valid_targets_mean": 4939.5, "valid_targets_min": 734 }, { "epoch": 6.5233644859813085, "grad_norm": 0.5928341800974949, "learning_rate": 5.667418383433454e-07, "loss": 0.2174, "loss_nan_ranks": 0, "loss_rank_avg": 0.09597209841012955, "step": 4540, "valid_targets_mean": 2316.5, "valid_targets_min": 571 }, { "epoch": 6.530553558590942, "grad_norm": 0.5147154688423627, "learning_rate": 5.499281812077595e-07, "loss": 0.224, "loss_nan_ranks": 0, "loss_rank_avg": 0.11607391387224197, "step": 4545, "valid_targets_mean": 4424.6, "valid_targets_min": 582 }, { "epoch": 6.537742631200575, "grad_norm": 0.5729816597064707, "learning_rate": 5.333642245697479e-07, "loss": 0.2221, "loss_nan_ranks": 0, "loss_rank_avg": 0.11833793669939041, "step": 4550, "valid_targets_mean": 4566.2, "valid_targets_min": 3931 }, { "epoch": 6.544931703810208, "grad_norm": 0.6177362139918386, "learning_rate": 5.170501810777962e-07, "loss": 0.2204, "loss_nan_ranks": 0, "loss_rank_avg": 0.12645436823368073, "step": 4555, "valid_targets_mean": 3126.6, "valid_targets_min": 666 }, { "epoch": 6.552120776419842, "grad_norm": 0.6246368411360932, "learning_rate": 5.009862601719895e-07, "loss": 0.2308, "loss_nan_ranks": 0, "loss_rank_avg": 0.12022657692432404, "step": 4560, "valid_targets_mean": 3312.2, "valid_targets_min": 731 }, { "epoch": 6.559309849029475, "grad_norm": 0.5709298820469643, "learning_rate": 4.851726680813352e-07, "loss": 0.232, "loss_nan_ranks": 0, "loss_rank_avg": 0.12751153111457825, "step": 4565, "valid_targets_mean": 4387.9, "valid_targets_min": 630 }, { "epoch": 6.566498921639108, "grad_norm": 0.597713035176386, "learning_rate": 4.6960960782111764e-07, "loss": 0.2188, "loss_nan_ranks": 0, "loss_rank_avg": 0.12144911289215088, "step": 4570, "valid_targets_mean": 4570.9, "valid_targets_min": 828 }, { "epoch": 6.573687994248742, "grad_norm": 0.5371421698345592, "learning_rate": 4.5429727919028777e-07, "loss": 0.2255, "loss_nan_ranks": 0, "loss_rank_avg": 0.08236388862133026, "step": 4575, "valid_targets_mean": 2927.4, "valid_targets_min": 639 }, { "epoch": 6.580877066858375, "grad_norm": 0.48311881472200036, "learning_rate": 4.392358787688933e-07, "loss": 0.219, "loss_nan_ranks": 0, "loss_rank_avg": 0.11492183804512024, "step": 4580, "valid_targets_mean": 4438.8, "valid_targets_min": 546 }, { "epoch": 6.588066139468008, "grad_norm": 0.5324096131254584, "learning_rate": 4.2442559991555666e-07, "loss": 0.2329, "loss_nan_ranks": 0, "loss_rank_avg": 0.10867210477590561, "step": 4585, "valid_targets_mean": 4227.9, "valid_targets_min": 767 }, { "epoch": 6.595255212077642, "grad_norm": 0.5806558853032571, "learning_rate": 4.098666327650036e-07, "loss": 0.2273, "loss_nan_ranks": 0, "loss_rank_avg": 0.12176599353551865, "step": 4590, "valid_targets_mean": 4184.5, "valid_targets_min": 768 }, { "epoch": 6.602444284687275, "grad_norm": 0.5316832508972936, "learning_rate": 3.955591642256118e-07, "loss": 0.2162, "loss_nan_ranks": 0, "loss_rank_avg": 0.09368228912353516, "step": 4595, "valid_targets_mean": 3312.2, "valid_targets_min": 617 }, { "epoch": 6.609633357296909, "grad_norm": 0.5262503581637803, "learning_rate": 3.8150337797701274e-07, "loss": 0.2253, "loss_nan_ranks": 0, "loss_rank_avg": 0.12923449277877808, "step": 4600, "valid_targets_mean": 4870.6, "valid_targets_min": 637 }, { "epoch": 6.616822429906542, "grad_norm": 0.5198765305609072, "learning_rate": 3.67699454467727e-07, "loss": 0.2182, "loss_nan_ranks": 0, "loss_rank_avg": 0.09299536049365997, "step": 4605, "valid_targets_mean": 4086.0, "valid_targets_min": 691 }, { "epoch": 6.624011502516176, "grad_norm": 0.5294711658533326, "learning_rate": 3.5414757091287055e-07, "loss": 0.2242, "loss_nan_ranks": 0, "loss_rank_avg": 0.1437724232673645, "step": 4610, "valid_targets_mean": 5623.2, "valid_targets_min": 4224 }, { "epoch": 6.631200575125809, "grad_norm": 0.5316860873672942, "learning_rate": 3.408479012918475e-07, "loss": 0.2185, "loss_nan_ranks": 0, "loss_rank_avg": 0.11999592185020447, "step": 4615, "valid_targets_mean": 4838.4, "valid_targets_min": 719 }, { "epoch": 6.638389647735442, "grad_norm": 0.527365776930916, "learning_rate": 3.2780061634615e-07, "loss": 0.225, "loss_nan_ranks": 0, "loss_rank_avg": 0.0915064588189125, "step": 4620, "valid_targets_mean": 3768.5, "valid_targets_min": 671 }, { "epoch": 6.645578720345076, "grad_norm": 0.5476426776018154, "learning_rate": 3.1500588357713745e-07, "loss": 0.2187, "loss_nan_ranks": 0, "loss_rank_avg": 0.15225091576576233, "step": 4625, "valid_targets_mean": 4842.1, "valid_targets_min": 1040 }, { "epoch": 6.652767792954709, "grad_norm": 0.6528164431079474, "learning_rate": 3.024638672439006e-07, "loss": 0.2225, "loss_nan_ranks": 0, "loss_rank_avg": 0.10779650509357452, "step": 4630, "valid_targets_mean": 2673.1, "valid_targets_min": 689 }, { "epoch": 6.659956865564342, "grad_norm": 0.5231166358844416, "learning_rate": 2.901747283611545e-07, "loss": 0.2094, "loss_nan_ranks": 0, "loss_rank_avg": 0.10894091427326202, "step": 4635, "valid_targets_mean": 4211.9, "valid_targets_min": 758 }, { "epoch": 6.6671459381739755, "grad_norm": 0.46431337768126324, "learning_rate": 2.7813862469716403e-07, "loss": 0.2267, "loss_nan_ranks": 0, "loss_rank_avg": 0.11026604473590851, "step": 4640, "valid_targets_mean": 4567.1, "valid_targets_min": 4060 }, { "epoch": 6.674335010783609, "grad_norm": 0.4647171653285355, "learning_rate": 2.663557107717196e-07, "loss": 0.224, "loss_nan_ranks": 0, "loss_rank_avg": 0.11128712445497513, "step": 4645, "valid_targets_mean": 4858.0, "valid_targets_min": 604 }, { "epoch": 6.681524083393242, "grad_norm": 0.5449440560939603, "learning_rate": 2.5482613785416277e-07, "loss": 0.2175, "loss_nan_ranks": 0, "loss_rank_avg": 0.1023380309343338, "step": 4650, "valid_targets_mean": 3129.8, "valid_targets_min": 653 }, { "epoch": 6.688713156002875, "grad_norm": 0.5273355227723932, "learning_rate": 2.435500539614277e-07, "loss": 0.2251, "loss_nan_ranks": 0, "loss_rank_avg": 0.14378316700458527, "step": 4655, "valid_targets_mean": 4260.0, "valid_targets_min": 610 }, { "epoch": 6.695902228612509, "grad_norm": 0.4760788362645504, "learning_rate": 2.3252760385615858e-07, "loss": 0.2131, "loss_nan_ranks": 0, "loss_rank_avg": 0.09157054871320724, "step": 4660, "valid_targets_mean": 4021.9, "valid_targets_min": 515 }, { "epoch": 6.703091301222142, "grad_norm": 0.5599885016265596, "learning_rate": 2.2175892904483743e-07, "loss": 0.2179, "loss_nan_ranks": 0, "loss_rank_avg": 0.09934373944997787, "step": 4665, "valid_targets_mean": 3322.4, "valid_targets_min": 736 }, { "epoch": 6.710280373831775, "grad_norm": 0.6374298891898735, "learning_rate": 2.112441677759769e-07, "loss": 0.2301, "loss_nan_ranks": 0, "loss_rank_avg": 0.15255284309387207, "step": 4670, "valid_targets_mean": 3333.6, "valid_targets_min": 529 }, { "epoch": 6.7174694464414095, "grad_norm": 0.49118289338422527, "learning_rate": 2.0098345503833716e-07, "loss": 0.2162, "loss_nan_ranks": 0, "loss_rank_avg": 0.10941498726606369, "step": 4675, "valid_targets_mean": 4543.6, "valid_targets_min": 1057 }, { "epoch": 6.724658519051042, "grad_norm": 0.5211196754678628, "learning_rate": 1.9097692255919843e-07, "loss": 0.2171, "loss_nan_ranks": 0, "loss_rank_avg": 0.07783547788858414, "step": 4680, "valid_targets_mean": 2769.2, "valid_targets_min": 612 }, { "epoch": 6.731847591660676, "grad_norm": 0.4639278461542733, "learning_rate": 1.8122469880267335e-07, "loss": 0.2204, "loss_nan_ranks": 0, "loss_rank_avg": 0.0822891891002655, "step": 4685, "valid_targets_mean": 3433.8, "valid_targets_min": 812 }, { "epoch": 6.7390366642703095, "grad_norm": 0.5699109580239698, "learning_rate": 1.717269089680462e-07, "loss": 0.2216, "loss_nan_ranks": 0, "loss_rank_avg": 0.13950425386428833, "step": 4690, "valid_targets_mean": 3992.4, "valid_targets_min": 440 }, { "epoch": 6.746225736879943, "grad_norm": 0.5247787380613426, "learning_rate": 1.624836749881742e-07, "loss": 0.2211, "loss_nan_ranks": 0, "loss_rank_avg": 0.10433037579059601, "step": 4695, "valid_targets_mean": 4130.0, "valid_targets_min": 722 }, { "epoch": 6.753414809489576, "grad_norm": 0.5002929707259851, "learning_rate": 1.5349511552792406e-07, "loss": 0.2188, "loss_nan_ranks": 0, "loss_rank_avg": 0.11657604575157166, "step": 4700, "valid_targets_mean": 4010.6, "valid_targets_min": 645 }, { "epoch": 6.760603882099209, "grad_norm": 0.5473486191985781, "learning_rate": 1.4476134598263801e-07, "loss": 0.2188, "loss_nan_ranks": 0, "loss_rank_avg": 0.10951299965381622, "step": 4705, "valid_targets_mean": 3421.9, "valid_targets_min": 775 }, { "epoch": 6.767792954708843, "grad_norm": 0.5364229068076471, "learning_rate": 1.362824784766681e-07, "loss": 0.2191, "loss_nan_ranks": 0, "loss_rank_avg": 0.14374537765979767, "step": 4710, "valid_targets_mean": 4612.1, "valid_targets_min": 3213 }, { "epoch": 6.774982027318476, "grad_norm": 0.4971300029350325, "learning_rate": 1.2805862186191952e-07, "loss": 0.2282, "loss_nan_ranks": 0, "loss_rank_avg": 0.11811932921409607, "step": 4715, "valid_targets_mean": 4107.0, "valid_targets_min": 1264 }, { "epoch": 6.782171099928109, "grad_norm": 0.601778889503626, "learning_rate": 1.200898817164631e-07, "loss": 0.2231, "loss_nan_ranks": 0, "loss_rank_avg": 0.13035139441490173, "step": 4720, "valid_targets_mean": 4560.2, "valid_targets_min": 543 }, { "epoch": 6.789360172537743, "grad_norm": 0.5329664913979177, "learning_rate": 1.1237636034318045e-07, "loss": 0.2241, "loss_nan_ranks": 0, "loss_rank_avg": 0.09042935818433762, "step": 4725, "valid_targets_mean": 2884.6, "valid_targets_min": 579 }, { "epoch": 6.796549245147376, "grad_norm": 0.5228200204151616, "learning_rate": 1.0491815676845207e-07, "loss": 0.2144, "loss_nan_ranks": 0, "loss_rank_avg": 0.12473177909851074, "step": 4730, "valid_targets_mean": 4629.6, "valid_targets_min": 3120 }, { "epoch": 6.803738317757009, "grad_norm": 0.5690118973711813, "learning_rate": 9.771536674087145e-08, "loss": 0.221, "loss_nan_ranks": 0, "loss_rank_avg": 0.08270010352134705, "step": 4735, "valid_targets_mean": 3209.2, "valid_targets_min": 765 }, { "epoch": 6.8109273903666425, "grad_norm": 0.5794816335254488, "learning_rate": 9.076808273003724e-08, "loss": 0.2158, "loss_nan_ranks": 0, "loss_rank_avg": 0.10203064233064651, "step": 4740, "valid_targets_mean": 3122.9, "valid_targets_min": 471 }, { "epoch": 6.818116462976276, "grad_norm": 0.547427353885318, "learning_rate": 8.407639392534972e-08, "loss": 0.2254, "loss_nan_ranks": 0, "loss_rank_avg": 0.0994785875082016, "step": 4745, "valid_targets_mean": 2774.4, "valid_targets_min": 666 }, { "epoch": 6.825305535585909, "grad_norm": 0.5138980608440111, "learning_rate": 7.764038623487403e-08, "loss": 0.2203, "loss_nan_ranks": 0, "loss_rank_avg": 0.11008846759796143, "step": 4750, "valid_targets_mean": 4515.4, "valid_targets_min": 3798 }, { "epoch": 6.832494608195542, "grad_norm": 0.5818429652487563, "learning_rate": 7.146014228423648e-08, "loss": 0.2202, "loss_nan_ranks": 0, "loss_rank_avg": 0.11513659358024597, "step": 4755, "valid_targets_mean": 3747.6, "valid_targets_min": 756 }, { "epoch": 6.839683680805176, "grad_norm": 0.5618762340348782, "learning_rate": 6.553574141555442e-08, "loss": 0.2291, "loss_nan_ranks": 0, "loss_rank_avg": 0.1377660632133484, "step": 4760, "valid_targets_mean": 4695.5, "valid_targets_min": 830 }, { "epoch": 6.846872753414809, "grad_norm": 0.6855689303799838, "learning_rate": 5.98672596864347e-08, "loss": 0.2242, "loss_nan_ranks": 0, "loss_rank_avg": 0.1489717960357666, "step": 4765, "valid_targets_mean": 5110.5, "valid_targets_min": 3940 }, { "epoch": 6.854061826024443, "grad_norm": 0.5164135363567788, "learning_rate": 5.445476986898568e-08, "loss": 0.2193, "loss_nan_ranks": 0, "loss_rank_avg": 0.09690165519714355, "step": 4770, "valid_targets_mean": 3323.0, "valid_targets_min": 745 }, { "epoch": 6.861250898634077, "grad_norm": 0.5218845429859494, "learning_rate": 4.929834144888013e-08, "loss": 0.2267, "loss_nan_ranks": 0, "loss_rank_avg": 0.11343638598918915, "step": 4775, "valid_targets_mean": 3724.2, "valid_targets_min": 545 }, { "epoch": 6.86843997124371, "grad_norm": 0.5261894149495684, "learning_rate": 4.439804062447373e-08, "loss": 0.2242, "loss_nan_ranks": 0, "loss_rank_avg": 0.13848835229873657, "step": 4780, "valid_targets_mean": 4062.4, "valid_targets_min": 515 }, { "epoch": 6.875629043853343, "grad_norm": 0.5845958694842275, "learning_rate": 3.9753930305950204e-08, "loss": 0.2217, "loss_nan_ranks": 0, "loss_rank_avg": 0.08328050374984741, "step": 4785, "valid_targets_mean": 2377.4, "valid_targets_min": 486 }, { "epoch": 6.8828181164629765, "grad_norm": 0.5408789060985649, "learning_rate": 3.536607011451088e-08, "loss": 0.24, "loss_nan_ranks": 0, "loss_rank_avg": 0.10192709416151047, "step": 4790, "valid_targets_mean": 3126.0, "valid_targets_min": 650 }, { "epoch": 6.89000718907261, "grad_norm": 0.5731456185915917, "learning_rate": 3.123451638161079e-08, "loss": 0.2351, "loss_nan_ranks": 0, "loss_rank_avg": 0.09156908094882965, "step": 4795, "valid_targets_mean": 3015.9, "valid_targets_min": 483 }, { "epoch": 6.897196261682243, "grad_norm": 0.5854299367435224, "learning_rate": 2.7359322148237112e-08, "loss": 0.2154, "loss_nan_ranks": 0, "loss_rank_avg": 0.11642911285161972, "step": 4800, "valid_targets_mean": 3307.0, "valid_targets_min": 556 }, { "epoch": 6.904385334291876, "grad_norm": 0.5763256439747025, "learning_rate": 2.374053716422964e-08, "loss": 0.219, "loss_nan_ranks": 0, "loss_rank_avg": 0.10047812759876251, "step": 4805, "valid_targets_mean": 3457.4, "valid_targets_min": 854 }, { "epoch": 6.91157440690151, "grad_norm": 0.5585836434639017, "learning_rate": 2.0378207887639113e-08, "loss": 0.2311, "loss_nan_ranks": 0, "loss_rank_avg": 0.13827770948410034, "step": 4810, "valid_targets_mean": 3833.6, "valid_targets_min": 691 }, { "epoch": 6.918763479511143, "grad_norm": 0.5021673769155096, "learning_rate": 1.7272377484127688e-08, "loss": 0.2174, "loss_nan_ranks": 0, "loss_rank_avg": 0.09062834084033966, "step": 4815, "valid_targets_mean": 3467.6, "valid_targets_min": 554 }, { "epoch": 6.925952552120776, "grad_norm": 0.5420506057791676, "learning_rate": 1.4423085826427152e-08, "loss": 0.2222, "loss_nan_ranks": 0, "loss_rank_avg": 0.1145763099193573, "step": 4820, "valid_targets_mean": 3325.9, "valid_targets_min": 450 }, { "epoch": 6.93314162473041, "grad_norm": 0.5429716282374907, "learning_rate": 1.1830369493808225e-08, "loss": 0.2217, "loss_nan_ranks": 0, "loss_rank_avg": 0.0795266330242157, "step": 4825, "valid_targets_mean": 2546.1, "valid_targets_min": 374 }, { "epoch": 6.940330697340043, "grad_norm": 0.48748914177526553, "learning_rate": 9.49426177163204e-09, "loss": 0.2255, "loss_nan_ranks": 0, "loss_rank_avg": 0.1494419127702713, "step": 4830, "valid_targets_mean": 6738.9, "valid_targets_min": 3612 }, { "epoch": 6.947519769949676, "grad_norm": 0.5597403208591729, "learning_rate": 7.414792650901614e-09, "loss": 0.2192, "loss_nan_ranks": 0, "loss_rank_avg": 0.0868077427148819, "step": 4835, "valid_targets_mean": 3310.8, "valid_targets_min": 678 }, { "epoch": 6.9547088425593095, "grad_norm": 0.49658819468141957, "learning_rate": 5.591988827893247e-09, "loss": 0.2264, "loss_nan_ranks": 0, "loss_rank_avg": 0.08313396573066711, "step": 4840, "valid_targets_mean": 3697.8, "valid_targets_min": 999 }, { "epoch": 6.961897915168943, "grad_norm": 0.6028617506588944, "learning_rate": 4.025873703810135e-09, "loss": 0.2327, "loss_nan_ranks": 0, "loss_rank_avg": 0.11810679733753204, "step": 4845, "valid_targets_mean": 3725.8, "valid_targets_min": 684 }, { "epoch": 6.969086987778576, "grad_norm": 0.5726678330735068, "learning_rate": 2.7164673844737312e-09, "loss": 0.2157, "loss_nan_ranks": 0, "loss_rank_avg": 0.13200724124908447, "step": 4850, "valid_targets_mean": 4098.9, "valid_targets_min": 575 }, { "epoch": 6.97627606038821, "grad_norm": 0.6080274682036577, "learning_rate": 1.6637866800750524e-09, "loss": 0.225, "loss_nan_ranks": 0, "loss_rank_avg": 0.12892693281173706, "step": 4855, "valid_targets_mean": 4071.0, "valid_targets_min": 314 }, { "epoch": 6.983465132997844, "grad_norm": 0.5745138575411652, "learning_rate": 8.678451049548564e-10, "loss": 0.223, "loss_nan_ranks": 0, "loss_rank_avg": 0.12005611509084702, "step": 4860, "valid_targets_mean": 3703.9, "valid_targets_min": 816 }, { "epoch": 6.990654205607477, "grad_norm": 0.6098451214662762, "learning_rate": 3.286528774326669e-10, "loss": 0.2196, "loss_nan_ranks": 0, "loss_rank_avg": 0.12149364501237869, "step": 4865, "valid_targets_mean": 3561.4, "valid_targets_min": 927 }, { "epoch": 6.99784327821711, "grad_norm": 0.5050849963191119, "learning_rate": 4.621691966688602e-11, "loss": 0.2276, "loss_nan_ranks": 0, "loss_rank_avg": 0.11706176400184631, "step": 4870, "valid_targets_mean": 4379.5, "valid_targets_min": 835 }, { "epoch": 7.0, "loss_nan_ranks": 0, "loss_rank_avg": 0.2101859748363495, "step": 4872, "total_flos": 2.402936079087829e+18, "train_loss": 0.2685813971707974, "train_runtime": 61451.9039, "train_samples_per_second": 1.267, "train_steps_per_second": 0.079, "valid_targets_mean": 2883.4, "valid_targets_min": 615 } ], "logging_steps": 5, "max_steps": 4872, "num_input_tokens_seen": 0, "num_train_epochs": 7, "save_steps": 1500, "stateful_callbacks": { "TrainerControl": { "args": { "should_epoch_stop": false, "should_evaluate": false, "should_log": false, "should_save": true, "should_training_stop": true }, "attributes": {} } }, "total_flos": 2.402936079087829e+18, "train_batch_size": 1, "trial_name": null, "trial_params": null }