{ "best_global_step": null, "best_metric": null, "best_model_checkpoint": null, "epoch": 7.0, "eval_steps": 500, "global_step": 4354, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.008038585209003215, "grad_norm": 15.487869480598855, "learning_rate": 3.6697247706422023e-07, "loss": 0.6902, "loss_nan_ranks": 0, "loss_rank_avg": 0.7185355424880981, "step": 5, "valid_targets_mean": 6218.2, "valid_targets_min": 1794 }, { "epoch": 0.01607717041800643, "grad_norm": 16.705030639862873, "learning_rate": 8.256880733944956e-07, "loss": 0.6933, "loss_nan_ranks": 0, "loss_rank_avg": 0.7040611505508423, "step": 10, "valid_targets_mean": 5971.0, "valid_targets_min": 1288 }, { "epoch": 0.024115755627009645, "grad_norm": 12.454754329110074, "learning_rate": 1.2844036697247707e-06, "loss": 0.6518, "loss_nan_ranks": 0, "loss_rank_avg": 0.5946602821350098, "step": 15, "valid_targets_mean": 5925.1, "valid_targets_min": 2579 }, { "epoch": 0.03215434083601286, "grad_norm": 11.220424247643189, "learning_rate": 1.743119266055046e-06, "loss": 0.6289, "loss_nan_ranks": 0, "loss_rank_avg": 0.5990424156188965, "step": 20, "valid_targets_mean": 4584.0, "valid_targets_min": 1532 }, { "epoch": 0.04019292604501608, "grad_norm": 6.228683067868804, "learning_rate": 2.2018348623853215e-06, "loss": 0.6005, "loss_nan_ranks": 0, "loss_rank_avg": 0.5438046455383301, "step": 25, "valid_targets_mean": 5913.2, "valid_targets_min": 1007 }, { "epoch": 0.04823151125401929, "grad_norm": 3.705703138387386, "learning_rate": 2.6605504587155968e-06, "loss": 0.5547, "loss_nan_ranks": 0, "loss_rank_avg": 0.4752989411354065, "step": 30, "valid_targets_mean": 5618.4, "valid_targets_min": 2547 }, { "epoch": 0.05627009646302251, "grad_norm": 2.2930526520291594, "learning_rate": 3.119266055045872e-06, "loss": 0.5046, "loss_nan_ranks": 0, "loss_rank_avg": 0.4889165163040161, "step": 35, "valid_targets_mean": 5507.8, "valid_targets_min": 1890 }, { "epoch": 0.06430868167202572, "grad_norm": 1.3788680494230385, "learning_rate": 3.5779816513761473e-06, "loss": 0.4708, "loss_nan_ranks": 0, "loss_rank_avg": 0.4641118049621582, "step": 40, "valid_targets_mean": 5501.1, "valid_targets_min": 2317 }, { "epoch": 0.07234726688102894, "grad_norm": 1.0707354953475499, "learning_rate": 4.036697247706423e-06, "loss": 0.4526, "loss_nan_ranks": 0, "loss_rank_avg": 0.44059669971466064, "step": 45, "valid_targets_mean": 5165.7, "valid_targets_min": 2549 }, { "epoch": 0.08038585209003216, "grad_norm": 1.0042764156736175, "learning_rate": 4.4954128440366975e-06, "loss": 0.4748, "loss_nan_ranks": 0, "loss_rank_avg": 0.4787266254425049, "step": 50, "valid_targets_mean": 5976.1, "valid_targets_min": 2505 }, { "epoch": 0.08842443729903537, "grad_norm": 0.8578820860325631, "learning_rate": 4.954128440366973e-06, "loss": 0.4525, "loss_nan_ranks": 0, "loss_rank_avg": 0.5156609416007996, "step": 55, "valid_targets_mean": 5803.9, "valid_targets_min": 707 }, { "epoch": 0.09646302250803858, "grad_norm": 0.7054778587694457, "learning_rate": 5.412844036697248e-06, "loss": 0.4304, "loss_nan_ranks": 0, "loss_rank_avg": 0.3835570216178894, "step": 60, "valid_targets_mean": 4718.1, "valid_targets_min": 368 }, { "epoch": 0.1045016077170418, "grad_norm": 0.5921455336434676, "learning_rate": 5.871559633027524e-06, "loss": 0.4285, "loss_nan_ranks": 0, "loss_rank_avg": 0.42219042778015137, "step": 65, "valid_targets_mean": 5650.0, "valid_targets_min": 1775 }, { "epoch": 0.11254019292604502, "grad_norm": 0.6432811667585792, "learning_rate": 6.330275229357799e-06, "loss": 0.4026, "loss_nan_ranks": 0, "loss_rank_avg": 0.4135628044605255, "step": 70, "valid_targets_mean": 4397.6, "valid_targets_min": 918 }, { "epoch": 0.12057877813504823, "grad_norm": 0.5954192316469062, "learning_rate": 6.788990825688074e-06, "loss": 0.4032, "loss_nan_ranks": 0, "loss_rank_avg": 0.3610105514526367, "step": 75, "valid_targets_mean": 5901.3, "valid_targets_min": 860 }, { "epoch": 0.12861736334405144, "grad_norm": 0.5561323896575481, "learning_rate": 7.247706422018349e-06, "loss": 0.4197, "loss_nan_ranks": 0, "loss_rank_avg": 0.3978654742240906, "step": 80, "valid_targets_mean": 6885.6, "valid_targets_min": 2842 }, { "epoch": 0.13665594855305466, "grad_norm": 0.5117138640075914, "learning_rate": 7.706422018348626e-06, "loss": 0.3789, "loss_nan_ranks": 0, "loss_rank_avg": 0.31353235244750977, "step": 85, "valid_targets_mean": 5075.9, "valid_targets_min": 1968 }, { "epoch": 0.14469453376205788, "grad_norm": 0.5185797042450433, "learning_rate": 8.1651376146789e-06, "loss": 0.3764, "loss_nan_ranks": 0, "loss_rank_avg": 0.35735011100769043, "step": 90, "valid_targets_mean": 6150.4, "valid_targets_min": 256 }, { "epoch": 0.1527331189710611, "grad_norm": 0.5651365251126268, "learning_rate": 8.623853211009175e-06, "loss": 0.3894, "loss_nan_ranks": 0, "loss_rank_avg": 0.36827707290649414, "step": 95, "valid_targets_mean": 4620.4, "valid_targets_min": 514 }, { "epoch": 0.1607717041800643, "grad_norm": 0.5030199885647652, "learning_rate": 9.08256880733945e-06, "loss": 0.3975, "loss_nan_ranks": 0, "loss_rank_avg": 0.4012790322303772, "step": 100, "valid_targets_mean": 5582.3, "valid_targets_min": 1716 }, { "epoch": 0.16881028938906753, "grad_norm": 0.6830238553526883, "learning_rate": 9.541284403669727e-06, "loss": 0.3755, "loss_nan_ranks": 0, "loss_rank_avg": 0.4395039677619934, "step": 105, "valid_targets_mean": 6038.6, "valid_targets_min": 1901 }, { "epoch": 0.17684887459807075, "grad_norm": 0.5054231795330882, "learning_rate": 1e-05, "loss": 0.3638, "loss_nan_ranks": 0, "loss_rank_avg": 0.33131682872772217, "step": 110, "valid_targets_mean": 4955.4, "valid_targets_min": 1799 }, { "epoch": 0.18488745980707397, "grad_norm": 0.5366188136072383, "learning_rate": 1.0458715596330275e-05, "loss": 0.388, "loss_nan_ranks": 0, "loss_rank_avg": 0.3644598722457886, "step": 115, "valid_targets_mean": 4911.2, "valid_targets_min": 786 }, { "epoch": 0.19292604501607716, "grad_norm": 0.4523650959270129, "learning_rate": 1.091743119266055e-05, "loss": 0.3417, "loss_nan_ranks": 0, "loss_rank_avg": 0.3105719983577728, "step": 120, "valid_targets_mean": 5628.5, "valid_targets_min": 2498 }, { "epoch": 0.20096463022508038, "grad_norm": 0.7309781032290188, "learning_rate": 1.1376146788990828e-05, "loss": 0.3362, "loss_nan_ranks": 0, "loss_rank_avg": 0.3655633330345154, "step": 125, "valid_targets_mean": 4542.7, "valid_targets_min": 726 }, { "epoch": 0.2090032154340836, "grad_norm": 0.5332714906008124, "learning_rate": 1.1834862385321102e-05, "loss": 0.363, "loss_nan_ranks": 0, "loss_rank_avg": 0.3906615376472473, "step": 130, "valid_targets_mean": 4868.5, "valid_targets_min": 710 }, { "epoch": 0.2170418006430868, "grad_norm": 0.5413137226235663, "learning_rate": 1.2293577981651376e-05, "loss": 0.3588, "loss_nan_ranks": 0, "loss_rank_avg": 0.3571460545063019, "step": 135, "valid_targets_mean": 4481.6, "valid_targets_min": 2033 }, { "epoch": 0.22508038585209003, "grad_norm": 0.4819038192629592, "learning_rate": 1.2752293577981652e-05, "loss": 0.3356, "loss_nan_ranks": 0, "loss_rank_avg": 0.36454111337661743, "step": 140, "valid_targets_mean": 5984.9, "valid_targets_min": 1926 }, { "epoch": 0.23311897106109325, "grad_norm": 3.4522565919790846, "learning_rate": 1.3211009174311929e-05, "loss": 0.3607, "loss_nan_ranks": 0, "loss_rank_avg": 0.41981396079063416, "step": 145, "valid_targets_mean": 5873.2, "valid_targets_min": 2123 }, { "epoch": 0.24115755627009647, "grad_norm": 0.480191765296101, "learning_rate": 1.3669724770642203e-05, "loss": 0.342, "loss_nan_ranks": 0, "loss_rank_avg": 0.3925219774246216, "step": 150, "valid_targets_mean": 6098.4, "valid_targets_min": 477 }, { "epoch": 0.2491961414790997, "grad_norm": 0.5275995100411426, "learning_rate": 1.4128440366972477e-05, "loss": 0.3548, "loss_nan_ranks": 0, "loss_rank_avg": 0.39259496331214905, "step": 155, "valid_targets_mean": 5801.5, "valid_targets_min": 1534 }, { "epoch": 0.2572347266881029, "grad_norm": 0.4497605594039018, "learning_rate": 1.4587155963302753e-05, "loss": 0.3315, "loss_nan_ranks": 0, "loss_rank_avg": 0.2661333680152893, "step": 160, "valid_targets_mean": 5559.2, "valid_targets_min": 2047 }, { "epoch": 0.2652733118971061, "grad_norm": 0.5186829745052237, "learning_rate": 1.504587155963303e-05, "loss": 0.3114, "loss_nan_ranks": 0, "loss_rank_avg": 0.32883208990097046, "step": 165, "valid_targets_mean": 5211.5, "valid_targets_min": 2437 }, { "epoch": 0.2733118971061093, "grad_norm": 0.5378694289846688, "learning_rate": 1.5504587155963304e-05, "loss": 0.328, "loss_nan_ranks": 0, "loss_rank_avg": 0.3817879557609558, "step": 170, "valid_targets_mean": 6117.9, "valid_targets_min": 949 }, { "epoch": 0.28135048231511256, "grad_norm": 0.47655599775978846, "learning_rate": 1.5963302752293578e-05, "loss": 0.3431, "loss_nan_ranks": 0, "loss_rank_avg": 0.3332779109477997, "step": 175, "valid_targets_mean": 6652.5, "valid_targets_min": 1061 }, { "epoch": 0.28938906752411575, "grad_norm": 0.5175596131296907, "learning_rate": 1.6422018348623852e-05, "loss": 0.3322, "loss_nan_ranks": 0, "loss_rank_avg": 0.2893512547016144, "step": 180, "valid_targets_mean": 5451.6, "valid_targets_min": 2715 }, { "epoch": 0.297427652733119, "grad_norm": 0.47484987666886874, "learning_rate": 1.688073394495413e-05, "loss": 0.3211, "loss_nan_ranks": 0, "loss_rank_avg": 0.3134007751941681, "step": 185, "valid_targets_mean": 5775.2, "valid_targets_min": 2507 }, { "epoch": 0.3054662379421222, "grad_norm": 0.5722106466766347, "learning_rate": 1.7339449541284407e-05, "loss": 0.3098, "loss_nan_ranks": 0, "loss_rank_avg": 0.316297709941864, "step": 190, "valid_targets_mean": 5722.6, "valid_targets_min": 602 }, { "epoch": 0.3135048231511254, "grad_norm": 0.5720677850765011, "learning_rate": 1.779816513761468e-05, "loss": 0.3603, "loss_nan_ranks": 0, "loss_rank_avg": 0.4151928126811981, "step": 195, "valid_targets_mean": 5507.1, "valid_targets_min": 2373 }, { "epoch": 0.3215434083601286, "grad_norm": 0.5017657301946835, "learning_rate": 1.8256880733944955e-05, "loss": 0.3238, "loss_nan_ranks": 0, "loss_rank_avg": 0.34416627883911133, "step": 200, "valid_targets_mean": 5537.2, "valid_targets_min": 962 }, { "epoch": 0.3295819935691318, "grad_norm": 0.5004261222863479, "learning_rate": 1.8715596330275232e-05, "loss": 0.3143, "loss_nan_ranks": 0, "loss_rank_avg": 0.2886529862880707, "step": 205, "valid_targets_mean": 5239.9, "valid_targets_min": 643 }, { "epoch": 0.33762057877813506, "grad_norm": 0.4773649164878627, "learning_rate": 1.9174311926605506e-05, "loss": 0.3421, "loss_nan_ranks": 0, "loss_rank_avg": 0.3376484215259552, "step": 210, "valid_targets_mean": 6458.6, "valid_targets_min": 662 }, { "epoch": 0.34565916398713825, "grad_norm": 0.4850206053577162, "learning_rate": 1.963302752293578e-05, "loss": 0.3252, "loss_nan_ranks": 0, "loss_rank_avg": 0.2979908585548401, "step": 215, "valid_targets_mean": 5263.2, "valid_targets_min": 797 }, { "epoch": 0.3536977491961415, "grad_norm": 0.5013386580471846, "learning_rate": 2.0091743119266058e-05, "loss": 0.334, "loss_nan_ranks": 0, "loss_rank_avg": 0.30896592140197754, "step": 220, "valid_targets_mean": 5896.0, "valid_targets_min": 1675 }, { "epoch": 0.3617363344051447, "grad_norm": 0.5570090249676257, "learning_rate": 2.0550458715596332e-05, "loss": 0.32, "loss_nan_ranks": 0, "loss_rank_avg": 0.3088981509208679, "step": 225, "valid_targets_mean": 5530.9, "valid_targets_min": 1200 }, { "epoch": 0.36977491961414793, "grad_norm": 0.597801049082016, "learning_rate": 2.100917431192661e-05, "loss": 0.3018, "loss_nan_ranks": 0, "loss_rank_avg": 0.3181556165218353, "step": 230, "valid_targets_mean": 6380.2, "valid_targets_min": 2558 }, { "epoch": 0.3778135048231511, "grad_norm": 0.5191577104221832, "learning_rate": 2.1467889908256883e-05, "loss": 0.3355, "loss_nan_ranks": 0, "loss_rank_avg": 0.3778053820133209, "step": 235, "valid_targets_mean": 5636.4, "valid_targets_min": 344 }, { "epoch": 0.3858520900321543, "grad_norm": 0.5854719585440191, "learning_rate": 2.1926605504587157e-05, "loss": 0.3358, "loss_nan_ranks": 0, "loss_rank_avg": 0.35405513644218445, "step": 240, "valid_targets_mean": 5000.0, "valid_targets_min": 1732 }, { "epoch": 0.39389067524115756, "grad_norm": 0.5476862094602315, "learning_rate": 2.238532110091743e-05, "loss": 0.3159, "loss_nan_ranks": 0, "loss_rank_avg": 0.2814165949821472, "step": 245, "valid_targets_mean": 4733.5, "valid_targets_min": 1002 }, { "epoch": 0.40192926045016075, "grad_norm": 0.5926979503199129, "learning_rate": 2.2844036697247705e-05, "loss": 0.3551, "loss_nan_ranks": 0, "loss_rank_avg": 0.3770928382873535, "step": 250, "valid_targets_mean": 5427.2, "valid_targets_min": 493 }, { "epoch": 0.409967845659164, "grad_norm": 0.6100209266847794, "learning_rate": 2.3302752293577983e-05, "loss": 0.3364, "loss_nan_ranks": 0, "loss_rank_avg": 0.3547223210334778, "step": 255, "valid_targets_mean": 4440.1, "valid_targets_min": 485 }, { "epoch": 0.4180064308681672, "grad_norm": 0.5566232844963857, "learning_rate": 2.376146788990826e-05, "loss": 0.309, "loss_nan_ranks": 0, "loss_rank_avg": 0.3098330497741699, "step": 260, "valid_targets_mean": 4793.3, "valid_targets_min": 364 }, { "epoch": 0.42604501607717044, "grad_norm": 0.5427122101027465, "learning_rate": 2.4220183486238534e-05, "loss": 0.302, "loss_nan_ranks": 0, "loss_rank_avg": 0.31646621227264404, "step": 265, "valid_targets_mean": 4927.3, "valid_targets_min": 452 }, { "epoch": 0.4340836012861736, "grad_norm": 0.5988872869137836, "learning_rate": 2.467889908256881e-05, "loss": 0.3189, "loss_nan_ranks": 0, "loss_rank_avg": 0.34495389461517334, "step": 270, "valid_targets_mean": 4704.2, "valid_targets_min": 329 }, { "epoch": 0.44212218649517687, "grad_norm": 0.547941917409528, "learning_rate": 2.5137614678899085e-05, "loss": 0.3255, "loss_nan_ranks": 0, "loss_rank_avg": 0.3075386881828308, "step": 275, "valid_targets_mean": 4813.1, "valid_targets_min": 946 }, { "epoch": 0.45016077170418006, "grad_norm": 0.5249153697259977, "learning_rate": 2.559633027522936e-05, "loss": 0.3121, "loss_nan_ranks": 0, "loss_rank_avg": 0.28792035579681396, "step": 280, "valid_targets_mean": 5561.9, "valid_targets_min": 2942 }, { "epoch": 0.45819935691318325, "grad_norm": 0.43052674384652867, "learning_rate": 2.6055045871559633e-05, "loss": 0.2923, "loss_nan_ranks": 0, "loss_rank_avg": 0.31526419520378113, "step": 285, "valid_targets_mean": 7136.0, "valid_targets_min": 2915 }, { "epoch": 0.4662379421221865, "grad_norm": 0.5540575973124553, "learning_rate": 2.6513761467889907e-05, "loss": 0.3446, "loss_nan_ranks": 0, "loss_rank_avg": 0.32834839820861816, "step": 290, "valid_targets_mean": 5022.2, "valid_targets_min": 237 }, { "epoch": 0.4742765273311897, "grad_norm": 0.48094194473889346, "learning_rate": 2.6972477064220185e-05, "loss": 0.3056, "loss_nan_ranks": 0, "loss_rank_avg": 0.3205365836620331, "step": 295, "valid_targets_mean": 5865.0, "valid_targets_min": 2315 }, { "epoch": 0.48231511254019294, "grad_norm": 0.5618267371932142, "learning_rate": 2.7431192660550462e-05, "loss": 0.3165, "loss_nan_ranks": 0, "loss_rank_avg": 0.3605026602745056, "step": 300, "valid_targets_mean": 4986.5, "valid_targets_min": 921 }, { "epoch": 0.4903536977491961, "grad_norm": 0.6404105383558549, "learning_rate": 2.7889908256880736e-05, "loss": 0.2895, "loss_nan_ranks": 0, "loss_rank_avg": 0.30333420634269714, "step": 305, "valid_targets_mean": 4107.6, "valid_targets_min": 466 }, { "epoch": 0.4983922829581994, "grad_norm": 0.5306270510654744, "learning_rate": 2.8348623853211014e-05, "loss": 0.3029, "loss_nan_ranks": 0, "loss_rank_avg": 0.29267704486846924, "step": 310, "valid_targets_mean": 5249.4, "valid_targets_min": 2300 }, { "epoch": 0.5064308681672026, "grad_norm": 0.49099328683222326, "learning_rate": 2.8807339449541288e-05, "loss": 0.3195, "loss_nan_ranks": 0, "loss_rank_avg": 0.30092453956604004, "step": 315, "valid_targets_mean": 5905.2, "valid_targets_min": 1454 }, { "epoch": 0.5144694533762058, "grad_norm": 0.663160338132964, "learning_rate": 2.926605504587156e-05, "loss": 0.2776, "loss_nan_ranks": 0, "loss_rank_avg": 0.2730156183242798, "step": 320, "valid_targets_mean": 4000.4, "valid_targets_min": 419 }, { "epoch": 0.522508038585209, "grad_norm": 0.49329600788095035, "learning_rate": 2.9724770642201836e-05, "loss": 0.2929, "loss_nan_ranks": 0, "loss_rank_avg": 0.32109999656677246, "step": 325, "valid_targets_mean": 6141.3, "valid_targets_min": 2263 }, { "epoch": 0.5305466237942122, "grad_norm": 0.5752524694010668, "learning_rate": 3.0183486238532113e-05, "loss": 0.3435, "loss_nan_ranks": 0, "loss_rank_avg": 0.40009579062461853, "step": 330, "valid_targets_mean": 6205.9, "valid_targets_min": 437 }, { "epoch": 0.5385852090032154, "grad_norm": 0.5350750612199158, "learning_rate": 3.0642201834862384e-05, "loss": 0.2993, "loss_nan_ranks": 0, "loss_rank_avg": 0.3526759147644043, "step": 335, "valid_targets_mean": 5805.6, "valid_targets_min": 1255 }, { "epoch": 0.5466237942122186, "grad_norm": 0.5826856037526428, "learning_rate": 3.110091743119266e-05, "loss": 0.3106, "loss_nan_ranks": 0, "loss_rank_avg": 0.3246879279613495, "step": 340, "valid_targets_mean": 5508.0, "valid_targets_min": 1309 }, { "epoch": 0.5546623794212219, "grad_norm": 0.42437748396411806, "learning_rate": 3.155963302752294e-05, "loss": 0.2945, "loss_nan_ranks": 0, "loss_rank_avg": 0.2742518186569214, "step": 345, "valid_targets_mean": 7056.8, "valid_targets_min": 2993 }, { "epoch": 0.5627009646302251, "grad_norm": 0.6228872767131681, "learning_rate": 3.201834862385321e-05, "loss": 0.3009, "loss_nan_ranks": 0, "loss_rank_avg": 0.30292758345603943, "step": 350, "valid_targets_mean": 4400.6, "valid_targets_min": 873 }, { "epoch": 0.5707395498392283, "grad_norm": 0.4664154597507688, "learning_rate": 3.2477064220183487e-05, "loss": 0.3329, "loss_nan_ranks": 0, "loss_rank_avg": 0.3061991333961487, "step": 355, "valid_targets_mean": 6292.2, "valid_targets_min": 3215 }, { "epoch": 0.5787781350482315, "grad_norm": 0.5161256905301413, "learning_rate": 3.293577981651377e-05, "loss": 0.3099, "loss_nan_ranks": 0, "loss_rank_avg": 0.24547383189201355, "step": 360, "valid_targets_mean": 4519.0, "valid_targets_min": 319 }, { "epoch": 0.5868167202572347, "grad_norm": 0.5365528928336145, "learning_rate": 3.339449541284404e-05, "loss": 0.2969, "loss_nan_ranks": 0, "loss_rank_avg": 0.29534512758255005, "step": 365, "valid_targets_mean": 4922.1, "valid_targets_min": 984 }, { "epoch": 0.594855305466238, "grad_norm": 0.5097548549634454, "learning_rate": 3.3853211009174315e-05, "loss": 0.312, "loss_nan_ranks": 0, "loss_rank_avg": 0.296095073223114, "step": 370, "valid_targets_mean": 5232.6, "valid_targets_min": 872 }, { "epoch": 0.6028938906752411, "grad_norm": 0.49051425109618985, "learning_rate": 3.431192660550459e-05, "loss": 0.2838, "loss_nan_ranks": 0, "loss_rank_avg": 0.30179792642593384, "step": 375, "valid_targets_mean": 5981.7, "valid_targets_min": 1437 }, { "epoch": 0.6109324758842444, "grad_norm": 0.5966512802302277, "learning_rate": 3.477064220183486e-05, "loss": 0.3042, "loss_nan_ranks": 0, "loss_rank_avg": 0.3060946464538574, "step": 380, "valid_targets_mean": 5208.1, "valid_targets_min": 1644 }, { "epoch": 0.6189710610932476, "grad_norm": 0.6706382795742738, "learning_rate": 3.5229357798165144e-05, "loss": 0.3086, "loss_nan_ranks": 0, "loss_rank_avg": 0.34184399247169495, "step": 385, "valid_targets_mean": 5654.9, "valid_targets_min": 1790 }, { "epoch": 0.6270096463022508, "grad_norm": 0.5660946301266201, "learning_rate": 3.568807339449542e-05, "loss": 0.3078, "loss_nan_ranks": 0, "loss_rank_avg": 0.2994377017021179, "step": 390, "valid_targets_mean": 5468.1, "valid_targets_min": 696 }, { "epoch": 0.635048231511254, "grad_norm": 0.5340949761801713, "learning_rate": 3.614678899082569e-05, "loss": 0.3119, "loss_nan_ranks": 0, "loss_rank_avg": 0.30014336109161377, "step": 395, "valid_targets_mean": 5420.6, "valid_targets_min": 574 }, { "epoch": 0.6430868167202572, "grad_norm": 0.4923375299212512, "learning_rate": 3.6605504587155966e-05, "loss": 0.3044, "loss_nan_ranks": 0, "loss_rank_avg": 0.29296672344207764, "step": 400, "valid_targets_mean": 5953.8, "valid_targets_min": 2356 }, { "epoch": 0.6511254019292605, "grad_norm": 0.4912029841427183, "learning_rate": 3.706422018348624e-05, "loss": 0.2696, "loss_nan_ranks": 0, "loss_rank_avg": 0.24615658819675446, "step": 405, "valid_targets_mean": 5338.8, "valid_targets_min": 2680 }, { "epoch": 0.6591639871382636, "grad_norm": 0.46236233354479367, "learning_rate": 3.7522935779816514e-05, "loss": 0.2961, "loss_nan_ranks": 0, "loss_rank_avg": 0.3032350540161133, "step": 410, "valid_targets_mean": 5982.8, "valid_targets_min": 3495 }, { "epoch": 0.6672025723472669, "grad_norm": 0.5212184732903835, "learning_rate": 3.798165137614679e-05, "loss": 0.3096, "loss_nan_ranks": 0, "loss_rank_avg": 0.3059643507003784, "step": 415, "valid_targets_mean": 5736.6, "valid_targets_min": 2521 }, { "epoch": 0.6752411575562701, "grad_norm": 0.5207305397129113, "learning_rate": 3.844036697247707e-05, "loss": 0.2929, "loss_nan_ranks": 0, "loss_rank_avg": 0.31649553775787354, "step": 420, "valid_targets_mean": 5298.9, "valid_targets_min": 3490 }, { "epoch": 0.6832797427652733, "grad_norm": 0.6992704167148815, "learning_rate": 3.889908256880734e-05, "loss": 0.2922, "loss_nan_ranks": 0, "loss_rank_avg": 0.2679362893104553, "step": 425, "valid_targets_mean": 5616.1, "valid_targets_min": 2463 }, { "epoch": 0.6913183279742765, "grad_norm": 0.511472564575663, "learning_rate": 3.935779816513762e-05, "loss": 0.2751, "loss_nan_ranks": 0, "loss_rank_avg": 0.30654776096343994, "step": 430, "valid_targets_mean": 5721.6, "valid_targets_min": 3272 }, { "epoch": 0.6993569131832797, "grad_norm": 0.4709582852431494, "learning_rate": 3.981651376146789e-05, "loss": 0.2848, "loss_nan_ranks": 0, "loss_rank_avg": 0.2843867540359497, "step": 435, "valid_targets_mean": 5574.6, "valid_targets_min": 2023 }, { "epoch": 0.707395498392283, "grad_norm": 0.453220231562951, "learning_rate": 3.999994213536979e-05, "loss": 0.3015, "loss_nan_ranks": 0, "loss_rank_avg": 0.30728816986083984, "step": 440, "valid_targets_mean": 6203.7, "valid_targets_min": 3453 }, { "epoch": 0.7154340836012861, "grad_norm": 0.4755977887273865, "learning_rate": 3.999958851939771e-05, "loss": 0.2965, "loss_nan_ranks": 0, "loss_rank_avg": 0.28380826115608215, "step": 445, "valid_targets_mean": 6442.1, "valid_targets_min": 2803 }, { "epoch": 0.7234726688102894, "grad_norm": 0.49493667906582395, "learning_rate": 3.999891344014729e-05, "loss": 0.2948, "loss_nan_ranks": 0, "loss_rank_avg": 0.26691269874572754, "step": 450, "valid_targets_mean": 4888.2, "valid_targets_min": 2047 }, { "epoch": 0.7315112540192926, "grad_norm": 0.5095276271053644, "learning_rate": 3.999791690846941e-05, "loss": 0.301, "loss_nan_ranks": 0, "loss_rank_avg": 0.2900855243206024, "step": 455, "valid_targets_mean": 4938.0, "valid_targets_min": 1713 }, { "epoch": 0.7395498392282959, "grad_norm": 0.5205052676880491, "learning_rate": 3.9996598940381816e-05, "loss": 0.2963, "loss_nan_ranks": 0, "loss_rank_avg": 0.3060019910335541, "step": 460, "valid_targets_mean": 5271.0, "valid_targets_min": 699 }, { "epoch": 0.747588424437299, "grad_norm": 0.4876809443820683, "learning_rate": 3.9994959557068863e-05, "loss": 0.2781, "loss_nan_ranks": 0, "loss_rank_avg": 0.27658092975616455, "step": 465, "valid_targets_mean": 5591.4, "valid_targets_min": 1875 }, { "epoch": 0.7556270096463023, "grad_norm": 0.4923720425882284, "learning_rate": 3.999299878488117e-05, "loss": 0.2871, "loss_nan_ranks": 0, "loss_rank_avg": 0.2531621754169464, "step": 470, "valid_targets_mean": 5429.0, "valid_targets_min": 2498 }, { "epoch": 0.7636655948553055, "grad_norm": 0.585919343961974, "learning_rate": 3.99907166553352e-05, "loss": 0.2943, "loss_nan_ranks": 0, "loss_rank_avg": 0.30858397483825684, "step": 475, "valid_targets_mean": 4827.4, "valid_targets_min": 513 }, { "epoch": 0.7717041800643086, "grad_norm": 0.4747623432707116, "learning_rate": 3.9988113205112755e-05, "loss": 0.3013, "loss_nan_ranks": 0, "loss_rank_avg": 0.33221951127052307, "step": 480, "valid_targets_mean": 5955.8, "valid_targets_min": 675 }, { "epoch": 0.7797427652733119, "grad_norm": 0.456621692177911, "learning_rate": 3.998518847606036e-05, "loss": 0.2851, "loss_nan_ranks": 0, "loss_rank_avg": 0.28177374601364136, "step": 485, "valid_targets_mean": 5865.8, "valid_targets_min": 2025 }, { "epoch": 0.7877813504823151, "grad_norm": 0.4665811147170575, "learning_rate": 3.998194251518865e-05, "loss": 0.3184, "loss_nan_ranks": 0, "loss_rank_avg": 0.3034052550792694, "step": 490, "valid_targets_mean": 5511.8, "valid_targets_min": 3215 }, { "epoch": 0.7958199356913184, "grad_norm": 0.3911511618161914, "learning_rate": 3.9978375374671555e-05, "loss": 0.281, "loss_nan_ranks": 0, "loss_rank_avg": 0.24626390635967255, "step": 495, "valid_targets_mean": 7323.9, "valid_targets_min": 2857 }, { "epoch": 0.8038585209003215, "grad_norm": 0.5396114749470258, "learning_rate": 3.997448711184548e-05, "loss": 0.3037, "loss_nan_ranks": 0, "loss_rank_avg": 0.308045893907547, "step": 500, "valid_targets_mean": 5182.1, "valid_targets_min": 747 }, { "epoch": 0.8118971061093248, "grad_norm": 0.4849544264425815, "learning_rate": 3.997027778920841e-05, "loss": 0.2887, "loss_nan_ranks": 0, "loss_rank_avg": 0.3522014915943146, "step": 505, "valid_targets_mean": 6453.4, "valid_targets_min": 2028 }, { "epoch": 0.819935691318328, "grad_norm": 0.5350245918364654, "learning_rate": 3.9965747474418855e-05, "loss": 0.3212, "loss_nan_ranks": 0, "loss_rank_avg": 0.3169665038585663, "step": 510, "valid_targets_mean": 4740.1, "valid_targets_min": 576 }, { "epoch": 0.8279742765273312, "grad_norm": 0.4938218700461966, "learning_rate": 3.996089624029482e-05, "loss": 0.2714, "loss_nan_ranks": 0, "loss_rank_avg": 0.25281214714050293, "step": 515, "valid_targets_mean": 5391.9, "valid_targets_min": 588 }, { "epoch": 0.8360128617363344, "grad_norm": 0.46030799853278453, "learning_rate": 3.995572416481258e-05, "loss": 0.2758, "loss_nan_ranks": 0, "loss_rank_avg": 0.2778337001800537, "step": 520, "valid_targets_mean": 5831.8, "valid_targets_min": 1928 }, { "epoch": 0.8440514469453376, "grad_norm": 0.4832421033589269, "learning_rate": 3.9950231331105464e-05, "loss": 0.2983, "loss_nan_ranks": 0, "loss_rank_avg": 0.28779375553131104, "step": 525, "valid_targets_mean": 5119.5, "valid_targets_min": 661 }, { "epoch": 0.8520900321543409, "grad_norm": 0.5293558575026555, "learning_rate": 3.994441782746251e-05, "loss": 0.2907, "loss_nan_ranks": 0, "loss_rank_avg": 0.2785415053367615, "step": 530, "valid_targets_mean": 5092.9, "valid_targets_min": 2581 }, { "epoch": 0.860128617363344, "grad_norm": 0.416392644109728, "learning_rate": 3.993828374732704e-05, "loss": 0.2966, "loss_nan_ranks": 0, "loss_rank_avg": 0.2805801033973694, "step": 535, "valid_targets_mean": 6368.6, "valid_targets_min": 355 }, { "epoch": 0.8681672025723473, "grad_norm": 0.4645205058216023, "learning_rate": 3.993182918929515e-05, "loss": 0.2936, "loss_nan_ranks": 0, "loss_rank_avg": 0.30918392539024353, "step": 540, "valid_targets_mean": 5649.8, "valid_targets_min": 2795 }, { "epoch": 0.8762057877813505, "grad_norm": 0.5308378752814893, "learning_rate": 3.992505425711414e-05, "loss": 0.2655, "loss_nan_ranks": 0, "loss_rank_avg": 0.2631094455718994, "step": 545, "valid_targets_mean": 4481.9, "valid_targets_min": 514 }, { "epoch": 0.8842443729903537, "grad_norm": 0.4801689653969418, "learning_rate": 3.991795905968086e-05, "loss": 0.2806, "loss_nan_ranks": 0, "loss_rank_avg": 0.30362850427627563, "step": 550, "valid_targets_mean": 5824.9, "valid_targets_min": 3011 }, { "epoch": 0.8922829581993569, "grad_norm": 0.44577993655229686, "learning_rate": 3.991054371103992e-05, "loss": 0.2839, "loss_nan_ranks": 0, "loss_rank_avg": 0.26914289593696594, "step": 555, "valid_targets_mean": 6685.0, "valid_targets_min": 2217 }, { "epoch": 0.9003215434083601, "grad_norm": 0.45000332721151537, "learning_rate": 3.9902808330381876e-05, "loss": 0.2972, "loss_nan_ranks": 0, "loss_rank_avg": 0.26276689767837524, "step": 560, "valid_targets_mean": 6083.2, "valid_targets_min": 3312 }, { "epoch": 0.9083601286173634, "grad_norm": 0.5316772461451206, "learning_rate": 3.989475304204135e-05, "loss": 0.2926, "loss_nan_ranks": 0, "loss_rank_avg": 0.3673328757286072, "step": 565, "valid_targets_mean": 6526.5, "valid_targets_min": 2025 }, { "epoch": 0.9163987138263665, "grad_norm": 0.45002232479827187, "learning_rate": 3.988637797549496e-05, "loss": 0.2761, "loss_nan_ranks": 0, "loss_rank_avg": 0.25491195917129517, "step": 570, "valid_targets_mean": 6206.9, "valid_targets_min": 660 }, { "epoch": 0.9244372990353698, "grad_norm": 0.6688784807827985, "learning_rate": 3.9877683265359294e-05, "loss": 0.2803, "loss_nan_ranks": 0, "loss_rank_avg": 0.23365923762321472, "step": 575, "valid_targets_mean": 5251.8, "valid_targets_min": 2129 }, { "epoch": 0.932475884244373, "grad_norm": 0.5328784356408865, "learning_rate": 3.986866905138874e-05, "loss": 0.2708, "loss_nan_ranks": 0, "loss_rank_avg": 0.2967522144317627, "step": 580, "valid_targets_mean": 4377.9, "valid_targets_min": 398 }, { "epoch": 0.9405144694533762, "grad_norm": 0.4705101238005458, "learning_rate": 3.985933547847319e-05, "loss": 0.2678, "loss_nan_ranks": 0, "loss_rank_avg": 0.276937335729599, "step": 585, "valid_targets_mean": 5281.8, "valid_targets_min": 971 }, { "epoch": 0.9485530546623794, "grad_norm": 0.39879237511284055, "learning_rate": 3.984968269663582e-05, "loss": 0.3115, "loss_nan_ranks": 0, "loss_rank_avg": 0.268502801656723, "step": 590, "valid_targets_mean": 6211.7, "valid_targets_min": 2174 }, { "epoch": 0.9565916398713826, "grad_norm": 0.4480245882027022, "learning_rate": 3.983971086103053e-05, "loss": 0.2682, "loss_nan_ranks": 0, "loss_rank_avg": 0.2714992165565491, "step": 595, "valid_targets_mean": 5526.9, "valid_targets_min": 349 }, { "epoch": 0.9646302250803859, "grad_norm": 0.5403266638905054, "learning_rate": 3.982942013193958e-05, "loss": 0.2762, "loss_nan_ranks": 0, "loss_rank_avg": 0.3248938322067261, "step": 600, "valid_targets_mean": 6144.6, "valid_targets_min": 636 }, { "epoch": 0.9726688102893891, "grad_norm": 0.4516840633756994, "learning_rate": 3.981881067477095e-05, "loss": 0.2684, "loss_nan_ranks": 0, "loss_rank_avg": 0.2717623710632324, "step": 605, "valid_targets_mean": 5657.6, "valid_targets_min": 2868 }, { "epoch": 0.9807073954983923, "grad_norm": 0.4528229245449106, "learning_rate": 3.9807882660055696e-05, "loss": 0.2867, "loss_nan_ranks": 0, "loss_rank_avg": 0.2597085237503052, "step": 610, "valid_targets_mean": 5101.6, "valid_targets_min": 2236 }, { "epoch": 0.9887459807073955, "grad_norm": 0.44017945177584167, "learning_rate": 3.979663626344519e-05, "loss": 0.2847, "loss_nan_ranks": 0, "loss_rank_avg": 0.25955039262771606, "step": 615, "valid_targets_mean": 5319.9, "valid_targets_min": 686 }, { "epoch": 0.9967845659163987, "grad_norm": 0.47936626435483093, "learning_rate": 3.978507166570834e-05, "loss": 0.2894, "loss_nan_ranks": 0, "loss_rank_avg": 0.27693191170692444, "step": 620, "valid_targets_mean": 4538.5, "valid_targets_min": 1621 }, { "epoch": 1.004823151125402, "grad_norm": 0.4481854100624881, "learning_rate": 3.9773189052728645e-05, "loss": 0.2759, "loss_nan_ranks": 0, "loss_rank_avg": 0.2927781641483307, "step": 625, "valid_targets_mean": 5881.1, "valid_targets_min": 439 }, { "epoch": 1.0128617363344052, "grad_norm": 0.4518269756671226, "learning_rate": 3.9760988615501216e-05, "loss": 0.2623, "loss_nan_ranks": 0, "loss_rank_avg": 0.21591615676879883, "step": 630, "valid_targets_mean": 5202.7, "valid_targets_min": 706 }, { "epoch": 1.0209003215434083, "grad_norm": 0.4894405054425604, "learning_rate": 3.974847055012971e-05, "loss": 0.2816, "loss_nan_ranks": 0, "loss_rank_avg": 0.263643354177475, "step": 635, "valid_targets_mean": 4966.3, "valid_targets_min": 407 }, { "epoch": 1.0289389067524115, "grad_norm": 0.46931111935501457, "learning_rate": 3.97356350578232e-05, "loss": 0.2721, "loss_nan_ranks": 0, "loss_rank_avg": 0.27274036407470703, "step": 640, "valid_targets_mean": 6239.4, "valid_targets_min": 2734 }, { "epoch": 1.0369774919614148, "grad_norm": 0.45174077610801744, "learning_rate": 3.9722482344892885e-05, "loss": 0.2787, "loss_nan_ranks": 0, "loss_rank_avg": 0.2617829442024231, "step": 645, "valid_targets_mean": 5997.4, "valid_targets_min": 2568 }, { "epoch": 1.045016077170418, "grad_norm": 0.4548552448131556, "learning_rate": 3.970901262274883e-05, "loss": 0.2675, "loss_nan_ranks": 0, "loss_rank_avg": 0.26283806562423706, "step": 650, "valid_targets_mean": 6102.5, "valid_targets_min": 2567 }, { "epoch": 1.0530546623794212, "grad_norm": 0.43090204468670307, "learning_rate": 3.9695226107896544e-05, "loss": 0.2682, "loss_nan_ranks": 0, "loss_rank_avg": 0.23034942150115967, "step": 655, "valid_targets_mean": 5608.3, "valid_targets_min": 2451 }, { "epoch": 1.0610932475884245, "grad_norm": 0.4842292354424898, "learning_rate": 3.96811230219335e-05, "loss": 0.2695, "loss_nan_ranks": 0, "loss_rank_avg": 0.33251893520355225, "step": 660, "valid_targets_mean": 6044.6, "valid_targets_min": 1019 }, { "epoch": 1.0691318327974277, "grad_norm": 0.5166627086454233, "learning_rate": 3.9666703591545577e-05, "loss": 0.26, "loss_nan_ranks": 0, "loss_rank_avg": 0.264485239982605, "step": 665, "valid_targets_mean": 5534.3, "valid_targets_min": 1623 }, { "epoch": 1.077170418006431, "grad_norm": 0.4561205383774768, "learning_rate": 3.965196804850341e-05, "loss": 0.2781, "loss_nan_ranks": 0, "loss_rank_avg": 0.2511570453643799, "step": 670, "valid_targets_mean": 6292.3, "valid_targets_min": 3831 }, { "epoch": 1.085209003215434, "grad_norm": 0.4664119838831818, "learning_rate": 3.963691662965866e-05, "loss": 0.2727, "loss_nan_ranks": 0, "loss_rank_avg": 0.2670794725418091, "step": 675, "valid_targets_mean": 6324.6, "valid_targets_min": 2635 }, { "epoch": 1.0932475884244373, "grad_norm": 0.4596143591998667, "learning_rate": 3.9621549576940237e-05, "loss": 0.2734, "loss_nan_ranks": 0, "loss_rank_avg": 0.2652100920677185, "step": 680, "valid_targets_mean": 6118.9, "valid_targets_min": 3113 }, { "epoch": 1.1012861736334405, "grad_norm": 0.45527286052039845, "learning_rate": 3.9605867137350386e-05, "loss": 0.2687, "loss_nan_ranks": 0, "loss_rank_avg": 0.2878355383872986, "step": 685, "valid_targets_mean": 5584.5, "valid_targets_min": 861 }, { "epoch": 1.1093247588424437, "grad_norm": 0.46127939436236953, "learning_rate": 3.95898695629607e-05, "loss": 0.2555, "loss_nan_ranks": 0, "loss_rank_avg": 0.3002994954586029, "step": 690, "valid_targets_mean": 6248.5, "valid_targets_min": 2783 }, { "epoch": 1.117363344051447, "grad_norm": 0.4904239019276266, "learning_rate": 3.957355711090812e-05, "loss": 0.2765, "loss_nan_ranks": 0, "loss_rank_avg": 0.3002205491065979, "step": 695, "valid_targets_mean": 6415.4, "valid_targets_min": 900 }, { "epoch": 1.1254019292604502, "grad_norm": 0.4695407346217511, "learning_rate": 3.955693004339074e-05, "loss": 0.2334, "loss_nan_ranks": 0, "loss_rank_avg": 0.2368508279323578, "step": 700, "valid_targets_mean": 4967.2, "valid_targets_min": 1648 }, { "epoch": 1.1334405144694535, "grad_norm": 0.4209177205357036, "learning_rate": 3.953998862766366e-05, "loss": 0.2425, "loss_nan_ranks": 0, "loss_rank_avg": 0.22972455620765686, "step": 705, "valid_targets_mean": 5793.0, "valid_targets_min": 2220 }, { "epoch": 1.1414790996784565, "grad_norm": 0.5792332549777016, "learning_rate": 3.9522733136034607e-05, "loss": 0.2663, "loss_nan_ranks": 0, "loss_rank_avg": 0.3492357134819031, "step": 710, "valid_targets_mean": 6088.8, "valid_targets_min": 3000 }, { "epoch": 1.1495176848874598, "grad_norm": 0.481756880710946, "learning_rate": 3.9505163845859666e-05, "loss": 0.2805, "loss_nan_ranks": 0, "loss_rank_avg": 0.2731996476650238, "step": 715, "valid_targets_mean": 5951.7, "valid_targets_min": 3413 }, { "epoch": 1.157556270096463, "grad_norm": 0.46578493054858106, "learning_rate": 3.94872810395387e-05, "loss": 0.2471, "loss_nan_ranks": 0, "loss_rank_avg": 0.2460387945175171, "step": 720, "valid_targets_mean": 5526.6, "valid_targets_min": 1749 }, { "epoch": 1.1655948553054662, "grad_norm": 0.4428649245983029, "learning_rate": 3.9469085004510915e-05, "loss": 0.2667, "loss_nan_ranks": 0, "loss_rank_avg": 0.2698541283607483, "step": 725, "valid_targets_mean": 5618.7, "valid_targets_min": 1464 }, { "epoch": 1.1736334405144695, "grad_norm": 0.41739653985008957, "learning_rate": 3.945057603325017e-05, "loss": 0.252, "loss_nan_ranks": 0, "loss_rank_avg": 0.25388237833976746, "step": 730, "valid_targets_mean": 6771.8, "valid_targets_min": 2408 }, { "epoch": 1.1816720257234727, "grad_norm": 0.5085464936906313, "learning_rate": 3.9431754423260336e-05, "loss": 0.2529, "loss_nan_ranks": 0, "loss_rank_avg": 0.24689799547195435, "step": 735, "valid_targets_mean": 4660.9, "valid_targets_min": 449 }, { "epoch": 1.189710610932476, "grad_norm": 0.46314872752532243, "learning_rate": 3.941262047707044e-05, "loss": 0.2689, "loss_nan_ranks": 0, "loss_rank_avg": 0.2670508623123169, "step": 740, "valid_targets_mean": 6294.3, "valid_targets_min": 1012 }, { "epoch": 1.197749196141479, "grad_norm": 0.47881711338841565, "learning_rate": 3.939317450222987e-05, "loss": 0.2706, "loss_nan_ranks": 0, "loss_rank_avg": 0.30444222688674927, "step": 745, "valid_targets_mean": 6074.1, "valid_targets_min": 1556 }, { "epoch": 1.2057877813504823, "grad_norm": 0.4255017920309088, "learning_rate": 3.93734168113034e-05, "loss": 0.2875, "loss_nan_ranks": 0, "loss_rank_avg": 0.27554166316986084, "step": 750, "valid_targets_mean": 6897.2, "valid_targets_min": 2189 }, { "epoch": 1.2138263665594855, "grad_norm": 0.4254444753489672, "learning_rate": 3.935334772186617e-05, "loss": 0.2692, "loss_nan_ranks": 0, "loss_rank_avg": 0.23489391803741455, "step": 755, "valid_targets_mean": 5864.9, "valid_targets_min": 818 }, { "epoch": 1.2218649517684887, "grad_norm": 0.4819794151433871, "learning_rate": 3.933296755649857e-05, "loss": 0.2757, "loss_nan_ranks": 0, "loss_rank_avg": 0.3091309070587158, "step": 760, "valid_targets_mean": 6131.4, "valid_targets_min": 355 }, { "epoch": 1.229903536977492, "grad_norm": 0.5020999109939216, "learning_rate": 3.931227664278108e-05, "loss": 0.2597, "loss_nan_ranks": 0, "loss_rank_avg": 0.23047637939453125, "step": 765, "valid_targets_mean": 5521.8, "valid_targets_min": 1540 }, { "epoch": 1.2379421221864952, "grad_norm": 0.8030577323017846, "learning_rate": 3.9291275313289006e-05, "loss": 0.2825, "loss_nan_ranks": 0, "loss_rank_avg": 0.3151301443576813, "step": 770, "valid_targets_mean": 5532.3, "valid_targets_min": 1775 }, { "epoch": 1.2459807073954985, "grad_norm": 0.5081302977797679, "learning_rate": 3.926996390558709e-05, "loss": 0.2637, "loss_nan_ranks": 0, "loss_rank_avg": 0.2657415270805359, "step": 775, "valid_targets_mean": 4668.9, "valid_targets_min": 2112 }, { "epoch": 1.2540192926045015, "grad_norm": 0.44368801982072564, "learning_rate": 3.9248342762224136e-05, "loss": 0.2748, "loss_nan_ranks": 0, "loss_rank_avg": 0.31955486536026, "step": 780, "valid_targets_mean": 6386.7, "valid_targets_min": 3611 }, { "epoch": 1.2620578778135048, "grad_norm": 0.498931124537264, "learning_rate": 3.922641223072747e-05, "loss": 0.2367, "loss_nan_ranks": 0, "loss_rank_avg": 0.2425532042980194, "step": 785, "valid_targets_mean": 4810.9, "valid_targets_min": 486 }, { "epoch": 1.270096463022508, "grad_norm": 0.5320789984283447, "learning_rate": 3.9204172663597375e-05, "loss": 0.2778, "loss_nan_ranks": 0, "loss_rank_avg": 0.28130286931991577, "step": 790, "valid_targets_mean": 5046.2, "valid_targets_min": 563 }, { "epoch": 1.2781350482315113, "grad_norm": 0.49054524873365496, "learning_rate": 3.918162441830142e-05, "loss": 0.27, "loss_nan_ranks": 0, "loss_rank_avg": 0.27069205045700073, "step": 795, "valid_targets_mean": 5739.9, "valid_targets_min": 1960 }, { "epoch": 1.2861736334405145, "grad_norm": 0.5131172853073105, "learning_rate": 3.915876785726869e-05, "loss": 0.2683, "loss_nan_ranks": 0, "loss_rank_avg": 0.30020472407341003, "step": 800, "valid_targets_mean": 5495.4, "valid_targets_min": 1822 }, { "epoch": 1.2942122186495177, "grad_norm": 0.389125813463063, "learning_rate": 3.9135603347884e-05, "loss": 0.2508, "loss_nan_ranks": 0, "loss_rank_avg": 0.24876119196414948, "step": 805, "valid_targets_mean": 6612.6, "valid_targets_min": 2915 }, { "epoch": 1.302250803858521, "grad_norm": 0.5127358532210575, "learning_rate": 3.911213126248198e-05, "loss": 0.2567, "loss_nan_ranks": 0, "loss_rank_avg": 0.30721384286880493, "step": 810, "valid_targets_mean": 5653.8, "valid_targets_min": 2095 }, { "epoch": 1.310289389067524, "grad_norm": 0.45232559019783497, "learning_rate": 3.908835197834105e-05, "loss": 0.2521, "loss_nan_ranks": 0, "loss_rank_avg": 0.27385708689689636, "step": 815, "valid_targets_mean": 5792.4, "valid_targets_min": 2123 }, { "epoch": 1.3183279742765273, "grad_norm": 0.41007757692762153, "learning_rate": 3.906426587767741e-05, "loss": 0.2542, "loss_nan_ranks": 0, "loss_rank_avg": 0.23161353170871735, "step": 820, "valid_targets_mean": 6021.1, "valid_targets_min": 829 }, { "epoch": 1.3263665594855305, "grad_norm": 0.46907797176400545, "learning_rate": 3.903987334763888e-05, "loss": 0.2671, "loss_nan_ranks": 0, "loss_rank_avg": 0.2761453092098236, "step": 825, "valid_targets_mean": 5064.2, "valid_targets_min": 786 }, { "epoch": 1.3344051446945338, "grad_norm": 0.4404949978973486, "learning_rate": 3.901517478029865e-05, "loss": 0.2894, "loss_nan_ranks": 0, "loss_rank_avg": 0.3096669912338257, "step": 830, "valid_targets_mean": 6641.9, "valid_targets_min": 3329 }, { "epoch": 1.342443729903537, "grad_norm": 0.4447920716860381, "learning_rate": 3.8990170572649014e-05, "loss": 0.2671, "loss_nan_ranks": 0, "loss_rank_avg": 0.25655800104141235, "step": 835, "valid_targets_mean": 5353.0, "valid_targets_min": 514 }, { "epoch": 1.3504823151125402, "grad_norm": 0.4758215947665256, "learning_rate": 3.8964861126594966e-05, "loss": 0.2692, "loss_nan_ranks": 0, "loss_rank_avg": 0.24453280866146088, "step": 840, "valid_targets_mean": 5096.5, "valid_targets_min": 2521 }, { "epoch": 1.3585209003215435, "grad_norm": 0.4660195988112356, "learning_rate": 3.8939246848947744e-05, "loss": 0.2672, "loss_nan_ranks": 0, "loss_rank_avg": 0.24251258373260498, "step": 845, "valid_targets_mean": 5149.8, "valid_targets_min": 2196 }, { "epoch": 1.3665594855305465, "grad_norm": 0.5276309826854884, "learning_rate": 3.891332815141832e-05, "loss": 0.2616, "loss_nan_ranks": 0, "loss_rank_avg": 0.23830977082252502, "step": 850, "valid_targets_mean": 3673.4, "valid_targets_min": 872 }, { "epoch": 1.3745980707395498, "grad_norm": 0.5071830945159351, "learning_rate": 3.888710545061073e-05, "loss": 0.2535, "loss_nan_ranks": 0, "loss_rank_avg": 0.21140193939208984, "step": 855, "valid_targets_mean": 4074.1, "valid_targets_min": 1713 }, { "epoch": 1.382636655948553, "grad_norm": 0.612703762329473, "learning_rate": 3.886057916801541e-05, "loss": 0.2551, "loss_nan_ranks": 0, "loss_rank_avg": 0.24329236149787903, "step": 860, "valid_targets_mean": 5770.9, "valid_targets_min": 586 }, { "epoch": 1.3906752411575563, "grad_norm": 0.4449814033613736, "learning_rate": 3.883374973000242e-05, "loss": 0.2726, "loss_nan_ranks": 0, "loss_rank_avg": 0.28173279762268066, "step": 865, "valid_targets_mean": 6413.9, "valid_targets_min": 3810 }, { "epoch": 1.3987138263665595, "grad_norm": 0.5574684911444241, "learning_rate": 3.880661756781459e-05, "loss": 0.2412, "loss_nan_ranks": 0, "loss_rank_avg": 0.2678368091583252, "step": 870, "valid_targets_mean": 5746.8, "valid_targets_min": 2217 }, { "epoch": 1.4067524115755627, "grad_norm": 0.47311959969303435, "learning_rate": 3.877918311756059e-05, "loss": 0.2553, "loss_nan_ranks": 0, "loss_rank_avg": 0.2587282955646515, "step": 875, "valid_targets_mean": 5679.6, "valid_targets_min": 818 }, { "epoch": 1.414790996784566, "grad_norm": 0.4587092469906857, "learning_rate": 3.875144682020789e-05, "loss": 0.2624, "loss_nan_ranks": 0, "loss_rank_avg": 0.24418002367019653, "step": 880, "valid_targets_mean": 5821.7, "valid_targets_min": 1972 }, { "epoch": 1.422829581993569, "grad_norm": 0.4889856734893498, "learning_rate": 3.8723409121575744e-05, "loss": 0.2652, "loss_nan_ranks": 0, "loss_rank_avg": 0.29113972187042236, "step": 885, "valid_targets_mean": 5141.8, "valid_targets_min": 717 }, { "epoch": 1.4308681672025725, "grad_norm": 0.42403843566188576, "learning_rate": 3.8695070472327926e-05, "loss": 0.2548, "loss_nan_ranks": 0, "loss_rank_avg": 0.239852637052536, "step": 890, "valid_targets_mean": 5505.6, "valid_targets_min": 1016 }, { "epoch": 1.4389067524115755, "grad_norm": 0.4122605365448489, "learning_rate": 3.866643132796557e-05, "loss": 0.2616, "loss_nan_ranks": 0, "loss_rank_avg": 0.23172590136528015, "step": 895, "valid_targets_mean": 5802.1, "valid_targets_min": 2917 }, { "epoch": 1.4469453376205788, "grad_norm": 0.450815706756309, "learning_rate": 3.86374921488198e-05, "loss": 0.2713, "loss_nan_ranks": 0, "loss_rank_avg": 0.23391862213611603, "step": 900, "valid_targets_mean": 5419.5, "valid_targets_min": 1843 }, { "epoch": 1.454983922829582, "grad_norm": 0.47144379339992176, "learning_rate": 3.8608253400044377e-05, "loss": 0.2482, "loss_nan_ranks": 0, "loss_rank_avg": 0.24085289239883423, "step": 905, "valid_targets_mean": 5648.8, "valid_targets_min": 1257 }, { "epoch": 1.4630225080385852, "grad_norm": 0.5190255717863838, "learning_rate": 3.857871555160816e-05, "loss": 0.2716, "loss_nan_ranks": 0, "loss_rank_avg": 0.29148176312446594, "step": 910, "valid_targets_mean": 5045.9, "valid_targets_min": 1940 }, { "epoch": 1.4710610932475885, "grad_norm": 0.43535103713572904, "learning_rate": 3.854887907828759e-05, "loss": 0.254, "loss_nan_ranks": 0, "loss_rank_avg": 0.2516050338745117, "step": 915, "valid_targets_mean": 5595.3, "valid_targets_min": 2333 }, { "epoch": 1.4790996784565915, "grad_norm": 0.4597492992897256, "learning_rate": 3.851874445965907e-05, "loss": 0.2565, "loss_nan_ranks": 0, "loss_rank_avg": 0.28193798661231995, "step": 920, "valid_targets_mean": 5760.1, "valid_targets_min": 2041 }, { "epoch": 1.487138263665595, "grad_norm": 0.4693120011789064, "learning_rate": 3.848831218009123e-05, "loss": 0.2541, "loss_nan_ranks": 0, "loss_rank_avg": 0.30137860774993896, "step": 925, "valid_targets_mean": 5774.6, "valid_targets_min": 344 }, { "epoch": 1.495176848874598, "grad_norm": 0.5339368400409602, "learning_rate": 3.845758272873714e-05, "loss": 0.2475, "loss_nan_ranks": 0, "loss_rank_avg": 0.22395455837249756, "step": 930, "valid_targets_mean": 4434.1, "valid_targets_min": 594 }, { "epoch": 1.5032154340836013, "grad_norm": 0.45015256467293435, "learning_rate": 3.842655659952649e-05, "loss": 0.2838, "loss_nan_ranks": 0, "loss_rank_avg": 0.24812501668930054, "step": 935, "valid_targets_mean": 6940.7, "valid_targets_min": 1619 }, { "epoch": 1.5112540192926045, "grad_norm": 0.5272600662534491, "learning_rate": 3.839523429115758e-05, "loss": 0.2465, "loss_nan_ranks": 0, "loss_rank_avg": 0.2567567229270935, "step": 940, "valid_targets_mean": 4858.2, "valid_targets_min": 631 }, { "epoch": 1.5192926045016077, "grad_norm": 0.46459840745407177, "learning_rate": 3.8363616307089386e-05, "loss": 0.2509, "loss_nan_ranks": 0, "loss_rank_avg": 0.28069034218788147, "step": 945, "valid_targets_mean": 5754.1, "valid_targets_min": 2011 }, { "epoch": 1.527331189710611, "grad_norm": 0.45214826038540773, "learning_rate": 3.833170315553338e-05, "loss": 0.2335, "loss_nan_ranks": 0, "loss_rank_avg": 0.22650398313999176, "step": 950, "valid_targets_mean": 4581.8, "valid_targets_min": 417 }, { "epoch": 1.535369774919614, "grad_norm": 0.48210984419010594, "learning_rate": 3.8299495349445456e-05, "loss": 0.2615, "loss_nan_ranks": 0, "loss_rank_avg": 0.31238895654678345, "step": 955, "valid_targets_mean": 5383.9, "valid_targets_min": 853 }, { "epoch": 1.5434083601286175, "grad_norm": 0.4928344805065733, "learning_rate": 3.82669934065176e-05, "loss": 0.2581, "loss_nan_ranks": 0, "loss_rank_avg": 0.25374823808670044, "step": 960, "valid_targets_mean": 4763.8, "valid_targets_min": 2176 }, { "epoch": 1.5514469453376205, "grad_norm": 0.4717265251908609, "learning_rate": 3.823419784916962e-05, "loss": 0.2304, "loss_nan_ranks": 0, "loss_rank_avg": 0.22140252590179443, "step": 965, "valid_targets_mean": 5637.1, "valid_targets_min": 2403 }, { "epoch": 1.5594855305466238, "grad_norm": 0.43590323716499957, "learning_rate": 3.8201109204540724e-05, "loss": 0.2584, "loss_nan_ranks": 0, "loss_rank_avg": 0.268430233001709, "step": 970, "valid_targets_mean": 6467.6, "valid_targets_min": 2807 }, { "epoch": 1.567524115755627, "grad_norm": 0.41768095476278655, "learning_rate": 3.8167728004481055e-05, "loss": 0.2674, "loss_nan_ranks": 0, "loss_rank_avg": 0.27189570665359497, "step": 975, "valid_targets_mean": 5752.6, "valid_targets_min": 450 }, { "epoch": 1.5755627009646302, "grad_norm": 0.4832348331279412, "learning_rate": 3.813405478554318e-05, "loss": 0.2778, "loss_nan_ranks": 0, "loss_rank_avg": 0.24511483311653137, "step": 980, "valid_targets_mean": 4317.7, "valid_targets_min": 1986 }, { "epoch": 1.5836012861736335, "grad_norm": 0.414328602413529, "learning_rate": 3.810009008897338e-05, "loss": 0.2524, "loss_nan_ranks": 0, "loss_rank_avg": 0.21237172186374664, "step": 985, "valid_targets_mean": 5577.9, "valid_targets_min": 2366 }, { "epoch": 1.5916398713826365, "grad_norm": 0.4172501302274523, "learning_rate": 3.806583446070303e-05, "loss": 0.2823, "loss_nan_ranks": 0, "loss_rank_avg": 0.2472105622291565, "step": 990, "valid_targets_mean": 5920.4, "valid_targets_min": 2797 }, { "epoch": 1.59967845659164, "grad_norm": 0.4832394129539713, "learning_rate": 3.8031288451339795e-05, "loss": 0.2617, "loss_nan_ranks": 0, "loss_rank_avg": 0.2524241507053375, "step": 995, "valid_targets_mean": 4624.0, "valid_targets_min": 381 }, { "epoch": 1.607717041800643, "grad_norm": 0.43112961475264444, "learning_rate": 3.799645261615875e-05, "loss": 0.2553, "loss_nan_ranks": 0, "loss_rank_avg": 0.2469416856765747, "step": 1000, "valid_targets_mean": 5810.0, "valid_targets_min": 858 }, { "epoch": 1.6157556270096463, "grad_norm": 0.4272566439316645, "learning_rate": 3.796132751509352e-05, "loss": 0.2696, "loss_nan_ranks": 0, "loss_rank_avg": 0.30346783995628357, "step": 1005, "valid_targets_mean": 6606.8, "valid_targets_min": 2392 }, { "epoch": 1.6237942122186495, "grad_norm": 0.623083786690726, "learning_rate": 3.792591371272722e-05, "loss": 0.2485, "loss_nan_ranks": 0, "loss_rank_avg": 0.31482112407684326, "step": 1010, "valid_targets_mean": 5230.8, "valid_targets_min": 731 }, { "epoch": 1.6318327974276527, "grad_norm": 0.44232132209642155, "learning_rate": 3.789021177828342e-05, "loss": 0.2729, "loss_nan_ranks": 0, "loss_rank_avg": 0.3005584478378296, "step": 1015, "valid_targets_mean": 6064.6, "valid_targets_min": 1145 }, { "epoch": 1.639871382636656, "grad_norm": 0.492902103630694, "learning_rate": 3.7854222285616956e-05, "loss": 0.2497, "loss_nan_ranks": 0, "loss_rank_avg": 0.26609134674072266, "step": 1020, "valid_targets_mean": 5095.8, "valid_targets_min": 1490 }, { "epoch": 1.647909967845659, "grad_norm": 0.4657249866434225, "learning_rate": 3.7817945813204754e-05, "loss": 0.2691, "loss_nan_ranks": 0, "loss_rank_avg": 0.20303010940551758, "step": 1025, "valid_targets_mean": 5232.4, "valid_targets_min": 2010 }, { "epoch": 1.6559485530546625, "grad_norm": 0.4708623793870404, "learning_rate": 3.778138294413651e-05, "loss": 0.247, "loss_nan_ranks": 0, "loss_rank_avg": 0.25198543071746826, "step": 1030, "valid_targets_mean": 4911.9, "valid_targets_min": 955 }, { "epoch": 1.6639871382636655, "grad_norm": 0.4165794121258526, "learning_rate": 3.774453426610528e-05, "loss": 0.2489, "loss_nan_ranks": 0, "loss_rank_avg": 0.24974118173122406, "step": 1035, "valid_targets_mean": 5947.4, "valid_targets_min": 502 }, { "epoch": 1.6720257234726688, "grad_norm": 0.4623343866634942, "learning_rate": 3.770740037139811e-05, "loss": 0.2585, "loss_nan_ranks": 0, "loss_rank_avg": 0.2963433563709259, "step": 1040, "valid_targets_mean": 5770.4, "valid_targets_min": 2475 }, { "epoch": 1.680064308681672, "grad_norm": 0.44810587508987115, "learning_rate": 3.7669981856886446e-05, "loss": 0.255, "loss_nan_ranks": 0, "loss_rank_avg": 0.23505745828151703, "step": 1045, "valid_targets_mean": 5224.3, "valid_targets_min": 2812 }, { "epoch": 1.6881028938906752, "grad_norm": 0.45408084656767045, "learning_rate": 3.763227932401658e-05, "loss": 0.2871, "loss_nan_ranks": 0, "loss_rank_avg": 0.28216275572776794, "step": 1050, "valid_targets_mean": 6022.9, "valid_targets_min": 2277 }, { "epoch": 1.6961414790996785, "grad_norm": 0.48656702854532063, "learning_rate": 3.759429337879997e-05, "loss": 0.2638, "loss_nan_ranks": 0, "loss_rank_avg": 0.2563022971153259, "step": 1055, "valid_targets_mean": 5356.8, "valid_targets_min": 2798 }, { "epoch": 1.7041800643086815, "grad_norm": 0.4640030243470164, "learning_rate": 3.755602463180352e-05, "loss": 0.2752, "loss_nan_ranks": 0, "loss_rank_avg": 0.281100332736969, "step": 1060, "valid_targets_mean": 5524.0, "valid_targets_min": 624 }, { "epoch": 1.712218649517685, "grad_norm": 0.4276795294452354, "learning_rate": 3.75174736981397e-05, "loss": 0.2576, "loss_nan_ranks": 0, "loss_rank_avg": 0.27050265669822693, "step": 1065, "valid_targets_mean": 6211.6, "valid_targets_min": 1851 }, { "epoch": 1.720257234726688, "grad_norm": 0.43509074431450273, "learning_rate": 3.747864119745676e-05, "loss": 0.2754, "loss_nan_ranks": 0, "loss_rank_avg": 0.2742531895637512, "step": 1070, "valid_targets_mean": 5541.8, "valid_targets_min": 1342 }, { "epoch": 1.7282958199356915, "grad_norm": 0.4276767599048864, "learning_rate": 3.743952775392867e-05, "loss": 0.2725, "loss_nan_ranks": 0, "loss_rank_avg": 0.25381579995155334, "step": 1075, "valid_targets_mean": 6139.3, "valid_targets_min": 2570 }, { "epoch": 1.7363344051446945, "grad_norm": 0.4082778737016427, "learning_rate": 3.740013399624517e-05, "loss": 0.2506, "loss_nan_ranks": 0, "loss_rank_avg": 0.24455204606056213, "step": 1080, "valid_targets_mean": 6807.5, "valid_targets_min": 3321 }, { "epoch": 1.7443729903536977, "grad_norm": 0.5211692720816377, "learning_rate": 3.7360460557601606e-05, "loss": 0.2654, "loss_nan_ranks": 0, "loss_rank_avg": 0.22724205255508423, "step": 1085, "valid_targets_mean": 4765.9, "valid_targets_min": 1461 }, { "epoch": 1.752411575562701, "grad_norm": 0.41530096966623775, "learning_rate": 3.732050807568878e-05, "loss": 0.2324, "loss_nan_ranks": 0, "loss_rank_avg": 0.2500365972518921, "step": 1090, "valid_targets_mean": 6449.4, "valid_targets_min": 2058 }, { "epoch": 1.760450160771704, "grad_norm": 0.4110566935959379, "learning_rate": 3.728027719268269e-05, "loss": 0.2664, "loss_nan_ranks": 0, "loss_rank_avg": 0.20658278465270996, "step": 1095, "valid_targets_mean": 5735.3, "valid_targets_min": 732 }, { "epoch": 1.7684887459807075, "grad_norm": 0.4496533892795101, "learning_rate": 3.723976855523422e-05, "loss": 0.2558, "loss_nan_ranks": 0, "loss_rank_avg": 0.25664013624191284, "step": 1100, "valid_targets_mean": 5087.9, "valid_targets_min": 424 }, { "epoch": 1.7765273311897105, "grad_norm": 0.43245947505535154, "learning_rate": 3.719898281445874e-05, "loss": 0.2411, "loss_nan_ranks": 0, "loss_rank_avg": 0.21936315298080444, "step": 1105, "valid_targets_mean": 5918.4, "valid_targets_min": 1393 }, { "epoch": 1.784565916398714, "grad_norm": 0.4858462448376596, "learning_rate": 3.7157920625925635e-05, "loss": 0.2701, "loss_nan_ranks": 0, "loss_rank_avg": 0.2447369545698166, "step": 1110, "valid_targets_mean": 5035.6, "valid_targets_min": 306 }, { "epoch": 1.792604501607717, "grad_norm": 0.46070258121147467, "learning_rate": 3.711658264964776e-05, "loss": 0.2632, "loss_nan_ranks": 0, "loss_rank_avg": 0.2854937016963959, "step": 1115, "valid_targets_mean": 5777.2, "valid_targets_min": 1674 }, { "epoch": 1.8006430868167203, "grad_norm": 0.5098752084264075, "learning_rate": 3.7074969550070875e-05, "loss": 0.2441, "loss_nan_ranks": 0, "loss_rank_avg": 0.20868563652038574, "step": 1120, "valid_targets_mean": 4280.9, "valid_targets_min": 1278 }, { "epoch": 1.8086816720257235, "grad_norm": 0.5023676700932536, "learning_rate": 3.7033081996062896e-05, "loss": 0.2478, "loss_nan_ranks": 0, "loss_rank_avg": 0.19911417365074158, "step": 1125, "valid_targets_mean": 4927.6, "valid_targets_min": 413 }, { "epoch": 1.8167202572347267, "grad_norm": 0.4777981723842262, "learning_rate": 3.6990920660903196e-05, "loss": 0.2699, "loss_nan_ranks": 0, "loss_rank_avg": 0.26569002866744995, "step": 1130, "valid_targets_mean": 5073.6, "valid_targets_min": 677 }, { "epoch": 1.82475884244373, "grad_norm": 0.405932778909337, "learning_rate": 3.6948486222271775e-05, "loss": 0.2692, "loss_nan_ranks": 0, "loss_rank_avg": 0.23919036984443665, "step": 1135, "valid_targets_mean": 5587.4, "valid_targets_min": 1803 }, { "epoch": 1.832797427652733, "grad_norm": 0.5069414169140095, "learning_rate": 3.690577936223835e-05, "loss": 0.2634, "loss_nan_ranks": 0, "loss_rank_avg": 0.27143096923828125, "step": 1140, "valid_targets_mean": 5159.4, "valid_targets_min": 478 }, { "epoch": 1.8408360128617365, "grad_norm": 0.4527435917730049, "learning_rate": 3.686280076725141e-05, "loss": 0.2679, "loss_nan_ranks": 0, "loss_rank_avg": 0.2778286337852478, "step": 1145, "valid_targets_mean": 5918.1, "valid_targets_min": 3434 }, { "epoch": 1.8488745980707395, "grad_norm": 0.4865490947207327, "learning_rate": 3.6819551128127165e-05, "loss": 0.2582, "loss_nan_ranks": 0, "loss_rank_avg": 0.24340906739234924, "step": 1150, "valid_targets_mean": 4307.2, "valid_targets_min": 319 }, { "epoch": 1.8569131832797428, "grad_norm": 0.47010193702456116, "learning_rate": 3.677603114003846e-05, "loss": 0.2509, "loss_nan_ranks": 0, "loss_rank_avg": 0.2454727590084076, "step": 1155, "valid_targets_mean": 5215.7, "valid_targets_min": 636 }, { "epoch": 1.864951768488746, "grad_norm": 0.44641315970979795, "learning_rate": 3.673224150250358e-05, "loss": 0.2623, "loss_nan_ranks": 0, "loss_rank_avg": 0.22875937819480896, "step": 1160, "valid_targets_mean": 5781.1, "valid_targets_min": 1309 }, { "epoch": 1.8729903536977492, "grad_norm": 0.431723088241146, "learning_rate": 3.6688182919375046e-05, "loss": 0.2397, "loss_nan_ranks": 0, "loss_rank_avg": 0.23499958217144012, "step": 1165, "valid_targets_mean": 6213.2, "valid_targets_min": 4048 }, { "epoch": 1.8810289389067525, "grad_norm": 0.4482594154633358, "learning_rate": 3.664385609882825e-05, "loss": 0.2609, "loss_nan_ranks": 0, "loss_rank_avg": 0.2637123763561249, "step": 1170, "valid_targets_mean": 5742.7, "valid_targets_min": 2334 }, { "epoch": 1.8890675241157555, "grad_norm": 0.46395903411691025, "learning_rate": 3.659926175335009e-05, "loss": 0.2445, "loss_nan_ranks": 0, "loss_rank_avg": 0.267189085483551, "step": 1175, "valid_targets_mean": 5911.4, "valid_targets_min": 1800 }, { "epoch": 1.897106109324759, "grad_norm": 0.487503842139191, "learning_rate": 3.655440059972755e-05, "loss": 0.2479, "loss_nan_ranks": 0, "loss_rank_avg": 0.2147846221923828, "step": 1180, "valid_targets_mean": 4204.1, "valid_targets_min": 355 }, { "epoch": 1.905144694533762, "grad_norm": 0.5590050907024217, "learning_rate": 3.650927335903614e-05, "loss": 0.258, "loss_nan_ranks": 0, "loss_rank_avg": 0.25826340913772583, "step": 1185, "valid_targets_mean": 5233.5, "valid_targets_min": 2790 }, { "epoch": 1.9131832797427653, "grad_norm": 0.5172485408806574, "learning_rate": 3.646388075662832e-05, "loss": 0.2538, "loss_nan_ranks": 0, "loss_rank_avg": 0.2364274263381958, "step": 1190, "valid_targets_mean": 3912.8, "valid_targets_min": 594 }, { "epoch": 1.9212218649517685, "grad_norm": 0.47682543135007205, "learning_rate": 3.6418223522121835e-05, "loss": 0.2408, "loss_nan_ranks": 0, "loss_rank_avg": 0.3126181960105896, "step": 1195, "valid_targets_mean": 6203.2, "valid_targets_min": 3521 }, { "epoch": 1.9292604501607717, "grad_norm": 0.4332316218299991, "learning_rate": 3.6372302389388e-05, "loss": 0.2602, "loss_nan_ranks": 0, "loss_rank_avg": 0.23799636960029602, "step": 1200, "valid_targets_mean": 6120.1, "valid_targets_min": 1830 }, { "epoch": 1.937299035369775, "grad_norm": 0.6921991264155489, "learning_rate": 3.632611809653991e-05, "loss": 0.2494, "loss_nan_ranks": 0, "loss_rank_avg": 0.23573598265647888, "step": 1205, "valid_targets_mean": 5838.8, "valid_targets_min": 1781 }, { "epoch": 1.945337620578778, "grad_norm": 0.4531182795153632, "learning_rate": 3.627967138592052e-05, "loss": 0.2572, "loss_nan_ranks": 0, "loss_rank_avg": 0.3050065040588379, "step": 1210, "valid_targets_mean": 5898.8, "valid_targets_min": 3244 }, { "epoch": 1.9533762057877815, "grad_norm": 0.5163483143343605, "learning_rate": 3.6232963004090806e-05, "loss": 0.2556, "loss_nan_ranks": 0, "loss_rank_avg": 0.29905956983566284, "step": 1215, "valid_targets_mean": 5265.6, "valid_targets_min": 700 }, { "epoch": 1.9614147909967845, "grad_norm": 0.46818084772289176, "learning_rate": 3.6185993701817676e-05, "loss": 0.2411, "loss_nan_ranks": 0, "loss_rank_avg": 0.250349760055542, "step": 1220, "valid_targets_mean": 5315.4, "valid_targets_min": 363 }, { "epoch": 1.9694533762057878, "grad_norm": 0.4220431966160426, "learning_rate": 3.613876423406197e-05, "loss": 0.2566, "loss_nan_ranks": 0, "loss_rank_avg": 0.2675197720527649, "step": 1225, "valid_targets_mean": 6162.6, "valid_targets_min": 2403 }, { "epoch": 1.977491961414791, "grad_norm": 0.6178589423180992, "learning_rate": 3.609127535996628e-05, "loss": 0.2591, "loss_nan_ranks": 0, "loss_rank_avg": 0.2850725054740906, "step": 1230, "valid_targets_mean": 5503.9, "valid_targets_min": 2166 }, { "epoch": 1.9855305466237942, "grad_norm": 0.40980310008162896, "learning_rate": 3.604352784284276e-05, "loss": 0.2432, "loss_nan_ranks": 0, "loss_rank_avg": 0.28403544425964355, "step": 1235, "valid_targets_mean": 6754.5, "valid_targets_min": 877 }, { "epoch": 1.9935691318327975, "grad_norm": 0.4415011119338401, "learning_rate": 3.5995522450160876e-05, "loss": 0.2848, "loss_nan_ranks": 0, "loss_rank_avg": 0.26181045174598694, "step": 1240, "valid_targets_mean": 6086.8, "valid_targets_min": 2879 }, { "epoch": 2.0016077170418005, "grad_norm": 0.5052011649335046, "learning_rate": 3.594725995353504e-05, "loss": 0.2531, "loss_nan_ranks": 0, "loss_rank_avg": 0.2215358167886734, "step": 1245, "valid_targets_mean": 4575.7, "valid_targets_min": 671 }, { "epoch": 2.009646302250804, "grad_norm": 0.49499392194788194, "learning_rate": 3.589874112871225e-05, "loss": 0.2352, "loss_nan_ranks": 0, "loss_rank_avg": 0.2807163596153259, "step": 1250, "valid_targets_mean": 6068.4, "valid_targets_min": 2833 }, { "epoch": 2.017684887459807, "grad_norm": 0.5037101851458272, "learning_rate": 3.584996675555956e-05, "loss": 0.2479, "loss_nan_ranks": 0, "loss_rank_avg": 0.20071212947368622, "step": 1255, "valid_targets_mean": 4558.1, "valid_targets_min": 364 }, { "epoch": 2.0257234726688105, "grad_norm": 0.5288682410650701, "learning_rate": 3.58009376180516e-05, "loss": 0.2365, "loss_nan_ranks": 0, "loss_rank_avg": 0.22459709644317627, "step": 1260, "valid_targets_mean": 4271.1, "valid_targets_min": 1686 }, { "epoch": 2.0337620578778135, "grad_norm": 0.4909968616058714, "learning_rate": 3.575165450425795e-05, "loss": 0.2421, "loss_nan_ranks": 0, "loss_rank_avg": 0.27638089656829834, "step": 1265, "valid_targets_mean": 5826.1, "valid_targets_min": 2544 }, { "epoch": 2.0418006430868165, "grad_norm": 0.501900908160109, "learning_rate": 3.5702118206330464e-05, "loss": 0.2281, "loss_nan_ranks": 0, "loss_rank_avg": 0.24548184871673584, "step": 1270, "valid_targets_mean": 5093.1, "valid_targets_min": 839 }, { "epoch": 2.04983922829582, "grad_norm": 0.4734765195442351, "learning_rate": 3.565232952049057e-05, "loss": 0.2469, "loss_nan_ranks": 0, "loss_rank_avg": 0.24846141040325165, "step": 1275, "valid_targets_mean": 5822.4, "valid_targets_min": 2417 }, { "epoch": 2.057877813504823, "grad_norm": 0.45203540694484684, "learning_rate": 3.560228924701644e-05, "loss": 0.237, "loss_nan_ranks": 0, "loss_rank_avg": 0.23629529774188995, "step": 1280, "valid_targets_mean": 7071.5, "valid_targets_min": 4493 }, { "epoch": 2.0659163987138265, "grad_norm": 0.48899278419104575, "learning_rate": 3.555199819023013e-05, "loss": 0.2404, "loss_nan_ranks": 0, "loss_rank_avg": 0.24547456204891205, "step": 1285, "valid_targets_mean": 5600.9, "valid_targets_min": 1454 }, { "epoch": 2.0739549839228295, "grad_norm": 0.6019858773966105, "learning_rate": 3.5501457158484684e-05, "loss": 0.2537, "loss_nan_ranks": 0, "loss_rank_avg": 0.2651026248931885, "step": 1290, "valid_targets_mean": 4568.3, "valid_targets_min": 977 }, { "epoch": 2.081993569131833, "grad_norm": 0.5664362773624191, "learning_rate": 3.545066696415109e-05, "loss": 0.2166, "loss_nan_ranks": 0, "loss_rank_avg": 0.21541890501976013, "step": 1295, "valid_targets_mean": 4279.4, "valid_targets_min": 591 }, { "epoch": 2.090032154340836, "grad_norm": 0.48714257423252616, "learning_rate": 3.5399628423605286e-05, "loss": 0.2328, "loss_nan_ranks": 0, "loss_rank_avg": 0.20423497259616852, "step": 1300, "valid_targets_mean": 4730.8, "valid_targets_min": 1985 }, { "epoch": 2.098070739549839, "grad_norm": 0.5673114735609058, "learning_rate": 3.534834235721495e-05, "loss": 0.2384, "loss_nan_ranks": 0, "loss_rank_avg": 0.3088694214820862, "step": 1305, "valid_targets_mean": 6417.6, "valid_targets_min": 2499 }, { "epoch": 2.1061093247588425, "grad_norm": 0.5072612807927125, "learning_rate": 3.5296809589326414e-05, "loss": 0.2505, "loss_nan_ranks": 0, "loss_rank_avg": 0.27511778473854065, "step": 1310, "valid_targets_mean": 5805.1, "valid_targets_min": 2166 }, { "epoch": 2.1141479099678455, "grad_norm": 0.4887778350157169, "learning_rate": 3.524503094825134e-05, "loss": 0.2425, "loss_nan_ranks": 0, "loss_rank_avg": 0.29525697231292725, "step": 1315, "valid_targets_mean": 5837.6, "valid_targets_min": 3211 }, { "epoch": 2.122186495176849, "grad_norm": 0.4682327210334639, "learning_rate": 3.5193007266253436e-05, "loss": 0.2359, "loss_nan_ranks": 0, "loss_rank_avg": 0.25870102643966675, "step": 1320, "valid_targets_mean": 5548.1, "valid_targets_min": 2741 }, { "epoch": 2.130225080385852, "grad_norm": 0.4289895984990567, "learning_rate": 3.514073937953507e-05, "loss": 0.2474, "loss_nan_ranks": 0, "loss_rank_avg": 0.23811715841293335, "step": 1325, "valid_targets_mean": 5777.2, "valid_targets_min": 2849 }, { "epoch": 2.1382636655948555, "grad_norm": 0.465702346096192, "learning_rate": 3.508822812822384e-05, "loss": 0.2317, "loss_nan_ranks": 0, "loss_rank_avg": 0.25546348094940186, "step": 1330, "valid_targets_mean": 5231.3, "valid_targets_min": 351 }, { "epoch": 2.1463022508038585, "grad_norm": 0.46068575075324203, "learning_rate": 3.503547435635906e-05, "loss": 0.2397, "loss_nan_ranks": 0, "loss_rank_avg": 0.22912633419036865, "step": 1335, "valid_targets_mean": 5305.3, "valid_targets_min": 450 }, { "epoch": 2.154340836012862, "grad_norm": 0.5793563972286564, "learning_rate": 3.4982478911878204e-05, "loss": 0.2414, "loss_nan_ranks": 0, "loss_rank_avg": 0.25946539640426636, "step": 1340, "valid_targets_mean": 6271.1, "valid_targets_min": 355 }, { "epoch": 2.162379421221865, "grad_norm": 0.4321108762119069, "learning_rate": 3.492924264660326e-05, "loss": 0.2168, "loss_nan_ranks": 0, "loss_rank_avg": 0.21115905046463013, "step": 1345, "valid_targets_mean": 5771.3, "valid_targets_min": 1986 }, { "epoch": 2.170418006430868, "grad_norm": 0.47291052827659313, "learning_rate": 3.4875766416227046e-05, "loss": 0.2388, "loss_nan_ranks": 0, "loss_rank_avg": 0.22496125102043152, "step": 1350, "valid_targets_mean": 4972.3, "valid_targets_min": 3309 }, { "epoch": 2.1784565916398715, "grad_norm": 0.43470423287906323, "learning_rate": 3.4822051080299475e-05, "loss": 0.2284, "loss_nan_ranks": 0, "loss_rank_avg": 0.20437441766262054, "step": 1355, "valid_targets_mean": 6334.6, "valid_targets_min": 2286 }, { "epoch": 2.1864951768488745, "grad_norm": 0.46020505480546187, "learning_rate": 3.47680975022137e-05, "loss": 0.2321, "loss_nan_ranks": 0, "loss_rank_avg": 0.20249639451503754, "step": 1360, "valid_targets_mean": 5926.2, "valid_targets_min": 2284 }, { "epoch": 2.194533762057878, "grad_norm": 0.4305391092246054, "learning_rate": 3.471390654919226e-05, "loss": 0.2187, "loss_nan_ranks": 0, "loss_rank_avg": 0.21444851160049438, "step": 1365, "valid_targets_mean": 5687.1, "valid_targets_min": 1717 }, { "epoch": 2.202572347266881, "grad_norm": 0.43458160830767617, "learning_rate": 3.4659479092273165e-05, "loss": 0.2527, "loss_nan_ranks": 0, "loss_rank_avg": 0.21879488229751587, "step": 1370, "valid_targets_mean": 5867.4, "valid_targets_min": 1288 }, { "epoch": 2.210610932475884, "grad_norm": 0.47071088104561204, "learning_rate": 3.460481600629584e-05, "loss": 0.2231, "loss_nan_ranks": 0, "loss_rank_avg": 0.22845019400119781, "step": 1375, "valid_targets_mean": 5171.8, "valid_targets_min": 889 }, { "epoch": 2.2186495176848875, "grad_norm": 0.5187891419112453, "learning_rate": 3.4549918169887117e-05, "loss": 0.2361, "loss_nan_ranks": 0, "loss_rank_avg": 0.21421794593334198, "step": 1380, "valid_targets_mean": 4998.8, "valid_targets_min": 889 }, { "epoch": 2.2266881028938905, "grad_norm": 0.5234262982245236, "learning_rate": 3.4494786465447046e-05, "loss": 0.2122, "loss_nan_ranks": 0, "loss_rank_avg": 0.25294065475463867, "step": 1385, "valid_targets_mean": 5855.6, "valid_targets_min": 2768 }, { "epoch": 2.234726688102894, "grad_norm": 0.5321562652327939, "learning_rate": 3.44394217791348e-05, "loss": 0.2434, "loss_nan_ranks": 0, "loss_rank_avg": 0.24745520949363708, "step": 1390, "valid_targets_mean": 4331.7, "valid_targets_min": 671 }, { "epoch": 2.242765273311897, "grad_norm": 0.4615900367652738, "learning_rate": 3.438382500085437e-05, "loss": 0.2279, "loss_nan_ranks": 0, "loss_rank_avg": 0.2429751455783844, "step": 1395, "valid_targets_mean": 5807.1, "valid_targets_min": 3494 }, { "epoch": 2.2508038585209005, "grad_norm": 0.48836390162778914, "learning_rate": 3.432799702424026e-05, "loss": 0.2289, "loss_nan_ranks": 0, "loss_rank_avg": 0.2340126484632492, "step": 1400, "valid_targets_mean": 4863.4, "valid_targets_min": 831 }, { "epoch": 2.2588424437299035, "grad_norm": 0.4992916459755242, "learning_rate": 3.427193874664316e-05, "loss": 0.2345, "loss_nan_ranks": 0, "loss_rank_avg": 0.2595020532608032, "step": 1405, "valid_targets_mean": 5894.4, "valid_targets_min": 2328 }, { "epoch": 2.266881028938907, "grad_norm": 0.48577187074590183, "learning_rate": 3.421565106911549e-05, "loss": 0.2608, "loss_nan_ranks": 0, "loss_rank_avg": 0.23440846800804138, "step": 1410, "valid_targets_mean": 4556.2, "valid_targets_min": 2277 }, { "epoch": 2.27491961414791, "grad_norm": 0.5013796741612716, "learning_rate": 3.4159134896396926e-05, "loss": 0.2323, "loss_nan_ranks": 0, "loss_rank_avg": 0.221354141831398, "step": 1415, "valid_targets_mean": 5789.2, "valid_targets_min": 555 }, { "epoch": 2.282958199356913, "grad_norm": 0.49298535713537966, "learning_rate": 3.410239113689988e-05, "loss": 0.2368, "loss_nan_ranks": 0, "loss_rank_avg": 0.23821865022182465, "step": 1420, "valid_targets_mean": 5011.8, "valid_targets_min": 1665 }, { "epoch": 2.2909967845659165, "grad_norm": 0.4626416750757732, "learning_rate": 3.4045420702694846e-05, "loss": 0.2261, "loss_nan_ranks": 0, "loss_rank_avg": 0.22496405243873596, "step": 1425, "valid_targets_mean": 5377.4, "valid_targets_min": 1255 }, { "epoch": 2.2990353697749195, "grad_norm": 0.4296716912834519, "learning_rate": 3.398822450949581e-05, "loss": 0.2485, "loss_nan_ranks": 0, "loss_rank_avg": 0.23885153234004974, "step": 1430, "valid_targets_mean": 6061.9, "valid_targets_min": 3491 }, { "epoch": 2.307073954983923, "grad_norm": 0.47636710237452873, "learning_rate": 3.393080347664547e-05, "loss": 0.2267, "loss_nan_ranks": 0, "loss_rank_avg": 0.2698220908641815, "step": 1435, "valid_targets_mean": 6900.9, "valid_targets_min": 2064 }, { "epoch": 2.315112540192926, "grad_norm": 0.41767354690125497, "learning_rate": 3.3873158527100476e-05, "loss": 0.2306, "loss_nan_ranks": 0, "loss_rank_avg": 0.2261713743209839, "step": 1440, "valid_targets_mean": 6009.2, "valid_targets_min": 954 }, { "epoch": 2.323151125401929, "grad_norm": 0.45765199576612026, "learning_rate": 3.381529058741662e-05, "loss": 0.2259, "loss_nan_ranks": 0, "loss_rank_avg": 0.19748841226100922, "step": 1445, "valid_targets_mean": 4535.4, "valid_targets_min": 763 }, { "epoch": 2.3311897106109325, "grad_norm": 0.512506152526694, "learning_rate": 3.375720058773393e-05, "loss": 0.2433, "loss_nan_ranks": 0, "loss_rank_avg": 0.21968387067317963, "step": 1450, "valid_targets_mean": 4926.1, "valid_targets_min": 793 }, { "epoch": 2.3392282958199355, "grad_norm": 0.4272765943955022, "learning_rate": 3.369888946176169e-05, "loss": 0.2214, "loss_nan_ranks": 0, "loss_rank_avg": 0.2100493162870407, "step": 1455, "valid_targets_mean": 6448.4, "valid_targets_min": 1340 }, { "epoch": 2.347266881028939, "grad_norm": 0.4563671696414422, "learning_rate": 3.364035814676348e-05, "loss": 0.2452, "loss_nan_ranks": 0, "loss_rank_avg": 0.2688789665699005, "step": 1460, "valid_targets_mean": 5684.4, "valid_targets_min": 696 }, { "epoch": 2.355305466237942, "grad_norm": 0.4324693505868682, "learning_rate": 3.358160758354207e-05, "loss": 0.2367, "loss_nan_ranks": 0, "loss_rank_avg": 0.23381435871124268, "step": 1465, "valid_targets_mean": 5994.9, "valid_targets_min": 3248 }, { "epoch": 2.3633440514469455, "grad_norm": 0.4759857152996837, "learning_rate": 3.352263871642431e-05, "loss": 0.233, "loss_nan_ranks": 0, "loss_rank_avg": 0.22635474801063538, "step": 1470, "valid_targets_mean": 5392.4, "valid_targets_min": 2033 }, { "epoch": 2.3713826366559485, "grad_norm": 0.4884246901728015, "learning_rate": 3.346345249324599e-05, "loss": 0.2277, "loss_nan_ranks": 0, "loss_rank_avg": 0.21876902878284454, "step": 1475, "valid_targets_mean": 4432.8, "valid_targets_min": 1507 }, { "epoch": 2.379421221864952, "grad_norm": 0.4330099288850315, "learning_rate": 3.340404986533654e-05, "loss": 0.2428, "loss_nan_ranks": 0, "loss_rank_avg": 0.23252514004707336, "step": 1480, "valid_targets_mean": 6527.4, "valid_targets_min": 3722 }, { "epoch": 2.387459807073955, "grad_norm": 0.45464353022352455, "learning_rate": 3.334443178750378e-05, "loss": 0.2318, "loss_nan_ranks": 0, "loss_rank_avg": 0.21697625517845154, "step": 1485, "valid_targets_mean": 4793.3, "valid_targets_min": 700 }, { "epoch": 2.395498392282958, "grad_norm": 0.4068622119059787, "learning_rate": 3.328459921801855e-05, "loss": 0.2364, "loss_nan_ranks": 0, "loss_rank_avg": 0.201742023229599, "step": 1490, "valid_targets_mean": 5870.1, "valid_targets_min": 2359 }, { "epoch": 2.4035369774919615, "grad_norm": 0.4122118914595108, "learning_rate": 3.322455311859936e-05, "loss": 0.2457, "loss_nan_ranks": 0, "loss_rank_avg": 0.2373337745666504, "step": 1495, "valid_targets_mean": 6573.8, "valid_targets_min": 2667 }, { "epoch": 2.4115755627009645, "grad_norm": 0.5745692612063069, "learning_rate": 3.316429445439684e-05, "loss": 0.2459, "loss_nan_ranks": 0, "loss_rank_avg": 0.24043476581573486, "step": 1500, "valid_targets_mean": 6095.8, "valid_targets_min": 2709 }, { "epoch": 2.419614147909968, "grad_norm": 0.454172764523821, "learning_rate": 3.310382419397832e-05, "loss": 0.219, "loss_nan_ranks": 0, "loss_rank_avg": 0.22647792100906372, "step": 1505, "valid_targets_mean": 5380.6, "valid_targets_min": 554 }, { "epoch": 2.427652733118971, "grad_norm": 0.45495338149369174, "learning_rate": 3.30431433093122e-05, "loss": 0.2531, "loss_nan_ranks": 0, "loss_rank_avg": 0.2454707771539688, "step": 1510, "valid_targets_mean": 5483.3, "valid_targets_min": 2993 }, { "epoch": 2.435691318327974, "grad_norm": 0.41609998478720306, "learning_rate": 3.298225277575235e-05, "loss": 0.2363, "loss_nan_ranks": 0, "loss_rank_avg": 0.2000729739665985, "step": 1515, "valid_targets_mean": 5734.8, "valid_targets_min": 395 }, { "epoch": 2.4437299035369775, "grad_norm": 0.4628501255715947, "learning_rate": 3.292115357202244e-05, "loss": 0.2505, "loss_nan_ranks": 0, "loss_rank_avg": 0.2211766541004181, "step": 1520, "valid_targets_mean": 5731.4, "valid_targets_min": 2463 }, { "epoch": 2.4517684887459805, "grad_norm": 0.48247050262549374, "learning_rate": 3.285984668020019e-05, "loss": 0.2265, "loss_nan_ranks": 0, "loss_rank_avg": 0.2340318262577057, "step": 1525, "valid_targets_mean": 5772.2, "valid_targets_min": 2556 }, { "epoch": 2.459807073954984, "grad_norm": 0.4090879734351391, "learning_rate": 3.27983330857016e-05, "loss": 0.2251, "loss_nan_ranks": 0, "loss_rank_avg": 0.20760081708431244, "step": 1530, "valid_targets_mean": 6043.8, "valid_targets_min": 2831 }, { "epoch": 2.467845659163987, "grad_norm": 0.46193519580530734, "learning_rate": 3.2736613777265076e-05, "loss": 0.214, "loss_nan_ranks": 0, "loss_rank_avg": 0.18691232800483704, "step": 1535, "valid_targets_mean": 4827.1, "valid_targets_min": 2611 }, { "epoch": 2.4758842443729905, "grad_norm": 0.4790816763532421, "learning_rate": 3.2674689746935626e-05, "loss": 0.2416, "loss_nan_ranks": 0, "loss_rank_avg": 0.24825897812843323, "step": 1540, "valid_targets_mean": 4753.2, "valid_targets_min": 2313 }, { "epoch": 2.4839228295819935, "grad_norm": 0.4274916395823709, "learning_rate": 3.261256199004879e-05, "loss": 0.2336, "loss_nan_ranks": 0, "loss_rank_avg": 0.19343507289886475, "step": 1545, "valid_targets_mean": 5236.5, "valid_targets_min": 1379 }, { "epoch": 2.491961414790997, "grad_norm": 0.462266180497401, "learning_rate": 3.255023150521474e-05, "loss": 0.2492, "loss_nan_ranks": 0, "loss_rank_avg": 0.22728748619556427, "step": 1550, "valid_targets_mean": 5430.7, "valid_targets_min": 3000 }, { "epoch": 2.5, "grad_norm": 0.4876609578778693, "learning_rate": 3.2487699294302195e-05, "loss": 0.2333, "loss_nan_ranks": 0, "loss_rank_avg": 0.24499937891960144, "step": 1555, "valid_targets_mean": 5483.6, "valid_targets_min": 368 }, { "epoch": 2.508038585209003, "grad_norm": 0.42431584453451293, "learning_rate": 3.242496636242231e-05, "loss": 0.2274, "loss_nan_ranks": 0, "loss_rank_avg": 0.23072059452533722, "step": 1560, "valid_targets_mean": 5792.4, "valid_targets_min": 2293 }, { "epoch": 2.5160771704180065, "grad_norm": 0.48288970283703386, "learning_rate": 3.236203371791252e-05, "loss": 0.2244, "loss_nan_ranks": 0, "loss_rank_avg": 0.21728533506393433, "step": 1565, "valid_targets_mean": 5067.8, "valid_targets_min": 922 }, { "epoch": 2.5241157556270095, "grad_norm": 0.48817034020969907, "learning_rate": 3.2298902372320354e-05, "loss": 0.2511, "loss_nan_ranks": 0, "loss_rank_avg": 0.2375354766845703, "step": 1570, "valid_targets_mean": 4957.4, "valid_targets_min": 424 }, { "epoch": 2.532154340836013, "grad_norm": 0.38867992655742173, "learning_rate": 3.2235573340387155e-05, "loss": 0.2073, "loss_nan_ranks": 0, "loss_rank_avg": 0.17898300290107727, "step": 1575, "valid_targets_mean": 5888.5, "valid_targets_min": 2584 }, { "epoch": 2.540192926045016, "grad_norm": 0.430940952546417, "learning_rate": 3.2172047640031774e-05, "loss": 0.2352, "loss_nan_ranks": 0, "loss_rank_avg": 0.22751542925834656, "step": 1580, "valid_targets_mean": 5754.3, "valid_targets_min": 1931 }, { "epoch": 2.548231511254019, "grad_norm": 0.4815894601905835, "learning_rate": 3.210832629233421e-05, "loss": 0.2415, "loss_nan_ranks": 0, "loss_rank_avg": 0.2273508906364441, "step": 1585, "valid_targets_mean": 5406.9, "valid_targets_min": 790 }, { "epoch": 2.5562700964630225, "grad_norm": 0.6068676978104833, "learning_rate": 3.204441032151921e-05, "loss": 0.2364, "loss_nan_ranks": 0, "loss_rank_avg": 0.21523119509220123, "step": 1590, "valid_targets_mean": 5741.2, "valid_targets_min": 2231 }, { "epoch": 2.564308681672026, "grad_norm": 0.5223510328320911, "learning_rate": 3.198030075493979e-05, "loss": 0.2448, "loss_nan_ranks": 0, "loss_rank_avg": 0.26558348536491394, "step": 1595, "valid_targets_mean": 5132.1, "valid_targets_min": 1019 }, { "epoch": 2.572347266881029, "grad_norm": 0.60222440656527, "learning_rate": 3.19159986230607e-05, "loss": 0.2435, "loss_nan_ranks": 0, "loss_rank_avg": 0.1857927143573761, "step": 1600, "valid_targets_mean": 4652.8, "valid_targets_min": 1007 }, { "epoch": 2.580385852090032, "grad_norm": 0.45369146995792226, "learning_rate": 3.185150495944194e-05, "loss": 0.2128, "loss_nan_ranks": 0, "loss_rank_avg": 0.203944593667984, "step": 1605, "valid_targets_mean": 5606.6, "valid_targets_min": 594 }, { "epoch": 2.5884244372990355, "grad_norm": 0.44158984490213105, "learning_rate": 3.1786820800722044e-05, "loss": 0.2177, "loss_nan_ranks": 0, "loss_rank_avg": 0.2083684355020523, "step": 1610, "valid_targets_mean": 5581.2, "valid_targets_min": 2542 }, { "epoch": 2.5964630225080385, "grad_norm": 0.3955024073939668, "learning_rate": 3.1721947186601494e-05, "loss": 0.2534, "loss_nan_ranks": 0, "loss_rank_avg": 0.23385578393936157, "step": 1615, "valid_targets_mean": 6655.3, "valid_targets_min": 2377 }, { "epoch": 2.604501607717042, "grad_norm": 0.4448231599721356, "learning_rate": 3.165688515982599e-05, "loss": 0.2279, "loss_nan_ranks": 0, "loss_rank_avg": 0.23172247409820557, "step": 1620, "valid_targets_mean": 5980.2, "valid_targets_min": 2938 }, { "epoch": 2.612540192926045, "grad_norm": 0.43163627602395105, "learning_rate": 3.1591635766169646e-05, "loss": 0.2222, "loss_nan_ranks": 0, "loss_rank_avg": 0.21875952184200287, "step": 1625, "valid_targets_mean": 6797.9, "valid_targets_min": 3875 }, { "epoch": 2.620578778135048, "grad_norm": 0.48035161655460856, "learning_rate": 3.152620005441826e-05, "loss": 0.2256, "loss_nan_ranks": 0, "loss_rank_avg": 0.25188302993774414, "step": 1630, "valid_targets_mean": 5222.1, "valid_targets_min": 872 }, { "epoch": 2.6286173633440515, "grad_norm": 0.47804467495955605, "learning_rate": 3.146057907635238e-05, "loss": 0.2344, "loss_nan_ranks": 0, "loss_rank_avg": 0.23584258556365967, "step": 1635, "valid_targets_mean": 5037.3, "valid_targets_min": 1577 }, { "epoch": 2.6366559485530545, "grad_norm": 0.49724922962510637, "learning_rate": 3.1394773886730447e-05, "loss": 0.217, "loss_nan_ranks": 0, "loss_rank_avg": 0.21783044934272766, "step": 1640, "valid_targets_mean": 5010.2, "valid_targets_min": 2341 }, { "epoch": 2.644694533762058, "grad_norm": 0.47360896933063057, "learning_rate": 3.1328785543271824e-05, "loss": 0.2479, "loss_nan_ranks": 0, "loss_rank_avg": 0.23639383912086487, "step": 1645, "valid_targets_mean": 5103.1, "valid_targets_min": 2430 }, { "epoch": 2.652733118971061, "grad_norm": 0.4425730996552444, "learning_rate": 3.126261510663979e-05, "loss": 0.227, "loss_nan_ranks": 0, "loss_rank_avg": 0.24800364673137665, "step": 1650, "valid_targets_mean": 5471.6, "valid_targets_min": 779 }, { "epoch": 2.660771704180064, "grad_norm": 0.5066362084521983, "learning_rate": 3.119626364042451e-05, "loss": 0.2322, "loss_nan_ranks": 0, "loss_rank_avg": 0.23977752029895782, "step": 1655, "valid_targets_mean": 6356.9, "valid_targets_min": 1168 }, { "epoch": 2.6688102893890675, "grad_norm": 0.46571003694651886, "learning_rate": 3.112973221112591e-05, "loss": 0.2354, "loss_nan_ranks": 0, "loss_rank_avg": 0.23410023748874664, "step": 1660, "valid_targets_mean": 5421.5, "valid_targets_min": 2427 }, { "epoch": 2.676848874598071, "grad_norm": 0.49670167200910814, "learning_rate": 3.106302188813656e-05, "loss": 0.2352, "loss_nan_ranks": 0, "loss_rank_avg": 0.23411546647548676, "step": 1665, "valid_targets_mean": 5066.6, "valid_targets_min": 902 }, { "epoch": 2.684887459807074, "grad_norm": 0.4489042276841892, "learning_rate": 3.099613374372449e-05, "loss": 0.237, "loss_nan_ranks": 0, "loss_rank_avg": 0.2577555179595947, "step": 1670, "valid_targets_mean": 5970.1, "valid_targets_min": 3474 }, { "epoch": 2.692926045016077, "grad_norm": 0.4726499258070017, "learning_rate": 3.092906885301591e-05, "loss": 0.2299, "loss_nan_ranks": 0, "loss_rank_avg": 0.24142785370349884, "step": 1675, "valid_targets_mean": 5035.5, "valid_targets_min": 1983 }, { "epoch": 2.7009646302250805, "grad_norm": 0.45047970317259495, "learning_rate": 3.086182829397799e-05, "loss": 0.2366, "loss_nan_ranks": 0, "loss_rank_avg": 0.21712270379066467, "step": 1680, "valid_targets_mean": 5064.8, "valid_targets_min": 829 }, { "epoch": 2.7090032154340835, "grad_norm": 0.41145712760990627, "learning_rate": 3.07944131474015e-05, "loss": 0.2422, "loss_nan_ranks": 0, "loss_rank_avg": 0.19963139295578003, "step": 1685, "valid_targets_mean": 5160.9, "valid_targets_min": 268 }, { "epoch": 2.717041800643087, "grad_norm": 0.4773923313728519, "learning_rate": 3.072682449688342e-05, "loss": 0.2391, "loss_nan_ranks": 0, "loss_rank_avg": 0.24405084550380707, "step": 1690, "valid_targets_mean": 5581.8, "valid_targets_min": 2920 }, { "epoch": 2.72508038585209, "grad_norm": 0.4376554948889786, "learning_rate": 3.0659063428809574e-05, "loss": 0.2225, "loss_nan_ranks": 0, "loss_rank_avg": 0.2001868635416031, "step": 1695, "valid_targets_mean": 5621.9, "valid_targets_min": 2576 }, { "epoch": 2.733118971061093, "grad_norm": 0.43672581570188307, "learning_rate": 3.059113103233711e-05, "loss": 0.2354, "loss_nan_ranks": 0, "loss_rank_avg": 0.20036949217319489, "step": 1700, "valid_targets_mean": 5967.9, "valid_targets_min": 1912 }, { "epoch": 2.7411575562700965, "grad_norm": 0.4890236832710162, "learning_rate": 3.052302839937706e-05, "loss": 0.2239, "loss_nan_ranks": 0, "loss_rank_avg": 0.23596787452697754, "step": 1705, "valid_targets_mean": 5446.7, "valid_targets_min": 3308 }, { "epoch": 2.7491961414790995, "grad_norm": 0.4635500560051159, "learning_rate": 3.045475662457671e-05, "loss": 0.2384, "loss_nan_ranks": 0, "loss_rank_avg": 0.24793817102909088, "step": 1710, "valid_targets_mean": 5555.2, "valid_targets_min": 1492 }, { "epoch": 2.757234726688103, "grad_norm": 0.4427640364687355, "learning_rate": 3.0386316805302064e-05, "loss": 0.2441, "loss_nan_ranks": 0, "loss_rank_avg": 0.22127273678779602, "step": 1715, "valid_targets_mean": 5390.1, "valid_targets_min": 2559 }, { "epoch": 2.765273311897106, "grad_norm": 0.4442190835436434, "learning_rate": 3.0317710041620194e-05, "loss": 0.2289, "loss_nan_ranks": 0, "loss_rank_avg": 0.2600225806236267, "step": 1720, "valid_targets_mean": 6436.2, "valid_targets_min": 675 }, { "epoch": 2.7733118971061095, "grad_norm": 0.42238676851093976, "learning_rate": 3.024893743628154e-05, "loss": 0.2208, "loss_nan_ranks": 0, "loss_rank_avg": 0.20658443868160248, "step": 1725, "valid_targets_mean": 5774.4, "valid_targets_min": 1262 }, { "epoch": 2.7813504823151125, "grad_norm": 0.42021767660168513, "learning_rate": 3.018000009470222e-05, "loss": 0.2234, "loss_nan_ranks": 0, "loss_rank_avg": 0.21164314448833466, "step": 1730, "valid_targets_mean": 5540.8, "valid_targets_min": 514 }, { "epoch": 2.789389067524116, "grad_norm": 0.4630792997560636, "learning_rate": 3.0110899124946203e-05, "loss": 0.2401, "loss_nan_ranks": 0, "loss_rank_avg": 0.24036768078804016, "step": 1735, "valid_targets_mean": 5809.8, "valid_targets_min": 2003 }, { "epoch": 2.797427652733119, "grad_norm": 0.5390343017669323, "learning_rate": 3.004163563770756e-05, "loss": 0.237, "loss_nan_ranks": 0, "loss_rank_avg": 0.18927526473999023, "step": 1740, "valid_targets_mean": 5524.0, "valid_targets_min": 413 }, { "epoch": 2.805466237942122, "grad_norm": 0.506037679439928, "learning_rate": 2.9972210746292593e-05, "loss": 0.2373, "loss_nan_ranks": 0, "loss_rank_avg": 0.2753189206123352, "step": 1745, "valid_targets_mean": 5811.8, "valid_targets_min": 1503 }, { "epoch": 2.8135048231511255, "grad_norm": 0.4477668704765513, "learning_rate": 2.9902625566601896e-05, "loss": 0.2532, "loss_nan_ranks": 0, "loss_rank_avg": 0.2465018332004547, "step": 1750, "valid_targets_mean": 5265.3, "valid_targets_min": 677 }, { "epoch": 2.8215434083601285, "grad_norm": 0.43112747090224235, "learning_rate": 2.9832881217112507e-05, "loss": 0.2195, "loss_nan_ranks": 0, "loss_rank_avg": 0.23881378769874573, "step": 1755, "valid_targets_mean": 5734.8, "valid_targets_min": 2236 }, { "epoch": 2.829581993569132, "grad_norm": 0.43331469697490993, "learning_rate": 2.9762978818859828e-05, "loss": 0.2508, "loss_nan_ranks": 0, "loss_rank_avg": 0.25261190533638, "step": 1760, "valid_targets_mean": 6195.2, "valid_targets_min": 364 }, { "epoch": 2.837620578778135, "grad_norm": 0.49846352204421746, "learning_rate": 2.9692919495419698e-05, "loss": 0.2239, "loss_nan_ranks": 0, "loss_rank_avg": 0.191496804356575, "step": 1765, "valid_targets_mean": 5438.2, "valid_targets_min": 793 }, { "epoch": 2.845659163987138, "grad_norm": 0.40728999160669044, "learning_rate": 2.9622704372890268e-05, "loss": 0.2198, "loss_nan_ranks": 0, "loss_rank_avg": 0.2332020401954651, "step": 1770, "valid_targets_mean": 6247.6, "valid_targets_min": 1709 }, { "epoch": 2.8536977491961415, "grad_norm": 0.44070923563948255, "learning_rate": 2.955233457987393e-05, "loss": 0.2428, "loss_nan_ranks": 0, "loss_rank_avg": 0.27117034792900085, "step": 1775, "valid_targets_mean": 6259.8, "valid_targets_min": 3163 }, { "epoch": 2.861736334405145, "grad_norm": 0.46843718336492085, "learning_rate": 2.9481811247459174e-05, "loss": 0.2283, "loss_nan_ranks": 0, "loss_rank_avg": 0.20232127606868744, "step": 1780, "valid_targets_mean": 4301.2, "valid_targets_min": 877 }, { "epoch": 2.869774919614148, "grad_norm": 0.4811831657791136, "learning_rate": 2.9411135509202407e-05, "loss": 0.2415, "loss_nan_ranks": 0, "loss_rank_avg": 0.22563835978507996, "step": 1785, "valid_targets_mean": 4858.6, "valid_targets_min": 297 }, { "epoch": 2.877813504823151, "grad_norm": 0.4776739267077266, "learning_rate": 2.9340308501109726e-05, "loss": 0.2352, "loss_nan_ranks": 0, "loss_rank_avg": 0.25109878182411194, "step": 1790, "valid_targets_mean": 4963.9, "valid_targets_min": 921 }, { "epoch": 2.8858520900321545, "grad_norm": 0.4552374822125526, "learning_rate": 2.926933136161866e-05, "loss": 0.2522, "loss_nan_ranks": 0, "loss_rank_avg": 0.2678318917751312, "step": 1795, "valid_targets_mean": 6130.4, "valid_targets_min": 1699 }, { "epoch": 2.8938906752411575, "grad_norm": 0.4998597785043118, "learning_rate": 2.919820523157988e-05, "loss": 0.2373, "loss_nan_ranks": 0, "loss_rank_avg": 0.2558537721633911, "step": 1800, "valid_targets_mean": 5725.7, "valid_targets_min": 1049 }, { "epoch": 2.901929260450161, "grad_norm": 0.3985526663408574, "learning_rate": 2.9126931254238856e-05, "loss": 0.2293, "loss_nan_ranks": 0, "loss_rank_avg": 0.22993230819702148, "step": 1805, "valid_targets_mean": 5944.6, "valid_targets_min": 2174 }, { "epoch": 2.909967845659164, "grad_norm": 0.4328617676889273, "learning_rate": 2.905551057521748e-05, "loss": 0.2493, "loss_nan_ranks": 0, "loss_rank_avg": 0.24856430292129517, "step": 1810, "valid_targets_mean": 5760.9, "valid_targets_min": 726 }, { "epoch": 2.918006430868167, "grad_norm": 0.4542317521238959, "learning_rate": 2.898394434249565e-05, "loss": 0.2401, "loss_nan_ranks": 0, "loss_rank_avg": 0.21676376461982727, "step": 1815, "valid_targets_mean": 5277.0, "valid_targets_min": 1775 }, { "epoch": 2.9260450160771705, "grad_norm": 0.4960973232998586, "learning_rate": 2.8912233706392824e-05, "loss": 0.2118, "loss_nan_ranks": 0, "loss_rank_avg": 0.19444525241851807, "step": 1820, "valid_targets_mean": 4628.3, "valid_targets_min": 381 }, { "epoch": 2.9340836012861735, "grad_norm": 0.4351299120886839, "learning_rate": 2.8840379819549515e-05, "loss": 0.2476, "loss_nan_ranks": 0, "loss_rank_avg": 0.22263455390930176, "step": 1825, "valid_targets_mean": 5299.7, "valid_targets_min": 558 }, { "epoch": 2.942122186495177, "grad_norm": 0.47748132373633034, "learning_rate": 2.8768383836908804e-05, "loss": 0.2191, "loss_nan_ranks": 0, "loss_rank_avg": 0.21326063573360443, "step": 1830, "valid_targets_mean": 4476.9, "valid_targets_min": 935 }, { "epoch": 2.95016077170418, "grad_norm": 0.42660596230377495, "learning_rate": 2.8696246915697714e-05, "loss": 0.2137, "loss_nan_ranks": 0, "loss_rank_avg": 0.2128058224916458, "step": 1835, "valid_targets_mean": 5964.4, "valid_targets_min": 2572 }, { "epoch": 2.958199356913183, "grad_norm": 0.4506785970078862, "learning_rate": 2.862397021540867e-05, "loss": 0.2563, "loss_nan_ranks": 0, "loss_rank_avg": 0.26402390003204346, "step": 1840, "valid_targets_mean": 5856.1, "valid_targets_min": 2753 }, { "epoch": 2.9662379421221865, "grad_norm": 0.4391481347976392, "learning_rate": 2.855155489778082e-05, "loss": 0.2341, "loss_nan_ranks": 0, "loss_rank_avg": 0.2654515504837036, "step": 1845, "valid_targets_mean": 5673.1, "valid_targets_min": 1145 }, { "epoch": 2.97427652733119, "grad_norm": 0.4582126351879179, "learning_rate": 2.8479002126781383e-05, "loss": 0.2386, "loss_nan_ranks": 0, "loss_rank_avg": 0.24582958221435547, "step": 1850, "valid_targets_mean": 5058.6, "valid_targets_min": 575 }, { "epoch": 2.982315112540193, "grad_norm": 0.4291403858281957, "learning_rate": 2.8406313068586926e-05, "loss": 0.2339, "loss_nan_ranks": 0, "loss_rank_avg": 0.2569013833999634, "step": 1855, "valid_targets_mean": 6363.9, "valid_targets_min": 1189 }, { "epoch": 2.990353697749196, "grad_norm": 0.4008457746324607, "learning_rate": 2.8333488891564647e-05, "loss": 0.2334, "loss_nan_ranks": 0, "loss_rank_avg": 0.19619405269622803, "step": 1860, "valid_targets_mean": 5793.0, "valid_targets_min": 2157 }, { "epoch": 2.9983922829581995, "grad_norm": 0.42930616673946925, "learning_rate": 2.8260530766253557e-05, "loss": 0.2419, "loss_nan_ranks": 0, "loss_rank_avg": 0.2623644769191742, "step": 1865, "valid_targets_mean": 6299.9, "valid_targets_min": 3015 }, { "epoch": 3.0064308681672025, "grad_norm": 0.38344200812668733, "learning_rate": 2.8187439865345685e-05, "loss": 0.2112, "loss_nan_ranks": 0, "loss_rank_avg": 0.20248943567276, "step": 1870, "valid_targets_mean": 6622.2, "valid_targets_min": 2228 }, { "epoch": 3.014469453376206, "grad_norm": 0.46103181792250764, "learning_rate": 2.8114217363667246e-05, "loss": 0.2079, "loss_nan_ranks": 0, "loss_rank_avg": 0.20105582475662231, "step": 1875, "valid_targets_mean": 5312.6, "valid_targets_min": 2085 }, { "epoch": 3.022508038585209, "grad_norm": 0.4647259314919432, "learning_rate": 2.8040864438159707e-05, "loss": 0.207, "loss_nan_ranks": 0, "loss_rank_avg": 0.20135775208473206, "step": 1880, "valid_targets_mean": 4949.4, "valid_targets_min": 1507 }, { "epoch": 3.030546623794212, "grad_norm": 0.4085250192487578, "learning_rate": 2.7967382267860946e-05, "loss": 0.2202, "loss_nan_ranks": 0, "loss_rank_avg": 0.23754431307315826, "step": 1885, "valid_targets_mean": 7139.6, "valid_targets_min": 1003 }, { "epoch": 3.0385852090032155, "grad_norm": 0.5510015583580707, "learning_rate": 2.7893772033886208e-05, "loss": 0.2098, "loss_nan_ranks": 0, "loss_rank_avg": 0.20717856287956238, "step": 1890, "valid_targets_mean": 5289.0, "valid_targets_min": 880 }, { "epoch": 3.0466237942122185, "grad_norm": 0.47108051497284203, "learning_rate": 2.7820034919409203e-05, "loss": 0.2059, "loss_nan_ranks": 0, "loss_rank_avg": 0.20311778783798218, "step": 1895, "valid_targets_mean": 4827.5, "valid_targets_min": 567 }, { "epoch": 3.054662379421222, "grad_norm": 0.4687658440412486, "learning_rate": 2.774617210964305e-05, "loss": 0.2047, "loss_nan_ranks": 0, "loss_rank_avg": 0.22327911853790283, "step": 1900, "valid_targets_mean": 6458.3, "valid_targets_min": 1909 }, { "epoch": 3.062700964630225, "grad_norm": 0.5317314845653304, "learning_rate": 2.767218479182121e-05, "loss": 0.2208, "loss_nan_ranks": 0, "loss_rank_avg": 0.28799089789390564, "step": 1905, "valid_targets_mean": 5339.3, "valid_targets_min": 344 }, { "epoch": 3.0707395498392285, "grad_norm": 0.4479836422167699, "learning_rate": 2.7598074155178447e-05, "loss": 0.2075, "loss_nan_ranks": 0, "loss_rank_avg": 0.23213958740234375, "step": 1910, "valid_targets_mean": 6368.8, "valid_targets_min": 2232 }, { "epoch": 3.0787781350482315, "grad_norm": 0.4879671474173943, "learning_rate": 2.7523841390931676e-05, "loss": 0.2158, "loss_nan_ranks": 0, "loss_rank_avg": 0.19620759785175323, "step": 1915, "valid_targets_mean": 5519.9, "valid_targets_min": 2982 }, { "epoch": 3.0868167202572345, "grad_norm": 0.576805679083638, "learning_rate": 2.7449487692260834e-05, "loss": 0.2368, "loss_nan_ranks": 0, "loss_rank_avg": 0.2544819414615631, "step": 1920, "valid_targets_mean": 4490.9, "valid_targets_min": 687 }, { "epoch": 3.094855305466238, "grad_norm": 0.4971668089459153, "learning_rate": 2.7375014254289695e-05, "loss": 0.2063, "loss_nan_ranks": 0, "loss_rank_avg": 0.1839742660522461, "step": 1925, "valid_targets_mean": 4795.8, "valid_targets_min": 1833 }, { "epoch": 3.102893890675241, "grad_norm": 0.4687617088950276, "learning_rate": 2.7300422274066672e-05, "loss": 0.2028, "loss_nan_ranks": 0, "loss_rank_avg": 0.2087346613407135, "step": 1930, "valid_targets_mean": 5627.9, "valid_targets_min": 2985 }, { "epoch": 3.1109324758842445, "grad_norm": 0.4927605336472376, "learning_rate": 2.722571295054554e-05, "loss": 0.2321, "loss_nan_ranks": 0, "loss_rank_avg": 0.2347278743982315, "step": 1935, "valid_targets_mean": 5060.4, "valid_targets_min": 371 }, { "epoch": 3.1189710610932475, "grad_norm": 0.4987134488018747, "learning_rate": 2.715088748456622e-05, "loss": 0.2347, "loss_nan_ranks": 0, "loss_rank_avg": 0.23042768239974976, "step": 1940, "valid_targets_mean": 5561.6, "valid_targets_min": 550 }, { "epoch": 3.127009646302251, "grad_norm": 0.523421193954538, "learning_rate": 2.7075947078835438e-05, "loss": 0.2135, "loss_nan_ranks": 0, "loss_rank_avg": 0.22954672574996948, "step": 1945, "valid_targets_mean": 4881.9, "valid_targets_min": 1394 }, { "epoch": 3.135048231511254, "grad_norm": 0.43883645279150485, "learning_rate": 2.7000892937907398e-05, "loss": 0.1886, "loss_nan_ranks": 0, "loss_rank_avg": 0.19516025483608246, "step": 1950, "valid_targets_mean": 5517.6, "valid_targets_min": 3251 }, { "epoch": 3.143086816720257, "grad_norm": 0.4570199670863005, "learning_rate": 2.6925726268164427e-05, "loss": 0.2222, "loss_nan_ranks": 0, "loss_rank_avg": 0.24825003743171692, "step": 1955, "valid_targets_mean": 6280.4, "valid_targets_min": 2112 }, { "epoch": 3.1511254019292605, "grad_norm": 0.45672754180296316, "learning_rate": 2.685044827779759e-05, "loss": 0.2103, "loss_nan_ranks": 0, "loss_rank_avg": 0.20939724147319794, "step": 1960, "valid_targets_mean": 6016.7, "valid_targets_min": 2771 }, { "epoch": 3.1591639871382635, "grad_norm": 0.47906774477386277, "learning_rate": 2.6775060176787256e-05, "loss": 0.2322, "loss_nan_ranks": 0, "loss_rank_avg": 0.281923770904541, "step": 1965, "valid_targets_mean": 6699.8, "valid_targets_min": 2442 }, { "epoch": 3.167202572347267, "grad_norm": 0.39767857581545424, "learning_rate": 2.6699563176883664e-05, "loss": 0.2013, "loss_nan_ranks": 0, "loss_rank_avg": 0.2029469907283783, "step": 1970, "valid_targets_mean": 6916.5, "valid_targets_min": 1302 }, { "epoch": 3.17524115755627, "grad_norm": 0.4425799974084158, "learning_rate": 2.6623958491587446e-05, "loss": 0.217, "loss_nan_ranks": 0, "loss_rank_avg": 0.20335035026073456, "step": 1975, "valid_targets_mean": 5785.0, "valid_targets_min": 2366 }, { "epoch": 3.1832797427652735, "grad_norm": 0.44544395721654917, "learning_rate": 2.654824733613008e-05, "loss": 0.2085, "loss_nan_ranks": 0, "loss_rank_avg": 0.21528367698192596, "step": 1980, "valid_targets_mean": 5611.8, "valid_targets_min": 2466 }, { "epoch": 3.1913183279742765, "grad_norm": 0.4460608523219643, "learning_rate": 2.6472430927454436e-05, "loss": 0.2128, "loss_nan_ranks": 0, "loss_rank_avg": 0.20754650235176086, "step": 1985, "valid_targets_mean": 7354.8, "valid_targets_min": 3155 }, { "epoch": 3.19935691318328, "grad_norm": 0.42210886653384705, "learning_rate": 2.6396510484195137e-05, "loss": 0.2185, "loss_nan_ranks": 0, "loss_rank_avg": 0.2087785005569458, "step": 1990, "valid_targets_mean": 6236.5, "valid_targets_min": 2469 }, { "epoch": 3.207395498392283, "grad_norm": 0.43096075271764295, "learning_rate": 2.6320487226659025e-05, "loss": 0.1979, "loss_nan_ranks": 0, "loss_rank_avg": 0.16838577389717102, "step": 1995, "valid_targets_mean": 5186.6, "valid_targets_min": 1676 }, { "epoch": 3.215434083601286, "grad_norm": 0.4508053623757557, "learning_rate": 2.6244362376805526e-05, "loss": 0.2267, "loss_nan_ranks": 0, "loss_rank_avg": 0.23479191958904266, "step": 2000, "valid_targets_mean": 5779.5, "valid_targets_min": 763 }, { "epoch": 3.2234726688102895, "grad_norm": 0.4628118815083852, "learning_rate": 2.616813715822699e-05, "loss": 0.2118, "loss_nan_ranks": 0, "loss_rank_avg": 0.22613340616226196, "step": 2005, "valid_targets_mean": 5524.2, "valid_targets_min": 1492 }, { "epoch": 3.2315112540192925, "grad_norm": 0.4720924761087141, "learning_rate": 2.609181279612907e-05, "loss": 0.2166, "loss_nan_ranks": 0, "loss_rank_avg": 0.24971206486225128, "step": 2010, "valid_targets_mean": 5421.2, "valid_targets_min": 686 }, { "epoch": 3.239549839228296, "grad_norm": 0.4737698035846392, "learning_rate": 2.601539051731098e-05, "loss": 0.2059, "loss_nan_ranks": 0, "loss_rank_avg": 0.2119787633419037, "step": 2015, "valid_targets_mean": 5191.6, "valid_targets_min": 1255 }, { "epoch": 3.247588424437299, "grad_norm": 0.4572117282020224, "learning_rate": 2.5938871550145813e-05, "loss": 0.2119, "loss_nan_ranks": 0, "loss_rank_avg": 0.1961323767900467, "step": 2020, "valid_targets_mean": 5815.9, "valid_targets_min": 2510 }, { "epoch": 3.255627009646302, "grad_norm": 0.43770534537636197, "learning_rate": 2.5862257124560776e-05, "loss": 0.2141, "loss_nan_ranks": 0, "loss_rank_avg": 0.19521623849868774, "step": 2025, "valid_targets_mean": 4878.7, "valid_targets_min": 359 }, { "epoch": 3.2636655948553055, "grad_norm": 0.5133043126611774, "learning_rate": 2.5785548472017428e-05, "loss": 0.2182, "loss_nan_ranks": 0, "loss_rank_avg": 0.22816744446754456, "step": 2030, "valid_targets_mean": 5207.1, "valid_targets_min": 355 }, { "epoch": 3.2717041800643085, "grad_norm": 0.45988818406168736, "learning_rate": 2.5708746825491872e-05, "loss": 0.206, "loss_nan_ranks": 0, "loss_rank_avg": 0.2291097640991211, "step": 2035, "valid_targets_mean": 5681.0, "valid_targets_min": 1539 }, { "epoch": 3.279742765273312, "grad_norm": 0.4942920353232446, "learning_rate": 2.5631853419454963e-05, "loss": 0.2219, "loss_nan_ranks": 0, "loss_rank_avg": 0.19933205842971802, "step": 2040, "valid_targets_mean": 4273.0, "valid_targets_min": 312 }, { "epoch": 3.287781350482315, "grad_norm": 0.4710297159118358, "learning_rate": 2.5554869489852462e-05, "loss": 0.2241, "loss_nan_ranks": 0, "loss_rank_avg": 0.25016915798187256, "step": 2045, "valid_targets_mean": 6010.7, "valid_targets_min": 3356 }, { "epoch": 3.2958199356913185, "grad_norm": 0.4329815260262049, "learning_rate": 2.5477796274085128e-05, "loss": 0.2063, "loss_nan_ranks": 0, "loss_rank_avg": 0.19916954636573792, "step": 2050, "valid_targets_mean": 5431.9, "valid_targets_min": 477 }, { "epoch": 3.3038585209003215, "grad_norm": 0.4382594314534806, "learning_rate": 2.540063501098889e-05, "loss": 0.2117, "loss_nan_ranks": 0, "loss_rank_avg": 0.22328132390975952, "step": 2055, "valid_targets_mean": 7057.8, "valid_targets_min": 2434 }, { "epoch": 3.311897106109325, "grad_norm": 0.4304909069133098, "learning_rate": 2.5323386940814894e-05, "loss": 0.222, "loss_nan_ranks": 0, "loss_rank_avg": 0.20800434052944183, "step": 2060, "valid_targets_mean": 5571.2, "valid_targets_min": 2064 }, { "epoch": 3.319935691318328, "grad_norm": 0.45761114861789215, "learning_rate": 2.5246053305209576e-05, "loss": 0.2224, "loss_nan_ranks": 0, "loss_rank_avg": 0.22320008277893066, "step": 2065, "valid_targets_mean": 5810.9, "valid_targets_min": 2496 }, { "epoch": 3.327974276527331, "grad_norm": 0.5109891719100492, "learning_rate": 2.516863534719472e-05, "loss": 0.2197, "loss_nan_ranks": 0, "loss_rank_avg": 0.2085902988910675, "step": 2070, "valid_targets_mean": 5335.4, "valid_targets_min": 2868 }, { "epoch": 3.3360128617363345, "grad_norm": 0.46691815612294274, "learning_rate": 2.509113431114745e-05, "loss": 0.2278, "loss_nan_ranks": 0, "loss_rank_avg": 0.18727019429206848, "step": 2075, "valid_targets_mean": 5446.6, "valid_targets_min": 686 }, { "epoch": 3.3440514469453375, "grad_norm": 0.4900335050961584, "learning_rate": 2.5013551442780246e-05, "loss": 0.2237, "loss_nan_ranks": 0, "loss_rank_avg": 0.26614588499069214, "step": 2080, "valid_targets_mean": 5034.6, "valid_targets_min": 1621 }, { "epoch": 3.352090032154341, "grad_norm": 0.44650493165960287, "learning_rate": 2.493588798912094e-05, "loss": 0.1943, "loss_nan_ranks": 0, "loss_rank_avg": 0.1934056580066681, "step": 2085, "valid_targets_mean": 6115.8, "valid_targets_min": 2803 }, { "epoch": 3.360128617363344, "grad_norm": 0.4994390565400204, "learning_rate": 2.485814519849262e-05, "loss": 0.2142, "loss_nan_ranks": 0, "loss_rank_avg": 0.22949208319187164, "step": 2090, "valid_targets_mean": 4577.1, "valid_targets_min": 1168 }, { "epoch": 3.368167202572347, "grad_norm": 0.4260321258743967, "learning_rate": 2.478032432049362e-05, "loss": 0.2007, "loss_nan_ranks": 0, "loss_rank_avg": 0.21895253658294678, "step": 2095, "valid_targets_mean": 5931.0, "valid_targets_min": 2107 }, { "epoch": 3.3762057877813505, "grad_norm": 0.4504678210337142, "learning_rate": 2.470242660597741e-05, "loss": 0.2078, "loss_nan_ranks": 0, "loss_rank_avg": 0.22290824353694916, "step": 2100, "valid_targets_mean": 5929.8, "valid_targets_min": 2326 }, { "epoch": 3.3842443729903535, "grad_norm": 0.41031164293445443, "learning_rate": 2.4624453307032475e-05, "loss": 0.2227, "loss_nan_ranks": 0, "loss_rank_avg": 0.23696118593215942, "step": 2105, "valid_targets_mean": 6418.2, "valid_targets_min": 1112 }, { "epoch": 3.392282958199357, "grad_norm": 0.48502919577531867, "learning_rate": 2.4546405676962212e-05, "loss": 0.2144, "loss_nan_ranks": 0, "loss_rank_avg": 0.2700331211090088, "step": 2110, "valid_targets_mean": 4992.6, "valid_targets_min": 955 }, { "epoch": 3.40032154340836, "grad_norm": 0.4229844699525625, "learning_rate": 2.4468284970264796e-05, "loss": 0.2155, "loss_nan_ranks": 0, "loss_rank_avg": 0.18260376155376434, "step": 2115, "valid_targets_mean": 5966.1, "valid_targets_min": 2274 }, { "epoch": 3.4083601286173635, "grad_norm": 0.4984857041447722, "learning_rate": 2.4390092442612977e-05, "loss": 0.2244, "loss_nan_ranks": 0, "loss_rank_avg": 0.23534205555915833, "step": 2120, "valid_targets_mean": 4669.6, "valid_targets_min": 1543 }, { "epoch": 3.4163987138263665, "grad_norm": 0.4859235898941334, "learning_rate": 2.4311829350833927e-05, "loss": 0.2135, "loss_nan_ranks": 0, "loss_rank_avg": 0.19799849390983582, "step": 2125, "valid_targets_mean": 6246.9, "valid_targets_min": 493 }, { "epoch": 3.42443729903537, "grad_norm": 0.4690768364402796, "learning_rate": 2.423349695288904e-05, "loss": 0.2226, "loss_nan_ranks": 0, "loss_rank_avg": 0.2516707181930542, "step": 2130, "valid_targets_mean": 5483.4, "valid_targets_min": 424 }, { "epoch": 3.432475884244373, "grad_norm": 0.44024466308006444, "learning_rate": 2.4155096507853668e-05, "loss": 0.2241, "loss_nan_ranks": 0, "loss_rank_avg": 0.2450716495513916, "step": 2135, "valid_targets_mean": 6793.9, "valid_targets_min": 2403 }, { "epoch": 3.440514469453376, "grad_norm": 0.49255880868641494, "learning_rate": 2.407662927589697e-05, "loss": 0.2209, "loss_nan_ranks": 0, "loss_rank_avg": 0.27766314148902893, "step": 2140, "valid_targets_mean": 5863.6, "valid_targets_min": 1504 }, { "epoch": 3.4485530546623795, "grad_norm": 0.49652597672181636, "learning_rate": 2.3998096518261563e-05, "loss": 0.2118, "loss_nan_ranks": 0, "loss_rank_avg": 0.21233215928077698, "step": 2145, "valid_targets_mean": 5722.1, "valid_targets_min": 2198 }, { "epoch": 3.4565916398713825, "grad_norm": 0.4508380257265703, "learning_rate": 2.39194994972433e-05, "loss": 0.2153, "loss_nan_ranks": 0, "loss_rank_avg": 0.24831700325012207, "step": 2150, "valid_targets_mean": 5750.8, "valid_targets_min": 707 }, { "epoch": 3.464630225080386, "grad_norm": 0.505570603028868, "learning_rate": 2.3840839476170986e-05, "loss": 0.2341, "loss_nan_ranks": 0, "loss_rank_avg": 0.2556144595146179, "step": 2155, "valid_targets_mean": 5813.5, "valid_targets_min": 1052 }, { "epoch": 3.472668810289389, "grad_norm": 0.5080212244608979, "learning_rate": 2.3762117719386035e-05, "loss": 0.2182, "loss_nan_ranks": 0, "loss_rank_avg": 0.22166283428668976, "step": 2160, "valid_targets_mean": 5062.8, "valid_targets_min": 363 }, { "epoch": 3.4807073954983925, "grad_norm": 0.47342379469363194, "learning_rate": 2.368333549222219e-05, "loss": 0.2371, "loss_nan_ranks": 0, "loss_rank_avg": 0.23823466897010803, "step": 2165, "valid_targets_mean": 5316.8, "valid_targets_min": 1762 }, { "epoch": 3.4887459807073955, "grad_norm": 0.5419798446391779, "learning_rate": 2.3604494060985147e-05, "loss": 0.2033, "loss_nan_ranks": 0, "loss_rank_avg": 0.24541357159614563, "step": 2170, "valid_targets_mean": 5685.3, "valid_targets_min": 1966 }, { "epoch": 3.4967845659163985, "grad_norm": 0.4519419903196845, "learning_rate": 2.352559469293223e-05, "loss": 0.191, "loss_nan_ranks": 0, "loss_rank_avg": 0.21435996890068054, "step": 2175, "valid_targets_mean": 5869.8, "valid_targets_min": 2068 }, { "epoch": 3.504823151125402, "grad_norm": 0.6041112174173733, "learning_rate": 2.3446638656252007e-05, "loss": 0.228, "loss_nan_ranks": 0, "loss_rank_avg": 0.20639154314994812, "step": 2180, "valid_targets_mean": 4280.1, "valid_targets_min": 831 }, { "epoch": 3.512861736334405, "grad_norm": 0.438228796481592, "learning_rate": 2.336762722004391e-05, "loss": 0.2177, "loss_nan_ranks": 0, "loss_rank_avg": 0.19948528707027435, "step": 2185, "valid_targets_mean": 5539.8, "valid_targets_min": 842 }, { "epoch": 3.5209003215434085, "grad_norm": 0.4540829032794475, "learning_rate": 2.328856165429783e-05, "loss": 0.2028, "loss_nan_ranks": 0, "loss_rank_avg": 0.2040947824716568, "step": 2190, "valid_targets_mean": 5811.5, "valid_targets_min": 2452 }, { "epoch": 3.5289389067524115, "grad_norm": 0.41836024915690306, "learning_rate": 2.3209443229873713e-05, "loss": 0.1978, "loss_nan_ranks": 0, "loss_rank_avg": 0.16951392590999603, "step": 2195, "valid_targets_mean": 6125.7, "valid_targets_min": 3390 }, { "epoch": 3.536977491961415, "grad_norm": 0.4850570987480443, "learning_rate": 2.313027321848113e-05, "loss": 0.2072, "loss_nan_ranks": 0, "loss_rank_avg": 0.20990464091300964, "step": 2200, "valid_targets_mean": 5732.7, "valid_targets_min": 364 }, { "epoch": 3.545016077170418, "grad_norm": 0.43896441152646415, "learning_rate": 2.3051052892658827e-05, "loss": 0.203, "loss_nan_ranks": 0, "loss_rank_avg": 0.21642711758613586, "step": 2205, "valid_targets_mean": 5755.6, "valid_targets_min": 2773 }, { "epoch": 3.553054662379421, "grad_norm": 0.4709870338495115, "learning_rate": 2.297178352575429e-05, "loss": 0.2304, "loss_nan_ranks": 0, "loss_rank_avg": 0.21805457770824432, "step": 2210, "valid_targets_mean": 5804.4, "valid_targets_min": 983 }, { "epoch": 3.5610932475884245, "grad_norm": 0.44572679930140774, "learning_rate": 2.2892466391903258e-05, "loss": 0.2159, "loss_nan_ranks": 0, "loss_rank_avg": 0.2034660279750824, "step": 2215, "valid_targets_mean": 5561.6, "valid_targets_min": 717 }, { "epoch": 3.5691318327974275, "grad_norm": 0.454325434835351, "learning_rate": 2.2813102766009254e-05, "loss": 0.2106, "loss_nan_ranks": 0, "loss_rank_avg": 0.22672885656356812, "step": 2220, "valid_targets_mean": 5497.9, "valid_targets_min": 505 }, { "epoch": 3.577170418006431, "grad_norm": 0.48626995312563503, "learning_rate": 2.2733693923723097e-05, "loss": 0.2133, "loss_nan_ranks": 0, "loss_rank_avg": 0.20194870233535767, "step": 2225, "valid_targets_mean": 5243.6, "valid_targets_min": 867 }, { "epoch": 3.585209003215434, "grad_norm": 0.4445447090227905, "learning_rate": 2.2654241141422386e-05, "loss": 0.226, "loss_nan_ranks": 0, "loss_rank_avg": 0.2123812437057495, "step": 2230, "valid_targets_mean": 4860.9, "valid_targets_min": 982 }, { "epoch": 3.593247588424437, "grad_norm": 0.6282387823578006, "learning_rate": 2.257474569619097e-05, "loss": 0.211, "loss_nan_ranks": 0, "loss_rank_avg": 0.18385881185531616, "step": 2235, "valid_targets_mean": 5456.4, "valid_targets_min": 747 }, { "epoch": 3.6012861736334405, "grad_norm": 0.4661679781841043, "learning_rate": 2.2495208865798484e-05, "loss": 0.2323, "loss_nan_ranks": 0, "loss_rank_avg": 0.2516222596168518, "step": 2240, "valid_targets_mean": 5818.1, "valid_targets_min": 2430 }, { "epoch": 3.609324758842444, "grad_norm": 0.5063343638471681, "learning_rate": 2.241563192867974e-05, "loss": 0.2262, "loss_nan_ranks": 0, "loss_rank_avg": 0.2693856358528137, "step": 2245, "valid_targets_mean": 5781.2, "valid_targets_min": 977 }, { "epoch": 3.617363344051447, "grad_norm": 0.46853096205787864, "learning_rate": 2.233601616391419e-05, "loss": 0.2119, "loss_nan_ranks": 0, "loss_rank_avg": 0.19709277153015137, "step": 2250, "valid_targets_mean": 4633.3, "valid_targets_min": 360 }, { "epoch": 3.62540192926045, "grad_norm": 0.47453245783445847, "learning_rate": 2.2256362851205423e-05, "loss": 0.2327, "loss_nan_ranks": 0, "loss_rank_avg": 0.20516790449619293, "step": 2255, "valid_targets_mean": 5310.6, "valid_targets_min": 584 }, { "epoch": 3.6334405144694535, "grad_norm": 0.4218807893646266, "learning_rate": 2.2176673270860513e-05, "loss": 0.209, "loss_nan_ranks": 0, "loss_rank_avg": 0.2451988160610199, "step": 2260, "valid_targets_mean": 6055.2, "valid_targets_min": 2343 }, { "epoch": 3.6414790996784565, "grad_norm": 0.49840300841653384, "learning_rate": 2.209694870376951e-05, "loss": 0.2135, "loss_nan_ranks": 0, "loss_rank_avg": 0.23280146718025208, "step": 2265, "valid_targets_mean": 4976.8, "valid_targets_min": 628 }, { "epoch": 3.64951768488746, "grad_norm": 0.40449740396090167, "learning_rate": 2.2017190431384813e-05, "loss": 0.2134, "loss_nan_ranks": 0, "loss_rank_avg": 0.20014050602912903, "step": 2270, "valid_targets_mean": 6301.7, "valid_targets_min": 2562 }, { "epoch": 3.657556270096463, "grad_norm": 0.5348968486420073, "learning_rate": 2.1937399735700578e-05, "loss": 0.2341, "loss_nan_ranks": 0, "loss_rank_avg": 0.23371417820453644, "step": 2275, "valid_targets_mean": 4516.2, "valid_targets_min": 793 }, { "epoch": 3.665594855305466, "grad_norm": 0.4412069174813758, "learning_rate": 2.185757789923213e-05, "loss": 0.2092, "loss_nan_ranks": 0, "loss_rank_avg": 0.22182171046733856, "step": 2280, "valid_targets_mean": 5953.4, "valid_targets_min": 1050 }, { "epoch": 3.6736334405144695, "grad_norm": 0.4681541955311709, "learning_rate": 2.177772620499533e-05, "loss": 0.2114, "loss_nan_ranks": 0, "loss_rank_avg": 0.19206824898719788, "step": 2285, "valid_targets_mean": 4931.1, "valid_targets_min": 591 }, { "epoch": 3.6816720257234725, "grad_norm": 0.43440468582181413, "learning_rate": 2.169784593648594e-05, "loss": 0.2067, "loss_nan_ranks": 0, "loss_rank_avg": 0.21512943506240845, "step": 2290, "valid_targets_mean": 6165.6, "valid_targets_min": 3636 }, { "epoch": 3.689710610932476, "grad_norm": 0.4533493453174465, "learning_rate": 2.161793837765904e-05, "loss": 0.2055, "loss_nan_ranks": 0, "loss_rank_avg": 0.20502886176109314, "step": 2295, "valid_targets_mean": 6049.6, "valid_targets_min": 2196 }, { "epoch": 3.697749196141479, "grad_norm": 0.40904993139435536, "learning_rate": 2.1538004812908345e-05, "loss": 0.2099, "loss_nan_ranks": 0, "loss_rank_avg": 0.16571852564811707, "step": 2300, "valid_targets_mean": 5779.1, "valid_targets_min": 1787 }, { "epoch": 3.7057877813504825, "grad_norm": 0.49153894981339047, "learning_rate": 2.1458046527045563e-05, "loss": 0.2199, "loss_nan_ranks": 0, "loss_rank_avg": 0.2017051726579666, "step": 2305, "valid_targets_mean": 5293.1, "valid_targets_min": 479 }, { "epoch": 3.7138263665594855, "grad_norm": 0.4285879061951372, "learning_rate": 2.1378064805279796e-05, "loss": 0.1996, "loss_nan_ranks": 0, "loss_rank_avg": 0.23837776482105255, "step": 2310, "valid_targets_mean": 6358.2, "valid_targets_min": 1503 }, { "epoch": 3.721864951768489, "grad_norm": 0.4735435580454719, "learning_rate": 2.1298060933196797e-05, "loss": 0.2213, "loss_nan_ranks": 0, "loss_rank_avg": 0.22305136919021606, "step": 2315, "valid_targets_mean": 5233.4, "valid_targets_min": 1262 }, { "epoch": 3.729903536977492, "grad_norm": 0.4494458391637004, "learning_rate": 2.1218036196738382e-05, "loss": 0.2303, "loss_nan_ranks": 0, "loss_rank_avg": 0.20690946280956268, "step": 2320, "valid_targets_mean": 5577.9, "valid_targets_min": 2170 }, { "epoch": 3.737942122186495, "grad_norm": 0.4236260163992656, "learning_rate": 2.1137991882181716e-05, "loss": 0.219, "loss_nan_ranks": 0, "loss_rank_avg": 0.2045375406742096, "step": 2325, "valid_targets_mean": 6003.2, "valid_targets_min": 735 }, { "epoch": 3.7459807073954985, "grad_norm": 0.4194948117221583, "learning_rate": 2.1057929276118663e-05, "loss": 0.2227, "loss_nan_ranks": 0, "loss_rank_avg": 0.2365095168352127, "step": 2330, "valid_targets_mean": 7019.9, "valid_targets_min": 2770 }, { "epoch": 3.7540192926045015, "grad_norm": 0.4554573167258968, "learning_rate": 2.097784966543509e-05, "loss": 0.2287, "loss_nan_ranks": 0, "loss_rank_avg": 0.22981056571006775, "step": 2335, "valid_targets_mean": 5870.8, "valid_targets_min": 2514 }, { "epoch": 3.762057877813505, "grad_norm": 0.3979763789428403, "learning_rate": 2.0897754337290186e-05, "loss": 0.221, "loss_nan_ranks": 0, "loss_rank_avg": 0.249480202794075, "step": 2340, "valid_targets_mean": 6951.8, "valid_targets_min": 2075 }, { "epoch": 3.770096463022508, "grad_norm": 0.4326484331885382, "learning_rate": 2.081764457909578e-05, "loss": 0.2172, "loss_nan_ranks": 0, "loss_rank_avg": 0.21711274981498718, "step": 2345, "valid_targets_mean": 5988.9, "valid_targets_min": 3006 }, { "epoch": 3.778135048231511, "grad_norm": 0.4537090060178923, "learning_rate": 2.073752167849563e-05, "loss": 0.2324, "loss_nan_ranks": 0, "loss_rank_avg": 0.24819859862327576, "step": 2350, "valid_targets_mean": 6692.4, "valid_targets_min": 1672 }, { "epoch": 3.7861736334405145, "grad_norm": 0.4501156544408785, "learning_rate": 2.0657386923344763e-05, "loss": 0.2219, "loss_nan_ranks": 0, "loss_rank_avg": 0.19166472554206848, "step": 2355, "valid_targets_mean": 5443.9, "valid_targets_min": 2086 }, { "epoch": 3.7942122186495175, "grad_norm": 0.448471765482259, "learning_rate": 2.0577241601688715e-05, "loss": 0.2078, "loss_nan_ranks": 0, "loss_rank_avg": 0.21458148956298828, "step": 2360, "valid_targets_mean": 5981.8, "valid_targets_min": 964 }, { "epoch": 3.802250803858521, "grad_norm": 0.4361570179845142, "learning_rate": 2.0497087001742897e-05, "loss": 0.2145, "loss_nan_ranks": 0, "loss_rank_avg": 0.2361234426498413, "step": 2365, "valid_targets_mean": 5905.1, "valid_targets_min": 3336 }, { "epoch": 3.810289389067524, "grad_norm": 0.5319107692301696, "learning_rate": 2.0416924411871827e-05, "loss": 0.2119, "loss_nan_ranks": 0, "loss_rank_avg": 0.22896161675453186, "step": 2370, "valid_targets_mean": 4759.8, "valid_targets_min": 718 }, { "epoch": 3.8183279742765275, "grad_norm": 0.43055763396562985, "learning_rate": 2.0336755120568474e-05, "loss": 0.2084, "loss_nan_ranks": 0, "loss_rank_avg": 0.16542640328407288, "step": 2375, "valid_targets_mean": 5030.9, "valid_targets_min": 700 }, { "epoch": 3.8263665594855305, "grad_norm": 0.424784709923934, "learning_rate": 2.0256580416433507e-05, "loss": 0.2182, "loss_nan_ranks": 0, "loss_rank_avg": 0.1930401623249054, "step": 2380, "valid_targets_mean": 5712.7, "valid_targets_min": 3377 }, { "epoch": 3.834405144694534, "grad_norm": 0.41048594391090903, "learning_rate": 2.017640158815459e-05, "loss": 0.2063, "loss_nan_ranks": 0, "loss_rank_avg": 0.19271403551101685, "step": 2385, "valid_targets_mean": 5625.4, "valid_targets_min": 398 }, { "epoch": 3.842443729903537, "grad_norm": 0.5112917261020897, "learning_rate": 2.0096219924485702e-05, "loss": 0.1899, "loss_nan_ranks": 0, "loss_rank_avg": 0.21932145953178406, "step": 2390, "valid_targets_mean": 4557.1, "valid_targets_min": 525 }, { "epoch": 3.85048231511254, "grad_norm": 0.46118075226408284, "learning_rate": 2.0016036714226375e-05, "loss": 0.2088, "loss_nan_ranks": 0, "loss_rank_avg": 0.2620882987976074, "step": 2395, "valid_targets_mean": 5693.9, "valid_targets_min": 1769 }, { "epoch": 3.8585209003215435, "grad_norm": 0.44773172289290925, "learning_rate": 1.993585324620101e-05, "loss": 0.2084, "loss_nan_ranks": 0, "loss_rank_avg": 0.20329290628433228, "step": 2400, "valid_targets_mean": 4980.4, "valid_targets_min": 923 }, { "epoch": 3.8665594855305465, "grad_norm": 0.494882324438044, "learning_rate": 1.985567080923815e-05, "loss": 0.2247, "loss_nan_ranks": 0, "loss_rank_avg": 0.22697266936302185, "step": 2405, "valid_targets_mean": 5325.9, "valid_targets_min": 2328 }, { "epoch": 3.87459807073955, "grad_norm": 0.44015889783779993, "learning_rate": 1.9775490692149754e-05, "loss": 0.2217, "loss_nan_ranks": 0, "loss_rank_avg": 0.20229412615299225, "step": 2410, "valid_targets_mean": 5463.9, "valid_targets_min": 1088 }, { "epoch": 3.882636655948553, "grad_norm": 0.42567259296177046, "learning_rate": 1.969531418371051e-05, "loss": 0.2042, "loss_nan_ranks": 0, "loss_rank_avg": 0.18126389384269714, "step": 2415, "valid_targets_mean": 5734.0, "valid_targets_min": 763 }, { "epoch": 3.890675241157556, "grad_norm": 0.45470968743706225, "learning_rate": 1.9615142572637088e-05, "loss": 0.2213, "loss_nan_ranks": 0, "loss_rank_avg": 0.24312356114387512, "step": 2420, "valid_targets_mean": 5781.9, "valid_targets_min": 2244 }, { "epoch": 3.8987138263665595, "grad_norm": 0.467052238827403, "learning_rate": 1.9534977147567457e-05, "loss": 0.2252, "loss_nan_ranks": 0, "loss_rank_avg": 0.18865913152694702, "step": 2425, "valid_targets_mean": 4876.2, "valid_targets_min": 1931 }, { "epoch": 3.906752411575563, "grad_norm": 0.47098837302480645, "learning_rate": 1.9454819197040142e-05, "loss": 0.2019, "loss_nan_ranks": 0, "loss_rank_avg": 0.2384665310382843, "step": 2430, "valid_targets_mean": 5154.0, "valid_targets_min": 1026 }, { "epoch": 3.914790996784566, "grad_norm": 0.44490893084527133, "learning_rate": 1.9374670009473525e-05, "loss": 0.2011, "loss_nan_ranks": 0, "loss_rank_avg": 0.21634893119335175, "step": 2435, "valid_targets_mean": 5663.2, "valid_targets_min": 1532 }, { "epoch": 3.922829581993569, "grad_norm": 0.41659967178264024, "learning_rate": 1.9294530873145142e-05, "loss": 0.2158, "loss_nan_ranks": 0, "loss_rank_avg": 0.22321747243404388, "step": 2440, "valid_targets_mean": 6121.1, "valid_targets_min": 3266 }, { "epoch": 3.9308681672025725, "grad_norm": 0.43802772871467616, "learning_rate": 1.9214403076170968e-05, "loss": 0.2035, "loss_nan_ranks": 0, "loss_rank_avg": 0.20500494539737701, "step": 2445, "valid_targets_mean": 5410.9, "valid_targets_min": 1856 }, { "epoch": 3.9389067524115755, "grad_norm": 0.6732315793660567, "learning_rate": 1.913428790648472e-05, "loss": 0.2165, "loss_nan_ranks": 0, "loss_rank_avg": 0.21469956636428833, "step": 2450, "valid_targets_mean": 5684.2, "valid_targets_min": 2356 }, { "epoch": 3.946945337620579, "grad_norm": 0.4664945007826955, "learning_rate": 1.9054186651817145e-05, "loss": 0.2153, "loss_nan_ranks": 0, "loss_rank_avg": 0.23946499824523926, "step": 2455, "valid_targets_mean": 5438.3, "valid_targets_min": 2176 }, { "epoch": 3.954983922829582, "grad_norm": 0.4661613319228112, "learning_rate": 1.8974100599675324e-05, "loss": 0.2239, "loss_nan_ranks": 0, "loss_rank_avg": 0.22451001405715942, "step": 2460, "valid_targets_mean": 5269.4, "valid_targets_min": 1016 }, { "epoch": 3.963022508038585, "grad_norm": 0.41493904461143283, "learning_rate": 1.8894031037321983e-05, "loss": 0.2121, "loss_nan_ranks": 0, "loss_rank_avg": 0.18410423398017883, "step": 2465, "valid_targets_mean": 5644.1, "valid_targets_min": 3111 }, { "epoch": 3.9710610932475885, "grad_norm": 0.475551566600847, "learning_rate": 1.8813979251754823e-05, "loss": 0.2184, "loss_nan_ranks": 0, "loss_rank_avg": 0.25625407695770264, "step": 2470, "valid_targets_mean": 6587.2, "valid_targets_min": 2768 }, { "epoch": 3.9790996784565915, "grad_norm": 0.4457179679996537, "learning_rate": 1.8733946529685755e-05, "loss": 0.2005, "loss_nan_ranks": 0, "loss_rank_avg": 0.19752007722854614, "step": 2475, "valid_targets_mean": 5307.2, "valid_targets_min": 2521 }, { "epoch": 3.987138263665595, "grad_norm": 0.48633447011742686, "learning_rate": 1.865393415752033e-05, "loss": 0.2305, "loss_nan_ranks": 0, "loss_rank_avg": 0.2800830602645874, "step": 2480, "valid_targets_mean": 5018.9, "valid_targets_min": 502 }, { "epoch": 3.995176848874598, "grad_norm": 0.47160209353188187, "learning_rate": 1.8573943421336973e-05, "loss": 0.2287, "loss_nan_ranks": 0, "loss_rank_avg": 0.19500645995140076, "step": 2485, "valid_targets_mean": 5507.2, "valid_targets_min": 551 }, { "epoch": 4.003215434083601, "grad_norm": 0.4431683493276922, "learning_rate": 1.849397560686635e-05, "loss": 0.2087, "loss_nan_ranks": 0, "loss_rank_avg": 0.1778678148984909, "step": 2490, "valid_targets_mean": 5407.1, "valid_targets_min": 1746 }, { "epoch": 4.011254019292605, "grad_norm": 0.5063154975052353, "learning_rate": 1.8414031999470704e-05, "loss": 0.1833, "loss_nan_ranks": 0, "loss_rank_avg": 0.2000581920146942, "step": 2495, "valid_targets_mean": 4873.6, "valid_targets_min": 2477 }, { "epoch": 4.019292604501608, "grad_norm": 0.49353913726419607, "learning_rate": 1.8334113884123168e-05, "loss": 0.2089, "loss_nan_ranks": 0, "loss_rank_avg": 0.17449554800987244, "step": 2500, "valid_targets_mean": 5010.6, "valid_targets_min": 2113 }, { "epoch": 4.027331189710611, "grad_norm": 0.46262558060542996, "learning_rate": 1.825422254538714e-05, "loss": 0.2057, "loss_nan_ranks": 0, "loss_rank_avg": 0.25343796610832214, "step": 2505, "valid_targets_mean": 6078.9, "valid_targets_min": 653 }, { "epoch": 4.035369774919614, "grad_norm": 0.5362065215987764, "learning_rate": 1.8174359267395624e-05, "loss": 0.1992, "loss_nan_ranks": 0, "loss_rank_avg": 0.19421911239624023, "step": 2510, "valid_targets_mean": 4662.9, "valid_targets_min": 602 }, { "epoch": 4.043408360128617, "grad_norm": 0.4795175141250009, "learning_rate": 1.80945253338306e-05, "loss": 0.222, "loss_nan_ranks": 0, "loss_rank_avg": 0.24856063723564148, "step": 2515, "valid_targets_mean": 6113.8, "valid_targets_min": 2423 }, { "epoch": 4.051446945337621, "grad_norm": 0.4876334669035427, "learning_rate": 1.801472202790235e-05, "loss": 0.2018, "loss_nan_ranks": 0, "loss_rank_avg": 0.18681687116622925, "step": 2520, "valid_targets_mean": 5507.8, "valid_targets_min": 2851 }, { "epoch": 4.059485530546624, "grad_norm": 0.46788947316546087, "learning_rate": 1.7934950632328893e-05, "loss": 0.1995, "loss_nan_ranks": 0, "loss_rank_avg": 0.18351972103118896, "step": 2525, "valid_targets_mean": 6029.2, "valid_targets_min": 1686 }, { "epoch": 4.067524115755627, "grad_norm": 0.4930457193060944, "learning_rate": 1.7855212429315323e-05, "loss": 0.1832, "loss_nan_ranks": 0, "loss_rank_avg": 0.1924591362476349, "step": 2530, "valid_targets_mean": 4770.0, "valid_targets_min": 310 }, { "epoch": 4.07556270096463, "grad_norm": 1.0707922894163995, "learning_rate": 1.7775508700533217e-05, "loss": 0.2037, "loss_nan_ranks": 0, "loss_rank_avg": 0.24290210008621216, "step": 2535, "valid_targets_mean": 5625.6, "valid_targets_min": 707 }, { "epoch": 4.083601286173633, "grad_norm": 0.45170678651858187, "learning_rate": 1.769584072710004e-05, "loss": 0.1984, "loss_nan_ranks": 0, "loss_rank_avg": 0.15965251624584198, "step": 2540, "valid_targets_mean": 5199.1, "valid_targets_min": 363 }, { "epoch": 4.091639871382637, "grad_norm": 0.4793914315138488, "learning_rate": 1.7616209789558513e-05, "loss": 0.1962, "loss_nan_ranks": 0, "loss_rank_avg": 0.1897103488445282, "step": 2545, "valid_targets_mean": 6103.6, "valid_targets_min": 1674 }, { "epoch": 4.09967845659164, "grad_norm": 0.509928017351408, "learning_rate": 1.75366171678561e-05, "loss": 0.2079, "loss_nan_ranks": 0, "loss_rank_avg": 0.27034711837768555, "step": 2550, "valid_targets_mean": 6321.3, "valid_targets_min": 586 }, { "epoch": 4.107717041800643, "grad_norm": 0.48592035160455116, "learning_rate": 1.7457064141324368e-05, "loss": 0.1948, "loss_nan_ranks": 0, "loss_rank_avg": 0.18286871910095215, "step": 2555, "valid_targets_mean": 5948.1, "valid_targets_min": 3357 }, { "epoch": 4.115755627009646, "grad_norm": 0.5511159152623385, "learning_rate": 1.7377551988658466e-05, "loss": 0.1923, "loss_nan_ranks": 0, "loss_rank_avg": 0.20568011701107025, "step": 2560, "valid_targets_mean": 4816.6, "valid_targets_min": 1377 }, { "epoch": 4.12379421221865, "grad_norm": 0.4984863584967216, "learning_rate": 1.7298081987896547e-05, "loss": 0.1818, "loss_nan_ranks": 0, "loss_rank_avg": 0.21172256767749786, "step": 2565, "valid_targets_mean": 5188.6, "valid_targets_min": 360 }, { "epoch": 4.131832797427653, "grad_norm": 0.450989941612913, "learning_rate": 1.721865541639924e-05, "loss": 0.2345, "loss_nan_ranks": 0, "loss_rank_avg": 0.18919016420841217, "step": 2570, "valid_targets_mean": 5664.1, "valid_targets_min": 2879 }, { "epoch": 4.139871382636656, "grad_norm": 0.43703722696294917, "learning_rate": 1.7139273550829117e-05, "loss": 0.2007, "loss_nan_ranks": 0, "loss_rank_avg": 0.19631536304950714, "step": 2575, "valid_targets_mean": 6282.9, "valid_targets_min": 2968 }, { "epoch": 4.147909967845659, "grad_norm": 0.432558045727956, "learning_rate": 1.7059937667130163e-05, "loss": 0.2039, "loss_nan_ranks": 0, "loss_rank_avg": 0.20107629895210266, "step": 2580, "valid_targets_mean": 6507.6, "valid_targets_min": 344 }, { "epoch": 4.155948553054662, "grad_norm": 0.42844076826077404, "learning_rate": 1.6980649040507296e-05, "loss": 0.2046, "loss_nan_ranks": 0, "loss_rank_avg": 0.20934857428073883, "step": 2585, "valid_targets_mean": 6436.5, "valid_targets_min": 2521 }, { "epoch": 4.163987138263666, "grad_norm": 0.4612185120502811, "learning_rate": 1.6901408945405794e-05, "loss": 0.2082, "loss_nan_ranks": 0, "loss_rank_avg": 0.18850497901439667, "step": 2590, "valid_targets_mean": 5565.6, "valid_targets_min": 889 }, { "epoch": 4.172025723472669, "grad_norm": 0.47366161861568484, "learning_rate": 1.6822218655490926e-05, "loss": 0.2076, "loss_nan_ranks": 0, "loss_rank_avg": 0.2318640649318695, "step": 2595, "valid_targets_mean": 5669.2, "valid_targets_min": 1787 }, { "epoch": 4.180064308681672, "grad_norm": 0.4478729477778503, "learning_rate": 1.674307944362738e-05, "loss": 0.2045, "loss_nan_ranks": 0, "loss_rank_avg": 0.16117283701896667, "step": 2600, "valid_targets_mean": 5841.4, "valid_targets_min": 2066 }, { "epoch": 4.188102893890675, "grad_norm": 0.513342399213119, "learning_rate": 1.6663992581858858e-05, "loss": 0.2212, "loss_nan_ranks": 0, "loss_rank_avg": 0.19785936176776886, "step": 2605, "valid_targets_mean": 4952.5, "valid_targets_min": 2254 }, { "epoch": 4.196141479099678, "grad_norm": 0.44758461547392403, "learning_rate": 1.65849593413876e-05, "loss": 0.1901, "loss_nan_ranks": 0, "loss_rank_avg": 0.2149113267660141, "step": 2610, "valid_targets_mean": 5862.0, "valid_targets_min": 2548 }, { "epoch": 4.204180064308682, "grad_norm": 0.47362083484044387, "learning_rate": 1.6505980992553973e-05, "loss": 0.2071, "loss_nan_ranks": 0, "loss_rank_avg": 0.22370827198028564, "step": 2615, "valid_targets_mean": 6501.8, "valid_targets_min": 368 }, { "epoch": 4.212218649517685, "grad_norm": 0.4855097676216963, "learning_rate": 1.6427058804816035e-05, "loss": 0.1945, "loss_nan_ranks": 0, "loss_rank_avg": 0.21815648674964905, "step": 2620, "valid_targets_mean": 5576.1, "valid_targets_min": 2816 }, { "epoch": 4.220257234726688, "grad_norm": 0.45317871679877536, "learning_rate": 1.634819404672916e-05, "loss": 0.2083, "loss_nan_ranks": 0, "loss_rank_avg": 0.18824812769889832, "step": 2625, "valid_targets_mean": 5293.6, "valid_targets_min": 2657 }, { "epoch": 4.228295819935691, "grad_norm": 0.4980247924474111, "learning_rate": 1.6269387985925607e-05, "loss": 0.2273, "loss_nan_ranks": 0, "loss_rank_avg": 0.3325211703777313, "step": 2630, "valid_targets_mean": 6427.8, "valid_targets_min": 363 }, { "epoch": 4.236334405144695, "grad_norm": 0.6649140044751879, "learning_rate": 1.6190641889094167e-05, "loss": 0.21, "loss_nan_ranks": 0, "loss_rank_avg": 0.25851452350616455, "step": 2635, "valid_targets_mean": 5124.8, "valid_targets_min": 554 }, { "epoch": 4.244372990353698, "grad_norm": 0.4730526302752391, "learning_rate": 1.61119570219598e-05, "loss": 0.2109, "loss_nan_ranks": 0, "loss_rank_avg": 0.20996221899986267, "step": 2640, "valid_targets_mean": 5915.9, "valid_targets_min": 1928 }, { "epoch": 4.252411575562701, "grad_norm": 0.5118058577341814, "learning_rate": 1.6033334649263298e-05, "loss": 0.2131, "loss_nan_ranks": 0, "loss_rank_avg": 0.21130703389644623, "step": 2645, "valid_targets_mean": 5496.5, "valid_targets_min": 822 }, { "epoch": 4.260450160771704, "grad_norm": 0.43776478494746524, "learning_rate": 1.595477603474095e-05, "loss": 0.1983, "loss_nan_ranks": 0, "loss_rank_avg": 0.18410971760749817, "step": 2650, "valid_targets_mean": 5455.0, "valid_targets_min": 1437 }, { "epoch": 4.268488745980707, "grad_norm": 0.553906016668327, "learning_rate": 1.5876282441104215e-05, "loss": 0.1908, "loss_nan_ranks": 0, "loss_rank_avg": 0.19235216081142426, "step": 2655, "valid_targets_mean": 5985.0, "valid_targets_min": 2192 }, { "epoch": 4.276527331189711, "grad_norm": 0.6277934063923197, "learning_rate": 1.5797855130019446e-05, "loss": 0.1853, "loss_nan_ranks": 0, "loss_rank_avg": 0.15879936516284943, "step": 2660, "valid_targets_mean": 5623.4, "valid_targets_min": 2064 }, { "epoch": 4.284565916398714, "grad_norm": 0.4175500519205594, "learning_rate": 1.5719495362087615e-05, "loss": 0.2037, "loss_nan_ranks": 0, "loss_rank_avg": 0.20981422066688538, "step": 2665, "valid_targets_mean": 6973.8, "valid_targets_min": 2993 }, { "epoch": 4.292604501607717, "grad_norm": 0.4837942057875352, "learning_rate": 1.5641204396824026e-05, "loss": 0.203, "loss_nan_ranks": 0, "loss_rank_avg": 0.19984592497348785, "step": 2670, "valid_targets_mean": 4973.3, "valid_targets_min": 1122 }, { "epoch": 4.30064308681672, "grad_norm": 0.47079344745028745, "learning_rate": 1.556298349263809e-05, "loss": 0.1814, "loss_nan_ranks": 0, "loss_rank_avg": 0.1954348385334015, "step": 2675, "valid_targets_mean": 4884.9, "valid_targets_min": 449 }, { "epoch": 4.308681672025724, "grad_norm": 0.4594060901178028, "learning_rate": 1.5484833906813078e-05, "loss": 0.1866, "loss_nan_ranks": 0, "loss_rank_avg": 0.20647072792053223, "step": 2680, "valid_targets_mean": 5675.9, "valid_targets_min": 2232 }, { "epoch": 4.316720257234727, "grad_norm": 0.4600805545978283, "learning_rate": 1.5406756895485952e-05, "loss": 0.1971, "loss_nan_ranks": 0, "loss_rank_avg": 0.1757199764251709, "step": 2685, "valid_targets_mean": 6161.0, "valid_targets_min": 1423 }, { "epoch": 4.32475884244373, "grad_norm": 0.5361149346307585, "learning_rate": 1.5328753713627114e-05, "loss": 0.1973, "loss_nan_ranks": 0, "loss_rank_avg": 0.21314969658851624, "step": 2690, "valid_targets_mean": 5107.5, "valid_targets_min": 417 }, { "epoch": 4.332797427652733, "grad_norm": 0.4734201902427743, "learning_rate": 1.5250825615020314e-05, "loss": 0.2053, "loss_nan_ranks": 0, "loss_rank_avg": 0.2571180462837219, "step": 2695, "valid_targets_mean": 5717.2, "valid_targets_min": 514 }, { "epoch": 4.340836012861736, "grad_norm": 0.4384177489194904, "learning_rate": 1.5172973852242403e-05, "loss": 0.2102, "loss_nan_ranks": 0, "loss_rank_avg": 0.20939810574054718, "step": 2700, "valid_targets_mean": 6299.3, "valid_targets_min": 420 }, { "epoch": 4.34887459807074, "grad_norm": 0.4467839595052828, "learning_rate": 1.509519967664327e-05, "loss": 0.1959, "loss_nan_ranks": 0, "loss_rank_avg": 0.1935369223356247, "step": 2705, "valid_targets_mean": 6261.8, "valid_targets_min": 797 }, { "epoch": 4.356913183279743, "grad_norm": 0.43951166680518067, "learning_rate": 1.5017504338325724e-05, "loss": 0.1863, "loss_nan_ranks": 0, "loss_rank_avg": 0.17829066514968872, "step": 2710, "valid_targets_mean": 6320.8, "valid_targets_min": 4167 }, { "epoch": 4.364951768488746, "grad_norm": 0.5046374117946685, "learning_rate": 1.4939889086125354e-05, "loss": 0.1999, "loss_nan_ranks": 0, "loss_rank_avg": 0.2184838503599167, "step": 2715, "valid_targets_mean": 5021.6, "valid_targets_min": 2023 }, { "epoch": 4.372990353697749, "grad_norm": 0.47236424146260997, "learning_rate": 1.486235516759051e-05, "loss": 0.1959, "loss_nan_ranks": 0, "loss_rank_avg": 0.2101278305053711, "step": 2720, "valid_targets_mean": 4985.7, "valid_targets_min": 1302 }, { "epoch": 4.381028938906752, "grad_norm": 0.5296494215008, "learning_rate": 1.47849038289622e-05, "loss": 0.1815, "loss_nan_ranks": 0, "loss_rank_avg": 0.19631826877593994, "step": 2725, "valid_targets_mean": 4830.1, "valid_targets_min": 1901 }, { "epoch": 4.389067524115756, "grad_norm": 0.46328346813912447, "learning_rate": 1.4707536315154105e-05, "loss": 0.2174, "loss_nan_ranks": 0, "loss_rank_avg": 0.23391112685203552, "step": 2730, "valid_targets_mean": 6091.8, "valid_targets_min": 889 }, { "epoch": 4.397106109324759, "grad_norm": 0.49549169831142276, "learning_rate": 1.4630253869732538e-05, "loss": 0.1994, "loss_nan_ranks": 0, "loss_rank_avg": 0.2387903928756714, "step": 2735, "valid_targets_mean": 5893.7, "valid_targets_min": 2805 }, { "epoch": 4.405144694533762, "grad_norm": 0.5005618204176583, "learning_rate": 1.4553057734896485e-05, "loss": 0.1977, "loss_nan_ranks": 0, "loss_rank_avg": 0.19630920886993408, "step": 2740, "valid_targets_mean": 5303.3, "valid_targets_min": 458 }, { "epoch": 4.413183279742765, "grad_norm": 0.5071861848546898, "learning_rate": 1.4475949151457576e-05, "loss": 0.2091, "loss_nan_ranks": 0, "loss_rank_avg": 0.18431368470191956, "step": 2745, "valid_targets_mean": 5103.1, "valid_targets_min": 1717 }, { "epoch": 4.421221864951768, "grad_norm": 0.5717407040608831, "learning_rate": 1.4398929358820232e-05, "loss": 0.1958, "loss_nan_ranks": 0, "loss_rank_avg": 0.18112431466579437, "step": 2750, "valid_targets_mean": 5726.4, "valid_targets_min": 2752 }, { "epoch": 4.429260450160772, "grad_norm": 0.44976048990233286, "learning_rate": 1.4321999594961668e-05, "loss": 0.2165, "loss_nan_ranks": 0, "loss_rank_avg": 0.24178093671798706, "step": 2755, "valid_targets_mean": 6700.8, "valid_targets_min": 2324 }, { "epoch": 4.437299035369775, "grad_norm": 0.4753927161894043, "learning_rate": 1.4245161096412038e-05, "loss": 0.2013, "loss_nan_ranks": 0, "loss_rank_avg": 0.20099860429763794, "step": 2760, "valid_targets_mean": 5602.4, "valid_targets_min": 2348 }, { "epoch": 4.445337620578778, "grad_norm": 0.5209267732228876, "learning_rate": 1.4168415098234523e-05, "loss": 0.1996, "loss_nan_ranks": 0, "loss_rank_avg": 0.22852633893489838, "step": 2765, "valid_targets_mean": 5029.3, "valid_targets_min": 763 }, { "epoch": 4.453376205787781, "grad_norm": 0.486708199841311, "learning_rate": 1.4091762834005512e-05, "loss": 0.1921, "loss_nan_ranks": 0, "loss_rank_avg": 0.21605432033538818, "step": 2770, "valid_targets_mean": 6792.0, "valid_targets_min": 2662 }, { "epoch": 4.461414790996785, "grad_norm": 0.5015486523699413, "learning_rate": 1.401520553579476e-05, "loss": 0.1811, "loss_nan_ranks": 0, "loss_rank_avg": 0.19634661078453064, "step": 2775, "valid_targets_mean": 4970.1, "valid_targets_min": 2616 }, { "epoch": 4.469453376205788, "grad_norm": 0.47213874742476397, "learning_rate": 1.3938744434145597e-05, "loss": 0.1892, "loss_nan_ranks": 0, "loss_rank_avg": 0.17870403826236725, "step": 2780, "valid_targets_mean": 5548.0, "valid_targets_min": 1732 }, { "epoch": 4.477491961414791, "grad_norm": 0.48798130419819413, "learning_rate": 1.386238075805513e-05, "loss": 0.2016, "loss_nan_ranks": 0, "loss_rank_avg": 0.21423214673995972, "step": 2785, "valid_targets_mean": 5585.7, "valid_targets_min": 2704 }, { "epoch": 4.485530546623794, "grad_norm": 0.43853079491526586, "learning_rate": 1.3786115734954482e-05, "loss": 0.1847, "loss_nan_ranks": 0, "loss_rank_avg": 0.16943836212158203, "step": 2790, "valid_targets_mean": 5543.2, "valid_targets_min": 2570 }, { "epoch": 4.493569131832797, "grad_norm": 0.4318067748827032, "learning_rate": 1.3709950590689099e-05, "loss": 0.1891, "loss_nan_ranks": 0, "loss_rank_avg": 0.20014822483062744, "step": 2795, "valid_targets_mean": 6038.9, "valid_targets_min": 2778 }, { "epoch": 4.501607717041801, "grad_norm": 0.5234018992311159, "learning_rate": 1.3633886549499016e-05, "loss": 0.1981, "loss_nan_ranks": 0, "loss_rank_avg": 0.18016895651817322, "step": 2800, "valid_targets_mean": 5694.5, "valid_targets_min": 2535 }, { "epoch": 4.509646302250804, "grad_norm": 0.48964885396418867, "learning_rate": 1.3557924833999192e-05, "loss": 0.198, "loss_nan_ranks": 0, "loss_rank_avg": 0.22023364901542664, "step": 2805, "valid_targets_mean": 5295.1, "valid_targets_min": 1017 }, { "epoch": 4.517684887459807, "grad_norm": 0.47778416704363436, "learning_rate": 1.3482066665159845e-05, "loss": 0.2006, "loss_nan_ranks": 0, "loss_rank_avg": 0.2275695502758026, "step": 2810, "valid_targets_mean": 5627.1, "valid_targets_min": 2083 }, { "epoch": 4.52572347266881, "grad_norm": 0.49092993021320624, "learning_rate": 1.3406313262286845e-05, "loss": 0.1826, "loss_nan_ranks": 0, "loss_rank_avg": 0.1840728521347046, "step": 2815, "valid_targets_mean": 4954.2, "valid_targets_min": 2803 }, { "epoch": 4.533762057877814, "grad_norm": 0.4928580565982705, "learning_rate": 1.333066584300211e-05, "loss": 0.2041, "loss_nan_ranks": 0, "loss_rank_avg": 0.19534510374069214, "step": 2820, "valid_targets_mean": 5510.9, "valid_targets_min": 2471 }, { "epoch": 4.541800643086817, "grad_norm": 0.4417672881758802, "learning_rate": 1.3255125623224025e-05, "loss": 0.1984, "loss_nan_ranks": 0, "loss_rank_avg": 0.19574567675590515, "step": 2825, "valid_targets_mean": 6772.1, "valid_targets_min": 816 }, { "epoch": 4.54983922829582, "grad_norm": 0.4770904638690074, "learning_rate": 1.317969381714791e-05, "loss": 0.1992, "loss_nan_ranks": 0, "loss_rank_avg": 0.18321281671524048, "step": 2830, "valid_targets_mean": 5458.4, "valid_targets_min": 794 }, { "epoch": 4.557877813504823, "grad_norm": 0.6085685008276643, "learning_rate": 1.3104371637226483e-05, "loss": 0.1928, "loss_nan_ranks": 0, "loss_rank_avg": 0.22217214107513428, "step": 2835, "valid_targets_mean": 4775.9, "valid_targets_min": 780 }, { "epoch": 4.565916398713826, "grad_norm": 0.4838109854552672, "learning_rate": 1.30291602941504e-05, "loss": 0.2043, "loss_nan_ranks": 0, "loss_rank_avg": 0.19242960214614868, "step": 2840, "valid_targets_mean": 5120.0, "valid_targets_min": 1543 }, { "epoch": 4.57395498392283, "grad_norm": 0.5494698222405994, "learning_rate": 1.2954060996828783e-05, "loss": 0.2018, "loss_nan_ranks": 0, "loss_rank_avg": 0.2533257007598877, "step": 2845, "valid_targets_mean": 4385.7, "valid_targets_min": 669 }, { "epoch": 4.581993569131833, "grad_norm": 0.5485921989290943, "learning_rate": 1.2879074952369787e-05, "loss": 0.1983, "loss_nan_ranks": 0, "loss_rank_avg": 0.211238831281662, "step": 2850, "valid_targets_mean": 4155.8, "valid_targets_min": 969 }, { "epoch": 4.590032154340836, "grad_norm": 0.5041645016380173, "learning_rate": 1.280420336606118e-05, "loss": 0.1852, "loss_nan_ranks": 0, "loss_rank_avg": 0.20651057362556458, "step": 2855, "valid_targets_mean": 5091.2, "valid_targets_min": 974 }, { "epoch": 4.598070739549839, "grad_norm": 0.5242677107999061, "learning_rate": 1.272944744135101e-05, "loss": 0.1984, "loss_nan_ranks": 0, "loss_rank_avg": 0.17013058066368103, "step": 2860, "valid_targets_mean": 4655.6, "valid_targets_min": 904 }, { "epoch": 4.606109324758842, "grad_norm": 0.4816881362793337, "learning_rate": 1.265480837982823e-05, "loss": 0.2006, "loss_nan_ranks": 0, "loss_rank_avg": 0.16162796318531036, "step": 2865, "valid_targets_mean": 5032.6, "valid_targets_min": 2480 }, { "epoch": 4.614147909967846, "grad_norm": 0.5595574344139143, "learning_rate": 1.2580287381203395e-05, "loss": 0.1836, "loss_nan_ranks": 0, "loss_rank_avg": 0.19007542729377747, "step": 2870, "valid_targets_mean": 5541.3, "valid_targets_min": 2562 }, { "epoch": 4.622186495176849, "grad_norm": 0.5162023822041768, "learning_rate": 1.2505885643289376e-05, "loss": 0.1943, "loss_nan_ranks": 0, "loss_rank_avg": 0.2073974907398224, "step": 2875, "valid_targets_mean": 5048.6, "valid_targets_min": 914 }, { "epoch": 4.630225080385852, "grad_norm": 0.4295671718244202, "learning_rate": 1.2431604361982097e-05, "loss": 0.1971, "loss_nan_ranks": 0, "loss_rank_avg": 0.15762320160865784, "step": 2880, "valid_targets_mean": 5443.6, "valid_targets_min": 2303 }, { "epoch": 4.638263665594855, "grad_norm": 0.436533185299774, "learning_rate": 1.2357444731241341e-05, "loss": 0.186, "loss_nan_ranks": 0, "loss_rank_avg": 0.1579321324825287, "step": 2885, "valid_targets_mean": 5016.8, "valid_targets_min": 1380 }, { "epoch": 4.646302250803858, "grad_norm": 0.45315199666744377, "learning_rate": 1.2283407943071527e-05, "loss": 0.1958, "loss_nan_ranks": 0, "loss_rank_avg": 0.21414679288864136, "step": 2890, "valid_targets_mean": 6171.1, "valid_targets_min": 681 }, { "epoch": 4.654340836012862, "grad_norm": 0.45840997399289807, "learning_rate": 1.2209495187502591e-05, "loss": 0.194, "loss_nan_ranks": 0, "loss_rank_avg": 0.21173666417598724, "step": 2895, "valid_targets_mean": 6205.8, "valid_targets_min": 2671 }, { "epoch": 4.662379421221865, "grad_norm": 1.241580962067996, "learning_rate": 1.213570765257078e-05, "loss": 0.2024, "loss_nan_ranks": 0, "loss_rank_avg": 0.18394725024700165, "step": 2900, "valid_targets_mean": 5422.6, "valid_targets_min": 718 }, { "epoch": 4.670418006430868, "grad_norm": 0.4701730532716653, "learning_rate": 1.2062046524299662e-05, "loss": 0.1893, "loss_nan_ranks": 0, "loss_rank_avg": 0.21215137839317322, "step": 2905, "valid_targets_mean": 6072.1, "valid_targets_min": 3793 }, { "epoch": 4.678456591639871, "grad_norm": 0.47514186818883347, "learning_rate": 1.1988512986680977e-05, "loss": 0.2067, "loss_nan_ranks": 0, "loss_rank_avg": 0.26547539234161377, "step": 2910, "valid_targets_mean": 7249.2, "valid_targets_min": 2544 }, { "epoch": 4.686495176848875, "grad_norm": 0.5245596550859682, "learning_rate": 1.1915108221655646e-05, "loss": 0.1964, "loss_nan_ranks": 0, "loss_rank_avg": 0.1955907642841339, "step": 2915, "valid_targets_mean": 5297.4, "valid_targets_min": 964 }, { "epoch": 4.694533762057878, "grad_norm": 0.5750733791368552, "learning_rate": 1.1841833409094775e-05, "loss": 0.1887, "loss_nan_ranks": 0, "loss_rank_avg": 0.19828759133815765, "step": 2920, "valid_targets_mean": 4593.1, "valid_targets_min": 355 }, { "epoch": 4.702572347266881, "grad_norm": 0.46946293076584145, "learning_rate": 1.1768689726780652e-05, "loss": 0.1819, "loss_nan_ranks": 0, "loss_rank_avg": 0.15981552004814148, "step": 2925, "valid_targets_mean": 5449.8, "valid_targets_min": 3162 }, { "epoch": 4.710610932475884, "grad_norm": 0.4567632066199438, "learning_rate": 1.1695678350387864e-05, "loss": 0.2027, "loss_nan_ranks": 0, "loss_rank_avg": 0.15649572014808655, "step": 2930, "valid_targets_mean": 5421.6, "valid_targets_min": 509 }, { "epoch": 4.718649517684888, "grad_norm": 0.46216431003159764, "learning_rate": 1.1622800453464387e-05, "loss": 0.1998, "loss_nan_ranks": 0, "loss_rank_avg": 0.209588423371315, "step": 2935, "valid_targets_mean": 5569.3, "valid_targets_min": 2531 }, { "epoch": 4.726688102893891, "grad_norm": 0.46962991061066467, "learning_rate": 1.1550057207412704e-05, "loss": 0.188, "loss_nan_ranks": 0, "loss_rank_avg": 0.16872183978557587, "step": 2940, "valid_targets_mean": 4777.9, "valid_targets_min": 2288 }, { "epoch": 4.734726688102894, "grad_norm": 0.4695838498589093, "learning_rate": 1.1477449781470975e-05, "loss": 0.2025, "loss_nan_ranks": 0, "loss_rank_avg": 0.21210195124149323, "step": 2945, "valid_targets_mean": 5874.9, "valid_targets_min": 1490 }, { "epoch": 4.742765273311897, "grad_norm": 0.5184365125355269, "learning_rate": 1.1404979342694271e-05, "loss": 0.213, "loss_nan_ranks": 0, "loss_rank_avg": 0.2304067313671112, "step": 2950, "valid_targets_mean": 5133.4, "valid_targets_min": 1612 }, { "epoch": 4.7508038585209, "grad_norm": 0.5906947681279004, "learning_rate": 1.1332647055935815e-05, "loss": 0.1967, "loss_nan_ranks": 0, "loss_rank_avg": 0.1860680878162384, "step": 2955, "valid_targets_mean": 5155.0, "valid_targets_min": 2688 }, { "epoch": 4.758842443729904, "grad_norm": 0.4759457622901129, "learning_rate": 1.1260454083828219e-05, "loss": 0.2126, "loss_nan_ranks": 0, "loss_rank_avg": 0.17885443568229675, "step": 2960, "valid_targets_mean": 4640.9, "valid_targets_min": 351 }, { "epoch": 4.766881028938907, "grad_norm": 0.46334565950112583, "learning_rate": 1.118840158676484e-05, "loss": 0.2065, "loss_nan_ranks": 0, "loss_rank_avg": 0.22456106543540955, "step": 2965, "valid_targets_mean": 5932.4, "valid_targets_min": 1003 }, { "epoch": 4.77491961414791, "grad_norm": 0.5024862102855205, "learning_rate": 1.1116490722881084e-05, "loss": 0.2039, "loss_nan_ranks": 0, "loss_rank_avg": 0.20128870010375977, "step": 2970, "valid_targets_mean": 5589.7, "valid_targets_min": 686 }, { "epoch": 4.782958199356913, "grad_norm": 0.5640048243597826, "learning_rate": 1.1044722648035844e-05, "loss": 0.2095, "loss_nan_ranks": 0, "loss_rank_avg": 0.16415663063526154, "step": 2975, "valid_targets_mean": 4988.2, "valid_targets_min": 683 }, { "epoch": 4.790996784565916, "grad_norm": 0.5068459771538669, "learning_rate": 1.0973098515792886e-05, "loss": 0.1953, "loss_nan_ranks": 0, "loss_rank_avg": 0.21549053490161896, "step": 2980, "valid_targets_mean": 4673.6, "valid_targets_min": 1088 }, { "epoch": 4.79903536977492, "grad_norm": 0.4441531212030373, "learning_rate": 1.090161947740231e-05, "loss": 0.2163, "loss_nan_ranks": 0, "loss_rank_avg": 0.21432173252105713, "step": 2985, "valid_targets_mean": 6529.7, "valid_targets_min": 2107 }, { "epoch": 4.807073954983923, "grad_norm": 0.4824083142982788, "learning_rate": 1.0830286681782058e-05, "loss": 0.2046, "loss_nan_ranks": 0, "loss_rank_avg": 0.17304901778697968, "step": 2990, "valid_targets_mean": 5721.2, "valid_targets_min": 3087 }, { "epoch": 4.815112540192926, "grad_norm": 0.4674232061795263, "learning_rate": 1.0759101275499436e-05, "loss": 0.1923, "loss_nan_ranks": 0, "loss_rank_avg": 0.1900356411933899, "step": 2995, "valid_targets_mean": 5728.6, "valid_targets_min": 274 }, { "epoch": 4.823151125401929, "grad_norm": 0.5691216186327724, "learning_rate": 1.0688064402752682e-05, "loss": 0.2097, "loss_nan_ranks": 0, "loss_rank_avg": 0.2550208270549774, "step": 3000, "valid_targets_mean": 5726.8, "valid_targets_min": 335 }, { "epoch": 4.831189710610932, "grad_norm": 0.45136375661997785, "learning_rate": 1.0617177205352599e-05, "loss": 0.2128, "loss_nan_ranks": 0, "loss_rank_avg": 0.23120132088661194, "step": 3005, "valid_targets_mean": 6514.9, "valid_targets_min": 2901 }, { "epoch": 4.839228295819936, "grad_norm": 0.4677445143572103, "learning_rate": 1.0546440822704161e-05, "loss": 0.1874, "loss_nan_ranks": 0, "loss_rank_avg": 0.16181737184524536, "step": 3010, "valid_targets_mean": 5833.4, "valid_targets_min": 2259 }, { "epoch": 4.847266881028939, "grad_norm": 0.4303599978006847, "learning_rate": 1.047585639178824e-05, "loss": 0.2153, "loss_nan_ranks": 0, "loss_rank_avg": 0.19590692222118378, "step": 3015, "valid_targets_mean": 6491.2, "valid_targets_min": 2829 }, { "epoch": 4.855305466237942, "grad_norm": 0.4968455190517692, "learning_rate": 1.0405425047143306e-05, "loss": 0.2097, "loss_nan_ranks": 0, "loss_rank_avg": 0.19899852573871613, "step": 3020, "valid_targets_mean": 4808.4, "valid_targets_min": 1306 }, { "epoch": 4.863344051446945, "grad_norm": 0.44258897347035453, "learning_rate": 1.0335147920847195e-05, "loss": 0.1965, "loss_nan_ranks": 0, "loss_rank_avg": 0.16738440096378326, "step": 3025, "valid_targets_mean": 6046.5, "valid_targets_min": 335 }, { "epoch": 4.871382636655948, "grad_norm": 0.4258283265646621, "learning_rate": 1.0265026142498931e-05, "loss": 0.1968, "loss_nan_ranks": 0, "loss_rank_avg": 0.17937082052230835, "step": 3030, "valid_targets_mean": 6212.4, "valid_targets_min": 424 }, { "epoch": 4.879421221864952, "grad_norm": 0.4400634408990787, "learning_rate": 1.0195060839200509e-05, "loss": 0.1885, "loss_nan_ranks": 0, "loss_rank_avg": 0.16629022359848022, "step": 3035, "valid_targets_mean": 5804.9, "valid_targets_min": 1181 }, { "epoch": 4.887459807073955, "grad_norm": 0.42872797950189373, "learning_rate": 1.0125253135538884e-05, "loss": 0.2127, "loss_nan_ranks": 0, "loss_rank_avg": 0.2543446123600006, "step": 3040, "valid_targets_mean": 7248.3, "valid_targets_min": 2207 }, { "epoch": 4.895498392282958, "grad_norm": 1.4172639399354463, "learning_rate": 1.0055604153567797e-05, "loss": 0.2012, "loss_nan_ranks": 0, "loss_rank_avg": 0.21109551191329956, "step": 3045, "valid_targets_mean": 4353.4, "valid_targets_min": 954 }, { "epoch": 4.903536977491961, "grad_norm": 0.516041539017509, "learning_rate": 9.98611501278979e-06, "loss": 0.1932, "loss_nan_ranks": 0, "loss_rank_avg": 0.21019768714904785, "step": 3050, "valid_targets_mean": 5650.9, "valid_targets_min": 2814 }, { "epoch": 4.911575562700965, "grad_norm": 0.48566131713136484, "learning_rate": 9.916786830138179e-06, "loss": 0.209, "loss_nan_ranks": 0, "loss_rank_avg": 0.2410656213760376, "step": 3055, "valid_targets_mean": 5875.2, "valid_targets_min": 2784 }, { "epoch": 4.919614147909968, "grad_norm": 0.46141499765797606, "learning_rate": 9.847620719959142e-06, "loss": 0.2079, "loss_nan_ranks": 0, "loss_rank_avg": 0.19822564721107483, "step": 3060, "valid_targets_mean": 6029.5, "valid_targets_min": 1188 }, { "epoch": 4.927652733118971, "grad_norm": 0.4994533341956204, "learning_rate": 9.77861779399377e-06, "loss": 0.2011, "loss_nan_ranks": 0, "loss_rank_avg": 0.18340840935707092, "step": 3065, "valid_targets_mean": 5793.5, "valid_targets_min": 419 }, { "epoch": 4.935691318327974, "grad_norm": 0.4787179730500465, "learning_rate": 9.709779161360238e-06, "loss": 0.1997, "loss_nan_ranks": 0, "loss_rank_avg": 0.1906869113445282, "step": 3070, "valid_targets_mean": 5818.4, "valid_targets_min": 1802 }, { "epoch": 4.943729903536978, "grad_norm": 0.49507384669911486, "learning_rate": 9.641105928535935e-06, "loss": 0.1881, "loss_nan_ranks": 0, "loss_rank_avg": 0.1777634173631668, "step": 3075, "valid_targets_mean": 5820.6, "valid_targets_min": 1582 }, { "epoch": 4.951768488745981, "grad_norm": 0.5046231532831364, "learning_rate": 9.572599199339685e-06, "loss": 0.2217, "loss_nan_ranks": 0, "loss_rank_avg": 0.16210362315177917, "step": 3080, "valid_targets_mean": 4660.9, "valid_targets_min": 2346 }, { "epoch": 4.959807073954984, "grad_norm": 0.4659755600893732, "learning_rate": 9.50426007491404e-06, "loss": 0.1901, "loss_nan_ranks": 0, "loss_rank_avg": 0.20857881009578705, "step": 3085, "valid_targets_mean": 5818.4, "valid_targets_min": 2268 }, { "epoch": 4.967845659163987, "grad_norm": 0.43079763715355324, "learning_rate": 9.436089653707546e-06, "loss": 0.2028, "loss_nan_ranks": 0, "loss_rank_avg": 0.2077915072441101, "step": 3090, "valid_targets_mean": 6538.9, "valid_targets_min": 1969 }, { "epoch": 4.97588424437299, "grad_norm": 0.44859465981547175, "learning_rate": 9.368089031457099e-06, "loss": 0.1858, "loss_nan_ranks": 0, "loss_rank_avg": 0.1704615354537964, "step": 3095, "valid_targets_mean": 5725.5, "valid_targets_min": 671 }, { "epoch": 4.983922829581994, "grad_norm": 0.5131061791485555, "learning_rate": 9.30025930117034e-06, "loss": 0.2014, "loss_nan_ranks": 0, "loss_rank_avg": 0.20215710997581482, "step": 3100, "valid_targets_mean": 4396.8, "valid_targets_min": 1779 }, { "epoch": 4.991961414790997, "grad_norm": 0.46330324395499967, "learning_rate": 9.23260155310807e-06, "loss": 0.2038, "loss_nan_ranks": 0, "loss_rank_avg": 0.19142061471939087, "step": 3105, "valid_targets_mean": 5785.6, "valid_targets_min": 1052 }, { "epoch": 5.0, "grad_norm": 0.46419646695644273, "learning_rate": 9.165116874766739e-06, "loss": 0.1928, "loss_nan_ranks": 0, "loss_rank_avg": 0.21007190644741058, "step": 3110, "valid_targets_mean": 5836.8, "valid_targets_min": 699 }, { "epoch": 5.008038585209003, "grad_norm": 0.4979445134634955, "learning_rate": 9.097806350860963e-06, "loss": 0.1796, "loss_nan_ranks": 0, "loss_rank_avg": 0.15829969942569733, "step": 3115, "valid_targets_mean": 4624.7, "valid_targets_min": 2507 }, { "epoch": 5.016077170418006, "grad_norm": 0.4866122349627383, "learning_rate": 9.03067106330608e-06, "loss": 0.1842, "loss_nan_ranks": 0, "loss_rank_avg": 0.1525759994983673, "step": 3120, "valid_targets_mean": 4143.9, "valid_targets_min": 449 }, { "epoch": 5.02411575562701, "grad_norm": 0.5275864662151682, "learning_rate": 8.963712091200776e-06, "loss": 0.1848, "loss_nan_ranks": 0, "loss_rank_avg": 0.17857800424098969, "step": 3125, "valid_targets_mean": 4387.2, "valid_targets_min": 1658 }, { "epoch": 5.032154340836013, "grad_norm": 0.46221163971498497, "learning_rate": 8.896930510809729e-06, "loss": 0.182, "loss_nan_ranks": 0, "loss_rank_avg": 0.18663164973258972, "step": 3130, "valid_targets_mean": 5841.6, "valid_targets_min": 2836 }, { "epoch": 5.040192926045016, "grad_norm": 0.5585973033774798, "learning_rate": 8.83032739554631e-06, "loss": 0.1798, "loss_nan_ranks": 0, "loss_rank_avg": 0.21429578959941864, "step": 3135, "valid_targets_mean": 5289.9, "valid_targets_min": 700 }, { "epoch": 5.048231511254019, "grad_norm": 0.48266689854920847, "learning_rate": 8.763903815955343e-06, "loss": 0.172, "loss_nan_ranks": 0, "loss_rank_avg": 0.18342766165733337, "step": 3140, "valid_targets_mean": 5663.1, "valid_targets_min": 671 }, { "epoch": 5.056270096463023, "grad_norm": 0.47856495871810556, "learning_rate": 8.69766083969586e-06, "loss": 0.1825, "loss_nan_ranks": 0, "loss_rank_avg": 0.1659879833459854, "step": 3145, "valid_targets_mean": 5181.4, "valid_targets_min": 1288 }, { "epoch": 5.064308681672026, "grad_norm": 0.4583945660599572, "learning_rate": 8.631599531523984e-06, "loss": 0.1953, "loss_nan_ranks": 0, "loss_rank_avg": 0.19702893495559692, "step": 3150, "valid_targets_mean": 6398.4, "valid_targets_min": 2277 }, { "epoch": 5.072347266881029, "grad_norm": 0.4778149367767458, "learning_rate": 8.565720953275812e-06, "loss": 0.1894, "loss_nan_ranks": 0, "loss_rank_avg": 0.21160531044006348, "step": 3155, "valid_targets_mean": 5688.0, "valid_targets_min": 2206 }, { "epoch": 5.080385852090032, "grad_norm": 0.5457542785844479, "learning_rate": 8.500026163850305e-06, "loss": 0.1752, "loss_nan_ranks": 0, "loss_rank_avg": 0.19538471102714539, "step": 3160, "valid_targets_mean": 5499.2, "valid_targets_min": 2174 }, { "epoch": 5.088424437299035, "grad_norm": 0.47663165704336896, "learning_rate": 8.434516219192322e-06, "loss": 0.2003, "loss_nan_ranks": 0, "loss_rank_avg": 0.21058623492717743, "step": 3165, "valid_targets_mean": 6227.2, "valid_targets_min": 705 }, { "epoch": 5.096463022508039, "grad_norm": 0.5270713782036919, "learning_rate": 8.369192172275582e-06, "loss": 0.2081, "loss_nan_ranks": 0, "loss_rank_avg": 0.21326503157615662, "step": 3170, "valid_targets_mean": 5780.4, "valid_targets_min": 946 }, { "epoch": 5.104501607717042, "grad_norm": 0.47972931998923163, "learning_rate": 8.304055073085815e-06, "loss": 0.1726, "loss_nan_ranks": 0, "loss_rank_avg": 0.1448415368795395, "step": 3175, "valid_targets_mean": 4978.8, "valid_targets_min": 574 }, { "epoch": 5.112540192926045, "grad_norm": 0.5339301964753969, "learning_rate": 8.239105968603824e-06, "loss": 0.1822, "loss_nan_ranks": 0, "loss_rank_avg": 0.21358755230903625, "step": 3180, "valid_targets_mean": 5267.1, "valid_targets_min": 2349 }, { "epoch": 5.120578778135048, "grad_norm": 0.43894080846451544, "learning_rate": 8.174345902788712e-06, "loss": 0.1685, "loss_nan_ranks": 0, "loss_rank_avg": 0.13934409618377686, "step": 3185, "valid_targets_mean": 5794.8, "valid_targets_min": 3113 }, { "epoch": 5.128617363344051, "grad_norm": 0.4377305756613267, "learning_rate": 8.109775916561026e-06, "loss": 0.1753, "loss_nan_ranks": 0, "loss_rank_avg": 0.1634282022714615, "step": 3190, "valid_targets_mean": 6257.9, "valid_targets_min": 2573 }, { "epoch": 5.136655948553055, "grad_norm": 0.5100917432819688, "learning_rate": 8.045397047786103e-06, "loss": 0.2099, "loss_nan_ranks": 0, "loss_rank_avg": 0.18037614226341248, "step": 3195, "valid_targets_mean": 6120.2, "valid_targets_min": 1045 }, { "epoch": 5.144694533762058, "grad_norm": 0.4857411122320573, "learning_rate": 7.981210331257336e-06, "loss": 0.1756, "loss_nan_ranks": 0, "loss_rank_avg": 0.15463681519031525, "step": 3200, "valid_targets_mean": 4595.8, "valid_targets_min": 2333 }, { "epoch": 5.152733118971061, "grad_norm": 0.46626013958080015, "learning_rate": 7.917216798679575e-06, "loss": 0.2031, "loss_nan_ranks": 0, "loss_rank_avg": 0.2193758636713028, "step": 3205, "valid_targets_mean": 6617.2, "valid_targets_min": 1900 }, { "epoch": 5.160771704180064, "grad_norm": 0.6986387448162077, "learning_rate": 7.853417478652516e-06, "loss": 0.1865, "loss_nan_ranks": 0, "loss_rank_avg": 0.20716939866542816, "step": 3210, "valid_targets_mean": 5879.0, "valid_targets_min": 2331 }, { "epoch": 5.168810289389068, "grad_norm": 0.5316897024374411, "learning_rate": 7.78981339665419e-06, "loss": 0.1849, "loss_nan_ranks": 0, "loss_rank_avg": 0.17304065823554993, "step": 3215, "valid_targets_mean": 4310.8, "valid_targets_min": 628 }, { "epoch": 5.176848874598071, "grad_norm": 1.0402816301379194, "learning_rate": 7.72640557502446e-06, "loss": 0.1913, "loss_nan_ranks": 0, "loss_rank_avg": 0.18185323476791382, "step": 3220, "valid_targets_mean": 6621.9, "valid_targets_min": 2137 }, { "epoch": 5.184887459807074, "grad_norm": 0.5077283321168016, "learning_rate": 7.663195032948612e-06, "loss": 0.1937, "loss_nan_ranks": 0, "loss_rank_avg": 0.19564370810985565, "step": 3225, "valid_targets_mean": 5012.2, "valid_targets_min": 344 }, { "epoch": 5.192926045016077, "grad_norm": 0.4449974444997836, "learning_rate": 7.6001827864409574e-06, "loss": 0.1745, "loss_nan_ranks": 0, "loss_rank_avg": 0.19020414352416992, "step": 3230, "valid_targets_mean": 6730.3, "valid_targets_min": 2373 }, { "epoch": 5.20096463022508, "grad_norm": 0.45674780734397, "learning_rate": 7.537369848328482e-06, "loss": 0.1832, "loss_nan_ranks": 0, "loss_rank_avg": 0.19216638803482056, "step": 3235, "valid_targets_mean": 6425.2, "valid_targets_min": 3486 }, { "epoch": 5.209003215434084, "grad_norm": 0.5432545315748706, "learning_rate": 7.474757228234626e-06, "loss": 0.1889, "loss_nan_ranks": 0, "loss_rank_avg": 0.21978577971458435, "step": 3240, "valid_targets_mean": 4865.6, "valid_targets_min": 274 }, { "epoch": 5.217041800643087, "grad_norm": 0.4461775961777822, "learning_rate": 7.412345932562997e-06, "loss": 0.1916, "loss_nan_ranks": 0, "loss_rank_avg": 0.16950002312660217, "step": 3245, "valid_targets_mean": 5934.8, "valid_targets_min": 2995 }, { "epoch": 5.22508038585209, "grad_norm": 0.4956785865612323, "learning_rate": 7.350136964481218e-06, "loss": 0.1762, "loss_nan_ranks": 0, "loss_rank_avg": 0.16553393006324768, "step": 3250, "valid_targets_mean": 4609.6, "valid_targets_min": 831 }, { "epoch": 5.233118971061093, "grad_norm": 0.478657006339967, "learning_rate": 7.288131323904812e-06, "loss": 0.1764, "loss_nan_ranks": 0, "loss_rank_avg": 0.17582754790782928, "step": 3255, "valid_targets_mean": 5341.8, "valid_targets_min": 3220 }, { "epoch": 5.241157556270096, "grad_norm": 0.48870709583594846, "learning_rate": 7.2263300074810925e-06, "loss": 0.2078, "loss_nan_ranks": 0, "loss_rank_avg": 0.2231275886297226, "step": 3260, "valid_targets_mean": 5515.4, "valid_targets_min": 2141 }, { "epoch": 5.2491961414791, "grad_norm": 0.5538754582625227, "learning_rate": 7.164734008573186e-06, "loss": 0.1982, "loss_nan_ranks": 0, "loss_rank_avg": 0.19707731902599335, "step": 3265, "valid_targets_mean": 6562.5, "valid_targets_min": 3759 }, { "epoch": 5.257234726688103, "grad_norm": 0.4983801668294154, "learning_rate": 7.103344317244065e-06, "loss": 0.1733, "loss_nan_ranks": 0, "loss_rank_avg": 0.18967768549919128, "step": 3270, "valid_targets_mean": 5918.1, "valid_targets_min": 2175 }, { "epoch": 5.265273311897106, "grad_norm": 0.4586010946247427, "learning_rate": 7.0421619202406e-06, "loss": 0.1801, "loss_nan_ranks": 0, "loss_rank_avg": 0.18738381564617157, "step": 3275, "valid_targets_mean": 6154.1, "valid_targets_min": 2023 }, { "epoch": 5.273311897106109, "grad_norm": 0.48811893275730395, "learning_rate": 6.981187800977706e-06, "loss": 0.1899, "loss_nan_ranks": 0, "loss_rank_avg": 0.18499714136123657, "step": 3280, "valid_targets_mean": 5491.1, "valid_targets_min": 1459 }, { "epoch": 5.281350482315113, "grad_norm": 0.5268803552811097, "learning_rate": 6.920422939522573e-06, "loss": 0.1892, "loss_nan_ranks": 0, "loss_rank_avg": 0.19314301013946533, "step": 3285, "valid_targets_mean": 4503.8, "valid_targets_min": 686 }, { "epoch": 5.289389067524116, "grad_norm": 0.46419450029948367, "learning_rate": 6.859868312578865e-06, "loss": 0.1766, "loss_nan_ranks": 0, "loss_rank_avg": 0.17092689871788025, "step": 3290, "valid_targets_mean": 6016.6, "valid_targets_min": 2676 }, { "epoch": 5.297427652733119, "grad_norm": 0.5047867299066612, "learning_rate": 6.799524893471055e-06, "loss": 0.2097, "loss_nan_ranks": 0, "loss_rank_avg": 0.18408851325511932, "step": 3295, "valid_targets_mean": 4765.6, "valid_targets_min": 955 }, { "epoch": 5.305466237942122, "grad_norm": 0.4638194012764823, "learning_rate": 6.739393652128776e-06, "loss": 0.1973, "loss_nan_ranks": 0, "loss_rank_avg": 0.17362159490585327, "step": 3300, "valid_targets_mean": 5807.0, "valid_targets_min": 2695 }, { "epoch": 5.313504823151125, "grad_norm": 0.518671277988672, "learning_rate": 6.679475555071198e-06, "loss": 0.1901, "loss_nan_ranks": 0, "loss_rank_avg": 0.1955638825893402, "step": 3305, "valid_targets_mean": 4877.8, "valid_targets_min": 3273 }, { "epoch": 5.321543408360129, "grad_norm": 0.4312127415985306, "learning_rate": 6.619771565391535e-06, "loss": 0.2005, "loss_nan_ranks": 0, "loss_rank_avg": 0.1737706959247589, "step": 3310, "valid_targets_mean": 6052.8, "valid_targets_min": 525 }, { "epoch": 5.329581993569132, "grad_norm": 0.4577678581026521, "learning_rate": 6.560282642741544e-06, "loss": 0.1737, "loss_nan_ranks": 0, "loss_rank_avg": 0.17677032947540283, "step": 3315, "valid_targets_mean": 5634.6, "valid_targets_min": 2590 }, { "epoch": 5.337620578778135, "grad_norm": 0.47138237498351343, "learning_rate": 6.501009743316105e-06, "loss": 0.1948, "loss_nan_ranks": 0, "loss_rank_avg": 0.20099903643131256, "step": 3320, "valid_targets_mean": 5851.9, "valid_targets_min": 2074 }, { "epoch": 5.345659163987138, "grad_norm": 0.4598019513900346, "learning_rate": 6.441953819837845e-06, "loss": 0.1992, "loss_nan_ranks": 0, "loss_rank_avg": 0.18965350091457367, "step": 3325, "valid_targets_mean": 6094.8, "valid_targets_min": 2205 }, { "epoch": 5.353697749196142, "grad_norm": 0.483304158605293, "learning_rate": 6.383115821541834e-06, "loss": 0.201, "loss_nan_ranks": 0, "loss_rank_avg": 0.22649700939655304, "step": 3330, "valid_targets_mean": 5885.5, "valid_targets_min": 2844 }, { "epoch": 5.361736334405145, "grad_norm": 0.4779634450187073, "learning_rate": 6.324496694160318e-06, "loss": 0.1955, "loss_nan_ranks": 0, "loss_rank_avg": 0.21910080313682556, "step": 3335, "valid_targets_mean": 5985.5, "valid_targets_min": 2095 }, { "epoch": 5.369774919614148, "grad_norm": 0.5067078850486267, "learning_rate": 6.266097379907534e-06, "loss": 0.1849, "loss_nan_ranks": 0, "loss_rank_avg": 0.17074373364448547, "step": 3340, "valid_targets_mean": 5271.4, "valid_targets_min": 818 }, { "epoch": 5.377813504823151, "grad_norm": 0.5595730160635201, "learning_rate": 6.2079188174645335e-06, "loss": 0.2064, "loss_nan_ranks": 0, "loss_rank_avg": 0.22083780169487, "step": 3345, "valid_targets_mean": 6631.5, "valid_targets_min": 1702 }, { "epoch": 5.385852090032154, "grad_norm": 0.5656540952095462, "learning_rate": 6.149961941964122e-06, "loss": 0.1902, "loss_nan_ranks": 0, "loss_rank_avg": 0.2227296233177185, "step": 3350, "valid_targets_mean": 4248.2, "valid_targets_min": 726 }, { "epoch": 5.393890675241158, "grad_norm": 0.4504085084825842, "learning_rate": 6.09222768497584e-06, "loss": 0.2097, "loss_nan_ranks": 0, "loss_rank_avg": 0.17969395220279694, "step": 3355, "valid_targets_mean": 6162.1, "valid_targets_min": 509 }, { "epoch": 5.401929260450161, "grad_norm": 0.5146997355757669, "learning_rate": 6.034716974490953e-06, "loss": 0.1999, "loss_nan_ranks": 0, "loss_rank_avg": 0.24291618168354034, "step": 3360, "valid_targets_mean": 5900.8, "valid_targets_min": 3057 }, { "epoch": 5.409967845659164, "grad_norm": 0.5351421245212054, "learning_rate": 5.977430734907559e-06, "loss": 0.1839, "loss_nan_ranks": 0, "loss_rank_avg": 0.18290022015571594, "step": 3365, "valid_targets_mean": 5167.9, "valid_targets_min": 755 }, { "epoch": 5.418006430868167, "grad_norm": 0.5014907743840198, "learning_rate": 5.9203698870157114e-06, "loss": 0.1849, "loss_nan_ranks": 0, "loss_rank_avg": 0.2125318944454193, "step": 3370, "valid_targets_mean": 6113.8, "valid_targets_min": 1147 }, { "epoch": 5.42604501607717, "grad_norm": 0.47556758623766643, "learning_rate": 5.863535347982645e-06, "loss": 0.1867, "loss_nan_ranks": 0, "loss_rank_avg": 0.20354855060577393, "step": 3375, "valid_targets_mean": 6618.1, "valid_targets_min": 3805 }, { "epoch": 5.434083601286174, "grad_norm": 0.49228060520233496, "learning_rate": 5.806928031338015e-06, "loss": 0.188, "loss_nan_ranks": 0, "loss_rank_avg": 0.1746979057788849, "step": 3380, "valid_targets_mean": 5142.9, "valid_targets_min": 343 }, { "epoch": 5.442122186495177, "grad_norm": 0.4658584374183205, "learning_rate": 5.750548846959234e-06, "loss": 0.1823, "loss_nan_ranks": 0, "loss_rank_avg": 0.18658800423145294, "step": 3385, "valid_targets_mean": 5597.9, "valid_targets_min": 1719 }, { "epoch": 5.45016077170418, "grad_norm": 0.46391846520510605, "learning_rate": 5.694398701056801e-06, "loss": 0.1747, "loss_nan_ranks": 0, "loss_rank_avg": 0.165060892701149, "step": 3390, "valid_targets_mean": 5311.4, "valid_targets_min": 683 }, { "epoch": 5.458199356913183, "grad_norm": 0.46640745139708, "learning_rate": 5.638478496159791e-06, "loss": 0.1809, "loss_nan_ranks": 0, "loss_rank_avg": 0.22248056530952454, "step": 3395, "valid_targets_mean": 7049.8, "valid_targets_min": 2341 }, { "epoch": 5.466237942122186, "grad_norm": 0.488353156536436, "learning_rate": 5.5827891311013185e-06, "loss": 0.1999, "loss_nan_ranks": 0, "loss_rank_avg": 0.22211244702339172, "step": 3400, "valid_targets_mean": 5960.9, "valid_targets_min": 2687 }, { "epoch": 5.47427652733119, "grad_norm": 0.5126088033141332, "learning_rate": 5.52733150100409e-06, "loss": 0.1935, "loss_nan_ranks": 0, "loss_rank_avg": 0.20660114288330078, "step": 3405, "valid_targets_mean": 5240.8, "valid_targets_min": 359 }, { "epoch": 5.482315112540193, "grad_norm": 0.4838482712196251, "learning_rate": 5.472106497266023e-06, "loss": 0.1963, "loss_nan_ranks": 0, "loss_rank_avg": 0.17103157937526703, "step": 3410, "valid_targets_mean": 5297.1, "valid_targets_min": 355 }, { "epoch": 5.490353697749196, "grad_norm": 0.4984237613144674, "learning_rate": 5.417115007545921e-06, "loss": 0.193, "loss_nan_ranks": 0, "loss_rank_avg": 0.22633609175682068, "step": 3415, "valid_targets_mean": 6094.9, "valid_targets_min": 904 }, { "epoch": 5.498392282958199, "grad_norm": 0.523636320883912, "learning_rate": 5.362357915749194e-06, "loss": 0.2048, "loss_nan_ranks": 0, "loss_rank_avg": 0.21240352094173431, "step": 3420, "valid_targets_mean": 4989.8, "valid_targets_min": 2961 }, { "epoch": 5.506430868167203, "grad_norm": 0.48044513730538596, "learning_rate": 5.307836102013666e-06, "loss": 0.19, "loss_nan_ranks": 0, "loss_rank_avg": 0.15104694664478302, "step": 3425, "valid_targets_mean": 5328.5, "valid_targets_min": 1807 }, { "epoch": 5.514469453376206, "grad_norm": 0.4751176561827757, "learning_rate": 5.2535504426954145e-06, "loss": 0.1936, "loss_nan_ranks": 0, "loss_rank_avg": 0.22195205092430115, "step": 3430, "valid_targets_mean": 6118.9, "valid_targets_min": 594 }, { "epoch": 5.522508038585209, "grad_norm": 0.48516517392290076, "learning_rate": 5.199501810354692e-06, "loss": 0.1741, "loss_nan_ranks": 0, "loss_rank_avg": 0.15345501899719238, "step": 3435, "valid_targets_mean": 5330.9, "valid_targets_min": 2513 }, { "epoch": 5.530546623794212, "grad_norm": 0.5121095480216645, "learning_rate": 5.145691073741898e-06, "loss": 0.1905, "loss_nan_ranks": 0, "loss_rank_avg": 0.18172189593315125, "step": 3440, "valid_targets_mean": 4640.0, "valid_targets_min": 1492 }, { "epoch": 5.538585209003215, "grad_norm": 0.49530201825529846, "learning_rate": 5.092119097783621e-06, "loss": 0.1875, "loss_nan_ranks": 0, "loss_rank_avg": 0.18862499296665192, "step": 3445, "valid_targets_mean": 6436.6, "valid_targets_min": 2814 }, { "epoch": 5.546623794212219, "grad_norm": 0.49091742317146175, "learning_rate": 5.0387867435687265e-06, "loss": 0.2009, "loss_nan_ranks": 0, "loss_rank_avg": 0.20091378688812256, "step": 3450, "valid_targets_mean": 5780.8, "valid_targets_min": 3062 }, { "epoch": 5.554662379421222, "grad_norm": 0.4462477186654765, "learning_rate": 4.9856948683345255e-06, "loss": 0.1797, "loss_nan_ranks": 0, "loss_rank_avg": 0.1533946990966797, "step": 3455, "valid_targets_mean": 5978.1, "valid_targets_min": 1061 }, { "epoch": 5.562700964630225, "grad_norm": 0.5033789822369987, "learning_rate": 4.9328443254529765e-06, "loss": 0.1842, "loss_nan_ranks": 0, "loss_rank_avg": 0.17586976289749146, "step": 3460, "valid_targets_mean": 5279.8, "valid_targets_min": 2018 }, { "epoch": 5.570739549839228, "grad_norm": 0.4705676576038694, "learning_rate": 4.880235964417009e-06, "loss": 0.1854, "loss_nan_ranks": 0, "loss_rank_avg": 0.17664816975593567, "step": 3465, "valid_targets_mean": 5694.1, "valid_targets_min": 2373 }, { "epoch": 5.578778135048232, "grad_norm": 0.47218177649090964, "learning_rate": 4.827870630826826e-06, "loss": 0.1796, "loss_nan_ranks": 0, "loss_rank_avg": 0.16814285516738892, "step": 3470, "valid_targets_mean": 5590.7, "valid_targets_min": 2212 }, { "epoch": 5.586816720257235, "grad_norm": 0.48717963339489373, "learning_rate": 4.775749166376342e-06, "loss": 0.1962, "loss_nan_ranks": 0, "loss_rank_avg": 0.1970927119255066, "step": 3475, "valid_targets_mean": 5571.5, "valid_targets_min": 3288 }, { "epoch": 5.594855305466238, "grad_norm": 0.4948032769777901, "learning_rate": 4.723872408839623e-06, "loss": 0.1927, "loss_nan_ranks": 0, "loss_rank_avg": 0.21700280904769897, "step": 3480, "valid_targets_mean": 5748.1, "valid_targets_min": 872 }, { "epoch": 5.602893890675241, "grad_norm": 0.4284945969590602, "learning_rate": 4.672241192057456e-06, "loss": 0.1985, "loss_nan_ranks": 0, "loss_rank_avg": 0.1854320764541626, "step": 3485, "valid_targets_mean": 6890.2, "valid_targets_min": 4311 }, { "epoch": 5.610932475884244, "grad_norm": 0.5279346730463442, "learning_rate": 4.620856345923928e-06, "loss": 0.1805, "loss_nan_ranks": 0, "loss_rank_avg": 0.15860424935817719, "step": 3490, "valid_targets_mean": 5110.0, "valid_targets_min": 2205 }, { "epoch": 5.618971061093248, "grad_norm": 0.48080273997531287, "learning_rate": 4.56971869637308e-06, "loss": 0.1789, "loss_nan_ranks": 0, "loss_rank_avg": 0.18217507004737854, "step": 3495, "valid_targets_mean": 5349.5, "valid_targets_min": 1174 }, { "epoch": 5.627009646302251, "grad_norm": 0.47073465398426945, "learning_rate": 4.518829065365664e-06, "loss": 0.1734, "loss_nan_ranks": 0, "loss_rank_avg": 0.18675915896892548, "step": 3500, "valid_targets_mean": 5757.6, "valid_targets_min": 3083 }, { "epoch": 5.635048231511254, "grad_norm": 0.49790647435675167, "learning_rate": 4.468188270875873e-06, "loss": 0.1776, "loss_nan_ranks": 0, "loss_rank_avg": 0.16006457805633545, "step": 3505, "valid_targets_mean": 5294.3, "valid_targets_min": 576 }, { "epoch": 5.643086816720257, "grad_norm": 0.4831653661292901, "learning_rate": 4.417797126878247e-06, "loss": 0.1707, "loss_nan_ranks": 0, "loss_rank_avg": 0.17651981115341187, "step": 3510, "valid_targets_mean": 5286.9, "valid_targets_min": 466 }, { "epoch": 5.65112540192926, "grad_norm": 0.43558748477821085, "learning_rate": 4.367656443334574e-06, "loss": 0.1937, "loss_nan_ranks": 0, "loss_rank_avg": 0.19159835577011108, "step": 3515, "valid_targets_mean": 5938.7, "valid_targets_min": 1799 }, { "epoch": 5.659163987138264, "grad_norm": 0.4302587876871802, "learning_rate": 4.317767026180854e-06, "loss": 0.1959, "loss_nan_ranks": 0, "loss_rank_avg": 0.172641783952713, "step": 3520, "valid_targets_mean": 6267.8, "valid_targets_min": 3421 }, { "epoch": 5.667202572347267, "grad_norm": 0.6167202636928861, "learning_rate": 4.26812967731437e-06, "loss": 0.2008, "loss_nan_ranks": 0, "loss_rank_avg": 0.2416028082370758, "step": 3525, "valid_targets_mean": 5056.8, "valid_targets_min": 297 }, { "epoch": 5.67524115755627, "grad_norm": 0.4939602441719698, "learning_rate": 4.218745194580778e-06, "loss": 0.1866, "loss_nan_ranks": 0, "loss_rank_avg": 0.21441826224327087, "step": 3530, "valid_targets_mean": 5435.4, "valid_targets_min": 1059 }, { "epoch": 5.683279742765273, "grad_norm": 0.4756465888695026, "learning_rate": 4.169614371761299e-06, "loss": 0.1933, "loss_nan_ranks": 0, "loss_rank_avg": 0.16448351740837097, "step": 3535, "valid_targets_mean": 5683.4, "valid_targets_min": 2153 }, { "epoch": 5.691318327974276, "grad_norm": 0.48743402946073533, "learning_rate": 4.120737998559945e-06, "loss": 0.2004, "loss_nan_ranks": 0, "loss_rank_avg": 0.1667463630437851, "step": 3540, "valid_targets_mean": 6335.8, "valid_targets_min": 2521 }, { "epoch": 5.69935691318328, "grad_norm": 0.5120939404906634, "learning_rate": 4.07211686059084e-06, "loss": 0.1837, "loss_nan_ranks": 0, "loss_rank_avg": 0.19326308369636536, "step": 3545, "valid_targets_mean": 5092.7, "valid_targets_min": 856 }, { "epoch": 5.707395498392283, "grad_norm": 0.5632246626673505, "learning_rate": 4.023751739365583e-06, "loss": 0.1821, "loss_nan_ranks": 0, "loss_rank_avg": 0.20783701539039612, "step": 3550, "valid_targets_mean": 4398.4, "valid_targets_min": 786 }, { "epoch": 5.715434083601286, "grad_norm": 0.586002529442884, "learning_rate": 3.975643412280687e-06, "loss": 0.1932, "loss_nan_ranks": 0, "loss_rank_avg": 0.18774420022964478, "step": 3555, "valid_targets_mean": 4162.2, "valid_targets_min": 449 }, { "epoch": 5.723472668810289, "grad_norm": 0.449918412147885, "learning_rate": 3.9277926526050915e-06, "loss": 0.1905, "loss_nan_ranks": 0, "loss_rank_avg": 0.21148762106895447, "step": 3560, "valid_targets_mean": 6406.3, "valid_targets_min": 2032 }, { "epoch": 5.731511254019293, "grad_norm": 0.5102625262179785, "learning_rate": 3.8802002294677295e-06, "loss": 0.1924, "loss_nan_ranks": 0, "loss_rank_avg": 0.2425631582736969, "step": 3565, "valid_targets_mean": 5427.5, "valid_targets_min": 453 }, { "epoch": 5.739549839228296, "grad_norm": 0.39393512706795425, "learning_rate": 3.8328669078451454e-06, "loss": 0.1802, "loss_nan_ranks": 0, "loss_rank_avg": 0.16832399368286133, "step": 3570, "valid_targets_mean": 7606.4, "valid_targets_min": 4314 }, { "epoch": 5.747588424437299, "grad_norm": 0.4840682615333142, "learning_rate": 3.7857934485492308e-06, "loss": 0.1948, "loss_nan_ranks": 0, "loss_rank_avg": 0.16461750864982605, "step": 3575, "valid_targets_mean": 5850.2, "valid_targets_min": 2446 }, { "epoch": 5.755627009646302, "grad_norm": 0.48701845226790647, "learning_rate": 3.738980608214988e-06, "loss": 0.1982, "loss_nan_ranks": 0, "loss_rank_avg": 0.2235550880432129, "step": 3580, "valid_targets_mean": 5985.8, "valid_targets_min": 1647 }, { "epoch": 5.763665594855306, "grad_norm": 0.4915821728484182, "learning_rate": 3.6924291392883537e-06, "loss": 0.2026, "loss_nan_ranks": 0, "loss_rank_avg": 0.1905771791934967, "step": 3585, "valid_targets_mean": 5496.2, "valid_targets_min": 407 }, { "epoch": 5.771704180064309, "grad_norm": 0.5265224188216318, "learning_rate": 3.646139790014114e-06, "loss": 0.2002, "loss_nan_ranks": 0, "loss_rank_avg": 0.1957128345966339, "step": 3590, "valid_targets_mean": 5012.4, "valid_targets_min": 1706 }, { "epoch": 5.779742765273312, "grad_norm": 0.45450286343018304, "learning_rate": 3.6001133044238646e-06, "loss": 0.1822, "loss_nan_ranks": 0, "loss_rank_avg": 0.22709839046001434, "step": 3595, "valid_targets_mean": 7698.6, "valid_targets_min": 2364 }, { "epoch": 5.787781350482315, "grad_norm": 0.47530926294274556, "learning_rate": 3.554350422324082e-06, "loss": 0.1922, "loss_nan_ranks": 0, "loss_rank_avg": 0.1802034229040146, "step": 3600, "valid_targets_mean": 5487.3, "valid_targets_min": 977 }, { "epoch": 5.795819935691318, "grad_norm": 0.601663523973185, "learning_rate": 3.5088518792841986e-06, "loss": 0.186, "loss_nan_ranks": 0, "loss_rank_avg": 0.20563310384750366, "step": 3605, "valid_targets_mean": 4071.0, "valid_targets_min": 955 }, { "epoch": 5.803858520900322, "grad_norm": 0.5048571767634144, "learning_rate": 3.463618406624816e-06, "loss": 0.178, "loss_nan_ranks": 0, "loss_rank_avg": 0.1549883484840393, "step": 3610, "valid_targets_mean": 5174.1, "valid_targets_min": 828 }, { "epoch": 5.811897106109325, "grad_norm": 0.5393411182416932, "learning_rate": 3.418650731405897e-06, "loss": 0.201, "loss_nan_ranks": 0, "loss_rank_avg": 0.16713210940361023, "step": 3615, "valid_targets_mean": 5148.2, "valid_targets_min": 1475 }, { "epoch": 5.819935691318328, "grad_norm": 0.5925366852450519, "learning_rate": 3.373949576415132e-06, "loss": 0.1991, "loss_nan_ranks": 0, "loss_rank_avg": 0.19236284494400024, "step": 3620, "valid_targets_mean": 4236.4, "valid_targets_min": 417 }, { "epoch": 5.827974276527331, "grad_norm": 0.4981596093711268, "learning_rate": 3.329515660156297e-06, "loss": 0.1988, "loss_nan_ranks": 0, "loss_rank_avg": 0.2149473875761032, "step": 3625, "valid_targets_mean": 4993.6, "valid_targets_min": 1612 }, { "epoch": 5.836012861736334, "grad_norm": 0.43691243542885205, "learning_rate": 3.2853496968377054e-06, "loss": 0.1885, "loss_nan_ranks": 0, "loss_rank_avg": 0.1537531167268753, "step": 3630, "valid_targets_mean": 5682.8, "valid_targets_min": 355 }, { "epoch": 5.844051446945338, "grad_norm": 0.5038024496320214, "learning_rate": 3.2414523963607313e-06, "loss": 0.2012, "loss_nan_ranks": 0, "loss_rank_avg": 0.19316399097442627, "step": 3635, "valid_targets_mean": 5242.4, "valid_targets_min": 268 }, { "epoch": 5.852090032154341, "grad_norm": 0.48583257296181714, "learning_rate": 3.1978244643083944e-06, "loss": 0.1948, "loss_nan_ranks": 0, "loss_rank_avg": 0.1713036298751831, "step": 3640, "valid_targets_mean": 5449.9, "valid_targets_min": 793 }, { "epoch": 5.860128617363344, "grad_norm": 0.5008462037330859, "learning_rate": 3.1544666019340274e-06, "loss": 0.1689, "loss_nan_ranks": 0, "loss_rank_avg": 0.1978035867214203, "step": 3645, "valid_targets_mean": 6283.9, "valid_targets_min": 2974 }, { "epoch": 5.868167202572347, "grad_norm": 0.4767464107670729, "learning_rate": 3.1113795061499985e-06, "loss": 0.1747, "loss_nan_ranks": 0, "loss_rank_avg": 0.1628812849521637, "step": 3650, "valid_targets_mean": 5884.2, "valid_targets_min": 1504 }, { "epoch": 5.87620578778135, "grad_norm": 0.5560475071125592, "learning_rate": 3.068563869516512e-06, "loss": 0.1944, "loss_nan_ranks": 0, "loss_rank_avg": 0.17907622456550598, "step": 3655, "valid_targets_mean": 3833.8, "valid_targets_min": 398 }, { "epoch": 5.884244372990354, "grad_norm": 0.7011000684899574, "learning_rate": 3.026020380230461e-06, "loss": 0.1961, "loss_nan_ranks": 0, "loss_rank_avg": 0.1727597713470459, "step": 3660, "valid_targets_mean": 5416.0, "valid_targets_min": 505 }, { "epoch": 5.892282958199357, "grad_norm": 0.5018255589278392, "learning_rate": 2.983749722114404e-06, "loss": 0.2058, "loss_nan_ranks": 0, "loss_rank_avg": 0.21103069186210632, "step": 3665, "valid_targets_mean": 6098.8, "valid_targets_min": 546 }, { "epoch": 5.90032154340836, "grad_norm": 0.4685610942564552, "learning_rate": 2.941752574605534e-06, "loss": 0.1803, "loss_nan_ranks": 0, "loss_rank_avg": 0.18297003209590912, "step": 3670, "valid_targets_mean": 6018.0, "valid_targets_min": 2116 }, { "epoch": 5.908360128617363, "grad_norm": 0.4933707589439783, "learning_rate": 2.900029612744777e-06, "loss": 0.196, "loss_nan_ranks": 0, "loss_rank_avg": 0.2093782275915146, "step": 3675, "valid_targets_mean": 5958.1, "valid_targets_min": 1882 }, { "epoch": 5.916398713826366, "grad_norm": 0.465397474042975, "learning_rate": 2.8585815071659274e-06, "loss": 0.1856, "loss_nan_ranks": 0, "loss_rank_avg": 0.13250520825386047, "step": 3680, "valid_targets_mean": 5000.4, "valid_targets_min": 256 }, { "epoch": 5.92443729903537, "grad_norm": 0.4861895013069857, "learning_rate": 2.8174089240848923e-06, "loss": 0.1875, "loss_nan_ranks": 0, "loss_rank_avg": 0.17181509733200073, "step": 3685, "valid_targets_mean": 5327.6, "valid_targets_min": 964 }, { "epoch": 5.932475884244373, "grad_norm": 0.4822977088482712, "learning_rate": 2.776512525288959e-06, "loss": 0.1828, "loss_nan_ranks": 0, "loss_rank_avg": 0.18289127945899963, "step": 3690, "valid_targets_mean": 5464.9, "valid_targets_min": 1861 }, { "epoch": 5.940514469453376, "grad_norm": 0.5287623887945523, "learning_rate": 2.7358929681261836e-06, "loss": 0.1847, "loss_nan_ranks": 0, "loss_rank_avg": 0.1922057718038559, "step": 3695, "valid_targets_mean": 4948.4, "valid_targets_min": 804 }, { "epoch": 5.948553054662379, "grad_norm": 0.48382172273456314, "learning_rate": 2.695550905494797e-06, "loss": 0.1903, "loss_nan_ranks": 0, "loss_rank_avg": 0.15750959515571594, "step": 3700, "valid_targets_mean": 4836.6, "valid_targets_min": 1302 }, { "epoch": 5.956591639871383, "grad_norm": 0.5233715291485577, "learning_rate": 2.655486985832718e-06, "loss": 0.1805, "loss_nan_ranks": 0, "loss_rank_avg": 0.18856148421764374, "step": 3705, "valid_targets_mean": 5918.6, "valid_targets_min": 636 }, { "epoch": 5.964630225080386, "grad_norm": 0.48717200725467924, "learning_rate": 2.615701853107149e-06, "loss": 0.202, "loss_nan_ranks": 0, "loss_rank_avg": 0.22136838734149933, "step": 3710, "valid_targets_mean": 5422.0, "valid_targets_min": 2412 }, { "epoch": 5.972668810289389, "grad_norm": 0.48597064916098776, "learning_rate": 2.576196146804204e-06, "loss": 0.1754, "loss_nan_ranks": 0, "loss_rank_avg": 0.14957702159881592, "step": 3715, "valid_targets_mean": 4877.0, "valid_targets_min": 726 }, { "epoch": 5.980707395498392, "grad_norm": 0.452012801780017, "learning_rate": 2.536970501918643e-06, "loss": 0.1757, "loss_nan_ranks": 0, "loss_rank_avg": 0.15257996320724487, "step": 3720, "valid_targets_mean": 5929.3, "valid_targets_min": 514 }, { "epoch": 5.988745980707396, "grad_norm": 0.483217937140563, "learning_rate": 2.4980255489436565e-06, "loss": 0.1997, "loss_nan_ranks": 0, "loss_rank_avg": 0.20844154059886932, "step": 3725, "valid_targets_mean": 5669.2, "valid_targets_min": 1328 }, { "epoch": 5.996784565916399, "grad_norm": 0.4724190619750239, "learning_rate": 2.459361913860736e-06, "loss": 0.1843, "loss_nan_ranks": 0, "loss_rank_avg": 0.1832464635372162, "step": 3730, "valid_targets_mean": 5815.4, "valid_targets_min": 2576 }, { "epoch": 6.004823151125402, "grad_norm": 0.83317522207539, "learning_rate": 2.4209802181296136e-06, "loss": 0.1736, "loss_nan_ranks": 0, "loss_rank_avg": 0.1619970053434372, "step": 3735, "valid_targets_mean": 5549.2, "valid_targets_min": 964 }, { "epoch": 6.012861736334405, "grad_norm": 0.5154255877325745, "learning_rate": 2.3828810786782674e-06, "loss": 0.1965, "loss_nan_ranks": 0, "loss_rank_avg": 0.1856580525636673, "step": 3740, "valid_targets_mean": 5616.6, "valid_targets_min": 1732 }, { "epoch": 6.020900321543408, "grad_norm": 0.49816618610731805, "learning_rate": 2.34506510789301e-06, "loss": 0.1982, "loss_nan_ranks": 0, "loss_rank_avg": 0.18047022819519043, "step": 3745, "valid_targets_mean": 5633.9, "valid_targets_min": 2586 }, { "epoch": 6.028938906752412, "grad_norm": 0.6550527611073069, "learning_rate": 2.3075329136086434e-06, "loss": 0.1808, "loss_nan_ranks": 0, "loss_rank_avg": 0.17386046051979065, "step": 3750, "valid_targets_mean": 5468.9, "valid_targets_min": 457 }, { "epoch": 6.036977491961415, "grad_norm": 0.47279868176005735, "learning_rate": 2.2702850990986924e-06, "loss": 0.1827, "loss_nan_ranks": 0, "loss_rank_avg": 0.1906416267156601, "step": 3755, "valid_targets_mean": 6038.7, "valid_targets_min": 3062 }, { "epoch": 6.045016077170418, "grad_norm": 0.4933331908426635, "learning_rate": 2.2333222630657025e-06, "loss": 0.1658, "loss_nan_ranks": 0, "loss_rank_avg": 0.17692366242408752, "step": 3760, "valid_targets_mean": 5261.4, "valid_targets_min": 1379 }, { "epoch": 6.053054662379421, "grad_norm": 0.8130085639082187, "learning_rate": 2.1966449996316208e-06, "loss": 0.1826, "loss_nan_ranks": 0, "loss_rank_avg": 0.1743280589580536, "step": 3765, "valid_targets_mean": 5865.8, "valid_targets_min": 1931 }, { "epoch": 6.061093247588424, "grad_norm": 0.5466815490190559, "learning_rate": 2.1602538983282394e-06, "loss": 0.1846, "loss_nan_ranks": 0, "loss_rank_avg": 0.1809442937374115, "step": 3770, "valid_targets_mean": 6375.1, "valid_targets_min": 4224 }, { "epoch": 6.069131832797428, "grad_norm": 0.49542785389406413, "learning_rate": 2.1241495440877258e-06, "loss": 0.1898, "loss_nan_ranks": 0, "loss_rank_avg": 0.1862630546092987, "step": 3775, "valid_targets_mean": 5147.9, "valid_targets_min": 807 }, { "epoch": 6.077170418006431, "grad_norm": 0.47022987712208747, "learning_rate": 2.0883325172332357e-06, "loss": 0.1717, "loss_nan_ranks": 0, "loss_rank_avg": 0.16111014783382416, "step": 3780, "valid_targets_mean": 5491.1, "valid_targets_min": 2277 }, { "epoch": 6.085209003215434, "grad_norm": 0.47395693170698344, "learning_rate": 2.052803393469549e-06, "loss": 0.1751, "loss_nan_ranks": 0, "loss_rank_avg": 0.18137693405151367, "step": 3785, "valid_targets_mean": 5670.7, "valid_targets_min": 923 }, { "epoch": 6.093247588424437, "grad_norm": 0.48294409022389034, "learning_rate": 2.0175627438738488e-06, "loss": 0.17, "loss_nan_ranks": 0, "loss_rank_avg": 0.1723235547542572, "step": 3790, "valid_targets_mean": 5502.2, "valid_targets_min": 1221 }, { "epoch": 6.101286173633441, "grad_norm": 0.5705804543456575, "learning_rate": 1.9826111348865227e-06, "loss": 0.1768, "loss_nan_ranks": 0, "loss_rank_avg": 0.1478518843650818, "step": 3795, "valid_targets_mean": 4955.9, "valid_targets_min": 2887 }, { "epoch": 6.109324758842444, "grad_norm": 0.509692421121887, "learning_rate": 1.9479491283020714e-06, "loss": 0.1837, "loss_nan_ranks": 0, "loss_rank_avg": 0.20045389235019684, "step": 3800, "valid_targets_mean": 5041.6, "valid_targets_min": 954 }, { "epoch": 6.117363344051447, "grad_norm": 0.4866828715923054, "learning_rate": 1.913577281260066e-06, "loss": 0.1851, "loss_nan_ranks": 0, "loss_rank_avg": 0.18292544782161713, "step": 3805, "valid_targets_mean": 5632.7, "valid_targets_min": 598 }, { "epoch": 6.12540192926045, "grad_norm": 0.4863806235895185, "learning_rate": 1.8794961462362194e-06, "loss": 0.1903, "loss_nan_ranks": 0, "loss_rank_avg": 0.18915069103240967, "step": 3810, "valid_targets_mean": 5742.5, "valid_targets_min": 1890 }, { "epoch": 6.133440514469453, "grad_norm": 0.4662278512075521, "learning_rate": 1.845706271033456e-06, "loss": 0.1748, "loss_nan_ranks": 0, "loss_rank_avg": 0.16785621643066406, "step": 3815, "valid_targets_mean": 6455.1, "valid_targets_min": 2205 }, { "epoch": 6.141479099678457, "grad_norm": 0.4749251483380231, "learning_rate": 1.81220819877316e-06, "loss": 0.1848, "loss_nan_ranks": 0, "loss_rank_avg": 0.22028598189353943, "step": 3820, "valid_targets_mean": 5887.7, "valid_targets_min": 1717 }, { "epoch": 6.14951768488746, "grad_norm": 0.5277330163447275, "learning_rate": 1.7790024678864149e-06, "loss": 0.1805, "loss_nan_ranks": 0, "loss_rank_avg": 0.20545095205307007, "step": 3825, "valid_targets_mean": 5465.8, "valid_targets_min": 2498 }, { "epoch": 6.157556270096463, "grad_norm": 0.4888029274916281, "learning_rate": 1.746089612105355e-06, "loss": 0.1888, "loss_nan_ranks": 0, "loss_rank_avg": 0.17628200352191925, "step": 3830, "valid_targets_mean": 5932.9, "valid_targets_min": 2621 }, { "epoch": 6.165594855305466, "grad_norm": 0.5116352727269389, "learning_rate": 1.7134701604545934e-06, "loss": 0.1831, "loss_nan_ranks": 0, "loss_rank_avg": 0.2042563557624817, "step": 3835, "valid_targets_mean": 5198.4, "valid_targets_min": 856 }, { "epoch": 6.173633440514469, "grad_norm": 0.4919942862743339, "learning_rate": 1.6811446372427108e-06, "loss": 0.1965, "loss_nan_ranks": 0, "loss_rank_avg": 0.19126807153224945, "step": 3840, "valid_targets_mean": 5945.5, "valid_targets_min": 449 }, { "epoch": 6.181672025723473, "grad_norm": 0.4665227200564428, "learning_rate": 1.6491135620538256e-06, "loss": 0.171, "loss_nan_ranks": 0, "loss_rank_avg": 0.17806287109851837, "step": 3845, "valid_targets_mean": 5732.4, "valid_targets_min": 935 }, { "epoch": 6.189710610932476, "grad_norm": 0.463406210984963, "learning_rate": 1.6173774497392592e-06, "loss": 0.1822, "loss_nan_ranks": 0, "loss_rank_avg": 0.14907455444335938, "step": 3850, "valid_targets_mean": 5815.6, "valid_targets_min": 726 }, { "epoch": 6.197749196141479, "grad_norm": 0.5817896201740729, "learning_rate": 1.5859368104092387e-06, "loss": 0.189, "loss_nan_ranks": 0, "loss_rank_avg": 0.20796798169612885, "step": 3855, "valid_targets_mean": 4837.5, "valid_targets_min": 841 }, { "epoch": 6.205787781350482, "grad_norm": 0.4781524045532261, "learning_rate": 1.5547921494247065e-06, "loss": 0.173, "loss_nan_ranks": 0, "loss_rank_avg": 0.17145711183547974, "step": 3860, "valid_targets_mean": 6007.2, "valid_targets_min": 2405 }, { "epoch": 6.213826366559486, "grad_norm": 0.49548094344040206, "learning_rate": 1.5239439673892098e-06, "loss": 0.1877, "loss_nan_ranks": 0, "loss_rank_avg": 0.19060102105140686, "step": 3865, "valid_targets_mean": 5291.6, "valid_targets_min": 2244 }, { "epoch": 6.221864951768489, "grad_norm": 0.49834757800080803, "learning_rate": 1.4933927601408327e-06, "loss": 0.1688, "loss_nan_ranks": 0, "loss_rank_avg": 0.14511215686798096, "step": 3870, "valid_targets_mean": 4564.9, "valid_targets_min": 2297 }, { "epoch": 6.229903536977492, "grad_norm": 0.510379153220315, "learning_rate": 1.4631390187442441e-06, "loss": 0.1834, "loss_nan_ranks": 0, "loss_rank_avg": 0.17495837807655334, "step": 3875, "valid_targets_mean": 5613.2, "valid_targets_min": 3486 }, { "epoch": 6.237942122186495, "grad_norm": 0.46568643547236416, "learning_rate": 1.433183229482793e-06, "loss": 0.1895, "loss_nan_ranks": 0, "loss_rank_avg": 0.21530888974666595, "step": 3880, "valid_targets_mean": 6843.9, "valid_targets_min": 2342 }, { "epoch": 6.245980707395498, "grad_norm": 0.515917833968904, "learning_rate": 1.4035258738506908e-06, "loss": 0.1849, "loss_nan_ranks": 0, "loss_rank_avg": 0.18214061856269836, "step": 3885, "valid_targets_mean": 5141.1, "valid_targets_min": 1200 }, { "epoch": 6.254019292604502, "grad_norm": 0.5217242607576065, "learning_rate": 1.3741674285452854e-06, "loss": 0.185, "loss_nan_ranks": 0, "loss_rank_avg": 0.1475576013326645, "step": 3890, "valid_targets_mean": 5111.0, "valid_targets_min": 873 }, { "epoch": 6.262057877813505, "grad_norm": 0.4407473996704603, "learning_rate": 1.3451083654593932e-06, "loss": 0.1937, "loss_nan_ranks": 0, "loss_rank_avg": 0.21679872274398804, "step": 3895, "valid_targets_mean": 7420.8, "valid_targets_min": 3288 }, { "epoch": 6.270096463022508, "grad_norm": 0.5474233696114393, "learning_rate": 1.3163491516737104e-06, "loss": 0.1896, "loss_nan_ranks": 0, "loss_rank_avg": 0.1937793493270874, "step": 3900, "valid_targets_mean": 5128.5, "valid_targets_min": 1288 }, { "epoch": 6.278135048231511, "grad_norm": 0.48218883082894765, "learning_rate": 1.2878902494492973e-06, "loss": 0.1699, "loss_nan_ranks": 0, "loss_rank_avg": 0.17568941414356232, "step": 3905, "valid_targets_mean": 5506.8, "valid_targets_min": 1393 }, { "epoch": 6.286173633440514, "grad_norm": 0.473274067929269, "learning_rate": 1.259732116220167e-06, "loss": 0.1949, "loss_nan_ranks": 0, "loss_rank_avg": 0.18140992522239685, "step": 3910, "valid_targets_mean": 5537.2, "valid_targets_min": 594 }, { "epoch": 6.294212218649518, "grad_norm": 0.4921331038109862, "learning_rate": 1.2318752045859262e-06, "loss": 0.1817, "loss_nan_ranks": 0, "loss_rank_avg": 0.2152450680732727, "step": 3915, "valid_targets_mean": 5908.2, "valid_targets_min": 1647 }, { "epoch": 6.302250803858521, "grad_norm": 0.5159644200801217, "learning_rate": 1.204319962304492e-06, "loss": 0.2004, "loss_nan_ranks": 0, "loss_rank_avg": 0.19172531366348267, "step": 3920, "valid_targets_mean": 5150.0, "valid_targets_min": 877 }, { "epoch": 6.310289389067524, "grad_norm": 0.48083461205602324, "learning_rate": 1.1770668322849032e-06, "loss": 0.1974, "loss_nan_ranks": 0, "loss_rank_avg": 0.17192471027374268, "step": 3925, "valid_targets_mean": 5867.6, "valid_targets_min": 904 }, { "epoch": 6.318327974276527, "grad_norm": 0.49748778307814, "learning_rate": 1.1501162525801956e-06, "loss": 0.1858, "loss_nan_ranks": 0, "loss_rank_avg": 0.1800798773765564, "step": 3930, "valid_targets_mean": 5804.5, "valid_targets_min": 1475 }, { "epoch": 6.326366559485531, "grad_norm": 0.509965747323788, "learning_rate": 1.1234686563803709e-06, "loss": 0.1759, "loss_nan_ranks": 0, "loss_rank_avg": 0.17962145805358887, "step": 3935, "valid_targets_mean": 5479.6, "valid_targets_min": 2373 }, { "epoch": 6.334405144694534, "grad_norm": 0.4569426127753139, "learning_rate": 1.097124472005422e-06, "loss": 0.1805, "loss_nan_ranks": 0, "loss_rank_avg": 0.15181009471416473, "step": 3940, "valid_targets_mean": 5221.9, "valid_targets_min": 3021 }, { "epoch": 6.342443729903537, "grad_norm": 0.4827950680272922, "learning_rate": 1.0710841228984536e-06, "loss": 0.2011, "loss_nan_ranks": 0, "loss_rank_avg": 0.20170137286186218, "step": 3945, "valid_targets_mean": 5781.6, "valid_targets_min": 550 }, { "epoch": 6.35048231511254, "grad_norm": 0.7716956645165256, "learning_rate": 1.0453480276188777e-06, "loss": 0.175, "loss_nan_ranks": 0, "loss_rank_avg": 0.16286450624465942, "step": 3950, "valid_targets_mean": 4926.1, "valid_targets_min": 718 }, { "epoch": 6.358520900321543, "grad_norm": 0.5109589924706025, "learning_rate": 1.019916599835682e-06, "loss": 0.1776, "loss_nan_ranks": 0, "loss_rank_avg": 0.1650046706199646, "step": 3955, "valid_targets_mean": 5433.2, "valid_targets_min": 867 }, { "epoch": 6.366559485530547, "grad_norm": 0.4795377899307965, "learning_rate": 9.94790248320785e-07, "loss": 0.1717, "loss_nan_ranks": 0, "loss_rank_avg": 0.18109866976737976, "step": 3960, "valid_targets_mean": 5475.3, "valid_targets_min": 3093 }, { "epoch": 6.37459807073955, "grad_norm": 0.5202485003895791, "learning_rate": 9.699693769424634e-07, "loss": 0.1834, "loss_nan_ranks": 0, "loss_rank_avg": 0.1738145351409912, "step": 3965, "valid_targets_mean": 4568.5, "valid_targets_min": 686 }, { "epoch": 6.382636655948553, "grad_norm": 0.4630700661014578, "learning_rate": 9.454543846588571e-07, "loss": 0.166, "loss_nan_ranks": 0, "loss_rank_avg": 0.17738892138004303, "step": 3970, "valid_targets_mean": 6398.9, "valid_targets_min": 4449 }, { "epoch": 6.390675241157556, "grad_norm": 0.5531898311258766, "learning_rate": 9.212456655115609e-07, "loss": 0.2124, "loss_nan_ranks": 0, "loss_rank_avg": 0.23551887273788452, "step": 3975, "valid_targets_mean": 4852.2, "valid_targets_min": 872 }, { "epoch": 6.39871382636656, "grad_norm": 0.5392493230684815, "learning_rate": 8.973436086192966e-07, "loss": 0.1873, "loss_nan_ranks": 0, "loss_rank_avg": 0.20924073457717896, "step": 3980, "valid_targets_mean": 4547.6, "valid_targets_min": 681 }, { "epoch": 6.406752411575563, "grad_norm": 0.5246926009101333, "learning_rate": 8.737485981716465e-07, "loss": 0.205, "loss_nan_ranks": 0, "loss_rank_avg": 0.21452780067920685, "step": 3985, "valid_targets_mean": 5697.2, "valid_targets_min": 1800 }, { "epoch": 6.414790996784566, "grad_norm": 0.4966041907551861, "learning_rate": 8.50461013422883e-07, "loss": 0.1762, "loss_nan_ranks": 0, "loss_rank_avg": 0.18985769152641296, "step": 3990, "valid_targets_mean": 5423.9, "valid_targets_min": 371 }, { "epoch": 6.422829581993569, "grad_norm": 0.48928365103208005, "learning_rate": 8.274812286858714e-07, "loss": 0.1683, "loss_nan_ranks": 0, "loss_rank_avg": 0.16009929776191711, "step": 3995, "valid_targets_mean": 5772.6, "valid_targets_min": 368 }, { "epoch": 6.430868167202572, "grad_norm": 0.5205676594223365, "learning_rate": 8.048096133260586e-07, "loss": 0.1686, "loss_nan_ranks": 0, "loss_rank_avg": 0.18772917985916138, "step": 4000, "valid_targets_mean": 5536.8, "valid_targets_min": 664 }, { "epoch": 6.438906752411576, "grad_norm": 0.46495455507078626, "learning_rate": 7.824465317555318e-07, "loss": 0.1762, "loss_nan_ranks": 0, "loss_rank_avg": 0.15344102680683136, "step": 4005, "valid_targets_mean": 6885.2, "valid_targets_min": 712 }, { "epoch": 6.446945337620579, "grad_norm": 0.48861786608204816, "learning_rate": 7.603923434271699e-07, "loss": 0.1874, "loss_nan_ranks": 0, "loss_rank_avg": 0.2028530240058899, "step": 4010, "valid_targets_mean": 5799.2, "valid_targets_min": 2698 }, { "epoch": 6.454983922829582, "grad_norm": 0.54991147386686, "learning_rate": 7.386474028288382e-07, "loss": 0.1751, "loss_nan_ranks": 0, "loss_rank_avg": 0.18571394681930542, "step": 4015, "valid_targets_mean": 4742.5, "valid_targets_min": 1168 }, { "epoch": 6.463022508038585, "grad_norm": 0.5715790732228933, "learning_rate": 7.172120594777299e-07, "loss": 0.1844, "loss_nan_ranks": 0, "loss_rank_avg": 0.21050646901130676, "step": 4020, "valid_targets_mean": 5150.3, "valid_targets_min": 437 }, { "epoch": 6.471061093247588, "grad_norm": 0.4730497066181822, "learning_rate": 6.960866579147185e-07, "loss": 0.1781, "loss_nan_ranks": 0, "loss_rank_avg": 0.17261850833892822, "step": 4025, "valid_targets_mean": 5338.9, "valid_targets_min": 363 }, { "epoch": 6.479099678456592, "grad_norm": 0.527431227427804, "learning_rate": 6.752715376988339e-07, "loss": 0.1728, "loss_nan_ranks": 0, "loss_rank_avg": 0.18096715211868286, "step": 4030, "valid_targets_mean": 4199.8, "valid_targets_min": 1755 }, { "epoch": 6.487138263665595, "grad_norm": 0.46366935985990176, "learning_rate": 6.547670334017953e-07, "loss": 0.1908, "loss_nan_ranks": 0, "loss_rank_avg": 0.22837695479393005, "step": 4035, "valid_targets_mean": 6578.4, "valid_targets_min": 1681 }, { "epoch": 6.495176848874598, "grad_norm": 0.46722736029353956, "learning_rate": 6.345734746026466e-07, "loss": 0.1611, "loss_nan_ranks": 0, "loss_rank_avg": 0.1680130660533905, "step": 4040, "valid_targets_mean": 6325.9, "valid_targets_min": 2561 }, { "epoch": 6.503215434083601, "grad_norm": 0.5254245828058934, "learning_rate": 6.146911858824434e-07, "loss": 0.1867, "loss_nan_ranks": 0, "loss_rank_avg": 0.16261672973632812, "step": 4045, "valid_targets_mean": 4747.1, "valid_targets_min": 1026 }, { "epoch": 6.511254019292604, "grad_norm": 0.45813060973081743, "learning_rate": 5.951204868190452e-07, "loss": 0.1964, "loss_nan_ranks": 0, "loss_rank_avg": 0.16923211514949799, "step": 4050, "valid_targets_mean": 5838.7, "valid_targets_min": 411 }, { "epoch": 6.519292604501608, "grad_norm": 0.473936039803348, "learning_rate": 5.758616919819826e-07, "loss": 0.1753, "loss_nan_ranks": 0, "loss_rank_avg": 0.19065213203430176, "step": 4055, "valid_targets_mean": 5748.9, "valid_targets_min": 2534 }, { "epoch": 6.527331189710611, "grad_norm": 0.47792389668692997, "learning_rate": 5.569151109273851e-07, "loss": 0.1914, "loss_nan_ranks": 0, "loss_rank_avg": 0.19362300634384155, "step": 4060, "valid_targets_mean": 5755.1, "valid_targets_min": 2366 }, { "epoch": 6.535369774919614, "grad_norm": 0.5855563122421675, "learning_rate": 5.382810481930256e-07, "loss": 0.1806, "loss_nan_ranks": 0, "loss_rank_avg": 0.1771083027124405, "step": 4065, "valid_targets_mean": 4887.2, "valid_targets_min": 548 }, { "epoch": 6.543408360128617, "grad_norm": 0.4745893409118789, "learning_rate": 5.199598032934106e-07, "loss": 0.1778, "loss_nan_ranks": 0, "loss_rank_avg": 0.1631501466035843, "step": 4070, "valid_targets_mean": 5731.9, "valid_targets_min": 3409 }, { "epoch": 6.551446945337621, "grad_norm": 0.5161967610866468, "learning_rate": 5.019516707149685e-07, "loss": 0.1754, "loss_nan_ranks": 0, "loss_rank_avg": 0.18905222415924072, "step": 4075, "valid_targets_mean": 4795.0, "valid_targets_min": 2189 }, { "epoch": 6.559485530546624, "grad_norm": 0.802682405482379, "learning_rate": 4.84256939911325e-07, "loss": 0.1805, "loss_nan_ranks": 0, "loss_rank_avg": 0.21466057002544403, "step": 4080, "valid_targets_mean": 4320.0, "valid_targets_min": 548 }, { "epoch": 6.567524115755627, "grad_norm": 0.5031206858818378, "learning_rate": 4.6687589529863517e-07, "loss": 0.1968, "loss_nan_ranks": 0, "loss_rank_avg": 0.19306516647338867, "step": 4085, "valid_targets_mean": 5357.6, "valid_targets_min": 818 }, { "epoch": 6.57556270096463, "grad_norm": 0.5178506022576367, "learning_rate": 4.498088162510317e-07, "loss": 0.1971, "loss_nan_ranks": 0, "loss_rank_avg": 0.23467575013637543, "step": 4090, "valid_targets_mean": 5338.9, "valid_targets_min": 594 }, { "epoch": 6.583601286173634, "grad_norm": 0.5076224755919664, "learning_rate": 4.330559770961151e-07, "loss": 0.1911, "loss_nan_ranks": 0, "loss_rank_avg": 0.1578923761844635, "step": 4095, "valid_targets_mean": 4803.6, "valid_targets_min": 1802 }, { "epoch": 6.591639871382637, "grad_norm": 0.4592277887151131, "learning_rate": 4.166176471105554e-07, "loss": 0.1896, "loss_nan_ranks": 0, "loss_rank_avg": 0.15273262560367584, "step": 4100, "valid_targets_mean": 5040.8, "valid_targets_min": 1001 }, { "epoch": 6.59967845659164, "grad_norm": 0.5087668578828699, "learning_rate": 4.004940905157617e-07, "loss": 0.1744, "loss_nan_ranks": 0, "loss_rank_avg": 0.19955775141716003, "step": 4105, "valid_targets_mean": 5567.3, "valid_targets_min": 2229 }, { "epoch": 6.607717041800643, "grad_norm": 0.5439868707343057, "learning_rate": 3.8468556647363266e-07, "loss": 0.1664, "loss_nan_ranks": 0, "loss_rank_avg": 0.18226560950279236, "step": 4110, "valid_targets_mean": 5092.6, "valid_targets_min": 2403 }, { "epoch": 6.615755627009646, "grad_norm": 0.5026023766001185, "learning_rate": 3.691923290823951e-07, "loss": 0.1733, "loss_nan_ranks": 0, "loss_rank_avg": 0.18940620124340057, "step": 4115, "valid_targets_mean": 5858.8, "valid_targets_min": 2205 }, { "epoch": 6.62379421221865, "grad_norm": 0.46383552678879314, "learning_rate": 3.540146273725142e-07, "loss": 0.1848, "loss_nan_ranks": 0, "loss_rank_avg": 0.16480082273483276, "step": 4120, "valid_targets_mean": 5884.1, "valid_targets_min": 2157 }, { "epoch": 6.631832797427653, "grad_norm": 0.5348850869149254, "learning_rate": 3.391527053027033e-07, "loss": 0.1933, "loss_nan_ranks": 0, "loss_rank_avg": 0.24536944925785065, "step": 4125, "valid_targets_mean": 5093.4, "valid_targets_min": 2222 }, { "epoch": 6.639871382636656, "grad_norm": 0.4756091936153012, "learning_rate": 3.2460680175598e-07, "loss": 0.1924, "loss_nan_ranks": 0, "loss_rank_avg": 0.2090965211391449, "step": 4130, "valid_targets_mean": 6622.1, "valid_targets_min": 4223 }, { "epoch": 6.647909967845659, "grad_norm": 0.4963669522308755, "learning_rate": 3.103771505358499e-07, "loss": 0.1752, "loss_nan_ranks": 0, "loss_rank_avg": 0.1624598205089569, "step": 4135, "valid_targets_mean": 5586.9, "valid_targets_min": 2579 }, { "epoch": 6.655948553054662, "grad_norm": 0.4678741621601647, "learning_rate": 2.9646398036253575e-07, "loss": 0.1724, "loss_nan_ranks": 0, "loss_rank_avg": 0.14038006961345673, "step": 4140, "valid_targets_mean": 4843.9, "valid_targets_min": 1675 }, { "epoch": 6.663987138263666, "grad_norm": 0.47210780129474755, "learning_rate": 2.828675148693005e-07, "loss": 0.1675, "loss_nan_ranks": 0, "loss_rank_avg": 0.16181638836860657, "step": 4145, "valid_targets_mean": 5237.2, "valid_targets_min": 2943 }, { "epoch": 6.672025723472669, "grad_norm": 0.5158718099795397, "learning_rate": 2.695879725988637e-07, "loss": 0.1799, "loss_nan_ranks": 0, "loss_rank_avg": 0.1680976003408432, "step": 4150, "valid_targets_mean": 4968.0, "valid_targets_min": 486 }, { "epoch": 6.680064308681672, "grad_norm": 0.49688533024331555, "learning_rate": 2.566255669998707e-07, "loss": 0.181, "loss_nan_ranks": 0, "loss_rank_avg": 0.1574384570121765, "step": 4155, "valid_targets_mean": 4732.6, "valid_targets_min": 1495 }, { "epoch": 6.688102893890675, "grad_norm": 0.4971282543462799, "learning_rate": 2.4398050642348235e-07, "loss": 0.1722, "loss_nan_ranks": 0, "loss_rank_avg": 0.17601963877677917, "step": 4160, "valid_targets_mean": 5555.8, "valid_targets_min": 2327 }, { "epoch": 6.696141479099678, "grad_norm": 0.4679076982911688, "learning_rate": 2.3165299412001075e-07, "loss": 0.1664, "loss_nan_ranks": 0, "loss_rank_avg": 0.14313621819019318, "step": 4165, "valid_targets_mean": 5264.6, "valid_targets_min": 1180 }, { "epoch": 6.704180064308682, "grad_norm": 0.44245119575522096, "learning_rate": 2.1964322823565532e-07, "loss": 0.1563, "loss_nan_ranks": 0, "loss_rank_avg": 0.15354637801647186, "step": 4170, "valid_targets_mean": 5514.4, "valid_targets_min": 949 }, { "epoch": 6.712218649517685, "grad_norm": 0.4745054491408359, "learning_rate": 2.0795140180932982e-07, "loss": 0.1814, "loss_nan_ranks": 0, "loss_rank_avg": 0.14562906324863434, "step": 4175, "valid_targets_mean": 5620.2, "valid_targets_min": 2377 }, { "epoch": 6.720257234726688, "grad_norm": 0.47955050039844965, "learning_rate": 1.9657770276953592e-07, "loss": 0.2113, "loss_nan_ranks": 0, "loss_rank_avg": 0.24234527349472046, "step": 4180, "valid_targets_mean": 6996.8, "valid_targets_min": 1504 }, { "epoch": 6.728295819935691, "grad_norm": 0.5392328506399422, "learning_rate": 1.8552231393137e-07, "loss": 0.1834, "loss_nan_ranks": 0, "loss_rank_avg": 0.14472296833992004, "step": 4185, "valid_targets_mean": 4974.5, "valid_targets_min": 630 }, { "epoch": 6.736334405144694, "grad_norm": 0.524110682981634, "learning_rate": 1.7478541299356332e-07, "loss": 0.2014, "loss_nan_ranks": 0, "loss_rank_avg": 0.19961285591125488, "step": 4190, "valid_targets_mean": 5437.1, "valid_targets_min": 1492 }, { "epoch": 6.744372990353698, "grad_norm": 0.44822215241237556, "learning_rate": 1.6436717253563327e-07, "loss": 0.1894, "loss_nan_ranks": 0, "loss_rank_avg": 0.16462916135787964, "step": 4195, "valid_targets_mean": 6963.6, "valid_targets_min": 1612 }, { "epoch": 6.752411575562701, "grad_norm": 0.5237024825611266, "learning_rate": 1.5426776001511212e-07, "loss": 0.1819, "loss_nan_ranks": 0, "loss_rank_avg": 0.20051389932632446, "step": 4200, "valid_targets_mean": 5342.4, "valid_targets_min": 2431 }, { "epoch": 6.760450160771704, "grad_norm": 0.4934098015061834, "learning_rate": 1.444873377648537e-07, "loss": 0.1918, "loss_nan_ranks": 0, "loss_rank_avg": 0.18957063555717468, "step": 4205, "valid_targets_mean": 6711.7, "valid_targets_min": 3013 }, { "epoch": 6.768488745980707, "grad_norm": 0.5187855790783407, "learning_rate": 1.3502606299042432e-07, "loss": 0.1686, "loss_nan_ranks": 0, "loss_rank_avg": 0.16103804111480713, "step": 4210, "valid_targets_mean": 5401.3, "valid_targets_min": 2834 }, { "epoch": 6.776527331189711, "grad_norm": 0.47209865860791694, "learning_rate": 1.2588408776756933e-07, "loss": 0.1897, "loss_nan_ranks": 0, "loss_rank_avg": 0.17956702411174774, "step": 4215, "valid_targets_mean": 5800.7, "valid_targets_min": 3545 }, { "epoch": 6.784565916398714, "grad_norm": 0.4701575804504904, "learning_rate": 1.1706155903977945e-07, "loss": 0.1904, "loss_nan_ranks": 0, "loss_rank_avg": 0.20110127329826355, "step": 4220, "valid_targets_mean": 5929.1, "valid_targets_min": 2331 }, { "epoch": 6.792604501607717, "grad_norm": 0.5296390861079925, "learning_rate": 1.0855861861592376e-07, "loss": 0.197, "loss_nan_ranks": 0, "loss_rank_avg": 0.19427093863487244, "step": 4225, "valid_targets_mean": 5843.8, "valid_targets_min": 607 }, { "epoch": 6.80064308681672, "grad_norm": 0.5310412544676056, "learning_rate": 1.0037540316796713e-07, "loss": 0.1741, "loss_nan_ranks": 0, "loss_rank_avg": 0.1741572916507721, "step": 4230, "valid_targets_mean": 4511.2, "valid_targets_min": 808 }, { "epoch": 6.808681672025724, "grad_norm": 0.457276791840171, "learning_rate": 9.251204422878302e-08, "loss": 0.1804, "loss_nan_ranks": 0, "loss_rank_avg": 0.1941903531551361, "step": 4235, "valid_targets_mean": 5819.2, "valid_targets_min": 398 }, { "epoch": 6.816720257234727, "grad_norm": 0.4812323518875819, "learning_rate": 8.496866819002636e-08, "loss": 0.1795, "loss_nan_ranks": 0, "loss_rank_avg": 0.1971593052148819, "step": 4240, "valid_targets_mean": 5406.8, "valid_targets_min": 747 }, { "epoch": 6.82475884244373, "grad_norm": 0.513399635333341, "learning_rate": 7.774539630010846e-08, "loss": 0.1982, "loss_nan_ranks": 0, "loss_rank_avg": 0.2618066668510437, "step": 4245, "valid_targets_mean": 6306.6, "valid_targets_min": 2073 }, { "epoch": 6.832797427652733, "grad_norm": 0.4610409646272019, "learning_rate": 7.084234466225637e-08, "loss": 0.1859, "loss_nan_ranks": 0, "loss_rank_avg": 0.16325844824314117, "step": 4250, "valid_targets_mean": 5903.2, "valid_targets_min": 2962 }, { "epoch": 6.840836012861736, "grad_norm": 0.48257013983282615, "learning_rate": 6.425962423262988e-08, "loss": 0.1806, "loss_nan_ranks": 0, "loss_rank_avg": 0.2067861407995224, "step": 4255, "valid_targets_mean": 5777.6, "valid_targets_min": 1767 }, { "epoch": 6.84887459807074, "grad_norm": 0.4194055735557952, "learning_rate": 5.799734081855413e-08, "loss": 0.1918, "loss_nan_ranks": 0, "loss_rank_avg": 0.16234293580055237, "step": 4260, "valid_targets_mean": 6958.3, "valid_targets_min": 3030 }, { "epoch": 6.856913183279743, "grad_norm": 0.5762898140474347, "learning_rate": 5.205559507680313e-08, "loss": 0.1806, "loss_nan_ranks": 0, "loss_rank_avg": 0.16969682276248932, "step": 4265, "valid_targets_mean": 6194.4, "valid_targets_min": 3190 }, { "epoch": 6.864951768488746, "grad_norm": 0.4726219925484245, "learning_rate": 4.643448251199667e-08, "loss": 0.1848, "loss_nan_ranks": 0, "loss_rank_avg": 0.19437849521636963, "step": 4270, "valid_targets_mean": 6152.1, "valid_targets_min": 2800 }, { "epoch": 6.872990353697749, "grad_norm": 0.626802854083221, "learning_rate": 4.113409347505926e-08, "loss": 0.1895, "loss_nan_ranks": 0, "loss_rank_avg": 0.21149322390556335, "step": 4275, "valid_targets_mean": 4295.7, "valid_targets_min": 305 }, { "epoch": 6.881028938906752, "grad_norm": 0.5992693492880397, "learning_rate": 3.615451316176355e-08, "loss": 0.1984, "loss_nan_ranks": 0, "loss_rank_avg": 0.22360846400260925, "step": 4280, "valid_targets_mean": 4792.6, "valid_targets_min": 1949 }, { "epoch": 6.889067524115756, "grad_norm": 0.5089549192427425, "learning_rate": 3.149582161136699e-08, "loss": 0.1897, "loss_nan_ranks": 0, "loss_rank_avg": 0.22241082787513733, "step": 4285, "valid_targets_mean": 5543.4, "valid_targets_min": 3958 }, { "epoch": 6.897106109324759, "grad_norm": 0.49095582885510597, "learning_rate": 2.7158093705323962e-08, "loss": 0.1915, "loss_nan_ranks": 0, "loss_rank_avg": 0.1889224797487259, "step": 4290, "valid_targets_mean": 5026.6, "valid_targets_min": 1093 }, { "epoch": 6.905144694533762, "grad_norm": 0.5161073267175579, "learning_rate": 2.3141399166080046e-08, "loss": 0.1707, "loss_nan_ranks": 0, "loss_rank_avg": 0.1808251440525055, "step": 4295, "valid_targets_mean": 5040.4, "valid_targets_min": 705 }, { "epoch": 6.913183279742765, "grad_norm": 0.49706857696186435, "learning_rate": 1.9445802555952964e-08, "loss": 0.174, "loss_nan_ranks": 0, "loss_rank_avg": 0.15419217944145203, "step": 4300, "valid_targets_mean": 5024.6, "valid_targets_min": 2451 }, { "epoch": 6.921221864951768, "grad_norm": 0.5005639935906776, "learning_rate": 1.607136327609782e-08, "loss": 0.1928, "loss_nan_ranks": 0, "loss_rank_avg": 0.180386483669281, "step": 4305, "valid_targets_mean": 5288.4, "valid_targets_min": 2894 }, { "epoch": 6.929260450160772, "grad_norm": 0.5507681061162143, "learning_rate": 1.3018135565541212e-08, "loss": 0.1849, "loss_nan_ranks": 0, "loss_rank_avg": 0.17055736482143402, "step": 4310, "valid_targets_mean": 4294.1, "valid_targets_min": 917 }, { "epoch": 6.937299035369775, "grad_norm": 0.47076314804544284, "learning_rate": 1.0286168500324157e-08, "loss": 0.1708, "loss_nan_ranks": 0, "loss_rank_avg": 0.18481239676475525, "step": 4315, "valid_targets_mean": 6214.2, "valid_targets_min": 1665 }, { "epoch": 6.945337620578778, "grad_norm": 0.5290017885779597, "learning_rate": 7.875505992707144e-09, "loss": 0.1829, "loss_nan_ranks": 0, "loss_rank_avg": 0.1767764687538147, "step": 4320, "valid_targets_mean": 4849.6, "valid_targets_min": 889 }, { "epoch": 6.953376205787781, "grad_norm": 0.5194272213690765, "learning_rate": 5.786186790459614e-09, "loss": 0.1991, "loss_nan_ranks": 0, "loss_rank_avg": 0.1747482419013977, "step": 4325, "valid_targets_mean": 4611.9, "valid_targets_min": 1654 }, { "epoch": 6.961414790996785, "grad_norm": 0.4677227966120155, "learning_rate": 4.018244476240441e-09, "loss": 0.1728, "loss_nan_ranks": 0, "loss_rank_avg": 0.16645994782447815, "step": 4330, "valid_targets_mean": 5858.0, "valid_targets_min": 2611 }, { "epoch": 6.969453376205788, "grad_norm": 0.4969571582473657, "learning_rate": 2.5717074670628116e-09, "loss": 0.1881, "loss_nan_ranks": 0, "loss_rank_avg": 0.16073165833950043, "step": 4335, "valid_targets_mean": 5167.6, "valid_targets_min": 1905 }, { "epoch": 6.977491961414791, "grad_norm": 0.4569589126728696, "learning_rate": 1.4465990138323727e-09, "loss": 0.2074, "loss_nan_ranks": 0, "loss_rank_avg": 0.24416705965995789, "step": 4340, "valid_targets_mean": 6487.6, "valid_targets_min": 1716 }, { "epoch": 6.985530546623794, "grad_norm": 0.5594617903547844, "learning_rate": 6.429372009719714e-10, "loss": 0.1943, "loss_nan_ranks": 0, "loss_rank_avg": 0.25965332984924316, "step": 4345, "valid_targets_mean": 5103.3, "valid_targets_min": 424 }, { "epoch": 6.993569131832797, "grad_norm": 0.4299759834166724, "learning_rate": 1.6073494613522146e-10, "loss": 0.1791, "loss_nan_ranks": 0, "loss_rank_avg": 0.16728906333446503, "step": 4350, "valid_targets_mean": 6768.5, "valid_targets_min": 3807 }, { "epoch": 7.0, "loss_nan_ranks": 0, "loss_rank_avg": 0.1630803495645523, "step": 4354, "total_flos": 1827324081995776.0, "train_loss": 0.23159787104006038, "train_runtime": 29184.2585, "train_samples_per_second": 2.386, "train_steps_per_second": 0.149, "valid_targets_mean": 6348.0, "valid_targets_min": 2723 } ], "logging_steps": 5, "max_steps": 4354, "num_input_tokens_seen": 0, "num_train_epochs": 7, "save_steps": 1500, "stateful_callbacks": { "TrainerControl": { "args": { "should_epoch_stop": false, "should_evaluate": false, "should_log": false, "should_save": true, "should_training_stop": true }, "attributes": {} } }, "total_flos": 1827324081995776.0, "train_batch_size": 1, "trial_name": null, "trial_params": null }