{ "best_global_step": null, "best_metric": null, "best_model_checkpoint": null, "epoch": 7.0, "eval_steps": 500, "global_step": 9177, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.0038138825324180014, "grad_norm": 9.470755296878524, "learning_rate": 1.7429193899782138e-07, "loss": 0.8166, "loss_nan_ranks": 0, "loss_rank_avg": 0.8353788256645203, "step": 5, "valid_targets_mean": 5229.4, "valid_targets_min": 1152 }, { "epoch": 0.007627765064836003, "grad_norm": 11.999543819314578, "learning_rate": 3.921568627450981e-07, "loss": 0.8786, "loss_nan_ranks": 0, "loss_rank_avg": 1.0028491020202637, "step": 10, "valid_targets_mean": 3283.0, "valid_targets_min": 660 }, { "epoch": 0.011441647597254004, "grad_norm": 10.891241780249842, "learning_rate": 6.100217864923748e-07, "loss": 0.8257, "loss_nan_ranks": 0, "loss_rank_avg": 0.8274946212768555, "step": 15, "valid_targets_mean": 4470.2, "valid_targets_min": 1025 }, { "epoch": 0.015255530129672006, "grad_norm": 9.997792672692631, "learning_rate": 8.278867102396515e-07, "loss": 0.8311, "loss_nan_ranks": 0, "loss_rank_avg": 0.8327676653862, "step": 20, "valid_targets_mean": 4210.0, "valid_targets_min": 345 }, { "epoch": 0.01906941266209001, "grad_norm": 8.877819827048429, "learning_rate": 1.0457516339869283e-06, "loss": 0.8057, "loss_nan_ranks": 0, "loss_rank_avg": 0.7901816964149475, "step": 25, "valid_targets_mean": 4130.4, "valid_targets_min": 1404 }, { "epoch": 0.02288329519450801, "grad_norm": 8.096441526748734, "learning_rate": 1.2636165577342049e-06, "loss": 0.808, "loss_nan_ranks": 0, "loss_rank_avg": 0.7575476765632629, "step": 30, "valid_targets_mean": 3961.3, "valid_targets_min": 1118 }, { "epoch": 0.02669717772692601, "grad_norm": 5.796639402961682, "learning_rate": 1.4814814814814815e-06, "loss": 0.7743, "loss_nan_ranks": 0, "loss_rank_avg": 0.7839180827140808, "step": 35, "valid_targets_mean": 4570.6, "valid_targets_min": 782 }, { "epoch": 0.03051106025934401, "grad_norm": 4.5778398820035555, "learning_rate": 1.6993464052287585e-06, "loss": 0.7824, "loss_nan_ranks": 0, "loss_rank_avg": 0.7421620488166809, "step": 40, "valid_targets_mean": 4959.4, "valid_targets_min": 1531 }, { "epoch": 0.034324942791762014, "grad_norm": 3.104932493714994, "learning_rate": 1.917211328976035e-06, "loss": 0.6661, "loss_nan_ranks": 0, "loss_rank_avg": 0.6358296275138855, "step": 45, "valid_targets_mean": 4961.0, "valid_targets_min": 1151 }, { "epoch": 0.03813882532418002, "grad_norm": 3.2109157965025417, "learning_rate": 2.135076252723312e-06, "loss": 0.6704, "loss_nan_ranks": 0, "loss_rank_avg": 0.6529257297515869, "step": 50, "valid_targets_mean": 3586.6, "valid_targets_min": 449 }, { "epoch": 0.041952707856598014, "grad_norm": 2.150373234220549, "learning_rate": 2.3529411764705885e-06, "loss": 0.6812, "loss_nan_ranks": 0, "loss_rank_avg": 0.7103098034858704, "step": 55, "valid_targets_mean": 4680.6, "valid_targets_min": 1299 }, { "epoch": 0.04576659038901602, "grad_norm": 1.5051584529967943, "learning_rate": 2.570806100217865e-06, "loss": 0.6306, "loss_nan_ranks": 0, "loss_rank_avg": 0.6322097778320312, "step": 60, "valid_targets_mean": 4604.5, "valid_targets_min": 833 }, { "epoch": 0.04958047292143402, "grad_norm": 1.372839166404494, "learning_rate": 2.788671023965142e-06, "loss": 0.623, "loss_nan_ranks": 0, "loss_rank_avg": 0.5981409549713135, "step": 65, "valid_targets_mean": 3717.8, "valid_targets_min": 301 }, { "epoch": 0.05339435545385202, "grad_norm": 1.2972075810391417, "learning_rate": 3.0065359477124182e-06, "loss": 0.6228, "loss_nan_ranks": 0, "loss_rank_avg": 0.6940057873725891, "step": 70, "valid_targets_mean": 3829.6, "valid_targets_min": 1278 }, { "epoch": 0.057208237986270026, "grad_norm": 0.9279377869597232, "learning_rate": 3.2244008714596952e-06, "loss": 0.6054, "loss_nan_ranks": 0, "loss_rank_avg": 0.6068126559257507, "step": 75, "valid_targets_mean": 5117.9, "valid_targets_min": 938 }, { "epoch": 0.06102212051868802, "grad_norm": 0.9158878206222738, "learning_rate": 3.4422657952069723e-06, "loss": 0.5969, "loss_nan_ranks": 0, "loss_rank_avg": 0.5890101790428162, "step": 80, "valid_targets_mean": 4001.0, "valid_targets_min": 768 }, { "epoch": 0.06483600305110603, "grad_norm": 0.8582325602905675, "learning_rate": 3.6601307189542484e-06, "loss": 0.5925, "loss_nan_ranks": 0, "loss_rank_avg": 0.616851806640625, "step": 85, "valid_targets_mean": 4640.2, "valid_targets_min": 956 }, { "epoch": 0.06864988558352403, "grad_norm": 0.8125076785088601, "learning_rate": 3.8779956427015254e-06, "loss": 0.5796, "loss_nan_ranks": 0, "loss_rank_avg": 0.5934779644012451, "step": 90, "valid_targets_mean": 4000.2, "valid_targets_min": 1232 }, { "epoch": 0.07246376811594203, "grad_norm": 0.6943712006747517, "learning_rate": 4.0958605664488025e-06, "loss": 0.5544, "loss_nan_ranks": 0, "loss_rank_avg": 0.5483887195587158, "step": 95, "valid_targets_mean": 4390.5, "valid_targets_min": 659 }, { "epoch": 0.07627765064836003, "grad_norm": 0.6230323834581825, "learning_rate": 4.313725490196079e-06, "loss": 0.5606, "loss_nan_ranks": 0, "loss_rank_avg": 0.5412846803665161, "step": 100, "valid_targets_mean": 4160.7, "valid_targets_min": 972 }, { "epoch": 0.08009153318077804, "grad_norm": 0.875591747930727, "learning_rate": 4.531590413943356e-06, "loss": 0.525, "loss_nan_ranks": 0, "loss_rank_avg": 0.49036863446235657, "step": 105, "valid_targets_mean": 3680.2, "valid_targets_min": 1247 }, { "epoch": 0.08390541571319603, "grad_norm": 0.5510216943897367, "learning_rate": 4.749455337690632e-06, "loss": 0.5576, "loss_nan_ranks": 0, "loss_rank_avg": 0.4874543249607086, "step": 110, "valid_targets_mean": 4145.7, "valid_targets_min": 1149 }, { "epoch": 0.08771929824561403, "grad_norm": 0.5426893613443619, "learning_rate": 4.967320261437909e-06, "loss": 0.5387, "loss_nan_ranks": 0, "loss_rank_avg": 0.5104167461395264, "step": 115, "valid_targets_mean": 4632.5, "valid_targets_min": 1081 }, { "epoch": 0.09153318077803203, "grad_norm": 0.551676285668215, "learning_rate": 5.185185185185185e-06, "loss": 0.5484, "loss_nan_ranks": 0, "loss_rank_avg": 0.5294644236564636, "step": 120, "valid_targets_mean": 4924.3, "valid_targets_min": 1112 }, { "epoch": 0.09534706331045004, "grad_norm": 0.5270524880611899, "learning_rate": 5.403050108932463e-06, "loss": 0.5164, "loss_nan_ranks": 0, "loss_rank_avg": 0.44165608286857605, "step": 125, "valid_targets_mean": 4687.0, "valid_targets_min": 1765 }, { "epoch": 0.09916094584286804, "grad_norm": 0.48986406955989537, "learning_rate": 5.620915032679739e-06, "loss": 0.4987, "loss_nan_ranks": 0, "loss_rank_avg": 0.4905380308628082, "step": 130, "valid_targets_mean": 4783.9, "valid_targets_min": 872 }, { "epoch": 0.10297482837528604, "grad_norm": 0.5186763368356251, "learning_rate": 5.838779956427015e-06, "loss": 0.52, "loss_nan_ranks": 0, "loss_rank_avg": 0.5089920163154602, "step": 135, "valid_targets_mean": 4795.2, "valid_targets_min": 1039 }, { "epoch": 0.10678871090770405, "grad_norm": 0.5010334333520292, "learning_rate": 6.056644880174293e-06, "loss": 0.5146, "loss_nan_ranks": 0, "loss_rank_avg": 0.5307483673095703, "step": 140, "valid_targets_mean": 5161.2, "valid_targets_min": 1295 }, { "epoch": 0.11060259344012205, "grad_norm": 0.5123633336801784, "learning_rate": 6.274509803921569e-06, "loss": 0.5178, "loss_nan_ranks": 0, "loss_rank_avg": 0.4454838037490845, "step": 145, "valid_targets_mean": 3884.6, "valid_targets_min": 1002 }, { "epoch": 0.11441647597254005, "grad_norm": 0.5491751275251507, "learning_rate": 6.492374727668845e-06, "loss": 0.4921, "loss_nan_ranks": 0, "loss_rank_avg": 0.5181975364685059, "step": 150, "valid_targets_mean": 4045.0, "valid_targets_min": 1020 }, { "epoch": 0.11823035850495804, "grad_norm": 2.500737350039349, "learning_rate": 6.710239651416122e-06, "loss": 0.4828, "loss_nan_ranks": 0, "loss_rank_avg": 0.4583951532840729, "step": 155, "valid_targets_mean": 4955.4, "valid_targets_min": 1056 }, { "epoch": 0.12204424103737604, "grad_norm": 0.4536799712131569, "learning_rate": 6.928104575163399e-06, "loss": 0.501, "loss_nan_ranks": 0, "loss_rank_avg": 0.45491790771484375, "step": 160, "valid_targets_mean": 4887.3, "valid_targets_min": 1317 }, { "epoch": 0.12585812356979406, "grad_norm": 0.5705305236405581, "learning_rate": 7.145969498910676e-06, "loss": 0.7423, "loss_nan_ranks": 0, "loss_rank_avg": 0.4795728921890259, "step": 165, "valid_targets_mean": 3697.1, "valid_targets_min": 433 }, { "epoch": 0.12967200610221205, "grad_norm": 0.5378675959231818, "learning_rate": 7.363834422657953e-06, "loss": 0.5011, "loss_nan_ranks": 0, "loss_rank_avg": 0.4969773292541504, "step": 170, "valid_targets_mean": 4247.1, "valid_targets_min": 939 }, { "epoch": 0.13348588863463004, "grad_norm": 0.5413191072539879, "learning_rate": 7.581699346405229e-06, "loss": 0.4931, "loss_nan_ranks": 0, "loss_rank_avg": 0.46094343066215515, "step": 175, "valid_targets_mean": 3648.6, "valid_targets_min": 1373 }, { "epoch": 0.13729977116704806, "grad_norm": 0.4947370912132374, "learning_rate": 7.799564270152506e-06, "loss": 0.5081, "loss_nan_ranks": 0, "loss_rank_avg": 0.43682071566581726, "step": 180, "valid_targets_mean": 3943.0, "valid_targets_min": 990 }, { "epoch": 0.14111365369946605, "grad_norm": 0.5277722158585259, "learning_rate": 8.017429193899784e-06, "loss": 0.4734, "loss_nan_ranks": 0, "loss_rank_avg": 0.4734993875026703, "step": 185, "valid_targets_mean": 4291.0, "valid_targets_min": 1033 }, { "epoch": 0.14492753623188406, "grad_norm": 0.5624419217272335, "learning_rate": 8.23529411764706e-06, "loss": 0.4905, "loss_nan_ranks": 0, "loss_rank_avg": 0.46875128149986267, "step": 190, "valid_targets_mean": 3662.4, "valid_targets_min": 874 }, { "epoch": 0.14874141876430205, "grad_norm": 0.49793152277491554, "learning_rate": 8.453159041394336e-06, "loss": 0.4859, "loss_nan_ranks": 0, "loss_rank_avg": 0.47551751136779785, "step": 195, "valid_targets_mean": 4590.5, "valid_targets_min": 934 }, { "epoch": 0.15255530129672007, "grad_norm": 0.47365481578115076, "learning_rate": 8.671023965141612e-06, "loss": 0.4974, "loss_nan_ranks": 0, "loss_rank_avg": 0.509818971157074, "step": 200, "valid_targets_mean": 5085.7, "valid_targets_min": 1068 }, { "epoch": 0.15636918382913806, "grad_norm": 0.5712494209301259, "learning_rate": 8.888888888888888e-06, "loss": 0.4751, "loss_nan_ranks": 0, "loss_rank_avg": 0.4649386405944824, "step": 205, "valid_targets_mean": 3302.5, "valid_targets_min": 1013 }, { "epoch": 0.16018306636155608, "grad_norm": 0.5084803651986027, "learning_rate": 9.106753812636166e-06, "loss": 0.4449, "loss_nan_ranks": 0, "loss_rank_avg": 0.473945289850235, "step": 210, "valid_targets_mean": 4434.8, "valid_targets_min": 1002 }, { "epoch": 0.16399694889397406, "grad_norm": 0.5184435672003983, "learning_rate": 9.324618736383442e-06, "loss": 0.4346, "loss_nan_ranks": 0, "loss_rank_avg": 0.3982456624507904, "step": 215, "valid_targets_mean": 3852.2, "valid_targets_min": 870 }, { "epoch": 0.16781083142639205, "grad_norm": 0.4868051846661637, "learning_rate": 9.54248366013072e-06, "loss": 0.4829, "loss_nan_ranks": 0, "loss_rank_avg": 0.48539039492607117, "step": 220, "valid_targets_mean": 6059.0, "valid_targets_min": 865 }, { "epoch": 0.17162471395881007, "grad_norm": 0.5409139800606549, "learning_rate": 9.760348583877996e-06, "loss": 0.4629, "loss_nan_ranks": 0, "loss_rank_avg": 0.47836971282958984, "step": 225, "valid_targets_mean": 4304.7, "valid_targets_min": 890 }, { "epoch": 0.17543859649122806, "grad_norm": 0.5009648662623246, "learning_rate": 9.978213507625273e-06, "loss": 0.4451, "loss_nan_ranks": 0, "loss_rank_avg": 0.4605931043624878, "step": 230, "valid_targets_mean": 5225.0, "valid_targets_min": 1847 }, { "epoch": 0.17925247902364608, "grad_norm": 0.5140950082674012, "learning_rate": 1.0196078431372549e-05, "loss": 0.4662, "loss_nan_ranks": 0, "loss_rank_avg": 0.43352267146110535, "step": 235, "valid_targets_mean": 5232.6, "valid_targets_min": 1525 }, { "epoch": 0.18306636155606407, "grad_norm": 0.579977428231358, "learning_rate": 1.0413943355119827e-05, "loss": 0.4508, "loss_nan_ranks": 0, "loss_rank_avg": 0.4714777171611786, "step": 240, "valid_targets_mean": 4931.0, "valid_targets_min": 1398 }, { "epoch": 0.18688024408848208, "grad_norm": 0.5864749503460456, "learning_rate": 1.0631808278867104e-05, "loss": 0.4469, "loss_nan_ranks": 0, "loss_rank_avg": 0.4570702612400055, "step": 245, "valid_targets_mean": 4803.3, "valid_targets_min": 787 }, { "epoch": 0.19069412662090007, "grad_norm": 0.4372149960084067, "learning_rate": 1.0849673202614379e-05, "loss": 0.4472, "loss_nan_ranks": 0, "loss_rank_avg": 0.42177343368530273, "step": 250, "valid_targets_mean": 5634.1, "valid_targets_min": 1214 }, { "epoch": 0.1945080091533181, "grad_norm": 0.5238824399942199, "learning_rate": 1.1067538126361657e-05, "loss": 0.4621, "loss_nan_ranks": 0, "loss_rank_avg": 0.40550434589385986, "step": 255, "valid_targets_mean": 4041.0, "valid_targets_min": 1198 }, { "epoch": 0.19832189168573608, "grad_norm": 0.5263090103192474, "learning_rate": 1.1285403050108935e-05, "loss": 0.4491, "loss_nan_ranks": 0, "loss_rank_avg": 0.4669533669948578, "step": 260, "valid_targets_mean": 4864.0, "valid_targets_min": 348 }, { "epoch": 0.20213577421815407, "grad_norm": 0.4844855824860165, "learning_rate": 1.1503267973856209e-05, "loss": 0.4356, "loss_nan_ranks": 0, "loss_rank_avg": 0.4767606556415558, "step": 265, "valid_targets_mean": 4571.4, "valid_targets_min": 1294 }, { "epoch": 0.20594965675057209, "grad_norm": 0.5844330632392677, "learning_rate": 1.1721132897603487e-05, "loss": 0.4694, "loss_nan_ranks": 0, "loss_rank_avg": 0.5140058398246765, "step": 270, "valid_targets_mean": 3920.4, "valid_targets_min": 934 }, { "epoch": 0.20976353928299007, "grad_norm": 0.528817963711389, "learning_rate": 1.1938997821350765e-05, "loss": 0.4432, "loss_nan_ranks": 0, "loss_rank_avg": 0.4353533089160919, "step": 275, "valid_targets_mean": 4601.6, "valid_targets_min": 863 }, { "epoch": 0.2135774218154081, "grad_norm": 0.5006857035283947, "learning_rate": 1.215686274509804e-05, "loss": 0.461, "loss_nan_ranks": 0, "loss_rank_avg": 0.4613196551799774, "step": 280, "valid_targets_mean": 4929.3, "valid_targets_min": 981 }, { "epoch": 0.21739130434782608, "grad_norm": 0.47435927216376855, "learning_rate": 1.2374727668845317e-05, "loss": 0.4646, "loss_nan_ranks": 0, "loss_rank_avg": 0.4284130334854126, "step": 285, "valid_targets_mean": 4549.0, "valid_targets_min": 1071 }, { "epoch": 0.2212051868802441, "grad_norm": 0.48912815677244226, "learning_rate": 1.2592592592592593e-05, "loss": 0.441, "loss_nan_ranks": 0, "loss_rank_avg": 0.438406378030777, "step": 290, "valid_targets_mean": 4591.1, "valid_targets_min": 1050 }, { "epoch": 0.2250190694126621, "grad_norm": 0.4913986455786091, "learning_rate": 1.281045751633987e-05, "loss": 0.4563, "loss_nan_ranks": 0, "loss_rank_avg": 0.485249787569046, "step": 295, "valid_targets_mean": 4955.3, "valid_targets_min": 935 }, { "epoch": 0.2288329519450801, "grad_norm": 0.47839058332511075, "learning_rate": 1.3028322440087147e-05, "loss": 0.4757, "loss_nan_ranks": 0, "loss_rank_avg": 0.45996996760368347, "step": 300, "valid_targets_mean": 4854.8, "valid_targets_min": 1379 }, { "epoch": 0.2326468344774981, "grad_norm": 0.5908371229215295, "learning_rate": 1.3246187363834424e-05, "loss": 0.4286, "loss_nan_ranks": 0, "loss_rank_avg": 0.4527187645435333, "step": 305, "valid_targets_mean": 4125.8, "valid_targets_min": 1221 }, { "epoch": 0.23646071700991608, "grad_norm": 0.558504394945239, "learning_rate": 1.3464052287581701e-05, "loss": 0.4645, "loss_nan_ranks": 0, "loss_rank_avg": 0.46870169043540955, "step": 310, "valid_targets_mean": 4148.9, "valid_targets_min": 1389 }, { "epoch": 0.2402745995423341, "grad_norm": 0.5561787164121977, "learning_rate": 1.3681917211328976e-05, "loss": 0.4245, "loss_nan_ranks": 0, "loss_rank_avg": 0.407299280166626, "step": 315, "valid_targets_mean": 3703.2, "valid_targets_min": 1119 }, { "epoch": 0.2440884820747521, "grad_norm": 0.5406060809535468, "learning_rate": 1.3899782135076254e-05, "loss": 0.4362, "loss_nan_ranks": 0, "loss_rank_avg": 0.3715898096561432, "step": 320, "valid_targets_mean": 4031.1, "valid_targets_min": 1148 }, { "epoch": 0.2479023646071701, "grad_norm": 1.4983453657518973, "learning_rate": 1.4117647058823532e-05, "loss": 0.5043, "loss_nan_ranks": 0, "loss_rank_avg": 0.6690896153450012, "step": 325, "valid_targets_mean": 1204.7, "valid_targets_min": 562 }, { "epoch": 0.2517162471395881, "grad_norm": 0.9150855492826523, "learning_rate": 1.4335511982570806e-05, "loss": 0.7726, "loss_nan_ranks": 0, "loss_rank_avg": 0.5599314570426941, "step": 330, "valid_targets_mean": 1777.9, "valid_targets_min": 629 }, { "epoch": 0.2555301296720061, "grad_norm": 0.5586598650153595, "learning_rate": 1.4553376906318084e-05, "loss": 0.4435, "loss_nan_ranks": 0, "loss_rank_avg": 0.44297829270362854, "step": 335, "valid_targets_mean": 4019.2, "valid_targets_min": 610 }, { "epoch": 0.2593440122044241, "grad_norm": 0.5304240978755225, "learning_rate": 1.4771241830065362e-05, "loss": 0.4227, "loss_nan_ranks": 0, "loss_rank_avg": 0.3744999170303345, "step": 340, "valid_targets_mean": 4157.5, "valid_targets_min": 1035 }, { "epoch": 0.2631578947368421, "grad_norm": 0.669155831706647, "learning_rate": 1.4989106753812636e-05, "loss": 0.4595, "loss_nan_ranks": 0, "loss_rank_avg": 0.4575551450252533, "step": 345, "valid_targets_mean": 5283.3, "valid_targets_min": 1131 }, { "epoch": 0.2669717772692601, "grad_norm": 0.6703382325755647, "learning_rate": 1.5206971677559914e-05, "loss": 0.4406, "loss_nan_ranks": 0, "loss_rank_avg": 0.4503791332244873, "step": 350, "valid_targets_mean": 3426.8, "valid_targets_min": 1044 }, { "epoch": 0.2707856598016781, "grad_norm": 0.5788534308575273, "learning_rate": 1.5424836601307192e-05, "loss": 0.4515, "loss_nan_ranks": 0, "loss_rank_avg": 0.43128445744514465, "step": 355, "valid_targets_mean": 4059.3, "valid_targets_min": 385 }, { "epoch": 0.2745995423340961, "grad_norm": 0.5167153063531891, "learning_rate": 1.5642701525054468e-05, "loss": 0.438, "loss_nan_ranks": 0, "loss_rank_avg": 0.4530758559703827, "step": 360, "valid_targets_mean": 4845.2, "valid_targets_min": 978 }, { "epoch": 0.2784134248665141, "grad_norm": 0.5271031423011994, "learning_rate": 1.5860566448801744e-05, "loss": 0.4081, "loss_nan_ranks": 0, "loss_rank_avg": 0.41743603348731995, "step": 365, "valid_targets_mean": 3877.2, "valid_targets_min": 468 }, { "epoch": 0.2822273073989321, "grad_norm": 0.4584127185198121, "learning_rate": 1.607843137254902e-05, "loss": 0.4311, "loss_nan_ranks": 0, "loss_rank_avg": 0.3872661590576172, "step": 370, "valid_targets_mean": 4894.0, "valid_targets_min": 1049 }, { "epoch": 0.28604118993135014, "grad_norm": 0.5674756040704212, "learning_rate": 1.6296296296296297e-05, "loss": 0.4269, "loss_nan_ranks": 0, "loss_rank_avg": 0.4131319522857666, "step": 375, "valid_targets_mean": 4604.5, "valid_targets_min": 1024 }, { "epoch": 0.2898550724637681, "grad_norm": 0.49939284790297844, "learning_rate": 1.6514161220043573e-05, "loss": 0.413, "loss_nan_ranks": 0, "loss_rank_avg": 0.4175918996334076, "step": 380, "valid_targets_mean": 4370.5, "valid_targets_min": 1018 }, { "epoch": 0.2936689549961861, "grad_norm": 0.5308498919223146, "learning_rate": 1.6732026143790852e-05, "loss": 0.4101, "loss_nan_ranks": 0, "loss_rank_avg": 0.41098570823669434, "step": 385, "valid_targets_mean": 3836.2, "valid_targets_min": 336 }, { "epoch": 0.2974828375286041, "grad_norm": 0.5122991151701906, "learning_rate": 1.6949891067538125e-05, "loss": 0.4106, "loss_nan_ranks": 0, "loss_rank_avg": 0.4084223508834839, "step": 390, "valid_targets_mean": 4162.0, "valid_targets_min": 1472 }, { "epoch": 0.3012967200610221, "grad_norm": 0.5181967092269961, "learning_rate": 1.7167755991285405e-05, "loss": 0.4204, "loss_nan_ranks": 0, "loss_rank_avg": 0.3865543305873871, "step": 395, "valid_targets_mean": 4125.0, "valid_targets_min": 1314 }, { "epoch": 0.30511060259344014, "grad_norm": 0.5550861402134036, "learning_rate": 1.738562091503268e-05, "loss": 0.4397, "loss_nan_ranks": 0, "loss_rank_avg": 0.4710928499698639, "step": 400, "valid_targets_mean": 4019.8, "valid_targets_min": 1289 }, { "epoch": 0.30892448512585813, "grad_norm": 0.5438815034414402, "learning_rate": 1.7603485838779957e-05, "loss": 0.4228, "loss_nan_ranks": 0, "loss_rank_avg": 0.3929981291294098, "step": 405, "valid_targets_mean": 4301.6, "valid_targets_min": 504 }, { "epoch": 0.3127383676582761, "grad_norm": 0.6707002167342581, "learning_rate": 1.7821350762527233e-05, "loss": 0.4142, "loss_nan_ranks": 0, "loss_rank_avg": 0.422780841588974, "step": 410, "valid_targets_mean": 4865.9, "valid_targets_min": 1739 }, { "epoch": 0.3165522501906941, "grad_norm": 2.032523055369547, "learning_rate": 1.8039215686274513e-05, "loss": 0.426, "loss_nan_ranks": 0, "loss_rank_avg": 0.49667227268218994, "step": 415, "valid_targets_mean": 3822.7, "valid_targets_min": 674 }, { "epoch": 0.32036613272311215, "grad_norm": 0.5997322470060125, "learning_rate": 1.825708061002179e-05, "loss": 0.406, "loss_nan_ranks": 0, "loss_rank_avg": 0.4212714731693268, "step": 420, "valid_targets_mean": 3495.9, "valid_targets_min": 274 }, { "epoch": 0.32418001525553014, "grad_norm": 0.48011386623091284, "learning_rate": 1.8474945533769065e-05, "loss": 0.405, "loss_nan_ranks": 0, "loss_rank_avg": 0.3752917945384979, "step": 425, "valid_targets_mean": 4413.0, "valid_targets_min": 1244 }, { "epoch": 0.32799389778794813, "grad_norm": 0.6028412606566115, "learning_rate": 1.869281045751634e-05, "loss": 0.4314, "loss_nan_ranks": 0, "loss_rank_avg": 0.46982622146606445, "step": 430, "valid_targets_mean": 4495.7, "valid_targets_min": 919 }, { "epoch": 0.3318077803203661, "grad_norm": 0.5807673150953151, "learning_rate": 1.8910675381263617e-05, "loss": 0.4128, "loss_nan_ranks": 0, "loss_rank_avg": 0.41810181736946106, "step": 435, "valid_targets_mean": 4100.7, "valid_targets_min": 1543 }, { "epoch": 0.3356216628527841, "grad_norm": 0.5678000717779615, "learning_rate": 1.9128540305010894e-05, "loss": 0.4058, "loss_nan_ranks": 0, "loss_rank_avg": 0.4434739351272583, "step": 440, "valid_targets_mean": 3935.1, "valid_targets_min": 890 }, { "epoch": 0.33943554538520215, "grad_norm": 0.5469056120801911, "learning_rate": 1.9346405228758173e-05, "loss": 0.4116, "loss_nan_ranks": 0, "loss_rank_avg": 0.37859591841697693, "step": 445, "valid_targets_mean": 3676.0, "valid_targets_min": 1351 }, { "epoch": 0.34324942791762014, "grad_norm": 0.47827617322788585, "learning_rate": 1.956427015250545e-05, "loss": 0.4327, "loss_nan_ranks": 0, "loss_rank_avg": 0.4103635847568512, "step": 450, "valid_targets_mean": 5130.5, "valid_targets_min": 1279 }, { "epoch": 0.34706331045003813, "grad_norm": 0.6941453851155629, "learning_rate": 1.9782135076252725e-05, "loss": 0.4, "loss_nan_ranks": 0, "loss_rank_avg": 0.4146636724472046, "step": 455, "valid_targets_mean": 4593.5, "valid_targets_min": 1281 }, { "epoch": 0.3508771929824561, "grad_norm": 0.5241578671868445, "learning_rate": 2e-05, "loss": 0.4178, "loss_nan_ranks": 0, "loss_rank_avg": 0.4084761142730713, "step": 460, "valid_targets_mean": 4143.6, "valid_targets_min": 1026 }, { "epoch": 0.35469107551487417, "grad_norm": 0.4946580310260773, "learning_rate": 2.0217864923747278e-05, "loss": 0.405, "loss_nan_ranks": 0, "loss_rank_avg": 0.3879587948322296, "step": 465, "valid_targets_mean": 4280.2, "valid_targets_min": 1094 }, { "epoch": 0.35850495804729215, "grad_norm": 0.5261377997096447, "learning_rate": 2.0435729847494557e-05, "loss": 0.4033, "loss_nan_ranks": 0, "loss_rank_avg": 0.4153151512145996, "step": 470, "valid_targets_mean": 4111.7, "valid_targets_min": 1306 }, { "epoch": 0.36231884057971014, "grad_norm": 0.49667981369723574, "learning_rate": 2.0653594771241834e-05, "loss": 0.4098, "loss_nan_ranks": 0, "loss_rank_avg": 0.3661862313747406, "step": 475, "valid_targets_mean": 4103.8, "valid_targets_min": 447 }, { "epoch": 0.36613272311212813, "grad_norm": 0.5674990532031673, "learning_rate": 2.0871459694989106e-05, "loss": 0.4, "loss_nan_ranks": 0, "loss_rank_avg": 0.42640629410743713, "step": 480, "valid_targets_mean": 3842.2, "valid_targets_min": 395 }, { "epoch": 0.3699466056445461, "grad_norm": 0.49164681714558667, "learning_rate": 2.1089324618736386e-05, "loss": 0.3916, "loss_nan_ranks": 0, "loss_rank_avg": 0.36857786774635315, "step": 485, "valid_targets_mean": 4493.4, "valid_targets_min": 1671 }, { "epoch": 0.37376048817696417, "grad_norm": 1.1112103673444507, "learning_rate": 2.1307189542483662e-05, "loss": 0.4382, "loss_nan_ranks": 0, "loss_rank_avg": 0.5883781313896179, "step": 490, "valid_targets_mean": 1448.0, "valid_targets_min": 675 }, { "epoch": 0.37757437070938216, "grad_norm": 0.6359095779716393, "learning_rate": 2.1525054466230938e-05, "loss": 0.5499, "loss_nan_ranks": 0, "loss_rank_avg": 0.4046311378479004, "step": 495, "valid_targets_mean": 4003.0, "valid_targets_min": 1379 }, { "epoch": 0.38138825324180015, "grad_norm": 0.4982545028617011, "learning_rate": 2.1742919389978218e-05, "loss": 0.4297, "loss_nan_ranks": 0, "loss_rank_avg": 0.4083602726459503, "step": 500, "valid_targets_mean": 4638.2, "valid_targets_min": 1044 }, { "epoch": 0.38520213577421814, "grad_norm": 0.48915512583881143, "learning_rate": 2.1960784313725494e-05, "loss": 0.4163, "loss_nan_ranks": 0, "loss_rank_avg": 0.41862890124320984, "step": 505, "valid_targets_mean": 4827.2, "valid_targets_min": 416 }, { "epoch": 0.3890160183066362, "grad_norm": 0.517221047006931, "learning_rate": 2.2178649237472767e-05, "loss": 0.4107, "loss_nan_ranks": 0, "loss_rank_avg": 0.4069397449493408, "step": 510, "valid_targets_mean": 4566.0, "valid_targets_min": 1278 }, { "epoch": 0.39282990083905417, "grad_norm": 0.5121022744996065, "learning_rate": 2.2396514161220043e-05, "loss": 0.4108, "loss_nan_ranks": 0, "loss_rank_avg": 0.43694543838500977, "step": 515, "valid_targets_mean": 5045.8, "valid_targets_min": 1274 }, { "epoch": 0.39664378337147216, "grad_norm": 0.4800161727651644, "learning_rate": 2.2614379084967322e-05, "loss": 0.4098, "loss_nan_ranks": 0, "loss_rank_avg": 0.395797997713089, "step": 520, "valid_targets_mean": 4706.9, "valid_targets_min": 1275 }, { "epoch": 0.40045766590389015, "grad_norm": 0.46860780726922296, "learning_rate": 2.28322440087146e-05, "loss": 0.4059, "loss_nan_ranks": 0, "loss_rank_avg": 0.36623287200927734, "step": 525, "valid_targets_mean": 4559.0, "valid_targets_min": 1282 }, { "epoch": 0.40427154843630814, "grad_norm": 0.5113105070608205, "learning_rate": 2.3050108932461878e-05, "loss": 0.3994, "loss_nan_ranks": 0, "loss_rank_avg": 0.38678622245788574, "step": 530, "valid_targets_mean": 4872.2, "valid_targets_min": 587 }, { "epoch": 0.4080854309687262, "grad_norm": 0.4842846017374961, "learning_rate": 2.3267973856209154e-05, "loss": 0.3985, "loss_nan_ranks": 0, "loss_rank_avg": 0.4049014747142792, "step": 535, "valid_targets_mean": 5120.1, "valid_targets_min": 531 }, { "epoch": 0.41189931350114417, "grad_norm": 0.48187699542171236, "learning_rate": 2.3485838779956427e-05, "loss": 0.4151, "loss_nan_ranks": 0, "loss_rank_avg": 0.42579174041748047, "step": 540, "valid_targets_mean": 5236.5, "valid_targets_min": 1493 }, { "epoch": 0.41571319603356216, "grad_norm": 0.5069904951791335, "learning_rate": 2.3703703703703703e-05, "loss": 0.3864, "loss_nan_ranks": 0, "loss_rank_avg": 0.351409912109375, "step": 545, "valid_targets_mean": 4193.8, "valid_targets_min": 1929 }, { "epoch": 0.41952707856598015, "grad_norm": 0.47887731304957243, "learning_rate": 2.3921568627450983e-05, "loss": 0.3962, "loss_nan_ranks": 0, "loss_rank_avg": 0.3922696113586426, "step": 550, "valid_targets_mean": 4655.1, "valid_targets_min": 1354 }, { "epoch": 0.4233409610983982, "grad_norm": 0.4564867344774318, "learning_rate": 2.413943355119826e-05, "loss": 0.4237, "loss_nan_ranks": 0, "loss_rank_avg": 0.3802224397659302, "step": 555, "valid_targets_mean": 5557.0, "valid_targets_min": 1151 }, { "epoch": 0.4271548436308162, "grad_norm": 0.5031199121109118, "learning_rate": 2.4357298474945535e-05, "loss": 0.3761, "loss_nan_ranks": 0, "loss_rank_avg": 0.33998584747314453, "step": 560, "valid_targets_mean": 4495.2, "valid_targets_min": 999 }, { "epoch": 0.4309687261632342, "grad_norm": 0.4928451295329029, "learning_rate": 2.4575163398692815e-05, "loss": 0.415, "loss_nan_ranks": 0, "loss_rank_avg": 0.4243813753128052, "step": 565, "valid_targets_mean": 4882.1, "valid_targets_min": 987 }, { "epoch": 0.43478260869565216, "grad_norm": 0.5259224766412115, "learning_rate": 2.479302832244009e-05, "loss": 0.3908, "loss_nan_ranks": 0, "loss_rank_avg": 0.3836231231689453, "step": 570, "valid_targets_mean": 4713.7, "valid_targets_min": 1686 }, { "epoch": 0.43859649122807015, "grad_norm": 0.5579901905077622, "learning_rate": 2.5010893246187364e-05, "loss": 0.3776, "loss_nan_ranks": 0, "loss_rank_avg": 0.3920012414455414, "step": 575, "valid_targets_mean": 3984.4, "valid_targets_min": 977 }, { "epoch": 0.4424103737604882, "grad_norm": 0.5439800495512314, "learning_rate": 2.5228758169934643e-05, "loss": 0.37, "loss_nan_ranks": 0, "loss_rank_avg": 0.33532944321632385, "step": 580, "valid_targets_mean": 3737.5, "valid_targets_min": 354 }, { "epoch": 0.4462242562929062, "grad_norm": 0.5662975384921443, "learning_rate": 2.544662309368192e-05, "loss": 0.4096, "loss_nan_ranks": 0, "loss_rank_avg": 0.4044320285320282, "step": 585, "valid_targets_mean": 3571.9, "valid_targets_min": 1005 }, { "epoch": 0.4500381388253242, "grad_norm": 0.47734947502220565, "learning_rate": 2.5664488017429196e-05, "loss": 0.3913, "loss_nan_ranks": 0, "loss_rank_avg": 0.41730186343193054, "step": 590, "valid_targets_mean": 5255.7, "valid_targets_min": 750 }, { "epoch": 0.45385202135774216, "grad_norm": 0.46089066500843384, "learning_rate": 2.5882352941176475e-05, "loss": 0.3849, "loss_nan_ranks": 0, "loss_rank_avg": 0.35630854964256287, "step": 595, "valid_targets_mean": 4318.8, "valid_targets_min": 1350 }, { "epoch": 0.4576659038901602, "grad_norm": 0.533942025808671, "learning_rate": 2.610021786492375e-05, "loss": 0.3949, "loss_nan_ranks": 0, "loss_rank_avg": 0.39351949095726013, "step": 600, "valid_targets_mean": 4463.6, "valid_targets_min": 1353 }, { "epoch": 0.4614797864225782, "grad_norm": 0.620788552352078, "learning_rate": 2.6318082788671024e-05, "loss": 0.3986, "loss_nan_ranks": 0, "loss_rank_avg": 0.4100879430770874, "step": 605, "valid_targets_mean": 4238.0, "valid_targets_min": 495 }, { "epoch": 0.4652936689549962, "grad_norm": 0.47098349815571094, "learning_rate": 2.65359477124183e-05, "loss": 0.417, "loss_nan_ranks": 0, "loss_rank_avg": 0.4212774932384491, "step": 610, "valid_targets_mean": 5455.1, "valid_targets_min": 1228 }, { "epoch": 0.4691075514874142, "grad_norm": 0.531495026436975, "learning_rate": 2.675381263616558e-05, "loss": 0.4189, "loss_nan_ranks": 0, "loss_rank_avg": 0.41660937666893005, "step": 615, "valid_targets_mean": 4546.2, "valid_targets_min": 1467 }, { "epoch": 0.47292143401983217, "grad_norm": 0.49774084718519146, "learning_rate": 2.6971677559912856e-05, "loss": 0.3939, "loss_nan_ranks": 0, "loss_rank_avg": 0.3917350471019745, "step": 620, "valid_targets_mean": 4665.4, "valid_targets_min": 1231 }, { "epoch": 0.4767353165522502, "grad_norm": 0.5223030282822787, "learning_rate": 2.7189542483660135e-05, "loss": 0.4062, "loss_nan_ranks": 0, "loss_rank_avg": 0.4286997318267822, "step": 625, "valid_targets_mean": 4919.1, "valid_targets_min": 401 }, { "epoch": 0.4805491990846682, "grad_norm": 0.6311171808018544, "learning_rate": 2.740740740740741e-05, "loss": 0.4148, "loss_nan_ranks": 0, "loss_rank_avg": 0.4223945140838623, "step": 630, "valid_targets_mean": 3921.5, "valid_targets_min": 807 }, { "epoch": 0.4843630816170862, "grad_norm": 0.5423403261529165, "learning_rate": 2.7625272331154684e-05, "loss": 0.3855, "loss_nan_ranks": 0, "loss_rank_avg": 0.3739047944545746, "step": 635, "valid_targets_mean": 3978.4, "valid_targets_min": 715 }, { "epoch": 0.4881769641495042, "grad_norm": 0.5833531419739164, "learning_rate": 2.784313725490196e-05, "loss": 0.3851, "loss_nan_ranks": 0, "loss_rank_avg": 0.3918963372707367, "step": 640, "valid_targets_mean": 3173.8, "valid_targets_min": 933 }, { "epoch": 0.4919908466819222, "grad_norm": 0.5888665746157846, "learning_rate": 2.806100217864924e-05, "loss": 0.4044, "loss_nan_ranks": 0, "loss_rank_avg": 0.40655291080474854, "step": 645, "valid_targets_mean": 4044.9, "valid_targets_min": 1272 }, { "epoch": 0.4958047292143402, "grad_norm": 0.6310048168490392, "learning_rate": 2.8278867102396516e-05, "loss": 0.3894, "loss_nan_ranks": 0, "loss_rank_avg": 0.40415921807289124, "step": 650, "valid_targets_mean": 3122.2, "valid_targets_min": 457 }, { "epoch": 0.4996186117467582, "grad_norm": 0.7447980014403361, "learning_rate": 2.8496732026143792e-05, "loss": 0.677, "loss_nan_ranks": 0, "loss_rank_avg": 0.44158491492271423, "step": 655, "valid_targets_mean": 2758.2, "valid_targets_min": 574 }, { "epoch": 0.5034324942791762, "grad_norm": 0.5141237643896464, "learning_rate": 2.8714596949891072e-05, "loss": 0.3874, "loss_nan_ranks": 0, "loss_rank_avg": 0.4077136516571045, "step": 660, "valid_targets_mean": 4658.0, "valid_targets_min": 1364 }, { "epoch": 0.5072463768115942, "grad_norm": 0.6083519366022135, "learning_rate": 2.8932461873638345e-05, "loss": 0.3797, "loss_nan_ranks": 0, "loss_rank_avg": 0.3819454610347748, "step": 665, "valid_targets_mean": 4113.9, "valid_targets_min": 815 }, { "epoch": 0.5110602593440122, "grad_norm": 0.5293654642242984, "learning_rate": 2.915032679738562e-05, "loss": 0.4086, "loss_nan_ranks": 0, "loss_rank_avg": 0.35915103554725647, "step": 670, "valid_targets_mean": 4441.2, "valid_targets_min": 1100 }, { "epoch": 0.5148741418764302, "grad_norm": 0.49950432251413246, "learning_rate": 2.93681917211329e-05, "loss": 0.3727, "loss_nan_ranks": 0, "loss_rank_avg": 0.37206077575683594, "step": 675, "valid_targets_mean": 4198.2, "valid_targets_min": 967 }, { "epoch": 0.5186880244088482, "grad_norm": 0.4630265565067862, "learning_rate": 2.9586056644880177e-05, "loss": 0.39, "loss_nan_ranks": 0, "loss_rank_avg": 0.385885089635849, "step": 680, "valid_targets_mean": 5195.9, "valid_targets_min": 1113 }, { "epoch": 0.5225019069412662, "grad_norm": 0.5299093503446665, "learning_rate": 2.9803921568627453e-05, "loss": 0.4099, "loss_nan_ranks": 0, "loss_rank_avg": 0.4257817566394806, "step": 685, "valid_targets_mean": 3791.5, "valid_targets_min": 1313 }, { "epoch": 0.5263157894736842, "grad_norm": 0.5647217389609704, "learning_rate": 3.0021786492374732e-05, "loss": 0.3934, "loss_nan_ranks": 0, "loss_rank_avg": 0.4137308895587921, "step": 690, "valid_targets_mean": 3960.7, "valid_targets_min": 844 }, { "epoch": 0.5301296720061022, "grad_norm": 0.5278358373812087, "learning_rate": 3.023965141612201e-05, "loss": 0.3888, "loss_nan_ranks": 0, "loss_rank_avg": 0.4036301076412201, "step": 695, "valid_targets_mean": 4288.9, "valid_targets_min": 1040 }, { "epoch": 0.5339435545385202, "grad_norm": 0.5073909224886175, "learning_rate": 3.045751633986928e-05, "loss": 0.3906, "loss_nan_ranks": 0, "loss_rank_avg": 0.3536445200443268, "step": 700, "valid_targets_mean": 3966.4, "valid_targets_min": 1084 }, { "epoch": 0.5377574370709383, "grad_norm": 0.4830058432421143, "learning_rate": 3.067538126361656e-05, "loss": 0.388, "loss_nan_ranks": 0, "loss_rank_avg": 0.4126201868057251, "step": 705, "valid_targets_mean": 5077.2, "valid_targets_min": 1141 }, { "epoch": 0.5415713196033562, "grad_norm": 0.47042770960997, "learning_rate": 3.0893246187363834e-05, "loss": 0.3825, "loss_nan_ranks": 0, "loss_rank_avg": 0.3704334497451782, "step": 710, "valid_targets_mean": 4411.2, "valid_targets_min": 1106 }, { "epoch": 0.5453852021357742, "grad_norm": 0.5497176981288221, "learning_rate": 3.111111111111112e-05, "loss": 0.3917, "loss_nan_ranks": 0, "loss_rank_avg": 0.3955814838409424, "step": 715, "valid_targets_mean": 4098.8, "valid_targets_min": 881 }, { "epoch": 0.5491990846681922, "grad_norm": 0.5024335146851029, "learning_rate": 3.132897603485839e-05, "loss": 0.4255, "loss_nan_ranks": 0, "loss_rank_avg": 0.4101240634918213, "step": 720, "valid_targets_mean": 4925.6, "valid_targets_min": 1056 }, { "epoch": 0.5530129672006102, "grad_norm": 0.5231997517163126, "learning_rate": 3.154684095860567e-05, "loss": 0.3913, "loss_nan_ranks": 0, "loss_rank_avg": 0.4119824469089508, "step": 725, "valid_targets_mean": 4464.0, "valid_targets_min": 1397 }, { "epoch": 0.5568268497330282, "grad_norm": 0.5711284191765268, "learning_rate": 3.1764705882352945e-05, "loss": 0.3777, "loss_nan_ranks": 0, "loss_rank_avg": 0.3848339319229126, "step": 730, "valid_targets_mean": 3427.6, "valid_targets_min": 850 }, { "epoch": 0.5606407322654462, "grad_norm": 0.5389152963467714, "learning_rate": 3.198257080610022e-05, "loss": 0.3996, "loss_nan_ranks": 0, "loss_rank_avg": 0.3863255977630615, "step": 735, "valid_targets_mean": 3456.2, "valid_targets_min": 928 }, { "epoch": 0.5644546147978642, "grad_norm": 0.49151065077688183, "learning_rate": 3.22004357298475e-05, "loss": 0.408, "loss_nan_ranks": 0, "loss_rank_avg": 0.3926849365234375, "step": 740, "valid_targets_mean": 4422.6, "valid_targets_min": 1164 }, { "epoch": 0.5682684973302822, "grad_norm": 0.4856172845776493, "learning_rate": 3.2418300653594774e-05, "loss": 0.3676, "loss_nan_ranks": 0, "loss_rank_avg": 0.4255011975765228, "step": 745, "valid_targets_mean": 5380.8, "valid_targets_min": 1094 }, { "epoch": 0.5720823798627003, "grad_norm": 0.4676240103796647, "learning_rate": 3.263616557734205e-05, "loss": 0.3912, "loss_nan_ranks": 0, "loss_rank_avg": 0.36335039138793945, "step": 750, "valid_targets_mean": 5003.5, "valid_targets_min": 1181 }, { "epoch": 0.5758962623951183, "grad_norm": 0.6001473921317693, "learning_rate": 3.2854030501089326e-05, "loss": 0.4009, "loss_nan_ranks": 0, "loss_rank_avg": 0.4211665689945221, "step": 755, "valid_targets_mean": 3523.4, "valid_targets_min": 652 }, { "epoch": 0.5797101449275363, "grad_norm": 0.4595865924313308, "learning_rate": 3.30718954248366e-05, "loss": 0.3937, "loss_nan_ranks": 0, "loss_rank_avg": 0.38674649596214294, "step": 760, "valid_targets_mean": 4933.9, "valid_targets_min": 887 }, { "epoch": 0.5835240274599542, "grad_norm": 0.5168951363868316, "learning_rate": 3.328976034858388e-05, "loss": 0.3983, "loss_nan_ranks": 0, "loss_rank_avg": 0.42586424946784973, "step": 765, "valid_targets_mean": 3924.8, "valid_targets_min": 909 }, { "epoch": 0.5873379099923722, "grad_norm": 0.4723825484517219, "learning_rate": 3.3507625272331155e-05, "loss": 0.3924, "loss_nan_ranks": 0, "loss_rank_avg": 0.365474134683609, "step": 770, "valid_targets_mean": 4569.1, "valid_targets_min": 1411 }, { "epoch": 0.5911517925247902, "grad_norm": 0.4771358236427614, "learning_rate": 3.372549019607844e-05, "loss": 0.3608, "loss_nan_ranks": 0, "loss_rank_avg": 0.36031606793403625, "step": 775, "valid_targets_mean": 4408.3, "valid_targets_min": 1060 }, { "epoch": 0.5949656750572082, "grad_norm": 0.5880545694161227, "learning_rate": 3.3943355119825714e-05, "loss": 0.39, "loss_nan_ranks": 0, "loss_rank_avg": 0.3750080168247223, "step": 780, "valid_targets_mean": 3936.3, "valid_targets_min": 1230 }, { "epoch": 0.5987795575896262, "grad_norm": 0.489467269189964, "learning_rate": 3.416122004357299e-05, "loss": 0.3692, "loss_nan_ranks": 0, "loss_rank_avg": 0.36050716042518616, "step": 785, "valid_targets_mean": 4176.9, "valid_targets_min": 306 }, { "epoch": 0.6025934401220442, "grad_norm": 0.5536794566949234, "learning_rate": 3.4379084967320266e-05, "loss": 0.3925, "loss_nan_ranks": 0, "loss_rank_avg": 0.35600319504737854, "step": 790, "valid_targets_mean": 3812.0, "valid_targets_min": 917 }, { "epoch": 0.6064073226544623, "grad_norm": 0.4902508002712552, "learning_rate": 3.459694989106754e-05, "loss": 0.3599, "loss_nan_ranks": 0, "loss_rank_avg": 0.34459996223449707, "step": 795, "valid_targets_mean": 4373.7, "valid_targets_min": 991 }, { "epoch": 0.6102212051868803, "grad_norm": 0.4998517004871938, "learning_rate": 3.481481481481482e-05, "loss": 0.3935, "loss_nan_ranks": 0, "loss_rank_avg": 0.411490797996521, "step": 800, "valid_targets_mean": 5246.0, "valid_targets_min": 927 }, { "epoch": 0.6140350877192983, "grad_norm": 0.47895938853802045, "learning_rate": 3.5032679738562094e-05, "loss": 0.3771, "loss_nan_ranks": 0, "loss_rank_avg": 0.38547301292419434, "step": 805, "valid_targets_mean": 5198.0, "valid_targets_min": 1305 }, { "epoch": 0.6178489702517163, "grad_norm": 0.5004860108698085, "learning_rate": 3.525054466230937e-05, "loss": 0.3687, "loss_nan_ranks": 0, "loss_rank_avg": 0.3470894396305084, "step": 810, "valid_targets_mean": 3868.3, "valid_targets_min": 840 }, { "epoch": 0.6216628527841342, "grad_norm": 0.5060663282767479, "learning_rate": 3.546840958605665e-05, "loss": 0.4047, "loss_nan_ranks": 0, "loss_rank_avg": 0.39354002475738525, "step": 815, "valid_targets_mean": 4378.5, "valid_targets_min": 1324 }, { "epoch": 0.6254767353165522, "grad_norm": 1.6522740852946434, "learning_rate": 3.568627450980393e-05, "loss": 0.6681, "loss_nan_ranks": 0, "loss_rank_avg": 0.7057502865791321, "step": 820, "valid_targets_mean": 834.8, "valid_targets_min": 622 }, { "epoch": 0.6292906178489702, "grad_norm": 0.5115480729000605, "learning_rate": 3.59041394335512e-05, "loss": 0.3951, "loss_nan_ranks": 0, "loss_rank_avg": 0.3566841185092926, "step": 825, "valid_targets_mean": 4504.2, "valid_targets_min": 356 }, { "epoch": 0.6331045003813882, "grad_norm": 0.5430480146137391, "learning_rate": 3.6122004357298475e-05, "loss": 0.382, "loss_nan_ranks": 0, "loss_rank_avg": 0.38058558106422424, "step": 830, "valid_targets_mean": 4257.1, "valid_targets_min": 1598 }, { "epoch": 0.6369183829138062, "grad_norm": 0.540378079231876, "learning_rate": 3.633986928104575e-05, "loss": 0.3767, "loss_nan_ranks": 0, "loss_rank_avg": 0.35072061419487, "step": 835, "valid_targets_mean": 4133.5, "valid_targets_min": 1372 }, { "epoch": 0.6407322654462243, "grad_norm": 0.5004544935516848, "learning_rate": 3.6557734204793034e-05, "loss": 0.3726, "loss_nan_ranks": 0, "loss_rank_avg": 0.33233800530433655, "step": 840, "valid_targets_mean": 4052.1, "valid_targets_min": 657 }, { "epoch": 0.6445461479786423, "grad_norm": 0.5183298816243558, "learning_rate": 3.677559912854031e-05, "loss": 0.3633, "loss_nan_ranks": 0, "loss_rank_avg": 0.4036792814731598, "step": 845, "valid_targets_mean": 4681.9, "valid_targets_min": 946 }, { "epoch": 0.6483600305110603, "grad_norm": 0.4847317504698284, "learning_rate": 3.699346405228759e-05, "loss": 0.4001, "loss_nan_ranks": 0, "loss_rank_avg": 0.40551283955574036, "step": 850, "valid_targets_mean": 5111.8, "valid_targets_min": 1202 }, { "epoch": 0.6521739130434783, "grad_norm": 0.4932653055447772, "learning_rate": 3.7211328976034856e-05, "loss": 0.4006, "loss_nan_ranks": 0, "loss_rank_avg": 0.4025735855102539, "step": 855, "valid_targets_mean": 5248.5, "valid_targets_min": 1118 }, { "epoch": 0.6559877955758963, "grad_norm": 0.47245011161392636, "learning_rate": 3.742919389978214e-05, "loss": 0.3887, "loss_nan_ranks": 0, "loss_rank_avg": 0.3714592754840851, "step": 860, "valid_targets_mean": 4735.7, "valid_targets_min": 1169 }, { "epoch": 0.6598016781083142, "grad_norm": 0.48874913799650793, "learning_rate": 3.7647058823529415e-05, "loss": 0.365, "loss_nan_ranks": 0, "loss_rank_avg": 0.35503053665161133, "step": 865, "valid_targets_mean": 4341.5, "valid_targets_min": 514 }, { "epoch": 0.6636155606407322, "grad_norm": 0.4993317096416843, "learning_rate": 3.786492374727669e-05, "loss": 0.3727, "loss_nan_ranks": 0, "loss_rank_avg": 0.3757993280887604, "step": 870, "valid_targets_mean": 4060.4, "valid_targets_min": 793 }, { "epoch": 0.6674294431731502, "grad_norm": 0.5080718314678389, "learning_rate": 3.808278867102397e-05, "loss": 0.3799, "loss_nan_ranks": 0, "loss_rank_avg": 0.35796621441841125, "step": 875, "valid_targets_mean": 4294.8, "valid_targets_min": 943 }, { "epoch": 0.6712433257055682, "grad_norm": 0.5139513225612712, "learning_rate": 3.8300653594771244e-05, "loss": 0.3826, "loss_nan_ranks": 0, "loss_rank_avg": 0.40277424454689026, "step": 880, "valid_targets_mean": 4046.4, "valid_targets_min": 1159 }, { "epoch": 0.6750572082379863, "grad_norm": 0.4825425455442106, "learning_rate": 3.851851851851852e-05, "loss": 0.3807, "loss_nan_ranks": 0, "loss_rank_avg": 0.3549913465976715, "step": 885, "valid_targets_mean": 4678.9, "valid_targets_min": 1080 }, { "epoch": 0.6788710907704043, "grad_norm": 0.46169037581763467, "learning_rate": 3.8736383442265796e-05, "loss": 0.3582, "loss_nan_ranks": 0, "loss_rank_avg": 0.3371763229370117, "step": 890, "valid_targets_mean": 4274.1, "valid_targets_min": 1006 }, { "epoch": 0.6826849733028223, "grad_norm": 0.5736539263411012, "learning_rate": 3.895424836601307e-05, "loss": 0.3746, "loss_nan_ranks": 0, "loss_rank_avg": 0.3682954013347626, "step": 895, "valid_targets_mean": 3701.7, "valid_targets_min": 1264 }, { "epoch": 0.6864988558352403, "grad_norm": 0.4573138967748284, "learning_rate": 3.917211328976035e-05, "loss": 0.3517, "loss_nan_ranks": 0, "loss_rank_avg": 0.3203882873058319, "step": 900, "valid_targets_mean": 5214.0, "valid_targets_min": 1596 }, { "epoch": 0.6903127383676583, "grad_norm": 0.5220685316176321, "learning_rate": 3.938997821350763e-05, "loss": 0.3892, "loss_nan_ranks": 0, "loss_rank_avg": 0.398406982421875, "step": 905, "valid_targets_mean": 3611.3, "valid_targets_min": 906 }, { "epoch": 0.6941266209000763, "grad_norm": 0.578745321361813, "learning_rate": 3.960784313725491e-05, "loss": 0.3721, "loss_nan_ranks": 0, "loss_rank_avg": 0.368577241897583, "step": 910, "valid_targets_mean": 3772.9, "valid_targets_min": 431 }, { "epoch": 0.6979405034324943, "grad_norm": 0.47869296323020866, "learning_rate": 3.9825708061002184e-05, "loss": 0.3771, "loss_nan_ranks": 0, "loss_rank_avg": 0.3765166699886322, "step": 915, "valid_targets_mean": 4115.8, "valid_targets_min": 843 }, { "epoch": 0.7017543859649122, "grad_norm": 0.4290499852367467, "learning_rate": 3.9999998553079044e-05, "loss": 0.3726, "loss_nan_ranks": 0, "loss_rank_avg": 0.34164825081825256, "step": 920, "valid_targets_mean": 4980.8, "valid_targets_min": 2055 }, { "epoch": 0.7055682684973302, "grad_norm": 0.4827158139422963, "learning_rate": 3.9999947910867415e-05, "loss": 0.3806, "loss_nan_ranks": 0, "loss_rank_avg": 0.4111228287220001, "step": 925, "valid_targets_mean": 5021.9, "valid_targets_min": 1334 }, { "epoch": 0.7093821510297483, "grad_norm": 0.565668431178144, "learning_rate": 3.9999824922817136e-05, "loss": 0.3899, "loss_nan_ranks": 0, "loss_rank_avg": 0.3945969343185425, "step": 930, "valid_targets_mean": 3504.0, "valid_targets_min": 994 }, { "epoch": 0.7131960335621663, "grad_norm": 0.5207733100448804, "learning_rate": 3.999962958937309e-05, "loss": 0.3706, "loss_nan_ranks": 0, "loss_rank_avg": 0.3764989674091339, "step": 935, "valid_targets_mean": 4280.6, "valid_targets_min": 1070 }, { "epoch": 0.7170099160945843, "grad_norm": 0.4961113556289845, "learning_rate": 3.999936191124184e-05, "loss": 0.3751, "loss_nan_ranks": 0, "loss_rank_avg": 0.40078458189964294, "step": 940, "valid_targets_mean": 4046.6, "valid_targets_min": 1336 }, { "epoch": 0.7208237986270023, "grad_norm": 0.5462231749803261, "learning_rate": 3.999902188939168e-05, "loss": 0.3784, "loss_nan_ranks": 0, "loss_rank_avg": 0.38428983092308044, "step": 945, "valid_targets_mean": 4143.9, "valid_targets_min": 859 }, { "epoch": 0.7246376811594203, "grad_norm": 0.4504728537471523, "learning_rate": 3.999860952505256e-05, "loss": 0.3627, "loss_nan_ranks": 0, "loss_rank_avg": 0.38030561804771423, "step": 950, "valid_targets_mean": 5215.9, "valid_targets_min": 1424 }, { "epoch": 0.7284515636918383, "grad_norm": 0.46112814246368733, "learning_rate": 3.999812481971613e-05, "loss": 0.3626, "loss_nan_ranks": 0, "loss_rank_avg": 0.35764268040657043, "step": 955, "valid_targets_mean": 4956.2, "valid_targets_min": 1100 }, { "epoch": 0.7322654462242563, "grad_norm": 0.5093811115162794, "learning_rate": 3.999756777513573e-05, "loss": 0.3814, "loss_nan_ranks": 0, "loss_rank_avg": 0.38869643211364746, "step": 960, "valid_targets_mean": 4663.0, "valid_targets_min": 1162 }, { "epoch": 0.7360793287566743, "grad_norm": 0.5166363577249488, "learning_rate": 3.999693839332633e-05, "loss": 0.3706, "loss_nan_ranks": 0, "loss_rank_avg": 0.345225065946579, "step": 965, "valid_targets_mean": 4345.2, "valid_targets_min": 1173 }, { "epoch": 0.7398932112890922, "grad_norm": 0.43456501611751824, "learning_rate": 3.9996236676564606e-05, "loss": 0.3893, "loss_nan_ranks": 0, "loss_rank_avg": 0.3924640715122223, "step": 970, "valid_targets_mean": 5048.5, "valid_targets_min": 467 }, { "epoch": 0.7437070938215103, "grad_norm": 0.4528833919025705, "learning_rate": 3.9995462627388884e-05, "loss": 0.3808, "loss_nan_ranks": 0, "loss_rank_avg": 0.3907564878463745, "step": 975, "valid_targets_mean": 5262.2, "valid_targets_min": 1557 }, { "epoch": 0.7475209763539283, "grad_norm": 0.44803105770779067, "learning_rate": 3.999461624859913e-05, "loss": 0.3779, "loss_nan_ranks": 0, "loss_rank_avg": 0.3801683187484741, "step": 980, "valid_targets_mean": 5022.8, "valid_targets_min": 1333 }, { "epoch": 0.7513348588863463, "grad_norm": 1.3945522001589343, "learning_rate": 3.999369754325694e-05, "loss": 0.5941, "loss_nan_ranks": 0, "loss_rank_avg": 0.7252269387245178, "step": 985, "valid_targets_mean": 882.6, "valid_targets_min": 583 }, { "epoch": 0.7551487414187643, "grad_norm": 0.4459691668091537, "learning_rate": 3.999270651468557e-05, "loss": 0.3752, "loss_nan_ranks": 0, "loss_rank_avg": 0.3678567707538605, "step": 990, "valid_targets_mean": 4537.0, "valid_targets_min": 843 }, { "epoch": 0.7589626239511823, "grad_norm": 0.6787380715262016, "learning_rate": 3.999164316646985e-05, "loss": 0.3809, "loss_nan_ranks": 0, "loss_rank_avg": 0.43198099732398987, "step": 995, "valid_targets_mean": 4426.8, "valid_targets_min": 1103 }, { "epoch": 0.7627765064836003, "grad_norm": 0.5234474839142296, "learning_rate": 3.999050750245624e-05, "loss": 0.3541, "loss_nan_ranks": 0, "loss_rank_avg": 0.3377021253108978, "step": 1000, "valid_targets_mean": 3565.2, "valid_targets_min": 1013 }, { "epoch": 0.7665903890160183, "grad_norm": 0.4701290801073301, "learning_rate": 3.998929952675278e-05, "loss": 0.3944, "loss_nan_ranks": 0, "loss_rank_avg": 0.39100274443626404, "step": 1005, "valid_targets_mean": 5459.8, "valid_targets_min": 1291 }, { "epoch": 0.7704042715484363, "grad_norm": 0.4887301565086132, "learning_rate": 3.998801924372908e-05, "loss": 0.3898, "loss_nan_ranks": 0, "loss_rank_avg": 0.41781285405158997, "step": 1010, "valid_targets_mean": 4056.2, "valid_targets_min": 1102 }, { "epoch": 0.7742181540808543, "grad_norm": 0.46737377548754167, "learning_rate": 3.99866666580163e-05, "loss": 0.3463, "loss_nan_ranks": 0, "loss_rank_avg": 0.3446056842803955, "step": 1015, "valid_targets_mean": 4130.0, "valid_targets_min": 327 }, { "epoch": 0.7780320366132724, "grad_norm": 0.47600381282403187, "learning_rate": 3.9985241774507164e-05, "loss": 0.3785, "loss_nan_ranks": 0, "loss_rank_avg": 0.3605664074420929, "step": 1020, "valid_targets_mean": 4542.7, "valid_targets_min": 1212 }, { "epoch": 0.7818459191456903, "grad_norm": 0.4522050546091532, "learning_rate": 3.998374459835591e-05, "loss": 0.3638, "loss_nan_ranks": 0, "loss_rank_avg": 0.36169174313545227, "step": 1025, "valid_targets_mean": 4604.6, "valid_targets_min": 420 }, { "epoch": 0.7856598016781083, "grad_norm": 0.49172411587001463, "learning_rate": 3.998217513497825e-05, "loss": 0.3635, "loss_nan_ranks": 0, "loss_rank_avg": 0.3846949636936188, "step": 1030, "valid_targets_mean": 4501.2, "valid_targets_min": 1410 }, { "epoch": 0.7894736842105263, "grad_norm": 0.441370684061777, "learning_rate": 3.998053339005142e-05, "loss": 0.3515, "loss_nan_ranks": 0, "loss_rank_avg": 0.33769798278808594, "step": 1035, "valid_targets_mean": 4676.2, "valid_targets_min": 577 }, { "epoch": 0.7932875667429443, "grad_norm": 0.5082455341543946, "learning_rate": 3.9978819369514115e-05, "loss": 0.3569, "loss_nan_ranks": 0, "loss_rank_avg": 0.3954106569290161, "step": 1040, "valid_targets_mean": 3732.4, "valid_targets_min": 1297 }, { "epoch": 0.7971014492753623, "grad_norm": 0.5239126884155341, "learning_rate": 3.997703307956646e-05, "loss": 0.3704, "loss_nan_ranks": 0, "loss_rank_avg": 0.37683117389678955, "step": 1045, "valid_targets_mean": 4162.2, "valid_targets_min": 929 }, { "epoch": 0.8009153318077803, "grad_norm": 0.45893851228954163, "learning_rate": 3.9975174526669994e-05, "loss": 0.373, "loss_nan_ranks": 0, "loss_rank_avg": 0.3459120988845825, "step": 1050, "valid_targets_mean": 4355.8, "valid_targets_min": 1475 }, { "epoch": 0.8047292143401983, "grad_norm": 0.5054974279416519, "learning_rate": 3.997324371754767e-05, "loss": 0.345, "loss_nan_ranks": 0, "loss_rank_avg": 0.38253259658813477, "step": 1055, "valid_targets_mean": 4271.6, "valid_targets_min": 877 }, { "epoch": 0.8085430968726163, "grad_norm": 0.5185372806749117, "learning_rate": 3.9971240659183805e-05, "loss": 0.3918, "loss_nan_ranks": 0, "loss_rank_avg": 0.4232671558856964, "step": 1060, "valid_targets_mean": 4016.3, "valid_targets_min": 1584 }, { "epoch": 0.8123569794050344, "grad_norm": 0.5512258043463327, "learning_rate": 3.996916535882407e-05, "loss": 0.3762, "loss_nan_ranks": 0, "loss_rank_avg": 0.41251853108406067, "step": 1065, "valid_targets_mean": 3834.4, "valid_targets_min": 963 }, { "epoch": 0.8161708619374524, "grad_norm": 0.49799468322654605, "learning_rate": 3.996701782397544e-05, "loss": 0.3474, "loss_nan_ranks": 0, "loss_rank_avg": 0.3488624393939972, "step": 1070, "valid_targets_mean": 4394.7, "valid_targets_min": 971 }, { "epoch": 0.8199847444698704, "grad_norm": 0.4404711299084823, "learning_rate": 3.9964798062406205e-05, "loss": 0.3581, "loss_nan_ranks": 0, "loss_rank_avg": 0.3426206409931183, "step": 1075, "valid_targets_mean": 5370.3, "valid_targets_min": 930 }, { "epoch": 0.8237986270022883, "grad_norm": 0.4720172689171758, "learning_rate": 3.996250608214591e-05, "loss": 0.3559, "loss_nan_ranks": 0, "loss_rank_avg": 0.35691210627555847, "step": 1080, "valid_targets_mean": 4801.6, "valid_targets_min": 1460 }, { "epoch": 0.8276125095347063, "grad_norm": 0.5500897649466603, "learning_rate": 3.996014189148534e-05, "loss": 0.3842, "loss_nan_ranks": 0, "loss_rank_avg": 0.39323708415031433, "step": 1085, "valid_targets_mean": 3530.9, "valid_targets_min": 516 }, { "epoch": 0.8314263920671243, "grad_norm": 0.5199194226587828, "learning_rate": 3.995770549897648e-05, "loss": 0.3816, "loss_nan_ranks": 0, "loss_rank_avg": 0.38213369250297546, "step": 1090, "valid_targets_mean": 5115.5, "valid_targets_min": 1055 }, { "epoch": 0.8352402745995423, "grad_norm": 0.762344226599133, "learning_rate": 3.9955196913432506e-05, "loss": 0.3641, "loss_nan_ranks": 0, "loss_rank_avg": 0.3407316207885742, "step": 1095, "valid_targets_mean": 4745.6, "valid_targets_min": 1724 }, { "epoch": 0.8390541571319603, "grad_norm": 0.4767081980686291, "learning_rate": 3.995261614392771e-05, "loss": 0.3519, "loss_nan_ranks": 0, "loss_rank_avg": 0.3628446161746979, "step": 1100, "valid_targets_mean": 4455.9, "valid_targets_min": 1123 }, { "epoch": 0.8428680396643783, "grad_norm": 0.4603493033632945, "learning_rate": 3.994996319979753e-05, "loss": 0.3847, "loss_nan_ranks": 0, "loss_rank_avg": 0.37550342082977295, "step": 1105, "valid_targets_mean": 4831.5, "valid_targets_min": 1362 }, { "epoch": 0.8466819221967964, "grad_norm": 0.4321868829723287, "learning_rate": 3.9947238090638455e-05, "loss": 0.347, "loss_nan_ranks": 0, "loss_rank_avg": 0.32966333627700806, "step": 1110, "valid_targets_mean": 5257.2, "valid_targets_min": 2401 }, { "epoch": 0.8504958047292144, "grad_norm": 0.4928212125106336, "learning_rate": 3.994444082630803e-05, "loss": 0.3718, "loss_nan_ranks": 0, "loss_rank_avg": 0.40663325786590576, "step": 1115, "valid_targets_mean": 4272.6, "valid_targets_min": 1201 }, { "epoch": 0.8543096872616324, "grad_norm": 0.5369422324647564, "learning_rate": 3.99415714169248e-05, "loss": 0.3744, "loss_nan_ranks": 0, "loss_rank_avg": 0.38518229126930237, "step": 1120, "valid_targets_mean": 4210.9, "valid_targets_min": 1195 }, { "epoch": 0.8581235697940504, "grad_norm": 0.531536440074966, "learning_rate": 3.993862987286829e-05, "loss": 0.3624, "loss_nan_ranks": 0, "loss_rank_avg": 0.34791314601898193, "step": 1125, "valid_targets_mean": 4195.2, "valid_targets_min": 908 }, { "epoch": 0.8619374523264683, "grad_norm": 0.5120386360242026, "learning_rate": 3.993561620477894e-05, "loss": 0.3939, "loss_nan_ranks": 0, "loss_rank_avg": 0.4098881781101227, "step": 1130, "valid_targets_mean": 4433.9, "valid_targets_min": 861 }, { "epoch": 0.8657513348588863, "grad_norm": 0.5546229292064857, "learning_rate": 3.993253042355811e-05, "loss": 0.3508, "loss_nan_ranks": 0, "loss_rank_avg": 0.38434138894081116, "step": 1135, "valid_targets_mean": 4411.3, "valid_targets_min": 1015 }, { "epoch": 0.8695652173913043, "grad_norm": 0.4847205687071689, "learning_rate": 3.992937254036798e-05, "loss": 0.3689, "loss_nan_ranks": 0, "loss_rank_avg": 0.35996517539024353, "step": 1140, "valid_targets_mean": 4372.5, "valid_targets_min": 730 }, { "epoch": 0.8733790999237223, "grad_norm": 0.496578789451106, "learning_rate": 3.992614256663159e-05, "loss": 0.3809, "loss_nan_ranks": 0, "loss_rank_avg": 0.38061416149139404, "step": 1145, "valid_targets_mean": 3699.5, "valid_targets_min": 1064 }, { "epoch": 0.8771929824561403, "grad_norm": 1.3174959384842835, "learning_rate": 3.992284051403272e-05, "loss": 0.6232, "loss_nan_ranks": 0, "loss_rank_avg": 0.7174744009971619, "step": 1150, "valid_targets_mean": 924.8, "valid_targets_min": 595 }, { "epoch": 0.8810068649885584, "grad_norm": 0.5184996714136828, "learning_rate": 3.991946639451588e-05, "loss": 0.3731, "loss_nan_ranks": 0, "loss_rank_avg": 0.36945977807044983, "step": 1155, "valid_targets_mean": 3840.2, "valid_targets_min": 1092 }, { "epoch": 0.8848207475209764, "grad_norm": 0.5374317618484389, "learning_rate": 3.991602022028628e-05, "loss": 0.3579, "loss_nan_ranks": 0, "loss_rank_avg": 0.3723803460597992, "step": 1160, "valid_targets_mean": 4231.3, "valid_targets_min": 427 }, { "epoch": 0.8886346300533944, "grad_norm": 0.44966249003897346, "learning_rate": 3.991250200380978e-05, "loss": 0.3575, "loss_nan_ranks": 0, "loss_rank_avg": 0.32036292552948, "step": 1165, "valid_targets_mean": 4182.4, "valid_targets_min": 1484 }, { "epoch": 0.8924485125858124, "grad_norm": 0.4823324463114382, "learning_rate": 3.9908911757812816e-05, "loss": 0.3684, "loss_nan_ranks": 0, "loss_rank_avg": 0.328177809715271, "step": 1170, "valid_targets_mean": 3529.1, "valid_targets_min": 437 }, { "epoch": 0.8962623951182304, "grad_norm": 0.4552734443679323, "learning_rate": 3.99052494952824e-05, "loss": 0.3835, "loss_nan_ranks": 0, "loss_rank_avg": 0.3691507875919342, "step": 1175, "valid_targets_mean": 4576.7, "valid_targets_min": 530 }, { "epoch": 0.9000762776506483, "grad_norm": 0.48871644633752215, "learning_rate": 3.9901515229466035e-05, "loss": 0.357, "loss_nan_ranks": 0, "loss_rank_avg": 0.3446696698665619, "step": 1180, "valid_targets_mean": 3823.9, "valid_targets_min": 1160 }, { "epoch": 0.9038901601830663, "grad_norm": 0.49070083319956265, "learning_rate": 3.98977089738717e-05, "loss": 0.3807, "loss_nan_ranks": 0, "loss_rank_avg": 0.41360974311828613, "step": 1185, "valid_targets_mean": 4416.5, "valid_targets_min": 705 }, { "epoch": 0.9077040427154843, "grad_norm": 0.5313518804759381, "learning_rate": 3.9893830742267734e-05, "loss": 0.3682, "loss_nan_ranks": 0, "loss_rank_avg": 0.38949641585350037, "step": 1190, "valid_targets_mean": 6101.7, "valid_targets_min": 894 }, { "epoch": 0.9115179252479023, "grad_norm": 0.4604256113230519, "learning_rate": 3.9889880548682896e-05, "loss": 0.3696, "loss_nan_ranks": 0, "loss_rank_avg": 0.38642418384552, "step": 1195, "valid_targets_mean": 4514.3, "valid_targets_min": 1035 }, { "epoch": 0.9153318077803204, "grad_norm": 0.47292655188438054, "learning_rate": 3.988585840740623e-05, "loss": 0.3735, "loss_nan_ranks": 0, "loss_rank_avg": 0.37636706233024597, "step": 1200, "valid_targets_mean": 4110.0, "valid_targets_min": 442 }, { "epoch": 0.9191456903127384, "grad_norm": 0.43282070896702063, "learning_rate": 3.988176433298701e-05, "loss": 0.3703, "loss_nan_ranks": 0, "loss_rank_avg": 0.38640037178993225, "step": 1205, "valid_targets_mean": 5378.8, "valid_targets_min": 1510 }, { "epoch": 0.9229595728451564, "grad_norm": 0.5020061109814692, "learning_rate": 3.987759834023477e-05, "loss": 0.3581, "loss_nan_ranks": 0, "loss_rank_avg": 0.363527774810791, "step": 1210, "valid_targets_mean": 4316.7, "valid_targets_min": 434 }, { "epoch": 0.9267734553775744, "grad_norm": 0.4642198593500714, "learning_rate": 3.9873360444219125e-05, "loss": 0.3755, "loss_nan_ranks": 0, "loss_rank_avg": 0.37602806091308594, "step": 1215, "valid_targets_mean": 4150.8, "valid_targets_min": 1320 }, { "epoch": 0.9305873379099924, "grad_norm": 0.5016336613847343, "learning_rate": 3.986905066026985e-05, "loss": 0.3723, "loss_nan_ranks": 0, "loss_rank_avg": 0.3845888674259186, "step": 1220, "valid_targets_mean": 3580.5, "valid_targets_min": 952 }, { "epoch": 0.9344012204424104, "grad_norm": 0.4361161272703576, "learning_rate": 3.9864669003976725e-05, "loss": 0.3553, "loss_nan_ranks": 0, "loss_rank_avg": 0.3639432489871979, "step": 1225, "valid_targets_mean": 5493.5, "valid_targets_min": 1451 }, { "epoch": 0.9382151029748284, "grad_norm": 0.4678700452231829, "learning_rate": 3.986021549118951e-05, "loss": 0.3726, "loss_nan_ranks": 0, "loss_rank_avg": 0.3865402042865753, "step": 1230, "valid_targets_mean": 4640.3, "valid_targets_min": 1688 }, { "epoch": 0.9420289855072463, "grad_norm": 0.4582516805863473, "learning_rate": 3.985569013801791e-05, "loss": 0.3615, "loss_nan_ranks": 0, "loss_rank_avg": 0.344419002532959, "step": 1235, "valid_targets_mean": 4298.5, "valid_targets_min": 1232 }, { "epoch": 0.9458428680396643, "grad_norm": 0.5508795531110707, "learning_rate": 3.985109296083149e-05, "loss": 0.3782, "loss_nan_ranks": 0, "loss_rank_avg": 0.35687825083732605, "step": 1240, "valid_targets_mean": 4338.5, "valid_targets_min": 1302 }, { "epoch": 0.9496567505720824, "grad_norm": 0.46268472568580293, "learning_rate": 3.9846423976259636e-05, "loss": 0.3554, "loss_nan_ranks": 0, "loss_rank_avg": 0.33932235836982727, "step": 1245, "valid_targets_mean": 4154.8, "valid_targets_min": 268 }, { "epoch": 0.9534706331045004, "grad_norm": 0.43968402739940654, "learning_rate": 3.984168320119146e-05, "loss": 0.3521, "loss_nan_ranks": 0, "loss_rank_avg": 0.32227084040641785, "step": 1250, "valid_targets_mean": 4389.7, "valid_targets_min": 1339 }, { "epoch": 0.9572845156369184, "grad_norm": 0.44988479442594437, "learning_rate": 3.983687065277577e-05, "loss": 0.3646, "loss_nan_ranks": 0, "loss_rank_avg": 0.3949045240879059, "step": 1255, "valid_targets_mean": 4869.5, "valid_targets_min": 504 }, { "epoch": 0.9610983981693364, "grad_norm": 0.40537038635756434, "learning_rate": 3.983198634842103e-05, "loss": 0.3501, "loss_nan_ranks": 0, "loss_rank_avg": 0.3526088297367096, "step": 1260, "valid_targets_mean": 5280.7, "valid_targets_min": 1398 }, { "epoch": 0.9649122807017544, "grad_norm": 0.4874777591749203, "learning_rate": 3.98270303057952e-05, "loss": 0.3609, "loss_nan_ranks": 0, "loss_rank_avg": 0.3578772246837616, "step": 1265, "valid_targets_mean": 3603.2, "valid_targets_min": 885 }, { "epoch": 0.9687261632341724, "grad_norm": 0.5168742238318518, "learning_rate": 3.982200254282582e-05, "loss": 0.3822, "loss_nan_ranks": 0, "loss_rank_avg": 0.3917689621448517, "step": 1270, "valid_targets_mean": 4895.9, "valid_targets_min": 1220 }, { "epoch": 0.9725400457665904, "grad_norm": 0.4316036947777234, "learning_rate": 3.981690307769979e-05, "loss": 0.3573, "loss_nan_ranks": 0, "loss_rank_avg": 0.3554462194442749, "step": 1275, "valid_targets_mean": 5234.3, "valid_targets_min": 1270 }, { "epoch": 0.9763539282990084, "grad_norm": 0.429176169776203, "learning_rate": 3.981173192886344e-05, "loss": 0.3637, "loss_nan_ranks": 0, "loss_rank_avg": 0.3734845221042633, "step": 1280, "valid_targets_mean": 4930.2, "valid_targets_min": 1275 }, { "epoch": 0.9801678108314263, "grad_norm": 0.4957017873240747, "learning_rate": 3.9806489115022354e-05, "loss": 0.3662, "loss_nan_ranks": 0, "loss_rank_avg": 0.3890209496021271, "step": 1285, "valid_targets_mean": 4734.1, "valid_targets_min": 949 }, { "epoch": 0.9839816933638444, "grad_norm": 0.5143350218465076, "learning_rate": 3.980117465514138e-05, "loss": 0.3723, "loss_nan_ranks": 0, "loss_rank_avg": 0.364015132188797, "step": 1290, "valid_targets_mean": 3851.5, "valid_targets_min": 1105 }, { "epoch": 0.9877955758962624, "grad_norm": 0.45135446002856094, "learning_rate": 3.979578856844452e-05, "loss": 0.3596, "loss_nan_ranks": 0, "loss_rank_avg": 0.34121426939964294, "step": 1295, "valid_targets_mean": 4531.8, "valid_targets_min": 1130 }, { "epoch": 0.9916094584286804, "grad_norm": 0.45261428570516965, "learning_rate": 3.9790330874414866e-05, "loss": 0.3608, "loss_nan_ranks": 0, "loss_rank_avg": 0.3475932776927948, "step": 1300, "valid_targets_mean": 4569.3, "valid_targets_min": 1345 }, { "epoch": 0.9954233409610984, "grad_norm": 0.5036230227201647, "learning_rate": 3.978480159279455e-05, "loss": 0.3675, "loss_nan_ranks": 0, "loss_rank_avg": 0.40386661887168884, "step": 1305, "valid_targets_mean": 4841.8, "valid_targets_min": 1035 }, { "epoch": 0.9992372234935164, "grad_norm": 1.4960925211456237, "learning_rate": 3.9779200743584644e-05, "loss": 0.5992, "loss_nan_ranks": 0, "loss_rank_avg": 0.7448456883430481, "step": 1310, "valid_targets_mean": 893.5, "valid_targets_min": 437 }, { "epoch": 1.0030511060259344, "grad_norm": 0.4793463160181418, "learning_rate": 3.977352834704512e-05, "loss": 0.4091, "loss_nan_ranks": 0, "loss_rank_avg": 0.33799681067466736, "step": 1315, "valid_targets_mean": 5001.8, "valid_targets_min": 1201 }, { "epoch": 1.0068649885583525, "grad_norm": 0.5438675684910989, "learning_rate": 3.976778442369472e-05, "loss": 0.3658, "loss_nan_ranks": 0, "loss_rank_avg": 0.3457205295562744, "step": 1320, "valid_targets_mean": 3972.8, "valid_targets_min": 1183 }, { "epoch": 1.0106788710907704, "grad_norm": 0.5140942413587252, "learning_rate": 3.9761968994310966e-05, "loss": 0.3708, "loss_nan_ranks": 0, "loss_rank_avg": 0.3165968954563141, "step": 1325, "valid_targets_mean": 4328.2, "valid_targets_min": 1027 }, { "epoch": 1.0144927536231885, "grad_norm": 0.45617290652451703, "learning_rate": 3.975608207993002e-05, "loss": 0.3639, "loss_nan_ranks": 0, "loss_rank_avg": 0.3801937401294708, "step": 1330, "valid_targets_mean": 3989.0, "valid_targets_min": 1000 }, { "epoch": 1.0183066361556063, "grad_norm": 0.4341972844635562, "learning_rate": 3.9750123701846615e-05, "loss": 0.358, "loss_nan_ranks": 0, "loss_rank_avg": 0.3951098918914795, "step": 1335, "valid_targets_mean": 4721.1, "valid_targets_min": 1509 }, { "epoch": 1.0221205186880244, "grad_norm": 0.46730836638900286, "learning_rate": 3.974409388161401e-05, "loss": 0.3683, "loss_nan_ranks": 0, "loss_rank_avg": 0.40257081389427185, "step": 1340, "valid_targets_mean": 4757.3, "valid_targets_min": 579 }, { "epoch": 1.0259344012204423, "grad_norm": 0.5515646605187918, "learning_rate": 3.973799264104387e-05, "loss": 0.3523, "loss_nan_ranks": 0, "loss_rank_avg": 0.36521920561790466, "step": 1345, "valid_targets_mean": 3518.1, "valid_targets_min": 703 }, { "epoch": 1.0297482837528604, "grad_norm": 0.470326967727145, "learning_rate": 3.973182000220622e-05, "loss": 0.3873, "loss_nan_ranks": 0, "loss_rank_avg": 0.38522180914878845, "step": 1350, "valid_targets_mean": 4128.1, "valid_targets_min": 1327 }, { "epoch": 1.0335621662852783, "grad_norm": 0.40705686780411454, "learning_rate": 3.972557598742938e-05, "loss": 0.3371, "loss_nan_ranks": 0, "loss_rank_avg": 0.3122781217098236, "step": 1355, "valid_targets_mean": 4659.9, "valid_targets_min": 1388 }, { "epoch": 1.0373760488176964, "grad_norm": 0.44803605568572163, "learning_rate": 3.9719260619299806e-05, "loss": 0.3431, "loss_nan_ranks": 0, "loss_rank_avg": 0.36841270327568054, "step": 1360, "valid_targets_mean": 4919.1, "valid_targets_min": 825 }, { "epoch": 1.0411899313501145, "grad_norm": 0.46321347066260277, "learning_rate": 3.9712873920662096e-05, "loss": 0.3511, "loss_nan_ranks": 0, "loss_rank_avg": 0.3696576654911041, "step": 1365, "valid_targets_mean": 4718.7, "valid_targets_min": 1230 }, { "epoch": 1.0450038138825324, "grad_norm": 0.5080500551538887, "learning_rate": 3.970641591461886e-05, "loss": 0.3581, "loss_nan_ranks": 0, "loss_rank_avg": 0.33408328890800476, "step": 1370, "valid_targets_mean": 3776.7, "valid_targets_min": 921 }, { "epoch": 1.0488176964149505, "grad_norm": 0.4401310958483072, "learning_rate": 3.9699886624530664e-05, "loss": 0.3579, "loss_nan_ranks": 0, "loss_rank_avg": 0.32947924733161926, "step": 1375, "valid_targets_mean": 5090.0, "valid_targets_min": 947 }, { "epoch": 1.0526315789473684, "grad_norm": 0.45200095524939027, "learning_rate": 3.9693286074015904e-05, "loss": 0.345, "loss_nan_ranks": 0, "loss_rank_avg": 0.3618582785129547, "step": 1380, "valid_targets_mean": 4528.5, "valid_targets_min": 711 }, { "epoch": 1.0564454614797865, "grad_norm": 0.47049293711643714, "learning_rate": 3.968661428695077e-05, "loss": 0.3713, "loss_nan_ranks": 0, "loss_rank_avg": 0.3690056800842285, "step": 1385, "valid_targets_mean": 4277.3, "valid_targets_min": 917 }, { "epoch": 1.0602593440122043, "grad_norm": 0.4737449066959073, "learning_rate": 3.967987128746913e-05, "loss": 0.3575, "loss_nan_ranks": 0, "loss_rank_avg": 0.4023532569408417, "step": 1390, "valid_targets_mean": 4950.3, "valid_targets_min": 1222 }, { "epoch": 1.0640732265446224, "grad_norm": 0.49450505312447235, "learning_rate": 3.967305709996243e-05, "loss": 0.3555, "loss_nan_ranks": 0, "loss_rank_avg": 0.3727036416530609, "step": 1395, "valid_targets_mean": 4383.7, "valid_targets_min": 531 }, { "epoch": 1.0678871090770405, "grad_norm": 0.5028180651368124, "learning_rate": 3.966617174907965e-05, "loss": 0.3592, "loss_nan_ranks": 0, "loss_rank_avg": 0.37223827838897705, "step": 1400, "valid_targets_mean": 3776.0, "valid_targets_min": 1426 }, { "epoch": 1.0717009916094584, "grad_norm": 0.43787090970748827, "learning_rate": 3.965921525972717e-05, "loss": 0.354, "loss_nan_ranks": 0, "loss_rank_avg": 0.3454868495464325, "step": 1405, "valid_targets_mean": 5180.0, "valid_targets_min": 1199 }, { "epoch": 1.0755148741418765, "grad_norm": 0.4319389732299042, "learning_rate": 3.965218765706872e-05, "loss": 0.356, "loss_nan_ranks": 0, "loss_rank_avg": 0.3510608971118927, "step": 1410, "valid_targets_mean": 5052.3, "valid_targets_min": 1547 }, { "epoch": 1.0793287566742944, "grad_norm": 0.48206632149639017, "learning_rate": 3.964508896652525e-05, "loss": 0.3467, "loss_nan_ranks": 0, "loss_rank_avg": 0.36549773812294006, "step": 1415, "valid_targets_mean": 4058.3, "valid_targets_min": 1098 }, { "epoch": 1.0831426392067125, "grad_norm": 0.4967406185966264, "learning_rate": 3.9637919213774874e-05, "loss": 0.3693, "loss_nan_ranks": 0, "loss_rank_avg": 0.4231281280517578, "step": 1420, "valid_targets_mean": 4121.5, "valid_targets_min": 1049 }, { "epoch": 1.0869565217391304, "grad_norm": 0.4878295316799637, "learning_rate": 3.9630678424752735e-05, "loss": 0.3531, "loss_nan_ranks": 0, "loss_rank_avg": 0.37907230854034424, "step": 1425, "valid_targets_mean": 4030.7, "valid_targets_min": 1407 }, { "epoch": 1.0907704042715485, "grad_norm": 0.5465674854063036, "learning_rate": 3.962336662565095e-05, "loss": 0.3653, "loss_nan_ranks": 0, "loss_rank_avg": 0.4150486886501312, "step": 1430, "valid_targets_mean": 4677.6, "valid_targets_min": 1302 }, { "epoch": 1.0945842868039664, "grad_norm": 0.49768719325902566, "learning_rate": 3.96159838429185e-05, "loss": 0.3615, "loss_nan_ranks": 0, "loss_rank_avg": 0.3882100582122803, "step": 1435, "valid_targets_mean": 3504.0, "valid_targets_min": 1117 }, { "epoch": 1.0983981693363845, "grad_norm": 0.4537747668323573, "learning_rate": 3.9608530103261144e-05, "loss": 0.3349, "loss_nan_ranks": 0, "loss_rank_avg": 0.3308643400669098, "step": 1440, "valid_targets_mean": 4242.5, "valid_targets_min": 1444 }, { "epoch": 1.1022120518688023, "grad_norm": 0.5164541178291466, "learning_rate": 3.960100543364129e-05, "loss": 0.3534, "loss_nan_ranks": 0, "loss_rank_avg": 0.3670574128627777, "step": 1445, "valid_targets_mean": 3909.9, "valid_targets_min": 725 }, { "epoch": 1.1060259344012204, "grad_norm": 0.491392353620686, "learning_rate": 3.959340986127795e-05, "loss": 0.3538, "loss_nan_ranks": 0, "loss_rank_avg": 0.36460360884666443, "step": 1450, "valid_targets_mean": 3961.4, "valid_targets_min": 1059 }, { "epoch": 1.1098398169336385, "grad_norm": 0.4847216514006396, "learning_rate": 3.958574341364659e-05, "loss": 0.3736, "loss_nan_ranks": 0, "loss_rank_avg": 0.35377323627471924, "step": 1455, "valid_targets_mean": 4016.4, "valid_targets_min": 981 }, { "epoch": 1.1136536994660564, "grad_norm": 0.4406608047156622, "learning_rate": 3.957800611847907e-05, "loss": 0.3373, "loss_nan_ranks": 0, "loss_rank_avg": 0.3387221097946167, "step": 1460, "valid_targets_mean": 4490.6, "valid_targets_min": 1025 }, { "epoch": 1.1174675819984745, "grad_norm": 0.5213473880559113, "learning_rate": 3.95701980037635e-05, "loss": 0.351, "loss_nan_ranks": 0, "loss_rank_avg": 0.3637104332447052, "step": 1465, "valid_targets_mean": 3972.2, "valid_targets_min": 419 }, { "epoch": 1.1212814645308924, "grad_norm": 0.4556617981657067, "learning_rate": 3.956231909774421e-05, "loss": 0.358, "loss_nan_ranks": 0, "loss_rank_avg": 0.3975560665130615, "step": 1470, "valid_targets_mean": 4520.6, "valid_targets_min": 972 }, { "epoch": 1.1250953470633105, "grad_norm": 0.6469133777791192, "learning_rate": 3.955436942892156e-05, "loss": 0.572, "loss_nan_ranks": 0, "loss_rank_avg": 0.4174586534500122, "step": 1475, "valid_targets_mean": 2480.5, "valid_targets_min": 586 }, { "epoch": 1.1289092295957284, "grad_norm": 0.5042352279798316, "learning_rate": 3.9546349026051886e-05, "loss": 0.3572, "loss_nan_ranks": 0, "loss_rank_avg": 0.3503652513027191, "step": 1480, "valid_targets_mean": 4591.0, "valid_targets_min": 1422 }, { "epoch": 1.1327231121281465, "grad_norm": 0.4639759371870002, "learning_rate": 3.953825791814743e-05, "loss": 0.3625, "loss_nan_ranks": 0, "loss_rank_avg": 0.3499886989593506, "step": 1485, "valid_targets_mean": 4414.1, "valid_targets_min": 802 }, { "epoch": 1.1365369946605646, "grad_norm": 0.49820487639813743, "learning_rate": 3.9530096134476155e-05, "loss": 0.3769, "loss_nan_ranks": 0, "loss_rank_avg": 0.4116916358470917, "step": 1490, "valid_targets_mean": 4242.8, "valid_targets_min": 1180 }, { "epoch": 1.1403508771929824, "grad_norm": 0.4163673959740096, "learning_rate": 3.9521863704561684e-05, "loss": 0.338, "loss_nan_ranks": 0, "loss_rank_avg": 0.3374262750148773, "step": 1495, "valid_targets_mean": 4853.1, "valid_targets_min": 1206 }, { "epoch": 1.1441647597254005, "grad_norm": 0.4770566684957642, "learning_rate": 3.9513560658183216e-05, "loss": 0.3619, "loss_nan_ranks": 0, "loss_rank_avg": 0.3136308491230011, "step": 1500, "valid_targets_mean": 3941.9, "valid_targets_min": 771 }, { "epoch": 1.1479786422578184, "grad_norm": 0.5794955093822997, "learning_rate": 3.9505187025375346e-05, "loss": 0.362, "loss_nan_ranks": 0, "loss_rank_avg": 0.342024564743042, "step": 1505, "valid_targets_mean": 4745.8, "valid_targets_min": 1322 }, { "epoch": 1.1517925247902365, "grad_norm": 0.5261646401760552, "learning_rate": 3.949674283642805e-05, "loss": 0.3701, "loss_nan_ranks": 0, "loss_rank_avg": 0.3519936501979828, "step": 1510, "valid_targets_mean": 2909.0, "valid_targets_min": 957 }, { "epoch": 1.1556064073226544, "grad_norm": 0.43176897604586745, "learning_rate": 3.94882281218865e-05, "loss": 0.3629, "loss_nan_ranks": 0, "loss_rank_avg": 0.3459691107273102, "step": 1515, "valid_targets_mean": 4479.5, "valid_targets_min": 1510 }, { "epoch": 1.1594202898550725, "grad_norm": 0.45134668768661756, "learning_rate": 3.9479642912550975e-05, "loss": 0.3289, "loss_nan_ranks": 0, "loss_rank_avg": 0.3575803339481354, "step": 1520, "valid_targets_mean": 4954.8, "valid_targets_min": 1624 }, { "epoch": 1.1632341723874904, "grad_norm": 0.47627942604124146, "learning_rate": 3.947098723947677e-05, "loss": 0.338, "loss_nan_ranks": 0, "loss_rank_avg": 0.3104186952114105, "step": 1525, "valid_targets_mean": 4333.7, "valid_targets_min": 861 }, { "epoch": 1.1670480549199085, "grad_norm": 0.4585945533797258, "learning_rate": 3.9462261133974066e-05, "loss": 0.3532, "loss_nan_ranks": 0, "loss_rank_avg": 0.37167060375213623, "step": 1530, "valid_targets_mean": 4614.9, "valid_targets_min": 1063 }, { "epoch": 1.1708619374523264, "grad_norm": 0.4392639573208927, "learning_rate": 3.945346462760781e-05, "loss": 0.3546, "loss_nan_ranks": 0, "loss_rank_avg": 0.3076896667480469, "step": 1535, "valid_targets_mean": 3828.2, "valid_targets_min": 1029 }, { "epoch": 1.1746758199847445, "grad_norm": 0.4428160285363157, "learning_rate": 3.944459775219762e-05, "loss": 0.3416, "loss_nan_ranks": 0, "loss_rank_avg": 0.3300919532775879, "step": 1540, "valid_targets_mean": 4357.5, "valid_targets_min": 1403 }, { "epoch": 1.1784897025171626, "grad_norm": 0.42255626498476845, "learning_rate": 3.943566053981766e-05, "loss": 0.359, "loss_nan_ranks": 0, "loss_rank_avg": 0.35865628719329834, "step": 1545, "valid_targets_mean": 4991.6, "valid_targets_min": 1196 }, { "epoch": 1.1823035850495804, "grad_norm": 0.4397533808750128, "learning_rate": 3.942665302279651e-05, "loss": 0.3396, "loss_nan_ranks": 0, "loss_rank_avg": 0.3123394846916199, "step": 1550, "valid_targets_mean": 4861.5, "valid_targets_min": 1284 }, { "epoch": 1.1861174675819985, "grad_norm": 0.4386214823026046, "learning_rate": 3.941757523371708e-05, "loss": 0.3447, "loss_nan_ranks": 0, "loss_rank_avg": 0.35547080636024475, "step": 1555, "valid_targets_mean": 5120.7, "valid_targets_min": 1014 }, { "epoch": 1.1899313501144164, "grad_norm": 0.40482676317507504, "learning_rate": 3.940842720541647e-05, "loss": 0.3493, "loss_nan_ranks": 0, "loss_rank_avg": 0.3050001859664917, "step": 1560, "valid_targets_mean": 5011.2, "valid_targets_min": 447 }, { "epoch": 1.1937452326468345, "grad_norm": 0.43799832347524176, "learning_rate": 3.9399208970985854e-05, "loss": 0.3589, "loss_nan_ranks": 0, "loss_rank_avg": 0.3959282338619232, "step": 1565, "valid_targets_mean": 5331.9, "valid_targets_min": 780 }, { "epoch": 1.1975591151792524, "grad_norm": 0.4087742386160605, "learning_rate": 3.938992056377036e-05, "loss": 0.3388, "loss_nan_ranks": 0, "loss_rank_avg": 0.34477710723876953, "step": 1570, "valid_targets_mean": 4720.4, "valid_targets_min": 1129 }, { "epoch": 1.2013729977116705, "grad_norm": 0.47016536084109734, "learning_rate": 3.938056201736896e-05, "loss": 0.3376, "loss_nan_ranks": 0, "loss_rank_avg": 0.3292127549648285, "step": 1575, "valid_targets_mean": 4415.0, "valid_targets_min": 1096 }, { "epoch": 1.2051868802440886, "grad_norm": 0.4443565972939098, "learning_rate": 3.9371133365634345e-05, "loss": 0.3615, "loss_nan_ranks": 0, "loss_rank_avg": 0.3656719923019409, "step": 1580, "valid_targets_mean": 5174.2, "valid_targets_min": 728 }, { "epoch": 1.2090007627765065, "grad_norm": 0.44083945242650846, "learning_rate": 3.936163464267277e-05, "loss": 0.3594, "loss_nan_ranks": 0, "loss_rank_avg": 0.34252461791038513, "step": 1585, "valid_targets_mean": 4408.7, "valid_targets_min": 1133 }, { "epoch": 1.2128146453089246, "grad_norm": 0.5140162937717304, "learning_rate": 3.935206588284399e-05, "loss": 0.3582, "loss_nan_ranks": 0, "loss_rank_avg": 0.32750964164733887, "step": 1590, "valid_targets_mean": 3657.9, "valid_targets_min": 437 }, { "epoch": 1.2166285278413425, "grad_norm": 0.5023178879375496, "learning_rate": 3.93424271207611e-05, "loss": 0.3721, "loss_nan_ranks": 0, "loss_rank_avg": 0.412407249212265, "step": 1595, "valid_targets_mean": 3667.6, "valid_targets_min": 924 }, { "epoch": 1.2204424103737606, "grad_norm": 0.4393578258491763, "learning_rate": 3.93327183912904e-05, "loss": 0.3467, "loss_nan_ranks": 0, "loss_rank_avg": 0.2946208715438843, "step": 1600, "valid_targets_mean": 3893.6, "valid_targets_min": 259 }, { "epoch": 1.2242562929061784, "grad_norm": 0.458741999764665, "learning_rate": 3.932293972955128e-05, "loss": 0.3536, "loss_nan_ranks": 0, "loss_rank_avg": 0.37496721744537354, "step": 1605, "valid_targets_mean": 5185.8, "valid_targets_min": 877 }, { "epoch": 1.2280701754385965, "grad_norm": 0.418527038541922, "learning_rate": 3.931309117091612e-05, "loss": 0.3844, "loss_nan_ranks": 0, "loss_rank_avg": 0.36490917205810547, "step": 1610, "valid_targets_mean": 4935.5, "valid_targets_min": 1328 }, { "epoch": 1.2318840579710144, "grad_norm": 0.46733135474543663, "learning_rate": 3.9303172751010125e-05, "loss": 0.343, "loss_nan_ranks": 0, "loss_rank_avg": 0.320946604013443, "step": 1615, "valid_targets_mean": 4701.2, "valid_targets_min": 1053 }, { "epoch": 1.2356979405034325, "grad_norm": 0.45296201790488233, "learning_rate": 3.929318450571119e-05, "loss": 0.3694, "loss_nan_ranks": 0, "loss_rank_avg": 0.3832404911518097, "step": 1620, "valid_targets_mean": 4571.2, "valid_targets_min": 1179 }, { "epoch": 1.2395118230358504, "grad_norm": 0.4198962646812139, "learning_rate": 3.928312647114983e-05, "loss": 0.346, "loss_nan_ranks": 0, "loss_rank_avg": 0.38623082637786865, "step": 1625, "valid_targets_mean": 5367.0, "valid_targets_min": 1576 }, { "epoch": 1.2433257055682685, "grad_norm": 0.7679243209756554, "learning_rate": 3.9272998683708986e-05, "loss": 0.3563, "loss_nan_ranks": 0, "loss_rank_avg": 0.3500606119632721, "step": 1630, "valid_targets_mean": 4513.1, "valid_targets_min": 1114 }, { "epoch": 1.2471395881006866, "grad_norm": 0.5228173268588197, "learning_rate": 3.9262801180023906e-05, "loss": 0.3569, "loss_nan_ranks": 0, "loss_rank_avg": 0.37457337975502014, "step": 1635, "valid_targets_mean": 3563.4, "valid_targets_min": 1235 }, { "epoch": 1.2509534706331045, "grad_norm": 1.33047435809795, "learning_rate": 3.925253399698203e-05, "loss": 0.6628, "loss_nan_ranks": 0, "loss_rank_avg": 0.6713621616363525, "step": 1640, "valid_targets_mean": 904.5, "valid_targets_min": 535 }, { "epoch": 1.2547673531655226, "grad_norm": 0.49263940048523913, "learning_rate": 3.924219717172287e-05, "loss": 0.3783, "loss_nan_ranks": 0, "loss_rank_avg": 0.37166628241539, "step": 1645, "valid_targets_mean": 5407.8, "valid_targets_min": 967 }, { "epoch": 1.2585812356979404, "grad_norm": 0.47593125119627555, "learning_rate": 3.923179074163783e-05, "loss": 0.3523, "loss_nan_ranks": 0, "loss_rank_avg": 0.33608245849609375, "step": 1650, "valid_targets_mean": 4629.0, "valid_targets_min": 942 }, { "epoch": 1.2623951182303585, "grad_norm": 0.5443093285946626, "learning_rate": 3.92213147443701e-05, "loss": 0.3583, "loss_nan_ranks": 0, "loss_rank_avg": 0.38303980231285095, "step": 1655, "valid_targets_mean": 3721.8, "valid_targets_min": 1239 }, { "epoch": 1.2662090007627764, "grad_norm": 0.4699119549454572, "learning_rate": 3.9210769217814525e-05, "loss": 0.3571, "loss_nan_ranks": 0, "loss_rank_avg": 0.32681989669799805, "step": 1660, "valid_targets_mean": 3964.7, "valid_targets_min": 1498 }, { "epoch": 1.2700228832951945, "grad_norm": 0.5367643229818877, "learning_rate": 3.920015420011745e-05, "loss": 0.3697, "loss_nan_ranks": 0, "loss_rank_avg": 0.3740926682949066, "step": 1665, "valid_targets_mean": 3617.1, "valid_targets_min": 1119 }, { "epoch": 1.2738367658276126, "grad_norm": 0.4364917789756035, "learning_rate": 3.91894697296766e-05, "loss": 0.3499, "loss_nan_ranks": 0, "loss_rank_avg": 0.3437977731227875, "step": 1670, "valid_targets_mean": 5194.5, "valid_targets_min": 506 }, { "epoch": 1.2776506483600305, "grad_norm": 0.4648383478668736, "learning_rate": 3.9178715845140905e-05, "loss": 0.3337, "loss_nan_ranks": 0, "loss_rank_avg": 0.3175346553325653, "step": 1675, "valid_targets_mean": 3968.0, "valid_targets_min": 1443 }, { "epoch": 1.2814645308924484, "grad_norm": 0.4580772095759182, "learning_rate": 3.9167892585410416e-05, "loss": 0.3559, "loss_nan_ranks": 0, "loss_rank_avg": 0.3617471158504486, "step": 1680, "valid_targets_mean": 4163.8, "valid_targets_min": 1016 }, { "epoch": 1.2852784134248665, "grad_norm": 0.420705068027108, "learning_rate": 3.9156999989636136e-05, "loss": 0.3435, "loss_nan_ranks": 0, "loss_rank_avg": 0.3555961847305298, "step": 1685, "valid_targets_mean": 4794.0, "valid_targets_min": 1423 }, { "epoch": 1.2890922959572846, "grad_norm": 0.4445370315663098, "learning_rate": 3.914603809721985e-05, "loss": 0.3347, "loss_nan_ranks": 0, "loss_rank_avg": 0.3598546087741852, "step": 1690, "valid_targets_mean": 4818.8, "valid_targets_min": 1828 }, { "epoch": 1.2929061784897025, "grad_norm": 0.46001476720088763, "learning_rate": 3.9135006947814046e-05, "loss": 0.3352, "loss_nan_ranks": 0, "loss_rank_avg": 0.33533012866973877, "step": 1695, "valid_targets_mean": 3634.5, "valid_targets_min": 1127 }, { "epoch": 1.2967200610221206, "grad_norm": 0.4605186587488973, "learning_rate": 3.912390658132169e-05, "loss": 0.3344, "loss_nan_ranks": 0, "loss_rank_avg": 0.31520143151283264, "step": 1700, "valid_targets_mean": 3687.9, "valid_targets_min": 436 }, { "epoch": 1.3005339435545384, "grad_norm": 0.5048292450977424, "learning_rate": 3.9112737037896176e-05, "loss": 0.346, "loss_nan_ranks": 0, "loss_rank_avg": 0.3381100594997406, "step": 1705, "valid_targets_mean": 3859.2, "valid_targets_min": 1237 }, { "epoch": 1.3043478260869565, "grad_norm": 0.4470374365915368, "learning_rate": 3.910149835794109e-05, "loss": 0.3468, "loss_nan_ranks": 0, "loss_rank_avg": 0.3507278859615326, "step": 1710, "valid_targets_mean": 4842.5, "valid_targets_min": 1110 }, { "epoch": 1.3081617086193744, "grad_norm": 0.4725388725302536, "learning_rate": 3.909019058211014e-05, "loss": 0.3591, "loss_nan_ranks": 0, "loss_rank_avg": 0.3592679500579834, "step": 1715, "valid_targets_mean": 3800.2, "valid_targets_min": 637 }, { "epoch": 1.3119755911517925, "grad_norm": 0.5010840472800245, "learning_rate": 3.907881375130695e-05, "loss": 0.3343, "loss_nan_ranks": 0, "loss_rank_avg": 0.36546194553375244, "step": 1720, "valid_targets_mean": 4041.3, "valid_targets_min": 931 }, { "epoch": 1.3157894736842106, "grad_norm": 0.47479083395813454, "learning_rate": 3.906736790668495e-05, "loss": 0.3372, "loss_nan_ranks": 0, "loss_rank_avg": 0.34209373593330383, "step": 1725, "valid_targets_mean": 3945.6, "valid_targets_min": 872 }, { "epoch": 1.3196033562166285, "grad_norm": 0.5639829384354162, "learning_rate": 3.90558530896472e-05, "loss": 0.3469, "loss_nan_ranks": 0, "loss_rank_avg": 0.3194632828235626, "step": 1730, "valid_targets_mean": 2889.1, "valid_targets_min": 734 }, { "epoch": 1.3234172387490466, "grad_norm": 0.5903513954151072, "learning_rate": 3.904426934184628e-05, "loss": 0.3427, "loss_nan_ranks": 0, "loss_rank_avg": 0.3566388189792633, "step": 1735, "valid_targets_mean": 4816.4, "valid_targets_min": 1084 }, { "epoch": 1.3272311212814645, "grad_norm": 0.4503945917654869, "learning_rate": 3.903261670518408e-05, "loss": 0.3405, "loss_nan_ranks": 0, "loss_rank_avg": 0.3107925355434418, "step": 1740, "valid_targets_mean": 3587.4, "valid_targets_min": 1143 }, { "epoch": 1.3310450038138826, "grad_norm": 0.43065662871245963, "learning_rate": 3.90208952218117e-05, "loss": 0.3517, "loss_nan_ranks": 0, "loss_rank_avg": 0.3414647877216339, "step": 1745, "valid_targets_mean": 4295.7, "valid_targets_min": 1226 }, { "epoch": 1.3348588863463005, "grad_norm": 0.5237745139377946, "learning_rate": 3.900910493412929e-05, "loss": 0.3319, "loss_nan_ranks": 0, "loss_rank_avg": 0.316201388835907, "step": 1750, "valid_targets_mean": 3234.5, "valid_targets_min": 279 }, { "epoch": 1.3386727688787186, "grad_norm": 0.47093036937632515, "learning_rate": 3.899724588478586e-05, "loss": 0.3526, "loss_nan_ranks": 0, "loss_rank_avg": 0.39046618342399597, "step": 1755, "valid_targets_mean": 4542.8, "valid_targets_min": 1109 }, { "epoch": 1.3424866514111367, "grad_norm": 0.43907041625968424, "learning_rate": 3.898531811667918e-05, "loss": 0.3545, "loss_nan_ranks": 0, "loss_rank_avg": 0.38379302620887756, "step": 1760, "valid_targets_mean": 4806.4, "valid_targets_min": 837 }, { "epoch": 1.3463005339435545, "grad_norm": 0.4489257140697931, "learning_rate": 3.8973321672955567e-05, "loss": 0.3297, "loss_nan_ranks": 0, "loss_rank_avg": 0.32360532879829407, "step": 1765, "valid_targets_mean": 4818.2, "valid_targets_min": 1553 }, { "epoch": 1.3501144164759724, "grad_norm": 0.42475418240586327, "learning_rate": 3.896125659700978e-05, "loss": 0.3484, "loss_nan_ranks": 0, "loss_rank_avg": 0.37827810645103455, "step": 1770, "valid_targets_mean": 4799.2, "valid_targets_min": 720 }, { "epoch": 1.3539282990083905, "grad_norm": 0.39913389476248523, "learning_rate": 3.894912293248483e-05, "loss": 0.3418, "loss_nan_ranks": 0, "loss_rank_avg": 0.32091864943504333, "step": 1775, "valid_targets_mean": 5017.3, "valid_targets_min": 1309 }, { "epoch": 1.3577421815408086, "grad_norm": 0.4408505758029835, "learning_rate": 3.893692072327185e-05, "loss": 0.3324, "loss_nan_ranks": 0, "loss_rank_avg": 0.32390084862709045, "step": 1780, "valid_targets_mean": 4561.3, "valid_targets_min": 1150 }, { "epoch": 1.3615560640732265, "grad_norm": 0.4294374639015818, "learning_rate": 3.89246500135099e-05, "loss": 0.35, "loss_nan_ranks": 0, "loss_rank_avg": 0.3629796504974365, "step": 1785, "valid_targets_mean": 4894.0, "valid_targets_min": 773 }, { "epoch": 1.3653699466056446, "grad_norm": 0.4357821842127782, "learning_rate": 3.8912310847585834e-05, "loss": 0.3225, "loss_nan_ranks": 0, "loss_rank_avg": 0.3116796314716339, "step": 1790, "valid_targets_mean": 4334.6, "valid_targets_min": 1197 }, { "epoch": 1.3691838291380625, "grad_norm": 0.4082665954305704, "learning_rate": 3.889990327013412e-05, "loss": 0.3372, "loss_nan_ranks": 0, "loss_rank_avg": 0.2875381410121918, "step": 1795, "valid_targets_mean": 4551.9, "valid_targets_min": 900 }, { "epoch": 1.3729977116704806, "grad_norm": 0.4160729509219186, "learning_rate": 3.8887427326036734e-05, "loss": 0.3289, "loss_nan_ranks": 0, "loss_rank_avg": 0.331479549407959, "step": 1800, "valid_targets_mean": 5323.6, "valid_targets_min": 942 }, { "epoch": 1.3768115942028984, "grad_norm": 0.5546043445045815, "learning_rate": 3.887488306042291e-05, "loss": 0.5092, "loss_nan_ranks": 0, "loss_rank_avg": 0.37859976291656494, "step": 1805, "valid_targets_mean": 3949.1, "valid_targets_min": 1206 }, { "epoch": 1.3806254767353165, "grad_norm": 0.5594497655541855, "learning_rate": 3.886227051866903e-05, "loss": 0.3617, "loss_nan_ranks": 0, "loss_rank_avg": 0.3657640516757965, "step": 1810, "valid_targets_mean": 3915.1, "valid_targets_min": 977 }, { "epoch": 1.3844393592677346, "grad_norm": 0.45346305540885756, "learning_rate": 3.884958974639847e-05, "loss": 0.3484, "loss_nan_ranks": 0, "loss_rank_avg": 0.33822956681251526, "step": 1815, "valid_targets_mean": 5037.4, "valid_targets_min": 268 }, { "epoch": 1.3882532418001525, "grad_norm": 0.4420952120039936, "learning_rate": 3.8836840789481405e-05, "loss": 0.3479, "loss_nan_ranks": 0, "loss_rank_avg": 0.3412349224090576, "step": 1820, "valid_targets_mean": 4367.5, "valid_targets_min": 1371 }, { "epoch": 1.3920671243325706, "grad_norm": 0.44468726024354555, "learning_rate": 3.882402369403464e-05, "loss": 0.3417, "loss_nan_ranks": 0, "loss_rank_avg": 0.37281331419944763, "step": 1825, "valid_targets_mean": 4771.2, "valid_targets_min": 1556 }, { "epoch": 1.3958810068649885, "grad_norm": 0.42890277592066967, "learning_rate": 3.881113850642149e-05, "loss": 0.3526, "loss_nan_ranks": 0, "loss_rank_avg": 0.33766472339630127, "step": 1830, "valid_targets_mean": 4216.5, "valid_targets_min": 1181 }, { "epoch": 1.3996948893974066, "grad_norm": 0.4632207322961925, "learning_rate": 3.879818527325156e-05, "loss": 0.3478, "loss_nan_ranks": 0, "loss_rank_avg": 0.3948814868927002, "step": 1835, "valid_targets_mean": 5034.9, "valid_targets_min": 1488 }, { "epoch": 1.4035087719298245, "grad_norm": 0.4379505402410926, "learning_rate": 3.878516404138058e-05, "loss": 0.3339, "loss_nan_ranks": 0, "loss_rank_avg": 0.3263804018497467, "step": 1840, "valid_targets_mean": 4342.8, "valid_targets_min": 1501 }, { "epoch": 1.4073226544622426, "grad_norm": 0.48956467051524727, "learning_rate": 3.877207485791028e-05, "loss": 0.3333, "loss_nan_ranks": 0, "loss_rank_avg": 0.3223048746585846, "step": 1845, "valid_targets_mean": 3916.5, "valid_targets_min": 1133 }, { "epoch": 1.4111365369946607, "grad_norm": 0.5061823012263362, "learning_rate": 3.875891777018818e-05, "loss": 0.3479, "loss_nan_ranks": 0, "loss_rank_avg": 0.3740794360637665, "step": 1850, "valid_targets_mean": 4306.0, "valid_targets_min": 1533 }, { "epoch": 1.4149504195270786, "grad_norm": 0.44374624013085096, "learning_rate": 3.874569282580744e-05, "loss": 0.3391, "loss_nan_ranks": 0, "loss_rank_avg": 0.3182269334793091, "step": 1855, "valid_targets_mean": 4329.9, "valid_targets_min": 1148 }, { "epoch": 1.4187643020594964, "grad_norm": 0.5282857561363704, "learning_rate": 3.8732400072606663e-05, "loss": 0.3278, "loss_nan_ranks": 0, "loss_rank_avg": 0.34093889594078064, "step": 1860, "valid_targets_mean": 5093.1, "valid_targets_min": 360 }, { "epoch": 1.4225781845919145, "grad_norm": 0.45036028219991575, "learning_rate": 3.8719039558669735e-05, "loss": 0.3609, "loss_nan_ranks": 0, "loss_rank_avg": 0.37583938241004944, "step": 1865, "valid_targets_mean": 5373.0, "valid_targets_min": 338 }, { "epoch": 1.4263920671243326, "grad_norm": 0.4815351622606479, "learning_rate": 3.870561133232567e-05, "loss": 0.3257, "loss_nan_ranks": 0, "loss_rank_avg": 0.3166085183620453, "step": 1870, "valid_targets_mean": 3829.9, "valid_targets_min": 1259 }, { "epoch": 1.4302059496567505, "grad_norm": 0.48428256336366055, "learning_rate": 3.8692115442148416e-05, "loss": 0.3388, "loss_nan_ranks": 0, "loss_rank_avg": 0.3754858672618866, "step": 1875, "valid_targets_mean": 4023.9, "valid_targets_min": 1054 }, { "epoch": 1.4340198321891686, "grad_norm": 0.47277520631718617, "learning_rate": 3.8678551936956654e-05, "loss": 0.3387, "loss_nan_ranks": 0, "loss_rank_avg": 0.33969607949256897, "step": 1880, "valid_targets_mean": 4289.2, "valid_targets_min": 426 }, { "epoch": 1.4378337147215865, "grad_norm": 0.43917915151002945, "learning_rate": 3.866492086581369e-05, "loss": 0.3198, "loss_nan_ranks": 0, "loss_rank_avg": 0.32609280943870544, "step": 1885, "valid_targets_mean": 4327.0, "valid_targets_min": 1432 }, { "epoch": 1.4416475972540046, "grad_norm": 0.4306387032402162, "learning_rate": 3.865122227802721e-05, "loss": 0.3224, "loss_nan_ranks": 0, "loss_rank_avg": 0.2789159119129181, "step": 1890, "valid_targets_mean": 3979.3, "valid_targets_min": 1352 }, { "epoch": 1.4454614797864225, "grad_norm": 0.4720251886440316, "learning_rate": 3.863745622314913e-05, "loss": 0.3371, "loss_nan_ranks": 0, "loss_rank_avg": 0.3516583740711212, "step": 1895, "valid_targets_mean": 3531.6, "valid_targets_min": 1374 }, { "epoch": 1.4492753623188406, "grad_norm": 0.46609842409964225, "learning_rate": 3.862362275097543e-05, "loss": 0.3288, "loss_nan_ranks": 0, "loss_rank_avg": 0.3093758821487427, "step": 1900, "valid_targets_mean": 4145.7, "valid_targets_min": 894 }, { "epoch": 1.4530892448512587, "grad_norm": 0.5123115804522839, "learning_rate": 3.8609721911545926e-05, "loss": 0.3377, "loss_nan_ranks": 0, "loss_rank_avg": 0.33074355125427246, "step": 1905, "valid_targets_mean": 3831.0, "valid_targets_min": 970 }, { "epoch": 1.4569031273836766, "grad_norm": 0.4406404957264489, "learning_rate": 3.8595753755144156e-05, "loss": 0.3292, "loss_nan_ranks": 0, "loss_rank_avg": 0.32660233974456787, "step": 1910, "valid_targets_mean": 4124.6, "valid_targets_min": 392 }, { "epoch": 1.4607170099160947, "grad_norm": 0.48541201400683953, "learning_rate": 3.858171833229716e-05, "loss": 0.3374, "loss_nan_ranks": 0, "loss_rank_avg": 0.3298225700855255, "step": 1915, "valid_targets_mean": 4515.6, "valid_targets_min": 1454 }, { "epoch": 1.4645308924485125, "grad_norm": 0.4416063227875788, "learning_rate": 3.856761569377528e-05, "loss": 0.3542, "loss_nan_ranks": 0, "loss_rank_avg": 0.3587282598018646, "step": 1920, "valid_targets_mean": 5149.5, "valid_targets_min": 1237 }, { "epoch": 1.4683447749809306, "grad_norm": 0.4250346119336662, "learning_rate": 3.8553445890592015e-05, "loss": 0.3612, "loss_nan_ranks": 0, "loss_rank_avg": 0.39043954014778137, "step": 1925, "valid_targets_mean": 5316.2, "valid_targets_min": 2132 }, { "epoch": 1.4721586575133485, "grad_norm": 0.4501574857612335, "learning_rate": 3.85392089740038e-05, "loss": 0.3397, "loss_nan_ranks": 0, "loss_rank_avg": 0.33985814452171326, "step": 1930, "valid_targets_mean": 4548.2, "valid_targets_min": 1677 }, { "epoch": 1.4759725400457666, "grad_norm": 0.4378789749328793, "learning_rate": 3.852490499550988e-05, "loss": 0.3418, "loss_nan_ranks": 0, "loss_rank_avg": 0.32744383811950684, "step": 1935, "valid_targets_mean": 4950.3, "valid_targets_min": 917 }, { "epoch": 1.4797864225781847, "grad_norm": 0.5076618596575551, "learning_rate": 3.851053400685203e-05, "loss": 0.3577, "loss_nan_ranks": 0, "loss_rank_avg": 0.3824631869792938, "step": 1940, "valid_targets_mean": 4252.6, "valid_targets_min": 1206 }, { "epoch": 1.4836003051106026, "grad_norm": 0.48737116555851495, "learning_rate": 3.849609606001446e-05, "loss": 0.3391, "loss_nan_ranks": 0, "loss_rank_avg": 0.319928914308548, "step": 1945, "valid_targets_mean": 3840.0, "valid_targets_min": 828 }, { "epoch": 1.4874141876430205, "grad_norm": 0.4236043917290313, "learning_rate": 3.848159120722357e-05, "loss": 0.3268, "loss_nan_ranks": 0, "loss_rank_avg": 0.3326864540576935, "step": 1950, "valid_targets_mean": 4537.5, "valid_targets_min": 1112 }, { "epoch": 1.4912280701754386, "grad_norm": 0.4598342140034555, "learning_rate": 3.846701950094779e-05, "loss": 0.3451, "loss_nan_ranks": 0, "loss_rank_avg": 0.3411165177822113, "step": 1955, "valid_targets_mean": 5026.8, "valid_targets_min": 1170 }, { "epoch": 1.4950419527078567, "grad_norm": 0.41914135871574276, "learning_rate": 3.845238099389736e-05, "loss": 0.3356, "loss_nan_ranks": 0, "loss_rank_avg": 0.33780476450920105, "step": 1960, "valid_targets_mean": 5021.2, "valid_targets_min": 952 }, { "epoch": 1.4988558352402745, "grad_norm": 1.3459003283983855, "learning_rate": 3.843767573902418e-05, "loss": 0.5818, "loss_nan_ranks": 0, "loss_rank_avg": 0.6157845854759216, "step": 1965, "valid_targets_mean": 790.2, "valid_targets_min": 583 }, { "epoch": 1.5026697177726926, "grad_norm": 0.4617732864123322, "learning_rate": 3.842290378952159e-05, "loss": 0.3401, "loss_nan_ranks": 0, "loss_rank_avg": 0.34063920378685, "step": 1970, "valid_targets_mean": 4803.4, "valid_targets_min": 839 }, { "epoch": 1.5064836003051107, "grad_norm": 0.531676865851445, "learning_rate": 3.840806519882418e-05, "loss": 0.3303, "loss_nan_ranks": 0, "loss_rank_avg": 0.2992500364780426, "step": 1975, "valid_targets_mean": 3430.1, "valid_targets_min": 613 }, { "epoch": 1.5102974828375286, "grad_norm": 0.5226518835402676, "learning_rate": 3.83931600206076e-05, "loss": 0.3564, "loss_nan_ranks": 0, "loss_rank_avg": 0.3798552453517914, "step": 1980, "valid_targets_mean": 3952.5, "valid_targets_min": 1128 }, { "epoch": 1.5141113653699465, "grad_norm": 0.396591484196759, "learning_rate": 3.837818830878838e-05, "loss": 0.3189, "loss_nan_ranks": 0, "loss_rank_avg": 0.35394302010536194, "step": 1985, "valid_targets_mean": 6165.4, "valid_targets_min": 1886 }, { "epoch": 1.5179252479023646, "grad_norm": 0.452362199986279, "learning_rate": 3.836315011752371e-05, "loss": 0.3344, "loss_nan_ranks": 0, "loss_rank_avg": 0.33218100666999817, "step": 1990, "valid_targets_mean": 5245.8, "valid_targets_min": 1233 }, { "epoch": 1.5217391304347827, "grad_norm": 0.45166171439918135, "learning_rate": 3.834804550121126e-05, "loss": 0.3467, "loss_nan_ranks": 0, "loss_rank_avg": 0.3478414714336395, "step": 1995, "valid_targets_mean": 4610.8, "valid_targets_min": 1676 }, { "epoch": 1.5255530129672006, "grad_norm": 0.4356146082165587, "learning_rate": 3.8332874514488967e-05, "loss": 0.3413, "loss_nan_ranks": 0, "loss_rank_avg": 0.3374311029911041, "step": 2000, "valid_targets_mean": 4473.1, "valid_targets_min": 1297 }, { "epoch": 1.5293668954996185, "grad_norm": 0.44888934608269865, "learning_rate": 3.831763721223488e-05, "loss": 0.3364, "loss_nan_ranks": 0, "loss_rank_avg": 0.3361920416355133, "step": 2005, "valid_targets_mean": 4083.8, "valid_targets_min": 1411 }, { "epoch": 1.5331807780320366, "grad_norm": 0.4579221905167076, "learning_rate": 3.8302333649566905e-05, "loss": 0.3441, "loss_nan_ranks": 0, "loss_rank_avg": 0.3255065679550171, "step": 2010, "valid_targets_mean": 4096.5, "valid_targets_min": 1368 }, { "epoch": 1.5369946605644547, "grad_norm": 0.4458324785747194, "learning_rate": 3.828696388184265e-05, "loss": 0.3252, "loss_nan_ranks": 0, "loss_rank_avg": 0.33304184675216675, "step": 2015, "valid_targets_mean": 4516.2, "valid_targets_min": 1309 }, { "epoch": 1.5408085430968725, "grad_norm": 0.4536346386160971, "learning_rate": 3.8271527964659174e-05, "loss": 0.339, "loss_nan_ranks": 0, "loss_rank_avg": 0.32771816849708557, "step": 2020, "valid_targets_mean": 4904.3, "valid_targets_min": 1127 }, { "epoch": 1.5446224256292906, "grad_norm": 0.4831566461665685, "learning_rate": 3.8256025953852865e-05, "loss": 0.3323, "loss_nan_ranks": 0, "loss_rank_avg": 0.3292129933834076, "step": 2025, "valid_targets_mean": 4137.0, "valid_targets_min": 806 }, { "epoch": 1.5484363081617087, "grad_norm": 0.47635974507726736, "learning_rate": 3.824045790549915e-05, "loss": 0.366, "loss_nan_ranks": 0, "loss_rank_avg": 0.352607399225235, "step": 2030, "valid_targets_mean": 4103.1, "valid_targets_min": 818 }, { "epoch": 1.5522501906941266, "grad_norm": 0.4525772248307072, "learning_rate": 3.8224823875912356e-05, "loss": 0.3393, "loss_nan_ranks": 0, "loss_rank_avg": 0.34870848059654236, "step": 2035, "valid_targets_mean": 5950.1, "valid_targets_min": 1457 }, { "epoch": 1.5560640732265445, "grad_norm": 0.413493930225271, "learning_rate": 3.820912392164548e-05, "loss": 0.3322, "loss_nan_ranks": 0, "loss_rank_avg": 0.3418256342411041, "step": 2040, "valid_targets_mean": 4733.5, "valid_targets_min": 1069 }, { "epoch": 1.5598779557589626, "grad_norm": 0.46894070613005195, "learning_rate": 3.819335809949e-05, "loss": 0.3456, "loss_nan_ranks": 0, "loss_rank_avg": 0.3676106631755829, "step": 2045, "valid_targets_mean": 4399.0, "valid_targets_min": 946 }, { "epoch": 1.5636918382913807, "grad_norm": 0.4766741967603851, "learning_rate": 3.817752646647563e-05, "loss": 0.3512, "loss_nan_ranks": 0, "loss_rank_avg": 0.30944350361824036, "step": 2050, "valid_targets_mean": 4400.2, "valid_targets_min": 1848 }, { "epoch": 1.5675057208237986, "grad_norm": 0.41158705325321077, "learning_rate": 3.816162907987016e-05, "loss": 0.3127, "loss_nan_ranks": 0, "loss_rank_avg": 0.3295304477214813, "step": 2055, "valid_targets_mean": 5128.7, "valid_targets_min": 1255 }, { "epoch": 1.5713196033562167, "grad_norm": 0.4284366443368262, "learning_rate": 3.8145665997179235e-05, "loss": 0.3517, "loss_nan_ranks": 0, "loss_rank_avg": 0.3419044017791748, "step": 2060, "valid_targets_mean": 5012.1, "valid_targets_min": 613 }, { "epoch": 1.5751334858886348, "grad_norm": 0.5240013370140941, "learning_rate": 3.8129637276146134e-05, "loss": 0.3367, "loss_nan_ranks": 0, "loss_rank_avg": 0.3423541784286499, "step": 2065, "valid_targets_mean": 3542.5, "valid_targets_min": 1116 }, { "epoch": 1.5789473684210527, "grad_norm": 0.4615080821026482, "learning_rate": 3.8113542974751565e-05, "loss": 0.3488, "loss_nan_ranks": 0, "loss_rank_avg": 0.39265763759613037, "step": 2070, "valid_targets_mean": 4613.8, "valid_targets_min": 1458 }, { "epoch": 1.5827612509534705, "grad_norm": 0.45660629131457464, "learning_rate": 3.809738315121347e-05, "loss": 0.3399, "loss_nan_ranks": 0, "loss_rank_avg": 0.35427650809288025, "step": 2075, "valid_targets_mean": 4815.3, "valid_targets_min": 496 }, { "epoch": 1.5865751334858886, "grad_norm": 0.4657806705792738, "learning_rate": 3.8081157863986806e-05, "loss": 0.3512, "loss_nan_ranks": 0, "loss_rank_avg": 0.2970011532306671, "step": 2080, "valid_targets_mean": 4139.2, "valid_targets_min": 337 }, { "epoch": 1.5903890160183067, "grad_norm": 0.4365020499059465, "learning_rate": 3.806486717176332e-05, "loss": 0.3124, "loss_nan_ranks": 0, "loss_rank_avg": 0.30660709738731384, "step": 2085, "valid_targets_mean": 3980.7, "valid_targets_min": 873 }, { "epoch": 1.5942028985507246, "grad_norm": 0.506656163039576, "learning_rate": 3.8048511133471356e-05, "loss": 0.3353, "loss_nan_ranks": 0, "loss_rank_avg": 0.4007803499698639, "step": 2090, "valid_targets_mean": 4447.3, "valid_targets_min": 959 }, { "epoch": 1.5980167810831425, "grad_norm": 0.4751817793688682, "learning_rate": 3.8032089808275635e-05, "loss": 0.3237, "loss_nan_ranks": 0, "loss_rank_avg": 0.35235536098480225, "step": 2095, "valid_targets_mean": 4583.0, "valid_targets_min": 1399 }, { "epoch": 1.6018306636155606, "grad_norm": 0.4508540415280725, "learning_rate": 3.801560325557703e-05, "loss": 0.3422, "loss_nan_ranks": 0, "loss_rank_avg": 0.3305545449256897, "step": 2100, "valid_targets_mean": 4408.1, "valid_targets_min": 737 }, { "epoch": 1.6056445461479787, "grad_norm": 0.4299155016841301, "learning_rate": 3.799905153501238e-05, "loss": 0.3151, "loss_nan_ranks": 0, "loss_rank_avg": 0.327955424785614, "step": 2105, "valid_targets_mean": 4504.2, "valid_targets_min": 1246 }, { "epoch": 1.6094584286803966, "grad_norm": 0.4783710619498741, "learning_rate": 3.798243470645425e-05, "loss": 0.3273, "loss_nan_ranks": 0, "loss_rank_avg": 0.33135396242141724, "step": 2110, "valid_targets_mean": 3603.8, "valid_targets_min": 983 }, { "epoch": 1.6132723112128147, "grad_norm": 0.37927325672645257, "learning_rate": 3.7965752830010706e-05, "loss": 0.3356, "loss_nan_ranks": 0, "loss_rank_avg": 0.32099059224128723, "step": 2115, "valid_targets_mean": 5331.1, "valid_targets_min": 1746 }, { "epoch": 1.6170861937452328, "grad_norm": 0.40761644497991223, "learning_rate": 3.794900596602513e-05, "loss": 0.3283, "loss_nan_ranks": 0, "loss_rank_avg": 0.29120543599128723, "step": 2120, "valid_targets_mean": 4769.4, "valid_targets_min": 468 }, { "epoch": 1.6209000762776506, "grad_norm": 0.45214903550117586, "learning_rate": 3.793219417507597e-05, "loss": 0.3451, "loss_nan_ranks": 0, "loss_rank_avg": 0.3507181704044342, "step": 2125, "valid_targets_mean": 4438.9, "valid_targets_min": 956 }, { "epoch": 1.6247139588100685, "grad_norm": 1.411976482155846, "learning_rate": 3.7915317517976544e-05, "loss": 0.5326, "loss_nan_ranks": 0, "loss_rank_avg": 0.6349965333938599, "step": 2130, "valid_targets_mean": 843.3, "valid_targets_min": 648 }, { "epoch": 1.6285278413424866, "grad_norm": 0.4296479124857058, "learning_rate": 3.7898376055774806e-05, "loss": 0.4073, "loss_nan_ranks": 0, "loss_rank_avg": 0.31556937098503113, "step": 2135, "valid_targets_mean": 4938.8, "valid_targets_min": 541 }, { "epoch": 1.6323417238749047, "grad_norm": 0.462970001455935, "learning_rate": 3.788136984975313e-05, "loss": 0.3294, "loss_nan_ranks": 0, "loss_rank_avg": 0.3477567136287689, "step": 2140, "valid_targets_mean": 4699.2, "valid_targets_min": 1459 }, { "epoch": 1.6361556064073226, "grad_norm": 0.48316565101860154, "learning_rate": 3.7864298961428085e-05, "loss": 0.3339, "loss_nan_ranks": 0, "loss_rank_avg": 0.32468631863594055, "step": 2145, "valid_targets_mean": 4554.4, "valid_targets_min": 1345 }, { "epoch": 1.6399694889397407, "grad_norm": 0.41679333340014413, "learning_rate": 3.784716345255022e-05, "loss": 0.3285, "loss_nan_ranks": 0, "loss_rank_avg": 0.336759090423584, "step": 2150, "valid_targets_mean": 5775.1, "valid_targets_min": 1627 }, { "epoch": 1.6437833714721588, "grad_norm": 0.3953743824423388, "learning_rate": 3.782996338510384e-05, "loss": 0.303, "loss_nan_ranks": 0, "loss_rank_avg": 0.29986482858657837, "step": 2155, "valid_targets_mean": 5298.2, "valid_targets_min": 965 }, { "epoch": 1.6475972540045767, "grad_norm": 0.4736632378563593, "learning_rate": 3.781269882130677e-05, "loss": 0.3497, "loss_nan_ranks": 0, "loss_rank_avg": 0.35674309730529785, "step": 2160, "valid_targets_mean": 4210.8, "valid_targets_min": 1120 }, { "epoch": 1.6514111365369946, "grad_norm": 0.4496270825352227, "learning_rate": 3.779536982361013e-05, "loss": 0.3509, "loss_nan_ranks": 0, "loss_rank_avg": 0.352872759103775, "step": 2165, "valid_targets_mean": 4362.2, "valid_targets_min": 526 }, { "epoch": 1.6552250190694127, "grad_norm": 0.46157964831828, "learning_rate": 3.777797645469814e-05, "loss": 0.3452, "loss_nan_ranks": 0, "loss_rank_avg": 0.372890830039978, "step": 2170, "valid_targets_mean": 4475.5, "valid_targets_min": 1178 }, { "epoch": 1.6590389016018308, "grad_norm": 0.4952894396006391, "learning_rate": 3.776051877748785e-05, "loss": 0.3195, "loss_nan_ranks": 0, "loss_rank_avg": 0.3195929527282715, "step": 2175, "valid_targets_mean": 3625.1, "valid_targets_min": 452 }, { "epoch": 1.6628527841342486, "grad_norm": 0.4345556379723053, "learning_rate": 3.774299685512894e-05, "loss": 0.3213, "loss_nan_ranks": 0, "loss_rank_avg": 0.3343975245952606, "step": 2180, "valid_targets_mean": 4466.4, "valid_targets_min": 1113 }, { "epoch": 1.6666666666666665, "grad_norm": 0.42305269061244527, "learning_rate": 3.772541075100349e-05, "loss": 0.3361, "loss_nan_ranks": 0, "loss_rank_avg": 0.36715126037597656, "step": 2185, "valid_targets_mean": 4677.8, "valid_targets_min": 711 }, { "epoch": 1.6704805491990846, "grad_norm": 0.42759806624710345, "learning_rate": 3.770776052872573e-05, "loss": 0.3256, "loss_nan_ranks": 0, "loss_rank_avg": 0.3473476469516754, "step": 2190, "valid_targets_mean": 5200.2, "valid_targets_min": 1401 }, { "epoch": 1.6742944317315027, "grad_norm": 0.7660926707707012, "learning_rate": 3.7690046252141826e-05, "loss": 0.3409, "loss_nan_ranks": 0, "loss_rank_avg": 0.32988297939300537, "step": 2195, "valid_targets_mean": 4637.0, "valid_targets_min": 1224 }, { "epoch": 1.6781083142639206, "grad_norm": 0.5055398969545535, "learning_rate": 3.767226798532967e-05, "loss": 0.3139, "loss_nan_ranks": 0, "loss_rank_avg": 0.30404260754585266, "step": 2200, "valid_targets_mean": 4207.0, "valid_targets_min": 709 }, { "epoch": 1.6819221967963387, "grad_norm": 0.4291374647287734, "learning_rate": 3.765442579259861e-05, "loss": 0.3222, "loss_nan_ranks": 0, "loss_rank_avg": 0.28727686405181885, "step": 2205, "valid_targets_mean": 4335.9, "valid_targets_min": 510 }, { "epoch": 1.6857360793287568, "grad_norm": 0.46292742476924886, "learning_rate": 3.763651973848923e-05, "loss": 0.3143, "loss_nan_ranks": 0, "loss_rank_avg": 0.31533995270729065, "step": 2210, "valid_targets_mean": 3919.2, "valid_targets_min": 1000 }, { "epoch": 1.6895499618611747, "grad_norm": 0.47316186208418975, "learning_rate": 3.761854988777312e-05, "loss": 0.3263, "loss_nan_ranks": 0, "loss_rank_avg": 0.3339639902114868, "step": 2215, "valid_targets_mean": 4245.3, "valid_targets_min": 1029 }, { "epoch": 1.6933638443935926, "grad_norm": 0.40865623345995916, "learning_rate": 3.760051630545264e-05, "loss": 0.3308, "loss_nan_ranks": 0, "loss_rank_avg": 0.3192019462585449, "step": 2220, "valid_targets_mean": 5094.4, "valid_targets_min": 1841 }, { "epoch": 1.6971777269260107, "grad_norm": 0.45723802330184893, "learning_rate": 3.758241905676071e-05, "loss": 0.3268, "loss_nan_ranks": 0, "loss_rank_avg": 0.33453646302223206, "step": 2225, "valid_targets_mean": 3709.2, "valid_targets_min": 423 }, { "epoch": 1.7009916094584288, "grad_norm": 0.4526269440545832, "learning_rate": 3.7564258207160515e-05, "loss": 0.3324, "loss_nan_ranks": 0, "loss_rank_avg": 0.3633545935153961, "step": 2230, "valid_targets_mean": 4224.0, "valid_targets_min": 1141 }, { "epoch": 1.7048054919908466, "grad_norm": 0.6122509098643096, "learning_rate": 3.754603382234533e-05, "loss": 0.3222, "loss_nan_ranks": 0, "loss_rank_avg": 0.307157039642334, "step": 2235, "valid_targets_mean": 3546.7, "valid_targets_min": 892 }, { "epoch": 1.7086193745232647, "grad_norm": 0.4624666321272271, "learning_rate": 3.752774596823825e-05, "loss": 0.3472, "loss_nan_ranks": 0, "loss_rank_avg": 0.3046889007091522, "step": 2240, "valid_targets_mean": 4233.8, "valid_targets_min": 291 }, { "epoch": 1.7124332570556828, "grad_norm": 0.44703143367338366, "learning_rate": 3.750939471099194e-05, "loss": 0.3263, "loss_nan_ranks": 0, "loss_rank_avg": 0.33055710792541504, "step": 2245, "valid_targets_mean": 4348.4, "valid_targets_min": 1155 }, { "epoch": 1.7162471395881007, "grad_norm": 0.4865255846967005, "learning_rate": 3.7490980116988446e-05, "loss": 0.3257, "loss_nan_ranks": 0, "loss_rank_avg": 0.35459789633750916, "step": 2250, "valid_targets_mean": 3480.5, "valid_targets_min": 454 }, { "epoch": 1.7200610221205186, "grad_norm": 0.41553778964381777, "learning_rate": 3.747250225283889e-05, "loss": 0.3351, "loss_nan_ranks": 0, "loss_rank_avg": 0.33044007420539856, "step": 2255, "valid_targets_mean": 5068.1, "valid_targets_min": 1043 }, { "epoch": 1.7238749046529367, "grad_norm": 0.47247749062464844, "learning_rate": 3.7453961185383275e-05, "loss": 0.3174, "loss_nan_ranks": 0, "loss_rank_avg": 0.3662593364715576, "step": 2260, "valid_targets_mean": 4381.7, "valid_targets_min": 984 }, { "epoch": 1.7276887871853548, "grad_norm": 0.4342970807308119, "learning_rate": 3.743535698169024e-05, "loss": 0.3237, "loss_nan_ranks": 0, "loss_rank_avg": 0.3155607581138611, "step": 2265, "valid_targets_mean": 4959.0, "valid_targets_min": 688 }, { "epoch": 1.7315026697177727, "grad_norm": 0.4835822940202946, "learning_rate": 3.741668970905678e-05, "loss": 0.3296, "loss_nan_ranks": 0, "loss_rank_avg": 0.3475397527217865, "step": 2270, "valid_targets_mean": 4047.2, "valid_targets_min": 924 }, { "epoch": 1.7353165522501905, "grad_norm": 0.4143882838773366, "learning_rate": 3.739795943500807e-05, "loss": 0.3338, "loss_nan_ranks": 0, "loss_rank_avg": 0.3046738803386688, "step": 2275, "valid_targets_mean": 4457.8, "valid_targets_min": 1307 }, { "epoch": 1.7391304347826086, "grad_norm": 0.47715588140017007, "learning_rate": 3.7379166227297134e-05, "loss": 0.3337, "loss_nan_ranks": 0, "loss_rank_avg": 0.36505427956581116, "step": 2280, "valid_targets_mean": 4550.1, "valid_targets_min": 1258 }, { "epoch": 1.7429443173150267, "grad_norm": 0.47746507980133923, "learning_rate": 3.7360310153904676e-05, "loss": 0.3344, "loss_nan_ranks": 0, "loss_rank_avg": 0.3104887306690216, "step": 2285, "valid_targets_mean": 4238.9, "valid_targets_min": 1358 }, { "epoch": 1.7467581998474446, "grad_norm": 0.4366855078559095, "learning_rate": 3.73413912830388e-05, "loss": 0.3338, "loss_nan_ranks": 0, "loss_rank_avg": 0.3296510577201843, "step": 2290, "valid_targets_mean": 4354.8, "valid_targets_min": 1124 }, { "epoch": 1.7505720823798627, "grad_norm": 1.5920308734552946, "learning_rate": 3.7322409683134754e-05, "loss": 0.4648, "loss_nan_ranks": 0, "loss_rank_avg": 0.6426330208778381, "step": 2295, "valid_targets_mean": 798.7, "valid_targets_min": 662 }, { "epoch": 1.7543859649122808, "grad_norm": 0.4334877061500335, "learning_rate": 3.730336542285471e-05, "loss": 0.3945, "loss_nan_ranks": 0, "loss_rank_avg": 0.326994389295578, "step": 2300, "valid_targets_mean": 4903.4, "valid_targets_min": 1525 }, { "epoch": 1.7581998474446987, "grad_norm": 0.49634867580345554, "learning_rate": 3.7284258571087485e-05, "loss": 0.3233, "loss_nan_ranks": 0, "loss_rank_avg": 0.30348965525627136, "step": 2305, "valid_targets_mean": 3528.3, "valid_targets_min": 1120 }, { "epoch": 1.7620137299771166, "grad_norm": 0.49812732348341127, "learning_rate": 3.726508919694834e-05, "loss": 0.3288, "loss_nan_ranks": 0, "loss_rank_avg": 0.314765602350235, "step": 2310, "valid_targets_mean": 3092.0, "valid_targets_min": 1160 }, { "epoch": 1.7658276125095347, "grad_norm": 0.5244174030752281, "learning_rate": 3.724585736977867e-05, "loss": 0.3391, "loss_nan_ranks": 0, "loss_rank_avg": 0.3550000488758087, "step": 2315, "valid_targets_mean": 4437.4, "valid_targets_min": 1185 }, { "epoch": 1.7696414950419528, "grad_norm": 0.4093823038328312, "learning_rate": 3.722656315914579e-05, "loss": 0.3414, "loss_nan_ranks": 0, "loss_rank_avg": 0.3699674606323242, "step": 2320, "valid_targets_mean": 5781.1, "valid_targets_min": 1382 }, { "epoch": 1.7734553775743707, "grad_norm": 0.4082424315818475, "learning_rate": 3.7207206634842664e-05, "loss": 0.317, "loss_nan_ranks": 0, "loss_rank_avg": 0.2742947041988373, "step": 2325, "valid_targets_mean": 5018.0, "valid_targets_min": 1360 }, { "epoch": 1.7772692601067888, "grad_norm": 0.4250104636252426, "learning_rate": 3.7187787866887685e-05, "loss": 0.3316, "loss_nan_ranks": 0, "loss_rank_avg": 0.3289525508880615, "step": 2330, "valid_targets_mean": 4318.1, "valid_targets_min": 1018 }, { "epoch": 1.7810831426392069, "grad_norm": 0.45335953265388873, "learning_rate": 3.7168306925524385e-05, "loss": 0.3207, "loss_nan_ranks": 0, "loss_rank_avg": 0.3171369135379791, "step": 2335, "valid_targets_mean": 4464.4, "valid_targets_min": 671 }, { "epoch": 1.7848970251716247, "grad_norm": 0.43854487824763294, "learning_rate": 3.71487638812212e-05, "loss": 0.3166, "loss_nan_ranks": 0, "loss_rank_avg": 0.31873399019241333, "step": 2340, "valid_targets_mean": 4436.9, "valid_targets_min": 1155 }, { "epoch": 1.7887109077040426, "grad_norm": 0.412063477973113, "learning_rate": 3.712915880467121e-05, "loss": 0.3189, "loss_nan_ranks": 0, "loss_rank_avg": 0.3235747218132019, "step": 2345, "valid_targets_mean": 5156.3, "valid_targets_min": 1447 }, { "epoch": 1.7925247902364607, "grad_norm": 0.4389626587211984, "learning_rate": 3.7109491766791886e-05, "loss": 0.3044, "loss_nan_ranks": 0, "loss_rank_avg": 0.3347223997116089, "step": 2350, "valid_targets_mean": 4220.4, "valid_targets_min": 834 }, { "epoch": 1.7963386727688788, "grad_norm": 0.43041614373722964, "learning_rate": 3.708976283872483e-05, "loss": 0.331, "loss_nan_ranks": 0, "loss_rank_avg": 0.302156001329422, "step": 2355, "valid_targets_mean": 4227.2, "valid_targets_min": 867 }, { "epoch": 1.8001525553012967, "grad_norm": 0.4264746043330624, "learning_rate": 3.706997209183552e-05, "loss": 0.3358, "loss_nan_ranks": 0, "loss_rank_avg": 0.3170943558216095, "step": 2360, "valid_targets_mean": 4943.4, "valid_targets_min": 871 }, { "epoch": 1.8039664378337146, "grad_norm": 0.4435488437349904, "learning_rate": 3.705011959771306e-05, "loss": 0.2968, "loss_nan_ranks": 0, "loss_rank_avg": 0.3009158670902252, "step": 2365, "valid_targets_mean": 4024.0, "valid_targets_min": 1455 }, { "epoch": 1.8077803203661327, "grad_norm": 0.40895192075459724, "learning_rate": 3.7030205428169887e-05, "loss": 0.3415, "loss_nan_ranks": 0, "loss_rank_avg": 0.3293893039226532, "step": 2370, "valid_targets_mean": 5075.9, "valid_targets_min": 1286 }, { "epoch": 1.8115942028985508, "grad_norm": 0.41660708290497744, "learning_rate": 3.701022965524156e-05, "loss": 0.335, "loss_nan_ranks": 0, "loss_rank_avg": 0.31239140033721924, "step": 2375, "valid_targets_mean": 4275.4, "valid_targets_min": 1051 }, { "epoch": 1.8154080854309687, "grad_norm": 0.4453736647599715, "learning_rate": 3.6990192351186475e-05, "loss": 0.3182, "loss_nan_ranks": 0, "loss_rank_avg": 0.3469693958759308, "step": 2380, "valid_targets_mean": 4513.8, "valid_targets_min": 1277 }, { "epoch": 1.8192219679633868, "grad_norm": 0.46119885811553796, "learning_rate": 3.6970093588485594e-05, "loss": 0.3176, "loss_nan_ranks": 0, "loss_rank_avg": 0.27816879749298096, "step": 2385, "valid_targets_mean": 3789.4, "valid_targets_min": 1465 }, { "epoch": 1.8230358504958049, "grad_norm": 0.4291482862044303, "learning_rate": 3.694993343984221e-05, "loss": 0.314, "loss_nan_ranks": 0, "loss_rank_avg": 0.3009355068206787, "step": 2390, "valid_targets_mean": 4632.9, "valid_targets_min": 1292 }, { "epoch": 1.8268497330282227, "grad_norm": 0.5478615406961075, "learning_rate": 3.692971197818164e-05, "loss": 0.3365, "loss_nan_ranks": 0, "loss_rank_avg": 0.3457231819629669, "step": 2395, "valid_targets_mean": 3948.9, "valid_targets_min": 993 }, { "epoch": 1.8306636155606406, "grad_norm": 0.479894949737753, "learning_rate": 3.6909429276651005e-05, "loss": 0.3414, "loss_nan_ranks": 0, "loss_rank_avg": 0.3317417800426483, "step": 2400, "valid_targets_mean": 4785.0, "valid_targets_min": 986 }, { "epoch": 1.8344774980930587, "grad_norm": 0.4285777476400902, "learning_rate": 3.688908540861896e-05, "loss": 0.331, "loss_nan_ranks": 0, "loss_rank_avg": 0.31536248326301575, "step": 2405, "valid_targets_mean": 4312.8, "valid_targets_min": 1685 }, { "epoch": 1.8382913806254768, "grad_norm": 0.4375917603899561, "learning_rate": 3.68686804476754e-05, "loss": 0.3091, "loss_nan_ranks": 0, "loss_rank_avg": 0.3218797743320465, "step": 2410, "valid_targets_mean": 4685.2, "valid_targets_min": 1185 }, { "epoch": 1.8421052631578947, "grad_norm": 0.5273066457088933, "learning_rate": 3.684821446763121e-05, "loss": 0.3396, "loss_nan_ranks": 0, "loss_rank_avg": 0.39353689551353455, "step": 2415, "valid_targets_mean": 4030.5, "valid_targets_min": 1191 }, { "epoch": 1.8459191456903128, "grad_norm": 0.4440672321044689, "learning_rate": 3.682768754251803e-05, "loss": 0.3164, "loss_nan_ranks": 0, "loss_rank_avg": 0.2948742210865021, "step": 2420, "valid_targets_mean": 4679.3, "valid_targets_min": 1334 }, { "epoch": 1.849733028222731, "grad_norm": 0.4782127118356837, "learning_rate": 3.680709974658792e-05, "loss": 0.3176, "loss_nan_ranks": 0, "loss_rank_avg": 0.35153254866600037, "step": 2425, "valid_targets_mean": 4014.6, "valid_targets_min": 991 }, { "epoch": 1.8535469107551488, "grad_norm": 0.44745555716907837, "learning_rate": 3.678645115431313e-05, "loss": 0.3384, "loss_nan_ranks": 0, "loss_rank_avg": 0.34888049960136414, "step": 2430, "valid_targets_mean": 5085.6, "valid_targets_min": 1168 }, { "epoch": 1.8573607932875666, "grad_norm": 0.4665568435081105, "learning_rate": 3.6765741840385865e-05, "loss": 0.3277, "loss_nan_ranks": 0, "loss_rank_avg": 0.34056076407432556, "step": 2435, "valid_targets_mean": 4100.6, "valid_targets_min": 927 }, { "epoch": 1.8611746758199847, "grad_norm": 0.41128691480695334, "learning_rate": 3.674497187971794e-05, "loss": 0.3415, "loss_nan_ranks": 0, "loss_rank_avg": 0.34780147671699524, "step": 2440, "valid_targets_mean": 5574.4, "valid_targets_min": 713 }, { "epoch": 1.8649885583524028, "grad_norm": 0.4746141475032033, "learning_rate": 3.6724141347440564e-05, "loss": 0.3164, "loss_nan_ranks": 0, "loss_rank_avg": 0.2898326814174652, "step": 2445, "valid_targets_mean": 3968.1, "valid_targets_min": 523 }, { "epoch": 1.8688024408848207, "grad_norm": 0.5670987020490634, "learning_rate": 3.6703250318904044e-05, "loss": 0.3345, "loss_nan_ranks": 0, "loss_rank_avg": 0.3524753749370575, "step": 2450, "valid_targets_mean": 3708.4, "valid_targets_min": 704 }, { "epoch": 1.8726163234172386, "grad_norm": 0.4486880722932088, "learning_rate": 3.6682298869677534e-05, "loss": 0.3372, "loss_nan_ranks": 0, "loss_rank_avg": 0.32234349846839905, "step": 2455, "valid_targets_mean": 4402.6, "valid_targets_min": 1164 }, { "epoch": 1.8764302059496567, "grad_norm": 1.3784929400623749, "learning_rate": 3.666128707554874e-05, "loss": 0.4908, "loss_nan_ranks": 0, "loss_rank_avg": 0.6172937750816345, "step": 2460, "valid_targets_mean": 874.1, "valid_targets_min": 602 }, { "epoch": 1.8802440884820748, "grad_norm": 0.4825156091808825, "learning_rate": 3.664021501252365e-05, "loss": 0.3947, "loss_nan_ranks": 0, "loss_rank_avg": 0.34351110458374023, "step": 2465, "valid_targets_mean": 3739.3, "valid_targets_min": 886 }, { "epoch": 1.8840579710144927, "grad_norm": 0.43231635726104817, "learning_rate": 3.661908275682626e-05, "loss": 0.3175, "loss_nan_ranks": 0, "loss_rank_avg": 0.3112673759460449, "step": 2470, "valid_targets_mean": 4797.2, "valid_targets_min": 858 }, { "epoch": 1.8878718535469108, "grad_norm": 0.4389419887999067, "learning_rate": 3.659789038489832e-05, "loss": 0.3301, "loss_nan_ranks": 0, "loss_rank_avg": 0.3528638780117035, "step": 2475, "valid_targets_mean": 4661.2, "valid_targets_min": 844 }, { "epoch": 1.8916857360793289, "grad_norm": 0.4063170356085659, "learning_rate": 3.657663797339902e-05, "loss": 0.3279, "loss_nan_ranks": 0, "loss_rank_avg": 0.3472946584224701, "step": 2480, "valid_targets_mean": 5096.3, "valid_targets_min": 1602 }, { "epoch": 1.8954996186117468, "grad_norm": 0.4473609779628171, "learning_rate": 3.655532559920474e-05, "loss": 0.3346, "loss_nan_ranks": 0, "loss_rank_avg": 0.35601258277893066, "step": 2485, "valid_targets_mean": 4471.4, "valid_targets_min": 473 }, { "epoch": 1.8993135011441646, "grad_norm": 0.510089392544064, "learning_rate": 3.653395333940875e-05, "loss": 0.3215, "loss_nan_ranks": 0, "loss_rank_avg": 0.3393765985965729, "step": 2490, "valid_targets_mean": 3695.0, "valid_targets_min": 1341 }, { "epoch": 1.9031273836765827, "grad_norm": 0.4163060605293795, "learning_rate": 3.651252127132097e-05, "loss": 0.3283, "loss_nan_ranks": 0, "loss_rank_avg": 0.34253692626953125, "step": 2495, "valid_targets_mean": 5056.7, "valid_targets_min": 1742 }, { "epoch": 1.9069412662090008, "grad_norm": 0.45275357622864393, "learning_rate": 3.6491029472467625e-05, "loss": 0.3338, "loss_nan_ranks": 0, "loss_rank_avg": 0.3306049704551697, "step": 2500, "valid_targets_mean": 4381.1, "valid_targets_min": 1526 }, { "epoch": 1.9107551487414187, "grad_norm": 0.4289727513447695, "learning_rate": 3.6469478020591046e-05, "loss": 0.3297, "loss_nan_ranks": 0, "loss_rank_avg": 0.31081557273864746, "step": 2505, "valid_targets_mean": 4142.5, "valid_targets_min": 380 }, { "epoch": 1.9145690312738368, "grad_norm": 0.45198414914401847, "learning_rate": 3.644786699364933e-05, "loss": 0.3347, "loss_nan_ranks": 0, "loss_rank_avg": 0.3111429512500763, "step": 2510, "valid_targets_mean": 4001.7, "valid_targets_min": 1419 }, { "epoch": 1.918382913806255, "grad_norm": 0.41966906491588385, "learning_rate": 3.6426196469816077e-05, "loss": 0.3287, "loss_nan_ranks": 0, "loss_rank_avg": 0.29943111538887024, "step": 2515, "valid_targets_mean": 4615.5, "valid_targets_min": 1134 }, { "epoch": 1.9221967963386728, "grad_norm": 0.3990234568258909, "learning_rate": 3.6404466527480085e-05, "loss": 0.3262, "loss_nan_ranks": 0, "loss_rank_avg": 0.3199032247066498, "step": 2520, "valid_targets_mean": 5416.6, "valid_targets_min": 1373 }, { "epoch": 1.9260106788710907, "grad_norm": 0.4100126062269341, "learning_rate": 3.638267724524512e-05, "loss": 0.3352, "loss_nan_ranks": 0, "loss_rank_avg": 0.3309996426105499, "step": 2525, "valid_targets_mean": 4957.5, "valid_targets_min": 1516 }, { "epoch": 1.9298245614035088, "grad_norm": 0.48930595113950065, "learning_rate": 3.636082870192957e-05, "loss": 0.3307, "loss_nan_ranks": 0, "loss_rank_avg": 0.3737516403198242, "step": 2530, "valid_targets_mean": 4311.6, "valid_targets_min": 1513 }, { "epoch": 1.9336384439359269, "grad_norm": 0.396990511331678, "learning_rate": 3.6338920976566206e-05, "loss": 0.3226, "loss_nan_ranks": 0, "loss_rank_avg": 0.316019207239151, "step": 2535, "valid_targets_mean": 4857.2, "valid_targets_min": 447 }, { "epoch": 1.9374523264683448, "grad_norm": 0.42707664137047063, "learning_rate": 3.631695414840188e-05, "loss": 0.3285, "loss_nan_ranks": 0, "loss_rank_avg": 0.2827240526676178, "step": 2540, "valid_targets_mean": 4249.3, "valid_targets_min": 1203 }, { "epoch": 1.9412662090007626, "grad_norm": 0.39704121969088363, "learning_rate": 3.629492829689722e-05, "loss": 0.3314, "loss_nan_ranks": 0, "loss_rank_avg": 0.3076905310153961, "step": 2545, "valid_targets_mean": 5482.1, "valid_targets_min": 1125 }, { "epoch": 1.9450800915331807, "grad_norm": 0.489030926911963, "learning_rate": 3.627284350172637e-05, "loss": 0.3348, "loss_nan_ranks": 0, "loss_rank_avg": 0.3305893838405609, "step": 2550, "valid_targets_mean": 4072.5, "valid_targets_min": 1354 }, { "epoch": 1.9488939740655988, "grad_norm": 0.4784627205409548, "learning_rate": 3.625069984277669e-05, "loss": 0.3199, "loss_nan_ranks": 0, "loss_rank_avg": 0.30123528838157654, "step": 2555, "valid_targets_mean": 3369.6, "valid_targets_min": 827 }, { "epoch": 1.9527078565980167, "grad_norm": 0.5780502983031945, "learning_rate": 3.622849740014846e-05, "loss": 0.3164, "loss_nan_ranks": 0, "loss_rank_avg": 0.2978937327861786, "step": 2560, "valid_targets_mean": 3833.6, "valid_targets_min": 883 }, { "epoch": 1.9565217391304348, "grad_norm": 0.4596843365698298, "learning_rate": 3.620623625415462e-05, "loss": 0.314, "loss_nan_ranks": 0, "loss_rank_avg": 0.30321425199508667, "step": 2565, "valid_targets_mean": 4876.5, "valid_targets_min": 1284 }, { "epoch": 1.960335621662853, "grad_norm": 0.49794938194155713, "learning_rate": 3.618391648532043e-05, "loss": 0.321, "loss_nan_ranks": 0, "loss_rank_avg": 0.3527390658855438, "step": 2570, "valid_targets_mean": 4544.0, "valid_targets_min": 1082 }, { "epoch": 1.9641495041952708, "grad_norm": 0.4306105153001951, "learning_rate": 3.616153817438323e-05, "loss": 0.3217, "loss_nan_ranks": 0, "loss_rank_avg": 0.2867111265659332, "step": 2575, "valid_targets_mean": 4612.7, "valid_targets_min": 1333 }, { "epoch": 1.9679633867276887, "grad_norm": 0.5634464378301066, "learning_rate": 3.613910140229212e-05, "loss": 0.3341, "loss_nan_ranks": 0, "loss_rank_avg": 0.3393392860889435, "step": 2580, "valid_targets_mean": 3495.5, "valid_targets_min": 620 }, { "epoch": 1.9717772692601068, "grad_norm": 0.42643538618721466, "learning_rate": 3.6116606250207646e-05, "loss": 0.3293, "loss_nan_ranks": 0, "loss_rank_avg": 0.314686119556427, "step": 2585, "valid_targets_mean": 4382.7, "valid_targets_min": 505 }, { "epoch": 1.9755911517925249, "grad_norm": 0.461418186680906, "learning_rate": 3.609405279950157e-05, "loss": 0.3238, "loss_nan_ranks": 0, "loss_rank_avg": 0.3472661077976227, "step": 2590, "valid_targets_mean": 3919.9, "valid_targets_min": 1075 }, { "epoch": 1.9794050343249427, "grad_norm": 0.46477198331279196, "learning_rate": 3.607144113175652e-05, "loss": 0.3255, "loss_nan_ranks": 0, "loss_rank_avg": 0.31344321370124817, "step": 2595, "valid_targets_mean": 3753.2, "valid_targets_min": 753 }, { "epoch": 1.9832189168573608, "grad_norm": 0.4705572499094467, "learning_rate": 3.6048771328765695e-05, "loss": 0.3371, "loss_nan_ranks": 0, "loss_rank_avg": 0.3468952476978302, "step": 2600, "valid_targets_mean": 3563.1, "valid_targets_min": 521 }, { "epoch": 1.987032799389779, "grad_norm": 0.4894559516834718, "learning_rate": 3.602604347253262e-05, "loss": 0.3281, "loss_nan_ranks": 0, "loss_rank_avg": 0.3458186089992523, "step": 2605, "valid_targets_mean": 4363.7, "valid_targets_min": 447 }, { "epoch": 1.9908466819221968, "grad_norm": 0.4430488468498321, "learning_rate": 3.600325764527079e-05, "loss": 0.3227, "loss_nan_ranks": 0, "loss_rank_avg": 0.3441220819950104, "step": 2610, "valid_targets_mean": 4790.8, "valid_targets_min": 915 }, { "epoch": 1.9946605644546147, "grad_norm": 0.48404364026741203, "learning_rate": 3.598041392940342e-05, "loss": 0.3197, "loss_nan_ranks": 0, "loss_rank_avg": 0.2899083197116852, "step": 2615, "valid_targets_mean": 3817.0, "valid_targets_min": 1202 }, { "epoch": 1.9984744469870328, "grad_norm": 1.695860308561902, "learning_rate": 3.5957512407563105e-05, "loss": 0.4769, "loss_nan_ranks": 0, "loss_rank_avg": 0.6421945095062256, "step": 2620, "valid_targets_mean": 780.0, "valid_targets_min": 493 }, { "epoch": 2.002288329519451, "grad_norm": 0.4518557790697791, "learning_rate": 3.593455316259155e-05, "loss": 0.4355, "loss_nan_ranks": 0, "loss_rank_avg": 0.28681135177612305, "step": 2625, "valid_targets_mean": 4816.6, "valid_targets_min": 1551 }, { "epoch": 2.006102212051869, "grad_norm": 0.44782126292756547, "learning_rate": 3.591153627753927e-05, "loss": 0.3292, "loss_nan_ranks": 0, "loss_rank_avg": 0.3092162013053894, "step": 2630, "valid_targets_mean": 4868.9, "valid_targets_min": 1506 }, { "epoch": 2.0099160945842867, "grad_norm": 0.527863530413975, "learning_rate": 3.588846183566527e-05, "loss": 0.3364, "loss_nan_ranks": 0, "loss_rank_avg": 0.3203107416629791, "step": 2635, "valid_targets_mean": 3651.8, "valid_targets_min": 728 }, { "epoch": 2.013729977116705, "grad_norm": 0.4487355300143573, "learning_rate": 3.586532992043677e-05, "loss": 0.3156, "loss_nan_ranks": 0, "loss_rank_avg": 0.3486725986003876, "step": 2640, "valid_targets_mean": 4654.1, "valid_targets_min": 1003 }, { "epoch": 2.017543859649123, "grad_norm": 0.4149528992346252, "learning_rate": 3.584214061552886e-05, "loss": 0.3187, "loss_nan_ranks": 0, "loss_rank_avg": 0.30172497034072876, "step": 2645, "valid_targets_mean": 4589.0, "valid_targets_min": 364 }, { "epoch": 2.0213577421815407, "grad_norm": 0.4380270269367264, "learning_rate": 3.581889400482425e-05, "loss": 0.3305, "loss_nan_ranks": 0, "loss_rank_avg": 0.3232972025871277, "step": 2650, "valid_targets_mean": 4193.9, "valid_targets_min": 1205 }, { "epoch": 2.0251716247139586, "grad_norm": 0.44838457623258393, "learning_rate": 3.5795590172412946e-05, "loss": 0.3239, "loss_nan_ranks": 0, "loss_rank_avg": 0.3213779926300049, "step": 2655, "valid_targets_mean": 5098.0, "valid_targets_min": 1071 }, { "epoch": 2.028985507246377, "grad_norm": 0.45016704498329, "learning_rate": 3.5772229202591926e-05, "loss": 0.3448, "loss_nan_ranks": 0, "loss_rank_avg": 0.3524353504180908, "step": 2660, "valid_targets_mean": 4527.9, "valid_targets_min": 1649 }, { "epoch": 2.032799389778795, "grad_norm": 0.4465006685050878, "learning_rate": 3.574881117986486e-05, "loss": 0.3166, "loss_nan_ranks": 0, "loss_rank_avg": 0.3029600977897644, "step": 2665, "valid_targets_mean": 3735.4, "valid_targets_min": 601 }, { "epoch": 2.0366132723112127, "grad_norm": 0.4422827681174769, "learning_rate": 3.5725336188941785e-05, "loss": 0.2975, "loss_nan_ranks": 0, "loss_rank_avg": 0.2614348232746124, "step": 2670, "valid_targets_mean": 4119.3, "valid_targets_min": 668 }, { "epoch": 2.040427154843631, "grad_norm": 0.4482051429709076, "learning_rate": 3.570180431473883e-05, "loss": 0.3153, "loss_nan_ranks": 0, "loss_rank_avg": 0.3411577641963959, "step": 2675, "valid_targets_mean": 4912.2, "valid_targets_min": 955 }, { "epoch": 2.044241037376049, "grad_norm": 0.4869196336236238, "learning_rate": 3.567821564237787e-05, "loss": 0.3302, "loss_nan_ranks": 0, "loss_rank_avg": 0.34559619426727295, "step": 2680, "valid_targets_mean": 3815.8, "valid_targets_min": 1018 }, { "epoch": 2.0480549199084668, "grad_norm": 0.4897608405458026, "learning_rate": 3.565457025718624e-05, "loss": 0.321, "loss_nan_ranks": 0, "loss_rank_avg": 0.3251894414424896, "step": 2685, "valid_targets_mean": 3756.0, "valid_targets_min": 814 }, { "epoch": 2.0518688024408847, "grad_norm": 0.3818311129689496, "learning_rate": 3.563086824469642e-05, "loss": 0.3042, "loss_nan_ranks": 0, "loss_rank_avg": 0.27594801783561707, "step": 2690, "valid_targets_mean": 5182.2, "valid_targets_min": 1313 }, { "epoch": 2.055682684973303, "grad_norm": 0.40078657159991377, "learning_rate": 3.560710969064574e-05, "loss": 0.3339, "loss_nan_ranks": 0, "loss_rank_avg": 0.34894654154777527, "step": 2695, "valid_targets_mean": 5636.0, "valid_targets_min": 1050 }, { "epoch": 2.059496567505721, "grad_norm": 0.4314520672830342, "learning_rate": 3.558329468097604e-05, "loss": 0.3159, "loss_nan_ranks": 0, "loss_rank_avg": 0.30594441294670105, "step": 2700, "valid_targets_mean": 4584.9, "valid_targets_min": 626 }, { "epoch": 2.0633104500381387, "grad_norm": 0.4330320629369986, "learning_rate": 3.555942330183341e-05, "loss": 0.3276, "loss_nan_ranks": 0, "loss_rank_avg": 0.33816561102867126, "step": 2705, "valid_targets_mean": 5605.0, "valid_targets_min": 1122 }, { "epoch": 2.0671243325705566, "grad_norm": 0.432663280927747, "learning_rate": 3.553549563956779e-05, "loss": 0.3254, "loss_nan_ranks": 0, "loss_rank_avg": 0.2950657904148102, "step": 2710, "valid_targets_mean": 4556.0, "valid_targets_min": 764 }, { "epoch": 2.070938215102975, "grad_norm": 0.3980785685365819, "learning_rate": 3.551151178073276e-05, "loss": 0.3239, "loss_nan_ranks": 0, "loss_rank_avg": 0.351774126291275, "step": 2715, "valid_targets_mean": 5619.8, "valid_targets_min": 535 }, { "epoch": 2.074752097635393, "grad_norm": 0.42705954615047537, "learning_rate": 3.548747181208516e-05, "loss": 0.3194, "loss_nan_ranks": 0, "loss_rank_avg": 0.2942444086074829, "step": 2720, "valid_targets_mean": 4475.0, "valid_targets_min": 337 }, { "epoch": 2.0785659801678107, "grad_norm": 0.4250243681722831, "learning_rate": 3.5463375820584826e-05, "loss": 0.3113, "loss_nan_ranks": 0, "loss_rank_avg": 0.3257274925708771, "step": 2725, "valid_targets_mean": 4989.0, "valid_targets_min": 816 }, { "epoch": 2.082379862700229, "grad_norm": 0.4781865116161094, "learning_rate": 3.5439223893394185e-05, "loss": 0.32, "loss_nan_ranks": 0, "loss_rank_avg": 0.36427298188209534, "step": 2730, "valid_targets_mean": 3891.9, "valid_targets_min": 989 }, { "epoch": 2.086193745232647, "grad_norm": 0.432991181042828, "learning_rate": 3.541501611787806e-05, "loss": 0.3269, "loss_nan_ranks": 0, "loss_rank_avg": 0.29490405321121216, "step": 2735, "valid_targets_mean": 4064.3, "valid_targets_min": 1512 }, { "epoch": 2.0900076277650648, "grad_norm": 0.4358409077212192, "learning_rate": 3.5390752581603256e-05, "loss": 0.3241, "loss_nan_ranks": 0, "loss_rank_avg": 0.3720548152923584, "step": 2740, "valid_targets_mean": 5014.2, "valid_targets_min": 1590 }, { "epoch": 2.0938215102974826, "grad_norm": 0.4051452760209203, "learning_rate": 3.536643337233831e-05, "loss": 0.3314, "loss_nan_ranks": 0, "loss_rank_avg": 0.32935160398483276, "step": 2745, "valid_targets_mean": 5356.0, "valid_targets_min": 563 }, { "epoch": 2.097635392829901, "grad_norm": 0.4618577711694058, "learning_rate": 3.5342058578053115e-05, "loss": 0.3115, "loss_nan_ranks": 0, "loss_rank_avg": 0.31700313091278076, "step": 2750, "valid_targets_mean": 4074.1, "valid_targets_min": 1113 }, { "epoch": 2.101449275362319, "grad_norm": 0.4650533706947534, "learning_rate": 3.5317628286918654e-05, "loss": 0.3128, "loss_nan_ranks": 0, "loss_rank_avg": 0.3038328289985657, "step": 2755, "valid_targets_mean": 3777.7, "valid_targets_min": 1051 }, { "epoch": 2.1052631578947367, "grad_norm": 0.3911911315347162, "learning_rate": 3.5293142587306656e-05, "loss": 0.3206, "loss_nan_ranks": 0, "loss_rank_avg": 0.3163069784641266, "step": 2760, "valid_targets_mean": 5114.2, "valid_targets_min": 1244 }, { "epoch": 2.109077040427155, "grad_norm": 0.4528620401506649, "learning_rate": 3.526860156778927e-05, "loss": 0.3408, "loss_nan_ranks": 0, "loss_rank_avg": 0.3514285981655121, "step": 2765, "valid_targets_mean": 3839.7, "valid_targets_min": 1011 }, { "epoch": 2.112890922959573, "grad_norm": 0.4177167860467384, "learning_rate": 3.524400531713876e-05, "loss": 0.3041, "loss_nan_ranks": 0, "loss_rank_avg": 0.3051723837852478, "step": 2770, "valid_targets_mean": 5298.1, "valid_targets_min": 1803 }, { "epoch": 2.116704805491991, "grad_norm": 0.4003676926723766, "learning_rate": 3.521935392432718e-05, "loss": 0.3131, "loss_nan_ranks": 0, "loss_rank_avg": 0.31541749835014343, "step": 2775, "valid_targets_mean": 4743.7, "valid_targets_min": 1137 }, { "epoch": 2.1205186880244087, "grad_norm": 0.4520780702808259, "learning_rate": 3.5194647478526044e-05, "loss": 0.3177, "loss_nan_ranks": 0, "loss_rank_avg": 0.31706899404525757, "step": 2780, "valid_targets_mean": 4706.4, "valid_targets_min": 267 }, { "epoch": 2.124332570556827, "grad_norm": 1.4925281950577982, "learning_rate": 3.5169886069106015e-05, "loss": 0.5112, "loss_nan_ranks": 0, "loss_rank_avg": 0.637296736240387, "step": 2785, "valid_targets_mean": 864.1, "valid_targets_min": 587 }, { "epoch": 2.128146453089245, "grad_norm": 0.4277812995302766, "learning_rate": 3.5145069785636576e-05, "loss": 0.3356, "loss_nan_ranks": 0, "loss_rank_avg": 0.34565839171409607, "step": 2790, "valid_targets_mean": 4901.5, "valid_targets_min": 1024 }, { "epoch": 2.1319603356216628, "grad_norm": 0.4339866826762552, "learning_rate": 3.512019871788569e-05, "loss": 0.33, "loss_nan_ranks": 0, "loss_rank_avg": 0.3311890661716461, "step": 2795, "valid_targets_mean": 4585.2, "valid_targets_min": 803 }, { "epoch": 2.135774218154081, "grad_norm": 0.44356752428059937, "learning_rate": 3.509527295581951e-05, "loss": 0.33, "loss_nan_ranks": 0, "loss_rank_avg": 0.34069275856018066, "step": 2800, "valid_targets_mean": 5747.2, "valid_targets_min": 1140 }, { "epoch": 2.139588100686499, "grad_norm": 0.48873464445289144, "learning_rate": 3.507029258960203e-05, "loss": 0.3185, "loss_nan_ranks": 0, "loss_rank_avg": 0.3361491858959198, "step": 2805, "valid_targets_mean": 5306.7, "valid_targets_min": 1462 }, { "epoch": 2.143401983218917, "grad_norm": 0.40843884861087065, "learning_rate": 3.504525770959477e-05, "loss": 0.3325, "loss_nan_ranks": 0, "loss_rank_avg": 0.345804363489151, "step": 2810, "valid_targets_mean": 5229.5, "valid_targets_min": 375 }, { "epoch": 2.1472158657513347, "grad_norm": 0.4304445901977957, "learning_rate": 3.502016840635642e-05, "loss": 0.3228, "loss_nan_ranks": 0, "loss_rank_avg": 0.32236722111701965, "step": 2815, "valid_targets_mean": 4655.3, "valid_targets_min": 1315 }, { "epoch": 2.151029748283753, "grad_norm": 0.42379821089500375, "learning_rate": 3.4995024770642554e-05, "loss": 0.3353, "loss_nan_ranks": 0, "loss_rank_avg": 0.3316449224948883, "step": 2820, "valid_targets_mean": 4426.3, "valid_targets_min": 1482 }, { "epoch": 2.154843630816171, "grad_norm": 0.41185583474074233, "learning_rate": 3.4969826893405294e-05, "loss": 0.3296, "loss_nan_ranks": 0, "loss_rank_avg": 0.34358730912208557, "step": 2825, "valid_targets_mean": 5202.3, "valid_targets_min": 1354 }, { "epoch": 2.158657513348589, "grad_norm": 0.44266026669962844, "learning_rate": 3.4944574865792945e-05, "loss": 0.2938, "loss_nan_ranks": 0, "loss_rank_avg": 0.30736637115478516, "step": 2830, "valid_targets_mean": 4420.9, "valid_targets_min": 1073 }, { "epoch": 2.1624713958810067, "grad_norm": 0.4061991514677841, "learning_rate": 3.4919268779149696e-05, "loss": 0.316, "loss_nan_ranks": 0, "loss_rank_avg": 0.31193986535072327, "step": 2835, "valid_targets_mean": 4632.8, "valid_targets_min": 1249 }, { "epoch": 2.166285278413425, "grad_norm": 0.43478104011120616, "learning_rate": 3.489390872501529e-05, "loss": 0.3075, "loss_nan_ranks": 0, "loss_rank_avg": 0.3487791121006012, "step": 2840, "valid_targets_mean": 4533.8, "valid_targets_min": 1392 }, { "epoch": 2.170099160945843, "grad_norm": 0.4078062523633683, "learning_rate": 3.4868494795124705e-05, "loss": 0.3328, "loss_nan_ranks": 0, "loss_rank_avg": 0.3065103590488434, "step": 2845, "valid_targets_mean": 4814.8, "valid_targets_min": 763 }, { "epoch": 2.1739130434782608, "grad_norm": 0.4289713522809232, "learning_rate": 3.484302708140775e-05, "loss": 0.3041, "loss_nan_ranks": 0, "loss_rank_avg": 0.33483967185020447, "step": 2850, "valid_targets_mean": 4179.2, "valid_targets_min": 1051 }, { "epoch": 2.177726926010679, "grad_norm": 0.472220403001625, "learning_rate": 3.481750567598885e-05, "loss": 0.3223, "loss_nan_ranks": 0, "loss_rank_avg": 0.362771600484848, "step": 2855, "valid_targets_mean": 4404.5, "valid_targets_min": 1088 }, { "epoch": 2.181540808543097, "grad_norm": 0.3648207114064372, "learning_rate": 3.47919306711866e-05, "loss": 0.3178, "loss_nan_ranks": 0, "loss_rank_avg": 0.2925264835357666, "step": 2860, "valid_targets_mean": 5416.4, "valid_targets_min": 1482 }, { "epoch": 2.185354691075515, "grad_norm": 0.39372615878666817, "learning_rate": 3.4766302159513514e-05, "loss": 0.3048, "loss_nan_ranks": 0, "loss_rank_avg": 0.31346771121025085, "step": 2865, "valid_targets_mean": 5427.8, "valid_targets_min": 1130 }, { "epoch": 2.1891685736079327, "grad_norm": 0.4126857886832629, "learning_rate": 3.474062023367563e-05, "loss": 0.3276, "loss_nan_ranks": 0, "loss_rank_avg": 0.3509589433670044, "step": 2870, "valid_targets_mean": 5269.3, "valid_targets_min": 991 }, { "epoch": 2.192982456140351, "grad_norm": 0.411651571169999, "learning_rate": 3.471488498657222e-05, "loss": 0.3097, "loss_nan_ranks": 0, "loss_rank_avg": 0.3311251401901245, "step": 2875, "valid_targets_mean": 5288.4, "valid_targets_min": 763 }, { "epoch": 2.196796338672769, "grad_norm": 0.44636044736979674, "learning_rate": 3.468909651129543e-05, "loss": 0.3165, "loss_nan_ranks": 0, "loss_rank_avg": 0.3214028775691986, "step": 2880, "valid_targets_mean": 4051.4, "valid_targets_min": 990 }, { "epoch": 2.200610221205187, "grad_norm": 0.4449036968288949, "learning_rate": 3.466325490112993e-05, "loss": 0.3097, "loss_nan_ranks": 0, "loss_rank_avg": 0.2663789689540863, "step": 2885, "valid_targets_mean": 3941.7, "valid_targets_min": 605 }, { "epoch": 2.2044241037376047, "grad_norm": 0.43992016755573804, "learning_rate": 3.463736024955263e-05, "loss": 0.3234, "loss_nan_ranks": 0, "loss_rank_avg": 0.3127845525741577, "step": 2890, "valid_targets_mean": 5903.5, "valid_targets_min": 1002 }, { "epoch": 2.208237986270023, "grad_norm": 0.43453745171374947, "learning_rate": 3.461141265023229e-05, "loss": 0.3302, "loss_nan_ranks": 0, "loss_rank_avg": 0.29881763458251953, "step": 2895, "valid_targets_mean": 4015.5, "valid_targets_min": 724 }, { "epoch": 2.212051868802441, "grad_norm": 0.3852285397340729, "learning_rate": 3.4585412197029176e-05, "loss": 0.3309, "loss_nan_ranks": 0, "loss_rank_avg": 0.29247185587882996, "step": 2900, "valid_targets_mean": 4694.1, "valid_targets_min": 1035 }, { "epoch": 2.2158657513348587, "grad_norm": 0.5136665672114349, "learning_rate": 3.455935898399479e-05, "loss": 0.3225, "loss_nan_ranks": 0, "loss_rank_avg": 0.3353908956050873, "step": 2905, "valid_targets_mean": 4370.2, "valid_targets_min": 1005 }, { "epoch": 2.219679633867277, "grad_norm": 0.4881189152233372, "learning_rate": 3.453325310537142e-05, "loss": 0.3362, "loss_nan_ranks": 0, "loss_rank_avg": 0.3274397552013397, "step": 2910, "valid_targets_mean": 4228.9, "valid_targets_min": 1214 }, { "epoch": 2.223493516399695, "grad_norm": 0.4195992283622164, "learning_rate": 3.450709465559194e-05, "loss": 0.3044, "loss_nan_ranks": 0, "loss_rank_avg": 0.32342055439949036, "step": 2915, "valid_targets_mean": 4261.7, "valid_targets_min": 919 }, { "epoch": 2.227307398932113, "grad_norm": 0.4159790401363364, "learning_rate": 3.4480883729279305e-05, "loss": 0.3543, "loss_nan_ranks": 0, "loss_rank_avg": 0.33828291296958923, "step": 2920, "valid_targets_mean": 4834.0, "valid_targets_min": 1373 }, { "epoch": 2.2311212814645307, "grad_norm": 0.4165223915561082, "learning_rate": 3.445462042124636e-05, "loss": 0.3215, "loss_nan_ranks": 0, "loss_rank_avg": 0.3129110634326935, "step": 2925, "valid_targets_mean": 4497.5, "valid_targets_min": 1123 }, { "epoch": 2.234935163996949, "grad_norm": 0.38466587084214765, "learning_rate": 3.442830482649539e-05, "loss": 0.3256, "loss_nan_ranks": 0, "loss_rank_avg": 0.3339121341705322, "step": 2930, "valid_targets_mean": 5770.3, "valid_targets_min": 1754 }, { "epoch": 2.238749046529367, "grad_norm": 0.40262584621326525, "learning_rate": 3.440193704021783e-05, "loss": 0.3138, "loss_nan_ranks": 0, "loss_rank_avg": 0.31021028757095337, "step": 2935, "valid_targets_mean": 5080.9, "valid_targets_min": 1674 }, { "epoch": 2.242562929061785, "grad_norm": 0.41779524060918555, "learning_rate": 3.4375517157793927e-05, "loss": 0.3317, "loss_nan_ranks": 0, "loss_rank_avg": 0.32838132977485657, "step": 2940, "valid_targets_mean": 4848.7, "valid_targets_min": 1385 }, { "epoch": 2.246376811594203, "grad_norm": 0.4640321321894666, "learning_rate": 3.434904527479235e-05, "loss": 0.3195, "loss_nan_ranks": 0, "loss_rank_avg": 0.3334600031375885, "step": 2945, "valid_targets_mean": 4124.4, "valid_targets_min": 1203 }, { "epoch": 2.250190694126621, "grad_norm": 1.2455406449672553, "learning_rate": 3.4322521486969866e-05, "loss": 0.5444, "loss_nan_ranks": 0, "loss_rank_avg": 0.6027448773384094, "step": 2950, "valid_targets_mean": 885.0, "valid_targets_min": 551 }, { "epoch": 2.254004576659039, "grad_norm": 0.4533102457871256, "learning_rate": 3.429594589027102e-05, "loss": 0.3982, "loss_nan_ranks": 0, "loss_rank_avg": 0.31670811772346497, "step": 2955, "valid_targets_mean": 5360.8, "valid_targets_min": 1229 }, { "epoch": 2.2578184591914567, "grad_norm": 0.45007990340926657, "learning_rate": 3.426931858082775e-05, "loss": 0.3292, "loss_nan_ranks": 0, "loss_rank_avg": 0.27866581082344055, "step": 2960, "valid_targets_mean": 4068.8, "valid_targets_min": 978 }, { "epoch": 2.261632341723875, "grad_norm": 0.4182475658385057, "learning_rate": 3.4242639654959055e-05, "loss": 0.3168, "loss_nan_ranks": 0, "loss_rank_avg": 0.33048322796821594, "step": 2965, "valid_targets_mean": 5333.2, "valid_targets_min": 1035 }, { "epoch": 2.265446224256293, "grad_norm": 0.44982078901385464, "learning_rate": 3.4215909209170656e-05, "loss": 0.3364, "loss_nan_ranks": 0, "loss_rank_avg": 0.3067856431007385, "step": 2970, "valid_targets_mean": 4327.3, "valid_targets_min": 1058 }, { "epoch": 2.269260106788711, "grad_norm": 0.4246313159105408, "learning_rate": 3.418912734015463e-05, "loss": 0.3272, "loss_nan_ranks": 0, "loss_rank_avg": 0.3462902009487152, "step": 2975, "valid_targets_mean": 4803.1, "valid_targets_min": 403 }, { "epoch": 2.273073989321129, "grad_norm": 0.4537107473424202, "learning_rate": 3.416229414478907e-05, "loss": 0.3241, "loss_nan_ranks": 0, "loss_rank_avg": 0.3000136911869049, "step": 2980, "valid_targets_mean": 4820.1, "valid_targets_min": 1166 }, { "epoch": 2.276887871853547, "grad_norm": 0.4202091063659574, "learning_rate": 3.4135409720137725e-05, "loss": 0.3084, "loss_nan_ranks": 0, "loss_rank_avg": 0.28874197602272034, "step": 2985, "valid_targets_mean": 3907.3, "valid_targets_min": 1048 }, { "epoch": 2.280701754385965, "grad_norm": 0.46834762645468975, "learning_rate": 3.4108474163449653e-05, "loss": 0.3157, "loss_nan_ranks": 0, "loss_rank_avg": 0.35787180066108704, "step": 2990, "valid_targets_mean": 3768.8, "valid_targets_min": 969 }, { "epoch": 2.2845156369183828, "grad_norm": 0.44621662808084633, "learning_rate": 3.40814875721589e-05, "loss": 0.3134, "loss_nan_ranks": 0, "loss_rank_avg": 0.3383162319660187, "step": 2995, "valid_targets_mean": 4347.9, "valid_targets_min": 681 }, { "epoch": 2.288329519450801, "grad_norm": 0.4276744418335265, "learning_rate": 3.405445004388408e-05, "loss": 0.3016, "loss_nan_ranks": 0, "loss_rank_avg": 0.28751322627067566, "step": 3000, "valid_targets_mean": 4021.9, "valid_targets_min": 1002 }, { "epoch": 2.292143401983219, "grad_norm": 0.43665377536255506, "learning_rate": 3.402736167642809e-05, "loss": 0.3098, "loss_nan_ranks": 0, "loss_rank_avg": 0.3026927411556244, "step": 3005, "valid_targets_mean": 4820.8, "valid_targets_min": 1394 }, { "epoch": 2.295957284515637, "grad_norm": 0.41102468091858063, "learning_rate": 3.400022256777772e-05, "loss": 0.3075, "loss_nan_ranks": 0, "loss_rank_avg": 0.29576948285102844, "step": 3010, "valid_targets_mean": 4581.5, "valid_targets_min": 1097 }, { "epoch": 2.2997711670480547, "grad_norm": 0.38434638037208735, "learning_rate": 3.39730328161033e-05, "loss": 0.311, "loss_nan_ranks": 0, "loss_rank_avg": 0.3018251061439514, "step": 3015, "valid_targets_mean": 4958.6, "valid_targets_min": 1754 }, { "epoch": 2.303585049580473, "grad_norm": 0.4335198527505541, "learning_rate": 3.394579251975836e-05, "loss": 0.3124, "loss_nan_ranks": 0, "loss_rank_avg": 0.2881692051887512, "step": 3020, "valid_targets_mean": 4141.5, "valid_targets_min": 1515 }, { "epoch": 2.307398932112891, "grad_norm": 0.4124467111134283, "learning_rate": 3.391850177727924e-05, "loss": 0.3264, "loss_nan_ranks": 0, "loss_rank_avg": 0.35339486598968506, "step": 3025, "valid_targets_mean": 5283.4, "valid_targets_min": 1263 }, { "epoch": 2.311212814645309, "grad_norm": 0.4661684649657449, "learning_rate": 3.389116068738482e-05, "loss": 0.3024, "loss_nan_ranks": 0, "loss_rank_avg": 0.31515705585479736, "step": 3030, "valid_targets_mean": 4185.0, "valid_targets_min": 492 }, { "epoch": 2.3150266971777267, "grad_norm": 0.435483883866706, "learning_rate": 3.3863769348976024e-05, "loss": 0.312, "loss_nan_ranks": 0, "loss_rank_avg": 0.3099616467952728, "step": 3035, "valid_targets_mean": 4285.6, "valid_targets_min": 712 }, { "epoch": 2.318840579710145, "grad_norm": 0.4489741349463335, "learning_rate": 3.38363278611356e-05, "loss": 0.3186, "loss_nan_ranks": 0, "loss_rank_avg": 0.31510940194129944, "step": 3040, "valid_targets_mean": 4578.5, "valid_targets_min": 1220 }, { "epoch": 2.322654462242563, "grad_norm": 0.454132578096704, "learning_rate": 3.3808836323127666e-05, "loss": 0.3045, "loss_nan_ranks": 0, "loss_rank_avg": 0.31616052985191345, "step": 3045, "valid_targets_mean": 4476.0, "valid_targets_min": 924 }, { "epoch": 2.3264683447749808, "grad_norm": 0.4706189536012141, "learning_rate": 3.3781294834397416e-05, "loss": 0.3202, "loss_nan_ranks": 0, "loss_rank_avg": 0.3171687722206116, "step": 3050, "valid_targets_mean": 3822.8, "valid_targets_min": 1079 }, { "epoch": 2.330282227307399, "grad_norm": 0.4688702774722974, "learning_rate": 3.375370349457069e-05, "loss": 0.3144, "loss_nan_ranks": 0, "loss_rank_avg": 0.29751574993133545, "step": 3055, "valid_targets_mean": 3372.0, "valid_targets_min": 745 }, { "epoch": 2.334096109839817, "grad_norm": 0.45350633325165235, "learning_rate": 3.37260624034537e-05, "loss": 0.3064, "loss_nan_ranks": 0, "loss_rank_avg": 0.26518234610557556, "step": 3060, "valid_targets_mean": 3821.1, "valid_targets_min": 1002 }, { "epoch": 2.337909992372235, "grad_norm": 0.4509818679226893, "learning_rate": 3.36983716610326e-05, "loss": 0.3066, "loss_nan_ranks": 0, "loss_rank_avg": 0.2775558531284332, "step": 3065, "valid_targets_mean": 3986.3, "valid_targets_min": 1127 }, { "epoch": 2.3417238749046527, "grad_norm": 0.4220414814745815, "learning_rate": 3.3670631367473136e-05, "loss": 0.3239, "loss_nan_ranks": 0, "loss_rank_avg": 0.31039997935295105, "step": 3070, "valid_targets_mean": 4780.5, "valid_targets_min": 1411 }, { "epoch": 2.345537757437071, "grad_norm": 0.4625202358326965, "learning_rate": 3.364284162312032e-05, "loss": 0.3128, "loss_nan_ranks": 0, "loss_rank_avg": 0.3140174150466919, "step": 3075, "valid_targets_mean": 3760.7, "valid_targets_min": 1065 }, { "epoch": 2.349351639969489, "grad_norm": 0.4041288445251084, "learning_rate": 3.361500252849803e-05, "loss": 0.3071, "loss_nan_ranks": 0, "loss_rank_avg": 0.2915945053100586, "step": 3080, "valid_targets_mean": 4437.5, "valid_targets_min": 743 }, { "epoch": 2.353165522501907, "grad_norm": 0.42664167212219883, "learning_rate": 3.3587114184308664e-05, "loss": 0.3237, "loss_nan_ranks": 0, "loss_rank_avg": 0.3082127869129181, "step": 3085, "valid_targets_mean": 4920.8, "valid_targets_min": 566 }, { "epoch": 2.356979405034325, "grad_norm": 0.45595971770828464, "learning_rate": 3.355917669143276e-05, "loss": 0.3026, "loss_nan_ranks": 0, "loss_rank_avg": 0.314989298582077, "step": 3090, "valid_targets_mean": 3974.5, "valid_targets_min": 1242 }, { "epoch": 2.360793287566743, "grad_norm": 0.4267031520990776, "learning_rate": 3.3531190150928655e-05, "loss": 0.3122, "loss_nan_ranks": 0, "loss_rank_avg": 0.31824013590812683, "step": 3095, "valid_targets_mean": 4419.4, "valid_targets_min": 1017 }, { "epoch": 2.364607170099161, "grad_norm": 0.40719312557802045, "learning_rate": 3.35031546640321e-05, "loss": 0.3039, "loss_nan_ranks": 0, "loss_rank_avg": 0.29631316661834717, "step": 3100, "valid_targets_mean": 4890.0, "valid_targets_min": 1432 }, { "epoch": 2.3684210526315788, "grad_norm": 0.4836219301990495, "learning_rate": 3.347507033215589e-05, "loss": 0.3117, "loss_nan_ranks": 0, "loss_rank_avg": 0.3056109845638275, "step": 3105, "valid_targets_mean": 3523.5, "valid_targets_min": 1035 }, { "epoch": 2.372234935163997, "grad_norm": 0.46664455271321875, "learning_rate": 3.344693725688953e-05, "loss": 0.2896, "loss_nan_ranks": 0, "loss_rank_avg": 0.30344218015670776, "step": 3110, "valid_targets_mean": 4145.0, "valid_targets_min": 1151 }, { "epoch": 2.376048817696415, "grad_norm": 0.4709941009473953, "learning_rate": 3.341875553999883e-05, "loss": 0.4522, "loss_nan_ranks": 0, "loss_rank_avg": 0.29392245411872864, "step": 3115, "valid_targets_mean": 4008.7, "valid_targets_min": 371 }, { "epoch": 2.379862700228833, "grad_norm": 0.4204995391050676, "learning_rate": 3.339052528342554e-05, "loss": 0.3344, "loss_nan_ranks": 0, "loss_rank_avg": 0.34602752327919006, "step": 3120, "valid_targets_mean": 4779.5, "valid_targets_min": 1024 }, { "epoch": 2.383676582761251, "grad_norm": 0.4404868029867653, "learning_rate": 3.336224658928702e-05, "loss": 0.3234, "loss_nan_ranks": 0, "loss_rank_avg": 0.3412117063999176, "step": 3125, "valid_targets_mean": 4316.2, "valid_targets_min": 1087 }, { "epoch": 2.387490465293669, "grad_norm": 0.48253694746867987, "learning_rate": 3.3333919559875817e-05, "loss": 0.3181, "loss_nan_ranks": 0, "loss_rank_avg": 0.30176326632499695, "step": 3130, "valid_targets_mean": 3363.5, "valid_targets_min": 1126 }, { "epoch": 2.391304347826087, "grad_norm": 0.47060528945887725, "learning_rate": 3.330554429765933e-05, "loss": 0.3056, "loss_nan_ranks": 0, "loss_rank_avg": 0.2910543978214264, "step": 3135, "valid_targets_mean": 4389.2, "valid_targets_min": 1106 }, { "epoch": 2.395118230358505, "grad_norm": 0.40268416401652135, "learning_rate": 3.3277120905279454e-05, "loss": 0.3301, "loss_nan_ranks": 0, "loss_rank_avg": 0.3227095603942871, "step": 3140, "valid_targets_mean": 5091.1, "valid_targets_min": 379 }, { "epoch": 2.398932112890923, "grad_norm": 0.5366231607872158, "learning_rate": 3.324864948555215e-05, "loss": 0.3059, "loss_nan_ranks": 0, "loss_rank_avg": 0.31209537386894226, "step": 3145, "valid_targets_mean": 3523.9, "valid_targets_min": 497 }, { "epoch": 2.402745995423341, "grad_norm": 0.46305780755530407, "learning_rate": 3.3220130141467126e-05, "loss": 0.32, "loss_nan_ranks": 0, "loss_rank_avg": 0.2822486460208893, "step": 3150, "valid_targets_mean": 4739.7, "valid_targets_min": 1556 }, { "epoch": 2.406559877955759, "grad_norm": 0.41772343288346137, "learning_rate": 3.319156297618744e-05, "loss": 0.305, "loss_nan_ranks": 0, "loss_rank_avg": 0.29450178146362305, "step": 3155, "valid_targets_mean": 4559.1, "valid_targets_min": 1074 }, { "epoch": 2.410373760488177, "grad_norm": 0.4009891297301182, "learning_rate": 3.316294809304914e-05, "loss": 0.3083, "loss_nan_ranks": 0, "loss_rank_avg": 0.2615176737308502, "step": 3160, "valid_targets_mean": 4259.6, "valid_targets_min": 320 }, { "epoch": 2.414187643020595, "grad_norm": 0.5372736697822601, "learning_rate": 3.3134285595560884e-05, "loss": 0.3216, "loss_nan_ranks": 0, "loss_rank_avg": 0.3198303282260895, "step": 3165, "valid_targets_mean": 4708.5, "valid_targets_min": 1294 }, { "epoch": 2.418001525553013, "grad_norm": 0.5006156073841829, "learning_rate": 3.310557558740356e-05, "loss": 0.2938, "loss_nan_ranks": 0, "loss_rank_avg": 0.28113606572151184, "step": 3170, "valid_targets_mean": 3367.2, "valid_targets_min": 773 }, { "epoch": 2.421815408085431, "grad_norm": 0.5394294222955758, "learning_rate": 3.3076818172429925e-05, "loss": 0.324, "loss_nan_ranks": 0, "loss_rank_avg": 0.3090674579143524, "step": 3175, "valid_targets_mean": 3041.1, "valid_targets_min": 561 }, { "epoch": 2.425629290617849, "grad_norm": 0.3752343434469316, "learning_rate": 3.304801345466421e-05, "loss": 0.3102, "loss_nan_ranks": 0, "loss_rank_avg": 0.2914296090602875, "step": 3180, "valid_targets_mean": 5173.1, "valid_targets_min": 1182 }, { "epoch": 2.429443173150267, "grad_norm": 0.36719834272513013, "learning_rate": 3.301916153830175e-05, "loss": 0.2996, "loss_nan_ranks": 0, "loss_rank_avg": 0.2869374454021454, "step": 3185, "valid_targets_mean": 5752.6, "valid_targets_min": 1254 }, { "epoch": 2.433257055682685, "grad_norm": 0.46120148501188674, "learning_rate": 3.299026252770864e-05, "loss": 0.3163, "loss_nan_ranks": 0, "loss_rank_avg": 0.30976438522338867, "step": 3190, "valid_targets_mean": 4156.0, "valid_targets_min": 952 }, { "epoch": 2.437070938215103, "grad_norm": 0.4028904691522973, "learning_rate": 3.2961316527421297e-05, "loss": 0.2947, "loss_nan_ranks": 0, "loss_rank_avg": 0.2804625332355499, "step": 3195, "valid_targets_mean": 5134.5, "valid_targets_min": 939 }, { "epoch": 2.440884820747521, "grad_norm": 0.42739158339434313, "learning_rate": 3.293232364214613e-05, "loss": 0.3028, "loss_nan_ranks": 0, "loss_rank_avg": 0.2903222441673279, "step": 3200, "valid_targets_mean": 4225.7, "valid_targets_min": 1532 }, { "epoch": 2.444698703279939, "grad_norm": 0.4120940942202485, "learning_rate": 3.2903283976759154e-05, "loss": 0.2949, "loss_nan_ranks": 0, "loss_rank_avg": 0.3225897550582886, "step": 3205, "valid_targets_mean": 4823.2, "valid_targets_min": 1258 }, { "epoch": 2.448512585812357, "grad_norm": 0.4438438890063094, "learning_rate": 3.287419763630557e-05, "loss": 0.3073, "loss_nan_ranks": 0, "loss_rank_avg": 0.3097473680973053, "step": 3210, "valid_targets_mean": 4313.7, "valid_targets_min": 1132 }, { "epoch": 2.4523264683447747, "grad_norm": 0.454562761903692, "learning_rate": 3.284506472599946e-05, "loss": 0.3048, "loss_nan_ranks": 0, "loss_rank_avg": 0.27896568179130554, "step": 3215, "valid_targets_mean": 3983.9, "valid_targets_min": 376 }, { "epoch": 2.456140350877193, "grad_norm": 0.41734956806317247, "learning_rate": 3.281588535122331e-05, "loss": 0.302, "loss_nan_ranks": 0, "loss_rank_avg": 0.3313711881637573, "step": 3220, "valid_targets_mean": 4768.2, "valid_targets_min": 1079 }, { "epoch": 2.459954233409611, "grad_norm": 0.4050882230027488, "learning_rate": 3.278665961752774e-05, "loss": 0.3107, "loss_nan_ranks": 0, "loss_rank_avg": 0.3018350601196289, "step": 3225, "valid_targets_mean": 4809.2, "valid_targets_min": 1149 }, { "epoch": 2.463768115942029, "grad_norm": 0.44512875562523363, "learning_rate": 3.2757387630631015e-05, "loss": 0.3203, "loss_nan_ranks": 0, "loss_rank_avg": 0.3171129822731018, "step": 3230, "valid_targets_mean": 4194.5, "valid_targets_min": 1214 }, { "epoch": 2.467581998474447, "grad_norm": 0.4318883742701634, "learning_rate": 3.272806949641875e-05, "loss": 0.3282, "loss_nan_ranks": 0, "loss_rank_avg": 0.30675944685935974, "step": 3235, "valid_targets_mean": 4495.5, "valid_targets_min": 1280 }, { "epoch": 2.471395881006865, "grad_norm": 0.5127454111107679, "learning_rate": 3.269870532094346e-05, "loss": 0.3211, "loss_nan_ranks": 0, "loss_rank_avg": 0.305593341588974, "step": 3240, "valid_targets_mean": 4044.5, "valid_targets_min": 852 }, { "epoch": 2.475209763539283, "grad_norm": 0.44932328995702725, "learning_rate": 3.2669295210424216e-05, "loss": 0.3151, "loss_nan_ranks": 0, "loss_rank_avg": 0.3079918920993805, "step": 3245, "valid_targets_mean": 4045.1, "valid_targets_min": 829 }, { "epoch": 2.479023646071701, "grad_norm": 0.4248740581634684, "learning_rate": 3.263983927124626e-05, "loss": 0.32, "loss_nan_ranks": 0, "loss_rank_avg": 0.3253237307071686, "step": 3250, "valid_targets_mean": 4557.6, "valid_targets_min": 1362 }, { "epoch": 2.482837528604119, "grad_norm": 0.47524928688800416, "learning_rate": 3.26103376099606e-05, "loss": 0.3209, "loss_nan_ranks": 0, "loss_rank_avg": 0.33182817697525024, "step": 3255, "valid_targets_mean": 4120.5, "valid_targets_min": 288 }, { "epoch": 2.486651411136537, "grad_norm": 0.4013284951011599, "learning_rate": 3.258079033328362e-05, "loss": 0.2946, "loss_nan_ranks": 0, "loss_rank_avg": 0.2935488522052765, "step": 3260, "valid_targets_mean": 5461.8, "valid_targets_min": 699 }, { "epoch": 2.490465293668955, "grad_norm": 0.4560281553599727, "learning_rate": 3.255119754809674e-05, "loss": 0.3128, "loss_nan_ranks": 0, "loss_rank_avg": 0.3281641900539398, "step": 3265, "valid_targets_mean": 3976.6, "valid_targets_min": 1316 }, { "epoch": 2.494279176201373, "grad_norm": 0.4194313669939143, "learning_rate": 3.252155936144598e-05, "loss": 0.3086, "loss_nan_ranks": 0, "loss_rank_avg": 0.2913791835308075, "step": 3270, "valid_targets_mean": 4450.8, "valid_targets_min": 802 }, { "epoch": 2.498093058733791, "grad_norm": 1.2583919640663648, "learning_rate": 3.249187588054158e-05, "loss": 0.4749, "loss_nan_ranks": 0, "loss_rank_avg": 0.5555517673492432, "step": 3275, "valid_targets_mean": 802.0, "valid_targets_min": 573 }, { "epoch": 2.501906941266209, "grad_norm": 0.4182243002509812, "learning_rate": 3.246214721275765e-05, "loss": 0.3603, "loss_nan_ranks": 0, "loss_rank_avg": 0.2573336064815521, "step": 3280, "valid_targets_mean": 4969.2, "valid_targets_min": 1564 }, { "epoch": 2.505720823798627, "grad_norm": 0.45724501654045097, "learning_rate": 3.2432373465631735e-05, "loss": 0.3116, "loss_nan_ranks": 0, "loss_rank_avg": 0.3165568709373474, "step": 3285, "valid_targets_mean": 4297.0, "valid_targets_min": 514 }, { "epoch": 2.509534706331045, "grad_norm": 0.5092081567329626, "learning_rate": 3.240255474686445e-05, "loss": 0.3119, "loss_nan_ranks": 0, "loss_rank_avg": 0.3316061198711395, "step": 3290, "valid_targets_mean": 3906.4, "valid_targets_min": 312 }, { "epoch": 2.513348588863463, "grad_norm": 0.4128558996686412, "learning_rate": 3.23726911643191e-05, "loss": 0.2974, "loss_nan_ranks": 0, "loss_rank_avg": 0.3001715838909149, "step": 3295, "valid_targets_mean": 4967.5, "valid_targets_min": 1778 }, { "epoch": 2.517162471395881, "grad_norm": 0.3938186280656715, "learning_rate": 3.234278282602124e-05, "loss": 0.3114, "loss_nan_ranks": 0, "loss_rank_avg": 0.2615433633327484, "step": 3300, "valid_targets_mean": 5320.2, "valid_targets_min": 1049 }, { "epoch": 2.520976353928299, "grad_norm": 0.4720418563543762, "learning_rate": 3.231282984015835e-05, "loss": 0.3178, "loss_nan_ranks": 0, "loss_rank_avg": 0.33653369545936584, "step": 3305, "valid_targets_mean": 4016.5, "valid_targets_min": 296 }, { "epoch": 2.524790236460717, "grad_norm": 0.4267496748398417, "learning_rate": 3.228283231507942e-05, "loss": 0.3148, "loss_nan_ranks": 0, "loss_rank_avg": 0.33910393714904785, "step": 3310, "valid_targets_mean": 4726.3, "valid_targets_min": 964 }, { "epoch": 2.528604118993135, "grad_norm": 0.4311391044080387, "learning_rate": 3.225279035929452e-05, "loss": 0.3077, "loss_nan_ranks": 0, "loss_rank_avg": 0.2865217924118042, "step": 3315, "valid_targets_mean": 4205.9, "valid_targets_min": 1404 }, { "epoch": 2.532418001525553, "grad_norm": 0.43520655150199683, "learning_rate": 3.222270408147447e-05, "loss": 0.3165, "loss_nan_ranks": 0, "loss_rank_avg": 0.3108452558517456, "step": 3320, "valid_targets_mean": 3981.0, "valid_targets_min": 1039 }, { "epoch": 2.536231884057971, "grad_norm": 0.41681559543008706, "learning_rate": 3.219257359045039e-05, "loss": 0.2954, "loss_nan_ranks": 0, "loss_rank_avg": 0.3192494213581085, "step": 3325, "valid_targets_mean": 4327.1, "valid_targets_min": 1317 }, { "epoch": 2.540045766590389, "grad_norm": 0.4184490891131059, "learning_rate": 3.2162398995213355e-05, "loss": 0.3132, "loss_nan_ranks": 0, "loss_rank_avg": 0.3283292353153229, "step": 3330, "valid_targets_mean": 4665.3, "valid_targets_min": 1543 }, { "epoch": 2.543859649122807, "grad_norm": 0.4100215088411221, "learning_rate": 3.213218040491397e-05, "loss": 0.3029, "loss_nan_ranks": 0, "loss_rank_avg": 0.32542848587036133, "step": 3335, "valid_targets_mean": 5202.1, "valid_targets_min": 1795 }, { "epoch": 2.5476735316552253, "grad_norm": 0.4581780551039809, "learning_rate": 3.2101917928861986e-05, "loss": 0.3327, "loss_nan_ranks": 0, "loss_rank_avg": 0.3427410423755646, "step": 3340, "valid_targets_mean": 4036.1, "valid_targets_min": 729 }, { "epoch": 2.551487414187643, "grad_norm": 0.46035481912473103, "learning_rate": 3.207161167652589e-05, "loss": 0.3126, "loss_nan_ranks": 0, "loss_rank_avg": 0.3007487952709198, "step": 3345, "valid_targets_mean": 4143.8, "valid_targets_min": 894 }, { "epoch": 2.555301296720061, "grad_norm": 0.4034052276373605, "learning_rate": 3.204126175753253e-05, "loss": 0.3073, "loss_nan_ranks": 0, "loss_rank_avg": 0.30226239562034607, "step": 3350, "valid_targets_mean": 4929.1, "valid_targets_min": 859 }, { "epoch": 2.559115179252479, "grad_norm": 0.45042067980684486, "learning_rate": 3.201086828166672e-05, "loss": 0.313, "loss_nan_ranks": 0, "loss_rank_avg": 0.30956992506980896, "step": 3355, "valid_targets_mean": 3947.8, "valid_targets_min": 300 }, { "epoch": 2.5629290617848968, "grad_norm": 0.4208797502147041, "learning_rate": 3.1980431358870805e-05, "loss": 0.3331, "loss_nan_ranks": 0, "loss_rank_avg": 0.3373583257198334, "step": 3360, "valid_targets_mean": 5164.8, "valid_targets_min": 1035 }, { "epoch": 2.566742944317315, "grad_norm": 0.4139965067629496, "learning_rate": 3.1949951099244326e-05, "loss": 0.2825, "loss_nan_ranks": 0, "loss_rank_avg": 0.26954910159111023, "step": 3365, "valid_targets_mean": 4530.2, "valid_targets_min": 1172 }, { "epoch": 2.570556826849733, "grad_norm": 0.4073002785523478, "learning_rate": 3.191942761304355e-05, "loss": 0.3225, "loss_nan_ranks": 0, "loss_rank_avg": 0.2845797538757324, "step": 3370, "valid_targets_mean": 5883.5, "valid_targets_min": 1762 }, { "epoch": 2.5743707093821513, "grad_norm": 0.5005794736670965, "learning_rate": 3.188886101068113e-05, "loss": 0.3093, "loss_nan_ranks": 0, "loss_rank_avg": 0.33116093277931213, "step": 3375, "valid_targets_mean": 3936.8, "valid_targets_min": 972 }, { "epoch": 2.578184591914569, "grad_norm": 0.39563461531335153, "learning_rate": 3.185825140272569e-05, "loss": 0.3134, "loss_nan_ranks": 0, "loss_rank_avg": 0.31638863682746887, "step": 3380, "valid_targets_mean": 5078.9, "valid_targets_min": 946 }, { "epoch": 2.581998474446987, "grad_norm": 0.38103153537461776, "learning_rate": 3.1827598899901384e-05, "loss": 0.3197, "loss_nan_ranks": 0, "loss_rank_avg": 0.32187706232070923, "step": 3385, "valid_targets_mean": 5218.0, "valid_targets_min": 1187 }, { "epoch": 2.585812356979405, "grad_norm": 0.4592422549331716, "learning_rate": 3.179690361308757e-05, "loss": 0.3347, "loss_nan_ranks": 0, "loss_rank_avg": 0.3470957279205322, "step": 3390, "valid_targets_mean": 4527.9, "valid_targets_min": 498 }, { "epoch": 2.589626239511823, "grad_norm": 0.4242232229533466, "learning_rate": 3.1766165653318354e-05, "loss": 0.2836, "loss_nan_ranks": 0, "loss_rank_avg": 0.3074164390563965, "step": 3395, "valid_targets_mean": 4345.0, "valid_targets_min": 933 }, { "epoch": 2.593440122044241, "grad_norm": 0.4249779377292946, "learning_rate": 3.173538513178218e-05, "loss": 0.2894, "loss_nan_ranks": 0, "loss_rank_avg": 0.2875068187713623, "step": 3400, "valid_targets_mean": 4543.5, "valid_targets_min": 1172 }, { "epoch": 2.597254004576659, "grad_norm": 0.4274365869571573, "learning_rate": 3.170456215982149e-05, "loss": 0.3068, "loss_nan_ranks": 0, "loss_rank_avg": 0.30450737476348877, "step": 3405, "valid_targets_mean": 4374.2, "valid_targets_min": 1202 }, { "epoch": 2.601067887109077, "grad_norm": 0.45198819209554214, "learning_rate": 3.167369684893224e-05, "loss": 0.3193, "loss_nan_ranks": 0, "loss_rank_avg": 0.29094013571739197, "step": 3410, "valid_targets_mean": 4171.3, "valid_targets_min": 607 }, { "epoch": 2.604881769641495, "grad_norm": 0.3965480485903044, "learning_rate": 3.164278931076358e-05, "loss": 0.2899, "loss_nan_ranks": 0, "loss_rank_avg": 0.2770211398601532, "step": 3415, "valid_targets_mean": 5058.5, "valid_targets_min": 1084 }, { "epoch": 2.608695652173913, "grad_norm": 0.545185315512466, "learning_rate": 3.161183965711738e-05, "loss": 0.2983, "loss_nan_ranks": 0, "loss_rank_avg": 0.3102641701698303, "step": 3420, "valid_targets_mean": 2958.9, "valid_targets_min": 526 }, { "epoch": 2.612509534706331, "grad_norm": 0.4525570772787872, "learning_rate": 3.158084799994787e-05, "loss": 0.3095, "loss_nan_ranks": 0, "loss_rank_avg": 0.27811145782470703, "step": 3425, "valid_targets_mean": 4219.3, "valid_targets_min": 1192 }, { "epoch": 2.616323417238749, "grad_norm": 0.4151885367952925, "learning_rate": 3.154981445136121e-05, "loss": 0.3081, "loss_nan_ranks": 0, "loss_rank_avg": 0.30080297589302063, "step": 3430, "valid_targets_mean": 4943.1, "valid_targets_min": 1128 }, { "epoch": 2.620137299771167, "grad_norm": 0.4653213080790013, "learning_rate": 3.15187391236151e-05, "loss": 0.3064, "loss_nan_ranks": 0, "loss_rank_avg": 0.3620241582393646, "step": 3435, "valid_targets_mean": 4422.7, "valid_targets_min": 1005 }, { "epoch": 2.623951182303585, "grad_norm": 1.4191783668873799, "learning_rate": 3.148762212911837e-05, "loss": 0.4368, "loss_nan_ranks": 0, "loss_rank_avg": 0.6156240105628967, "step": 3440, "valid_targets_mean": 883.6, "valid_targets_min": 580 }, { "epoch": 2.627765064836003, "grad_norm": 0.48590288960795086, "learning_rate": 3.145646358043055e-05, "loss": 0.4271, "loss_nan_ranks": 0, "loss_rank_avg": 0.34322547912597656, "step": 3445, "valid_targets_mean": 4622.9, "valid_targets_min": 812 }, { "epoch": 2.6315789473684212, "grad_norm": 0.4771826596173598, "learning_rate": 3.1425263590261514e-05, "loss": 0.2979, "loss_nan_ranks": 0, "loss_rank_avg": 0.32992804050445557, "step": 3450, "valid_targets_mean": 4304.2, "valid_targets_min": 883 }, { "epoch": 2.635392829900839, "grad_norm": 1.5209723851975487, "learning_rate": 3.139402227147103e-05, "loss": 0.3126, "loss_nan_ranks": 0, "loss_rank_avg": 0.33348479866981506, "step": 3455, "valid_targets_mean": 4633.4, "valid_targets_min": 465 }, { "epoch": 2.639206712433257, "grad_norm": 0.5310761075855137, "learning_rate": 3.136273973706835e-05, "loss": 0.3016, "loss_nan_ranks": 0, "loss_rank_avg": 0.2709449231624603, "step": 3460, "valid_targets_mean": 3417.8, "valid_targets_min": 1029 }, { "epoch": 2.643020594965675, "grad_norm": 0.43586930927383066, "learning_rate": 3.133141610021184e-05, "loss": 0.2852, "loss_nan_ranks": 0, "loss_rank_avg": 0.2855277955532074, "step": 3465, "valid_targets_mean": 4236.7, "valid_targets_min": 1145 }, { "epoch": 2.646834477498093, "grad_norm": 0.4567606109152964, "learning_rate": 3.1300051474208524e-05, "loss": 0.313, "loss_nan_ranks": 0, "loss_rank_avg": 0.2981013059616089, "step": 3470, "valid_targets_mean": 4365.1, "valid_targets_min": 1106 }, { "epoch": 2.650648360030511, "grad_norm": 0.40779512282622354, "learning_rate": 3.126864597251371e-05, "loss": 0.325, "loss_nan_ranks": 0, "loss_rank_avg": 0.3078835904598236, "step": 3475, "valid_targets_mean": 5027.8, "valid_targets_min": 1074 }, { "epoch": 2.654462242562929, "grad_norm": 0.4536802053876773, "learning_rate": 3.123719970873057e-05, "loss": 0.3153, "loss_nan_ranks": 0, "loss_rank_avg": 0.3421435058116913, "step": 3480, "valid_targets_mean": 4348.9, "valid_targets_min": 1020 }, { "epoch": 2.6582761250953473, "grad_norm": 0.45825952562012484, "learning_rate": 3.120571279660971e-05, "loss": 0.3034, "loss_nan_ranks": 0, "loss_rank_avg": 0.28770169615745544, "step": 3485, "valid_targets_mean": 3902.5, "valid_targets_min": 1043 }, { "epoch": 2.662090007627765, "grad_norm": 0.47396470274603764, "learning_rate": 3.1174185350048776e-05, "loss": 0.2921, "loss_nan_ranks": 0, "loss_rank_avg": 0.27201271057128906, "step": 3490, "valid_targets_mean": 3508.6, "valid_targets_min": 818 }, { "epoch": 2.665903890160183, "grad_norm": 0.42584203050280256, "learning_rate": 3.114261748309205e-05, "loss": 0.3035, "loss_nan_ranks": 0, "loss_rank_avg": 0.2914293110370636, "step": 3495, "valid_targets_mean": 4368.4, "valid_targets_min": 1077 }, { "epoch": 2.669717772692601, "grad_norm": 0.4556486758423126, "learning_rate": 3.111100930993002e-05, "loss": 0.3027, "loss_nan_ranks": 0, "loss_rank_avg": 0.26826319098472595, "step": 3500, "valid_targets_mean": 3759.3, "valid_targets_min": 862 }, { "epoch": 2.6735316552250192, "grad_norm": 0.4313304144373171, "learning_rate": 3.107936094489897e-05, "loss": 0.317, "loss_nan_ranks": 0, "loss_rank_avg": 0.337573379278183, "step": 3505, "valid_targets_mean": 4508.1, "valid_targets_min": 1212 }, { "epoch": 2.677345537757437, "grad_norm": 0.503822426279713, "learning_rate": 3.104767250248056e-05, "loss": 0.2927, "loss_nan_ranks": 0, "loss_rank_avg": 0.29460129141807556, "step": 3510, "valid_targets_mean": 3213.6, "valid_targets_min": 1394 }, { "epoch": 2.681159420289855, "grad_norm": 0.443539023387382, "learning_rate": 3.101594409730146e-05, "loss": 0.3, "loss_nan_ranks": 0, "loss_rank_avg": 0.3758798837661743, "step": 3515, "valid_targets_mean": 5032.7, "valid_targets_min": 854 }, { "epoch": 2.6849733028222733, "grad_norm": 0.41385413645152297, "learning_rate": 3.098417584413286e-05, "loss": 0.283, "loss_nan_ranks": 0, "loss_rank_avg": 0.24815471470355988, "step": 3520, "valid_targets_mean": 4305.5, "valid_targets_min": 785 }, { "epoch": 2.688787185354691, "grad_norm": 0.46687358767596643, "learning_rate": 3.0952367857890116e-05, "loss": 0.2956, "loss_nan_ranks": 0, "loss_rank_avg": 0.29929205775260925, "step": 3525, "valid_targets_mean": 3941.3, "valid_targets_min": 472 }, { "epoch": 2.692601067887109, "grad_norm": 0.4396263260549913, "learning_rate": 3.092052025363229e-05, "loss": 0.3058, "loss_nan_ranks": 0, "loss_rank_avg": 0.32522842288017273, "step": 3530, "valid_targets_mean": 4580.7, "valid_targets_min": 1340 }, { "epoch": 2.696414950419527, "grad_norm": 0.4680531415671467, "learning_rate": 3.0888633146561756e-05, "loss": 0.2969, "loss_nan_ranks": 0, "loss_rank_avg": 0.3260200023651123, "step": 3535, "valid_targets_mean": 4359.8, "valid_targets_min": 1293 }, { "epoch": 2.700228832951945, "grad_norm": 0.4542256878885209, "learning_rate": 3.0856706652023806e-05, "loss": 0.3007, "loss_nan_ranks": 0, "loss_rank_avg": 0.30608275532722473, "step": 3540, "valid_targets_mean": 4218.7, "valid_targets_min": 450 }, { "epoch": 2.704042715484363, "grad_norm": 0.545077179745613, "learning_rate": 3.082474088550619e-05, "loss": 0.3058, "loss_nan_ranks": 0, "loss_rank_avg": 0.3118705749511719, "step": 3545, "valid_targets_mean": 3472.2, "valid_targets_min": 417 }, { "epoch": 2.707856598016781, "grad_norm": 0.46674246079597687, "learning_rate": 3.079273596263871e-05, "loss": 0.3222, "loss_nan_ranks": 0, "loss_rank_avg": 0.3758425712585449, "step": 3550, "valid_targets_mean": 4451.0, "valid_targets_min": 875 }, { "epoch": 2.7116704805491993, "grad_norm": 0.4322217416895522, "learning_rate": 3.0760691999192815e-05, "loss": 0.2957, "loss_nan_ranks": 0, "loss_rank_avg": 0.267362117767334, "step": 3555, "valid_targets_mean": 4483.9, "valid_targets_min": 300 }, { "epoch": 2.7154843630816172, "grad_norm": 0.45976089928354635, "learning_rate": 3.072860911108119e-05, "loss": 0.2946, "loss_nan_ranks": 0, "loss_rank_avg": 0.29339703917503357, "step": 3560, "valid_targets_mean": 4354.7, "valid_targets_min": 1286 }, { "epoch": 2.719298245614035, "grad_norm": 0.3995874661946734, "learning_rate": 3.06964874143573e-05, "loss": 0.3123, "loss_nan_ranks": 0, "loss_rank_avg": 0.29337623715400696, "step": 3565, "valid_targets_mean": 5228.0, "valid_targets_min": 981 }, { "epoch": 2.723112128146453, "grad_norm": 0.4521775129579294, "learning_rate": 3.0664327025214996e-05, "loss": 0.2844, "loss_nan_ranks": 0, "loss_rank_avg": 0.29508697986602783, "step": 3570, "valid_targets_mean": 3820.0, "valid_targets_min": 878 }, { "epoch": 2.726926010678871, "grad_norm": 0.4276913646473351, "learning_rate": 3.063212805998812e-05, "loss": 0.3085, "loss_nan_ranks": 0, "loss_rank_avg": 0.3139476478099823, "step": 3575, "valid_targets_mean": 4368.1, "valid_targets_min": 1600 }, { "epoch": 2.730739893211289, "grad_norm": 0.4514060342213421, "learning_rate": 3.059989063515001e-05, "loss": 0.2996, "loss_nan_ranks": 0, "loss_rank_avg": 0.3006206452846527, "step": 3580, "valid_targets_mean": 3854.9, "valid_targets_min": 494 }, { "epoch": 2.734553775743707, "grad_norm": 0.4603411167652157, "learning_rate": 3.056761486731316e-05, "loss": 0.3168, "loss_nan_ranks": 0, "loss_rank_avg": 0.3349507749080658, "step": 3585, "valid_targets_mean": 4717.0, "valid_targets_min": 1189 }, { "epoch": 2.738367658276125, "grad_norm": 0.44757870922058896, "learning_rate": 3.053530087322874e-05, "loss": 0.2949, "loss_nan_ranks": 0, "loss_rank_avg": 0.3137572705745697, "step": 3590, "valid_targets_mean": 4155.7, "valid_targets_min": 1165 }, { "epoch": 2.7421815408085433, "grad_norm": 0.4427568139153059, "learning_rate": 3.0502948769786206e-05, "loss": 0.3196, "loss_nan_ranks": 0, "loss_rank_avg": 0.34423160552978516, "step": 3595, "valid_targets_mean": 4736.5, "valid_targets_min": 361 }, { "epoch": 2.745995423340961, "grad_norm": 0.427371158670119, "learning_rate": 3.047055867401287e-05, "loss": 0.3058, "loss_nan_ranks": 0, "loss_rank_avg": 0.270975798368454, "step": 3600, "valid_targets_mean": 4545.8, "valid_targets_min": 1154 }, { "epoch": 2.749809305873379, "grad_norm": 1.452402046964983, "learning_rate": 3.043813070307347e-05, "loss": 0.3669, "loss_nan_ranks": 0, "loss_rank_avg": 0.5670013427734375, "step": 3605, "valid_targets_mean": 850.0, "valid_targets_min": 591 }, { "epoch": 2.753623188405797, "grad_norm": 0.48169002835878383, "learning_rate": 3.0405664974269738e-05, "loss": 0.4169, "loss_nan_ranks": 0, "loss_rank_avg": 0.3203207850456238, "step": 3610, "valid_targets_mean": 4759.4, "valid_targets_min": 1427 }, { "epoch": 2.757437070938215, "grad_norm": 0.42776785443748766, "learning_rate": 3.037316160504001e-05, "loss": 0.3025, "loss_nan_ranks": 0, "loss_rank_avg": 0.30834314227104187, "step": 3615, "valid_targets_mean": 4934.1, "valid_targets_min": 1323 }, { "epoch": 2.761250953470633, "grad_norm": 0.4070539421650789, "learning_rate": 3.0340620712958765e-05, "loss": 0.3009, "loss_nan_ranks": 0, "loss_rank_avg": 0.30431488156318665, "step": 3620, "valid_targets_mean": 5120.2, "valid_targets_min": 1434 }, { "epoch": 2.765064836003051, "grad_norm": 0.41518918429874707, "learning_rate": 3.0308042415736215e-05, "loss": 0.3046, "loss_nan_ranks": 0, "loss_rank_avg": 0.3664722442626953, "step": 3625, "valid_targets_mean": 5194.8, "valid_targets_min": 1098 }, { "epoch": 2.7688787185354693, "grad_norm": 0.4102430332242187, "learning_rate": 3.0275426831217883e-05, "loss": 0.3137, "loss_nan_ranks": 0, "loss_rank_avg": 0.33445557951927185, "step": 3630, "valid_targets_mean": 5132.5, "valid_targets_min": 1481 }, { "epoch": 2.772692601067887, "grad_norm": 0.4735233795742744, "learning_rate": 3.024277407738416e-05, "loss": 0.3099, "loss_nan_ranks": 0, "loss_rank_avg": 0.2750890254974365, "step": 3635, "valid_targets_mean": 3928.4, "valid_targets_min": 1393 }, { "epoch": 2.776506483600305, "grad_norm": 0.42393895318486075, "learning_rate": 3.02100842723499e-05, "loss": 0.2959, "loss_nan_ranks": 0, "loss_rank_avg": 0.33074259757995605, "step": 3640, "valid_targets_mean": 4961.6, "valid_targets_min": 1262 }, { "epoch": 2.780320366132723, "grad_norm": 0.39335349576447576, "learning_rate": 3.017735753436398e-05, "loss": 0.2968, "loss_nan_ranks": 0, "loss_rank_avg": 0.31892308592796326, "step": 3645, "valid_targets_mean": 5054.6, "valid_targets_min": 967 }, { "epoch": 2.7841342486651413, "grad_norm": 0.4374520203995769, "learning_rate": 3.0144593981808863e-05, "loss": 0.2915, "loss_nan_ranks": 0, "loss_rank_avg": 0.2934619188308716, "step": 3650, "valid_targets_mean": 4071.9, "valid_targets_min": 1746 }, { "epoch": 2.787948131197559, "grad_norm": 0.41212055790255153, "learning_rate": 3.0111793733200213e-05, "loss": 0.2933, "loss_nan_ranks": 0, "loss_rank_avg": 0.28573447465896606, "step": 3655, "valid_targets_mean": 4861.4, "valid_targets_min": 964 }, { "epoch": 2.791762013729977, "grad_norm": 0.4177575764120052, "learning_rate": 3.0078956907186396e-05, "loss": 0.279, "loss_nan_ranks": 0, "loss_rank_avg": 0.2791755795478821, "step": 3660, "valid_targets_mean": 4278.7, "valid_targets_min": 760 }, { "epoch": 2.7955758962623953, "grad_norm": 0.4328653362766987, "learning_rate": 3.0046083622548115e-05, "loss": 0.3115, "loss_nan_ranks": 0, "loss_rank_avg": 0.2922763526439667, "step": 3665, "valid_targets_mean": 4501.5, "valid_targets_min": 1257 }, { "epoch": 2.799389778794813, "grad_norm": 0.4311685870770303, "learning_rate": 3.0013173998197946e-05, "loss": 0.3077, "loss_nan_ranks": 0, "loss_rank_avg": 0.3213293254375458, "step": 3670, "valid_targets_mean": 4659.9, "valid_targets_min": 1254 }, { "epoch": 2.803203661327231, "grad_norm": 0.4739213958170537, "learning_rate": 2.9980228153179913e-05, "loss": 0.277, "loss_nan_ranks": 0, "loss_rank_avg": 0.30476173758506775, "step": 3675, "valid_targets_mean": 4565.8, "valid_targets_min": 1223 }, { "epoch": 2.807017543859649, "grad_norm": 0.4101207028641973, "learning_rate": 2.9947246206669076e-05, "loss": 0.3114, "loss_nan_ranks": 0, "loss_rank_avg": 0.3138103783130646, "step": 3680, "valid_targets_mean": 4624.6, "valid_targets_min": 1362 }, { "epoch": 2.8108314263920673, "grad_norm": 0.48502558987531175, "learning_rate": 2.9914228277971062e-05, "loss": 0.3113, "loss_nan_ranks": 0, "loss_rank_avg": 0.3027869164943695, "step": 3685, "valid_targets_mean": 4354.0, "valid_targets_min": 990 }, { "epoch": 2.814645308924485, "grad_norm": 0.4699784328853892, "learning_rate": 2.988117448652168e-05, "loss": 0.2852, "loss_nan_ranks": 0, "loss_rank_avg": 0.28289732336997986, "step": 3690, "valid_targets_mean": 3449.4, "valid_targets_min": 1076 }, { "epoch": 2.818459191456903, "grad_norm": 0.42719126112782174, "learning_rate": 2.9848084951886447e-05, "loss": 0.3072, "loss_nan_ranks": 0, "loss_rank_avg": 0.29756590723991394, "step": 3695, "valid_targets_mean": 4744.5, "valid_targets_min": 543 }, { "epoch": 2.8222730739893214, "grad_norm": 0.4756799163785362, "learning_rate": 2.9814959793760185e-05, "loss": 0.2853, "loss_nan_ranks": 0, "loss_rank_avg": 0.3334232270717621, "step": 3700, "valid_targets_mean": 4507.8, "valid_targets_min": 1165 }, { "epoch": 2.8260869565217392, "grad_norm": 0.42435957538086944, "learning_rate": 2.9781799131966575e-05, "loss": 0.3036, "loss_nan_ranks": 0, "loss_rank_avg": 0.34517112374305725, "step": 3705, "valid_targets_mean": 5040.6, "valid_targets_min": 1024 }, { "epoch": 2.829900839054157, "grad_norm": 0.4183943383548955, "learning_rate": 2.974860308645772e-05, "loss": 0.3189, "loss_nan_ranks": 0, "loss_rank_avg": 0.2884375751018524, "step": 3710, "valid_targets_mean": 4425.5, "valid_targets_min": 1392 }, { "epoch": 2.833714721586575, "grad_norm": 0.45371760515340676, "learning_rate": 2.9715371777313727e-05, "loss": 0.3109, "loss_nan_ranks": 0, "loss_rank_avg": 0.3239792287349701, "step": 3715, "valid_targets_mean": 4472.9, "valid_targets_min": 842 }, { "epoch": 2.837528604118993, "grad_norm": 0.42123373483544757, "learning_rate": 2.9682105324742246e-05, "loss": 0.2834, "loss_nan_ranks": 0, "loss_rank_avg": 0.30317559838294983, "step": 3720, "valid_targets_mean": 4990.8, "valid_targets_min": 1136 }, { "epoch": 2.841342486651411, "grad_norm": 0.40908457717851815, "learning_rate": 2.9648803849078062e-05, "loss": 0.2994, "loss_nan_ranks": 0, "loss_rank_avg": 0.2726430594921112, "step": 3725, "valid_targets_mean": 4901.2, "valid_targets_min": 1492 }, { "epoch": 2.845156369183829, "grad_norm": 0.5131351131948333, "learning_rate": 2.9615467470782658e-05, "loss": 0.3129, "loss_nan_ranks": 0, "loss_rank_avg": 0.32720550894737244, "step": 3730, "valid_targets_mean": 3929.0, "valid_targets_min": 424 }, { "epoch": 2.8489702517162474, "grad_norm": 0.4560432871680669, "learning_rate": 2.9582096310443753e-05, "loss": 0.2824, "loss_nan_ranks": 0, "loss_rank_avg": 0.27139559388160706, "step": 3735, "valid_targets_mean": 3375.7, "valid_targets_min": 554 }, { "epoch": 2.8527841342486653, "grad_norm": 0.464944255448322, "learning_rate": 2.9548690488774883e-05, "loss": 0.315, "loss_nan_ranks": 0, "loss_rank_avg": 0.30860528349876404, "step": 3740, "valid_targets_mean": 4120.4, "valid_targets_min": 848 }, { "epoch": 2.856598016781083, "grad_norm": 0.4357985611831835, "learning_rate": 2.9515250126614988e-05, "loss": 0.3049, "loss_nan_ranks": 0, "loss_rank_avg": 0.2578648626804352, "step": 3745, "valid_targets_mean": 4417.2, "valid_targets_min": 1523 }, { "epoch": 2.860411899313501, "grad_norm": 0.4555909983730694, "learning_rate": 2.948177534492793e-05, "loss": 0.3138, "loss_nan_ranks": 0, "loss_rank_avg": 0.3738441467285156, "step": 3750, "valid_targets_mean": 5224.7, "valid_targets_min": 1249 }, { "epoch": 2.864225781845919, "grad_norm": 0.4515471831618389, "learning_rate": 2.944826626480208e-05, "loss": 0.3047, "loss_nan_ranks": 0, "loss_rank_avg": 0.27258816361427307, "step": 3755, "valid_targets_mean": 3902.9, "valid_targets_min": 1391 }, { "epoch": 2.8680396643783372, "grad_norm": 0.4356700442556603, "learning_rate": 2.9414723007449876e-05, "loss": 0.2966, "loss_nan_ranks": 0, "loss_rank_avg": 0.3169298768043518, "step": 3760, "valid_targets_mean": 4445.8, "valid_targets_min": 1054 }, { "epoch": 2.871853546910755, "grad_norm": 0.4477854060376825, "learning_rate": 2.938114569420739e-05, "loss": 0.3186, "loss_nan_ranks": 0, "loss_rank_avg": 0.3050214350223541, "step": 3765, "valid_targets_mean": 4350.8, "valid_targets_min": 1397 }, { "epoch": 2.875667429443173, "grad_norm": 1.498343127858281, "learning_rate": 2.934753444653389e-05, "loss": 0.3958, "loss_nan_ranks": 0, "loss_rank_avg": 0.5911208391189575, "step": 3770, "valid_targets_mean": 914.1, "valid_targets_min": 588 }, { "epoch": 2.8794813119755913, "grad_norm": 0.46199008167543115, "learning_rate": 2.9313889386011373e-05, "loss": 0.4099, "loss_nan_ranks": 0, "loss_rank_avg": 0.3243425786495209, "step": 3775, "valid_targets_mean": 4639.8, "valid_targets_min": 1284 }, { "epoch": 2.883295194508009, "grad_norm": 0.443878665174957, "learning_rate": 2.9280210634344172e-05, "loss": 0.2982, "loss_nan_ranks": 0, "loss_rank_avg": 0.30592426657676697, "step": 3780, "valid_targets_mean": 4357.5, "valid_targets_min": 1020 }, { "epoch": 2.887109077040427, "grad_norm": 0.4237997285481469, "learning_rate": 2.924649831335848e-05, "loss": 0.298, "loss_nan_ranks": 0, "loss_rank_avg": 0.26578041911125183, "step": 3785, "valid_targets_mean": 4502.4, "valid_targets_min": 1004 }, { "epoch": 2.890922959572845, "grad_norm": 0.4445408846354412, "learning_rate": 2.9212752545001925e-05, "loss": 0.3044, "loss_nan_ranks": 0, "loss_rank_avg": 0.3063945174217224, "step": 3790, "valid_targets_mean": 4339.8, "valid_targets_min": 930 }, { "epoch": 2.8947368421052633, "grad_norm": 0.4220627608061861, "learning_rate": 2.917897345134311e-05, "loss": 0.3081, "loss_nan_ranks": 0, "loss_rank_avg": 0.3011779487133026, "step": 3795, "valid_targets_mean": 4646.5, "valid_targets_min": 1421 }, { "epoch": 2.898550724637681, "grad_norm": 0.4253729735024821, "learning_rate": 2.9145161154571204e-05, "loss": 0.3009, "loss_nan_ranks": 0, "loss_rank_avg": 0.31455233693122864, "step": 3800, "valid_targets_mean": 4599.2, "valid_targets_min": 832 }, { "epoch": 2.902364607170099, "grad_norm": 0.4086984176466762, "learning_rate": 2.9111315776995474e-05, "loss": 0.3024, "loss_nan_ranks": 0, "loss_rank_avg": 0.28731080889701843, "step": 3805, "valid_targets_mean": 4735.2, "valid_targets_min": 826 }, { "epoch": 2.9061784897025174, "grad_norm": 0.4325378865974398, "learning_rate": 2.907743744104485e-05, "loss": 0.3131, "loss_nan_ranks": 0, "loss_rank_avg": 0.2914287745952606, "step": 3810, "valid_targets_mean": 4252.8, "valid_targets_min": 1127 }, { "epoch": 2.9099923722349352, "grad_norm": 0.4750481419343565, "learning_rate": 2.9043526269267476e-05, "loss": 0.3086, "loss_nan_ranks": 0, "loss_rank_avg": 0.324870765209198, "step": 3815, "valid_targets_mean": 3894.4, "valid_targets_min": 1215 }, { "epoch": 2.913806254767353, "grad_norm": 0.4681688455199492, "learning_rate": 2.9009582384330285e-05, "loss": 0.3086, "loss_nan_ranks": 0, "loss_rank_avg": 0.3059101402759552, "step": 3820, "valid_targets_mean": 4010.4, "valid_targets_min": 481 }, { "epoch": 2.917620137299771, "grad_norm": 0.4279954633684007, "learning_rate": 2.897560590901854e-05, "loss": 0.3054, "loss_nan_ranks": 0, "loss_rank_avg": 0.3050711452960968, "step": 3825, "valid_targets_mean": 4967.6, "valid_targets_min": 1270 }, { "epoch": 2.9214340198321893, "grad_norm": 0.4097007390277408, "learning_rate": 2.894159696623539e-05, "loss": 0.2998, "loss_nan_ranks": 0, "loss_rank_avg": 0.2968205511569977, "step": 3830, "valid_targets_mean": 5721.0, "valid_targets_min": 1628 }, { "epoch": 2.925247902364607, "grad_norm": 0.44134858980535835, "learning_rate": 2.8907555679001422e-05, "loss": 0.3093, "loss_nan_ranks": 0, "loss_rank_avg": 0.3263862133026123, "step": 3835, "valid_targets_mean": 4728.2, "valid_targets_min": 1357 }, { "epoch": 2.929061784897025, "grad_norm": 0.4782226338188455, "learning_rate": 2.8873482170454242e-05, "loss": 0.2989, "loss_nan_ranks": 0, "loss_rank_avg": 0.3298240602016449, "step": 3840, "valid_targets_mean": 3894.2, "valid_targets_min": 1206 }, { "epoch": 2.9328756674294434, "grad_norm": 0.4034262588335436, "learning_rate": 2.8839376563847995e-05, "loss": 0.3098, "loss_nan_ranks": 0, "loss_rank_avg": 0.2946132719516754, "step": 3845, "valid_targets_mean": 4810.2, "valid_targets_min": 1163 }, { "epoch": 2.9366895499618613, "grad_norm": 0.45988183381124215, "learning_rate": 2.880523898255293e-05, "loss": 0.3111, "loss_nan_ranks": 0, "loss_rank_avg": 0.35728612542152405, "step": 3850, "valid_targets_mean": 4159.2, "valid_targets_min": 1360 }, { "epoch": 2.940503432494279, "grad_norm": 0.43358117533596885, "learning_rate": 2.877106955005498e-05, "loss": 0.3013, "loss_nan_ranks": 0, "loss_rank_avg": 0.3028857111930847, "step": 3855, "valid_targets_mean": 4309.5, "valid_targets_min": 387 }, { "epoch": 2.944317315026697, "grad_norm": 0.47832181313680316, "learning_rate": 2.8736868389955268e-05, "loss": 0.3081, "loss_nan_ranks": 0, "loss_rank_avg": 0.3072889745235443, "step": 3860, "valid_targets_mean": 3768.3, "valid_targets_min": 1367 }, { "epoch": 2.948131197559115, "grad_norm": 0.4028436185145172, "learning_rate": 2.8702635625969695e-05, "loss": 0.3009, "loss_nan_ranks": 0, "loss_rank_avg": 0.28554582595825195, "step": 3865, "valid_targets_mean": 4673.5, "valid_targets_min": 1133 }, { "epoch": 2.9519450800915332, "grad_norm": 0.448691951998679, "learning_rate": 2.8668371381928496e-05, "loss": 0.2919, "loss_nan_ranks": 0, "loss_rank_avg": 0.3088511526584625, "step": 3870, "valid_targets_mean": 4255.3, "valid_targets_min": 927 }, { "epoch": 2.955758962623951, "grad_norm": 0.4163765087317686, "learning_rate": 2.8634075781775763e-05, "loss": 0.2898, "loss_nan_ranks": 0, "loss_rank_avg": 0.292270690202713, "step": 3875, "valid_targets_mean": 4703.5, "valid_targets_min": 1051 }, { "epoch": 2.9595728451563694, "grad_norm": 0.39036304470600586, "learning_rate": 2.859974894956901e-05, "loss": 0.2886, "loss_nan_ranks": 0, "loss_rank_avg": 0.2601741850376129, "step": 3880, "valid_targets_mean": 4793.8, "valid_targets_min": 833 }, { "epoch": 2.9633867276887873, "grad_norm": 0.42515271525416554, "learning_rate": 2.8565391009478744e-05, "loss": 0.3105, "loss_nan_ranks": 0, "loss_rank_avg": 0.3349475860595703, "step": 3885, "valid_targets_mean": 4686.7, "valid_targets_min": 539 }, { "epoch": 2.967200610221205, "grad_norm": 0.4970234362822981, "learning_rate": 2.8531002085787985e-05, "loss": 0.2977, "loss_nan_ranks": 0, "loss_rank_avg": 0.32301023602485657, "step": 3890, "valid_targets_mean": 3944.5, "valid_targets_min": 1142 }, { "epoch": 2.971014492753623, "grad_norm": 0.42196977157148824, "learning_rate": 2.8496582302891824e-05, "loss": 0.3109, "loss_nan_ranks": 0, "loss_rank_avg": 0.27662238478660583, "step": 3895, "valid_targets_mean": 4858.2, "valid_targets_min": 1367 }, { "epoch": 2.974828375286041, "grad_norm": 0.47386191834873953, "learning_rate": 2.8462131785297003e-05, "loss": 0.2947, "loss_nan_ranks": 0, "loss_rank_avg": 0.30710312724113464, "step": 3900, "valid_targets_mean": 4201.6, "valid_targets_min": 1091 }, { "epoch": 2.9786422578184593, "grad_norm": 0.4299488991621925, "learning_rate": 2.8427650657621414e-05, "loss": 0.3092, "loss_nan_ranks": 0, "loss_rank_avg": 0.34638655185699463, "step": 3905, "valid_targets_mean": 5343.2, "valid_targets_min": 1217 }, { "epoch": 2.982456140350877, "grad_norm": 0.4249651616035499, "learning_rate": 2.8393139044593687e-05, "loss": 0.3048, "loss_nan_ranks": 0, "loss_rank_avg": 0.2586444318294525, "step": 3910, "valid_targets_mean": 4284.1, "valid_targets_min": 781 }, { "epoch": 2.9862700228832955, "grad_norm": 0.41092107449889226, "learning_rate": 2.8358597071052737e-05, "loss": 0.3026, "loss_nan_ranks": 0, "loss_rank_avg": 0.2768830955028534, "step": 3915, "valid_targets_mean": 4534.6, "valid_targets_min": 487 }, { "epoch": 2.9900839054157133, "grad_norm": 0.47463601161870095, "learning_rate": 2.8324024861947284e-05, "loss": 0.2989, "loss_nan_ranks": 0, "loss_rank_avg": 0.30442145466804504, "step": 3920, "valid_targets_mean": 3462.0, "valid_targets_min": 603 }, { "epoch": 2.993897787948131, "grad_norm": 0.4527064420033862, "learning_rate": 2.828942254233543e-05, "loss": 0.3067, "loss_nan_ranks": 0, "loss_rank_avg": 0.34296974539756775, "step": 3925, "valid_targets_mean": 4257.3, "valid_targets_min": 775 }, { "epoch": 2.997711670480549, "grad_norm": 1.5493618786931598, "learning_rate": 2.825479023738419e-05, "loss": 0.3772, "loss_nan_ranks": 0, "loss_rank_avg": 0.6141933798789978, "step": 3930, "valid_targets_mean": 912.7, "valid_targets_min": 582 }, { "epoch": 3.0015255530129674, "grad_norm": 0.48310757043244024, "learning_rate": 2.822012807236905e-05, "loss": 0.4621, "loss_nan_ranks": 0, "loss_rank_avg": 0.2655656039714813, "step": 3935, "valid_targets_mean": 4215.5, "valid_targets_min": 1273 }, { "epoch": 3.0053394355453853, "grad_norm": 0.5201274345684972, "learning_rate": 2.8185436172673505e-05, "loss": 0.3019, "loss_nan_ranks": 0, "loss_rank_avg": 0.290056049823761, "step": 3940, "valid_targets_mean": 3994.8, "valid_targets_min": 391 }, { "epoch": 3.009153318077803, "grad_norm": 0.4900178443387472, "learning_rate": 2.8150714663788607e-05, "loss": 0.3073, "loss_nan_ranks": 0, "loss_rank_avg": 0.2928362786769867, "step": 3945, "valid_targets_mean": 3524.9, "valid_targets_min": 778 }, { "epoch": 3.012967200610221, "grad_norm": 0.4611566543168008, "learning_rate": 2.8115963671312522e-05, "loss": 0.2868, "loss_nan_ranks": 0, "loss_rank_avg": 0.2869776785373688, "step": 3950, "valid_targets_mean": 4752.8, "valid_targets_min": 1034 }, { "epoch": 3.0167810831426394, "grad_norm": 0.4220079332151452, "learning_rate": 2.8081183320950062e-05, "loss": 0.3046, "loss_nan_ranks": 0, "loss_rank_avg": 0.2875734269618988, "step": 3955, "valid_targets_mean": 4435.6, "valid_targets_min": 477 }, { "epoch": 3.0205949656750573, "grad_norm": 0.43505589011064627, "learning_rate": 2.804637373851223e-05, "loss": 0.3031, "loss_nan_ranks": 0, "loss_rank_avg": 0.2964635193347931, "step": 3960, "valid_targets_mean": 5017.0, "valid_targets_min": 859 }, { "epoch": 3.024408848207475, "grad_norm": 0.4392891751276722, "learning_rate": 2.8011535049915787e-05, "loss": 0.3003, "loss_nan_ranks": 0, "loss_rank_avg": 0.3092955946922302, "step": 3965, "valid_targets_mean": 4434.5, "valid_targets_min": 1018 }, { "epoch": 3.028222730739893, "grad_norm": 0.4756626096657287, "learning_rate": 2.7976667381182755e-05, "loss": 0.3148, "loss_nan_ranks": 0, "loss_rank_avg": 0.33730098605155945, "step": 3970, "valid_targets_mean": 4181.9, "valid_targets_min": 1217 }, { "epoch": 3.0320366132723113, "grad_norm": 0.425272209059621, "learning_rate": 2.7941770858440013e-05, "loss": 0.3031, "loss_nan_ranks": 0, "loss_rank_avg": 0.308401495218277, "step": 3975, "valid_targets_mean": 4507.3, "valid_targets_min": 958 }, { "epoch": 3.035850495804729, "grad_norm": 0.47261764078577734, "learning_rate": 2.7906845607918787e-05, "loss": 0.2827, "loss_nan_ranks": 0, "loss_rank_avg": 0.3633866012096405, "step": 3980, "valid_targets_mean": 4527.0, "valid_targets_min": 969 }, { "epoch": 3.039664378337147, "grad_norm": 0.45027923592941194, "learning_rate": 2.7871891755954244e-05, "loss": 0.2757, "loss_nan_ranks": 0, "loss_rank_avg": 0.2875222861766815, "step": 3985, "valid_targets_mean": 4281.4, "valid_targets_min": 834 }, { "epoch": 3.0434782608695654, "grad_norm": 0.42756509589119934, "learning_rate": 2.7836909428984985e-05, "loss": 0.3086, "loss_nan_ranks": 0, "loss_rank_avg": 0.3177221119403839, "step": 3990, "valid_targets_mean": 4449.5, "valid_targets_min": 1005 }, { "epoch": 3.0472921434019833, "grad_norm": 0.4595474259293521, "learning_rate": 2.7801898753552646e-05, "loss": 0.2998, "loss_nan_ranks": 0, "loss_rank_avg": 0.304095596075058, "step": 3995, "valid_targets_mean": 4377.5, "valid_targets_min": 325 }, { "epoch": 3.051106025934401, "grad_norm": 0.4259516268464371, "learning_rate": 2.7766859856301383e-05, "loss": 0.2904, "loss_nan_ranks": 0, "loss_rank_avg": 0.3192457854747772, "step": 4000, "valid_targets_mean": 4967.5, "valid_targets_min": 933 }, { "epoch": 3.054919908466819, "grad_norm": 0.4444180247560326, "learning_rate": 2.7731792863977444e-05, "loss": 0.2954, "loss_nan_ranks": 0, "loss_rank_avg": 0.2878134250640869, "step": 4005, "valid_targets_mean": 4432.8, "valid_targets_min": 1049 }, { "epoch": 3.0587337909992374, "grad_norm": 0.4431622200695571, "learning_rate": 2.7696697903428713e-05, "loss": 0.3019, "loss_nan_ranks": 0, "loss_rank_avg": 0.2699919044971466, "step": 4010, "valid_targets_mean": 4070.9, "valid_targets_min": 1169 }, { "epoch": 3.0625476735316552, "grad_norm": 0.42489671707301224, "learning_rate": 2.7661575101604232e-05, "loss": 0.2992, "loss_nan_ranks": 0, "loss_rank_avg": 0.29186615347862244, "step": 4015, "valid_targets_mean": 5442.9, "valid_targets_min": 1401 }, { "epoch": 3.066361556064073, "grad_norm": 0.4245146413695337, "learning_rate": 2.7626424585553767e-05, "loss": 0.3123, "loss_nan_ranks": 0, "loss_rank_avg": 0.325810045003891, "step": 4020, "valid_targets_mean": 4809.8, "valid_targets_min": 1066 }, { "epoch": 3.0701754385964914, "grad_norm": 0.3791123204554425, "learning_rate": 2.7591246482427324e-05, "loss": 0.2893, "loss_nan_ranks": 0, "loss_rank_avg": 0.24728161096572876, "step": 4025, "valid_targets_mean": 5028.0, "valid_targets_min": 1443 }, { "epoch": 3.0739893211289093, "grad_norm": 0.43633981308469355, "learning_rate": 2.7556040919474703e-05, "loss": 0.3073, "loss_nan_ranks": 0, "loss_rank_avg": 0.3360931873321533, "step": 4030, "valid_targets_mean": 4940.6, "valid_targets_min": 1513 }, { "epoch": 3.077803203661327, "grad_norm": 0.39657770661164027, "learning_rate": 2.7520808024045023e-05, "loss": 0.2825, "loss_nan_ranks": 0, "loss_rank_avg": 0.28438836336135864, "step": 4035, "valid_targets_mean": 4996.4, "valid_targets_min": 1644 }, { "epoch": 3.081617086193745, "grad_norm": 0.45447668831956933, "learning_rate": 2.748554792358631e-05, "loss": 0.2879, "loss_nan_ranks": 0, "loss_rank_avg": 0.27318766713142395, "step": 4040, "valid_targets_mean": 3740.3, "valid_targets_min": 1075 }, { "epoch": 3.0854309687261634, "grad_norm": 0.4367756589898555, "learning_rate": 2.745026074564495e-05, "loss": 0.3164, "loss_nan_ranks": 0, "loss_rank_avg": 0.3054395318031311, "step": 4045, "valid_targets_mean": 4505.4, "valid_targets_min": 846 }, { "epoch": 3.0892448512585813, "grad_norm": 0.4223604121541854, "learning_rate": 2.7414946617865314e-05, "loss": 0.2864, "loss_nan_ranks": 0, "loss_rank_avg": 0.2978456914424896, "step": 4050, "valid_targets_mean": 4903.7, "valid_targets_min": 337 }, { "epoch": 3.093058733790999, "grad_norm": 0.43033237877389213, "learning_rate": 2.737960566798924e-05, "loss": 0.316, "loss_nan_ranks": 0, "loss_rank_avg": 0.2762766480445862, "step": 4055, "valid_targets_mean": 4822.3, "valid_targets_min": 1422 }, { "epoch": 3.096872616323417, "grad_norm": 0.40857330036886025, "learning_rate": 2.7344238023855584e-05, "loss": 0.2915, "loss_nan_ranks": 0, "loss_rank_avg": 0.27897074818611145, "step": 4060, "valid_targets_mean": 4889.1, "valid_targets_min": 1257 }, { "epoch": 3.1006864988558354, "grad_norm": 0.452005688420249, "learning_rate": 2.7308843813399786e-05, "loss": 0.2936, "loss_nan_ranks": 0, "loss_rank_avg": 0.30446675419807434, "step": 4065, "valid_targets_mean": 4752.8, "valid_targets_min": 223 }, { "epoch": 3.1045003813882532, "grad_norm": 0.4060532799872907, "learning_rate": 2.7273423164653364e-05, "loss": 0.2954, "loss_nan_ranks": 0, "loss_rank_avg": 0.31288203597068787, "step": 4070, "valid_targets_mean": 4683.4, "valid_targets_min": 1248 }, { "epoch": 3.108314263920671, "grad_norm": 0.4090987889175147, "learning_rate": 2.7237976205743483e-05, "loss": 0.3102, "loss_nan_ranks": 0, "loss_rank_avg": 0.30633795261383057, "step": 4075, "valid_targets_mean": 4901.8, "valid_targets_min": 1770 }, { "epoch": 3.1121281464530894, "grad_norm": 0.43929196666659526, "learning_rate": 2.7202503064892472e-05, "loss": 0.2875, "loss_nan_ranks": 0, "loss_rank_avg": 0.2629685401916504, "step": 4080, "valid_targets_mean": 4338.1, "valid_targets_min": 382 }, { "epoch": 3.1159420289855073, "grad_norm": 0.43667857011990463, "learning_rate": 2.7167003870417373e-05, "loss": 0.2895, "loss_nan_ranks": 0, "loss_rank_avg": 0.2743583619594574, "step": 4085, "valid_targets_mean": 3987.3, "valid_targets_min": 936 }, { "epoch": 3.119755911517925, "grad_norm": 0.432006100221033, "learning_rate": 2.7131478750729478e-05, "loss": 0.2948, "loss_nan_ranks": 0, "loss_rank_avg": 0.3109601140022278, "step": 4090, "valid_targets_mean": 4254.5, "valid_targets_min": 1019 }, { "epoch": 3.123569794050343, "grad_norm": 1.52971297266124, "learning_rate": 2.709592783433384e-05, "loss": 0.4114, "loss_nan_ranks": 0, "loss_rank_avg": 0.5797714591026306, "step": 4095, "valid_targets_mean": 871.8, "valid_targets_min": 612 }, { "epoch": 3.1273836765827614, "grad_norm": 0.48384704512411747, "learning_rate": 2.706035124982884e-05, "loss": 0.363, "loss_nan_ranks": 0, "loss_rank_avg": 0.33182665705680847, "step": 4100, "valid_targets_mean": 4583.2, "valid_targets_min": 989 }, { "epoch": 3.1311975591151793, "grad_norm": 0.4293633304827102, "learning_rate": 2.70247491259057e-05, "loss": 0.3112, "loss_nan_ranks": 0, "loss_rank_avg": 0.3025500178337097, "step": 4105, "valid_targets_mean": 5153.6, "valid_targets_min": 1300 }, { "epoch": 3.135011441647597, "grad_norm": 0.4137531220478505, "learning_rate": 2.6989121591348042e-05, "loss": 0.3049, "loss_nan_ranks": 0, "loss_rank_avg": 0.2954184114933014, "step": 4110, "valid_targets_mean": 4562.9, "valid_targets_min": 1009 }, { "epoch": 3.138825324180015, "grad_norm": 0.44578706063633217, "learning_rate": 2.695346877503138e-05, "loss": 0.2964, "loss_nan_ranks": 0, "loss_rank_avg": 0.28965505957603455, "step": 4115, "valid_targets_mean": 4348.2, "valid_targets_min": 489 }, { "epoch": 3.1426392067124334, "grad_norm": 0.4231966599504782, "learning_rate": 2.6917790805922712e-05, "loss": 0.3074, "loss_nan_ranks": 0, "loss_rank_avg": 0.3042294681072235, "step": 4120, "valid_targets_mean": 4731.0, "valid_targets_min": 1170 }, { "epoch": 3.1464530892448512, "grad_norm": 0.4382111519022077, "learning_rate": 2.6882087813079993e-05, "loss": 0.3045, "loss_nan_ranks": 0, "loss_rank_avg": 0.28395530581474304, "step": 4125, "valid_targets_mean": 4604.8, "valid_targets_min": 1536 }, { "epoch": 3.150266971777269, "grad_norm": 0.41220279417697464, "learning_rate": 2.684635992565172e-05, "loss": 0.31, "loss_nan_ranks": 0, "loss_rank_avg": 0.2971174418926239, "step": 4130, "valid_targets_mean": 4894.4, "valid_targets_min": 1206 }, { "epoch": 3.1540808543096874, "grad_norm": 0.5066318014346421, "learning_rate": 2.6810607272876407e-05, "loss": 0.3027, "loss_nan_ranks": 0, "loss_rank_avg": 0.28627005219459534, "step": 4135, "valid_targets_mean": 3675.4, "valid_targets_min": 1096 }, { "epoch": 3.1578947368421053, "grad_norm": 0.42053061864748154, "learning_rate": 2.677482998408219e-05, "loss": 0.279, "loss_nan_ranks": 0, "loss_rank_avg": 0.23367096483707428, "step": 4140, "valid_targets_mean": 4173.1, "valid_targets_min": 1378 }, { "epoch": 3.161708619374523, "grad_norm": 0.4314063513504651, "learning_rate": 2.67390281886863e-05, "loss": 0.2937, "loss_nan_ranks": 0, "loss_rank_avg": 0.2894207239151001, "step": 4145, "valid_targets_mean": 4910.4, "valid_targets_min": 1027 }, { "epoch": 3.165522501906941, "grad_norm": 0.39830842433372293, "learning_rate": 2.6703202016194617e-05, "loss": 0.277, "loss_nan_ranks": 0, "loss_rank_avg": 0.2879965305328369, "step": 4150, "valid_targets_mean": 4634.0, "valid_targets_min": 353 }, { "epoch": 3.1693363844393594, "grad_norm": 0.43997400948287896, "learning_rate": 2.6667351596201207e-05, "loss": 0.3169, "loss_nan_ranks": 0, "loss_rank_avg": 0.28813639283180237, "step": 4155, "valid_targets_mean": 4294.4, "valid_targets_min": 841 }, { "epoch": 3.1731502669717773, "grad_norm": 0.43562273667182827, "learning_rate": 2.6631477058387836e-05, "loss": 0.2753, "loss_nan_ranks": 0, "loss_rank_avg": 0.26361653208732605, "step": 4160, "valid_targets_mean": 4073.6, "valid_targets_min": 448 }, { "epoch": 3.176964149504195, "grad_norm": 0.4022019133128142, "learning_rate": 2.659557853252353e-05, "loss": 0.2947, "loss_nan_ranks": 0, "loss_rank_avg": 0.2975803017616272, "step": 4165, "valid_targets_mean": 5350.9, "valid_targets_min": 1290 }, { "epoch": 3.1807780320366135, "grad_norm": 0.41775729801028555, "learning_rate": 2.6559656148464065e-05, "loss": 0.3094, "loss_nan_ranks": 0, "loss_rank_avg": 0.31065797805786133, "step": 4170, "valid_targets_mean": 4931.3, "valid_targets_min": 1049 }, { "epoch": 3.1845919145690313, "grad_norm": 0.42340874498162046, "learning_rate": 2.6523710036151538e-05, "loss": 0.2791, "loss_nan_ranks": 0, "loss_rank_avg": 0.28241145610809326, "step": 4175, "valid_targets_mean": 4305.8, "valid_targets_min": 747 }, { "epoch": 3.1884057971014492, "grad_norm": 0.4206928272872279, "learning_rate": 2.648774032561386e-05, "loss": 0.2977, "loss_nan_ranks": 0, "loss_rank_avg": 0.308231920003891, "step": 4180, "valid_targets_mean": 5015.2, "valid_targets_min": 962 }, { "epoch": 3.192219679633867, "grad_norm": 0.46998455382582077, "learning_rate": 2.6451747146964324e-05, "loss": 0.2928, "loss_nan_ranks": 0, "loss_rank_avg": 0.3151862919330597, "step": 4185, "valid_targets_mean": 4189.7, "valid_targets_min": 895 }, { "epoch": 3.1960335621662854, "grad_norm": 0.44181960848776786, "learning_rate": 2.6415730630401094e-05, "loss": 0.2957, "loss_nan_ranks": 0, "loss_rank_avg": 0.3007621765136719, "step": 4190, "valid_targets_mean": 4348.0, "valid_targets_min": 1047 }, { "epoch": 3.1998474446987033, "grad_norm": 0.3832339742293115, "learning_rate": 2.6379690906206774e-05, "loss": 0.2999, "loss_nan_ranks": 0, "loss_rank_avg": 0.31467732787132263, "step": 4195, "valid_targets_mean": 5705.5, "valid_targets_min": 1138 }, { "epoch": 3.203661327231121, "grad_norm": 0.392229055026644, "learning_rate": 2.63436281047479e-05, "loss": 0.2923, "loss_nan_ranks": 0, "loss_rank_avg": 0.293388694524765, "step": 4200, "valid_targets_mean": 5568.1, "valid_targets_min": 1459 }, { "epoch": 3.2074752097635395, "grad_norm": 0.5283415619583283, "learning_rate": 2.630754235647449e-05, "loss": 0.3102, "loss_nan_ranks": 0, "loss_rank_avg": 0.3029252588748932, "step": 4205, "valid_targets_mean": 4410.8, "valid_targets_min": 1391 }, { "epoch": 3.2112890922959574, "grad_norm": 0.4094720780562837, "learning_rate": 2.6271433791919574e-05, "loss": 0.3106, "loss_nan_ranks": 0, "loss_rank_avg": 0.3849099576473236, "step": 4210, "valid_targets_mean": 6173.7, "valid_targets_min": 1324 }, { "epoch": 3.2151029748283753, "grad_norm": 0.43046488665942784, "learning_rate": 2.6235302541698717e-05, "loss": 0.2918, "loss_nan_ranks": 0, "loss_rank_avg": 0.30120354890823364, "step": 4215, "valid_targets_mean": 4579.4, "valid_targets_min": 1042 }, { "epoch": 3.218916857360793, "grad_norm": 0.4789181271781151, "learning_rate": 2.6199148736509533e-05, "loss": 0.3147, "loss_nan_ranks": 0, "loss_rank_avg": 0.3252256512641907, "step": 4220, "valid_targets_mean": 4278.8, "valid_targets_min": 1484 }, { "epoch": 3.2227307398932115, "grad_norm": 0.43690382548291334, "learning_rate": 2.6162972507131233e-05, "loss": 0.2824, "loss_nan_ranks": 0, "loss_rank_avg": 0.2524643540382385, "step": 4225, "valid_targets_mean": 3789.8, "valid_targets_min": 850 }, { "epoch": 3.2265446224256293, "grad_norm": 0.4008308182938237, "learning_rate": 2.6126773984424136e-05, "loss": 0.3296, "loss_nan_ranks": 0, "loss_rank_avg": 0.3713483512401581, "step": 4230, "valid_targets_mean": 6207.3, "valid_targets_min": 1052 }, { "epoch": 3.230358504958047, "grad_norm": 0.41774399379354676, "learning_rate": 2.6090553299329208e-05, "loss": 0.3051, "loss_nan_ranks": 0, "loss_rank_avg": 0.27272287011146545, "step": 4235, "valid_targets_mean": 4272.5, "valid_targets_min": 279 }, { "epoch": 3.234172387490465, "grad_norm": 0.4093732314062262, "learning_rate": 2.605431058286759e-05, "loss": 0.2988, "loss_nan_ranks": 0, "loss_rank_avg": 0.3073391020298004, "step": 4240, "valid_targets_mean": 4975.9, "valid_targets_min": 706 }, { "epoch": 3.2379862700228834, "grad_norm": 0.47298284841603055, "learning_rate": 2.6018045966140105e-05, "loss": 0.2968, "loss_nan_ranks": 0, "loss_rank_avg": 0.3122836649417877, "step": 4245, "valid_targets_mean": 4119.1, "valid_targets_min": 291 }, { "epoch": 3.2418001525553013, "grad_norm": 0.40428395385460597, "learning_rate": 2.5981759580326796e-05, "loss": 0.3061, "loss_nan_ranks": 0, "loss_rank_avg": 0.3531065285205841, "step": 4250, "valid_targets_mean": 6081.3, "valid_targets_min": 1442 }, { "epoch": 3.245614035087719, "grad_norm": 0.4346135876532143, "learning_rate": 2.594545155668646e-05, "loss": 0.2952, "loss_nan_ranks": 0, "loss_rank_avg": 0.284991055727005, "step": 4255, "valid_targets_mean": 4164.0, "valid_targets_min": 1551 }, { "epoch": 3.2494279176201375, "grad_norm": 1.295013445237469, "learning_rate": 2.5909122026556156e-05, "loss": 0.4469, "loss_nan_ranks": 0, "loss_rank_avg": 0.5561190843582153, "step": 4260, "valid_targets_mean": 887.6, "valid_targets_min": 564 }, { "epoch": 3.2532418001525554, "grad_norm": 0.5633888295443477, "learning_rate": 2.5872771121350746e-05, "loss": 0.4165, "loss_nan_ranks": 0, "loss_rank_avg": 0.32503604888916016, "step": 4265, "valid_targets_mean": 3850.0, "valid_targets_min": 1141 }, { "epoch": 3.2570556826849733, "grad_norm": 0.5281593372478045, "learning_rate": 2.583639897256241e-05, "loss": 0.3148, "loss_nan_ranks": 0, "loss_rank_avg": 0.3609069883823395, "step": 4270, "valid_targets_mean": 4185.0, "valid_targets_min": 1144 }, { "epoch": 3.260869565217391, "grad_norm": 0.4891379681010717, "learning_rate": 2.580000571176017e-05, "loss": 0.2832, "loss_nan_ranks": 0, "loss_rank_avg": 0.29750365018844604, "step": 4275, "valid_targets_mean": 3510.4, "valid_targets_min": 1197 }, { "epoch": 3.2646834477498095, "grad_norm": 0.43956221026432685, "learning_rate": 2.5763591470589412e-05, "loss": 0.3188, "loss_nan_ranks": 0, "loss_rank_avg": 0.3253210783004761, "step": 4280, "valid_targets_mean": 4749.8, "valid_targets_min": 1060 }, { "epoch": 3.2684973302822273, "grad_norm": 0.46292002185303716, "learning_rate": 2.572715638077142e-05, "loss": 0.2953, "loss_nan_ranks": 0, "loss_rank_avg": 0.33239755034446716, "step": 4285, "valid_targets_mean": 4043.5, "valid_targets_min": 1669 }, { "epoch": 3.272311212814645, "grad_norm": 0.5074495934712384, "learning_rate": 2.569070057410291e-05, "loss": 0.31, "loss_nan_ranks": 0, "loss_rank_avg": 0.32021841406822205, "step": 4290, "valid_targets_mean": 3380.5, "valid_targets_min": 1275 }, { "epoch": 3.276125095347063, "grad_norm": 0.40410647442164166, "learning_rate": 2.5654224182455503e-05, "loss": 0.29, "loss_nan_ranks": 0, "loss_rank_avg": 0.25639939308166504, "step": 4295, "valid_targets_mean": 4476.0, "valid_targets_min": 1255 }, { "epoch": 3.2799389778794814, "grad_norm": 0.4379359856829999, "learning_rate": 2.5617727337775304e-05, "loss": 0.2799, "loss_nan_ranks": 0, "loss_rank_avg": 0.308867871761322, "step": 4300, "valid_targets_mean": 4687.6, "valid_targets_min": 943 }, { "epoch": 3.2837528604118993, "grad_norm": 0.4635823928148595, "learning_rate": 2.5581210172082403e-05, "loss": 0.294, "loss_nan_ranks": 0, "loss_rank_avg": 0.24824810028076172, "step": 4305, "valid_targets_mean": 3754.1, "valid_targets_min": 1090 }, { "epoch": 3.287566742944317, "grad_norm": 0.4683550105277778, "learning_rate": 2.554467281747039e-05, "loss": 0.289, "loss_nan_ranks": 0, "loss_rank_avg": 0.28184881806373596, "step": 4310, "valid_targets_mean": 4163.5, "valid_targets_min": 842 }, { "epoch": 3.2913806254767355, "grad_norm": 0.4915064273261867, "learning_rate": 2.550811540610589e-05, "loss": 0.285, "loss_nan_ranks": 0, "loss_rank_avg": 0.2834111750125885, "step": 4315, "valid_targets_mean": 3685.3, "valid_targets_min": 552 }, { "epoch": 3.2951945080091534, "grad_norm": 0.3914255824084369, "learning_rate": 2.5471538070228066e-05, "loss": 0.2868, "loss_nan_ranks": 0, "loss_rank_avg": 0.2567122280597687, "step": 4320, "valid_targets_mean": 5006.8, "valid_targets_min": 757 }, { "epoch": 3.2990083905415712, "grad_norm": 0.472640247378806, "learning_rate": 2.5434940942148183e-05, "loss": 0.2886, "loss_nan_ranks": 0, "loss_rank_avg": 0.3348356783390045, "step": 4325, "valid_targets_mean": 4366.6, "valid_targets_min": 1039 }, { "epoch": 3.302822273073989, "grad_norm": 0.4923236156250513, "learning_rate": 2.5398324154249063e-05, "loss": 0.2921, "loss_nan_ranks": 0, "loss_rank_avg": 0.34193626046180725, "step": 4330, "valid_targets_mean": 3921.7, "valid_targets_min": 1132 }, { "epoch": 3.3066361556064074, "grad_norm": 0.471692146824963, "learning_rate": 2.5361687838984677e-05, "loss": 0.2904, "loss_nan_ranks": 0, "loss_rank_avg": 0.2816826403141022, "step": 4335, "valid_targets_mean": 3595.5, "valid_targets_min": 1221 }, { "epoch": 3.3104500381388253, "grad_norm": 0.42190916943969575, "learning_rate": 2.532503212887961e-05, "loss": 0.2878, "loss_nan_ranks": 0, "loss_rank_avg": 0.2746467888355255, "step": 4340, "valid_targets_mean": 4154.9, "valid_targets_min": 347 }, { "epoch": 3.314263920671243, "grad_norm": 0.453882889428085, "learning_rate": 2.5288357156528615e-05, "loss": 0.2913, "loss_nan_ranks": 0, "loss_rank_avg": 0.29759106040000916, "step": 4345, "valid_targets_mean": 4029.9, "valid_targets_min": 1333 }, { "epoch": 3.3180778032036615, "grad_norm": 0.49862486651056076, "learning_rate": 2.5251663054596115e-05, "loss": 0.2935, "loss_nan_ranks": 0, "loss_rank_avg": 0.28774699568748474, "step": 4350, "valid_targets_mean": 3458.5, "valid_targets_min": 359 }, { "epoch": 3.3218916857360794, "grad_norm": 0.4382109576845958, "learning_rate": 2.5214949955815744e-05, "loss": 0.2815, "loss_nan_ranks": 0, "loss_rank_avg": 0.273575097322464, "step": 4355, "valid_targets_mean": 4762.6, "valid_targets_min": 1560 }, { "epoch": 3.3257055682684973, "grad_norm": 0.3952193306320817, "learning_rate": 2.517821799298983e-05, "loss": 0.3003, "loss_nan_ranks": 0, "loss_rank_avg": 0.2989937365055084, "step": 4360, "valid_targets_mean": 4993.2, "valid_targets_min": 1108 }, { "epoch": 3.329519450800915, "grad_norm": 0.4299063443043704, "learning_rate": 2.5141467298988966e-05, "loss": 0.2962, "loss_nan_ranks": 0, "loss_rank_avg": 0.28979429602622986, "step": 4365, "valid_targets_mean": 4497.9, "valid_targets_min": 1254 }, { "epoch": 3.3333333333333335, "grad_norm": 0.4678185856388349, "learning_rate": 2.5104698006751478e-05, "loss": 0.2899, "loss_nan_ranks": 0, "loss_rank_avg": 0.2760257422924042, "step": 4370, "valid_targets_mean": 3716.8, "valid_targets_min": 751 }, { "epoch": 3.3371472158657514, "grad_norm": 0.44293102220158903, "learning_rate": 2.5067910249282977e-05, "loss": 0.2808, "loss_nan_ranks": 0, "loss_rank_avg": 0.28500014543533325, "step": 4375, "valid_targets_mean": 4523.8, "valid_targets_min": 1655 }, { "epoch": 3.3409610983981692, "grad_norm": 0.5415466643652644, "learning_rate": 2.503110415965587e-05, "loss": 0.2944, "loss_nan_ranks": 0, "loss_rank_avg": 0.2982900142669678, "step": 4380, "valid_targets_mean": 2946.4, "valid_targets_min": 1071 }, { "epoch": 3.3447749809305876, "grad_norm": 0.44053774022930603, "learning_rate": 2.4994279871008877e-05, "loss": 0.2932, "loss_nan_ranks": 0, "loss_rank_avg": 0.2539463937282562, "step": 4385, "valid_targets_mean": 4374.5, "valid_targets_min": 1125 }, { "epoch": 3.3485888634630054, "grad_norm": 0.44003841730672233, "learning_rate": 2.4957437516546543e-05, "loss": 0.2892, "loss_nan_ranks": 0, "loss_rank_avg": 0.32349371910095215, "step": 4390, "valid_targets_mean": 4640.0, "valid_targets_min": 919 }, { "epoch": 3.3524027459954233, "grad_norm": 0.4464447323916682, "learning_rate": 2.4920577229538773e-05, "loss": 0.2985, "loss_nan_ranks": 0, "loss_rank_avg": 0.30756130814552307, "step": 4395, "valid_targets_mean": 4225.8, "valid_targets_min": 1071 }, { "epoch": 3.356216628527841, "grad_norm": 0.4147797648169543, "learning_rate": 2.4883699143320327e-05, "loss": 0.2808, "loss_nan_ranks": 0, "loss_rank_avg": 0.3059729039669037, "step": 4400, "valid_targets_mean": 4530.5, "valid_targets_min": 1432 }, { "epoch": 3.3600305110602595, "grad_norm": 0.48324594985252733, "learning_rate": 2.4846803391290362e-05, "loss": 0.289, "loss_nan_ranks": 0, "loss_rank_avg": 0.28423330187797546, "step": 4405, "valid_targets_mean": 4117.8, "valid_targets_min": 689 }, { "epoch": 3.3638443935926774, "grad_norm": 0.39510207327738245, "learning_rate": 2.480989010691192e-05, "loss": 0.2879, "loss_nan_ranks": 0, "loss_rank_avg": 0.29658064246177673, "step": 4410, "valid_targets_mean": 5399.8, "valid_targets_min": 1256 }, { "epoch": 3.3676582761250953, "grad_norm": 0.42497343584852565, "learning_rate": 2.4772959423711484e-05, "loss": 0.2876, "loss_nan_ranks": 0, "loss_rank_avg": 0.3150722086429596, "step": 4415, "valid_targets_mean": 4667.6, "valid_targets_min": 958 }, { "epoch": 3.3714721586575136, "grad_norm": 0.47430966618042086, "learning_rate": 2.4736011475278466e-05, "loss": 0.2681, "loss_nan_ranks": 0, "loss_rank_avg": 0.28610026836395264, "step": 4420, "valid_targets_mean": 4018.0, "valid_targets_min": 525 }, { "epoch": 3.3752860411899315, "grad_norm": 1.3538687602475996, "learning_rate": 2.4699046395264724e-05, "loss": 0.4153, "loss_nan_ranks": 0, "loss_rank_avg": 0.5354134440422058, "step": 4425, "valid_targets_mean": 843.5, "valid_targets_min": 555 }, { "epoch": 3.3790999237223494, "grad_norm": 0.4434389928639025, "learning_rate": 2.4662064317384093e-05, "loss": 0.3016, "loss_nan_ranks": 0, "loss_rank_avg": 0.321266770362854, "step": 4430, "valid_targets_mean": 5056.5, "valid_targets_min": 590 }, { "epoch": 3.3829138062547672, "grad_norm": 0.4176548333395029, "learning_rate": 2.4625065375411897e-05, "loss": 0.3015, "loss_nan_ranks": 0, "loss_rank_avg": 0.2966906726360321, "step": 4435, "valid_targets_mean": 4763.8, "valid_targets_min": 1576 }, { "epoch": 3.386727688787185, "grad_norm": 0.4832013590980464, "learning_rate": 2.458804970318446e-05, "loss": 0.304, "loss_nan_ranks": 0, "loss_rank_avg": 0.32015255093574524, "step": 4440, "valid_targets_mean": 3990.1, "valid_targets_min": 856 }, { "epoch": 3.3905415713196034, "grad_norm": 0.43037675012382226, "learning_rate": 2.4551017434598618e-05, "loss": 0.2853, "loss_nan_ranks": 0, "loss_rank_avg": 0.26767686009407043, "step": 4445, "valid_targets_mean": 4260.4, "valid_targets_min": 395 }, { "epoch": 3.3943554538520213, "grad_norm": 0.4814709495318474, "learning_rate": 2.4513968703611247e-05, "loss": 0.3028, "loss_nan_ranks": 0, "loss_rank_avg": 0.2948641777038574, "step": 4450, "valid_targets_mean": 3419.1, "valid_targets_min": 531 }, { "epoch": 3.398169336384439, "grad_norm": 0.44472165177178047, "learning_rate": 2.4476903644238773e-05, "loss": 0.2869, "loss_nan_ranks": 0, "loss_rank_avg": 0.28508543968200684, "step": 4455, "valid_targets_mean": 4292.3, "valid_targets_min": 506 }, { "epoch": 3.4019832189168575, "grad_norm": 0.41201008799766403, "learning_rate": 2.4439822390556683e-05, "loss": 0.3046, "loss_nan_ranks": 0, "loss_rank_avg": 0.31197693943977356, "step": 4460, "valid_targets_mean": 5086.9, "valid_targets_min": 906 }, { "epoch": 3.4057971014492754, "grad_norm": 0.454379940882493, "learning_rate": 2.4402725076699058e-05, "loss": 0.2818, "loss_nan_ranks": 0, "loss_rank_avg": 0.2770203649997711, "step": 4465, "valid_targets_mean": 4577.1, "valid_targets_min": 997 }, { "epoch": 3.4096109839816933, "grad_norm": 0.527988293091776, "learning_rate": 2.4365611836858045e-05, "loss": 0.2937, "loss_nan_ranks": 0, "loss_rank_avg": 0.31560805439949036, "step": 4470, "valid_targets_mean": 4082.6, "valid_targets_min": 545 }, { "epoch": 3.413424866514111, "grad_norm": 0.4064911273535986, "learning_rate": 2.4328482805283425e-05, "loss": 0.2894, "loss_nan_ranks": 0, "loss_rank_avg": 0.2556368410587311, "step": 4475, "valid_targets_mean": 4709.9, "valid_targets_min": 1240 }, { "epoch": 3.4172387490465295, "grad_norm": 0.5843567476660677, "learning_rate": 2.4291338116282095e-05, "loss": 0.282, "loss_nan_ranks": 0, "loss_rank_avg": 0.2823584973812103, "step": 4480, "valid_targets_mean": 3790.3, "valid_targets_min": 820 }, { "epoch": 3.4210526315789473, "grad_norm": 0.4567750258288281, "learning_rate": 2.4254177904217584e-05, "loss": 0.2967, "loss_nan_ranks": 0, "loss_rank_avg": 0.294177383184433, "step": 4485, "valid_targets_mean": 4076.5, "valid_targets_min": 606 }, { "epoch": 3.4248665141113652, "grad_norm": 0.5011803624411254, "learning_rate": 2.4217002303509585e-05, "loss": 0.2912, "loss_nan_ranks": 0, "loss_rank_avg": 0.2771233022212982, "step": 4490, "valid_targets_mean": 3349.8, "valid_targets_min": 1136 }, { "epoch": 3.4286803966437835, "grad_norm": 0.4659529424276567, "learning_rate": 2.417981144863344e-05, "loss": 0.2799, "loss_nan_ranks": 0, "loss_rank_avg": 0.3151896893978119, "step": 4495, "valid_targets_mean": 3970.9, "valid_targets_min": 844 }, { "epoch": 3.4324942791762014, "grad_norm": 0.4365423762808735, "learning_rate": 2.414260547411968e-05, "loss": 0.2913, "loss_nan_ranks": 0, "loss_rank_avg": 0.2706001102924347, "step": 4500, "valid_targets_mean": 4455.2, "valid_targets_min": 949 }, { "epoch": 3.4363081617086193, "grad_norm": 0.41739904226755675, "learning_rate": 2.4105384514553536e-05, "loss": 0.279, "loss_nan_ranks": 0, "loss_rank_avg": 0.2490123063325882, "step": 4505, "valid_targets_mean": 4767.6, "valid_targets_min": 1047 }, { "epoch": 3.440122044241037, "grad_norm": 0.44840746198558895, "learning_rate": 2.406814870457443e-05, "loss": 0.2792, "loss_nan_ranks": 0, "loss_rank_avg": 0.279386430978775, "step": 4510, "valid_targets_mean": 4174.1, "valid_targets_min": 571 }, { "epoch": 3.4439359267734555, "grad_norm": 0.4819890452945161, "learning_rate": 2.4030898178875505e-05, "loss": 0.2667, "loss_nan_ranks": 0, "loss_rank_avg": 0.26938095688819885, "step": 4515, "valid_targets_mean": 3857.3, "valid_targets_min": 414 }, { "epoch": 3.4477498093058734, "grad_norm": 0.44292361932334906, "learning_rate": 2.399363307220314e-05, "loss": 0.2881, "loss_nan_ranks": 0, "loss_rank_avg": 0.2844865024089813, "step": 4520, "valid_targets_mean": 4402.6, "valid_targets_min": 1365 }, { "epoch": 3.4515636918382913, "grad_norm": 0.46107216304175414, "learning_rate": 2.3956353519356457e-05, "loss": 0.2894, "loss_nan_ranks": 0, "loss_rank_avg": 0.33531391620635986, "step": 4525, "valid_targets_mean": 4102.7, "valid_targets_min": 335 }, { "epoch": 3.4553775743707096, "grad_norm": 0.442565568837418, "learning_rate": 2.3919059655186833e-05, "loss": 0.2705, "loss_nan_ranks": 0, "loss_rank_avg": 0.26467326283454895, "step": 4530, "valid_targets_mean": 4285.3, "valid_targets_min": 1265 }, { "epoch": 3.4591914569031275, "grad_norm": 0.4525205079659544, "learning_rate": 2.388175161459741e-05, "loss": 0.2955, "loss_nan_ranks": 0, "loss_rank_avg": 0.2614127993583679, "step": 4535, "valid_targets_mean": 4639.7, "valid_targets_min": 896 }, { "epoch": 3.4630053394355453, "grad_norm": 0.4286446055548415, "learning_rate": 2.384442953254262e-05, "loss": 0.2967, "loss_nan_ranks": 0, "loss_rank_avg": 0.31952324509620667, "step": 4540, "valid_targets_mean": 4769.8, "valid_targets_min": 1221 }, { "epoch": 3.466819221967963, "grad_norm": 0.4394695100350723, "learning_rate": 2.380709354402767e-05, "loss": 0.3105, "loss_nan_ranks": 0, "loss_rank_avg": 0.3081350326538086, "step": 4545, "valid_targets_mean": 4902.0, "valid_targets_min": 1328 }, { "epoch": 3.4706331045003815, "grad_norm": 0.44252990452185964, "learning_rate": 2.3769743784108098e-05, "loss": 0.3006, "loss_nan_ranks": 0, "loss_rank_avg": 0.2925524413585663, "step": 4550, "valid_targets_mean": 4228.0, "valid_targets_min": 282 }, { "epoch": 3.4744469870327994, "grad_norm": 0.43649847593552715, "learning_rate": 2.3732380387889226e-05, "loss": 0.2939, "loss_nan_ranks": 0, "loss_rank_avg": 0.29324600100517273, "step": 4555, "valid_targets_mean": 4716.2, "valid_targets_min": 1282 }, { "epoch": 3.4782608695652173, "grad_norm": 0.5901540282708677, "learning_rate": 2.369500349052573e-05, "loss": 0.2969, "loss_nan_ranks": 0, "loss_rank_avg": 0.33937153220176697, "step": 4560, "valid_targets_mean": 6044.2, "valid_targets_min": 1284 }, { "epoch": 3.4820747520976356, "grad_norm": 0.48142713655684205, "learning_rate": 2.3657613227221102e-05, "loss": 0.298, "loss_nan_ranks": 0, "loss_rank_avg": 0.2688189446926117, "step": 4565, "valid_targets_mean": 3629.0, "valid_targets_min": 1103 }, { "epoch": 3.4858886346300535, "grad_norm": 0.4492333230953052, "learning_rate": 2.3620209733227192e-05, "loss": 0.2789, "loss_nan_ranks": 0, "loss_rank_avg": 0.25333163142204285, "step": 4570, "valid_targets_mean": 3804.1, "valid_targets_min": 887 }, { "epoch": 3.4897025171624714, "grad_norm": 0.476448139584302, "learning_rate": 2.3582793143843716e-05, "loss": 0.2828, "loss_nan_ranks": 0, "loss_rank_avg": 0.2749543786048889, "step": 4575, "valid_targets_mean": 4068.4, "valid_targets_min": 953 }, { "epoch": 3.4935163996948893, "grad_norm": 0.4359786993878809, "learning_rate": 2.3545363594417743e-05, "loss": 0.2949, "loss_nan_ranks": 0, "loss_rank_avg": 0.28557226061820984, "step": 4580, "valid_targets_mean": 4143.3, "valid_targets_min": 1066 }, { "epoch": 3.4973302822273076, "grad_norm": 1.3429881064610008, "learning_rate": 2.3507921220343248e-05, "loss": 0.3855, "loss_nan_ranks": 0, "loss_rank_avg": 0.5342379212379456, "step": 4585, "valid_targets_mean": 836.2, "valid_targets_min": 603 }, { "epoch": 3.5011441647597255, "grad_norm": 0.5099271236627688, "learning_rate": 2.347046615706057e-05, "loss": 0.3903, "loss_nan_ranks": 0, "loss_rank_avg": 0.2950020730495453, "step": 4590, "valid_targets_mean": 4808.9, "valid_targets_min": 1261 }, { "epoch": 3.5049580472921433, "grad_norm": 0.45148904022167163, "learning_rate": 2.3432998540055968e-05, "loss": 0.2798, "loss_nan_ranks": 0, "loss_rank_avg": 0.26813894510269165, "step": 4595, "valid_targets_mean": 4466.8, "valid_targets_min": 1142 }, { "epoch": 3.5087719298245617, "grad_norm": 0.48016054420587306, "learning_rate": 2.3395518504861095e-05, "loss": 0.2874, "loss_nan_ranks": 0, "loss_rank_avg": 0.31315457820892334, "step": 4600, "valid_targets_mean": 3756.8, "valid_targets_min": 813 }, { "epoch": 3.5125858123569795, "grad_norm": 0.3827932809867314, "learning_rate": 2.3358026187052536e-05, "loss": 0.2827, "loss_nan_ranks": 0, "loss_rank_avg": 0.2498505562543869, "step": 4605, "valid_targets_mean": 5474.2, "valid_targets_min": 1300 }, { "epoch": 3.5163996948893974, "grad_norm": 0.4885836440650446, "learning_rate": 2.3320521722251308e-05, "loss": 0.298, "loss_nan_ranks": 0, "loss_rank_avg": 0.3247798979282379, "step": 4610, "valid_targets_mean": 4359.9, "valid_targets_min": 1083 }, { "epoch": 3.5202135774218153, "grad_norm": 0.4165894714535205, "learning_rate": 2.328300524612236e-05, "loss": 0.2844, "loss_nan_ranks": 0, "loss_rank_avg": 0.3320067822933197, "step": 4615, "valid_targets_mean": 5239.2, "valid_targets_min": 1702 }, { "epoch": 3.524027459954233, "grad_norm": 0.39401369842550765, "learning_rate": 2.3245476894374087e-05, "loss": 0.2931, "loss_nan_ranks": 0, "loss_rank_avg": 0.2737915515899658, "step": 4620, "valid_targets_mean": 5084.2, "valid_targets_min": 1785 }, { "epoch": 3.5278413424866515, "grad_norm": 0.4594224574976198, "learning_rate": 2.3207936802757844e-05, "loss": 0.2972, "loss_nan_ranks": 0, "loss_rank_avg": 0.29349514842033386, "step": 4625, "valid_targets_mean": 4702.5, "valid_targets_min": 1313 }, { "epoch": 3.5316552250190694, "grad_norm": 0.5133283887809664, "learning_rate": 2.317038510706747e-05, "loss": 0.2897, "loss_nan_ranks": 0, "loss_rank_avg": 0.30904343724250793, "step": 4630, "valid_targets_mean": 3583.6, "valid_targets_min": 985 }, { "epoch": 3.5354691075514877, "grad_norm": 0.40462253402146175, "learning_rate": 2.3132821943138756e-05, "loss": 0.2727, "loss_nan_ranks": 0, "loss_rank_avg": 0.26162537932395935, "step": 4635, "valid_targets_mean": 4592.1, "valid_targets_min": 1251 }, { "epoch": 3.5392829900839056, "grad_norm": 0.4699941999637695, "learning_rate": 2.3095247446848986e-05, "loss": 0.2914, "loss_nan_ranks": 0, "loss_rank_avg": 0.2771185338497162, "step": 4640, "valid_targets_mean": 4387.5, "valid_targets_min": 1457 }, { "epoch": 3.5430968726163234, "grad_norm": 0.4482896520378407, "learning_rate": 2.305766175411643e-05, "loss": 0.2817, "loss_nan_ranks": 0, "loss_rank_avg": 0.26876458525657654, "step": 4645, "valid_targets_mean": 3782.0, "valid_targets_min": 1088 }, { "epoch": 3.5469107551487413, "grad_norm": 0.46170532954154736, "learning_rate": 2.302006500089988e-05, "loss": 0.3081, "loss_nan_ranks": 0, "loss_rank_avg": 0.3280665874481201, "step": 4650, "valid_targets_mean": 4604.7, "valid_targets_min": 1161 }, { "epoch": 3.550724637681159, "grad_norm": 0.42087692641889823, "learning_rate": 2.2982457323198104e-05, "loss": 0.3004, "loss_nan_ranks": 0, "loss_rank_avg": 0.2573760747909546, "step": 4655, "valid_targets_mean": 4632.5, "valid_targets_min": 1194 }, { "epoch": 3.5545385202135775, "grad_norm": 0.4551534237796107, "learning_rate": 2.2944838857049422e-05, "loss": 0.2865, "loss_nan_ranks": 0, "loss_rank_avg": 0.25980302691459656, "step": 4660, "valid_targets_mean": 4064.3, "valid_targets_min": 338 }, { "epoch": 3.5583524027459954, "grad_norm": 0.39263337796345454, "learning_rate": 2.2907209738531152e-05, "loss": 0.2907, "loss_nan_ranks": 0, "loss_rank_avg": 0.3148830235004425, "step": 4665, "valid_targets_mean": 6088.7, "valid_targets_min": 1367 }, { "epoch": 3.5621662852784133, "grad_norm": 0.5187964098178377, "learning_rate": 2.2869570103759154e-05, "loss": 0.3044, "loss_nan_ranks": 0, "loss_rank_avg": 0.31824734807014465, "step": 4670, "valid_targets_mean": 3209.6, "valid_targets_min": 1198 }, { "epoch": 3.5659801678108316, "grad_norm": 0.39318418222353296, "learning_rate": 2.283192008888734e-05, "loss": 0.2763, "loss_nan_ranks": 0, "loss_rank_avg": 0.2371831089258194, "step": 4675, "valid_targets_mean": 4917.4, "valid_targets_min": 1111 }, { "epoch": 3.5697940503432495, "grad_norm": 0.47860026377836923, "learning_rate": 2.279425983010716e-05, "loss": 0.2991, "loss_nan_ranks": 0, "loss_rank_avg": 0.3355828821659088, "step": 4680, "valid_targets_mean": 4329.6, "valid_targets_min": 288 }, { "epoch": 3.5736079328756674, "grad_norm": 0.47204126314129596, "learning_rate": 2.2756589463647107e-05, "loss": 0.2799, "loss_nan_ranks": 0, "loss_rank_avg": 0.3069976270198822, "step": 4685, "valid_targets_mean": 3892.1, "valid_targets_min": 1071 }, { "epoch": 3.5774218154080852, "grad_norm": 0.44038100652623313, "learning_rate": 2.2718909125772255e-05, "loss": 0.2942, "loss_nan_ranks": 0, "loss_rank_avg": 0.2812940776348114, "step": 4690, "valid_targets_mean": 4560.3, "valid_targets_min": 1493 }, { "epoch": 3.5812356979405036, "grad_norm": 0.47684570252296454, "learning_rate": 2.2681218952783745e-05, "loss": 0.3005, "loss_nan_ranks": 0, "loss_rank_avg": 0.3217027485370636, "step": 4695, "valid_targets_mean": 3902.1, "valid_targets_min": 1093 }, { "epoch": 3.5850495804729214, "grad_norm": 0.4562186549419339, "learning_rate": 2.2643519081018284e-05, "loss": 0.3093, "loss_nan_ranks": 0, "loss_rank_avg": 0.30921462178230286, "step": 4700, "valid_targets_mean": 4113.0, "valid_targets_min": 1199 }, { "epoch": 3.5888634630053393, "grad_norm": 0.44993134293451825, "learning_rate": 2.2605809646847675e-05, "loss": 0.2709, "loss_nan_ranks": 0, "loss_rank_avg": 0.2672576606273651, "step": 4705, "valid_targets_mean": 4444.2, "valid_targets_min": 312 }, { "epoch": 3.5926773455377576, "grad_norm": 0.5005018602677499, "learning_rate": 2.2568090786678303e-05, "loss": 0.2724, "loss_nan_ranks": 0, "loss_rank_avg": 0.2609889507293701, "step": 4710, "valid_targets_mean": 3446.8, "valid_targets_min": 957 }, { "epoch": 3.5964912280701755, "grad_norm": 0.4415676866527957, "learning_rate": 2.2530362636950646e-05, "loss": 0.2835, "loss_nan_ranks": 0, "loss_rank_avg": 0.27837008237838745, "step": 4715, "valid_targets_mean": 3975.3, "valid_targets_min": 368 }, { "epoch": 3.6003051106025934, "grad_norm": 0.48156304179055964, "learning_rate": 2.24926253341388e-05, "loss": 0.3008, "loss_nan_ranks": 0, "loss_rank_avg": 0.327156126499176, "step": 4720, "valid_targets_mean": 4176.2, "valid_targets_min": 366 }, { "epoch": 3.6041189931350113, "grad_norm": 0.4360672584760495, "learning_rate": 2.245487901474996e-05, "loss": 0.2738, "loss_nan_ranks": 0, "loss_rank_avg": 0.2536308467388153, "step": 4725, "valid_targets_mean": 4185.0, "valid_targets_min": 1214 }, { "epoch": 3.6079328756674296, "grad_norm": 0.40767628665247807, "learning_rate": 2.2417123815323936e-05, "loss": 0.271, "loss_nan_ranks": 0, "loss_rank_avg": 0.2984670102596283, "step": 4730, "valid_targets_mean": 5542.7, "valid_targets_min": 1423 }, { "epoch": 3.6117467581998475, "grad_norm": 0.45360199839129894, "learning_rate": 2.2379359872432662e-05, "loss": 0.2938, "loss_nan_ranks": 0, "loss_rank_avg": 0.2925918996334076, "step": 4735, "valid_targets_mean": 3912.8, "valid_targets_min": 995 }, { "epoch": 3.6155606407322654, "grad_norm": 0.4946715128075741, "learning_rate": 2.23415873226797e-05, "loss": 0.2836, "loss_nan_ranks": 0, "loss_rank_avg": 0.30403146147727966, "step": 4740, "valid_targets_mean": 3816.2, "valid_targets_min": 358 }, { "epoch": 3.6193745232646837, "grad_norm": 0.47406262208079786, "learning_rate": 2.2303806302699744e-05, "loss": 0.2746, "loss_nan_ranks": 0, "loss_rank_avg": 0.2904681861400604, "step": 4745, "valid_targets_mean": 4019.7, "valid_targets_min": 249 }, { "epoch": 3.6231884057971016, "grad_norm": 1.6624652115903416, "learning_rate": 2.2266016949158128e-05, "loss": 0.3583, "loss_nan_ranks": 0, "loss_rank_avg": 0.5583869218826294, "step": 4750, "valid_targets_mean": 827.7, "valid_targets_min": 481 }, { "epoch": 3.6270022883295194, "grad_norm": 0.504124880570195, "learning_rate": 2.2228219398750332e-05, "loss": 0.442, "loss_nan_ranks": 0, "loss_rank_avg": 0.2691499590873718, "step": 4755, "valid_targets_mean": 4826.3, "valid_targets_min": 1355 }, { "epoch": 3.6308161708619373, "grad_norm": 0.4936141065951774, "learning_rate": 2.2190413788201494e-05, "loss": 0.2814, "loss_nan_ranks": 0, "loss_rank_avg": 0.2698126435279846, "step": 4760, "valid_targets_mean": 3571.9, "valid_targets_min": 1043 }, { "epoch": 3.634630053394355, "grad_norm": 0.4304446140565006, "learning_rate": 2.2152600254265893e-05, "loss": 0.2919, "loss_nan_ranks": 0, "loss_rank_avg": 0.2709462642669678, "step": 4765, "valid_targets_mean": 4900.3, "valid_targets_min": 1342 }, { "epoch": 3.6384439359267735, "grad_norm": 0.4034314385983401, "learning_rate": 2.2114778933726478e-05, "loss": 0.2974, "loss_nan_ranks": 0, "loss_rank_avg": 0.3143347203731537, "step": 4770, "valid_targets_mean": 5496.1, "valid_targets_min": 803 }, { "epoch": 3.6422578184591914, "grad_norm": 0.43621856626978023, "learning_rate": 2.2076949963394365e-05, "loss": 0.2627, "loss_nan_ranks": 0, "loss_rank_avg": 0.2733272612094879, "step": 4775, "valid_targets_mean": 4515.8, "valid_targets_min": 1413 }, { "epoch": 3.6460717009916097, "grad_norm": 0.8202631465156636, "learning_rate": 2.2039113480108333e-05, "loss": 0.2916, "loss_nan_ranks": 0, "loss_rank_avg": 0.3054891526699066, "step": 4780, "valid_targets_mean": 5119.5, "valid_targets_min": 1388 }, { "epoch": 3.6498855835240276, "grad_norm": 0.4873756601176684, "learning_rate": 2.2001269620734354e-05, "loss": 0.3033, "loss_nan_ranks": 0, "loss_rank_avg": 0.3282296359539032, "step": 4785, "valid_targets_mean": 3815.8, "valid_targets_min": 1194 }, { "epoch": 3.6536994660564455, "grad_norm": 0.4301975751639404, "learning_rate": 2.1963418522165064e-05, "loss": 0.2883, "loss_nan_ranks": 0, "loss_rank_avg": 0.25355055928230286, "step": 4790, "valid_targets_mean": 4236.9, "valid_targets_min": 757 }, { "epoch": 3.6575133485888633, "grad_norm": 0.502083577647879, "learning_rate": 2.1925560321319292e-05, "loss": 0.2948, "loss_nan_ranks": 0, "loss_rank_avg": 0.2781239449977875, "step": 4795, "valid_targets_mean": 3783.9, "valid_targets_min": 366 }, { "epoch": 3.6613272311212812, "grad_norm": 0.4455469454708054, "learning_rate": 2.1887695155141565e-05, "loss": 0.2738, "loss_nan_ranks": 0, "loss_rank_avg": 0.2768062651157379, "step": 4800, "valid_targets_mean": 4387.9, "valid_targets_min": 437 }, { "epoch": 3.6651411136536995, "grad_norm": 0.43246638097368684, "learning_rate": 2.1849823160601602e-05, "loss": 0.2796, "loss_nan_ranks": 0, "loss_rank_avg": 0.30090662837028503, "step": 4805, "valid_targets_mean": 4708.5, "valid_targets_min": 996 }, { "epoch": 3.6689549961861174, "grad_norm": 0.48013536906608734, "learning_rate": 2.1811944474693812e-05, "loss": 0.2877, "loss_nan_ranks": 0, "loss_rank_avg": 0.2882266342639923, "step": 4810, "valid_targets_mean": 3664.5, "valid_targets_min": 1377 }, { "epoch": 3.6727688787185357, "grad_norm": 0.4215066962223358, "learning_rate": 2.177405923443682e-05, "loss": 0.2825, "loss_nan_ranks": 0, "loss_rank_avg": 0.31770798563957214, "step": 4815, "valid_targets_mean": 5157.8, "valid_targets_min": 1195 }, { "epoch": 3.6765827612509536, "grad_norm": 0.4822129870662444, "learning_rate": 2.173616757687296e-05, "loss": 0.281, "loss_nan_ranks": 0, "loss_rank_avg": 0.2803454101085663, "step": 4820, "valid_targets_mean": 4487.2, "valid_targets_min": 1171 }, { "epoch": 3.6803966437833715, "grad_norm": 0.4518314070729709, "learning_rate": 2.1698269639067772e-05, "loss": 0.2627, "loss_nan_ranks": 0, "loss_rank_avg": 0.30212217569351196, "step": 4825, "valid_targets_mean": 4547.0, "valid_targets_min": 807 }, { "epoch": 3.6842105263157894, "grad_norm": 0.4381394067728647, "learning_rate": 2.1660365558109522e-05, "loss": 0.2878, "loss_nan_ranks": 0, "loss_rank_avg": 0.2651013433933258, "step": 4830, "valid_targets_mean": 4092.2, "valid_targets_min": 460 }, { "epoch": 3.6880244088482073, "grad_norm": 0.4611168188871333, "learning_rate": 2.162245547110869e-05, "loss": 0.2662, "loss_nan_ranks": 0, "loss_rank_avg": 0.28754758834838867, "step": 4835, "valid_targets_mean": 4108.5, "valid_targets_min": 1266 }, { "epoch": 3.6918382913806256, "grad_norm": 0.4216410388557109, "learning_rate": 2.1584539515197476e-05, "loss": 0.2778, "loss_nan_ranks": 0, "loss_rank_avg": 0.2530418336391449, "step": 4840, "valid_targets_mean": 4882.8, "valid_targets_min": 1495 }, { "epoch": 3.6956521739130435, "grad_norm": 0.5101669538365097, "learning_rate": 2.1546617827529337e-05, "loss": 0.2771, "loss_nan_ranks": 0, "loss_rank_avg": 0.2959820330142975, "step": 4845, "valid_targets_mean": 3875.6, "valid_targets_min": 567 }, { "epoch": 3.6994660564454613, "grad_norm": 0.4422043707591292, "learning_rate": 2.1508690545278438e-05, "loss": 0.2849, "loss_nan_ranks": 0, "loss_rank_avg": 0.25045129656791687, "step": 4850, "valid_targets_mean": 4307.8, "valid_targets_min": 513 }, { "epoch": 3.7032799389778797, "grad_norm": 0.48074229488333253, "learning_rate": 2.1470757805639186e-05, "loss": 0.2832, "loss_nan_ranks": 0, "loss_rank_avg": 0.2914007902145386, "step": 4855, "valid_targets_mean": 3635.8, "valid_targets_min": 1182 }, { "epoch": 3.7070938215102975, "grad_norm": 0.4432598278262152, "learning_rate": 2.1432819745825732e-05, "loss": 0.2885, "loss_nan_ranks": 0, "loss_rank_avg": 0.247156023979187, "step": 4860, "valid_targets_mean": 4326.8, "valid_targets_min": 1113 }, { "epoch": 3.7109077040427154, "grad_norm": 0.43543523339515255, "learning_rate": 2.139487650307147e-05, "loss": 0.2973, "loss_nan_ranks": 0, "loss_rank_avg": 0.2991539537906647, "step": 4865, "valid_targets_mean": 4774.8, "valid_targets_min": 1273 }, { "epoch": 3.7147215865751333, "grad_norm": 0.45320374074665914, "learning_rate": 2.135692821462855e-05, "loss": 0.2692, "loss_nan_ranks": 0, "loss_rank_avg": 0.2640787661075592, "step": 4870, "valid_targets_mean": 3983.8, "valid_targets_min": 1240 }, { "epoch": 3.7185354691075516, "grad_norm": 0.4730272978195686, "learning_rate": 2.131897501776736e-05, "loss": 0.2907, "loss_nan_ranks": 0, "loss_rank_avg": 0.2792348563671112, "step": 4875, "valid_targets_mean": 3923.6, "valid_targets_min": 1350 }, { "epoch": 3.7223493516399695, "grad_norm": 0.46367011168212957, "learning_rate": 2.128101704977605e-05, "loss": 0.2646, "loss_nan_ranks": 0, "loss_rank_avg": 0.26287421584129333, "step": 4880, "valid_targets_mean": 4225.2, "valid_targets_min": 1065 }, { "epoch": 3.7261632341723874, "grad_norm": 0.45822132449926056, "learning_rate": 2.124305444796003e-05, "loss": 0.285, "loss_nan_ranks": 0, "loss_rank_avg": 0.26010265946388245, "step": 4885, "valid_targets_mean": 4470.3, "valid_targets_min": 1450 }, { "epoch": 3.7299771167048057, "grad_norm": 0.4999416286074579, "learning_rate": 2.1205087349641474e-05, "loss": 0.2835, "loss_nan_ranks": 0, "loss_rank_avg": 0.28680503368377686, "step": 4890, "valid_targets_mean": 4674.3, "valid_targets_min": 1425 }, { "epoch": 3.7337909992372236, "grad_norm": 1.1021522685950285, "learning_rate": 2.116711589215882e-05, "loss": 0.2897, "loss_nan_ranks": 0, "loss_rank_avg": 0.29555997252464294, "step": 4895, "valid_targets_mean": 4395.1, "valid_targets_min": 1035 }, { "epoch": 3.7376048817696415, "grad_norm": 0.4704972599874909, "learning_rate": 2.1129140212866268e-05, "loss": 0.2792, "loss_nan_ranks": 0, "loss_rank_avg": 0.2726249694824219, "step": 4900, "valid_targets_mean": 4035.6, "valid_targets_min": 390 }, { "epoch": 3.7414187643020593, "grad_norm": 0.4895949033004227, "learning_rate": 2.1091160449133294e-05, "loss": 0.2932, "loss_nan_ranks": 0, "loss_rank_avg": 0.2875785231590271, "step": 4905, "valid_targets_mean": 3985.5, "valid_targets_min": 1161 }, { "epoch": 3.7452326468344777, "grad_norm": 0.4732839023835256, "learning_rate": 2.105317673834415e-05, "loss": 0.3005, "loss_nan_ranks": 0, "loss_rank_avg": 0.3635139465332031, "step": 4910, "valid_targets_mean": 4737.2, "valid_targets_min": 759 }, { "epoch": 3.7490465293668955, "grad_norm": 0.7329967738195239, "learning_rate": 2.1015189217897364e-05, "loss": 0.2869, "loss_nan_ranks": 0, "loss_rank_avg": 0.3502159118652344, "step": 4915, "valid_targets_mean": 2071.2, "valid_targets_min": 576 }, { "epoch": 3.7528604118993134, "grad_norm": 0.5373102096273961, "learning_rate": 2.097719802520524e-05, "loss": 0.4261, "loss_nan_ranks": 0, "loss_rank_avg": 0.26391589641571045, "step": 4920, "valid_targets_mean": 3376.4, "valid_targets_min": 1296 }, { "epoch": 3.7566742944317317, "grad_norm": 0.5099941176506099, "learning_rate": 2.0939203297693384e-05, "loss": 0.2856, "loss_nan_ranks": 0, "loss_rank_avg": 0.25710639357566833, "step": 4925, "valid_targets_mean": 3332.5, "valid_targets_min": 1082 }, { "epoch": 3.7604881769641496, "grad_norm": 0.46162219390203724, "learning_rate": 2.090120517280017e-05, "loss": 0.2816, "loss_nan_ranks": 0, "loss_rank_avg": 0.2861987054347992, "step": 4930, "valid_targets_mean": 4440.6, "valid_targets_min": 440 }, { "epoch": 3.7643020594965675, "grad_norm": 0.4620294227163194, "learning_rate": 2.086320378797626e-05, "loss": 0.2719, "loss_nan_ranks": 0, "loss_rank_avg": 0.29089245200157166, "step": 4935, "valid_targets_mean": 4926.2, "valid_targets_min": 1360 }, { "epoch": 3.7681159420289854, "grad_norm": 0.46269226142521863, "learning_rate": 2.0825199280684122e-05, "loss": 0.3014, "loss_nan_ranks": 0, "loss_rank_avg": 0.26844826340675354, "step": 4940, "valid_targets_mean": 4640.1, "valid_targets_min": 1372 }, { "epoch": 3.7719298245614032, "grad_norm": 0.44918665856402457, "learning_rate": 2.0787191788397503e-05, "loss": 0.3023, "loss_nan_ranks": 0, "loss_rank_avg": 0.2886035144329071, "step": 4945, "valid_targets_mean": 4349.8, "valid_targets_min": 1171 }, { "epoch": 3.7757437070938216, "grad_norm": 0.4611965587323673, "learning_rate": 2.0749181448600967e-05, "loss": 0.2654, "loss_nan_ranks": 0, "loss_rank_avg": 0.3016029894351959, "step": 4950, "valid_targets_mean": 5051.3, "valid_targets_min": 862 }, { "epoch": 3.7795575896262394, "grad_norm": 0.4769360159800852, "learning_rate": 2.0711168398789364e-05, "loss": 0.2796, "loss_nan_ranks": 0, "loss_rank_avg": 0.291471391916275, "step": 4955, "valid_targets_mean": 3710.4, "valid_targets_min": 1152 }, { "epoch": 3.7833714721586578, "grad_norm": 0.41686170733711136, "learning_rate": 2.0673152776467343e-05, "loss": 0.2774, "loss_nan_ranks": 0, "loss_rank_avg": 0.24968425929546356, "step": 4960, "valid_targets_mean": 4307.1, "valid_targets_min": 845 }, { "epoch": 3.7871853546910756, "grad_norm": 0.388968051713768, "learning_rate": 2.0635134719148873e-05, "loss": 0.2766, "loss_nan_ranks": 0, "loss_rank_avg": 0.2582361102104187, "step": 4965, "valid_targets_mean": 5233.7, "valid_targets_min": 1220 }, { "epoch": 3.7909992372234935, "grad_norm": 0.4120063369566906, "learning_rate": 2.0597114364356726e-05, "loss": 0.2632, "loss_nan_ranks": 0, "loss_rank_avg": 0.2593841552734375, "step": 4970, "valid_targets_mean": 4571.8, "valid_targets_min": 1065 }, { "epoch": 3.7948131197559114, "grad_norm": 0.42356900591636804, "learning_rate": 2.0559091849621985e-05, "loss": 0.2888, "loss_nan_ranks": 0, "loss_rank_avg": 0.2937016785144806, "step": 4975, "valid_targets_mean": 5643.4, "valid_targets_min": 1265 }, { "epoch": 3.7986270022883293, "grad_norm": 0.404415109624401, "learning_rate": 2.0521067312483535e-05, "loss": 0.2828, "loss_nan_ranks": 0, "loss_rank_avg": 0.3042158782482147, "step": 4980, "valid_targets_mean": 5218.6, "valid_targets_min": 559 }, { "epoch": 3.8024408848207476, "grad_norm": 0.4155431744232426, "learning_rate": 2.048304089048759e-05, "loss": 0.2617, "loss_nan_ranks": 0, "loss_rank_avg": 0.21575789153575897, "step": 4985, "valid_targets_mean": 4188.2, "valid_targets_min": 1059 }, { "epoch": 3.8062547673531655, "grad_norm": 0.46950574889200086, "learning_rate": 2.044501272118718e-05, "loss": 0.2906, "loss_nan_ranks": 0, "loss_rank_avg": 0.3153056502342224, "step": 4990, "valid_targets_mean": 3989.5, "valid_targets_min": 581 }, { "epoch": 3.8100686498855834, "grad_norm": 0.43838438560538834, "learning_rate": 2.0406982942141646e-05, "loss": 0.2937, "loss_nan_ranks": 0, "loss_rank_avg": 0.291579931974411, "step": 4995, "valid_targets_mean": 4621.1, "valid_targets_min": 1325 }, { "epoch": 3.8138825324180017, "grad_norm": 0.44145322237824836, "learning_rate": 2.0368951690916166e-05, "loss": 0.2698, "loss_nan_ranks": 0, "loss_rank_avg": 0.2182352989912033, "step": 5000, "valid_targets_mean": 4515.5, "valid_targets_min": 1668 }, { "epoch": 3.8176964149504196, "grad_norm": 0.4504621882289278, "learning_rate": 2.0330919105081238e-05, "loss": 0.2846, "loss_nan_ranks": 0, "loss_rank_avg": 0.3026907742023468, "step": 5005, "valid_targets_mean": 4372.3, "valid_targets_min": 415 }, { "epoch": 3.8215102974828374, "grad_norm": 0.4929531534573359, "learning_rate": 2.0292885322212183e-05, "loss": 0.2597, "loss_nan_ranks": 0, "loss_rank_avg": 0.27263951301574707, "step": 5010, "valid_targets_mean": 4319.9, "valid_targets_min": 1306 }, { "epoch": 3.8253241800152553, "grad_norm": 0.41575043508311943, "learning_rate": 2.0254850479888652e-05, "loss": 0.2824, "loss_nan_ranks": 0, "loss_rank_avg": 0.2930053770542145, "step": 5015, "valid_targets_mean": 5146.0, "valid_targets_min": 577 }, { "epoch": 3.8291380625476736, "grad_norm": 0.4801883312541542, "learning_rate": 2.021681471569414e-05, "loss": 0.31, "loss_nan_ranks": 0, "loss_rank_avg": 0.3446965515613556, "step": 5020, "valid_targets_mean": 4140.5, "valid_targets_min": 1019 }, { "epoch": 3.8329519450800915, "grad_norm": 0.41216892152068585, "learning_rate": 2.017877816721546e-05, "loss": 0.2856, "loss_nan_ranks": 0, "loss_rank_avg": 0.28163060545921326, "step": 5025, "valid_targets_mean": 4676.8, "valid_targets_min": 400 }, { "epoch": 3.8367658276125094, "grad_norm": 0.4279433137988471, "learning_rate": 2.0140740972042276e-05, "loss": 0.2696, "loss_nan_ranks": 0, "loss_rank_avg": 0.2602086365222931, "step": 5030, "valid_targets_mean": 4468.6, "valid_targets_min": 1380 }, { "epoch": 3.8405797101449277, "grad_norm": 0.4665598041153684, "learning_rate": 2.0102703267766584e-05, "loss": 0.286, "loss_nan_ranks": 0, "loss_rank_avg": 0.312650591135025, "step": 5035, "valid_targets_mean": 4409.3, "valid_targets_min": 841 }, { "epoch": 3.8443935926773456, "grad_norm": 0.44786662715514164, "learning_rate": 2.006466519198222e-05, "loss": 0.2844, "loss_nan_ranks": 0, "loss_rank_avg": 0.23634012043476105, "step": 5040, "valid_targets_mean": 5063.6, "valid_targets_min": 751 }, { "epoch": 3.8482074752097635, "grad_norm": 0.4974521996462959, "learning_rate": 2.0026626882284365e-05, "loss": 0.2762, "loss_nan_ranks": 0, "loss_rank_avg": 0.2868984043598175, "step": 5045, "valid_targets_mean": 4401.0, "valid_targets_min": 1068 }, { "epoch": 3.8520213577421814, "grad_norm": 0.4303348110695608, "learning_rate": 1.998858847626906e-05, "loss": 0.2891, "loss_nan_ranks": 0, "loss_rank_avg": 0.2536643147468567, "step": 5050, "valid_targets_mean": 4594.3, "valid_targets_min": 1286 }, { "epoch": 3.8558352402745997, "grad_norm": 0.4798918018206437, "learning_rate": 1.995055011153267e-05, "loss": 0.2961, "loss_nan_ranks": 0, "loss_rank_avg": 0.28693172335624695, "step": 5055, "valid_targets_mean": 3978.6, "valid_targets_min": 1294 }, { "epoch": 3.8596491228070176, "grad_norm": 0.5833198149859566, "learning_rate": 1.9912511925671428e-05, "loss": 0.2711, "loss_nan_ranks": 0, "loss_rank_avg": 0.2774660289287567, "step": 5060, "valid_targets_mean": 4207.2, "valid_targets_min": 1323 }, { "epoch": 3.8634630053394354, "grad_norm": 0.4438224992611823, "learning_rate": 1.987447405628092e-05, "loss": 0.3078, "loss_nan_ranks": 0, "loss_rank_avg": 0.2594674825668335, "step": 5065, "valid_targets_mean": 5099.1, "valid_targets_min": 1504 }, { "epoch": 3.8672768878718538, "grad_norm": 0.44237795466310065, "learning_rate": 1.9836436640955578e-05, "loss": 0.2686, "loss_nan_ranks": 0, "loss_rank_avg": 0.26847514510154724, "step": 5070, "valid_targets_mean": 4456.6, "valid_targets_min": 1314 }, { "epoch": 3.8710907704042716, "grad_norm": 0.43779853479233827, "learning_rate": 1.9798399817288197e-05, "loss": 0.3015, "loss_nan_ranks": 0, "loss_rank_avg": 0.27755558490753174, "step": 5075, "valid_targets_mean": 4562.6, "valid_targets_min": 927 }, { "epoch": 3.8749046529366895, "grad_norm": 1.14893712269878, "learning_rate": 1.976036372286943e-05, "loss": 0.3154, "loss_nan_ranks": 0, "loss_rank_avg": 0.41553497314453125, "step": 5080, "valid_targets_mean": 1294.0, "valid_targets_min": 629 }, { "epoch": 3.8787185354691074, "grad_norm": 0.505426898880738, "learning_rate": 1.972232849528729e-05, "loss": 0.4263, "loss_nan_ranks": 0, "loss_rank_avg": 0.2346818894147873, "step": 5085, "valid_targets_mean": 4294.2, "valid_targets_min": 1401 }, { "epoch": 3.8825324180015257, "grad_norm": 0.44319385303652004, "learning_rate": 1.9684294272126662e-05, "loss": 0.2817, "loss_nan_ranks": 0, "loss_rank_avg": 0.27154862880706787, "step": 5090, "valid_targets_mean": 4119.6, "valid_targets_min": 1432 }, { "epoch": 3.8863463005339436, "grad_norm": 0.5459021377392329, "learning_rate": 1.9646261190968787e-05, "loss": 0.2874, "loss_nan_ranks": 0, "loss_rank_avg": 0.32108262181282043, "step": 5095, "valid_targets_mean": 4003.6, "valid_targets_min": 957 }, { "epoch": 3.8901601830663615, "grad_norm": 0.42387804406963075, "learning_rate": 1.9608229389390786e-05, "loss": 0.2778, "loss_nan_ranks": 0, "loss_rank_avg": 0.3090623915195465, "step": 5100, "valid_targets_mean": 4897.4, "valid_targets_min": 2186 }, { "epoch": 3.89397406559878, "grad_norm": 0.49421705023909407, "learning_rate": 1.9570199004965146e-05, "loss": 0.2903, "loss_nan_ranks": 0, "loss_rank_avg": 0.32566288113594055, "step": 5105, "valid_targets_mean": 4511.8, "valid_targets_min": 1021 }, { "epoch": 3.8977879481311977, "grad_norm": 0.4668014379335834, "learning_rate": 1.9532170175259225e-05, "loss": 0.2797, "loss_nan_ranks": 0, "loss_rank_avg": 0.2344411164522171, "step": 5110, "valid_targets_mean": 4368.4, "valid_targets_min": 480 }, { "epoch": 3.9016018306636155, "grad_norm": 0.43277753403218727, "learning_rate": 1.9494143037834778e-05, "loss": 0.2885, "loss_nan_ranks": 0, "loss_rank_avg": 0.30218103528022766, "step": 5115, "valid_targets_mean": 4824.0, "valid_targets_min": 447 }, { "epoch": 3.9054157131960334, "grad_norm": 0.4156421333456064, "learning_rate": 1.945611773024739e-05, "loss": 0.2942, "loss_nan_ranks": 0, "loss_rank_avg": 0.27466729283332825, "step": 5120, "valid_targets_mean": 4651.5, "valid_targets_min": 1039 }, { "epoch": 3.9092295957284513, "grad_norm": 0.47060667981939347, "learning_rate": 1.941809439004607e-05, "loss": 0.2829, "loss_nan_ranks": 0, "loss_rank_avg": 0.269515722990036, "step": 5125, "valid_targets_mean": 3880.5, "valid_targets_min": 1031 }, { "epoch": 3.9130434782608696, "grad_norm": 0.43145818157727733, "learning_rate": 1.9380073154772707e-05, "loss": 0.2929, "loss_nan_ranks": 0, "loss_rank_avg": 0.2653549909591675, "step": 5130, "valid_targets_mean": 4223.7, "valid_targets_min": 1216 }, { "epoch": 3.9168573607932875, "grad_norm": 0.4877286412806023, "learning_rate": 1.934205416196156e-05, "loss": 0.2851, "loss_nan_ranks": 0, "loss_rank_avg": 0.2932646572589874, "step": 5135, "valid_targets_mean": 3868.4, "valid_targets_min": 898 }, { "epoch": 3.920671243325706, "grad_norm": 0.41908844260246153, "learning_rate": 1.9304037549138783e-05, "loss": 0.2845, "loss_nan_ranks": 0, "loss_rank_avg": 0.29270559549331665, "step": 5140, "valid_targets_mean": 4753.8, "valid_targets_min": 786 }, { "epoch": 3.9244851258581237, "grad_norm": 0.4784502269230572, "learning_rate": 1.926602345382192e-05, "loss": 0.2874, "loss_nan_ranks": 0, "loss_rank_avg": 0.3063240647315979, "step": 5145, "valid_targets_mean": 4156.7, "valid_targets_min": 830 }, { "epoch": 3.9282990083905416, "grad_norm": 0.4343307443707409, "learning_rate": 1.9228012013519414e-05, "loss": 0.2806, "loss_nan_ranks": 0, "loss_rank_avg": 0.2735506296157837, "step": 5150, "valid_targets_mean": 4672.8, "valid_targets_min": 589 }, { "epoch": 3.9321128909229595, "grad_norm": 0.4300181559503131, "learning_rate": 1.9190003365730096e-05, "loss": 0.298, "loss_nan_ranks": 0, "loss_rank_avg": 0.2812347710132599, "step": 5155, "valid_targets_mean": 5184.3, "valid_targets_min": 257 }, { "epoch": 3.9359267734553773, "grad_norm": 0.4368057207707122, "learning_rate": 1.9151997647942702e-05, "loss": 0.2804, "loss_nan_ranks": 0, "loss_rank_avg": 0.31642988324165344, "step": 5160, "valid_targets_mean": 5125.9, "valid_targets_min": 1586 }, { "epoch": 3.9397406559877957, "grad_norm": 0.5006746338061084, "learning_rate": 1.9113994997635362e-05, "loss": 0.2932, "loss_nan_ranks": 0, "loss_rank_avg": 0.3068694472312927, "step": 5165, "valid_targets_mean": 3927.8, "valid_targets_min": 1098 }, { "epoch": 3.9435545385202135, "grad_norm": 0.479151537271904, "learning_rate": 1.9075995552275112e-05, "loss": 0.2893, "loss_nan_ranks": 0, "loss_rank_avg": 0.3017423450946808, "step": 5170, "valid_targets_mean": 4141.9, "valid_targets_min": 949 }, { "epoch": 3.9473684210526314, "grad_norm": 0.46514469000401915, "learning_rate": 1.9037999449317406e-05, "loss": 0.2853, "loss_nan_ranks": 0, "loss_rank_avg": 0.28211966156959534, "step": 5175, "valid_targets_mean": 4282.8, "valid_targets_min": 787 }, { "epoch": 3.9511823035850497, "grad_norm": 0.4460611254139414, "learning_rate": 1.9000006826205594e-05, "loss": 0.2679, "loss_nan_ranks": 0, "loss_rank_avg": 0.28090232610702515, "step": 5180, "valid_targets_mean": 4177.1, "valid_targets_min": 1063 }, { "epoch": 3.9549961861174676, "grad_norm": 0.4391877582917011, "learning_rate": 1.8962017820370443e-05, "loss": 0.274, "loss_nan_ranks": 0, "loss_rank_avg": 0.282697468996048, "step": 5185, "valid_targets_mean": 4237.3, "valid_targets_min": 903 }, { "epoch": 3.9588100686498855, "grad_norm": 0.4187783195267498, "learning_rate": 1.892403256922964e-05, "loss": 0.2777, "loss_nan_ranks": 0, "loss_rank_avg": 0.23168055713176727, "step": 5190, "valid_targets_mean": 4525.2, "valid_targets_min": 528 }, { "epoch": 3.9626239511823034, "grad_norm": 0.4528277753081471, "learning_rate": 1.8886051210187277e-05, "loss": 0.2764, "loss_nan_ranks": 0, "loss_rank_avg": 0.2916136085987091, "step": 5195, "valid_targets_mean": 4180.0, "valid_targets_min": 906 }, { "epoch": 3.9664378337147217, "grad_norm": 0.5162672915536458, "learning_rate": 1.884807388063338e-05, "loss": 0.2801, "loss_nan_ranks": 0, "loss_rank_avg": 0.28006768226623535, "step": 5200, "valid_targets_mean": 3554.5, "valid_targets_min": 837 }, { "epoch": 3.9702517162471396, "grad_norm": 0.421583313476623, "learning_rate": 1.8810100717943393e-05, "loss": 0.3013, "loss_nan_ranks": 0, "loss_rank_avg": 0.28844282031059265, "step": 5205, "valid_targets_mean": 4721.1, "valid_targets_min": 957 }, { "epoch": 3.9740655987795575, "grad_norm": 0.419280792206997, "learning_rate": 1.877213185947769e-05, "loss": 0.2724, "loss_nan_ranks": 0, "loss_rank_avg": 0.26939424872398376, "step": 5210, "valid_targets_mean": 4626.4, "valid_targets_min": 1120 }, { "epoch": 3.9778794813119758, "grad_norm": 0.4629473209847183, "learning_rate": 1.8734167442581072e-05, "loss": 0.2828, "loss_nan_ranks": 0, "loss_rank_avg": 0.24810916185379028, "step": 5215, "valid_targets_mean": 4065.1, "valid_targets_min": 871 }, { "epoch": 3.9816933638443937, "grad_norm": 0.5118809234713598, "learning_rate": 1.869620760458228e-05, "loss": 0.3034, "loss_nan_ranks": 0, "loss_rank_avg": 0.3038460314273834, "step": 5220, "valid_targets_mean": 3327.3, "valid_targets_min": 1278 }, { "epoch": 3.9855072463768115, "grad_norm": 0.5035213322974476, "learning_rate": 1.8658252482793485e-05, "loss": 0.2798, "loss_nan_ranks": 0, "loss_rank_avg": 0.292995423078537, "step": 5225, "valid_targets_mean": 4340.3, "valid_targets_min": 1044 }, { "epoch": 3.9893211289092294, "grad_norm": 0.42529772495906987, "learning_rate": 1.8620302214509804e-05, "loss": 0.2759, "loss_nan_ranks": 0, "loss_rank_avg": 0.23590444028377533, "step": 5230, "valid_targets_mean": 3947.8, "valid_targets_min": 258 }, { "epoch": 3.9931350114416477, "grad_norm": 0.4357103197502, "learning_rate": 1.8582356937008785e-05, "loss": 0.2808, "loss_nan_ranks": 0, "loss_rank_avg": 0.24585048854351044, "step": 5235, "valid_targets_mean": 5009.6, "valid_targets_min": 708 }, { "epoch": 3.9969488939740656, "grad_norm": 0.3816166815814907, "learning_rate": 1.8544416787549942e-05, "loss": 0.305, "loss_nan_ranks": 0, "loss_rank_avg": 0.2795417308807373, "step": 5240, "valid_targets_mean": 5411.3, "valid_targets_min": 751 }, { "epoch": 4.000762776506484, "grad_norm": 0.5416479526027371, "learning_rate": 1.850648190337422e-05, "loss": 0.487, "loss_nan_ranks": 0, "loss_rank_avg": 0.27904537320137024, "step": 5245, "valid_targets_mean": 3583.6, "valid_targets_min": 1165 }, { "epoch": 4.004576659038902, "grad_norm": 0.5087452060708784, "learning_rate": 1.8468552421703535e-05, "loss": 0.2798, "loss_nan_ranks": 0, "loss_rank_avg": 0.31443047523498535, "step": 5250, "valid_targets_mean": 3674.5, "valid_targets_min": 1189 }, { "epoch": 4.00839054157132, "grad_norm": 0.47920887196013023, "learning_rate": 1.8430628479740243e-05, "loss": 0.2865, "loss_nan_ranks": 0, "loss_rank_avg": 0.2631620168685913, "step": 5255, "valid_targets_mean": 4028.5, "valid_targets_min": 732 }, { "epoch": 4.012204424103738, "grad_norm": 0.43552125958300064, "learning_rate": 1.839271021466668e-05, "loss": 0.2699, "loss_nan_ranks": 0, "loss_rank_avg": 0.28635895252227783, "step": 5260, "valid_targets_mean": 5221.5, "valid_targets_min": 1206 }, { "epoch": 4.016018306636155, "grad_norm": 0.46905637576964415, "learning_rate": 1.8354797763644628e-05, "loss": 0.2866, "loss_nan_ranks": 0, "loss_rank_avg": 0.2725812494754791, "step": 5265, "valid_targets_mean": 4305.4, "valid_targets_min": 1119 }, { "epoch": 4.019832189168573, "grad_norm": 0.43349093244065384, "learning_rate": 1.831689126381486e-05, "loss": 0.2838, "loss_nan_ranks": 0, "loss_rank_avg": 0.30661433935165405, "step": 5270, "valid_targets_mean": 4936.6, "valid_targets_min": 1143 }, { "epoch": 4.023646071700991, "grad_norm": 0.4918320057290233, "learning_rate": 1.8278990852296598e-05, "loss": 0.2795, "loss_nan_ranks": 0, "loss_rank_avg": 0.25690630078315735, "step": 5275, "valid_targets_mean": 3922.7, "valid_targets_min": 403 }, { "epoch": 4.02745995423341, "grad_norm": 0.42458062947621084, "learning_rate": 1.824109666618706e-05, "loss": 0.2913, "loss_nan_ranks": 0, "loss_rank_avg": 0.30049416422843933, "step": 5280, "valid_targets_mean": 4960.4, "valid_targets_min": 1542 }, { "epoch": 4.031273836765828, "grad_norm": 0.39963645779686524, "learning_rate": 1.820320884256093e-05, "loss": 0.2908, "loss_nan_ranks": 0, "loss_rank_avg": 0.23063836991786957, "step": 5285, "valid_targets_mean": 4685.0, "valid_targets_min": 1292 }, { "epoch": 4.035087719298246, "grad_norm": 0.41970732682492695, "learning_rate": 1.8165327518469888e-05, "loss": 0.2541, "loss_nan_ranks": 0, "loss_rank_avg": 0.22459344565868378, "step": 5290, "valid_targets_mean": 4371.2, "valid_targets_min": 794 }, { "epoch": 4.038901601830664, "grad_norm": 0.4908945778200589, "learning_rate": 1.8127452830942097e-05, "loss": 0.2723, "loss_nan_ranks": 0, "loss_rank_avg": 0.2542988359928131, "step": 5295, "valid_targets_mean": 4042.7, "valid_targets_min": 398 }, { "epoch": 4.0427154843630815, "grad_norm": 0.435112076490909, "learning_rate": 1.8089584916981714e-05, "loss": 0.2852, "loss_nan_ranks": 0, "loss_rank_avg": 0.22995798289775848, "step": 5300, "valid_targets_mean": 4469.0, "valid_targets_min": 1104 }, { "epoch": 4.046529366895499, "grad_norm": 0.496497698029133, "learning_rate": 1.8051723913568393e-05, "loss": 0.2835, "loss_nan_ranks": 0, "loss_rank_avg": 0.2845947742462158, "step": 5305, "valid_targets_mean": 3867.3, "valid_targets_min": 428 }, { "epoch": 4.050343249427917, "grad_norm": 0.4521890524780476, "learning_rate": 1.80138699576568e-05, "loss": 0.2689, "loss_nan_ranks": 0, "loss_rank_avg": 0.2707526981830597, "step": 5310, "valid_targets_mean": 4219.8, "valid_targets_min": 932 }, { "epoch": 4.054157131960336, "grad_norm": 0.44957196568861707, "learning_rate": 1.7976023186176102e-05, "loss": 0.2832, "loss_nan_ranks": 0, "loss_rank_avg": 0.266658216714859, "step": 5315, "valid_targets_mean": 4021.2, "valid_targets_min": 671 }, { "epoch": 4.057971014492754, "grad_norm": 0.43451221759899866, "learning_rate": 1.7938183736029473e-05, "loss": 0.2887, "loss_nan_ranks": 0, "loss_rank_avg": 0.2787042558193207, "step": 5320, "valid_targets_mean": 4478.9, "valid_targets_min": 1003 }, { "epoch": 4.061784897025172, "grad_norm": 0.4092319501876168, "learning_rate": 1.7900351744093604e-05, "loss": 0.2771, "loss_nan_ranks": 0, "loss_rank_avg": 0.2590319812297821, "step": 5325, "valid_targets_mean": 4576.3, "valid_targets_min": 941 }, { "epoch": 4.06559877955759, "grad_norm": 0.44767830732575387, "learning_rate": 1.7862527347218213e-05, "loss": 0.2899, "loss_nan_ranks": 0, "loss_rank_avg": 0.27546316385269165, "step": 5330, "valid_targets_mean": 4749.5, "valid_targets_min": 857 }, { "epoch": 4.0694126620900075, "grad_norm": 0.4185953444093869, "learning_rate": 1.7824710682225546e-05, "loss": 0.2887, "loss_nan_ranks": 0, "loss_rank_avg": 0.29678523540496826, "step": 5335, "valid_targets_mean": 5015.9, "valid_targets_min": 1048 }, { "epoch": 4.073226544622425, "grad_norm": 0.5216767400389845, "learning_rate": 1.7786901885909872e-05, "loss": 0.272, "loss_nan_ranks": 0, "loss_rank_avg": 0.2771632969379425, "step": 5340, "valid_targets_mean": 3328.6, "valid_targets_min": 531 }, { "epoch": 4.077040427154843, "grad_norm": 0.462063501870652, "learning_rate": 1.7749101095037004e-05, "loss": 0.2754, "loss_nan_ranks": 0, "loss_rank_avg": 0.24681317806243896, "step": 5345, "valid_targets_mean": 4025.9, "valid_targets_min": 690 }, { "epoch": 4.080854309687262, "grad_norm": 0.45346407117733667, "learning_rate": 1.7711308446343787e-05, "loss": 0.2724, "loss_nan_ranks": 0, "loss_rank_avg": 0.28253352642059326, "step": 5350, "valid_targets_mean": 4707.8, "valid_targets_min": 1112 }, { "epoch": 4.08466819221968, "grad_norm": 0.4785053811062835, "learning_rate": 1.7673524076537628e-05, "loss": 0.291, "loss_nan_ranks": 0, "loss_rank_avg": 0.29810595512390137, "step": 5355, "valid_targets_mean": 4859.3, "valid_targets_min": 1050 }, { "epoch": 4.088482074752098, "grad_norm": 0.4308493569201197, "learning_rate": 1.7635748122295978e-05, "loss": 0.2702, "loss_nan_ranks": 0, "loss_rank_avg": 0.24559128284454346, "step": 5360, "valid_targets_mean": 4339.5, "valid_targets_min": 433 }, { "epoch": 4.092295957284516, "grad_norm": 0.48191302755325544, "learning_rate": 1.7597980720265846e-05, "loss": 0.3026, "loss_nan_ranks": 0, "loss_rank_avg": 0.28685423731803894, "step": 5365, "valid_targets_mean": 4426.0, "valid_targets_min": 963 }, { "epoch": 4.0961098398169336, "grad_norm": 0.4875942242372229, "learning_rate": 1.7560222007063308e-05, "loss": 0.2738, "loss_nan_ranks": 0, "loss_rank_avg": 0.2825605869293213, "step": 5370, "valid_targets_mean": 4379.4, "valid_targets_min": 1093 }, { "epoch": 4.099923722349351, "grad_norm": 0.5047475576226177, "learning_rate": 1.7522472119273004e-05, "loss": 0.2704, "loss_nan_ranks": 0, "loss_rank_avg": 0.2979480028152466, "step": 5375, "valid_targets_mean": 4211.3, "valid_targets_min": 994 }, { "epoch": 4.103737604881769, "grad_norm": 0.47812820392617394, "learning_rate": 1.7484731193447658e-05, "loss": 0.2759, "loss_nan_ranks": 0, "loss_rank_avg": 0.2687206268310547, "step": 5380, "valid_targets_mean": 3960.5, "valid_targets_min": 594 }, { "epoch": 4.107551487414188, "grad_norm": 0.4620874475188822, "learning_rate": 1.7446999366107574e-05, "loss": 0.2939, "loss_nan_ranks": 0, "loss_rank_avg": 0.30755627155303955, "step": 5385, "valid_targets_mean": 4346.6, "valid_targets_min": 907 }, { "epoch": 4.111365369946606, "grad_norm": 0.5480698360224027, "learning_rate": 1.7409276773740136e-05, "loss": 0.2766, "loss_nan_ranks": 0, "loss_rank_avg": 0.27984118461608887, "step": 5390, "valid_targets_mean": 2910.8, "valid_targets_min": 1225 }, { "epoch": 4.115179252479024, "grad_norm": 0.433621353490338, "learning_rate": 1.737156355279933e-05, "loss": 0.2701, "loss_nan_ranks": 0, "loss_rank_avg": 0.2788759171962738, "step": 5395, "valid_targets_mean": 5113.2, "valid_targets_min": 1293 }, { "epoch": 4.118993135011442, "grad_norm": 0.4639434128116733, "learning_rate": 1.7333859839705246e-05, "loss": 0.2703, "loss_nan_ranks": 0, "loss_rank_avg": 0.2772332727909088, "step": 5400, "valid_targets_mean": 4186.8, "valid_targets_min": 1279 }, { "epoch": 4.12280701754386, "grad_norm": 1.579151123306477, "learning_rate": 1.7296165770843573e-05, "loss": 0.3336, "loss_nan_ranks": 0, "loss_rank_avg": 0.5295971632003784, "step": 5405, "valid_targets_mean": 806.0, "valid_targets_min": 581 }, { "epoch": 4.1266209000762775, "grad_norm": 0.5105839768882346, "learning_rate": 1.7258481482565118e-05, "loss": 0.3805, "loss_nan_ranks": 0, "loss_rank_avg": 0.2567860186100006, "step": 5410, "valid_targets_mean": 3869.5, "valid_targets_min": 1174 }, { "epoch": 4.130434782608695, "grad_norm": 0.44640858073953466, "learning_rate": 1.722080711118531e-05, "loss": 0.3003, "loss_nan_ranks": 0, "loss_rank_avg": 0.31472137570381165, "step": 5415, "valid_targets_mean": 4932.8, "valid_targets_min": 696 }, { "epoch": 4.134248665141113, "grad_norm": 0.5039903115695159, "learning_rate": 1.7183142792983697e-05, "loss": 0.2888, "loss_nan_ranks": 0, "loss_rank_avg": 0.32861748337745667, "step": 5420, "valid_targets_mean": 4283.7, "valid_targets_min": 336 }, { "epoch": 4.138062547673532, "grad_norm": 0.45734018055533465, "learning_rate": 1.714548866420348e-05, "loss": 0.2797, "loss_nan_ranks": 0, "loss_rank_avg": 0.2520674169063568, "step": 5425, "valid_targets_mean": 4151.8, "valid_targets_min": 1003 }, { "epoch": 4.14187643020595, "grad_norm": 0.5200103424217448, "learning_rate": 1.710784486105098e-05, "loss": 0.2872, "loss_nan_ranks": 0, "loss_rank_avg": 0.3251253664493561, "step": 5430, "valid_targets_mean": 3897.5, "valid_targets_min": 1039 }, { "epoch": 4.145690312738368, "grad_norm": 0.4458129550534968, "learning_rate": 1.7070211519695176e-05, "loss": 0.2911, "loss_nan_ranks": 0, "loss_rank_avg": 0.35341396927833557, "step": 5435, "valid_targets_mean": 5133.9, "valid_targets_min": 967 }, { "epoch": 4.149504195270786, "grad_norm": 0.4420239232383797, "learning_rate": 1.7032588776267208e-05, "loss": 0.2898, "loss_nan_ranks": 0, "loss_rank_avg": 0.33999934792518616, "step": 5440, "valid_targets_mean": 4732.2, "valid_targets_min": 1318 }, { "epoch": 4.1533180778032035, "grad_norm": 0.4741109970058931, "learning_rate": 1.699497676685988e-05, "loss": 0.2869, "loss_nan_ranks": 0, "loss_rank_avg": 0.29192444682121277, "step": 5445, "valid_targets_mean": 4110.2, "valid_targets_min": 825 }, { "epoch": 4.157131960335621, "grad_norm": 0.4178824184918611, "learning_rate": 1.695737562752716e-05, "loss": 0.2724, "loss_nan_ranks": 0, "loss_rank_avg": 0.2533215880393982, "step": 5450, "valid_targets_mean": 4636.5, "valid_targets_min": 716 }, { "epoch": 4.160945842868039, "grad_norm": 0.4723531617223507, "learning_rate": 1.6919785494283704e-05, "loss": 0.2658, "loss_nan_ranks": 0, "loss_rank_avg": 0.2707185745239258, "step": 5455, "valid_targets_mean": 3819.3, "valid_targets_min": 706 }, { "epoch": 4.164759725400458, "grad_norm": 0.48034451668280265, "learning_rate": 1.6882206503104345e-05, "loss": 0.26, "loss_nan_ranks": 0, "loss_rank_avg": 0.29053595662117004, "step": 5460, "valid_targets_mean": 4347.7, "valid_targets_min": 828 }, { "epoch": 4.168573607932876, "grad_norm": 0.5341006587681983, "learning_rate": 1.6844638789923626e-05, "loss": 0.2986, "loss_nan_ranks": 0, "loss_rank_avg": 0.31795796751976013, "step": 5465, "valid_targets_mean": 3255.6, "valid_targets_min": 873 }, { "epoch": 4.172387490465294, "grad_norm": 0.46299043551009134, "learning_rate": 1.680708249063528e-05, "loss": 0.2623, "loss_nan_ranks": 0, "loss_rank_avg": 0.2508344352245331, "step": 5470, "valid_targets_mean": 4260.3, "valid_targets_min": 831 }, { "epoch": 4.176201372997712, "grad_norm": 0.45616141827399853, "learning_rate": 1.676953774109177e-05, "loss": 0.2721, "loss_nan_ranks": 0, "loss_rank_avg": 0.2717251777648926, "step": 5475, "valid_targets_mean": 4702.5, "valid_targets_min": 1005 }, { "epoch": 4.1800152555301295, "grad_norm": 0.42401454170133096, "learning_rate": 1.6732004677103758e-05, "loss": 0.2904, "loss_nan_ranks": 0, "loss_rank_avg": 0.29828864336013794, "step": 5480, "valid_targets_mean": 4791.1, "valid_targets_min": 1118 }, { "epoch": 4.183829138062547, "grad_norm": 0.4527669070004305, "learning_rate": 1.6694483434439656e-05, "loss": 0.2689, "loss_nan_ranks": 0, "loss_rank_avg": 0.25608429312705994, "step": 5485, "valid_targets_mean": 4262.0, "valid_targets_min": 1530 }, { "epoch": 4.187643020594965, "grad_norm": 0.4816221826659873, "learning_rate": 1.66569741488251e-05, "loss": 0.2758, "loss_nan_ranks": 0, "loss_rank_avg": 0.2672211229801178, "step": 5490, "valid_targets_mean": 3935.8, "valid_targets_min": 903 }, { "epoch": 4.191456903127384, "grad_norm": 0.4901532290032959, "learning_rate": 1.6619476955942482e-05, "loss": 0.2756, "loss_nan_ranks": 0, "loss_rank_avg": 0.2634734511375427, "step": 5495, "valid_targets_mean": 3706.3, "valid_targets_min": 530 }, { "epoch": 4.195270785659802, "grad_norm": 0.44500826527307435, "learning_rate": 1.6581991991430445e-05, "loss": 0.2816, "loss_nan_ranks": 0, "loss_rank_avg": 0.2523365914821625, "step": 5500, "valid_targets_mean": 4076.1, "valid_targets_min": 1141 }, { "epoch": 4.19908466819222, "grad_norm": 0.42766997819820646, "learning_rate": 1.654451939088341e-05, "loss": 0.28, "loss_nan_ranks": 0, "loss_rank_avg": 0.2672201097011566, "step": 5505, "valid_targets_mean": 5251.6, "valid_targets_min": 1450 }, { "epoch": 4.202898550724638, "grad_norm": 0.5025906795175384, "learning_rate": 1.6507059289851057e-05, "loss": 0.2802, "loss_nan_ranks": 0, "loss_rank_avg": 0.3079371154308319, "step": 5510, "valid_targets_mean": 4642.8, "valid_targets_min": 1081 }, { "epoch": 4.206712433257056, "grad_norm": 0.48921213724608315, "learning_rate": 1.646961182383786e-05, "loss": 0.2914, "loss_nan_ranks": 0, "loss_rank_avg": 0.2763393819332123, "step": 5515, "valid_targets_mean": 3639.0, "valid_targets_min": 1086 }, { "epoch": 4.2105263157894735, "grad_norm": 0.45072246512454434, "learning_rate": 1.6432177128302597e-05, "loss": 0.2775, "loss_nan_ranks": 0, "loss_rank_avg": 0.3000883460044861, "step": 5520, "valid_targets_mean": 5069.9, "valid_targets_min": 1688 }, { "epoch": 4.214340198321891, "grad_norm": 0.45130665609379705, "learning_rate": 1.639475533865784e-05, "loss": 0.292, "loss_nan_ranks": 0, "loss_rank_avg": 0.28898870944976807, "step": 5525, "valid_targets_mean": 4288.3, "valid_targets_min": 1208 }, { "epoch": 4.21815408085431, "grad_norm": 0.45781620819851476, "learning_rate": 1.6357346590269477e-05, "loss": 0.2922, "loss_nan_ranks": 0, "loss_rank_avg": 0.28579166531562805, "step": 5530, "valid_targets_mean": 4843.5, "valid_targets_min": 1194 }, { "epoch": 4.221967963386728, "grad_norm": 0.4758765538089831, "learning_rate": 1.631995101845622e-05, "loss": 0.2792, "loss_nan_ranks": 0, "loss_rank_avg": 0.3063182532787323, "step": 5535, "valid_targets_mean": 4466.1, "valid_targets_min": 880 }, { "epoch": 4.225781845919146, "grad_norm": 0.45531261671036943, "learning_rate": 1.6282568758489132e-05, "loss": 0.2891, "loss_nan_ranks": 0, "loss_rank_avg": 0.3045072853565216, "step": 5540, "valid_targets_mean": 4690.0, "valid_targets_min": 1236 }, { "epoch": 4.229595728451564, "grad_norm": 0.4263889830178174, "learning_rate": 1.6245199945591105e-05, "loss": 0.3091, "loss_nan_ranks": 0, "loss_rank_avg": 0.29434555768966675, "step": 5545, "valid_targets_mean": 5107.2, "valid_targets_min": 487 }, { "epoch": 4.233409610983982, "grad_norm": 0.49067696246605885, "learning_rate": 1.6207844714936395e-05, "loss": 0.2748, "loss_nan_ranks": 0, "loss_rank_avg": 0.3065944015979767, "step": 5550, "valid_targets_mean": 4363.1, "valid_targets_min": 458 }, { "epoch": 4.2372234935163995, "grad_norm": 0.40948653083424746, "learning_rate": 1.6170503201650137e-05, "loss": 0.2797, "loss_nan_ranks": 0, "loss_rank_avg": 0.20808136463165283, "step": 5555, "valid_targets_mean": 4294.9, "valid_targets_min": 966 }, { "epoch": 4.241037376048817, "grad_norm": 0.5026832111641061, "learning_rate": 1.6133175540807824e-05, "loss": 0.2805, "loss_nan_ranks": 0, "loss_rank_avg": 0.2692430317401886, "step": 5560, "valid_targets_mean": 3893.9, "valid_targets_min": 413 }, { "epoch": 4.244851258581235, "grad_norm": 0.4125233801311475, "learning_rate": 1.6095861867434867e-05, "loss": 0.2925, "loss_nan_ranks": 0, "loss_rank_avg": 0.32503649592399597, "step": 5565, "valid_targets_mean": 5176.9, "valid_targets_min": 1670 }, { "epoch": 4.248665141113654, "grad_norm": 1.5198766849042715, "learning_rate": 1.6058562316506067e-05, "loss": 0.3617, "loss_nan_ranks": 0, "loss_rank_avg": 0.5387596487998962, "step": 5570, "valid_targets_mean": 810.6, "valid_targets_min": 535 }, { "epoch": 4.252479023646072, "grad_norm": 0.5345120185370117, "learning_rate": 1.602127702294513e-05, "loss": 0.4276, "loss_nan_ranks": 0, "loss_rank_avg": 0.2753293514251709, "step": 5575, "valid_targets_mean": 4129.8, "valid_targets_min": 1107 }, { "epoch": 4.25629290617849, "grad_norm": 0.42624283846744887, "learning_rate": 1.598400612162421e-05, "loss": 0.2911, "loss_nan_ranks": 0, "loss_rank_avg": 0.2693823575973511, "step": 5580, "valid_targets_mean": 4639.1, "valid_targets_min": 1095 }, { "epoch": 4.260106788710908, "grad_norm": 0.4621944129281794, "learning_rate": 1.5946749747363378e-05, "loss": 0.279, "loss_nan_ranks": 0, "loss_rank_avg": 0.3092004060745239, "step": 5585, "valid_targets_mean": 4519.8, "valid_targets_min": 1406 }, { "epoch": 4.2639206712433255, "grad_norm": 0.427116201066583, "learning_rate": 1.5909508034930174e-05, "loss": 0.2953, "loss_nan_ranks": 0, "loss_rank_avg": 0.3015022873878479, "step": 5590, "valid_targets_mean": 4776.9, "valid_targets_min": 612 }, { "epoch": 4.267734553775743, "grad_norm": 0.4772384606050245, "learning_rate": 1.5872281119039092e-05, "loss": 0.2755, "loss_nan_ranks": 0, "loss_rank_avg": 0.26618143916130066, "step": 5595, "valid_targets_mean": 4011.5, "valid_targets_min": 1010 }, { "epoch": 4.271548436308162, "grad_norm": 0.46352271693533037, "learning_rate": 1.583506913435111e-05, "loss": 0.2951, "loss_nan_ranks": 0, "loss_rank_avg": 0.2845820486545563, "step": 5600, "valid_targets_mean": 4406.2, "valid_targets_min": 637 }, { "epoch": 4.27536231884058, "grad_norm": 0.42304973311417576, "learning_rate": 1.579787221547318e-05, "loss": 0.2857, "loss_nan_ranks": 0, "loss_rank_avg": 0.28748199343681335, "step": 5605, "valid_targets_mean": 4840.3, "valid_targets_min": 419 }, { "epoch": 4.279176201372998, "grad_norm": 0.426975836904547, "learning_rate": 1.5760690496957777e-05, "loss": 0.2525, "loss_nan_ranks": 0, "loss_rank_avg": 0.26385220885276794, "step": 5610, "valid_targets_mean": 4914.1, "valid_targets_min": 402 }, { "epoch": 4.282990083905416, "grad_norm": 0.48513234007763295, "learning_rate": 1.5723524113302385e-05, "loss": 0.2883, "loss_nan_ranks": 0, "loss_rank_avg": 0.2918134033679962, "step": 5615, "valid_targets_mean": 4047.7, "valid_targets_min": 980 }, { "epoch": 4.286803966437834, "grad_norm": 0.49163740430944686, "learning_rate": 1.5686373198949e-05, "loss": 0.2648, "loss_nan_ranks": 0, "loss_rank_avg": 0.23882454633712769, "step": 5620, "valid_targets_mean": 3536.7, "valid_targets_min": 632 }, { "epoch": 4.290617848970252, "grad_norm": 0.46719163433098254, "learning_rate": 1.564923788828369e-05, "loss": 0.2683, "loss_nan_ranks": 0, "loss_rank_avg": 0.26404812932014465, "step": 5625, "valid_targets_mean": 4187.7, "valid_targets_min": 1076 }, { "epoch": 4.294431731502669, "grad_norm": 0.45690373458159445, "learning_rate": 1.5612118315636052e-05, "loss": 0.2753, "loss_nan_ranks": 0, "loss_rank_avg": 0.3266724646091461, "step": 5630, "valid_targets_mean": 4868.3, "valid_targets_min": 1105 }, { "epoch": 4.298245614035087, "grad_norm": 0.41999328222502763, "learning_rate": 1.557501461527877e-05, "loss": 0.2575, "loss_nan_ranks": 0, "loss_rank_avg": 0.27965047955513, "step": 5635, "valid_targets_mean": 5149.8, "valid_targets_min": 1460 }, { "epoch": 4.302059496567506, "grad_norm": 0.46175536669142053, "learning_rate": 1.5537926921427116e-05, "loss": 0.2738, "loss_nan_ranks": 0, "loss_rank_avg": 0.27793920040130615, "step": 5640, "valid_targets_mean": 4480.2, "valid_targets_min": 1324 }, { "epoch": 4.305873379099924, "grad_norm": 0.42147544339206316, "learning_rate": 1.5500855368238442e-05, "loss": 0.2852, "loss_nan_ranks": 0, "loss_rank_avg": 0.257891982793808, "step": 5645, "valid_targets_mean": 5117.4, "valid_targets_min": 1220 }, { "epoch": 4.309687261632342, "grad_norm": 0.44482482821139985, "learning_rate": 1.5463800089811743e-05, "loss": 0.2715, "loss_nan_ranks": 0, "loss_rank_avg": 0.24403272569179535, "step": 5650, "valid_targets_mean": 4186.8, "valid_targets_min": 1146 }, { "epoch": 4.31350114416476, "grad_norm": 0.4599350132288009, "learning_rate": 1.542676122018712e-05, "loss": 0.2702, "loss_nan_ranks": 0, "loss_rank_avg": 0.24115292727947235, "step": 5655, "valid_targets_mean": 3831.2, "valid_targets_min": 253 }, { "epoch": 4.317315026697178, "grad_norm": 0.49875170980568123, "learning_rate": 1.5389738893345324e-05, "loss": 0.2779, "loss_nan_ranks": 0, "loss_rank_avg": 0.234399676322937, "step": 5660, "valid_targets_mean": 3607.4, "valid_targets_min": 1042 }, { "epoch": 4.3211289092295955, "grad_norm": 0.46862374247924743, "learning_rate": 1.5352733243207272e-05, "loss": 0.2659, "loss_nan_ranks": 0, "loss_rank_avg": 0.2704668939113617, "step": 5665, "valid_targets_mean": 4192.1, "valid_targets_min": 977 }, { "epoch": 4.324942791762013, "grad_norm": 0.4704412496016771, "learning_rate": 1.531574440363355e-05, "loss": 0.2787, "loss_nan_ranks": 0, "loss_rank_avg": 0.31678804755210876, "step": 5670, "valid_targets_mean": 4463.8, "valid_targets_min": 422 }, { "epoch": 4.328756674294432, "grad_norm": 0.46882886163215814, "learning_rate": 1.527877250842394e-05, "loss": 0.2819, "loss_nan_ranks": 0, "loss_rank_avg": 0.2824307382106781, "step": 5675, "valid_targets_mean": 3865.7, "valid_targets_min": 872 }, { "epoch": 4.33257055682685, "grad_norm": 0.465191078872391, "learning_rate": 1.524181769131693e-05, "loss": 0.2758, "loss_nan_ranks": 0, "loss_rank_avg": 0.30152150988578796, "step": 5680, "valid_targets_mean": 4387.8, "valid_targets_min": 1158 }, { "epoch": 4.336384439359268, "grad_norm": 0.4866591622076078, "learning_rate": 1.5204880085989222e-05, "loss": 0.2609, "loss_nan_ranks": 0, "loss_rank_avg": 0.2841610610485077, "step": 5685, "valid_targets_mean": 3781.8, "valid_targets_min": 952 }, { "epoch": 4.340198321891686, "grad_norm": 0.45140279740309064, "learning_rate": 1.5167959826055269e-05, "loss": 0.2747, "loss_nan_ranks": 0, "loss_rank_avg": 0.30225178599357605, "step": 5690, "valid_targets_mean": 4454.2, "valid_targets_min": 1011 }, { "epoch": 4.344012204424104, "grad_norm": 0.4653747607523385, "learning_rate": 1.5131057045066783e-05, "loss": 0.2853, "loss_nan_ranks": 0, "loss_rank_avg": 0.2756575345993042, "step": 5695, "valid_targets_mean": 4502.6, "valid_targets_min": 1432 }, { "epoch": 4.3478260869565215, "grad_norm": 0.45942886046871895, "learning_rate": 1.5094171876512241e-05, "loss": 0.2585, "loss_nan_ranks": 0, "loss_rank_avg": 0.24686582386493683, "step": 5700, "valid_targets_mean": 3902.8, "valid_targets_min": 1109 }, { "epoch": 4.351639969488939, "grad_norm": 0.5051926834497391, "learning_rate": 1.505730445381641e-05, "loss": 0.2852, "loss_nan_ranks": 0, "loss_rank_avg": 0.2773900330066681, "step": 5705, "valid_targets_mean": 3772.5, "valid_targets_min": 315 }, { "epoch": 4.355453852021358, "grad_norm": 0.4440379992293962, "learning_rate": 1.5020454910339872e-05, "loss": 0.2656, "loss_nan_ranks": 0, "loss_rank_avg": 0.24155227839946747, "step": 5710, "valid_targets_mean": 4127.8, "valid_targets_min": 1115 }, { "epoch": 4.359267734553776, "grad_norm": 0.44963486053345575, "learning_rate": 1.4983623379378527e-05, "loss": 0.277, "loss_nan_ranks": 0, "loss_rank_avg": 0.28549474477767944, "step": 5715, "valid_targets_mean": 4378.5, "valid_targets_min": 852 }, { "epoch": 4.363081617086194, "grad_norm": 0.4472315426767612, "learning_rate": 1.4946809994163123e-05, "loss": 0.2695, "loss_nan_ranks": 0, "loss_rank_avg": 0.27043840289115906, "step": 5720, "valid_targets_mean": 4515.4, "valid_targets_min": 1133 }, { "epoch": 4.366895499618612, "grad_norm": 0.49041276551147356, "learning_rate": 1.4910014887858771e-05, "loss": 0.2678, "loss_nan_ranks": 0, "loss_rank_avg": 0.2672957479953766, "step": 5725, "valid_targets_mean": 4044.7, "valid_targets_min": 957 }, { "epoch": 4.37070938215103, "grad_norm": 0.5021537373097715, "learning_rate": 1.4873238193564453e-05, "loss": 0.2567, "loss_nan_ranks": 0, "loss_rank_avg": 0.256434828042984, "step": 5730, "valid_targets_mean": 3531.8, "valid_targets_min": 1157 }, { "epoch": 4.3745232646834475, "grad_norm": 1.5771455277598134, "learning_rate": 1.4836480044312554e-05, "loss": 0.3403, "loss_nan_ranks": 0, "loss_rank_avg": 0.5025232434272766, "step": 5735, "valid_targets_mean": 835.1, "valid_targets_min": 688 }, { "epoch": 4.378337147215865, "grad_norm": 0.48611824526015895, "learning_rate": 1.4799740573068387e-05, "loss": 0.3221, "loss_nan_ranks": 0, "loss_rank_avg": 0.29094183444976807, "step": 5740, "valid_targets_mean": 4893.0, "valid_targets_min": 1417 }, { "epoch": 4.382151029748284, "grad_norm": 0.4538885965811372, "learning_rate": 1.4763019912729694e-05, "loss": 0.2893, "loss_nan_ranks": 0, "loss_rank_avg": 0.26907357573509216, "step": 5745, "valid_targets_mean": 4450.6, "valid_targets_min": 515 }, { "epoch": 4.385964912280702, "grad_norm": 0.4542783244954703, "learning_rate": 1.472631819612615e-05, "loss": 0.2828, "loss_nan_ranks": 0, "loss_rank_avg": 0.27067530155181885, "step": 5750, "valid_targets_mean": 4019.0, "valid_targets_min": 1012 }, { "epoch": 4.38977879481312, "grad_norm": 0.49891633273896363, "learning_rate": 1.468963555601894e-05, "loss": 0.2802, "loss_nan_ranks": 0, "loss_rank_avg": 0.28321823477745056, "step": 5755, "valid_targets_mean": 3763.9, "valid_targets_min": 359 }, { "epoch": 4.393592677345538, "grad_norm": 0.4473374870727865, "learning_rate": 1.4652972125100217e-05, "loss": 0.2818, "loss_nan_ranks": 0, "loss_rank_avg": 0.2813161611557007, "step": 5760, "valid_targets_mean": 4015.6, "valid_targets_min": 621 }, { "epoch": 4.397406559877956, "grad_norm": 0.467832789716142, "learning_rate": 1.4616328035992667e-05, "loss": 0.2726, "loss_nan_ranks": 0, "loss_rank_avg": 0.26224663853645325, "step": 5765, "valid_targets_mean": 3888.2, "valid_targets_min": 896 }, { "epoch": 4.401220442410374, "grad_norm": 0.43705587434793697, "learning_rate": 1.4579703421249e-05, "loss": 0.2834, "loss_nan_ranks": 0, "loss_rank_avg": 0.30531108379364014, "step": 5770, "valid_targets_mean": 5288.5, "valid_targets_min": 1568 }, { "epoch": 4.4050343249427915, "grad_norm": 0.4256869545786574, "learning_rate": 1.4543098413351486e-05, "loss": 0.274, "loss_nan_ranks": 0, "loss_rank_avg": 0.2970990240573883, "step": 5775, "valid_targets_mean": 5047.0, "valid_targets_min": 881 }, { "epoch": 4.408848207475209, "grad_norm": 0.43583173290283295, "learning_rate": 1.4506513144711472e-05, "loss": 0.2698, "loss_nan_ranks": 0, "loss_rank_avg": 0.30243197083473206, "step": 5780, "valid_targets_mean": 5445.3, "valid_targets_min": 1961 }, { "epoch": 4.412662090007628, "grad_norm": 0.45939499966153063, "learning_rate": 1.4469947747668895e-05, "loss": 0.2857, "loss_nan_ranks": 0, "loss_rank_avg": 0.2970567047595978, "step": 5785, "valid_targets_mean": 4571.8, "valid_targets_min": 1102 }, { "epoch": 4.416475972540046, "grad_norm": 0.39838106818527075, "learning_rate": 1.4433402354491818e-05, "loss": 0.262, "loss_nan_ranks": 0, "loss_rank_avg": 0.2937869727611542, "step": 5790, "valid_targets_mean": 5518.0, "valid_targets_min": 1383 }, { "epoch": 4.420289855072464, "grad_norm": 0.4420135944332066, "learning_rate": 1.4396877097375942e-05, "loss": 0.2779, "loss_nan_ranks": 0, "loss_rank_avg": 0.33492088317871094, "step": 5795, "valid_targets_mean": 5061.8, "valid_targets_min": 973 }, { "epoch": 4.424103737604882, "grad_norm": 0.49186119929950545, "learning_rate": 1.4360372108444125e-05, "loss": 0.2779, "loss_nan_ranks": 0, "loss_rank_avg": 0.26581743359565735, "step": 5800, "valid_targets_mean": 3358.6, "valid_targets_min": 357 }, { "epoch": 4.4279176201373, "grad_norm": 0.44575600794041736, "learning_rate": 1.4323887519745916e-05, "loss": 0.2569, "loss_nan_ranks": 0, "loss_rank_avg": 0.29282018542289734, "step": 5805, "valid_targets_mean": 4706.3, "valid_targets_min": 1235 }, { "epoch": 4.4317315026697175, "grad_norm": 0.4183264646741452, "learning_rate": 1.4287423463257063e-05, "loss": 0.2844, "loss_nan_ranks": 0, "loss_rank_avg": 0.26400482654571533, "step": 5810, "valid_targets_mean": 4878.5, "valid_targets_min": 1455 }, { "epoch": 4.435545385202135, "grad_norm": 0.4731714728599063, "learning_rate": 1.4250980070879055e-05, "loss": 0.2665, "loss_nan_ranks": 0, "loss_rank_avg": 0.2791379988193512, "step": 5815, "valid_targets_mean": 4437.2, "valid_targets_min": 1131 }, { "epoch": 4.439359267734554, "grad_norm": 0.4733320793835799, "learning_rate": 1.4214557474438619e-05, "loss": 0.2582, "loss_nan_ranks": 0, "loss_rank_avg": 0.28043392300605774, "step": 5820, "valid_targets_mean": 4277.6, "valid_targets_min": 1061 }, { "epoch": 4.443173150266972, "grad_norm": 0.45787589149165286, "learning_rate": 1.4178155805687264e-05, "loss": 0.252, "loss_nan_ranks": 0, "loss_rank_avg": 0.3145343065261841, "step": 5825, "valid_targets_mean": 5004.2, "valid_targets_min": 824 }, { "epoch": 4.44698703279939, "grad_norm": 0.426977376897121, "learning_rate": 1.4141775196300796e-05, "loss": 0.2679, "loss_nan_ranks": 0, "loss_rank_avg": 0.2563020586967468, "step": 5830, "valid_targets_mean": 4465.5, "valid_targets_min": 1218 }, { "epoch": 4.450800915331808, "grad_norm": 0.5159147361121579, "learning_rate": 1.410541577787884e-05, "loss": 0.2634, "loss_nan_ranks": 0, "loss_rank_avg": 0.24296748638153076, "step": 5835, "valid_targets_mean": 4424.7, "valid_targets_min": 523 }, { "epoch": 4.454614797864226, "grad_norm": 0.4422629941501212, "learning_rate": 1.406907768194437e-05, "loss": 0.2689, "loss_nan_ranks": 0, "loss_rank_avg": 0.2830718755722046, "step": 5840, "valid_targets_mean": 4799.2, "valid_targets_min": 472 }, { "epoch": 4.4584286803966435, "grad_norm": 0.4616483695107263, "learning_rate": 1.4032761039943232e-05, "loss": 0.2799, "loss_nan_ranks": 0, "loss_rank_avg": 0.323681503534317, "step": 5845, "valid_targets_mean": 4502.0, "valid_targets_min": 1044 }, { "epoch": 4.462242562929061, "grad_norm": 0.44725678549137443, "learning_rate": 1.3996465983243663e-05, "loss": 0.2701, "loss_nan_ranks": 0, "loss_rank_avg": 0.2807271480560303, "step": 5850, "valid_targets_mean": 4554.4, "valid_targets_min": 836 }, { "epoch": 4.46605644546148, "grad_norm": 0.4593516328145645, "learning_rate": 1.3960192643135817e-05, "loss": 0.2976, "loss_nan_ranks": 0, "loss_rank_avg": 0.3010134696960449, "step": 5855, "valid_targets_mean": 4276.0, "valid_targets_min": 537 }, { "epoch": 4.469870327993898, "grad_norm": 0.48968025049502933, "learning_rate": 1.3923941150831304e-05, "loss": 0.2885, "loss_nan_ranks": 0, "loss_rank_avg": 0.2574882507324219, "step": 5860, "valid_targets_mean": 4256.4, "valid_targets_min": 1127 }, { "epoch": 4.473684210526316, "grad_norm": 0.45205623140214196, "learning_rate": 1.3887711637462692e-05, "loss": 0.2776, "loss_nan_ranks": 0, "loss_rank_avg": 0.29931384325027466, "step": 5865, "valid_targets_mean": 4524.5, "valid_targets_min": 1240 }, { "epoch": 4.477498093058734, "grad_norm": 0.4363509333460341, "learning_rate": 1.385150423408305e-05, "loss": 0.2725, "loss_nan_ranks": 0, "loss_rank_avg": 0.23655830323696136, "step": 5870, "valid_targets_mean": 4474.1, "valid_targets_min": 414 }, { "epoch": 4.481311975591152, "grad_norm": 0.4299324110154981, "learning_rate": 1.3815319071665465e-05, "loss": 0.2973, "loss_nan_ranks": 0, "loss_rank_avg": 0.2632123529911041, "step": 5875, "valid_targets_mean": 4886.5, "valid_targets_min": 531 }, { "epoch": 4.48512585812357, "grad_norm": 0.5194009105360434, "learning_rate": 1.3779156281102574e-05, "loss": 0.264, "loss_nan_ranks": 0, "loss_rank_avg": 0.27804139256477356, "step": 5880, "valid_targets_mean": 3514.6, "valid_targets_min": 417 }, { "epoch": 4.488939740655987, "grad_norm": 0.6032698548453926, "learning_rate": 1.3743015993206092e-05, "loss": 0.2609, "loss_nan_ranks": 0, "loss_rank_avg": 0.2937086522579193, "step": 5885, "valid_targets_mean": 3735.5, "valid_targets_min": 728 }, { "epoch": 4.492753623188406, "grad_norm": 0.43407844015473207, "learning_rate": 1.3706898338706328e-05, "loss": 0.2773, "loss_nan_ranks": 0, "loss_rank_avg": 0.27821847796440125, "step": 5890, "valid_targets_mean": 4741.5, "valid_targets_min": 1018 }, { "epoch": 4.496567505720824, "grad_norm": 1.5044846660486753, "learning_rate": 1.3670803448251724e-05, "loss": 0.3162, "loss_nan_ranks": 0, "loss_rank_avg": 0.5219283103942871, "step": 5895, "valid_targets_mean": 787.7, "valid_targets_min": 432 }, { "epoch": 4.500381388253242, "grad_norm": 0.4767872042750548, "learning_rate": 1.3634731452408373e-05, "loss": 0.4027, "loss_nan_ranks": 0, "loss_rank_avg": 0.30305016040802, "step": 5900, "valid_targets_mean": 4886.7, "valid_targets_min": 1604 }, { "epoch": 4.50419527078566, "grad_norm": 0.45889438457, "learning_rate": 1.3598682481659556e-05, "loss": 0.2702, "loss_nan_ranks": 0, "loss_rank_avg": 0.2751183807849884, "step": 5905, "valid_targets_mean": 4272.3, "valid_targets_min": 1270 }, { "epoch": 4.508009153318078, "grad_norm": 0.5049581257103946, "learning_rate": 1.3562656666405268e-05, "loss": 0.2623, "loss_nan_ranks": 0, "loss_rank_avg": 0.2787635028362274, "step": 5910, "valid_targets_mean": 4410.7, "valid_targets_min": 1023 }, { "epoch": 4.511823035850496, "grad_norm": 0.47197243732827343, "learning_rate": 1.3526654136961734e-05, "loss": 0.2782, "loss_nan_ranks": 0, "loss_rank_avg": 0.2548222839832306, "step": 5915, "valid_targets_mean": 3748.5, "valid_targets_min": 1234 }, { "epoch": 4.5156369183829135, "grad_norm": 0.531002042605842, "learning_rate": 1.3490675023560958e-05, "loss": 0.2677, "loss_nan_ranks": 0, "loss_rank_avg": 0.27940547466278076, "step": 5920, "valid_targets_mean": 3234.5, "valid_targets_min": 842 }, { "epoch": 4.519450800915331, "grad_norm": 0.42608539048001653, "learning_rate": 1.3454719456350227e-05, "loss": 0.2699, "loss_nan_ranks": 0, "loss_rank_avg": 0.2519294321537018, "step": 5925, "valid_targets_mean": 4580.6, "valid_targets_min": 850 }, { "epoch": 4.52326468344775, "grad_norm": 0.4337057125152285, "learning_rate": 1.341878756539167e-05, "loss": 0.2886, "loss_nan_ranks": 0, "loss_rank_avg": 0.2535187005996704, "step": 5930, "valid_targets_mean": 4240.9, "valid_targets_min": 896 }, { "epoch": 4.527078565980168, "grad_norm": 0.44211798863673996, "learning_rate": 1.3382879480661764e-05, "loss": 0.2782, "loss_nan_ranks": 0, "loss_rank_avg": 0.28309544920921326, "step": 5935, "valid_targets_mean": 4592.7, "valid_targets_min": 1101 }, { "epoch": 4.530892448512586, "grad_norm": 0.4310747429914301, "learning_rate": 1.334699533205087e-05, "loss": 0.2712, "loss_nan_ranks": 0, "loss_rank_avg": 0.27521029114723206, "step": 5940, "valid_targets_mean": 4518.3, "valid_targets_min": 1287 }, { "epoch": 4.534706331045004, "grad_norm": 0.4439661875246889, "learning_rate": 1.3311135249362765e-05, "loss": 0.2659, "loss_nan_ranks": 0, "loss_rank_avg": 0.2662383019924164, "step": 5945, "valid_targets_mean": 4220.8, "valid_targets_min": 1279 }, { "epoch": 4.538520213577422, "grad_norm": 0.4158911308719578, "learning_rate": 1.3275299362314183e-05, "loss": 0.2736, "loss_nan_ranks": 0, "loss_rank_avg": 0.26738566160202026, "step": 5950, "valid_targets_mean": 5363.2, "valid_targets_min": 1796 }, { "epoch": 4.5423340961098395, "grad_norm": 0.5328998160967272, "learning_rate": 1.323948780053432e-05, "loss": 0.2675, "loss_nan_ranks": 0, "loss_rank_avg": 0.2578364610671997, "step": 5955, "valid_targets_mean": 3145.2, "valid_targets_min": 948 }, { "epoch": 4.546147978642258, "grad_norm": 0.4627383344985359, "learning_rate": 1.320370069356439e-05, "loss": 0.2798, "loss_nan_ranks": 0, "loss_rank_avg": 0.3163941204547882, "step": 5960, "valid_targets_mean": 4478.6, "valid_targets_min": 1010 }, { "epoch": 4.549961861174676, "grad_norm": 0.46521595739091043, "learning_rate": 1.3167938170857144e-05, "loss": 0.299, "loss_nan_ranks": 0, "loss_rank_avg": 0.29799818992614746, "step": 5965, "valid_targets_mean": 4643.4, "valid_targets_min": 1383 }, { "epoch": 4.553775743707094, "grad_norm": 0.46932508666922923, "learning_rate": 1.3132200361776399e-05, "loss": 0.2712, "loss_nan_ranks": 0, "loss_rank_avg": 0.25845086574554443, "step": 5970, "valid_targets_mean": 4063.8, "valid_targets_min": 472 }, { "epoch": 4.557589626239512, "grad_norm": 0.49516638729280765, "learning_rate": 1.3096487395596587e-05, "loss": 0.2638, "loss_nan_ranks": 0, "loss_rank_avg": 0.26746347546577454, "step": 5975, "valid_targets_mean": 3572.2, "valid_targets_min": 432 }, { "epoch": 4.56140350877193, "grad_norm": 0.48711071485037627, "learning_rate": 1.3060799401502263e-05, "loss": 0.288, "loss_nan_ranks": 0, "loss_rank_avg": 0.3077528774738312, "step": 5980, "valid_targets_mean": 4599.1, "valid_targets_min": 1437 }, { "epoch": 4.565217391304348, "grad_norm": 0.483945859673428, "learning_rate": 1.3025136508587659e-05, "loss": 0.2768, "loss_nan_ranks": 0, "loss_rank_avg": 0.2518140375614166, "step": 5985, "valid_targets_mean": 3965.2, "valid_targets_min": 1004 }, { "epoch": 4.5690312738367655, "grad_norm": 0.4719885943283488, "learning_rate": 1.2989498845856201e-05, "loss": 0.2645, "loss_nan_ranks": 0, "loss_rank_avg": 0.2801418602466583, "step": 5990, "valid_targets_mean": 3937.7, "valid_targets_min": 1187 }, { "epoch": 4.572845156369183, "grad_norm": 0.42038699637659116, "learning_rate": 1.2953886542220064e-05, "loss": 0.2711, "loss_nan_ranks": 0, "loss_rank_avg": 0.2455323487520218, "step": 5995, "valid_targets_mean": 4707.3, "valid_targets_min": 1049 }, { "epoch": 4.576659038901602, "grad_norm": 0.3969957514118753, "learning_rate": 1.2918299726499676e-05, "loss": 0.2824, "loss_nan_ranks": 0, "loss_rank_avg": 0.27261656522750854, "step": 6000, "valid_targets_mean": 6213.8, "valid_targets_min": 1807 }, { "epoch": 4.58047292143402, "grad_norm": 0.4541016921407842, "learning_rate": 1.2882738527423278e-05, "loss": 0.2772, "loss_nan_ranks": 0, "loss_rank_avg": 0.23699618875980377, "step": 6005, "valid_targets_mean": 3908.7, "valid_targets_min": 1072 }, { "epoch": 4.584286803966438, "grad_norm": 0.43712584522591535, "learning_rate": 1.2847203073626436e-05, "loss": 0.2974, "loss_nan_ranks": 0, "loss_rank_avg": 0.29207512736320496, "step": 6010, "valid_targets_mean": 4578.5, "valid_targets_min": 1249 }, { "epoch": 4.588100686498856, "grad_norm": 0.4478920451756276, "learning_rate": 1.2811693493651602e-05, "loss": 0.2638, "loss_nan_ranks": 0, "loss_rank_avg": 0.22837209701538086, "step": 6015, "valid_targets_mean": 4246.5, "valid_targets_min": 769 }, { "epoch": 4.591914569031274, "grad_norm": 0.4304258549375004, "learning_rate": 1.2776209915947627e-05, "loss": 0.2584, "loss_nan_ranks": 0, "loss_rank_avg": 0.2726576030254364, "step": 6020, "valid_targets_mean": 4741.2, "valid_targets_min": 1066 }, { "epoch": 4.595728451563692, "grad_norm": 0.4243229034746278, "learning_rate": 1.27407524688693e-05, "loss": 0.2637, "loss_nan_ranks": 0, "loss_rank_avg": 0.22514188289642334, "step": 6025, "valid_targets_mean": 4388.4, "valid_targets_min": 1254 }, { "epoch": 4.5995423340961095, "grad_norm": 0.4741565772839733, "learning_rate": 1.2705321280676897e-05, "loss": 0.2766, "loss_nan_ranks": 0, "loss_rank_avg": 0.31086888909339905, "step": 6030, "valid_targets_mean": 4512.9, "valid_targets_min": 1289 }, { "epoch": 4.603356216628528, "grad_norm": 0.427168564883841, "learning_rate": 1.2669916479535695e-05, "loss": 0.2725, "loss_nan_ranks": 0, "loss_rank_avg": 0.28429481387138367, "step": 6035, "valid_targets_mean": 5438.9, "valid_targets_min": 1283 }, { "epoch": 4.607170099160946, "grad_norm": 0.5386715627774374, "learning_rate": 1.2634538193515544e-05, "loss": 0.2461, "loss_nan_ranks": 0, "loss_rank_avg": 0.24557559192180634, "step": 6040, "valid_targets_mean": 3304.1, "valid_targets_min": 852 }, { "epoch": 4.610983981693364, "grad_norm": 0.46561727285996857, "learning_rate": 1.2599186550590355e-05, "loss": 0.279, "loss_nan_ranks": 0, "loss_rank_avg": 0.2816053628921509, "step": 6045, "valid_targets_mean": 4762.0, "valid_targets_min": 1659 }, { "epoch": 4.614797864225782, "grad_norm": 0.4334778280310194, "learning_rate": 1.2563861678637675e-05, "loss": 0.2675, "loss_nan_ranks": 0, "loss_rank_avg": 0.26823705434799194, "step": 6050, "valid_targets_mean": 5187.0, "valid_targets_min": 1099 }, { "epoch": 4.6186117467582, "grad_norm": 0.4621016055707872, "learning_rate": 1.2528563705438215e-05, "loss": 0.2621, "loss_nan_ranks": 0, "loss_rank_avg": 0.28503915667533875, "step": 6055, "valid_targets_mean": 5040.2, "valid_targets_min": 1316 }, { "epoch": 4.622425629290618, "grad_norm": 0.5982601990337268, "learning_rate": 1.2493292758675379e-05, "loss": 0.2891, "loss_nan_ranks": 0, "loss_rank_avg": 0.2772160470485687, "step": 6060, "valid_targets_mean": 2937.5, "valid_targets_min": 653 }, { "epoch": 4.6262395118230355, "grad_norm": 0.640637801864729, "learning_rate": 1.245804896593481e-05, "loss": 0.4612, "loss_nan_ranks": 0, "loss_rank_avg": 0.3399999141693115, "step": 6065, "valid_targets_mean": 3138.5, "valid_targets_min": 796 }, { "epoch": 4.630053394355453, "grad_norm": 0.480477869036594, "learning_rate": 1.2422832454703925e-05, "loss": 0.2669, "loss_nan_ranks": 0, "loss_rank_avg": 0.2532704770565033, "step": 6070, "valid_targets_mean": 3822.2, "valid_targets_min": 464 }, { "epoch": 4.633867276887872, "grad_norm": 0.5193519065919779, "learning_rate": 1.2387643352371458e-05, "loss": 0.2761, "loss_nan_ranks": 0, "loss_rank_avg": 0.27806735038757324, "step": 6075, "valid_targets_mean": 3533.6, "valid_targets_min": 1167 }, { "epoch": 4.63768115942029, "grad_norm": 0.45415550206324007, "learning_rate": 1.2352481786227002e-05, "loss": 0.2744, "loss_nan_ranks": 0, "loss_rank_avg": 0.2920186221599579, "step": 6080, "valid_targets_mean": 5147.2, "valid_targets_min": 1086 }, { "epoch": 4.641495041952708, "grad_norm": 0.4516307494153642, "learning_rate": 1.2317347883460533e-05, "loss": 0.2561, "loss_nan_ranks": 0, "loss_rank_avg": 0.2339109182357788, "step": 6085, "valid_targets_mean": 4068.7, "valid_targets_min": 1158 }, { "epoch": 4.645308924485126, "grad_norm": 0.533201480795766, "learning_rate": 1.228224177116197e-05, "loss": 0.2706, "loss_nan_ranks": 0, "loss_rank_avg": 0.30167070031166077, "step": 6090, "valid_targets_mean": 4061.7, "valid_targets_min": 580 }, { "epoch": 4.649122807017544, "grad_norm": 0.44208307954025483, "learning_rate": 1.2247163576320691e-05, "loss": 0.2858, "loss_nan_ranks": 0, "loss_rank_avg": 0.26982858777046204, "step": 6095, "valid_targets_mean": 4680.1, "valid_targets_min": 1126 }, { "epoch": 4.6529366895499615, "grad_norm": 0.4684962063196071, "learning_rate": 1.2212113425825108e-05, "loss": 0.288, "loss_nan_ranks": 0, "loss_rank_avg": 0.2656426727771759, "step": 6100, "valid_targets_mean": 4013.8, "valid_targets_min": 1228 }, { "epoch": 4.65675057208238, "grad_norm": 0.4704971087227113, "learning_rate": 1.2177091446462165e-05, "loss": 0.2745, "loss_nan_ranks": 0, "loss_rank_avg": 0.2484935075044632, "step": 6105, "valid_targets_mean": 4056.9, "valid_targets_min": 1235 }, { "epoch": 4.660564454614798, "grad_norm": 0.4793308933230215, "learning_rate": 1.2142097764916932e-05, "loss": 0.2577, "loss_nan_ranks": 0, "loss_rank_avg": 0.27687665820121765, "step": 6110, "valid_targets_mean": 4041.4, "valid_targets_min": 1256 }, { "epoch": 4.664378337147216, "grad_norm": 0.430844114668902, "learning_rate": 1.210713250777209e-05, "loss": 0.2595, "loss_nan_ranks": 0, "loss_rank_avg": 0.2678356170654297, "step": 6115, "valid_targets_mean": 5247.5, "valid_targets_min": 1208 }, { "epoch": 4.668192219679634, "grad_norm": 0.4610368968711122, "learning_rate": 1.2072195801507514e-05, "loss": 0.2752, "loss_nan_ranks": 0, "loss_rank_avg": 0.27113208174705505, "step": 6120, "valid_targets_mean": 3816.7, "valid_targets_min": 979 }, { "epoch": 4.672006102212052, "grad_norm": 0.4783363189865354, "learning_rate": 1.20372877724998e-05, "loss": 0.2602, "loss_nan_ranks": 0, "loss_rank_avg": 0.22927595674991608, "step": 6125, "valid_targets_mean": 3613.3, "valid_targets_min": 880 }, { "epoch": 4.67581998474447, "grad_norm": 0.4437246147947317, "learning_rate": 1.2002408547021806e-05, "loss": 0.2743, "loss_nan_ranks": 0, "loss_rank_avg": 0.23522575199604034, "step": 6130, "valid_targets_mean": 5034.9, "valid_targets_min": 985 }, { "epoch": 4.679633867276888, "grad_norm": 0.4123331439857932, "learning_rate": 1.1967558251242202e-05, "loss": 0.2422, "loss_nan_ranks": 0, "loss_rank_avg": 0.2195393294095993, "step": 6135, "valid_targets_mean": 4580.7, "valid_targets_min": 1199 }, { "epoch": 4.6834477498093054, "grad_norm": 0.48821062186968395, "learning_rate": 1.193273701122501e-05, "loss": 0.2808, "loss_nan_ranks": 0, "loss_rank_avg": 0.29080095887184143, "step": 6140, "valid_targets_mean": 3972.9, "valid_targets_min": 617 }, { "epoch": 4.687261632341724, "grad_norm": 0.46089074530910856, "learning_rate": 1.1897944952929147e-05, "loss": 0.2476, "loss_nan_ranks": 0, "loss_rank_avg": 0.29182562232017517, "step": 6145, "valid_targets_mean": 4697.0, "valid_targets_min": 829 }, { "epoch": 4.691075514874142, "grad_norm": 0.5337402462436025, "learning_rate": 1.1863182202207977e-05, "loss": 0.2675, "loss_nan_ranks": 0, "loss_rank_avg": 0.26698315143585205, "step": 6150, "valid_targets_mean": 3188.3, "valid_targets_min": 453 }, { "epoch": 4.69488939740656, "grad_norm": 0.39887817966067385, "learning_rate": 1.1828448884808843e-05, "loss": 0.2541, "loss_nan_ranks": 0, "loss_rank_avg": 0.23282591998577118, "step": 6155, "valid_targets_mean": 5004.8, "valid_targets_min": 1170 }, { "epoch": 4.698703279938978, "grad_norm": 0.44218313890919614, "learning_rate": 1.1793745126372621e-05, "loss": 0.2784, "loss_nan_ranks": 0, "loss_rank_avg": 0.2869015634059906, "step": 6160, "valid_targets_mean": 4819.4, "valid_targets_min": 1478 }, { "epoch": 4.702517162471396, "grad_norm": 0.4671992817834822, "learning_rate": 1.1759071052433267e-05, "loss": 0.2604, "loss_nan_ranks": 0, "loss_rank_avg": 0.259736031293869, "step": 6165, "valid_targets_mean": 4065.2, "valid_targets_min": 436 }, { "epoch": 4.706331045003814, "grad_norm": 0.4158893122333823, "learning_rate": 1.1724426788417348e-05, "loss": 0.2812, "loss_nan_ranks": 0, "loss_rank_avg": 0.3164721131324768, "step": 6170, "valid_targets_mean": 5909.0, "valid_targets_min": 789 }, { "epoch": 4.710144927536232, "grad_norm": 0.44964144254203897, "learning_rate": 1.1689812459643612e-05, "loss": 0.2715, "loss_nan_ranks": 0, "loss_rank_avg": 0.2597438395023346, "step": 6175, "valid_targets_mean": 4044.4, "valid_targets_min": 934 }, { "epoch": 4.71395881006865, "grad_norm": 0.4621900769426731, "learning_rate": 1.1655228191322511e-05, "loss": 0.2612, "loss_nan_ranks": 0, "loss_rank_avg": 0.24745304882526398, "step": 6180, "valid_targets_mean": 4173.3, "valid_targets_min": 1173 }, { "epoch": 4.717772692601068, "grad_norm": 0.5019089891367999, "learning_rate": 1.1620674108555786e-05, "loss": 0.2719, "loss_nan_ranks": 0, "loss_rank_avg": 0.2863067090511322, "step": 6185, "valid_targets_mean": 4092.0, "valid_targets_min": 1843 }, { "epoch": 4.721586575133486, "grad_norm": 0.5402156848005659, "learning_rate": 1.1586150336335937e-05, "loss": 0.2535, "loss_nan_ranks": 0, "loss_rank_avg": 0.19477152824401855, "step": 6190, "valid_targets_mean": 4124.9, "valid_targets_min": 993 }, { "epoch": 4.725400457665904, "grad_norm": 0.45180783666601976, "learning_rate": 1.1551656999545879e-05, "loss": 0.2709, "loss_nan_ranks": 0, "loss_rank_avg": 0.2611711919307709, "step": 6195, "valid_targets_mean": 4767.4, "valid_targets_min": 1080 }, { "epoch": 4.729214340198322, "grad_norm": 0.43472107197938675, "learning_rate": 1.1517194222958385e-05, "loss": 0.2641, "loss_nan_ranks": 0, "loss_rank_avg": 0.2774430811405182, "step": 6200, "valid_targets_mean": 4779.7, "valid_targets_min": 1768 }, { "epoch": 4.73302822273074, "grad_norm": 0.4131997148781024, "learning_rate": 1.1482762131235723e-05, "loss": 0.2732, "loss_nan_ranks": 0, "loss_rank_avg": 0.2677346169948578, "step": 6205, "valid_targets_mean": 5425.2, "valid_targets_min": 1425 }, { "epoch": 4.7368421052631575, "grad_norm": 0.4767133309486682, "learning_rate": 1.1448360848929125e-05, "loss": 0.2708, "loss_nan_ranks": 0, "loss_rank_avg": 0.2785078287124634, "step": 6210, "valid_targets_mean": 3975.9, "valid_targets_min": 680 }, { "epoch": 4.740655987795575, "grad_norm": 0.47301915164428615, "learning_rate": 1.1413990500478404e-05, "loss": 0.2756, "loss_nan_ranks": 0, "loss_rank_avg": 0.25078871846199036, "step": 6215, "valid_targets_mean": 4398.8, "valid_targets_min": 1321 }, { "epoch": 4.744469870327994, "grad_norm": 0.48680450680333354, "learning_rate": 1.1379651210211482e-05, "loss": 0.2704, "loss_nan_ranks": 0, "loss_rank_avg": 0.23261241614818573, "step": 6220, "valid_targets_mean": 3989.0, "valid_targets_min": 863 }, { "epoch": 4.748283752860412, "grad_norm": 0.42575127016998615, "learning_rate": 1.1345343102343898e-05, "loss": 0.2751, "loss_nan_ranks": 0, "loss_rank_avg": 0.24395425617694855, "step": 6225, "valid_targets_mean": 4580.4, "valid_targets_min": 1255 }, { "epoch": 4.75209763539283, "grad_norm": 0.5622398324565753, "learning_rate": 1.1311066300978438e-05, "loss": 0.4105, "loss_nan_ranks": 0, "loss_rank_avg": 0.28262239694595337, "step": 6230, "valid_targets_mean": 2832.5, "valid_targets_min": 620 }, { "epoch": 4.755911517925248, "grad_norm": 0.48839896275848155, "learning_rate": 1.1276820930104599e-05, "loss": 0.2723, "loss_nan_ranks": 0, "loss_rank_avg": 0.2837162911891937, "step": 6235, "valid_targets_mean": 4031.0, "valid_targets_min": 1314 }, { "epoch": 4.759725400457666, "grad_norm": 0.4469933360053575, "learning_rate": 1.1242607113598227e-05, "loss": 0.2598, "loss_nan_ranks": 0, "loss_rank_avg": 0.2282828837633133, "step": 6240, "valid_targets_mean": 4210.8, "valid_targets_min": 617 }, { "epoch": 4.763539282990084, "grad_norm": 0.4459250961437655, "learning_rate": 1.1208424975220992e-05, "loss": 0.2558, "loss_nan_ranks": 0, "loss_rank_avg": 0.26507505774497986, "step": 6245, "valid_targets_mean": 4829.0, "valid_targets_min": 867 }, { "epoch": 4.767353165522502, "grad_norm": 0.44761512621995236, "learning_rate": 1.1174274638620006e-05, "loss": 0.2925, "loss_nan_ranks": 0, "loss_rank_avg": 0.2591985762119293, "step": 6250, "valid_targets_mean": 5047.7, "valid_targets_min": 1386 }, { "epoch": 4.77116704805492, "grad_norm": 0.46003734262291296, "learning_rate": 1.1140156227327312e-05, "loss": 0.2841, "loss_nan_ranks": 0, "loss_rank_avg": 0.24344348907470703, "step": 6255, "valid_targets_mean": 3709.6, "valid_targets_min": 322 }, { "epoch": 4.774980930587338, "grad_norm": 0.4597165894813579, "learning_rate": 1.110606986475949e-05, "loss": 0.2474, "loss_nan_ranks": 0, "loss_rank_avg": 0.2670276463031769, "step": 6260, "valid_targets_mean": 4286.9, "valid_targets_min": 995 }, { "epoch": 4.778794813119756, "grad_norm": 0.45709678873048865, "learning_rate": 1.1072015674217195e-05, "loss": 0.2678, "loss_nan_ranks": 0, "loss_rank_avg": 0.22857964038848877, "step": 6265, "valid_targets_mean": 4505.5, "valid_targets_min": 1520 }, { "epoch": 4.782608695652174, "grad_norm": 0.47553977436663747, "learning_rate": 1.1037993778884682e-05, "loss": 0.2716, "loss_nan_ranks": 0, "loss_rank_avg": 0.27654123306274414, "step": 6270, "valid_targets_mean": 4468.1, "valid_targets_min": 1259 }, { "epoch": 4.786422578184592, "grad_norm": 0.4349786674742026, "learning_rate": 1.1004004301829414e-05, "loss": 0.261, "loss_nan_ranks": 0, "loss_rank_avg": 0.25767046213150024, "step": 6275, "valid_targets_mean": 4472.5, "valid_targets_min": 429 }, { "epoch": 4.79023646071701, "grad_norm": 0.4028363610927219, "learning_rate": 1.0970047366001554e-05, "loss": 0.2497, "loss_nan_ranks": 0, "loss_rank_avg": 0.23868699371814728, "step": 6280, "valid_targets_mean": 4960.5, "valid_targets_min": 855 }, { "epoch": 4.7940503432494275, "grad_norm": 0.48133951454517454, "learning_rate": 1.0936123094233593e-05, "loss": 0.2671, "loss_nan_ranks": 0, "loss_rank_avg": 0.29551172256469727, "step": 6285, "valid_targets_mean": 4206.8, "valid_targets_min": 696 }, { "epoch": 4.797864225781846, "grad_norm": 0.5032080776134414, "learning_rate": 1.0902231609239827e-05, "loss": 0.2666, "loss_nan_ranks": 0, "loss_rank_avg": 0.2717246115207672, "step": 6290, "valid_targets_mean": 3735.2, "valid_targets_min": 1154 }, { "epoch": 4.801678108314264, "grad_norm": 0.47775196462942643, "learning_rate": 1.0868373033615982e-05, "loss": 0.2657, "loss_nan_ranks": 0, "loss_rank_avg": 0.23652702569961548, "step": 6295, "valid_targets_mean": 4304.8, "valid_targets_min": 1440 }, { "epoch": 4.805491990846682, "grad_norm": 0.4450270865034603, "learning_rate": 1.0834547489838721e-05, "loss": 0.2569, "loss_nan_ranks": 0, "loss_rank_avg": 0.2865585386753082, "step": 6300, "valid_targets_mean": 5426.2, "valid_targets_min": 1185 }, { "epoch": 4.8093058733791, "grad_norm": 0.591606504521793, "learning_rate": 1.0800755100265232e-05, "loss": 0.2837, "loss_nan_ranks": 0, "loss_rank_avg": 0.2531816363334656, "step": 6305, "valid_targets_mean": 3974.3, "valid_targets_min": 971 }, { "epoch": 4.813119755911518, "grad_norm": 0.46299858012511447, "learning_rate": 1.076699598713278e-05, "loss": 0.2711, "loss_nan_ranks": 0, "loss_rank_avg": 0.25391659140586853, "step": 6310, "valid_targets_mean": 4571.8, "valid_targets_min": 993 }, { "epoch": 4.816933638443936, "grad_norm": 0.43866444790079595, "learning_rate": 1.0733270272558239e-05, "loss": 0.2532, "loss_nan_ranks": 0, "loss_rank_avg": 0.2802743911743164, "step": 6315, "valid_targets_mean": 4542.2, "valid_targets_min": 244 }, { "epoch": 4.820747520976354, "grad_norm": 0.4551570589007343, "learning_rate": 1.0699578078537694e-05, "loss": 0.2525, "loss_nan_ranks": 0, "loss_rank_avg": 0.2353227138519287, "step": 6320, "valid_targets_mean": 4614.6, "valid_targets_min": 2119 }, { "epoch": 4.824561403508772, "grad_norm": 0.4701677190514475, "learning_rate": 1.0665919526945947e-05, "loss": 0.2649, "loss_nan_ranks": 0, "loss_rank_avg": 0.2597653567790985, "step": 6325, "valid_targets_mean": 4287.8, "valid_targets_min": 1232 }, { "epoch": 4.82837528604119, "grad_norm": 0.45065967973941917, "learning_rate": 1.0632294739536142e-05, "loss": 0.2855, "loss_nan_ranks": 0, "loss_rank_avg": 0.26184967160224915, "step": 6330, "valid_targets_mean": 4189.0, "valid_targets_min": 317 }, { "epoch": 4.832189168573608, "grad_norm": 0.4491956885125322, "learning_rate": 1.0598703837939248e-05, "loss": 0.2842, "loss_nan_ranks": 0, "loss_rank_avg": 0.26985234022140503, "step": 6335, "valid_targets_mean": 4688.4, "valid_targets_min": 1051 }, { "epoch": 4.836003051106026, "grad_norm": 0.47402852666197354, "learning_rate": 1.05651469436637e-05, "loss": 0.2604, "loss_nan_ranks": 0, "loss_rank_avg": 0.23498666286468506, "step": 6340, "valid_targets_mean": 5051.1, "valid_targets_min": 1277 }, { "epoch": 4.839816933638444, "grad_norm": 0.5845640550501232, "learning_rate": 1.0531624178094879e-05, "loss": 0.2609, "loss_nan_ranks": 0, "loss_rank_avg": 0.2578241229057312, "step": 6345, "valid_targets_mean": 2851.9, "valid_targets_min": 488 }, { "epoch": 4.843630816170862, "grad_norm": 0.4405871777300844, "learning_rate": 1.0498135662494735e-05, "loss": 0.2851, "loss_nan_ranks": 0, "loss_rank_avg": 0.27082574367523193, "step": 6350, "valid_targets_mean": 5172.5, "valid_targets_min": 728 }, { "epoch": 4.8474446987032795, "grad_norm": 0.4078096120879491, "learning_rate": 1.046468151800133e-05, "loss": 0.2532, "loss_nan_ranks": 0, "loss_rank_avg": 0.26433292031288147, "step": 6355, "valid_targets_mean": 5071.0, "valid_targets_min": 518 }, { "epoch": 4.851258581235698, "grad_norm": 0.45556925639901935, "learning_rate": 1.0431261865628373e-05, "loss": 0.2816, "loss_nan_ranks": 0, "loss_rank_avg": 0.3047320544719696, "step": 6360, "valid_targets_mean": 4966.4, "valid_targets_min": 565 }, { "epoch": 4.855072463768116, "grad_norm": 0.45539843805802527, "learning_rate": 1.0397876826264835e-05, "loss": 0.2757, "loss_nan_ranks": 0, "loss_rank_avg": 0.29343321919441223, "step": 6365, "valid_targets_mean": 5031.4, "valid_targets_min": 389 }, { "epoch": 4.858886346300534, "grad_norm": 0.5174457675449293, "learning_rate": 1.036452652067444e-05, "loss": 0.2584, "loss_nan_ranks": 0, "loss_rank_avg": 0.2625400722026825, "step": 6370, "valid_targets_mean": 3652.8, "valid_targets_min": 1119 }, { "epoch": 4.862700228832952, "grad_norm": 0.42023442456712606, "learning_rate": 1.033121106949532e-05, "loss": 0.2987, "loss_nan_ranks": 0, "loss_rank_avg": 0.27681344747543335, "step": 6375, "valid_targets_mean": 5527.3, "valid_targets_min": 1281 }, { "epoch": 4.86651411136537, "grad_norm": 0.4745097765595684, "learning_rate": 1.0297930593239483e-05, "loss": 0.2532, "loss_nan_ranks": 0, "loss_rank_avg": 0.25876760482788086, "step": 6380, "valid_targets_mean": 3772.8, "valid_targets_min": 609 }, { "epoch": 4.870327993897788, "grad_norm": 0.4452410560238349, "learning_rate": 1.0264685212292443e-05, "loss": 0.2855, "loss_nan_ranks": 0, "loss_rank_avg": 0.33578386902809143, "step": 6385, "valid_targets_mean": 4824.7, "valid_targets_min": 966 }, { "epoch": 4.874141876430206, "grad_norm": 0.44239743286286903, "learning_rate": 1.0231475046912771e-05, "loss": 0.2733, "loss_nan_ranks": 0, "loss_rank_avg": 0.29823407530784607, "step": 6390, "valid_targets_mean": 5004.5, "valid_targets_min": 1091 }, { "epoch": 4.877955758962624, "grad_norm": 0.5195950786044768, "learning_rate": 1.0198300217231627e-05, "loss": 0.4296, "loss_nan_ranks": 0, "loss_rank_avg": 0.30986395478248596, "step": 6395, "valid_targets_mean": 4166.0, "valid_targets_min": 580 }, { "epoch": 4.881769641495042, "grad_norm": 0.48620033251297656, "learning_rate": 1.0165160843252388e-05, "loss": 0.2597, "loss_nan_ranks": 0, "loss_rank_avg": 0.24216914176940918, "step": 6400, "valid_targets_mean": 3795.1, "valid_targets_min": 1023 }, { "epoch": 4.88558352402746, "grad_norm": 0.4409043094002218, "learning_rate": 1.0132057044850137e-05, "loss": 0.2639, "loss_nan_ranks": 0, "loss_rank_avg": 0.25296226143836975, "step": 6405, "valid_targets_mean": 4557.1, "valid_targets_min": 1657 }, { "epoch": 4.889397406559878, "grad_norm": 0.4893275906184621, "learning_rate": 1.0098988941771305e-05, "loss": 0.2662, "loss_nan_ranks": 0, "loss_rank_avg": 0.2721904218196869, "step": 6410, "valid_targets_mean": 4337.0, "valid_targets_min": 269 }, { "epoch": 4.893211289092296, "grad_norm": 0.473091196768073, "learning_rate": 1.0065956653633173e-05, "loss": 0.2732, "loss_nan_ranks": 0, "loss_rank_avg": 0.2775305509567261, "step": 6415, "valid_targets_mean": 4149.3, "valid_targets_min": 1155 }, { "epoch": 4.897025171624714, "grad_norm": 0.4611208289628004, "learning_rate": 1.0032960299923485e-05, "loss": 0.2841, "loss_nan_ranks": 0, "loss_rank_avg": 0.2669666111469269, "step": 6420, "valid_targets_mean": 4127.0, "valid_targets_min": 1402 }, { "epoch": 4.900839054157132, "grad_norm": 0.4446130762839984, "learning_rate": 1.0000000000000006e-05, "loss": 0.2607, "loss_nan_ranks": 0, "loss_rank_avg": 0.2863334119319916, "step": 6425, "valid_targets_mean": 5016.7, "valid_targets_min": 1316 }, { "epoch": 4.9046529366895495, "grad_norm": 0.4631447759575701, "learning_rate": 9.967075873090057e-06, "loss": 0.2864, "loss_nan_ranks": 0, "loss_rank_avg": 0.2800535559654236, "step": 6430, "valid_targets_mean": 4280.8, "valid_targets_min": 351 }, { "epoch": 4.908466819221968, "grad_norm": 0.4866673735485943, "learning_rate": 9.934188038290144e-06, "loss": 0.2701, "loss_nan_ranks": 0, "loss_rank_avg": 0.25013306736946106, "step": 6435, "valid_targets_mean": 3571.5, "valid_targets_min": 1055 }, { "epoch": 4.912280701754386, "grad_norm": 0.5676709320301305, "learning_rate": 9.90133661456546e-06, "loss": 0.2789, "loss_nan_ranks": 0, "loss_rank_avg": 0.3177274763584137, "step": 6440, "valid_targets_mean": 4374.2, "valid_targets_min": 1454 }, { "epoch": 4.916094584286804, "grad_norm": 0.474411723432594, "learning_rate": 9.86852172074952e-06, "loss": 0.2652, "loss_nan_ranks": 0, "loss_rank_avg": 0.2783035933971405, "step": 6445, "valid_targets_mean": 3933.2, "valid_targets_min": 1212 }, { "epoch": 4.919908466819222, "grad_norm": 0.4310577771224861, "learning_rate": 9.835743475543669e-06, "loss": 0.2717, "loss_nan_ranks": 0, "loss_rank_avg": 0.25968584418296814, "step": 6450, "valid_targets_mean": 4817.0, "valid_targets_min": 1630 }, { "epoch": 4.92372234935164, "grad_norm": 0.4256333701579665, "learning_rate": 9.80300199751671e-06, "loss": 0.2722, "loss_nan_ranks": 0, "loss_rank_avg": 0.2685914933681488, "step": 6455, "valid_targets_mean": 5068.5, "valid_targets_min": 1395 }, { "epoch": 4.927536231884058, "grad_norm": 0.4020917325980264, "learning_rate": 9.770297405104426e-06, "loss": 0.2738, "loss_nan_ranks": 0, "loss_rank_avg": 0.2310306578874588, "step": 6460, "valid_targets_mean": 5008.4, "valid_targets_min": 1203 }, { "epoch": 4.931350114416476, "grad_norm": 0.424080030882146, "learning_rate": 9.737629816609186e-06, "loss": 0.2829, "loss_nan_ranks": 0, "loss_rank_avg": 0.2726290225982666, "step": 6465, "valid_targets_mean": 5150.7, "valid_targets_min": 280 }, { "epoch": 4.935163996948894, "grad_norm": 0.5078040027460309, "learning_rate": 9.704999350199512e-06, "loss": 0.2608, "loss_nan_ranks": 0, "loss_rank_avg": 0.22907471656799316, "step": 6470, "valid_targets_mean": 3427.7, "valid_targets_min": 456 }, { "epoch": 4.938977879481312, "grad_norm": 0.47313149739798094, "learning_rate": 9.672406123909621e-06, "loss": 0.2816, "loss_nan_ranks": 0, "loss_rank_avg": 0.26523223519325256, "step": 6475, "valid_targets_mean": 4480.9, "valid_targets_min": 480 }, { "epoch": 4.94279176201373, "grad_norm": 0.612986995052608, "learning_rate": 9.639850255639047e-06, "loss": 0.2767, "loss_nan_ranks": 0, "loss_rank_avg": 0.3095862865447998, "step": 6480, "valid_targets_mean": 4458.4, "valid_targets_min": 1012 }, { "epoch": 4.946605644546148, "grad_norm": 0.4697376419383409, "learning_rate": 9.60733186315216e-06, "loss": 0.275, "loss_nan_ranks": 0, "loss_rank_avg": 0.2794733941555023, "step": 6485, "valid_targets_mean": 4355.2, "valid_targets_min": 1178 }, { "epoch": 4.950419527078566, "grad_norm": 0.4347464188066338, "learning_rate": 9.574851064077805e-06, "loss": 0.2536, "loss_nan_ranks": 0, "loss_rank_avg": 0.26758232712745667, "step": 6490, "valid_targets_mean": 5047.6, "valid_targets_min": 1477 }, { "epoch": 4.954233409610984, "grad_norm": 0.4523891272435883, "learning_rate": 9.542407975908801e-06, "loss": 0.2594, "loss_nan_ranks": 0, "loss_rank_avg": 0.2836798131465912, "step": 6495, "valid_targets_mean": 4667.2, "valid_targets_min": 941 }, { "epoch": 4.958047292143402, "grad_norm": 0.4439635451916094, "learning_rate": 9.510002716001591e-06, "loss": 0.2752, "loss_nan_ranks": 0, "loss_rank_avg": 0.291238009929657, "step": 6500, "valid_targets_mean": 5885.6, "valid_targets_min": 1412 }, { "epoch": 4.96186117467582, "grad_norm": 0.5153040180095564, "learning_rate": 9.477635401575752e-06, "loss": 0.251, "loss_nan_ranks": 0, "loss_rank_avg": 0.24549072980880737, "step": 6505, "valid_targets_mean": 3759.1, "valid_targets_min": 986 }, { "epoch": 4.965675057208238, "grad_norm": 0.5275444608815067, "learning_rate": 9.44530614971362e-06, "loss": 0.2679, "loss_nan_ranks": 0, "loss_rank_avg": 0.27426838874816895, "step": 6510, "valid_targets_mean": 3683.1, "valid_targets_min": 948 }, { "epoch": 4.969488939740656, "grad_norm": 0.441657014255363, "learning_rate": 9.41301507735985e-06, "loss": 0.2853, "loss_nan_ranks": 0, "loss_rank_avg": 0.29648175835609436, "step": 6515, "valid_targets_mean": 4722.1, "valid_targets_min": 1067 }, { "epoch": 4.973302822273074, "grad_norm": 0.4116526665237431, "learning_rate": 9.380762301320964e-06, "loss": 0.2646, "loss_nan_ranks": 0, "loss_rank_avg": 0.2626621425151825, "step": 6520, "valid_targets_mean": 5578.3, "valid_targets_min": 833 }, { "epoch": 4.977116704805492, "grad_norm": 0.45738516459947337, "learning_rate": 9.348547938264993e-06, "loss": 0.2736, "loss_nan_ranks": 0, "loss_rank_avg": 0.26601141691207886, "step": 6525, "valid_targets_mean": 4418.0, "valid_targets_min": 951 }, { "epoch": 4.98093058733791, "grad_norm": 0.43957493723393576, "learning_rate": 9.316372104720978e-06, "loss": 0.2788, "loss_nan_ranks": 0, "loss_rank_avg": 0.2962207794189453, "step": 6530, "valid_targets_mean": 5003.0, "valid_targets_min": 1026 }, { "epoch": 4.9847444698703285, "grad_norm": 0.4406600914628833, "learning_rate": 9.284234917078618e-06, "loss": 0.2676, "loss_nan_ranks": 0, "loss_rank_avg": 0.27836713194847107, "step": 6535, "valid_targets_mean": 4530.5, "valid_targets_min": 363 }, { "epoch": 4.988558352402746, "grad_norm": 0.4929584772121223, "learning_rate": 9.252136491587796e-06, "loss": 0.2748, "loss_nan_ranks": 0, "loss_rank_avg": 0.30669355392456055, "step": 6540, "valid_targets_mean": 4779.3, "valid_targets_min": 855 }, { "epoch": 4.992372234935164, "grad_norm": 0.45919666024271943, "learning_rate": 9.220076944358198e-06, "loss": 0.2653, "loss_nan_ranks": 0, "loss_rank_avg": 0.2921316623687744, "step": 6545, "valid_targets_mean": 4566.1, "valid_targets_min": 993 }, { "epoch": 4.996186117467582, "grad_norm": 0.496912636598731, "learning_rate": 9.188056391358857e-06, "loss": 0.2853, "loss_nan_ranks": 0, "loss_rank_avg": 0.33465495705604553, "step": 6550, "valid_targets_mean": 4712.3, "valid_targets_min": 1218 }, { "epoch": 5.0, "grad_norm": 1.4334764781852514, "learning_rate": 9.15607494841777e-06, "loss": 0.4533, "loss_nan_ranks": 0, "loss_rank_avg": 0.4589976370334625, "step": 6555, "valid_targets_mean": 858.8, "valid_targets_min": 497 }, { "epoch": 5.003813882532418, "grad_norm": 0.4637236359062967, "learning_rate": 9.12413273122146e-06, "loss": 0.2601, "loss_nan_ranks": 0, "loss_rank_avg": 0.30440065264701843, "step": 6560, "valid_targets_mean": 5229.4, "valid_targets_min": 1152 }, { "epoch": 5.007627765064836, "grad_norm": 0.5731758576495917, "learning_rate": 9.092229855314541e-06, "loss": 0.2819, "loss_nan_ranks": 0, "loss_rank_avg": 0.34112057089805603, "step": 6565, "valid_targets_mean": 3283.0, "valid_targets_min": 660 }, { "epoch": 5.011441647597254, "grad_norm": 0.46800535106530056, "learning_rate": 9.060366436099337e-06, "loss": 0.2504, "loss_nan_ranks": 0, "loss_rank_avg": 0.2606760263442993, "step": 6570, "valid_targets_mean": 4470.2, "valid_targets_min": 1025 }, { "epoch": 5.015255530129672, "grad_norm": 0.6137644660052498, "learning_rate": 9.02854258883543e-06, "loss": 0.2765, "loss_nan_ranks": 0, "loss_rank_avg": 0.2700829803943634, "step": 6575, "valid_targets_mean": 4210.0, "valid_targets_min": 345 }, { "epoch": 5.01906941266209, "grad_norm": 0.4878235171922639, "learning_rate": 8.996758428639276e-06, "loss": 0.2645, "loss_nan_ranks": 0, "loss_rank_avg": 0.2577427923679352, "step": 6580, "valid_targets_mean": 4130.4, "valid_targets_min": 1404 }, { "epoch": 5.022883295194508, "grad_norm": 0.4751599864581177, "learning_rate": 8.965014070483749e-06, "loss": 0.2762, "loss_nan_ranks": 0, "loss_rank_avg": 0.24149303138256073, "step": 6585, "valid_targets_mean": 3961.3, "valid_targets_min": 1118 }, { "epoch": 5.026697177726926, "grad_norm": 0.4592892732948017, "learning_rate": 8.933309629197773e-06, "loss": 0.2694, "loss_nan_ranks": 0, "loss_rank_avg": 0.2872866988182068, "step": 6590, "valid_targets_mean": 4570.6, "valid_targets_min": 782 }, { "epoch": 5.030511060259344, "grad_norm": 0.4243811711385429, "learning_rate": 8.901645219465848e-06, "loss": 0.2914, "loss_nan_ranks": 0, "loss_rank_avg": 0.2821787893772125, "step": 6595, "valid_targets_mean": 4959.4, "valid_targets_min": 1531 }, { "epoch": 5.034324942791762, "grad_norm": 0.40234791333162984, "learning_rate": 8.870020955827697e-06, "loss": 0.2428, "loss_nan_ranks": 0, "loss_rank_avg": 0.24314086139202118, "step": 6600, "valid_targets_mean": 4961.0, "valid_targets_min": 1151 }, { "epoch": 5.03813882532418, "grad_norm": 0.47734966546802016, "learning_rate": 8.838436952677819e-06, "loss": 0.2529, "loss_nan_ranks": 0, "loss_rank_avg": 0.2361879199743271, "step": 6605, "valid_targets_mean": 3586.6, "valid_targets_min": 449 }, { "epoch": 5.041952707856598, "grad_norm": 0.49430140990989624, "learning_rate": 8.806893324265055e-06, "loss": 0.2775, "loss_nan_ranks": 0, "loss_rank_avg": 0.3115706145763397, "step": 6610, "valid_targets_mean": 4680.6, "valid_targets_min": 1299 }, { "epoch": 5.045766590389016, "grad_norm": 0.455707973439489, "learning_rate": 8.775390184692232e-06, "loss": 0.2595, "loss_nan_ranks": 0, "loss_rank_avg": 0.26760897040367126, "step": 6615, "valid_targets_mean": 4604.5, "valid_targets_min": 833 }, { "epoch": 5.049580472921434, "grad_norm": 0.5010384461705412, "learning_rate": 8.74392764791568e-06, "loss": 0.2579, "loss_nan_ranks": 0, "loss_rank_avg": 0.2379763126373291, "step": 6620, "valid_targets_mean": 3717.8, "valid_targets_min": 301 }, { "epoch": 5.053394355453852, "grad_norm": 0.5298371448753371, "learning_rate": 8.712505827744898e-06, "loss": 0.2715, "loss_nan_ranks": 0, "loss_rank_avg": 0.3061905801296234, "step": 6625, "valid_targets_mean": 3829.6, "valid_targets_min": 1278 }, { "epoch": 5.05720823798627, "grad_norm": 0.4453159473628936, "learning_rate": 8.681124837842057e-06, "loss": 0.2738, "loss_nan_ranks": 0, "loss_rank_avg": 0.2787354290485382, "step": 6630, "valid_targets_mean": 5117.9, "valid_targets_min": 938 }, { "epoch": 5.061022120518688, "grad_norm": 0.47857296510039227, "learning_rate": 8.64978479172167e-06, "loss": 0.2681, "loss_nan_ranks": 0, "loss_rank_avg": 0.26554688811302185, "step": 6635, "valid_targets_mean": 4001.0, "valid_targets_min": 768 }, { "epoch": 5.064836003051106, "grad_norm": 0.46676260966328054, "learning_rate": 8.618485802750119e-06, "loss": 0.2749, "loss_nan_ranks": 0, "loss_rank_avg": 0.28517279028892517, "step": 6640, "valid_targets_mean": 4640.2, "valid_targets_min": 956 }, { "epoch": 5.068649885583524, "grad_norm": 0.47928071968710284, "learning_rate": 8.58722798414528e-06, "loss": 0.2719, "loss_nan_ranks": 0, "loss_rank_avg": 0.27151843905448914, "step": 6645, "valid_targets_mean": 4000.2, "valid_targets_min": 1232 }, { "epoch": 5.072463768115942, "grad_norm": 0.4471785238558857, "learning_rate": 8.556011448976111e-06, "loss": 0.2641, "loss_nan_ranks": 0, "loss_rank_avg": 0.25223401188850403, "step": 6650, "valid_targets_mean": 4390.5, "valid_targets_min": 659 }, { "epoch": 5.07627765064836, "grad_norm": 0.4668781382048033, "learning_rate": 8.524836310162217e-06, "loss": 0.2685, "loss_nan_ranks": 0, "loss_rank_avg": 0.2625182271003723, "step": 6655, "valid_targets_mean": 4160.7, "valid_targets_min": 972 }, { "epoch": 5.080091533180778, "grad_norm": 0.497840738820478, "learning_rate": 8.493702680473481e-06, "loss": 0.2524, "loss_nan_ranks": 0, "loss_rank_avg": 0.22448588907718658, "step": 6660, "valid_targets_mean": 3680.2, "valid_targets_min": 1247 }, { "epoch": 5.083905415713196, "grad_norm": 0.48363425185296266, "learning_rate": 8.462610672529608e-06, "loss": 0.275, "loss_nan_ranks": 0, "loss_rank_avg": 0.23800963163375854, "step": 6665, "valid_targets_mean": 4145.7, "valid_targets_min": 1149 }, { "epoch": 5.087719298245614, "grad_norm": 0.447347355895507, "learning_rate": 8.431560398799779e-06, "loss": 0.2683, "loss_nan_ranks": 0, "loss_rank_avg": 0.2579364478588104, "step": 6670, "valid_targets_mean": 4632.5, "valid_targets_min": 1081 }, { "epoch": 5.091533180778032, "grad_norm": 0.4394024565255274, "learning_rate": 8.400551971602171e-06, "loss": 0.2825, "loss_nan_ranks": 0, "loss_rank_avg": 0.27306821942329407, "step": 6675, "valid_targets_mean": 4924.3, "valid_targets_min": 1112 }, { "epoch": 5.09534706331045, "grad_norm": 0.41078294685140615, "learning_rate": 8.369585503103628e-06, "loss": 0.2619, "loss_nan_ranks": 0, "loss_rank_avg": 0.21968694031238556, "step": 6680, "valid_targets_mean": 4687.0, "valid_targets_min": 1765 }, { "epoch": 5.099160945842868, "grad_norm": 0.4286895396734995, "learning_rate": 8.338661105319186e-06, "loss": 0.2545, "loss_nan_ranks": 0, "loss_rank_avg": 0.2512158751487732, "step": 6685, "valid_targets_mean": 4783.9, "valid_targets_min": 872 }, { "epoch": 5.102974828375286, "grad_norm": 0.4346920938094104, "learning_rate": 8.30777889011172e-06, "loss": 0.2691, "loss_nan_ranks": 0, "loss_rank_avg": 0.2605276107788086, "step": 6690, "valid_targets_mean": 4795.2, "valid_targets_min": 1039 }, { "epoch": 5.106788710907704, "grad_norm": 0.44722763124062953, "learning_rate": 8.276938969191506e-06, "loss": 0.2738, "loss_nan_ranks": 0, "loss_rank_avg": 0.29144763946533203, "step": 6695, "valid_targets_mean": 5161.2, "valid_targets_min": 1295 }, { "epoch": 5.110602593440122, "grad_norm": 0.46646851736725947, "learning_rate": 8.246141454115821e-06, "loss": 0.2691, "loss_nan_ranks": 0, "loss_rank_avg": 0.22032219171524048, "step": 6700, "valid_targets_mean": 3884.6, "valid_targets_min": 1002 }, { "epoch": 5.11441647597254, "grad_norm": 0.5070689669662287, "learning_rate": 8.215386456288576e-06, "loss": 0.2584, "loss_nan_ranks": 0, "loss_rank_avg": 0.27866432070732117, "step": 6705, "valid_targets_mean": 4045.0, "valid_targets_min": 1020 }, { "epoch": 5.118230358504958, "grad_norm": 0.9995311563170907, "learning_rate": 8.18467408695985e-06, "loss": 0.259, "loss_nan_ranks": 0, "loss_rank_avg": 0.2413589358329773, "step": 6710, "valid_targets_mean": 4955.4, "valid_targets_min": 1056 }, { "epoch": 5.122044241037376, "grad_norm": 0.40195021820199256, "learning_rate": 8.154004457225547e-06, "loss": 0.2708, "loss_nan_ranks": 0, "loss_rank_avg": 0.23771731555461884, "step": 6715, "valid_targets_mean": 4887.3, "valid_targets_min": 1317 }, { "epoch": 5.125858123569794, "grad_norm": 0.4960976441570362, "learning_rate": 8.123377678026962e-06, "loss": 0.4059, "loss_nan_ranks": 0, "loss_rank_avg": 0.26147928833961487, "step": 6720, "valid_targets_mean": 3697.1, "valid_targets_min": 433 }, { "epoch": 5.129672006102212, "grad_norm": 0.4880702087976833, "learning_rate": 8.092793860150376e-06, "loss": 0.2765, "loss_nan_ranks": 0, "loss_rank_avg": 0.27091705799102783, "step": 6725, "valid_targets_mean": 4247.1, "valid_targets_min": 939 }, { "epoch": 5.13348588863463, "grad_norm": 0.4984676713106216, "learning_rate": 8.062253114226688e-06, "loss": 0.274, "loss_nan_ranks": 0, "loss_rank_avg": 0.24456210434436798, "step": 6730, "valid_targets_mean": 3648.6, "valid_targets_min": 1373 }, { "epoch": 5.137299771167048, "grad_norm": 0.4626797380175307, "learning_rate": 8.031755550730966e-06, "loss": 0.2825, "loss_nan_ranks": 0, "loss_rank_avg": 0.22191393375396729, "step": 6735, "valid_targets_mean": 3943.0, "valid_targets_min": 990 }, { "epoch": 5.141113653699466, "grad_norm": 0.4684925381564363, "learning_rate": 8.0013012799821e-06, "loss": 0.2603, "loss_nan_ranks": 0, "loss_rank_avg": 0.2535335123538971, "step": 6740, "valid_targets_mean": 4291.0, "valid_targets_min": 1033 }, { "epoch": 5.144927536231884, "grad_norm": 0.5231522942873892, "learning_rate": 7.970890412142349e-06, "loss": 0.2725, "loss_nan_ranks": 0, "loss_rank_avg": 0.2535442113876343, "step": 6745, "valid_targets_mean": 3662.4, "valid_targets_min": 874 }, { "epoch": 5.148741418764302, "grad_norm": 0.47740089425599175, "learning_rate": 7.940523057217007e-06, "loss": 0.2804, "loss_nan_ranks": 0, "loss_rank_avg": 0.27571263909339905, "step": 6750, "valid_targets_mean": 4590.5, "valid_targets_min": 934 }, { "epoch": 5.1525553012967205, "grad_norm": 0.4694998058736014, "learning_rate": 7.910199325053926e-06, "loss": 0.2831, "loss_nan_ranks": 0, "loss_rank_avg": 0.29670730233192444, "step": 6755, "valid_targets_mean": 5085.7, "valid_targets_min": 1068 }, { "epoch": 5.156369183829138, "grad_norm": 0.5035311411179674, "learning_rate": 7.879919325343198e-06, "loss": 0.2671, "loss_nan_ranks": 0, "loss_rank_avg": 0.24500465393066406, "step": 6760, "valid_targets_mean": 3302.5, "valid_targets_min": 1013 }, { "epoch": 5.160183066361556, "grad_norm": 0.47053806545490146, "learning_rate": 7.849683167616706e-06, "loss": 0.2512, "loss_nan_ranks": 0, "loss_rank_avg": 0.26875197887420654, "step": 6765, "valid_targets_mean": 4434.8, "valid_targets_min": 1002 }, { "epoch": 5.163996948893974, "grad_norm": 0.47086093470609763, "learning_rate": 7.819490961247738e-06, "loss": 0.2438, "loss_nan_ranks": 0, "loss_rank_avg": 0.2104368805885315, "step": 6770, "valid_targets_mean": 3852.2, "valid_targets_min": 870 }, { "epoch": 5.167810831426392, "grad_norm": 0.4278205498892171, "learning_rate": 7.789342815450614e-06, "loss": 0.2811, "loss_nan_ranks": 0, "loss_rank_avg": 0.29282939434051514, "step": 6775, "valid_targets_mean": 6059.0, "valid_targets_min": 865 }, { "epoch": 5.17162471395881, "grad_norm": 0.4634629507302458, "learning_rate": 7.759238839280245e-06, "loss": 0.2625, "loss_nan_ranks": 0, "loss_rank_avg": 0.2758885324001312, "step": 6780, "valid_targets_mean": 4304.7, "valid_targets_min": 890 }, { "epoch": 5.175438596491228, "grad_norm": 0.45836552925576557, "learning_rate": 7.729179141631804e-06, "loss": 0.2558, "loss_nan_ranks": 0, "loss_rank_avg": 0.2779264450073242, "step": 6785, "valid_targets_mean": 5225.0, "valid_targets_min": 1847 }, { "epoch": 5.1792524790236465, "grad_norm": 0.438575576795386, "learning_rate": 7.69916383124026e-06, "loss": 0.274, "loss_nan_ranks": 0, "loss_rank_avg": 0.2508902847766876, "step": 6790, "valid_targets_mean": 5232.6, "valid_targets_min": 1525 }, { "epoch": 5.183066361556064, "grad_norm": 0.4523443599950125, "learning_rate": 7.669193016680049e-06, "loss": 0.2659, "loss_nan_ranks": 0, "loss_rank_avg": 0.2792450189590454, "step": 6795, "valid_targets_mean": 4931.0, "valid_targets_min": 1398 }, { "epoch": 5.186880244088482, "grad_norm": 0.5896330188216606, "learning_rate": 7.639266806364627e-06, "loss": 0.262, "loss_nan_ranks": 0, "loss_rank_avg": 0.2727765738964081, "step": 6800, "valid_targets_mean": 4803.3, "valid_targets_min": 787 }, { "epoch": 5.1906941266209, "grad_norm": 0.4007427104448006, "learning_rate": 7.60938530854612e-06, "loss": 0.2658, "loss_nan_ranks": 0, "loss_rank_avg": 0.25615957379341125, "step": 6805, "valid_targets_mean": 5634.1, "valid_targets_min": 1214 }, { "epoch": 5.194508009153318, "grad_norm": 0.476018360455716, "learning_rate": 7.579548631314919e-06, "loss": 0.2715, "loss_nan_ranks": 0, "loss_rank_avg": 0.22604842483997345, "step": 6810, "valid_targets_mean": 4041.0, "valid_targets_min": 1198 }, { "epoch": 5.198321891685736, "grad_norm": 0.4746406522279334, "learning_rate": 7.549756882599262e-06, "loss": 0.2648, "loss_nan_ranks": 0, "loss_rank_avg": 0.2810885012149811, "step": 6815, "valid_targets_mean": 4864.0, "valid_targets_min": 348 }, { "epoch": 5.202135774218154, "grad_norm": 0.44123239571536454, "learning_rate": 7.520010170164897e-06, "loss": 0.2609, "loss_nan_ranks": 0, "loss_rank_avg": 0.29340696334838867, "step": 6820, "valid_targets_mean": 4571.4, "valid_targets_min": 1294 }, { "epoch": 5.2059496567505725, "grad_norm": 0.5181410495929143, "learning_rate": 7.490308601614633e-06, "loss": 0.2865, "loss_nan_ranks": 0, "loss_rank_avg": 0.3056938648223877, "step": 6825, "valid_targets_mean": 3920.4, "valid_targets_min": 934 }, { "epoch": 5.20976353928299, "grad_norm": 0.43776302603903644, "learning_rate": 7.460652284388006e-06, "loss": 0.2601, "loss_nan_ranks": 0, "loss_rank_avg": 0.2616339325904846, "step": 6830, "valid_targets_mean": 4601.6, "valid_targets_min": 863 }, { "epoch": 5.213577421815408, "grad_norm": 0.4420958323537919, "learning_rate": 7.431041325760842e-06, "loss": 0.283, "loss_nan_ranks": 0, "loss_rank_avg": 0.28292545676231384, "step": 6835, "valid_targets_mean": 4929.3, "valid_targets_min": 981 }, { "epoch": 5.217391304347826, "grad_norm": 0.44810324346126695, "learning_rate": 7.4014758328449134e-06, "loss": 0.282, "loss_nan_ranks": 0, "loss_rank_avg": 0.2579541802406311, "step": 6840, "valid_targets_mean": 4549.0, "valid_targets_min": 1071 }, { "epoch": 5.221205186880244, "grad_norm": 0.461760509560138, "learning_rate": 7.3719559125875055e-06, "loss": 0.2626, "loss_nan_ranks": 0, "loss_rank_avg": 0.2631801664829254, "step": 6845, "valid_targets_mean": 4591.1, "valid_targets_min": 1050 }, { "epoch": 5.225019069412662, "grad_norm": 0.44979052496347216, "learning_rate": 7.342481671771069e-06, "loss": 0.2778, "loss_nan_ranks": 0, "loss_rank_avg": 0.3014061152935028, "step": 6850, "valid_targets_mean": 4955.3, "valid_targets_min": 935 }, { "epoch": 5.22883295194508, "grad_norm": 0.45496952765153387, "learning_rate": 7.313053217012827e-06, "loss": 0.2997, "loss_nan_ranks": 0, "loss_rank_avg": 0.2862650752067566, "step": 6855, "valid_targets_mean": 4854.8, "valid_targets_min": 1379 }, { "epoch": 5.232646834477498, "grad_norm": 0.4852937715560849, "learning_rate": 7.28367065476435e-06, "loss": 0.2606, "loss_nan_ranks": 0, "loss_rank_avg": 0.27204573154449463, "step": 6860, "valid_targets_mean": 4125.8, "valid_targets_min": 1221 }, { "epoch": 5.236460717009916, "grad_norm": 0.4984472817633318, "learning_rate": 7.254334091311239e-06, "loss": 0.2882, "loss_nan_ranks": 0, "loss_rank_avg": 0.2766822576522827, "step": 6865, "valid_targets_mean": 4148.9, "valid_targets_min": 1389 }, { "epoch": 5.240274599542334, "grad_norm": 0.5046422054288014, "learning_rate": 7.225043632772666e-06, "loss": 0.2567, "loss_nan_ranks": 0, "loss_rank_avg": 0.23229973018169403, "step": 6870, "valid_targets_mean": 3703.2, "valid_targets_min": 1119 }, { "epoch": 5.244088482074752, "grad_norm": 0.47075224858655285, "learning_rate": 7.195799385101066e-06, "loss": 0.2693, "loss_nan_ranks": 0, "loss_rank_avg": 0.21081803739070892, "step": 6875, "valid_targets_mean": 4031.1, "valid_targets_min": 1148 }, { "epoch": 5.24790236460717, "grad_norm": 1.06539071338913, "learning_rate": 7.166601454081674e-06, "loss": 0.3034, "loss_nan_ranks": 0, "loss_rank_avg": 0.39799293875694275, "step": 6880, "valid_targets_mean": 1204.7, "valid_targets_min": 562 }, { "epoch": 5.251716247139588, "grad_norm": 0.8053847363374328, "learning_rate": 7.1374499453322265e-06, "loss": 0.448, "loss_nan_ranks": 0, "loss_rank_avg": 0.3278617262840271, "step": 6885, "valid_targets_mean": 1777.9, "valid_targets_min": 629 }, { "epoch": 5.255530129672006, "grad_norm": 0.49179591973926917, "learning_rate": 7.108344964302499e-06, "loss": 0.2804, "loss_nan_ranks": 0, "loss_rank_avg": 0.2707764208316803, "step": 6890, "valid_targets_mean": 4019.2, "valid_targets_min": 610 }, { "epoch": 5.259344012204424, "grad_norm": 0.4672780099759257, "learning_rate": 7.079286616273986e-06, "loss": 0.2592, "loss_nan_ranks": 0, "loss_rank_avg": 0.21976228058338165, "step": 6895, "valid_targets_mean": 4157.5, "valid_targets_min": 1035 }, { "epoch": 5.2631578947368425, "grad_norm": 0.44433342694406336, "learning_rate": 7.050275006359493e-06, "loss": 0.2841, "loss_nan_ranks": 0, "loss_rank_avg": 0.29698076844215393, "step": 6900, "valid_targets_mean": 5283.3, "valid_targets_min": 1131 }, { "epoch": 5.26697177726926, "grad_norm": 0.5223006039476878, "learning_rate": 7.0213102395027475e-06, "loss": 0.2701, "loss_nan_ranks": 0, "loss_rank_avg": 0.27178704738616943, "step": 6905, "valid_targets_mean": 3426.8, "valid_targets_min": 1044 }, { "epoch": 5.270785659801678, "grad_norm": 0.4809130633033059, "learning_rate": 6.9923924204780495e-06, "loss": 0.2789, "loss_nan_ranks": 0, "loss_rank_avg": 0.2610607147216797, "step": 6910, "valid_targets_mean": 4059.3, "valid_targets_min": 385 }, { "epoch": 5.274599542334096, "grad_norm": 0.5044092120968204, "learning_rate": 6.963521653889853e-06, "loss": 0.2734, "loss_nan_ranks": 0, "loss_rank_avg": 0.28660058975219727, "step": 6915, "valid_targets_mean": 4845.2, "valid_targets_min": 978 }, { "epoch": 5.278413424866514, "grad_norm": 0.5104496438847528, "learning_rate": 6.934698044172435e-06, "loss": 0.2453, "loss_nan_ranks": 0, "loss_rank_avg": 0.24992434680461884, "step": 6920, "valid_targets_mean": 3877.2, "valid_targets_min": 468 }, { "epoch": 5.282227307398932, "grad_norm": 0.5110715915878371, "learning_rate": 6.905921695589461e-06, "loss": 0.271, "loss_nan_ranks": 0, "loss_rank_avg": 0.24427704513072968, "step": 6925, "valid_targets_mean": 4894.0, "valid_targets_min": 1049 }, { "epoch": 5.28604118993135, "grad_norm": 0.4788393046415271, "learning_rate": 6.877192712233673e-06, "loss": 0.2632, "loss_nan_ranks": 0, "loss_rank_avg": 0.2587161362171173, "step": 6930, "valid_targets_mean": 4604.5, "valid_targets_min": 1024 }, { "epoch": 5.2898550724637685, "grad_norm": 0.5212077492613079, "learning_rate": 6.8485111980264485e-06, "loss": 0.2513, "loss_nan_ranks": 0, "loss_rank_avg": 0.25677958130836487, "step": 6935, "valid_targets_mean": 4370.5, "valid_targets_min": 1018 }, { "epoch": 5.293668954996186, "grad_norm": 0.5081127694045978, "learning_rate": 6.819877256717471e-06, "loss": 0.2515, "loss_nan_ranks": 0, "loss_rank_avg": 0.2486242800951004, "step": 6940, "valid_targets_mean": 3836.2, "valid_targets_min": 336 }, { "epoch": 5.297482837528604, "grad_norm": 0.46264486257794624, "learning_rate": 6.791290991884343e-06, "loss": 0.2555, "loss_nan_ranks": 0, "loss_rank_avg": 0.2491236925125122, "step": 6945, "valid_targets_mean": 4162.0, "valid_targets_min": 1472 }, { "epoch": 5.301296720061022, "grad_norm": 0.5517594238630391, "learning_rate": 6.762752506932186e-06, "loss": 0.2627, "loss_nan_ranks": 0, "loss_rank_avg": 0.23130156099796295, "step": 6950, "valid_targets_mean": 4125.0, "valid_targets_min": 1314 }, { "epoch": 5.30511060259344, "grad_norm": 0.5117419037061384, "learning_rate": 6.734261905093315e-06, "loss": 0.2773, "loss_nan_ranks": 0, "loss_rank_avg": 0.29466712474823, "step": 6955, "valid_targets_mean": 4019.8, "valid_targets_min": 1289 }, { "epoch": 5.308924485125858, "grad_norm": 0.4774587493320638, "learning_rate": 6.705819289426807e-06, "loss": 0.2625, "loss_nan_ranks": 0, "loss_rank_avg": 0.23725992441177368, "step": 6960, "valid_targets_mean": 4301.6, "valid_targets_min": 504 }, { "epoch": 5.312738367658276, "grad_norm": 0.4367236063617533, "learning_rate": 6.67742476281819e-06, "loss": 0.2591, "loss_nan_ranks": 0, "loss_rank_avg": 0.27271658182144165, "step": 6965, "valid_targets_mean": 4865.9, "valid_targets_min": 1739 }, { "epoch": 5.3165522501906946, "grad_norm": 0.5402725692551985, "learning_rate": 6.649078427979008e-06, "loss": 0.267, "loss_nan_ranks": 0, "loss_rank_avg": 0.31718483567237854, "step": 6970, "valid_targets_mean": 3822.7, "valid_targets_min": 674 }, { "epoch": 5.320366132723112, "grad_norm": 0.5475992817437416, "learning_rate": 6.62078038744651e-06, "loss": 0.2461, "loss_nan_ranks": 0, "loss_rank_avg": 0.2607622444629669, "step": 6975, "valid_targets_mean": 3495.9, "valid_targets_min": 274 }, { "epoch": 5.32418001525553, "grad_norm": 0.44930905451217984, "learning_rate": 6.592530743583223e-06, "loss": 0.258, "loss_nan_ranks": 0, "loss_rank_avg": 0.23356647789478302, "step": 6980, "valid_targets_mean": 4413.0, "valid_targets_min": 1244 }, { "epoch": 5.327993897787948, "grad_norm": 0.49257972443447445, "learning_rate": 6.564329598576631e-06, "loss": 0.277, "loss_nan_ranks": 0, "loss_rank_avg": 0.3146706521511078, "step": 6985, "valid_targets_mean": 4495.7, "valid_targets_min": 919 }, { "epoch": 5.331807780320366, "grad_norm": 0.4915267580498807, "learning_rate": 6.536177054438777e-06, "loss": 0.2601, "loss_nan_ranks": 0, "loss_rank_avg": 0.2633446455001831, "step": 6990, "valid_targets_mean": 4100.7, "valid_targets_min": 1543 }, { "epoch": 5.335621662852784, "grad_norm": 0.527306128608921, "learning_rate": 6.508073213005886e-06, "loss": 0.252, "loss_nan_ranks": 0, "loss_rank_avg": 0.28533294796943665, "step": 6995, "valid_targets_mean": 3935.1, "valid_targets_min": 890 }, { "epoch": 5.339435545385202, "grad_norm": 0.49659900179345723, "learning_rate": 6.480018175938032e-06, "loss": 0.2592, "loss_nan_ranks": 0, "loss_rank_avg": 0.2267284244298935, "step": 7000, "valid_targets_mean": 3676.0, "valid_targets_min": 1351 }, { "epoch": 5.34324942791762, "grad_norm": 0.431485347943722, "learning_rate": 6.4520120447187366e-06, "loss": 0.279, "loss_nan_ranks": 0, "loss_rank_avg": 0.27338099479675293, "step": 7005, "valid_targets_mean": 5130.5, "valid_targets_min": 1279 }, { "epoch": 5.3470633104500385, "grad_norm": 0.4509333030627232, "learning_rate": 6.424054920654607e-06, "loss": 0.255, "loss_nan_ranks": 0, "loss_rank_avg": 0.27152150869369507, "step": 7010, "valid_targets_mean": 4593.5, "valid_targets_min": 1281 }, { "epoch": 5.350877192982456, "grad_norm": 0.4756213671492397, "learning_rate": 6.396146904875001e-06, "loss": 0.2675, "loss_nan_ranks": 0, "loss_rank_avg": 0.2602352201938629, "step": 7015, "valid_targets_mean": 4143.6, "valid_targets_min": 1026 }, { "epoch": 5.354691075514874, "grad_norm": 0.4366604334192552, "learning_rate": 6.368288098331605e-06, "loss": 0.2617, "loss_nan_ranks": 0, "loss_rank_avg": 0.2461734563112259, "step": 7020, "valid_targets_mean": 4280.2, "valid_targets_min": 1094 }, { "epoch": 5.358504958047292, "grad_norm": 0.49410785049881645, "learning_rate": 6.340478601798132e-06, "loss": 0.2561, "loss_nan_ranks": 0, "loss_rank_avg": 0.26815125346183777, "step": 7025, "valid_targets_mean": 4111.7, "valid_targets_min": 1306 }, { "epoch": 5.36231884057971, "grad_norm": 0.45759646347454747, "learning_rate": 6.312718515869902e-06, "loss": 0.2611, "loss_nan_ranks": 0, "loss_rank_avg": 0.22155439853668213, "step": 7030, "valid_targets_mean": 4103.8, "valid_targets_min": 447 }, { "epoch": 5.366132723112128, "grad_norm": 0.4845186523017412, "learning_rate": 6.285007940963519e-06, "loss": 0.2579, "loss_nan_ranks": 0, "loss_rank_avg": 0.27183595299720764, "step": 7035, "valid_targets_mean": 3842.2, "valid_targets_min": 395 }, { "epoch": 5.369946605644546, "grad_norm": 0.4573500237101827, "learning_rate": 6.257346977316474e-06, "loss": 0.248, "loss_nan_ranks": 0, "loss_rank_avg": 0.2306838482618332, "step": 7040, "valid_targets_mean": 4493.4, "valid_targets_min": 1671 }, { "epoch": 5.3737604881769645, "grad_norm": 0.9156027305404644, "learning_rate": 6.229735724986821e-06, "loss": 0.277, "loss_nan_ranks": 0, "loss_rank_avg": 0.3673783540725708, "step": 7045, "valid_targets_mean": 1448.0, "valid_targets_min": 675 }, { "epoch": 5.377574370709382, "grad_norm": 0.5348366671099393, "learning_rate": 6.202174283852766e-06, "loss": 0.3431, "loss_nan_ranks": 0, "loss_rank_avg": 0.2646300494670868, "step": 7050, "valid_targets_mean": 4003.0, "valid_targets_min": 1379 }, { "epoch": 5.3813882532418, "grad_norm": 0.4493967568819422, "learning_rate": 6.174662753612355e-06, "loss": 0.2824, "loss_nan_ranks": 0, "loss_rank_avg": 0.2676180601119995, "step": 7055, "valid_targets_mean": 4638.2, "valid_targets_min": 1044 }, { "epoch": 5.385202135774218, "grad_norm": 0.44339585866075004, "learning_rate": 6.147201233783087e-06, "loss": 0.2715, "loss_nan_ranks": 0, "loss_rank_avg": 0.2779521048069, "step": 7060, "valid_targets_mean": 4827.2, "valid_targets_min": 416 }, { "epoch": 5.389016018306636, "grad_norm": 0.4916923429041741, "learning_rate": 6.119789823701548e-06, "loss": 0.2664, "loss_nan_ranks": 0, "loss_rank_avg": 0.26473018527030945, "step": 7065, "valid_targets_mean": 4566.0, "valid_targets_min": 1278 }, { "epoch": 5.392829900839054, "grad_norm": 0.4666991074580145, "learning_rate": 6.092428622523074e-06, "loss": 0.2716, "loss_nan_ranks": 0, "loss_rank_avg": 0.3047803044319153, "step": 7070, "valid_targets_mean": 5045.8, "valid_targets_min": 1274 }, { "epoch": 5.396643783371472, "grad_norm": 0.4567416421356613, "learning_rate": 6.065117729221368e-06, "loss": 0.2653, "loss_nan_ranks": 0, "loss_rank_avg": 0.2584697902202606, "step": 7075, "valid_targets_mean": 4706.9, "valid_targets_min": 1275 }, { "epoch": 5.4004576659038905, "grad_norm": 0.44314444752444254, "learning_rate": 6.037857242588172e-06, "loss": 0.2633, "loss_nan_ranks": 0, "loss_rank_avg": 0.23497982323169708, "step": 7080, "valid_targets_mean": 4559.0, "valid_targets_min": 1282 }, { "epoch": 5.404271548436308, "grad_norm": 0.48014425623093515, "learning_rate": 6.01064726123287e-06, "loss": 0.2656, "loss_nan_ranks": 0, "loss_rank_avg": 0.25778788328170776, "step": 7085, "valid_targets_mean": 4872.2, "valid_targets_min": 587 }, { "epoch": 5.408085430968726, "grad_norm": 0.45115923207142167, "learning_rate": 5.983487883582176e-06, "loss": 0.2577, "loss_nan_ranks": 0, "loss_rank_avg": 0.2704853117465973, "step": 7090, "valid_targets_mean": 5120.1, "valid_targets_min": 531 }, { "epoch": 5.411899313501144, "grad_norm": 0.4945409660156044, "learning_rate": 5.9563792078797275e-06, "loss": 0.2762, "loss_nan_ranks": 0, "loss_rank_avg": 0.2888518273830414, "step": 7095, "valid_targets_mean": 5236.5, "valid_targets_min": 1493 }, { "epoch": 5.415713196033562, "grad_norm": 0.4567007952044338, "learning_rate": 5.9293213321857865e-06, "loss": 0.2528, "loss_nan_ranks": 0, "loss_rank_avg": 0.22163493931293488, "step": 7100, "valid_targets_mean": 4193.8, "valid_targets_min": 1929 }, { "epoch": 5.41952707856598, "grad_norm": 0.4842090926003661, "learning_rate": 5.902314354376845e-06, "loss": 0.2585, "loss_nan_ranks": 0, "loss_rank_avg": 0.25373324751853943, "step": 7105, "valid_targets_mean": 4655.1, "valid_targets_min": 1354 }, { "epoch": 5.423340961098398, "grad_norm": 0.41473599298153047, "learning_rate": 5.87535837214527e-06, "loss": 0.2803, "loss_nan_ranks": 0, "loss_rank_avg": 0.26143643260002136, "step": 7110, "valid_targets_mean": 5557.0, "valid_targets_min": 1151 }, { "epoch": 5.427154843630817, "grad_norm": 0.4441541614997986, "learning_rate": 5.848453482998986e-06, "loss": 0.24, "loss_nan_ranks": 0, "loss_rank_avg": 0.2161817103624344, "step": 7115, "valid_targets_mean": 4495.2, "valid_targets_min": 999 }, { "epoch": 5.4309687261632345, "grad_norm": 0.4471035984291613, "learning_rate": 5.8215997842610695e-06, "loss": 0.28, "loss_nan_ranks": 0, "loss_rank_avg": 0.28700459003448486, "step": 7120, "valid_targets_mean": 4882.1, "valid_targets_min": 987 }, { "epoch": 5.434782608695652, "grad_norm": 0.47288529174681054, "learning_rate": 5.794797373069454e-06, "loss": 0.2521, "loss_nan_ranks": 0, "loss_rank_avg": 0.2508050799369812, "step": 7125, "valid_targets_mean": 4713.7, "valid_targets_min": 1686 }, { "epoch": 5.43859649122807, "grad_norm": 0.4960945585855858, "learning_rate": 5.768046346376528e-06, "loss": 0.2477, "loss_nan_ranks": 0, "loss_rank_avg": 0.2533581256866455, "step": 7130, "valid_targets_mean": 3984.4, "valid_targets_min": 977 }, { "epoch": 5.442410373760488, "grad_norm": 0.49188617193973644, "learning_rate": 5.7413468009488284e-06, "loss": 0.2334, "loss_nan_ranks": 0, "loss_rank_avg": 0.20482134819030762, "step": 7135, "valid_targets_mean": 3737.5, "valid_targets_min": 354 }, { "epoch": 5.446224256292906, "grad_norm": 0.6000775297843542, "learning_rate": 5.714698833366641e-06, "loss": 0.2682, "loss_nan_ranks": 0, "loss_rank_avg": 0.2533903419971466, "step": 7140, "valid_targets_mean": 3571.9, "valid_targets_min": 1005 }, { "epoch": 5.450038138825324, "grad_norm": 0.45340382274911345, "learning_rate": 5.688102540023705e-06, "loss": 0.256, "loss_nan_ranks": 0, "loss_rank_avg": 0.2805597484111786, "step": 7145, "valid_targets_mean": 5255.7, "valid_targets_min": 750 }, { "epoch": 5.453852021357742, "grad_norm": 0.4410601983842463, "learning_rate": 5.661558017126834e-06, "loss": 0.2502, "loss_nan_ranks": 0, "loss_rank_avg": 0.2243202179670334, "step": 7150, "valid_targets_mean": 4318.8, "valid_targets_min": 1350 }, { "epoch": 5.4576659038901605, "grad_norm": 0.466304205959976, "learning_rate": 5.635065360695555e-06, "loss": 0.2614, "loss_nan_ranks": 0, "loss_rank_avg": 0.2674126625061035, "step": 7155, "valid_targets_mean": 4463.6, "valid_targets_min": 1353 }, { "epoch": 5.461479786422578, "grad_norm": 0.47987541986780025, "learning_rate": 5.608624666561799e-06, "loss": 0.2681, "loss_nan_ranks": 0, "loss_rank_avg": 0.2757456302642822, "step": 7160, "valid_targets_mean": 4238.0, "valid_targets_min": 495 }, { "epoch": 5.465293668954996, "grad_norm": 0.4723114447122454, "learning_rate": 5.582236030369514e-06, "loss": 0.2836, "loss_nan_ranks": 0, "loss_rank_avg": 0.29881516098976135, "step": 7165, "valid_targets_mean": 5455.1, "valid_targets_min": 1228 }, { "epoch": 5.469107551487414, "grad_norm": 0.47351422373374047, "learning_rate": 5.5558995475743635e-06, "loss": 0.2865, "loss_nan_ranks": 0, "loss_rank_avg": 0.28124120831489563, "step": 7170, "valid_targets_mean": 4546.2, "valid_targets_min": 1467 }, { "epoch": 5.472921434019832, "grad_norm": 0.4581850087130719, "learning_rate": 5.529615313443328e-06, "loss": 0.2582, "loss_nan_ranks": 0, "loss_rank_avg": 0.263645738363266, "step": 7175, "valid_targets_mean": 4665.4, "valid_targets_min": 1231 }, { "epoch": 5.47673531655225, "grad_norm": 0.44445804803224537, "learning_rate": 5.503383423054418e-06, "loss": 0.2749, "loss_nan_ranks": 0, "loss_rank_avg": 0.29965755343437195, "step": 7180, "valid_targets_mean": 4919.1, "valid_targets_min": 401 }, { "epoch": 5.480549199084669, "grad_norm": 0.48072448807053203, "learning_rate": 5.47720397129627e-06, "loss": 0.2816, "loss_nan_ranks": 0, "loss_rank_avg": 0.2851342558860779, "step": 7185, "valid_targets_mean": 3921.5, "valid_targets_min": 807 }, { "epoch": 5.4843630816170865, "grad_norm": 0.5429782499885556, "learning_rate": 5.451077052867859e-06, "loss": 0.2502, "loss_nan_ranks": 0, "loss_rank_avg": 0.23518866300582886, "step": 7190, "valid_targets_mean": 3978.4, "valid_targets_min": 715 }, { "epoch": 5.488176964149504, "grad_norm": 0.5600448299096479, "learning_rate": 5.425002762278127e-06, "loss": 0.2463, "loss_nan_ranks": 0, "loss_rank_avg": 0.23407478630542755, "step": 7195, "valid_targets_mean": 3173.8, "valid_targets_min": 933 }, { "epoch": 5.491990846681922, "grad_norm": 0.5169549649125209, "learning_rate": 5.39898119384563e-06, "loss": 0.2695, "loss_nan_ranks": 0, "loss_rank_avg": 0.2725510895252228, "step": 7200, "valid_targets_mean": 4044.9, "valid_targets_min": 1272 }, { "epoch": 5.49580472921434, "grad_norm": 0.5459825367677725, "learning_rate": 5.373012441698235e-06, "loss": 0.2569, "loss_nan_ranks": 0, "loss_rank_avg": 0.2436116337776184, "step": 7205, "valid_targets_mean": 3122.2, "valid_targets_min": 457 }, { "epoch": 5.499618611746758, "grad_norm": 0.6737293290695994, "learning_rate": 5.347096599772732e-06, "loss": 0.4182, "loss_nan_ranks": 0, "loss_rank_avg": 0.28409695625305176, "step": 7210, "valid_targets_mean": 2758.2, "valid_targets_min": 574 }, { "epoch": 5.503432494279176, "grad_norm": 0.47869919663122357, "learning_rate": 5.3212337618145416e-06, "loss": 0.2654, "loss_nan_ranks": 0, "loss_rank_avg": 0.2792750895023346, "step": 7215, "valid_targets_mean": 4658.0, "valid_targets_min": 1364 }, { "epoch": 5.507246376811594, "grad_norm": 0.46056094352248905, "learning_rate": 5.295424021377331e-06, "loss": 0.2504, "loss_nan_ranks": 0, "loss_rank_avg": 0.25706204771995544, "step": 7220, "valid_targets_mean": 4113.9, "valid_targets_min": 815 }, { "epoch": 5.511060259344013, "grad_norm": 0.4464065222279077, "learning_rate": 5.269667471822721e-06, "loss": 0.2716, "loss_nan_ranks": 0, "loss_rank_avg": 0.23010754585266113, "step": 7225, "valid_targets_mean": 4441.2, "valid_targets_min": 1100 }, { "epoch": 5.51487414187643, "grad_norm": 0.4534242612135644, "learning_rate": 5.243964206319905e-06, "loss": 0.2532, "loss_nan_ranks": 0, "loss_rank_avg": 0.25065717101097107, "step": 7230, "valid_targets_mean": 4198.2, "valid_targets_min": 967 }, { "epoch": 5.518688024408848, "grad_norm": 0.4465601339441509, "learning_rate": 5.218314317845341e-06, "loss": 0.2652, "loss_nan_ranks": 0, "loss_rank_avg": 0.2715952694416046, "step": 7235, "valid_targets_mean": 5195.9, "valid_targets_min": 1113 }, { "epoch": 5.522501906941266, "grad_norm": 0.49623684714776733, "learning_rate": 5.192717899182414e-06, "loss": 0.2774, "loss_nan_ranks": 0, "loss_rank_avg": 0.2818422019481659, "step": 7240, "valid_targets_mean": 3791.5, "valid_targets_min": 1313 }, { "epoch": 5.526315789473684, "grad_norm": 0.5387411414011866, "learning_rate": 5.1671750429210706e-06, "loss": 0.2624, "loss_nan_ranks": 0, "loss_rank_avg": 0.26141834259033203, "step": 7245, "valid_targets_mean": 3960.7, "valid_targets_min": 844 }, { "epoch": 5.530129672006102, "grad_norm": 0.4733982326591677, "learning_rate": 5.141685841457531e-06, "loss": 0.2621, "loss_nan_ranks": 0, "loss_rank_avg": 0.2717835307121277, "step": 7250, "valid_targets_mean": 4288.9, "valid_targets_min": 1040 }, { "epoch": 5.53394355453852, "grad_norm": 0.4560601736804632, "learning_rate": 5.116250386993908e-06, "loss": 0.2573, "loss_nan_ranks": 0, "loss_rank_avg": 0.23000472784042358, "step": 7255, "valid_targets_mean": 3966.4, "valid_targets_min": 1084 }, { "epoch": 5.537757437070939, "grad_norm": 0.45789216879423134, "learning_rate": 5.090868771537918e-06, "loss": 0.2637, "loss_nan_ranks": 0, "loss_rank_avg": 0.2920645773410797, "step": 7260, "valid_targets_mean": 5077.2, "valid_targets_min": 1141 }, { "epoch": 5.5415713196033565, "grad_norm": 0.46197101608486557, "learning_rate": 5.065541086902499e-06, "loss": 0.2593, "loss_nan_ranks": 0, "loss_rank_avg": 0.24757897853851318, "step": 7265, "valid_targets_mean": 4411.2, "valid_targets_min": 1106 }, { "epoch": 5.545385202135774, "grad_norm": 0.49869011412423253, "learning_rate": 5.040267424705531e-06, "loss": 0.2569, "loss_nan_ranks": 0, "loss_rank_avg": 0.26691606640815735, "step": 7270, "valid_targets_mean": 4098.8, "valid_targets_min": 881 }, { "epoch": 5.549199084668192, "grad_norm": 0.46561034630392756, "learning_rate": 5.015047876369456e-06, "loss": 0.2922, "loss_nan_ranks": 0, "loss_rank_avg": 0.2835874557495117, "step": 7275, "valid_targets_mean": 4925.6, "valid_targets_min": 1056 }, { "epoch": 5.55301296720061, "grad_norm": 0.49268173538897586, "learning_rate": 4.989882533120985e-06, "loss": 0.2696, "loss_nan_ranks": 0, "loss_rank_avg": 0.28856849670410156, "step": 7280, "valid_targets_mean": 4464.0, "valid_targets_min": 1397 }, { "epoch": 5.556826849733028, "grad_norm": 0.5405525220524633, "learning_rate": 4.964771485990753e-06, "loss": 0.252, "loss_nan_ranks": 0, "loss_rank_avg": 0.24683456122875214, "step": 7285, "valid_targets_mean": 3427.6, "valid_targets_min": 850 }, { "epoch": 5.560640732265446, "grad_norm": 0.522144174272764, "learning_rate": 4.939714825812976e-06, "loss": 0.2692, "loss_nan_ranks": 0, "loss_rank_avg": 0.2464541345834732, "step": 7290, "valid_targets_mean": 3456.2, "valid_targets_min": 928 }, { "epoch": 5.564454614797864, "grad_norm": 0.4972765834947173, "learning_rate": 4.914712643225155e-06, "loss": 0.2779, "loss_nan_ranks": 0, "loss_rank_avg": 0.27163538336753845, "step": 7295, "valid_targets_mean": 4422.6, "valid_targets_min": 1164 }, { "epoch": 5.5682684973302825, "grad_norm": 0.46118503283223744, "learning_rate": 4.889765028667706e-06, "loss": 0.2491, "loss_nan_ranks": 0, "loss_rank_avg": 0.30164602398872375, "step": 7300, "valid_targets_mean": 5380.8, "valid_targets_min": 1094 }, { "epoch": 5.5720823798627, "grad_norm": 0.41517681084142244, "learning_rate": 4.8648720723836815e-06, "loss": 0.268, "loss_nan_ranks": 0, "loss_rank_avg": 0.2422560453414917, "step": 7305, "valid_targets_mean": 5003.5, "valid_targets_min": 1181 }, { "epoch": 5.575896262395118, "grad_norm": 0.519351689521643, "learning_rate": 4.840033864418394e-06, "loss": 0.2656, "loss_nan_ranks": 0, "loss_rank_avg": 0.278678297996521, "step": 7310, "valid_targets_mean": 3523.4, "valid_targets_min": 652 }, { "epoch": 5.579710144927536, "grad_norm": 0.4491216603709415, "learning_rate": 4.815250494619142e-06, "loss": 0.2748, "loss_nan_ranks": 0, "loss_rank_avg": 0.2643551826477051, "step": 7315, "valid_targets_mean": 4933.9, "valid_targets_min": 887 }, { "epoch": 5.583524027459954, "grad_norm": 0.49558408715788765, "learning_rate": 4.790522052634832e-06, "loss": 0.276, "loss_nan_ranks": 0, "loss_rank_avg": 0.29052674770355225, "step": 7320, "valid_targets_mean": 3924.8, "valid_targets_min": 909 }, { "epoch": 5.587337909992372, "grad_norm": 0.4408746776163538, "learning_rate": 4.7658486279156855e-06, "loss": 0.2664, "loss_nan_ranks": 0, "loss_rank_avg": 0.2446516901254654, "step": 7325, "valid_targets_mean": 4569.1, "valid_targets_min": 1411 }, { "epoch": 5.591151792524791, "grad_norm": 0.4717219750374338, "learning_rate": 4.74123030971293e-06, "loss": 0.2397, "loss_nan_ranks": 0, "loss_rank_avg": 0.24252106249332428, "step": 7330, "valid_targets_mean": 4408.3, "valid_targets_min": 1060 }, { "epoch": 5.5949656750572085, "grad_norm": 0.4964043406119739, "learning_rate": 4.716667187078426e-06, "loss": 0.2627, "loss_nan_ranks": 0, "loss_rank_avg": 0.2528547942638397, "step": 7335, "valid_targets_mean": 3936.3, "valid_targets_min": 1230 }, { "epoch": 5.598779557589626, "grad_norm": 0.46290044328099633, "learning_rate": 4.692159348864405e-06, "loss": 0.2494, "loss_nan_ranks": 0, "loss_rank_avg": 0.23730583488941193, "step": 7340, "valid_targets_mean": 4176.9, "valid_targets_min": 306 }, { "epoch": 5.602593440122044, "grad_norm": 0.526359122756289, "learning_rate": 4.667706883723089e-06, "loss": 0.2672, "loss_nan_ranks": 0, "loss_rank_avg": 0.23432885110378265, "step": 7345, "valid_targets_mean": 3812.0, "valid_targets_min": 917 }, { "epoch": 5.606407322654462, "grad_norm": 0.4488365832771667, "learning_rate": 4.6433098801064216e-06, "loss": 0.2446, "loss_nan_ranks": 0, "loss_rank_avg": 0.22697098553180695, "step": 7350, "valid_targets_mean": 4373.7, "valid_targets_min": 991 }, { "epoch": 5.61022120518688, "grad_norm": 0.4454358707434032, "learning_rate": 4.61896842626572e-06, "loss": 0.2607, "loss_nan_ranks": 0, "loss_rank_avg": 0.2983551323413849, "step": 7355, "valid_targets_mean": 5246.0, "valid_targets_min": 927 }, { "epoch": 5.614035087719298, "grad_norm": 0.4353310092624839, "learning_rate": 4.594682610251349e-06, "loss": 0.2604, "loss_nan_ranks": 0, "loss_rank_avg": 0.2707470655441284, "step": 7360, "valid_targets_mean": 5198.0, "valid_targets_min": 1305 }, { "epoch": 5.617848970251716, "grad_norm": 0.4924961276507448, "learning_rate": 4.570452519912434e-06, "loss": 0.2489, "loss_nan_ranks": 0, "loss_rank_avg": 0.22331412136554718, "step": 7365, "valid_targets_mean": 3868.3, "valid_targets_min": 840 }, { "epoch": 5.621662852784135, "grad_norm": 0.49740165985344104, "learning_rate": 4.5462782428965e-06, "loss": 0.2807, "loss_nan_ranks": 0, "loss_rank_avg": 0.26943090558052063, "step": 7370, "valid_targets_mean": 4378.5, "valid_targets_min": 1324 }, { "epoch": 5.6254767353165525, "grad_norm": 1.4631518670559964, "learning_rate": 4.52215986664921e-06, "loss": 0.4228, "loss_nan_ranks": 0, "loss_rank_avg": 0.42682841420173645, "step": 7375, "valid_targets_mean": 834.8, "valid_targets_min": 622 }, { "epoch": 5.62929061784897, "grad_norm": 0.4760786300585858, "learning_rate": 4.498097478413981e-06, "loss": 0.274, "loss_nan_ranks": 0, "loss_rank_avg": 0.24382078647613525, "step": 7380, "valid_targets_mean": 4504.2, "valid_targets_min": 356 }, { "epoch": 5.633104500381388, "grad_norm": 0.4626734833552102, "learning_rate": 4.474091165231737e-06, "loss": 0.261, "loss_nan_ranks": 0, "loss_rank_avg": 0.2557976543903351, "step": 7385, "valid_targets_mean": 4257.1, "valid_targets_min": 1598 }, { "epoch": 5.636918382913806, "grad_norm": 0.4742996077597775, "learning_rate": 4.450141013940534e-06, "loss": 0.2618, "loss_nan_ranks": 0, "loss_rank_avg": 0.23813612759113312, "step": 7390, "valid_targets_mean": 4133.5, "valid_targets_min": 1372 }, { "epoch": 5.640732265446224, "grad_norm": 0.45938048208501386, "learning_rate": 4.426247111175297e-06, "loss": 0.2583, "loss_nan_ranks": 0, "loss_rank_avg": 0.21757149696350098, "step": 7395, "valid_targets_mean": 4052.1, "valid_targets_min": 657 }, { "epoch": 5.644546147978643, "grad_norm": 0.46051709275793706, "learning_rate": 4.402409543367472e-06, "loss": 0.2476, "loss_nan_ranks": 0, "loss_rank_avg": 0.2812298536300659, "step": 7400, "valid_targets_mean": 4681.9, "valid_targets_min": 946 }, { "epoch": 5.648360030511061, "grad_norm": 0.4520687879121962, "learning_rate": 4.378628396744717e-06, "loss": 0.2829, "loss_nan_ranks": 0, "loss_rank_avg": 0.29354262351989746, "step": 7405, "valid_targets_mean": 5111.8, "valid_targets_min": 1202 }, { "epoch": 5.6521739130434785, "grad_norm": 0.45662177723316266, "learning_rate": 4.354903757330619e-06, "loss": 0.2791, "loss_nan_ranks": 0, "loss_rank_avg": 0.29141366481781006, "step": 7410, "valid_targets_mean": 5248.5, "valid_targets_min": 1118 }, { "epoch": 5.655987795575896, "grad_norm": 0.5798114965925926, "learning_rate": 4.3312357109443345e-06, "loss": 0.2684, "loss_nan_ranks": 0, "loss_rank_avg": 0.26307177543640137, "step": 7415, "valid_targets_mean": 4735.7, "valid_targets_min": 1169 }, { "epoch": 5.659801678108314, "grad_norm": 0.4632669903920861, "learning_rate": 4.307624343200332e-06, "loss": 0.242, "loss_nan_ranks": 0, "loss_rank_avg": 0.24400150775909424, "step": 7420, "valid_targets_mean": 4341.5, "valid_targets_min": 514 }, { "epoch": 5.663615560640732, "grad_norm": 0.47567506904850365, "learning_rate": 4.284069739508032e-06, "loss": 0.2514, "loss_nan_ranks": 0, "loss_rank_avg": 0.2501218914985657, "step": 7425, "valid_targets_mean": 4060.4, "valid_targets_min": 793 }, { "epoch": 5.66742944317315, "grad_norm": 0.4784400024841789, "learning_rate": 4.2605719850715445e-06, "loss": 0.2655, "loss_nan_ranks": 0, "loss_rank_avg": 0.24574881792068481, "step": 7430, "valid_targets_mean": 4294.8, "valid_targets_min": 943 }, { "epoch": 5.671243325705568, "grad_norm": 0.5133347500185746, "learning_rate": 4.237131164889321e-06, "loss": 0.2586, "loss_nan_ranks": 0, "loss_rank_avg": 0.27007922530174255, "step": 7435, "valid_targets_mean": 4046.4, "valid_targets_min": 1159 }, { "epoch": 5.675057208237987, "grad_norm": 0.4539076379605323, "learning_rate": 4.213747363753875e-06, "loss": 0.2636, "loss_nan_ranks": 0, "loss_rank_avg": 0.24426043033599854, "step": 7440, "valid_targets_mean": 4678.9, "valid_targets_min": 1080 }, { "epoch": 5.6788710907704045, "grad_norm": 0.4619730738815801, "learning_rate": 4.190420666251467e-06, "loss": 0.2352, "loss_nan_ranks": 0, "loss_rank_avg": 0.22337813675403595, "step": 7445, "valid_targets_mean": 4274.1, "valid_targets_min": 1006 }, { "epoch": 5.682684973302822, "grad_norm": 0.5289760710330429, "learning_rate": 4.1671511567617816e-06, "loss": 0.2567, "loss_nan_ranks": 0, "loss_rank_avg": 0.23961704969406128, "step": 7450, "valid_targets_mean": 3701.7, "valid_targets_min": 1264 }, { "epoch": 5.68649885583524, "grad_norm": 0.4077567627073792, "learning_rate": 4.143938919457659e-06, "loss": 0.2382, "loss_nan_ranks": 0, "loss_rank_avg": 0.22072581946849823, "step": 7455, "valid_targets_mean": 5214.0, "valid_targets_min": 1596 }, { "epoch": 5.690312738367658, "grad_norm": 0.5715728165292766, "learning_rate": 4.120784038304743e-06, "loss": 0.2618, "loss_nan_ranks": 0, "loss_rank_avg": 0.26193735003471375, "step": 7460, "valid_targets_mean": 3611.3, "valid_targets_min": 906 }, { "epoch": 5.694126620900076, "grad_norm": 0.5026260419778403, "learning_rate": 4.0976865970612305e-06, "loss": 0.2511, "loss_nan_ranks": 0, "loss_rank_avg": 0.22939319908618927, "step": 7465, "valid_targets_mean": 3772.9, "valid_targets_min": 431 }, { "epoch": 5.697940503432494, "grad_norm": 0.47404174633602586, "learning_rate": 4.074646679277514e-06, "loss": 0.2575, "loss_nan_ranks": 0, "loss_rank_avg": 0.25620734691619873, "step": 7470, "valid_targets_mean": 4115.8, "valid_targets_min": 843 }, { "epoch": 5.701754385964913, "grad_norm": 0.44644681572700895, "learning_rate": 4.051664368295931e-06, "loss": 0.2564, "loss_nan_ranks": 0, "loss_rank_avg": 0.22743135690689087, "step": 7475, "valid_targets_mean": 4980.8, "valid_targets_min": 2055 }, { "epoch": 5.705568268497331, "grad_norm": 0.4762637154157596, "learning_rate": 4.028739747250414e-06, "loss": 0.2591, "loss_nan_ranks": 0, "loss_rank_avg": 0.29567673802375793, "step": 7480, "valid_targets_mean": 5021.9, "valid_targets_min": 1334 }, { "epoch": 5.709382151029748, "grad_norm": 0.5331830444355757, "learning_rate": 4.005872899066232e-06, "loss": 0.2734, "loss_nan_ranks": 0, "loss_rank_avg": 0.26421937346458435, "step": 7485, "valid_targets_mean": 3504.0, "valid_targets_min": 994 }, { "epoch": 5.713196033562166, "grad_norm": 0.47084261096423663, "learning_rate": 3.983063906459672e-06, "loss": 0.2545, "loss_nan_ranks": 0, "loss_rank_avg": 0.260171502828598, "step": 7490, "valid_targets_mean": 4280.6, "valid_targets_min": 1070 }, { "epoch": 5.717009916094584, "grad_norm": 0.5009028299599818, "learning_rate": 3.960312851937722e-06, "loss": 0.2538, "loss_nan_ranks": 0, "loss_rank_avg": 0.2721886932849884, "step": 7495, "valid_targets_mean": 4046.6, "valid_targets_min": 1336 }, { "epoch": 5.720823798627002, "grad_norm": 0.5466785269273442, "learning_rate": 3.937619817797813e-06, "loss": 0.2622, "loss_nan_ranks": 0, "loss_rank_avg": 0.26342272758483887, "step": 7500, "valid_targets_mean": 4143.9, "valid_targets_min": 859 }, { "epoch": 5.72463768115942, "grad_norm": 0.419718247363952, "learning_rate": 3.9149848861274795e-06, "loss": 0.249, "loss_nan_ranks": 0, "loss_rank_avg": 0.27253589034080505, "step": 7505, "valid_targets_mean": 5215.9, "valid_targets_min": 1424 }, { "epoch": 5.728451563691838, "grad_norm": 0.46579609883184436, "learning_rate": 3.8924081388040976e-06, "loss": 0.2519, "loss_nan_ranks": 0, "loss_rank_avg": 0.24933433532714844, "step": 7510, "valid_targets_mean": 4956.2, "valid_targets_min": 1100 }, { "epoch": 5.732265446224257, "grad_norm": 0.5163794532026748, "learning_rate": 3.869889657494559e-06, "loss": 0.2656, "loss_nan_ranks": 0, "loss_rank_avg": 0.27208736538887024, "step": 7515, "valid_targets_mean": 4663.0, "valid_targets_min": 1162 }, { "epoch": 5.7360793287566745, "grad_norm": 0.48502196089198857, "learning_rate": 3.847429523655004e-06, "loss": 0.2596, "loss_nan_ranks": 0, "loss_rank_avg": 0.23235277831554413, "step": 7520, "valid_targets_mean": 4345.2, "valid_targets_min": 1173 }, { "epoch": 5.739893211289092, "grad_norm": 0.48209817050203563, "learning_rate": 3.825027818530498e-06, "loss": 0.2717, "loss_nan_ranks": 0, "loss_rank_avg": 0.2796691954135895, "step": 7525, "valid_targets_mean": 5048.5, "valid_targets_min": 467 }, { "epoch": 5.74370709382151, "grad_norm": 0.4449831601562535, "learning_rate": 3.802684623154762e-06, "loss": 0.2649, "loss_nan_ranks": 0, "loss_rank_avg": 0.2815805673599243, "step": 7530, "valid_targets_mean": 5262.2, "valid_targets_min": 1557 }, { "epoch": 5.747520976353928, "grad_norm": 0.4479873081666714, "learning_rate": 3.780400018349872e-06, "loss": 0.2637, "loss_nan_ranks": 0, "loss_rank_avg": 0.27081429958343506, "step": 7535, "valid_targets_mean": 5022.8, "valid_targets_min": 1333 }, { "epoch": 5.751334858886346, "grad_norm": 1.3471935076076935, "learning_rate": 3.7581740847259495e-06, "loss": 0.3821, "loss_nan_ranks": 0, "loss_rank_avg": 0.4470458924770355, "step": 7540, "valid_targets_mean": 882.6, "valid_targets_min": 583 }, { "epoch": 5.755148741418765, "grad_norm": 0.4781128038840103, "learning_rate": 3.736006902680904e-06, "loss": 0.2626, "loss_nan_ranks": 0, "loss_rank_avg": 0.2608310282230377, "step": 7545, "valid_targets_mean": 4537.0, "valid_targets_min": 843 }, { "epoch": 5.758962623951183, "grad_norm": 0.5659433332480197, "learning_rate": 3.7138985524001057e-06, "loss": 0.261, "loss_nan_ranks": 0, "loss_rank_avg": 0.31279221177101135, "step": 7550, "valid_targets_mean": 4426.8, "valid_targets_min": 1103 }, { "epoch": 5.7627765064836005, "grad_norm": 0.4962767932946681, "learning_rate": 3.691849113856125e-06, "loss": 0.2388, "loss_nan_ranks": 0, "loss_rank_avg": 0.219892218708992, "step": 7555, "valid_targets_mean": 3565.2, "valid_targets_min": 1013 }, { "epoch": 5.766590389016018, "grad_norm": 0.6270615848107953, "learning_rate": 3.6698586668084214e-06, "loss": 0.2848, "loss_nan_ranks": 0, "loss_rank_avg": 0.2851230800151825, "step": 7560, "valid_targets_mean": 5459.8, "valid_targets_min": 1291 }, { "epoch": 5.770404271548436, "grad_norm": 0.5020336137990338, "learning_rate": 3.647927290803075e-06, "loss": 0.2783, "loss_nan_ranks": 0, "loss_rank_avg": 0.2942732572555542, "step": 7565, "valid_targets_mean": 4056.2, "valid_targets_min": 1102 }, { "epoch": 5.774218154080854, "grad_norm": 0.47840297911651897, "learning_rate": 3.6260550651724735e-06, "loss": 0.2337, "loss_nan_ranks": 0, "loss_rank_avg": 0.23049987852573395, "step": 7570, "valid_targets_mean": 4130.0, "valid_targets_min": 327 }, { "epoch": 5.778032036613272, "grad_norm": 0.45812668366800213, "learning_rate": 3.604242069035051e-06, "loss": 0.2668, "loss_nan_ranks": 0, "loss_rank_avg": 0.24633507430553436, "step": 7575, "valid_targets_mean": 4542.7, "valid_targets_min": 1212 }, { "epoch": 5.78184591914569, "grad_norm": 0.4789571096088359, "learning_rate": 3.582488381294997e-06, "loss": 0.2538, "loss_nan_ranks": 0, "loss_rank_avg": 0.254001647233963, "step": 7580, "valid_targets_mean": 4604.6, "valid_targets_min": 420 }, { "epoch": 5.785659801678109, "grad_norm": 0.4915261483074165, "learning_rate": 3.560794080641943e-06, "loss": 0.2561, "loss_nan_ranks": 0, "loss_rank_avg": 0.2834867537021637, "step": 7585, "valid_targets_mean": 4501.2, "valid_targets_min": 1410 }, { "epoch": 5.7894736842105265, "grad_norm": 0.4302456126659898, "learning_rate": 3.5391592455507207e-06, "loss": 0.2451, "loss_nan_ranks": 0, "loss_rank_avg": 0.23200945556163788, "step": 7590, "valid_targets_mean": 4676.2, "valid_targets_min": 577 }, { "epoch": 5.793287566742944, "grad_norm": 0.5125700685274149, "learning_rate": 3.517583954281041e-06, "loss": 0.2468, "loss_nan_ranks": 0, "loss_rank_avg": 0.26258015632629395, "step": 7595, "valid_targets_mean": 3732.4, "valid_targets_min": 1297 }, { "epoch": 5.797101449275362, "grad_norm": 0.4926014789340449, "learning_rate": 3.4960682848772432e-06, "loss": 0.263, "loss_nan_ranks": 0, "loss_rank_avg": 0.2648114264011383, "step": 7600, "valid_targets_mean": 4162.2, "valid_targets_min": 929 }, { "epoch": 5.80091533180778, "grad_norm": 0.471511291106976, "learning_rate": 3.4746123151679777e-06, "loss": 0.2642, "loss_nan_ranks": 0, "loss_rank_avg": 0.23751680552959442, "step": 7605, "valid_targets_mean": 4355.8, "valid_targets_min": 1475 }, { "epoch": 5.804729214340198, "grad_norm": 0.47994063760768335, "learning_rate": 3.4532161227659635e-06, "loss": 0.2384, "loss_nan_ranks": 0, "loss_rank_avg": 0.2726961374282837, "step": 7610, "valid_targets_mean": 4271.6, "valid_targets_min": 877 }, { "epoch": 5.808543096872616, "grad_norm": 0.5263789521198493, "learning_rate": 3.4318797850676643e-06, "loss": 0.2817, "loss_nan_ranks": 0, "loss_rank_avg": 0.2983848452568054, "step": 7615, "valid_targets_mean": 4016.3, "valid_targets_min": 1584 }, { "epoch": 5.812356979405035, "grad_norm": 0.5441262014652823, "learning_rate": 3.4106033792530503e-06, "loss": 0.2618, "loss_nan_ranks": 0, "loss_rank_avg": 0.29425832629203796, "step": 7620, "valid_targets_mean": 3834.4, "valid_targets_min": 963 }, { "epoch": 5.816170861937453, "grad_norm": 0.4594189691390277, "learning_rate": 3.3893869822852965e-06, "loss": 0.2393, "loss_nan_ranks": 0, "loss_rank_avg": 0.23714977502822876, "step": 7625, "valid_targets_mean": 4394.7, "valid_targets_min": 971 }, { "epoch": 5.8199847444698705, "grad_norm": 0.44797174670219914, "learning_rate": 3.368230670910495e-06, "loss": 0.2529, "loss_nan_ranks": 0, "loss_rank_avg": 0.24746312201023102, "step": 7630, "valid_targets_mean": 5370.3, "valid_targets_min": 930 }, { "epoch": 5.823798627002288, "grad_norm": 0.45332363493811645, "learning_rate": 3.3471345216574135e-06, "loss": 0.2515, "loss_nan_ranks": 0, "loss_rank_avg": 0.25578317046165466, "step": 7635, "valid_targets_mean": 4801.6, "valid_targets_min": 1460 }, { "epoch": 5.827612509534706, "grad_norm": 0.5252092504310898, "learning_rate": 3.326098610837165e-06, "loss": 0.2766, "loss_nan_ranks": 0, "loss_rank_avg": 0.27364540100097656, "step": 7640, "valid_targets_mean": 3530.9, "valid_targets_min": 516 }, { "epoch": 5.831426392067124, "grad_norm": 0.4900065349858666, "learning_rate": 3.3051230145429834e-06, "loss": 0.2739, "loss_nan_ranks": 0, "loss_rank_avg": 0.2814614474773407, "step": 7645, "valid_targets_mean": 5115.5, "valid_targets_min": 1055 }, { "epoch": 5.835240274599542, "grad_norm": 0.44824989551867944, "learning_rate": 3.2842078086499307e-06, "loss": 0.2589, "loss_nan_ranks": 0, "loss_rank_avg": 0.24113915860652924, "step": 7650, "valid_targets_mean": 4745.6, "valid_targets_min": 1724 }, { "epoch": 5.83905415713196, "grad_norm": 0.4712181525145368, "learning_rate": 3.2633530688145966e-06, "loss": 0.2486, "loss_nan_ranks": 0, "loss_rank_avg": 0.2545694410800934, "step": 7655, "valid_targets_mean": 4455.9, "valid_targets_min": 1123 }, { "epoch": 5.842868039664379, "grad_norm": 0.4882489300080456, "learning_rate": 3.24255887047487e-06, "loss": 0.2734, "loss_nan_ranks": 0, "loss_rank_avg": 0.2780630886554718, "step": 7660, "valid_targets_mean": 4831.5, "valid_targets_min": 1362 }, { "epoch": 5.8466819221967965, "grad_norm": 0.4102481126349075, "learning_rate": 3.221825288849625e-06, "loss": 0.2465, "loss_nan_ranks": 0, "loss_rank_avg": 0.23655253648757935, "step": 7665, "valid_targets_mean": 5257.2, "valid_targets_min": 2401 }, { "epoch": 5.850495804729214, "grad_norm": 0.4922948313278101, "learning_rate": 3.201152398938483e-06, "loss": 0.265, "loss_nan_ranks": 0, "loss_rank_avg": 0.2933632433414459, "step": 7670, "valid_targets_mean": 4272.6, "valid_targets_min": 1201 }, { "epoch": 5.854309687261632, "grad_norm": 0.5009285178620376, "learning_rate": 3.180540275521504e-06, "loss": 0.2695, "loss_nan_ranks": 0, "loss_rank_avg": 0.2608252465724945, "step": 7675, "valid_targets_mean": 4210.9, "valid_targets_min": 1195 }, { "epoch": 5.85812356979405, "grad_norm": 0.4788458917234944, "learning_rate": 3.1599889931589644e-06, "loss": 0.2565, "loss_nan_ranks": 0, "loss_rank_avg": 0.24401216208934784, "step": 7680, "valid_targets_mean": 4195.2, "valid_targets_min": 908 }, { "epoch": 5.861937452326468, "grad_norm": 0.48355312631125696, "learning_rate": 3.1394986261910352e-06, "loss": 0.2874, "loss_nan_ranks": 0, "loss_rank_avg": 0.2997702658176422, "step": 7685, "valid_targets_mean": 4433.9, "valid_targets_min": 861 }, { "epoch": 5.865751334858887, "grad_norm": 0.48194084992498054, "learning_rate": 3.1190692487375495e-06, "loss": 0.2488, "loss_nan_ranks": 0, "loss_rank_avg": 0.27790045738220215, "step": 7690, "valid_targets_mean": 4411.3, "valid_targets_min": 1015 }, { "epoch": 5.869565217391305, "grad_norm": 0.4792526887514992, "learning_rate": 3.0987009346977314e-06, "loss": 0.2615, "loss_nan_ranks": 0, "loss_rank_avg": 0.2566789984703064, "step": 7695, "valid_targets_mean": 4372.5, "valid_targets_min": 730 }, { "epoch": 5.8733790999237225, "grad_norm": 0.5247160658839248, "learning_rate": 3.078393757749898e-06, "loss": 0.2724, "loss_nan_ranks": 0, "loss_rank_avg": 0.2623863220214844, "step": 7700, "valid_targets_mean": 3699.5, "valid_targets_min": 1064 }, { "epoch": 5.87719298245614, "grad_norm": 1.31309012160065, "learning_rate": 3.0581477913512402e-06, "loss": 0.4075, "loss_nan_ranks": 0, "loss_rank_avg": 0.4631132185459137, "step": 7705, "valid_targets_mean": 924.8, "valid_targets_min": 595 }, { "epoch": 5.881006864988558, "grad_norm": 0.5058652384548464, "learning_rate": 3.0379631087375094e-06, "loss": 0.2643, "loss_nan_ranks": 0, "loss_rank_avg": 0.2527218163013458, "step": 7710, "valid_targets_mean": 3840.2, "valid_targets_min": 1092 }, { "epoch": 5.884820747520976, "grad_norm": 0.48742105702963867, "learning_rate": 3.0178397829227935e-06, "loss": 0.2533, "loss_nan_ranks": 0, "loss_rank_avg": 0.266996294260025, "step": 7715, "valid_targets_mean": 4231.3, "valid_targets_min": 427 }, { "epoch": 5.888634630053394, "grad_norm": 0.4583551693813073, "learning_rate": 2.997777886699216e-06, "loss": 0.254, "loss_nan_ranks": 0, "loss_rank_avg": 0.21432173252105713, "step": 7720, "valid_targets_mean": 4182.4, "valid_targets_min": 1484 }, { "epoch": 5.892448512585812, "grad_norm": 0.502015689504552, "learning_rate": 2.9777774926367153e-06, "loss": 0.2637, "loss_nan_ranks": 0, "loss_rank_avg": 0.22121445834636688, "step": 7725, "valid_targets_mean": 3529.1, "valid_targets_min": 437 }, { "epoch": 5.896262395118231, "grad_norm": 0.45289837614009193, "learning_rate": 2.957838673082729e-06, "loss": 0.2777, "loss_nan_ranks": 0, "loss_rank_avg": 0.266684889793396, "step": 7730, "valid_targets_mean": 4576.7, "valid_targets_min": 530 }, { "epoch": 5.900076277650649, "grad_norm": 0.48492694694900196, "learning_rate": 2.9379615001619834e-06, "loss": 0.2481, "loss_nan_ranks": 0, "loss_rank_avg": 0.2345353364944458, "step": 7735, "valid_targets_mean": 3823.9, "valid_targets_min": 1160 }, { "epoch": 5.9038901601830664, "grad_norm": 0.48980103900349786, "learning_rate": 2.918146045776209e-06, "loss": 0.2799, "loss_nan_ranks": 0, "loss_rank_avg": 0.30960848927497864, "step": 7740, "valid_targets_mean": 4416.5, "valid_targets_min": 705 }, { "epoch": 5.907704042715484, "grad_norm": 0.43775365194750415, "learning_rate": 2.8983923816038628e-06, "loss": 0.2682, "loss_nan_ranks": 0, "loss_rank_avg": 0.3002133071422577, "step": 7745, "valid_targets_mean": 6101.7, "valid_targets_min": 894 }, { "epoch": 5.911517925247902, "grad_norm": 0.4870360310259264, "learning_rate": 2.8787005790999157e-06, "loss": 0.2565, "loss_nan_ranks": 0, "loss_rank_avg": 0.2697948217391968, "step": 7750, "valid_targets_mean": 4514.3, "valid_targets_min": 1035 }, { "epoch": 5.91533180778032, "grad_norm": 0.4816571987450125, "learning_rate": 2.859070709495535e-06, "loss": 0.2647, "loss_nan_ranks": 0, "loss_rank_avg": 0.2682059705257416, "step": 7755, "valid_targets_mean": 4110.0, "valid_targets_min": 442 }, { "epoch": 5.919145690312739, "grad_norm": 0.4432390917784789, "learning_rate": 2.83950284379789e-06, "loss": 0.2676, "loss_nan_ranks": 0, "loss_rank_avg": 0.29021620750427246, "step": 7760, "valid_targets_mean": 5378.8, "valid_targets_min": 1510 }, { "epoch": 5.922959572845157, "grad_norm": 0.4890666324358443, "learning_rate": 2.819997052789838e-06, "loss": 0.263, "loss_nan_ranks": 0, "loss_rank_avg": 0.2582494914531708, "step": 7765, "valid_targets_mean": 4316.7, "valid_targets_min": 434 }, { "epoch": 5.926773455377575, "grad_norm": 0.5424078222177492, "learning_rate": 2.8005534070297092e-06, "loss": 0.2734, "loss_nan_ranks": 0, "loss_rank_avg": 0.2644309997558594, "step": 7770, "valid_targets_mean": 4150.8, "valid_targets_min": 1320 }, { "epoch": 5.9305873379099925, "grad_norm": 0.5196203991335387, "learning_rate": 2.7811719768510205e-06, "loss": 0.2662, "loss_nan_ranks": 0, "loss_rank_avg": 0.2673504054546356, "step": 7775, "valid_targets_mean": 3580.5, "valid_targets_min": 952 }, { "epoch": 5.93440122044241, "grad_norm": 0.4561509143165148, "learning_rate": 2.761852832362255e-06, "loss": 0.2623, "loss_nan_ranks": 0, "loss_rank_avg": 0.27049699425697327, "step": 7780, "valid_targets_mean": 5493.5, "valid_targets_min": 1451 }, { "epoch": 5.938215102974828, "grad_norm": 0.4723195240543183, "learning_rate": 2.7425960434465794e-06, "loss": 0.2664, "loss_nan_ranks": 0, "loss_rank_avg": 0.2836945950984955, "step": 7785, "valid_targets_mean": 4640.3, "valid_targets_min": 1688 }, { "epoch": 5.942028985507246, "grad_norm": 0.4902425169332125, "learning_rate": 2.7234016797615947e-06, "loss": 0.2598, "loss_nan_ranks": 0, "loss_rank_avg": 0.24308143556118011, "step": 7790, "valid_targets_mean": 4298.5, "valid_targets_min": 1232 }, { "epoch": 5.945842868039664, "grad_norm": 0.5029709069193514, "learning_rate": 2.704269810739111e-06, "loss": 0.2727, "loss_nan_ranks": 0, "loss_rank_avg": 0.2596876919269562, "step": 7795, "valid_targets_mean": 4338.5, "valid_targets_min": 1302 }, { "epoch": 5.949656750572083, "grad_norm": 0.482901901062868, "learning_rate": 2.6852005055848506e-06, "loss": 0.2475, "loss_nan_ranks": 0, "loss_rank_avg": 0.2369847297668457, "step": 7800, "valid_targets_mean": 4154.8, "valid_targets_min": 268 }, { "epoch": 5.953470633104501, "grad_norm": 0.45917913875581223, "learning_rate": 2.6661938332782477e-06, "loss": 0.2481, "loss_nan_ranks": 0, "loss_rank_avg": 0.22529812157154083, "step": 7805, "valid_targets_mean": 4389.7, "valid_targets_min": 1339 }, { "epoch": 5.9572845156369185, "grad_norm": 0.446736608750938, "learning_rate": 2.6472498625721543e-06, "loss": 0.2664, "loss_nan_ranks": 0, "loss_rank_avg": 0.29567384719848633, "step": 7810, "valid_targets_mean": 4869.5, "valid_targets_min": 504 }, { "epoch": 5.961098398169336, "grad_norm": 0.4351896685706992, "learning_rate": 2.628368661992633e-06, "loss": 0.253, "loss_nan_ranks": 0, "loss_rank_avg": 0.2605706751346588, "step": 7815, "valid_targets_mean": 5280.7, "valid_targets_min": 1398 }, { "epoch": 5.964912280701754, "grad_norm": 0.5221413256363302, "learning_rate": 2.6095502998386636e-06, "loss": 0.254, "loss_nan_ranks": 0, "loss_rank_avg": 0.2452189177274704, "step": 7820, "valid_targets_mean": 3603.2, "valid_targets_min": 885 }, { "epoch": 5.968726163234172, "grad_norm": 0.4864253450865069, "learning_rate": 2.5907948441819386e-06, "loss": 0.2721, "loss_nan_ranks": 0, "loss_rank_avg": 0.2926352620124817, "step": 7825, "valid_targets_mean": 4895.9, "valid_targets_min": 1220 }, { "epoch": 5.97254004576659, "grad_norm": 0.47427799794774056, "learning_rate": 2.5721023628665975e-06, "loss": 0.2644, "loss_nan_ranks": 0, "loss_rank_avg": 0.26650452613830566, "step": 7830, "valid_targets_mean": 5234.3, "valid_targets_min": 1270 }, { "epoch": 5.976353928299009, "grad_norm": 0.49233848311869016, "learning_rate": 2.5534729235089685e-06, "loss": 0.2656, "loss_nan_ranks": 0, "loss_rank_avg": 0.2766297459602356, "step": 7835, "valid_targets_mean": 4930.2, "valid_targets_min": 1275 }, { "epoch": 5.980167810831427, "grad_norm": 0.47527502992187665, "learning_rate": 2.5349065934973593e-06, "loss": 0.265, "loss_nan_ranks": 0, "loss_rank_avg": 0.2880236804485321, "step": 7840, "valid_targets_mean": 4734.1, "valid_targets_min": 949 }, { "epoch": 5.983981693363845, "grad_norm": 0.559391570426309, "learning_rate": 2.51640343999177e-06, "loss": 0.263, "loss_nan_ranks": 0, "loss_rank_avg": 0.2612583339214325, "step": 7845, "valid_targets_mean": 3851.5, "valid_targets_min": 1105 }, { "epoch": 5.987795575896262, "grad_norm": 0.490844670179712, "learning_rate": 2.4979635299236926e-06, "loss": 0.2617, "loss_nan_ranks": 0, "loss_rank_avg": 0.24493573606014252, "step": 7850, "valid_targets_mean": 4531.8, "valid_targets_min": 1130 }, { "epoch": 5.99160945842868, "grad_norm": 0.45615276740640753, "learning_rate": 2.47958692999583e-06, "loss": 0.2604, "loss_nan_ranks": 0, "loss_rank_avg": 0.24681413173675537, "step": 7855, "valid_targets_mean": 4569.3, "valid_targets_min": 1345 }, { "epoch": 5.995423340961098, "grad_norm": 0.46989711303161386, "learning_rate": 2.461273706681888e-06, "loss": 0.2695, "loss_nan_ranks": 0, "loss_rank_avg": 0.30878710746765137, "step": 7860, "valid_targets_mean": 4841.8, "valid_targets_min": 1035 }, { "epoch": 5.999237223493516, "grad_norm": 1.3501461018957615, "learning_rate": 2.443023926226309e-06, "loss": 0.4129, "loss_nan_ranks": 0, "loss_rank_avg": 0.49166861176490784, "step": 7865, "valid_targets_mean": 893.5, "valid_targets_min": 437 }, { "epoch": 6.003051106025935, "grad_norm": 0.48062968179889437, "learning_rate": 2.42483765464405e-06, "loss": 0.2804, "loss_nan_ranks": 0, "loss_rank_avg": 0.2480214685201645, "step": 7870, "valid_targets_mean": 5001.8, "valid_targets_min": 1201 }, { "epoch": 6.006864988558353, "grad_norm": 0.4925864276970704, "learning_rate": 2.406714957720342e-06, "loss": 0.2664, "loss_nan_ranks": 0, "loss_rank_avg": 0.2455272078514099, "step": 7875, "valid_targets_mean": 3972.8, "valid_targets_min": 1183 }, { "epoch": 6.010678871090771, "grad_norm": 0.45788706813347363, "learning_rate": 2.3886559010104326e-06, "loss": 0.2573, "loss_nan_ranks": 0, "loss_rank_avg": 0.22061456739902496, "step": 7880, "valid_targets_mean": 4328.2, "valid_targets_min": 1027 }, { "epoch": 6.0144927536231885, "grad_norm": 0.47804510565235997, "learning_rate": 2.3706605498393787e-06, "loss": 0.2671, "loss_nan_ranks": 0, "loss_rank_avg": 0.278346449136734, "step": 7885, "valid_targets_mean": 3989.0, "valid_targets_min": 1000 }, { "epoch": 6.018306636155606, "grad_norm": 0.5373527975549953, "learning_rate": 2.352728969301783e-06, "loss": 0.2601, "loss_nan_ranks": 0, "loss_rank_avg": 0.2867368161678314, "step": 7890, "valid_targets_mean": 4721.1, "valid_targets_min": 1509 }, { "epoch": 6.022120518688024, "grad_norm": 0.47067460411820394, "learning_rate": 2.334861224261582e-06, "loss": 0.2723, "loss_nan_ranks": 0, "loss_rank_avg": 0.30547037720680237, "step": 7895, "valid_targets_mean": 4757.3, "valid_targets_min": 579 }, { "epoch": 6.025934401220442, "grad_norm": 0.5499976280698272, "learning_rate": 2.317057379351786e-06, "loss": 0.253, "loss_nan_ranks": 0, "loss_rank_avg": 0.2520096004009247, "step": 7900, "valid_targets_mean": 3518.1, "valid_targets_min": 703 }, { "epoch": 6.02974828375286, "grad_norm": 0.5062986771267566, "learning_rate": 2.2993174989742762e-06, "loss": 0.2858, "loss_nan_ranks": 0, "loss_rank_avg": 0.28065720200538635, "step": 7905, "valid_targets_mean": 4128.1, "valid_targets_min": 1327 }, { "epoch": 6.033562166285279, "grad_norm": 0.4308141740962017, "learning_rate": 2.2816416472995374e-06, "loss": 0.2436, "loss_nan_ranks": 0, "loss_rank_avg": 0.22161316871643066, "step": 7910, "valid_targets_mean": 4659.9, "valid_targets_min": 1388 }, { "epoch": 6.037376048817697, "grad_norm": 0.4557597674304979, "learning_rate": 2.264029888266457e-06, "loss": 0.2473, "loss_nan_ranks": 0, "loss_rank_avg": 0.27463290095329285, "step": 7915, "valid_targets_mean": 4919.1, "valid_targets_min": 825 }, { "epoch": 6.0411899313501145, "grad_norm": 0.47269435901277407, "learning_rate": 2.246482285582077e-06, "loss": 0.2553, "loss_nan_ranks": 0, "loss_rank_avg": 0.2803293466567993, "step": 7920, "valid_targets_mean": 4718.7, "valid_targets_min": 1230 }, { "epoch": 6.045003813882532, "grad_norm": 0.5042126557922357, "learning_rate": 2.2289989027213555e-06, "loss": 0.2607, "loss_nan_ranks": 0, "loss_rank_avg": 0.23255133628845215, "step": 7925, "valid_targets_mean": 3776.7, "valid_targets_min": 921 }, { "epoch": 6.04881769641495, "grad_norm": 0.46979730781076023, "learning_rate": 2.2115798029269686e-06, "loss": 0.2559, "loss_nan_ranks": 0, "loss_rank_avg": 0.23931367695331573, "step": 7930, "valid_targets_mean": 5090.0, "valid_targets_min": 947 }, { "epoch": 6.052631578947368, "grad_norm": 0.48482595112718446, "learning_rate": 2.19422504920904e-06, "loss": 0.2508, "loss_nan_ranks": 0, "loss_rank_avg": 0.2659645974636078, "step": 7935, "valid_targets_mean": 4528.5, "valid_targets_min": 711 }, { "epoch": 6.056445461479786, "grad_norm": 0.48749706923409686, "learning_rate": 2.1769347043449486e-06, "loss": 0.2718, "loss_nan_ranks": 0, "loss_rank_avg": 0.2688192129135132, "step": 7940, "valid_targets_mean": 4277.3, "valid_targets_min": 917 }, { "epoch": 6.060259344012205, "grad_norm": 0.4644017044390465, "learning_rate": 2.159708830879079e-06, "loss": 0.2638, "loss_nan_ranks": 0, "loss_rank_avg": 0.3060270845890045, "step": 7945, "valid_targets_mean": 4950.3, "valid_targets_min": 1222 }, { "epoch": 6.064073226544623, "grad_norm": 0.4906142087642577, "learning_rate": 2.142547491122613e-06, "loss": 0.2646, "loss_nan_ranks": 0, "loss_rank_avg": 0.2784336507320404, "step": 7950, "valid_targets_mean": 4383.7, "valid_targets_min": 531 }, { "epoch": 6.0678871090770405, "grad_norm": 0.5334373559306215, "learning_rate": 2.1254507471532837e-06, "loss": 0.268, "loss_nan_ranks": 0, "loss_rank_avg": 0.2708498239517212, "step": 7955, "valid_targets_mean": 3776.0, "valid_targets_min": 1426 }, { "epoch": 6.071700991609458, "grad_norm": 0.4386048831830409, "learning_rate": 2.108418660815161e-06, "loss": 0.2615, "loss_nan_ranks": 0, "loss_rank_avg": 0.2562674582004547, "step": 7960, "valid_targets_mean": 5180.0, "valid_targets_min": 1199 }, { "epoch": 6.075514874141876, "grad_norm": 0.4506492034727124, "learning_rate": 2.091451293718445e-06, "loss": 0.2595, "loss_nan_ranks": 0, "loss_rank_avg": 0.26452645659446716, "step": 7965, "valid_targets_mean": 5052.3, "valid_targets_min": 1547 }, { "epoch": 6.079328756674294, "grad_norm": 0.510818194605105, "learning_rate": 2.0745487072392055e-06, "loss": 0.2534, "loss_nan_ranks": 0, "loss_rank_avg": 0.2605459988117218, "step": 7970, "valid_targets_mean": 4058.3, "valid_targets_min": 1098 }, { "epoch": 6.083142639206712, "grad_norm": 0.5633091083246478, "learning_rate": 2.0577109625191994e-06, "loss": 0.2649, "loss_nan_ranks": 0, "loss_rank_avg": 0.31739693880081177, "step": 7975, "valid_targets_mean": 4121.5, "valid_targets_min": 1049 }, { "epoch": 6.086956521739131, "grad_norm": 0.4949607184258331, "learning_rate": 2.0409381204656166e-06, "loss": 0.2579, "loss_nan_ranks": 0, "loss_rank_avg": 0.2758539617061615, "step": 7980, "valid_targets_mean": 4030.7, "valid_targets_min": 1407 }, { "epoch": 6.090770404271549, "grad_norm": 0.4933453751194869, "learning_rate": 2.0242302417508887e-06, "loss": 0.2726, "loss_nan_ranks": 0, "loss_rank_avg": 0.3091985881328583, "step": 7985, "valid_targets_mean": 4677.6, "valid_targets_min": 1302 }, { "epoch": 6.094584286803967, "grad_norm": 0.5208120342594886, "learning_rate": 2.0075873868124374e-06, "loss": 0.2658, "loss_nan_ranks": 0, "loss_rank_avg": 0.2794772684574127, "step": 7990, "valid_targets_mean": 3504.0, "valid_targets_min": 1117 }, { "epoch": 6.0983981693363845, "grad_norm": 0.47175364867379893, "learning_rate": 1.991009615852493e-06, "loss": 0.241, "loss_nan_ranks": 0, "loss_rank_avg": 0.2372446060180664, "step": 7995, "valid_targets_mean": 4242.5, "valid_targets_min": 1444 }, { "epoch": 6.102212051868802, "grad_norm": 0.47635870334783337, "learning_rate": 1.9744969888378507e-06, "loss": 0.2603, "loss_nan_ranks": 0, "loss_rank_avg": 0.27210959792137146, "step": 8000, "valid_targets_mean": 3909.9, "valid_targets_min": 725 }, { "epoch": 6.10602593440122, "grad_norm": 0.4897149992424955, "learning_rate": 1.958049565499651e-06, "loss": 0.2607, "loss_nan_ranks": 0, "loss_rank_avg": 0.2656501829624176, "step": 8005, "valid_targets_mean": 3961.4, "valid_targets_min": 1059 }, { "epoch": 6.109839816933638, "grad_norm": 0.49644054743886196, "learning_rate": 1.9416674053331874e-06, "loss": 0.2759, "loss_nan_ranks": 0, "loss_rank_avg": 0.2539803385734558, "step": 8010, "valid_targets_mean": 4016.4, "valid_targets_min": 981 }, { "epoch": 6.113653699466057, "grad_norm": 0.45827090956821354, "learning_rate": 1.9253505675976637e-06, "loss": 0.2392, "loss_nan_ranks": 0, "loss_rank_avg": 0.2474987506866455, "step": 8015, "valid_targets_mean": 4490.6, "valid_targets_min": 1025 }, { "epoch": 6.117467581998475, "grad_norm": 0.532130189641217, "learning_rate": 1.9090991113160063e-06, "loss": 0.2597, "loss_nan_ranks": 0, "loss_rank_avg": 0.2694808542728424, "step": 8020, "valid_targets_mean": 3972.2, "valid_targets_min": 419 }, { "epoch": 6.121281464530893, "grad_norm": 0.48835300034807266, "learning_rate": 1.8929130952746221e-06, "loss": 0.2653, "loss_nan_ranks": 0, "loss_rank_avg": 0.2953863739967346, "step": 8025, "valid_targets_mean": 4520.6, "valid_targets_min": 972 }, { "epoch": 6.1250953470633105, "grad_norm": 0.666454281494576, "learning_rate": 1.8767925780232165e-06, "loss": 0.3891, "loss_nan_ranks": 0, "loss_rank_avg": 0.2826656997203827, "step": 8030, "valid_targets_mean": 2480.5, "valid_targets_min": 586 }, { "epoch": 6.128909229595728, "grad_norm": 0.44612454771434085, "learning_rate": 1.8607376178745507e-06, "loss": 0.268, "loss_nan_ranks": 0, "loss_rank_avg": 0.26308444142341614, "step": 8035, "valid_targets_mean": 4591.0, "valid_targets_min": 1422 }, { "epoch": 6.132723112128146, "grad_norm": 0.4826682472062758, "learning_rate": 1.8447482729042575e-06, "loss": 0.2725, "loss_nan_ranks": 0, "loss_rank_avg": 0.25889599323272705, "step": 8040, "valid_targets_mean": 4414.1, "valid_targets_min": 802 }, { "epoch": 6.136536994660564, "grad_norm": 0.5109485985510919, "learning_rate": 1.8288246009506205e-06, "loss": 0.2799, "loss_nan_ranks": 0, "loss_rank_avg": 0.3065207004547119, "step": 8045, "valid_targets_mean": 4242.8, "valid_targets_min": 1180 }, { "epoch": 6.140350877192983, "grad_norm": 0.4985109163800362, "learning_rate": 1.8129666596143525e-06, "loss": 0.2476, "loss_nan_ranks": 0, "loss_rank_avg": 0.2521675229072571, "step": 8050, "valid_targets_mean": 4853.1, "valid_targets_min": 1206 }, { "epoch": 6.144164759725401, "grad_norm": 0.4901306618532278, "learning_rate": 1.7971745062584124e-06, "loss": 0.2657, "loss_nan_ranks": 0, "loss_rank_avg": 0.22057747840881348, "step": 8055, "valid_targets_mean": 3941.9, "valid_targets_min": 771 }, { "epoch": 6.147978642257819, "grad_norm": 0.466196185868008, "learning_rate": 1.7814481980077715e-06, "loss": 0.2694, "loss_nan_ranks": 0, "loss_rank_avg": 0.25427624583244324, "step": 8060, "valid_targets_mean": 4745.8, "valid_targets_min": 1322 }, { "epoch": 6.1517925247902365, "grad_norm": 0.589441832405084, "learning_rate": 1.7657877917492317e-06, "loss": 0.2718, "loss_nan_ranks": 0, "loss_rank_avg": 0.23444731533527374, "step": 8065, "valid_targets_mean": 2909.0, "valid_targets_min": 957 }, { "epoch": 6.155606407322654, "grad_norm": 0.47368781222899703, "learning_rate": 1.750193344131197e-06, "loss": 0.2707, "loss_nan_ranks": 0, "loss_rank_avg": 0.25396108627319336, "step": 8070, "valid_targets_mean": 4479.5, "valid_targets_min": 1510 }, { "epoch": 6.159420289855072, "grad_norm": 0.4450780056952024, "learning_rate": 1.734664911563486e-06, "loss": 0.2399, "loss_nan_ranks": 0, "loss_rank_avg": 0.27313801646232605, "step": 8075, "valid_targets_mean": 4954.8, "valid_targets_min": 1624 }, { "epoch": 6.16323417238749, "grad_norm": 0.48910138411977444, "learning_rate": 1.7192025502171228e-06, "loss": 0.2488, "loss_nan_ranks": 0, "loss_rank_avg": 0.22142617404460907, "step": 8080, "valid_targets_mean": 4333.7, "valid_targets_min": 861 }, { "epoch": 6.167048054919908, "grad_norm": 0.48170174354701956, "learning_rate": 1.7038063160241192e-06, "loss": 0.258, "loss_nan_ranks": 0, "loss_rank_avg": 0.2735546827316284, "step": 8085, "valid_targets_mean": 4614.9, "valid_targets_min": 1063 }, { "epoch": 6.170861937452327, "grad_norm": 0.4854645935841226, "learning_rate": 1.6884762646773033e-06, "loss": 0.259, "loss_nan_ranks": 0, "loss_rank_avg": 0.21456031501293182, "step": 8090, "valid_targets_mean": 3828.2, "valid_targets_min": 1029 }, { "epoch": 6.174675819984745, "grad_norm": 0.5193233563509866, "learning_rate": 1.673212451630084e-06, "loss": 0.2487, "loss_nan_ranks": 0, "loss_rank_avg": 0.23842072486877441, "step": 8095, "valid_targets_mean": 4357.5, "valid_targets_min": 1403 }, { "epoch": 6.178489702517163, "grad_norm": 0.46674004165837635, "learning_rate": 1.658014932096279e-06, "loss": 0.2733, "loss_nan_ranks": 0, "loss_rank_avg": 0.2715775668621063, "step": 8100, "valid_targets_mean": 4991.6, "valid_targets_min": 1196 }, { "epoch": 6.18230358504958, "grad_norm": 0.4395211421948986, "learning_rate": 1.6428837610498871e-06, "loss": 0.2543, "loss_nan_ranks": 0, "loss_rank_avg": 0.22720418870449066, "step": 8105, "valid_targets_mean": 4861.5, "valid_targets_min": 1284 }, { "epoch": 6.186117467581998, "grad_norm": 0.4452513509591422, "learning_rate": 1.6278189932249254e-06, "loss": 0.2571, "loss_nan_ranks": 0, "loss_rank_avg": 0.2689577043056488, "step": 8110, "valid_targets_mean": 5120.7, "valid_targets_min": 1014 }, { "epoch": 6.189931350114416, "grad_norm": 0.46574167515943166, "learning_rate": 1.6128206831151882e-06, "loss": 0.263, "loss_nan_ranks": 0, "loss_rank_avg": 0.2244655340909958, "step": 8115, "valid_targets_mean": 5011.2, "valid_targets_min": 447 }, { "epoch": 6.193745232646834, "grad_norm": 0.4524835605573105, "learning_rate": 1.5978888849740859e-06, "loss": 0.2717, "loss_nan_ranks": 0, "loss_rank_avg": 0.3081461489200592, "step": 8120, "valid_targets_mean": 5331.9, "valid_targets_min": 780 }, { "epoch": 6.197559115179253, "grad_norm": 0.4590513523291447, "learning_rate": 1.5830236528144393e-06, "loss": 0.2477, "loss_nan_ranks": 0, "loss_rank_avg": 0.2569229304790497, "step": 8125, "valid_targets_mean": 4720.4, "valid_targets_min": 1129 }, { "epoch": 6.201372997711671, "grad_norm": 0.49349920923341595, "learning_rate": 1.5682250404082644e-06, "loss": 0.2524, "loss_nan_ranks": 0, "loss_rank_avg": 0.239435076713562, "step": 8130, "valid_targets_mean": 4415.0, "valid_targets_min": 1096 }, { "epoch": 6.205186880244089, "grad_norm": 0.4835711092547128, "learning_rate": 1.5534931012866073e-06, "loss": 0.2781, "loss_nan_ranks": 0, "loss_rank_avg": 0.28328731656074524, "step": 8135, "valid_targets_mean": 5174.2, "valid_targets_min": 728 }, { "epoch": 6.2090007627765065, "grad_norm": 0.469441730252239, "learning_rate": 1.5388278887393248e-06, "loss": 0.2621, "loss_nan_ranks": 0, "loss_rank_avg": 0.25443562865257263, "step": 8140, "valid_targets_mean": 4408.7, "valid_targets_min": 1133 }, { "epoch": 6.212814645308924, "grad_norm": 0.5158535576190626, "learning_rate": 1.5242294558149185e-06, "loss": 0.2725, "loss_nan_ranks": 0, "loss_rank_avg": 0.2312001734972, "step": 8145, "valid_targets_mean": 3657.9, "valid_targets_min": 437 }, { "epoch": 6.216628527841342, "grad_norm": 0.553127176309931, "learning_rate": 1.5096978553203113e-06, "loss": 0.2802, "loss_nan_ranks": 0, "loss_rank_avg": 0.30233147740364075, "step": 8150, "valid_targets_mean": 3667.6, "valid_targets_min": 924 }, { "epoch": 6.22044241037376, "grad_norm": 0.48795105972995456, "learning_rate": 1.4952331398206887e-06, "loss": 0.2551, "loss_nan_ranks": 0, "loss_rank_avg": 0.20166908204555511, "step": 8155, "valid_targets_mean": 3893.6, "valid_targets_min": 259 }, { "epoch": 6.224256292906179, "grad_norm": 0.4551850427448832, "learning_rate": 1.480835361639279e-06, "loss": 0.2637, "loss_nan_ranks": 0, "loss_rank_avg": 0.29251715540885925, "step": 8160, "valid_targets_mean": 5185.8, "valid_targets_min": 877 }, { "epoch": 6.228070175438597, "grad_norm": 0.4373875864246496, "learning_rate": 1.4665045728571882e-06, "loss": 0.2966, "loss_nan_ranks": 0, "loss_rank_avg": 0.2827031910419464, "step": 8165, "valid_targets_mean": 4935.5, "valid_targets_min": 1328 }, { "epoch": 6.231884057971015, "grad_norm": 0.4731594753863616, "learning_rate": 1.4522408253132025e-06, "loss": 0.2573, "loss_nan_ranks": 0, "loss_rank_avg": 0.2341814786195755, "step": 8170, "valid_targets_mean": 4701.2, "valid_targets_min": 1053 }, { "epoch": 6.2356979405034325, "grad_norm": 0.5056521083824401, "learning_rate": 1.4380441706035853e-06, "loss": 0.2812, "loss_nan_ranks": 0, "loss_rank_avg": 0.2901335060596466, "step": 8175, "valid_targets_mean": 4571.2, "valid_targets_min": 1179 }, { "epoch": 6.23951182303585, "grad_norm": 0.4462897818037207, "learning_rate": 1.4239146600819242e-06, "loss": 0.2594, "loss_nan_ranks": 0, "loss_rank_avg": 0.3010201156139374, "step": 8180, "valid_targets_mean": 5367.0, "valid_targets_min": 1576 }, { "epoch": 6.243325705568268, "grad_norm": 0.4739465545428769, "learning_rate": 1.4098523448589085e-06, "loss": 0.2672, "loss_nan_ranks": 0, "loss_rank_avg": 0.2658689618110657, "step": 8185, "valid_targets_mean": 4513.1, "valid_targets_min": 1114 }, { "epoch": 6.247139588100686, "grad_norm": 0.5728493918682379, "learning_rate": 1.395857275802177e-06, "loss": 0.2596, "loss_nan_ranks": 0, "loss_rank_avg": 0.27031782269477844, "step": 8190, "valid_targets_mean": 3563.4, "valid_targets_min": 1235 }, { "epoch": 6.250953470633105, "grad_norm": 1.3211397960464706, "learning_rate": 1.3819295035361058e-06, "loss": 0.4452, "loss_nan_ranks": 0, "loss_rank_avg": 0.4577854573726654, "step": 8195, "valid_targets_mean": 904.5, "valid_targets_min": 535 }, { "epoch": 6.254767353165523, "grad_norm": 0.45784081080185146, "learning_rate": 1.3680690784416518e-06, "loss": 0.2848, "loss_nan_ranks": 0, "loss_rank_avg": 0.2961617410182953, "step": 8200, "valid_targets_mean": 5407.8, "valid_targets_min": 967 }, { "epoch": 6.258581235697941, "grad_norm": 0.46998051084917214, "learning_rate": 1.3542760506561425e-06, "loss": 0.2632, "loss_nan_ranks": 0, "loss_rank_avg": 0.2554444372653961, "step": 8205, "valid_targets_mean": 4629.0, "valid_targets_min": 942 }, { "epoch": 6.2623951182303585, "grad_norm": 0.5663180562707967, "learning_rate": 1.3405504700731187e-06, "loss": 0.2623, "loss_nan_ranks": 0, "loss_rank_avg": 0.27484387159347534, "step": 8210, "valid_targets_mean": 3721.8, "valid_targets_min": 1239 }, { "epoch": 6.266209000762776, "grad_norm": 0.5004847910957235, "learning_rate": 1.3268923863421446e-06, "loss": 0.2693, "loss_nan_ranks": 0, "loss_rank_avg": 0.23197054862976074, "step": 8215, "valid_targets_mean": 3964.7, "valid_targets_min": 1498 }, { "epoch": 6.270022883295194, "grad_norm": 0.5283419533962973, "learning_rate": 1.3133018488686178e-06, "loss": 0.2744, "loss_nan_ranks": 0, "loss_rank_avg": 0.2701933979988098, "step": 8220, "valid_targets_mean": 3617.1, "valid_targets_min": 1119 }, { "epoch": 6.273836765827612, "grad_norm": 0.42300879977149064, "learning_rate": 1.2997789068136179e-06, "loss": 0.2622, "loss_nan_ranks": 0, "loss_rank_avg": 0.26573577523231506, "step": 8225, "valid_targets_mean": 5194.5, "valid_targets_min": 506 }, { "epoch": 6.27765064836003, "grad_norm": 0.49915292987260135, "learning_rate": 1.2863236090936914e-06, "loss": 0.2468, "loss_nan_ranks": 0, "loss_rank_avg": 0.2291276901960373, "step": 8230, "valid_targets_mean": 3968.0, "valid_targets_min": 1443 }, { "epoch": 6.281464530892449, "grad_norm": 0.4814365648176594, "learning_rate": 1.2729360043807115e-06, "loss": 0.266, "loss_nan_ranks": 0, "loss_rank_avg": 0.2721117436885834, "step": 8235, "valid_targets_mean": 4163.8, "valid_targets_min": 1016 }, { "epoch": 6.285278413424867, "grad_norm": 0.4584146356424767, "learning_rate": 1.2596161411016761e-06, "loss": 0.2544, "loss_nan_ranks": 0, "loss_rank_avg": 0.2678042948246002, "step": 8240, "valid_targets_mean": 4794.0, "valid_targets_min": 1423 }, { "epoch": 6.289092295957285, "grad_norm": 0.5086223883422862, "learning_rate": 1.2463640674385458e-06, "loss": 0.2456, "loss_nan_ranks": 0, "loss_rank_avg": 0.28021755814552307, "step": 8245, "valid_targets_mean": 4818.8, "valid_targets_min": 1828 }, { "epoch": 6.2929061784897025, "grad_norm": 0.49136585702620744, "learning_rate": 1.233179831328062e-06, "loss": 0.2471, "loss_nan_ranks": 0, "loss_rank_avg": 0.23660731315612793, "step": 8250, "valid_targets_mean": 3634.5, "valid_targets_min": 1127 }, { "epoch": 6.29672006102212, "grad_norm": 0.53884264245829, "learning_rate": 1.2200634804615818e-06, "loss": 0.2497, "loss_nan_ranks": 0, "loss_rank_avg": 0.22205261886119843, "step": 8255, "valid_targets_mean": 3687.9, "valid_targets_min": 436 }, { "epoch": 6.300533943554538, "grad_norm": 0.48947114458130897, "learning_rate": 1.207015062284902e-06, "loss": 0.2603, "loss_nan_ranks": 0, "loss_rank_avg": 0.2426479309797287, "step": 8260, "valid_targets_mean": 3859.2, "valid_targets_min": 1237 }, { "epoch": 6.304347826086957, "grad_norm": 0.4567633292464014, "learning_rate": 1.1940346239980816e-06, "loss": 0.2586, "loss_nan_ranks": 0, "loss_rank_avg": 0.27313122153282166, "step": 8265, "valid_targets_mean": 4842.5, "valid_targets_min": 1110 }, { "epoch": 6.308161708619375, "grad_norm": 0.4995871522429241, "learning_rate": 1.1811222125552768e-06, "loss": 0.2682, "loss_nan_ranks": 0, "loss_rank_avg": 0.2652623951435089, "step": 8270, "valid_targets_mean": 3800.2, "valid_targets_min": 637 }, { "epoch": 6.311975591151793, "grad_norm": 0.5468633135839358, "learning_rate": 1.1682778746645652e-06, "loss": 0.2459, "loss_nan_ranks": 0, "loss_rank_avg": 0.27540352940559387, "step": 8275, "valid_targets_mean": 4041.3, "valid_targets_min": 931 }, { "epoch": 6.315789473684211, "grad_norm": 0.5313235594410799, "learning_rate": 1.1555016567877985e-06, "loss": 0.2524, "loss_nan_ranks": 0, "loss_rank_avg": 0.2507777214050293, "step": 8280, "valid_targets_mean": 3945.6, "valid_targets_min": 872 }, { "epoch": 6.3196033562166285, "grad_norm": 0.630105166821167, "learning_rate": 1.1427936051403977e-06, "loss": 0.2511, "loss_nan_ranks": 0, "loss_rank_avg": 0.21576042473316193, "step": 8285, "valid_targets_mean": 2889.1, "valid_targets_min": 734 }, { "epoch": 6.323417238749046, "grad_norm": 0.4653648737455474, "learning_rate": 1.1301537656912175e-06, "loss": 0.2575, "loss_nan_ranks": 0, "loss_rank_avg": 0.28202584385871887, "step": 8290, "valid_targets_mean": 4816.4, "valid_targets_min": 1084 }, { "epoch": 6.327231121281464, "grad_norm": 0.5166525372254579, "learning_rate": 1.1175821841623712e-06, "loss": 0.255, "loss_nan_ranks": 0, "loss_rank_avg": 0.2229657620191574, "step": 8295, "valid_targets_mean": 3587.4, "valid_targets_min": 1143 }, { "epoch": 6.331045003813882, "grad_norm": 0.4833110267231946, "learning_rate": 1.1050789060290534e-06, "loss": 0.2642, "loss_nan_ranks": 0, "loss_rank_avg": 0.2544369101524353, "step": 8300, "valid_targets_mean": 4295.7, "valid_targets_min": 1226 }, { "epoch": 6.334858886346301, "grad_norm": 0.5346116958118867, "learning_rate": 1.0926439765193898e-06, "loss": 0.2415, "loss_nan_ranks": 0, "loss_rank_avg": 0.22066330909729004, "step": 8305, "valid_targets_mean": 3234.5, "valid_targets_min": 279 }, { "epoch": 6.338672768878719, "grad_norm": 0.5235801033937233, "learning_rate": 1.080277440614268e-06, "loss": 0.2651, "loss_nan_ranks": 0, "loss_rank_avg": 0.30774369835853577, "step": 8310, "valid_targets_mean": 4542.8, "valid_targets_min": 1109 }, { "epoch": 6.342486651411137, "grad_norm": 0.48340978591910344, "learning_rate": 1.0679793430471763e-06, "loss": 0.2639, "loss_nan_ranks": 0, "loss_rank_avg": 0.2984248399734497, "step": 8315, "valid_targets_mean": 4806.4, "valid_targets_min": 837 }, { "epoch": 6.3463005339435545, "grad_norm": 0.4839962726354207, "learning_rate": 1.055749728304034e-06, "loss": 0.2497, "loss_nan_ranks": 0, "loss_rank_avg": 0.24378865957260132, "step": 8320, "valid_targets_mean": 4818.2, "valid_targets_min": 1553 }, { "epoch": 6.350114416475972, "grad_norm": 0.48547846148092877, "learning_rate": 1.0435886406230522e-06, "loss": 0.2643, "loss_nan_ranks": 0, "loss_rank_avg": 0.29921552538871765, "step": 8325, "valid_targets_mean": 4799.2, "valid_targets_min": 720 }, { "epoch": 6.35392829900839, "grad_norm": 0.4826226506202875, "learning_rate": 1.031496123994542e-06, "loss": 0.2591, "loss_nan_ranks": 0, "loss_rank_avg": 0.2462555170059204, "step": 8330, "valid_targets_mean": 5017.3, "valid_targets_min": 1309 }, { "epoch": 6.357742181540808, "grad_norm": 0.5422536322203456, "learning_rate": 1.0194722221607823e-06, "loss": 0.2462, "loss_nan_ranks": 0, "loss_rank_avg": 0.23788587749004364, "step": 8335, "valid_targets_mean": 4561.3, "valid_targets_min": 1150 }, { "epoch": 6.361556064073227, "grad_norm": 0.4923820461404623, "learning_rate": 1.0075169786158544e-06, "loss": 0.2648, "loss_nan_ranks": 0, "loss_rank_avg": 0.28204765915870667, "step": 8340, "valid_targets_mean": 4894.0, "valid_targets_min": 773 }, { "epoch": 6.365369946605645, "grad_norm": 0.5055193746390563, "learning_rate": 9.956304366054682e-07, "loss": 0.2426, "loss_nan_ranks": 0, "loss_rank_avg": 0.22904770076274872, "step": 8345, "valid_targets_mean": 4334.6, "valid_targets_min": 1197 }, { "epoch": 6.369183829138063, "grad_norm": 0.4496958094342579, "learning_rate": 9.838126391268377e-07, "loss": 0.2505, "loss_nan_ranks": 0, "loss_rank_avg": 0.210269495844841, "step": 8350, "valid_targets_mean": 4551.9, "valid_targets_min": 900 }, { "epoch": 6.372997711670481, "grad_norm": 0.42807004915669006, "learning_rate": 9.720636289284878e-07, "loss": 0.2441, "loss_nan_ranks": 0, "loss_rank_avg": 0.2618262469768524, "step": 8355, "valid_targets_mean": 5323.6, "valid_targets_min": 942 }, { "epoch": 6.3768115942028984, "grad_norm": 0.5431535643885081, "learning_rate": 9.603834485101381e-07, "loss": 0.3526, "loss_nan_ranks": 0, "loss_rank_avg": 0.27988871932029724, "step": 8360, "valid_targets_mean": 3949.1, "valid_targets_min": 1206 }, { "epoch": 6.380625476735316, "grad_norm": 0.5151995528629127, "learning_rate": 9.487721401225137e-07, "loss": 0.2761, "loss_nan_ranks": 0, "loss_rank_avg": 0.27052268385887146, "step": 8365, "valid_targets_mean": 3915.1, "valid_targets_min": 977 }, { "epoch": 6.384439359267734, "grad_norm": 0.4529826695504075, "learning_rate": 9.372297457672231e-07, "loss": 0.2643, "loss_nan_ranks": 0, "loss_rank_avg": 0.260204017162323, "step": 8370, "valid_targets_mean": 5037.4, "valid_targets_min": 268 }, { "epoch": 6.388253241800153, "grad_norm": 0.476253361507551, "learning_rate": 9.257563071965792e-07, "loss": 0.2633, "loss_nan_ranks": 0, "loss_rank_avg": 0.2602754533290863, "step": 8375, "valid_targets_mean": 4367.5, "valid_targets_min": 1371 }, { "epoch": 6.392067124332571, "grad_norm": 0.4609825503411047, "learning_rate": 9.143518659134676e-07, "loss": 0.2583, "loss_nan_ranks": 0, "loss_rank_avg": 0.2888159453868866, "step": 8380, "valid_targets_mean": 4771.2, "valid_targets_min": 1556 }, { "epoch": 6.395881006864989, "grad_norm": 0.4615228842972912, "learning_rate": 9.030164631711957e-07, "loss": 0.2691, "loss_nan_ranks": 0, "loss_rank_avg": 0.2512037456035614, "step": 8385, "valid_targets_mean": 4216.5, "valid_targets_min": 1181 }, { "epoch": 6.399694889397407, "grad_norm": 0.4783617043494897, "learning_rate": 8.917501399733219e-07, "loss": 0.2624, "loss_nan_ranks": 0, "loss_rank_avg": 0.31296250224113464, "step": 8390, "valid_targets_mean": 5034.9, "valid_targets_min": 1488 }, { "epoch": 6.4035087719298245, "grad_norm": 0.4554766870515671, "learning_rate": 8.805529370735378e-07, "loss": 0.256, "loss_nan_ranks": 0, "loss_rank_avg": 0.24182575941085815, "step": 8395, "valid_targets_mean": 4342.8, "valid_targets_min": 1501 }, { "epoch": 6.407322654462242, "grad_norm": 0.49378415215503346, "learning_rate": 8.694248949754991e-07, "loss": 0.2506, "loss_nan_ranks": 0, "loss_rank_avg": 0.227997824549675, "step": 8400, "valid_targets_mean": 3916.5, "valid_targets_min": 1133 }, { "epoch": 6.41113653699466, "grad_norm": 0.5026431344870141, "learning_rate": 8.583660539326911e-07, "loss": 0.2679, "loss_nan_ranks": 0, "loss_rank_avg": 0.28937292098999023, "step": 8405, "valid_targets_mean": 4306.0, "valid_targets_min": 1533 }, { "epoch": 6.414950419527079, "grad_norm": 0.4789425873369109, "learning_rate": 8.473764539482654e-07, "loss": 0.2613, "loss_nan_ranks": 0, "loss_rank_avg": 0.24315117299556732, "step": 8410, "valid_targets_mean": 4329.9, "valid_targets_min": 1148 }, { "epoch": 6.418764302059497, "grad_norm": 0.44425281965231356, "learning_rate": 8.364561347749279e-07, "loss": 0.2467, "loss_nan_ranks": 0, "loss_rank_avg": 0.2703532874584198, "step": 8415, "valid_targets_mean": 5093.1, "valid_targets_min": 360 }, { "epoch": 6.422578184591915, "grad_norm": 0.4504345015374403, "learning_rate": 8.256051359147554e-07, "loss": 0.2733, "loss_nan_ranks": 0, "loss_rank_avg": 0.3007253408432007, "step": 8420, "valid_targets_mean": 5373.0, "valid_targets_min": 338 }, { "epoch": 6.426392067124333, "grad_norm": 0.49903685482553933, "learning_rate": 8.14823496619086e-07, "loss": 0.2438, "loss_nan_ranks": 0, "loss_rank_avg": 0.22903098165988922, "step": 8425, "valid_targets_mean": 3829.9, "valid_targets_min": 1259 }, { "epoch": 6.4302059496567505, "grad_norm": 0.5012525211737092, "learning_rate": 8.041112558883557e-07, "loss": 0.2609, "loss_nan_ranks": 0, "loss_rank_avg": 0.2882510721683502, "step": 8430, "valid_targets_mean": 4023.9, "valid_targets_min": 1054 }, { "epoch": 6.434019832189168, "grad_norm": 0.5099919723651475, "learning_rate": 7.934684524719683e-07, "loss": 0.2544, "loss_nan_ranks": 0, "loss_rank_avg": 0.2546488344669342, "step": 8435, "valid_targets_mean": 4289.2, "valid_targets_min": 426 }, { "epoch": 6.437833714721586, "grad_norm": 0.4654407478835626, "learning_rate": 7.828951248681505e-07, "loss": 0.2426, "loss_nan_ranks": 0, "loss_rank_avg": 0.24574923515319824, "step": 8440, "valid_targets_mean": 4327.0, "valid_targets_min": 1432 }, { "epoch": 6.441647597254004, "grad_norm": 0.4612414886820737, "learning_rate": 7.723913113238146e-07, "loss": 0.2378, "loss_nan_ranks": 0, "loss_rank_avg": 0.19901114702224731, "step": 8445, "valid_targets_mean": 3979.3, "valid_targets_min": 1352 }, { "epoch": 6.445461479786423, "grad_norm": 0.5342280212284785, "learning_rate": 7.619570498344209e-07, "loss": 0.2532, "loss_nan_ranks": 0, "loss_rank_avg": 0.2609269618988037, "step": 8450, "valid_targets_mean": 3531.6, "valid_targets_min": 1374 }, { "epoch": 6.449275362318841, "grad_norm": 0.5046481339850619, "learning_rate": 7.51592378143835e-07, "loss": 0.2454, "loss_nan_ranks": 0, "loss_rank_avg": 0.2273874282836914, "step": 8455, "valid_targets_mean": 4145.7, "valid_targets_min": 894 }, { "epoch": 6.453089244851259, "grad_norm": 0.5046175752574743, "learning_rate": 7.412973337441997e-07, "loss": 0.2562, "loss_nan_ranks": 0, "loss_rank_avg": 0.24711179733276367, "step": 8460, "valid_targets_mean": 3831.0, "valid_targets_min": 970 }, { "epoch": 6.4569031273836766, "grad_norm": 0.5089035875525534, "learning_rate": 7.310719538757927e-07, "loss": 0.2479, "loss_nan_ranks": 0, "loss_rank_avg": 0.24454724788665771, "step": 8465, "valid_targets_mean": 4124.6, "valid_targets_min": 392 }, { "epoch": 6.460717009916094, "grad_norm": 0.46416602732457035, "learning_rate": 7.209162755268928e-07, "loss": 0.2618, "loss_nan_ranks": 0, "loss_rank_avg": 0.25188159942626953, "step": 8470, "valid_targets_mean": 4515.6, "valid_targets_min": 1454 }, { "epoch": 6.464530892448512, "grad_norm": 0.4499441231883731, "learning_rate": 7.108303354336544e-07, "loss": 0.2741, "loss_nan_ranks": 0, "loss_rank_avg": 0.28176894783973694, "step": 8475, "valid_targets_mean": 5149.5, "valid_targets_min": 1237 }, { "epoch": 6.46834477498093, "grad_norm": 0.8435636493276955, "learning_rate": 7.008141700799531e-07, "loss": 0.2854, "loss_nan_ranks": 0, "loss_rank_avg": 0.30925872921943665, "step": 8480, "valid_targets_mean": 5316.2, "valid_targets_min": 2132 }, { "epoch": 6.472158657513349, "grad_norm": 0.4849813862200653, "learning_rate": 6.90867815697287e-07, "loss": 0.2565, "loss_nan_ranks": 0, "loss_rank_avg": 0.25278136134147644, "step": 8485, "valid_targets_mean": 4548.2, "valid_targets_min": 1677 }, { "epoch": 6.475972540045767, "grad_norm": 0.46129805261149925, "learning_rate": 6.809913082646113e-07, "loss": 0.2631, "loss_nan_ranks": 0, "loss_rank_avg": 0.25576576590538025, "step": 8490, "valid_targets_mean": 4950.3, "valid_targets_min": 917 }, { "epoch": 6.479786422578185, "grad_norm": 0.626575600377628, "learning_rate": 6.711846835082325e-07, "loss": 0.2798, "loss_nan_ranks": 0, "loss_rank_avg": 0.2927459180355072, "step": 8495, "valid_targets_mean": 4252.6, "valid_targets_min": 1206 }, { "epoch": 6.483600305110603, "grad_norm": 0.5192502057353363, "learning_rate": 6.614479769016657e-07, "loss": 0.255, "loss_nan_ranks": 0, "loss_rank_avg": 0.238042950630188, "step": 8500, "valid_targets_mean": 3840.0, "valid_targets_min": 828 }, { "epoch": 6.4874141876430205, "grad_norm": 0.4570662293657686, "learning_rate": 6.517812236655152e-07, "loss": 0.2415, "loss_nan_ranks": 0, "loss_rank_avg": 0.25383320450782776, "step": 8505, "valid_targets_mean": 4537.5, "valid_targets_min": 1112 }, { "epoch": 6.491228070175438, "grad_norm": 0.5727447284814335, "learning_rate": 6.421844587673365e-07, "loss": 0.2563, "loss_nan_ranks": 0, "loss_rank_avg": 0.26463204622268677, "step": 8510, "valid_targets_mean": 5026.8, "valid_targets_min": 1170 }, { "epoch": 6.495041952707856, "grad_norm": 0.47162991186897507, "learning_rate": 6.326577169215231e-07, "loss": 0.2579, "loss_nan_ranks": 0, "loss_rank_avg": 0.26361772418022156, "step": 8515, "valid_targets_mean": 5021.2, "valid_targets_min": 952 }, { "epoch": 6.498855835240275, "grad_norm": 1.3899956907574107, "learning_rate": 6.232010325891735e-07, "loss": 0.3976, "loss_nan_ranks": 0, "loss_rank_avg": 0.4216398000717163, "step": 8520, "valid_targets_mean": 790.2, "valid_targets_min": 583 }, { "epoch": 6.502669717772693, "grad_norm": 0.4694331442372106, "learning_rate": 6.1381443997796e-07, "loss": 0.2616, "loss_nan_ranks": 0, "loss_rank_avg": 0.26441314816474915, "step": 8525, "valid_targets_mean": 4803.4, "valid_targets_min": 839 }, { "epoch": 6.506483600305111, "grad_norm": 0.5044007854322652, "learning_rate": 6.044979730420198e-07, "loss": 0.25, "loss_nan_ranks": 0, "loss_rank_avg": 0.21473665535449982, "step": 8530, "valid_targets_mean": 3430.1, "valid_targets_min": 613 }, { "epoch": 6.510297482837529, "grad_norm": 0.5403224413072797, "learning_rate": 5.952516654818197e-07, "loss": 0.2719, "loss_nan_ranks": 0, "loss_rank_avg": 0.2875039875507355, "step": 8535, "valid_targets_mean": 3952.5, "valid_targets_min": 1128 }, { "epoch": 6.5141113653699465, "grad_norm": 0.43010869493650594, "learning_rate": 5.86075550744043e-07, "loss": 0.2446, "loss_nan_ranks": 0, "loss_rank_avg": 0.2839283049106598, "step": 8540, "valid_targets_mean": 6165.4, "valid_targets_min": 1886 }, { "epoch": 6.517925247902364, "grad_norm": 0.442055090560568, "learning_rate": 5.769696620214582e-07, "loss": 0.2562, "loss_nan_ranks": 0, "loss_rank_avg": 0.264087051153183, "step": 8545, "valid_targets_mean": 5245.8, "valid_targets_min": 1233 }, { "epoch": 6.521739130434782, "grad_norm": 0.5380539845910357, "learning_rate": 5.679340322528126e-07, "loss": 0.2711, "loss_nan_ranks": 0, "loss_rank_avg": 0.26377812027931213, "step": 8550, "valid_targets_mean": 4610.8, "valid_targets_min": 1676 }, { "epoch": 6.525553012967201, "grad_norm": 0.4692104990180008, "learning_rate": 5.589686941226991e-07, "loss": 0.2615, "loss_nan_ranks": 0, "loss_rank_avg": 0.25884586572647095, "step": 8555, "valid_targets_mean": 4473.1, "valid_targets_min": 1297 }, { "epoch": 6.529366895499619, "grad_norm": 0.5133962979482154, "learning_rate": 5.500736800614492e-07, "loss": 0.2552, "loss_nan_ranks": 0, "loss_rank_avg": 0.25123903155326843, "step": 8560, "valid_targets_mean": 4083.8, "valid_targets_min": 1411 }, { "epoch": 6.533180778032037, "grad_norm": 0.6838627983702491, "learning_rate": 5.412490222450095e-07, "loss": 0.2606, "loss_nan_ranks": 0, "loss_rank_avg": 0.2431752234697342, "step": 8565, "valid_targets_mean": 4096.5, "valid_targets_min": 1368 }, { "epoch": 6.536994660564455, "grad_norm": 0.4805436149387146, "learning_rate": 5.324947525948254e-07, "loss": 0.2469, "loss_nan_ranks": 0, "loss_rank_avg": 0.2567639648914337, "step": 8570, "valid_targets_mean": 4516.2, "valid_targets_min": 1309 }, { "epoch": 6.5408085430968725, "grad_norm": 0.454962448002056, "learning_rate": 5.238109027777283e-07, "loss": 0.2638, "loss_nan_ranks": 0, "loss_rank_avg": 0.2514365613460541, "step": 8575, "valid_targets_mean": 4904.3, "valid_targets_min": 1127 }, { "epoch": 6.54462242562929, "grad_norm": 0.4793575688943854, "learning_rate": 5.151975042058244e-07, "loss": 0.2482, "loss_nan_ranks": 0, "loss_rank_avg": 0.24711287021636963, "step": 8580, "valid_targets_mean": 4137.0, "valid_targets_min": 806 }, { "epoch": 6.548436308161708, "grad_norm": 0.4801693917051084, "learning_rate": 5.066545880363638e-07, "loss": 0.2843, "loss_nan_ranks": 0, "loss_rank_avg": 0.27172407507896423, "step": 8585, "valid_targets_mean": 4103.1, "valid_targets_min": 818 }, { "epoch": 6.552250190694126, "grad_norm": 0.4288887079935217, "learning_rate": 4.981821851716562e-07, "loss": 0.2641, "loss_nan_ranks": 0, "loss_rank_avg": 0.2810297906398773, "step": 8590, "valid_targets_mean": 5950.1, "valid_targets_min": 1457 }, { "epoch": 6.556064073226545, "grad_norm": 0.447417911964289, "learning_rate": 4.897803262589285e-07, "loss": 0.2561, "loss_nan_ranks": 0, "loss_rank_avg": 0.2641676962375641, "step": 8595, "valid_targets_mean": 4733.5, "valid_targets_min": 1069 }, { "epoch": 6.559877955758963, "grad_norm": 0.5130635758947727, "learning_rate": 4.814490416902451e-07, "loss": 0.2646, "loss_nan_ranks": 0, "loss_rank_avg": 0.28340986371040344, "step": 8600, "valid_targets_mean": 4399.0, "valid_targets_min": 946 }, { "epoch": 6.563691838291381, "grad_norm": 0.48860800754653405, "learning_rate": 4.731883616023658e-07, "loss": 0.268, "loss_nan_ranks": 0, "loss_rank_avg": 0.23458512127399445, "step": 8605, "valid_targets_mean": 4400.2, "valid_targets_min": 1848 }, { "epoch": 6.567505720823799, "grad_norm": 0.4486519842249868, "learning_rate": 4.649983158766658e-07, "loss": 0.2389, "loss_nan_ranks": 0, "loss_rank_avg": 0.2617599070072174, "step": 8610, "valid_targets_mean": 5128.7, "valid_targets_min": 1255 }, { "epoch": 6.5713196033562165, "grad_norm": 0.4613068465948873, "learning_rate": 4.568789341390023e-07, "loss": 0.2755, "loss_nan_ranks": 0, "loss_rank_avg": 0.2712768614292145, "step": 8615, "valid_targets_mean": 5012.1, "valid_targets_min": 613 }, { "epoch": 6.575133485888634, "grad_norm": 0.5413147396470408, "learning_rate": 4.4883024575963055e-07, "loss": 0.2535, "loss_nan_ranks": 0, "loss_rank_avg": 0.25305524468421936, "step": 8620, "valid_targets_mean": 3542.5, "valid_targets_min": 1116 }, { "epoch": 6.578947368421053, "grad_norm": 0.47959906526653856, "learning_rate": 4.40852279853079e-07, "loss": 0.2732, "loss_nan_ranks": 0, "loss_rank_avg": 0.3105383813381195, "step": 8625, "valid_targets_mean": 4613.8, "valid_targets_min": 1458 }, { "epoch": 6.582761250953471, "grad_norm": 0.5194487070204782, "learning_rate": 4.3294506527805425e-07, "loss": 0.2664, "loss_nan_ranks": 0, "loss_rank_avg": 0.2872951626777649, "step": 8630, "valid_targets_mean": 4815.3, "valid_targets_min": 496 }, { "epoch": 6.586575133485889, "grad_norm": 0.5190367669623117, "learning_rate": 4.2510863063734087e-07, "loss": 0.271, "loss_nan_ranks": 0, "loss_rank_avg": 0.22017668187618256, "step": 8635, "valid_targets_mean": 4139.2, "valid_targets_min": 337 }, { "epoch": 6.590389016018307, "grad_norm": 0.4694041403487881, "learning_rate": 4.173430042776749e-07, "loss": 0.2357, "loss_nan_ranks": 0, "loss_rank_avg": 0.22927264869213104, "step": 8640, "valid_targets_mean": 3980.7, "valid_targets_min": 873 }, { "epoch": 6.594202898550725, "grad_norm": 0.5066127295615718, "learning_rate": 4.0964821428967516e-07, "loss": 0.2563, "loss_nan_ranks": 0, "loss_rank_avg": 0.3201106786727905, "step": 8645, "valid_targets_mean": 4447.3, "valid_targets_min": 959 }, { "epoch": 6.5980167810831425, "grad_norm": 0.4723010578935397, "learning_rate": 4.020242885077097e-07, "loss": 0.2481, "loss_nan_ranks": 0, "loss_rank_avg": 0.2768709659576416, "step": 8650, "valid_targets_mean": 4583.0, "valid_targets_min": 1399 }, { "epoch": 6.60183066361556, "grad_norm": 0.4707835769721507, "learning_rate": 3.944712545098206e-07, "loss": 0.2636, "loss_nan_ranks": 0, "loss_rank_avg": 0.25435635447502136, "step": 8655, "valid_targets_mean": 4408.1, "valid_targets_min": 737 }, { "epoch": 6.605644546147978, "grad_norm": 0.46052357212783235, "learning_rate": 3.8698913961760396e-07, "loss": 0.2419, "loss_nan_ranks": 0, "loss_rank_avg": 0.2501215934753418, "step": 8660, "valid_targets_mean": 4504.2, "valid_targets_min": 1246 }, { "epoch": 6.609458428680397, "grad_norm": 0.5958375550063665, "learning_rate": 3.795779708961278e-07, "loss": 0.2418, "loss_nan_ranks": 0, "loss_rank_avg": 0.24585700035095215, "step": 8665, "valid_targets_mean": 3603.8, "valid_targets_min": 983 }, { "epoch": 6.613272311212815, "grad_norm": 0.44664158445770247, "learning_rate": 3.722377751538187e-07, "loss": 0.2616, "loss_nan_ranks": 0, "loss_rank_avg": 0.2540818154811859, "step": 8670, "valid_targets_mean": 5331.1, "valid_targets_min": 1746 }, { "epoch": 6.617086193745233, "grad_norm": 0.4249148441892047, "learning_rate": 3.6496857894237735e-07, "loss": 0.2545, "loss_nan_ranks": 0, "loss_rank_avg": 0.22584165632724762, "step": 8675, "valid_targets_mean": 4769.4, "valid_targets_min": 468 }, { "epoch": 6.620900076277651, "grad_norm": 0.4972869734589808, "learning_rate": 3.5777040855668356e-07, "loss": 0.2673, "loss_nan_ranks": 0, "loss_rank_avg": 0.2749437391757965, "step": 8680, "valid_targets_mean": 4438.9, "valid_targets_min": 956 }, { "epoch": 6.6247139588100685, "grad_norm": 1.3596860424548278, "learning_rate": 3.506432900346779e-07, "loss": 0.3819, "loss_nan_ranks": 0, "loss_rank_avg": 0.43016377091407776, "step": 8685, "valid_targets_mean": 843.3, "valid_targets_min": 648 }, { "epoch": 6.628527841342486, "grad_norm": 0.4567195254428743, "learning_rate": 3.4358724915730667e-07, "loss": 0.3047, "loss_nan_ranks": 0, "loss_rank_avg": 0.2491716593503952, "step": 8690, "valid_targets_mean": 4938.8, "valid_targets_min": 541 }, { "epoch": 6.632341723874904, "grad_norm": 0.46756573873403356, "learning_rate": 3.366023114483885e-07, "loss": 0.2544, "loss_nan_ranks": 0, "loss_rank_avg": 0.27434781193733215, "step": 8695, "valid_targets_mean": 4699.2, "valid_targets_min": 1459 }, { "epoch": 6.636155606407323, "grad_norm": 0.48085087252841974, "learning_rate": 3.2968850217455216e-07, "loss": 0.2615, "loss_nan_ranks": 0, "loss_rank_avg": 0.2507885694503784, "step": 8700, "valid_targets_mean": 4554.4, "valid_targets_min": 1345 }, { "epoch": 6.639969488939741, "grad_norm": 0.4305286168328577, "learning_rate": 3.228458463451256e-07, "loss": 0.2585, "loss_nan_ranks": 0, "loss_rank_avg": 0.27329325675964355, "step": 8705, "valid_targets_mean": 5775.1, "valid_targets_min": 1627 }, { "epoch": 6.643783371472159, "grad_norm": 0.4335818665288777, "learning_rate": 3.1607436871206043e-07, "loss": 0.231, "loss_nan_ranks": 0, "loss_rank_avg": 0.23998205363750458, "step": 8710, "valid_targets_mean": 5298.2, "valid_targets_min": 965 }, { "epoch": 6.647597254004577, "grad_norm": 0.5511616117071578, "learning_rate": 3.0937409376982975e-07, "loss": 0.2764, "loss_nan_ranks": 0, "loss_rank_avg": 0.279064804315567, "step": 8715, "valid_targets_mean": 4210.8, "valid_targets_min": 1120 }, { "epoch": 6.651411136536995, "grad_norm": 0.49819383972885306, "learning_rate": 3.0274504575534603e-07, "loss": 0.2754, "loss_nan_ranks": 0, "loss_rank_avg": 0.2777750790119171, "step": 8720, "valid_targets_mean": 4362.2, "valid_targets_min": 526 }, { "epoch": 6.655225019069412, "grad_norm": 0.48970859152321294, "learning_rate": 2.9618724864787896e-07, "loss": 0.2701, "loss_nan_ranks": 0, "loss_rank_avg": 0.29505303502082825, "step": 8725, "valid_targets_mean": 4475.5, "valid_targets_min": 1178 }, { "epoch": 6.65903890160183, "grad_norm": 0.5365787991296255, "learning_rate": 2.8970072616895326e-07, "loss": 0.2419, "loss_nan_ranks": 0, "loss_rank_avg": 0.23452679812908173, "step": 8730, "valid_targets_mean": 3625.1, "valid_targets_min": 452 }, { "epoch": 6.662852784134248, "grad_norm": 0.4616599271545656, "learning_rate": 2.8328550178227556e-07, "loss": 0.2462, "loss_nan_ranks": 0, "loss_rank_avg": 0.2593431770801544, "step": 8735, "valid_targets_mean": 4466.4, "valid_targets_min": 1113 }, { "epoch": 6.666666666666667, "grad_norm": 0.6455949927025287, "learning_rate": 2.7694159869364525e-07, "loss": 0.2628, "loss_nan_ranks": 0, "loss_rank_avg": 0.2934395372867584, "step": 8740, "valid_targets_mean": 4677.8, "valid_targets_min": 711 }, { "epoch": 6.670480549199085, "grad_norm": 0.45477101496916916, "learning_rate": 2.706690398508727e-07, "loss": 0.2502, "loss_nan_ranks": 0, "loss_rank_avg": 0.2759816646575928, "step": 8745, "valid_targets_mean": 5200.2, "valid_targets_min": 1401 }, { "epoch": 6.674294431731503, "grad_norm": 0.4579561242619741, "learning_rate": 2.644678479436924e-07, "loss": 0.2648, "loss_nan_ranks": 0, "loss_rank_avg": 0.2668015956878662, "step": 8750, "valid_targets_mean": 4637.0, "valid_targets_min": 1224 }, { "epoch": 6.678108314263921, "grad_norm": 0.5483706726448575, "learning_rate": 2.5833804540368545e-07, "loss": 0.2355, "loss_nan_ranks": 0, "loss_rank_avg": 0.2324792742729187, "step": 8755, "valid_targets_mean": 4207.0, "valid_targets_min": 709 }, { "epoch": 6.6819221967963385, "grad_norm": 0.4616777266359128, "learning_rate": 2.522796544041928e-07, "loss": 0.2498, "loss_nan_ranks": 0, "loss_rank_avg": 0.2218731790781021, "step": 8760, "valid_targets_mean": 4335.9, "valid_targets_min": 510 }, { "epoch": 6.685736079328756, "grad_norm": 0.5125443947686906, "learning_rate": 2.4629269686024195e-07, "loss": 0.2381, "loss_nan_ranks": 0, "loss_rank_avg": 0.2388933151960373, "step": 8765, "valid_targets_mean": 3919.2, "valid_targets_min": 1000 }, { "epoch": 6.689549961861175, "grad_norm": 0.5000080999041109, "learning_rate": 2.4037719442846497e-07, "loss": 0.2499, "loss_nan_ranks": 0, "loss_rank_avg": 0.2521762251853943, "step": 8770, "valid_targets_mean": 4245.3, "valid_targets_min": 1029 }, { "epoch": 6.693363844393593, "grad_norm": 0.4614214393159042, "learning_rate": 2.345331685070118e-07, "loss": 0.2539, "loss_nan_ranks": 0, "loss_rank_avg": 0.2523350417613983, "step": 8775, "valid_targets_mean": 5094.4, "valid_targets_min": 1841 }, { "epoch": 6.697177726926011, "grad_norm": 0.49785359302904225, "learning_rate": 2.2876064023549028e-07, "loss": 0.2484, "loss_nan_ranks": 0, "loss_rank_avg": 0.25749513506889343, "step": 8780, "valid_targets_mean": 3709.2, "valid_targets_min": 423 }, { "epoch": 6.700991609458429, "grad_norm": 0.5382263987761529, "learning_rate": 2.2305963049487068e-07, "loss": 0.2584, "loss_nan_ranks": 0, "loss_rank_avg": 0.28535568714141846, "step": 8785, "valid_targets_mean": 4224.0, "valid_targets_min": 1141 }, { "epoch": 6.704805491990847, "grad_norm": 0.515491071106708, "learning_rate": 2.1743015990742576e-07, "loss": 0.2415, "loss_nan_ranks": 0, "loss_rank_avg": 0.2274818867444992, "step": 8790, "valid_targets_mean": 3546.7, "valid_targets_min": 892 }, { "epoch": 6.7086193745232645, "grad_norm": 0.4904593792098621, "learning_rate": 2.1187224883664425e-07, "loss": 0.2763, "loss_nan_ranks": 0, "loss_rank_avg": 0.23734210431575775, "step": 8795, "valid_targets_mean": 4233.8, "valid_targets_min": 291 }, { "epoch": 6.712433257055682, "grad_norm": 0.4764836214210563, "learning_rate": 2.063859173871685e-07, "loss": 0.2516, "loss_nan_ranks": 0, "loss_rank_avg": 0.25665369629859924, "step": 8800, "valid_targets_mean": 4348.4, "valid_targets_min": 1155 }, { "epoch": 6.7162471395881, "grad_norm": 0.5364539012840841, "learning_rate": 2.009711854047125e-07, "loss": 0.2478, "loss_nan_ranks": 0, "loss_rank_avg": 0.26761090755462646, "step": 8805, "valid_targets_mean": 3480.5, "valid_targets_min": 454 }, { "epoch": 6.720061022120519, "grad_norm": 0.43633373903725753, "learning_rate": 1.956280724759907e-07, "loss": 0.2603, "loss_nan_ranks": 0, "loss_rank_avg": 0.2615395486354828, "step": 8810, "valid_targets_mean": 5068.1, "valid_targets_min": 1043 }, { "epoch": 6.723874904652937, "grad_norm": 0.5009990477100269, "learning_rate": 1.903565979286559e-07, "loss": 0.2437, "loss_nan_ranks": 0, "loss_rank_avg": 0.2951163947582245, "step": 8815, "valid_targets_mean": 4381.7, "valid_targets_min": 984 }, { "epoch": 6.727688787185355, "grad_norm": 0.4884652809586842, "learning_rate": 1.8515678083121936e-07, "loss": 0.2531, "loss_nan_ranks": 0, "loss_rank_avg": 0.24884463846683502, "step": 8820, "valid_targets_mean": 4959.0, "valid_targets_min": 688 }, { "epoch": 6.731502669717773, "grad_norm": 0.5180850457811853, "learning_rate": 1.8002863999298624e-07, "loss": 0.2577, "loss_nan_ranks": 0, "loss_rank_avg": 0.2687952220439911, "step": 8825, "valid_targets_mean": 4047.2, "valid_targets_min": 924 }, { "epoch": 6.7353165522501905, "grad_norm": 0.4893545194267149, "learning_rate": 1.749721939639848e-07, "loss": 0.2642, "loss_nan_ranks": 0, "loss_rank_avg": 0.23527388274669647, "step": 8830, "valid_targets_mean": 4457.8, "valid_targets_min": 1307 }, { "epoch": 6.739130434782608, "grad_norm": 0.5488105797549294, "learning_rate": 1.6998746103490838e-07, "loss": 0.2588, "loss_nan_ranks": 0, "loss_rank_avg": 0.29204466938972473, "step": 8835, "valid_targets_mean": 4550.1, "valid_targets_min": 1258 }, { "epoch": 6.742944317315027, "grad_norm": 0.47929795689362814, "learning_rate": 1.650744592370357e-07, "loss": 0.2612, "loss_nan_ranks": 0, "loss_rank_avg": 0.23622556030750275, "step": 8840, "valid_targets_mean": 4238.9, "valid_targets_min": 1358 }, { "epoch": 6.746758199847445, "grad_norm": 0.48193540879637353, "learning_rate": 1.602332063421752e-07, "loss": 0.2627, "loss_nan_ranks": 0, "loss_rank_avg": 0.2542840540409088, "step": 8845, "valid_targets_mean": 4354.8, "valid_targets_min": 1124 }, { "epoch": 6.750572082379863, "grad_norm": 1.6083685967329227, "learning_rate": 1.5546371986259856e-07, "loss": 0.3409, "loss_nan_ranks": 0, "loss_rank_avg": 0.4540012776851654, "step": 8850, "valid_targets_mean": 798.7, "valid_targets_min": 662 }, { "epoch": 6.754385964912281, "grad_norm": 0.4479560061910448, "learning_rate": 1.5076601705097171e-07, "loss": 0.2949, "loss_nan_ranks": 0, "loss_rank_avg": 0.26199549436569214, "step": 8855, "valid_targets_mean": 4903.4, "valid_targets_min": 1525 }, { "epoch": 6.758199847444699, "grad_norm": 0.5167509652707176, "learning_rate": 1.4614011490030833e-07, "loss": 0.2469, "loss_nan_ranks": 0, "loss_rank_avg": 0.21811072528362274, "step": 8860, "valid_targets_mean": 3528.3, "valid_targets_min": 1120 }, { "epoch": 6.762013729977117, "grad_norm": 0.5466567892986032, "learning_rate": 1.4158603014388317e-07, "loss": 0.254, "loss_nan_ranks": 0, "loss_rank_avg": 0.22469651699066162, "step": 8865, "valid_targets_mean": 3092.0, "valid_targets_min": 1160 }, { "epoch": 6.7658276125095345, "grad_norm": 0.5078871078005721, "learning_rate": 1.3710377925520102e-07, "loss": 0.2683, "loss_nan_ranks": 0, "loss_rank_avg": 0.2852909564971924, "step": 8870, "valid_targets_mean": 4437.4, "valid_targets_min": 1185 }, { "epoch": 6.769641495041952, "grad_norm": 0.4667897106491802, "learning_rate": 1.3269337844790565e-07, "loss": 0.2734, "loss_nan_ranks": 0, "loss_rank_avg": 0.30474594235420227, "step": 8875, "valid_targets_mean": 5781.1, "valid_targets_min": 1382 }, { "epoch": 6.77345537757437, "grad_norm": 0.45330866220580385, "learning_rate": 1.283548436757509e-07, "loss": 0.2428, "loss_nan_ranks": 0, "loss_rank_avg": 0.2104359120130539, "step": 8880, "valid_targets_mean": 5018.0, "valid_targets_min": 1360 }, { "epoch": 6.777269260106789, "grad_norm": 0.47262441892560764, "learning_rate": 1.2408819063252531e-07, "loss": 0.2602, "loss_nan_ranks": 0, "loss_rank_avg": 0.2537544071674347, "step": 8885, "valid_targets_mean": 4318.1, "valid_targets_min": 1018 }, { "epoch": 6.781083142639207, "grad_norm": 0.4688379872758674, "learning_rate": 1.1989343475199422e-07, "loss": 0.2489, "loss_nan_ranks": 0, "loss_rank_avg": 0.2471754550933838, "step": 8890, "valid_targets_mean": 4464.4, "valid_targets_min": 671 }, { "epoch": 6.784897025171625, "grad_norm": 0.46613067717925505, "learning_rate": 1.1577059120785994e-07, "loss": 0.2469, "loss_nan_ranks": 0, "loss_rank_avg": 0.24822942912578583, "step": 8895, "valid_targets_mean": 4436.9, "valid_targets_min": 1155 }, { "epoch": 6.788710907704043, "grad_norm": 0.4246933283721545, "learning_rate": 1.1171967491368396e-07, "loss": 0.2524, "loss_nan_ranks": 0, "loss_rank_avg": 0.2612958252429962, "step": 8900, "valid_targets_mean": 5156.3, "valid_targets_min": 1447 }, { "epoch": 6.7925247902364605, "grad_norm": 0.488048889984009, "learning_rate": 1.0774070052285367e-07, "loss": 0.2376, "loss_nan_ranks": 0, "loss_rank_avg": 0.2610219419002533, "step": 8905, "valid_targets_mean": 4220.4, "valid_targets_min": 834 }, { "epoch": 6.796338672768878, "grad_norm": 0.45744606793079273, "learning_rate": 1.0383368242852021e-07, "loss": 0.2592, "loss_nan_ranks": 0, "loss_rank_avg": 0.2370743304491043, "step": 8910, "valid_targets_mean": 4227.2, "valid_targets_min": 867 }, { "epoch": 6.800152555301297, "grad_norm": 0.44106979768649596, "learning_rate": 9.999863476354289e-08, "loss": 0.2664, "loss_nan_ranks": 0, "loss_rank_avg": 0.2570864260196686, "step": 8915, "valid_targets_mean": 4943.4, "valid_targets_min": 871 }, { "epoch": 6.803966437833715, "grad_norm": 0.4655514026103222, "learning_rate": 9.623557140044481e-08, "loss": 0.2281, "loss_nan_ranks": 0, "loss_rank_avg": 0.2311626523733139, "step": 8920, "valid_targets_mean": 4024.0, "valid_targets_min": 1455 }, { "epoch": 6.807780320366133, "grad_norm": 0.4400894039415246, "learning_rate": 9.254450595136188e-08, "loss": 0.2736, "loss_nan_ranks": 0, "loss_rank_avg": 0.2622435986995697, "step": 8925, "valid_targets_mean": 5075.9, "valid_targets_min": 1286 }, { "epoch": 6.811594202898551, "grad_norm": 0.4603549740303837, "learning_rate": 8.892545176799161e-08, "loss": 0.2593, "loss_nan_ranks": 0, "loss_rank_avg": 0.24099206924438477, "step": 8930, "valid_targets_mean": 4275.4, "valid_targets_min": 1051 }, { "epoch": 6.815408085430969, "grad_norm": 0.45744142908056945, "learning_rate": 8.537842194153767e-08, "loss": 0.2476, "loss_nan_ranks": 0, "loss_rank_avg": 0.27880170941352844, "step": 8935, "valid_targets_mean": 4513.8, "valid_targets_min": 1277 }, { "epoch": 6.8192219679633865, "grad_norm": 0.4933018643513688, "learning_rate": 8.190342930268325e-08, "loss": 0.2478, "loss_nan_ranks": 0, "loss_rank_avg": 0.20053613185882568, "step": 8940, "valid_targets_mean": 3789.4, "valid_targets_min": 1465 }, { "epoch": 6.823035850495804, "grad_norm": 0.4545423866647215, "learning_rate": 7.850048642151775e-08, "loss": 0.2471, "loss_nan_ranks": 0, "loss_rank_avg": 0.23181915283203125, "step": 8945, "valid_targets_mean": 4632.9, "valid_targets_min": 1292 }, { "epoch": 6.826849733028222, "grad_norm": 0.4902945311689018, "learning_rate": 7.516960560751462e-08, "loss": 0.2699, "loss_nan_ranks": 0, "loss_rank_avg": 0.2742360532283783, "step": 8950, "valid_targets_mean": 3948.9, "valid_targets_min": 993 }, { "epoch": 6.830663615560641, "grad_norm": 0.4498076800376056, "learning_rate": 7.19107989094736e-08, "loss": 0.269, "loss_nan_ranks": 0, "loss_rank_avg": 0.26429128646850586, "step": 8955, "valid_targets_mean": 4785.0, "valid_targets_min": 986 }, { "epoch": 6.834477498093059, "grad_norm": 0.4649434981304079, "learning_rate": 6.872407811547855e-08, "loss": 0.2639, "loss_nan_ranks": 0, "loss_rank_avg": 0.24602733552455902, "step": 8960, "valid_targets_mean": 4312.8, "valid_targets_min": 1685 }, { "epoch": 6.838291380625477, "grad_norm": 0.4584733518995103, "learning_rate": 6.560945475285741e-08, "loss": 0.2427, "loss_nan_ranks": 0, "loss_rank_avg": 0.2534709572792053, "step": 8965, "valid_targets_mean": 4685.2, "valid_targets_min": 1185 }, { "epoch": 6.842105263157895, "grad_norm": 0.5254599972627705, "learning_rate": 6.256694008814679e-08, "loss": 0.2653, "loss_nan_ranks": 0, "loss_rank_avg": 0.3134000301361084, "step": 8970, "valid_targets_mean": 4030.5, "valid_targets_min": 1191 }, { "epoch": 6.845919145690313, "grad_norm": 0.4796585637484957, "learning_rate": 5.9596545127036385e-08, "loss": 0.2518, "loss_nan_ranks": 0, "loss_rank_avg": 0.22937195003032684, "step": 8975, "valid_targets_mean": 4679.3, "valid_targets_min": 1334 }, { "epoch": 6.8497330282227304, "grad_norm": 0.5194624420495947, "learning_rate": 5.669828061433791e-08, "loss": 0.2507, "loss_nan_ranks": 0, "loss_rank_avg": 0.2806025445461273, "step": 8980, "valid_targets_mean": 4014.6, "valid_targets_min": 991 }, { "epoch": 6.853546910755149, "grad_norm": 0.4705120799985797, "learning_rate": 5.387215703395177e-08, "loss": 0.273, "loss_nan_ranks": 0, "loss_rank_avg": 0.28963637351989746, "step": 8985, "valid_targets_mean": 5085.6, "valid_targets_min": 1168 }, { "epoch": 6.857360793287567, "grad_norm": 0.5819980638824224, "learning_rate": 5.111818460881379e-08, "loss": 0.2566, "loss_nan_ranks": 0, "loss_rank_avg": 0.26628777384757996, "step": 8990, "valid_targets_mean": 4100.6, "valid_targets_min": 927 }, { "epoch": 6.861174675819985, "grad_norm": 0.4388922287444261, "learning_rate": 4.843637330087525e-08, "loss": 0.2733, "loss_nan_ranks": 0, "loss_rank_avg": 0.28951165080070496, "step": 8995, "valid_targets_mean": 5574.4, "valid_targets_min": 713 }, { "epoch": 6.864988558352403, "grad_norm": 0.5130442634203314, "learning_rate": 4.582673281105621e-08, "loss": 0.2501, "loss_nan_ranks": 0, "loss_rank_avg": 0.22083990275859833, "step": 9000, "valid_targets_mean": 3968.1, "valid_targets_min": 523 }, { "epoch": 6.868802440884821, "grad_norm": 0.519678895479751, "learning_rate": 4.3289272579212226e-08, "loss": 0.2625, "loss_nan_ranks": 0, "loss_rank_avg": 0.2769645154476166, "step": 9005, "valid_targets_mean": 3708.4, "valid_targets_min": 704 }, { "epoch": 6.872616323417239, "grad_norm": 0.48803210237269884, "learning_rate": 4.082400178409884e-08, "loss": 0.2681, "loss_nan_ranks": 0, "loss_rank_avg": 0.24909156560897827, "step": 9010, "valid_targets_mean": 4402.6, "valid_targets_min": 1164 }, { "epoch": 6.8764302059496565, "grad_norm": 1.310490122044137, "learning_rate": 3.843092934334714e-08, "loss": 0.3608, "loss_nan_ranks": 0, "loss_rank_avg": 0.42711055278778076, "step": 9015, "valid_targets_mean": 874.1, "valid_targets_min": 602 }, { "epoch": 6.880244088482074, "grad_norm": 0.5194420306200203, "learning_rate": 3.6110063913419314e-08, "loss": 0.3023, "loss_nan_ranks": 0, "loss_rank_avg": 0.270808607339859, "step": 9020, "valid_targets_mean": 3739.3, "valid_targets_min": 886 }, { "epoch": 6.884057971014493, "grad_norm": 0.4523455589120904, "learning_rate": 3.386141388958652e-08, "loss": 0.2474, "loss_nan_ranks": 0, "loss_rank_avg": 0.24892598390579224, "step": 9025, "valid_targets_mean": 4797.2, "valid_targets_min": 858 }, { "epoch": 6.887871853546911, "grad_norm": 0.48287864804733494, "learning_rate": 3.1684987405891096e-08, "loss": 0.2617, "loss_nan_ranks": 0, "loss_rank_avg": 0.28461983799934387, "step": 9030, "valid_targets_mean": 4661.2, "valid_targets_min": 844 }, { "epoch": 6.891685736079329, "grad_norm": 0.4721016692882381, "learning_rate": 2.9580792335126562e-08, "loss": 0.2596, "loss_nan_ranks": 0, "loss_rank_avg": 0.28126761317253113, "step": 9035, "valid_targets_mean": 5096.3, "valid_targets_min": 1602 }, { "epoch": 6.895499618611747, "grad_norm": 0.4841861982217126, "learning_rate": 2.7548836288797675e-08, "loss": 0.2656, "loss_nan_ranks": 0, "loss_rank_avg": 0.28836727142333984, "step": 9040, "valid_targets_mean": 4471.4, "valid_targets_min": 473 }, { "epoch": 6.899313501144165, "grad_norm": 0.682082195562495, "learning_rate": 2.5589126617102666e-08, "loss": 0.2515, "loss_nan_ranks": 0, "loss_rank_avg": 0.2549896538257599, "step": 9045, "valid_targets_mean": 3695.0, "valid_targets_min": 1341 }, { "epoch": 6.9031273836765825, "grad_norm": 0.4430357315125749, "learning_rate": 2.3701670408904365e-08, "loss": 0.262, "loss_nan_ranks": 0, "loss_rank_avg": 0.2781337797641754, "step": 9050, "valid_targets_mean": 5056.7, "valid_targets_min": 1742 }, { "epoch": 6.906941266209, "grad_norm": 0.4961634791637363, "learning_rate": 2.1886474491699116e-08, "loss": 0.2673, "loss_nan_ranks": 0, "loss_rank_avg": 0.2650142014026642, "step": 9055, "valid_targets_mean": 4381.1, "valid_targets_min": 1526 }, { "epoch": 6.910755148741419, "grad_norm": 0.4766223024157269, "learning_rate": 2.014354543159458e-08, "loss": 0.2597, "loss_nan_ranks": 0, "loss_rank_avg": 0.24406524002552032, "step": 9060, "valid_targets_mean": 4142.5, "valid_targets_min": 380 }, { "epoch": 6.914569031273837, "grad_norm": 0.5041571799311416, "learning_rate": 1.847288953329418e-08, "loss": 0.2621, "loss_nan_ranks": 0, "loss_rank_avg": 0.2359909564256668, "step": 9065, "valid_targets_mean": 4001.7, "valid_targets_min": 1419 }, { "epoch": 6.918382913806255, "grad_norm": 0.4689832398936382, "learning_rate": 1.6874512840063806e-08, "loss": 0.2603, "loss_nan_ranks": 0, "loss_rank_avg": 0.23846976459026337, "step": 9070, "valid_targets_mean": 4615.5, "valid_targets_min": 1134 }, { "epoch": 6.922196796338673, "grad_norm": 0.4215746760654066, "learning_rate": 1.5348421133711822e-08, "loss": 0.2671, "loss_nan_ranks": 0, "loss_rank_avg": 0.2647766172885895, "step": 9075, "valid_targets_mean": 5416.6, "valid_targets_min": 1373 }, { "epoch": 6.926010678871091, "grad_norm": 0.47434945452469185, "learning_rate": 1.3894619934571307e-08, "loss": 0.2695, "loss_nan_ranks": 0, "loss_rank_avg": 0.2696935534477234, "step": 9080, "valid_targets_mean": 4957.5, "valid_targets_min": 1516 }, { "epoch": 6.9298245614035086, "grad_norm": 0.5140704574961166, "learning_rate": 1.2513114501482294e-08, "loss": 0.263, "loss_nan_ranks": 0, "loss_rank_avg": 0.29723748564720154, "step": 9085, "valid_targets_mean": 4311.6, "valid_targets_min": 1513 }, { "epoch": 6.933638443935926, "grad_norm": 0.44704021411153305, "learning_rate": 1.1203909831762893e-08, "loss": 0.2594, "loss_nan_ranks": 0, "loss_rank_avg": 0.2530190050601959, "step": 9090, "valid_targets_mean": 4857.2, "valid_targets_min": 447 }, { "epoch": 6.937452326468344, "grad_norm": 0.4606405386761923, "learning_rate": 9.967010661204868e-09, "loss": 0.2612, "loss_nan_ranks": 0, "loss_rank_avg": 0.2141771763563156, "step": 9095, "valid_targets_mean": 4249.3, "valid_targets_min": 1203 }, { "epoch": 6.941266209000763, "grad_norm": 0.4346601417829936, "learning_rate": 8.802421464040312e-09, "loss": 0.2655, "loss_nan_ranks": 0, "loss_rank_avg": 0.2532062828540802, "step": 9100, "valid_targets_mean": 5482.1, "valid_targets_min": 1125 }, { "epoch": 6.945080091533181, "grad_norm": 0.5138564719167915, "learning_rate": 7.710146452941658e-09, "loss": 0.2668, "loss_nan_ranks": 0, "loss_rank_avg": 0.25881847739219666, "step": 9105, "valid_targets_mean": 4072.5, "valid_targets_min": 1354 }, { "epoch": 6.948893974065599, "grad_norm": 0.5443768694531692, "learning_rate": 6.690189578999473e-09, "loss": 0.2496, "loss_nan_ranks": 0, "loss_rank_avg": 0.22537367045879364, "step": 9110, "valid_targets_mean": 3369.6, "valid_targets_min": 827 }, { "epoch": 6.952707856598017, "grad_norm": 0.5109364822190952, "learning_rate": 5.742554531700251e-09, "loss": 0.2482, "loss_nan_ranks": 0, "loss_rank_avg": 0.23135484755039215, "step": 9115, "valid_targets_mean": 3833.6, "valid_targets_min": 883 }, { "epoch": 6.956521739130435, "grad_norm": 0.46466195137513505, "learning_rate": 4.8672447389286335e-09, "loss": 0.2503, "loss_nan_ranks": 0, "loss_rank_avg": 0.24387897551059723, "step": 9120, "valid_targets_mean": 4876.5, "valid_targets_min": 1284 }, { "epoch": 6.9603356216628525, "grad_norm": 0.5300251711812586, "learning_rate": 4.064263366942989e-09, "loss": 0.2578, "loss_nan_ranks": 0, "loss_rank_avg": 0.2824271023273468, "step": 9125, "valid_targets_mean": 4544.0, "valid_targets_min": 1082 }, { "epoch": 6.964149504195271, "grad_norm": 0.4806841321702372, "learning_rate": 3.333613320368745e-09, "loss": 0.2548, "loss_nan_ranks": 0, "loss_rank_avg": 0.22269928455352783, "step": 9130, "valid_targets_mean": 4612.7, "valid_targets_min": 1333 }, { "epoch": 6.967963386727689, "grad_norm": 0.5416974736321651, "learning_rate": 2.6752972421895117e-09, "loss": 0.2598, "loss_nan_ranks": 0, "loss_rank_avg": 0.2618859112262726, "step": 9135, "valid_targets_mean": 3495.5, "valid_targets_min": 620 }, { "epoch": 6.971777269260107, "grad_norm": 0.459511556904324, "learning_rate": 2.0893175137293163e-09, "loss": 0.2672, "loss_nan_ranks": 0, "loss_rank_avg": 0.2535509169101715, "step": 9140, "valid_targets_mean": 4382.7, "valid_targets_min": 505 }, { "epoch": 6.975591151792525, "grad_norm": 0.48437983570830595, "learning_rate": 1.5756762546570437e-09, "loss": 0.261, "loss_nan_ranks": 0, "loss_rank_avg": 0.2759089469909668, "step": 9145, "valid_targets_mean": 3919.9, "valid_targets_min": 1075 }, { "epoch": 6.979405034324943, "grad_norm": 0.49415357039663277, "learning_rate": 1.1343753229642317e-09, "loss": 0.2602, "loss_nan_ranks": 0, "loss_rank_avg": 0.23885183036327362, "step": 9150, "valid_targets_mean": 3753.2, "valid_targets_min": 753 }, { "epoch": 6.983218916857361, "grad_norm": 0.5461652605442551, "learning_rate": 7.654163149717342e-10, "loss": 0.2656, "loss_nan_ranks": 0, "loss_rank_avg": 0.2608436048030853, "step": 9155, "valid_targets_mean": 3563.1, "valid_targets_min": 521 }, { "epoch": 6.9870327993897785, "grad_norm": 0.545724031102777, "learning_rate": 4.688005653163963e-10, "loss": 0.2625, "loss_nan_ranks": 0, "loss_rank_avg": 0.27841898798942566, "step": 9160, "valid_targets_mean": 4363.7, "valid_targets_min": 447 }, { "epoch": 6.990846681922196, "grad_norm": 0.4705636484040312, "learning_rate": 2.44529146942174e-10, "loss": 0.2575, "loss_nan_ranks": 0, "loss_rank_avg": 0.2812120020389557, "step": 9165, "valid_targets_mean": 4790.8, "valid_targets_min": 915 }, { "epoch": 6.994660564454615, "grad_norm": 0.5291991743545336, "learning_rate": 9.260287111123589e-11, "loss": 0.2546, "loss_nan_ranks": 0, "loss_rank_avg": 0.2218012809753418, "step": 9170, "valid_targets_mean": 3817.0, "valid_targets_min": 1202 }, { "epoch": 6.998474446987033, "grad_norm": 1.5469628469507675, "learning_rate": 1.3022287386199594e-11, "loss": 0.372, "loss_nan_ranks": 0, "loss_rank_avg": 0.4602835476398468, "step": 9175, "valid_targets_mean": 780.0, "valid_targets_min": 493 }, { "epoch": 7.0, "loss_nan_ranks": 0, "loss_rank_avg": 0.4288143217563629, "step": 9177, "total_flos": 4631781651513344.0, "train_loss": 0.31498055520031176, "train_runtime": 65837.0719, "train_samples_per_second": 3.345, "train_steps_per_second": 0.139, "valid_targets_mean": 858.8, "valid_targets_min": 497 } ], "logging_steps": 5, "max_steps": 9177, "num_input_tokens_seen": 0, "num_train_epochs": 7, "save_steps": 1500, "stateful_callbacks": { "TrainerControl": { "args": { "should_epoch_stop": false, "should_evaluate": false, "should_log": false, "should_save": true, "should_training_stop": true }, "attributes": {} } }, "total_flos": 4631781651513344.0, "train_batch_size": 1, "trial_name": null, "trial_params": null }