{ "best_global_step": null, "best_metric": null, "best_model_checkpoint": null, "epoch": 7.0, "eval_steps": 500, "global_step": 4382, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.007987220447284345, "grad_norm": 15.17248931781073, "learning_rate": 3.644646924829157e-07, "loss": 0.9519, "loss_nan_ranks": 0, "loss_rank_avg": 0.873810887336731, "step": 5, "valid_targets_mean": 3127.7, "valid_targets_min": 927 }, { "epoch": 0.01597444089456869, "grad_norm": 16.0447046422443, "learning_rate": 8.200455580865605e-07, "loss": 0.9762, "loss_nan_ranks": 0, "loss_rank_avg": 1.0120545625686646, "step": 10, "valid_targets_mean": 2819.0, "valid_targets_min": 1221 }, { "epoch": 0.023961661341853034, "grad_norm": 15.982841317309331, "learning_rate": 1.2756264236902052e-06, "loss": 0.9655, "loss_nan_ranks": 0, "loss_rank_avg": 0.9404536485671997, "step": 15, "valid_targets_mean": 2939.2, "valid_targets_min": 1003 }, { "epoch": 0.03194888178913738, "grad_norm": 16.68150841790565, "learning_rate": 1.7312072892938498e-06, "loss": 0.9297, "loss_nan_ranks": 0, "loss_rank_avg": 1.0098234415054321, "step": 20, "valid_targets_mean": 2228.9, "valid_targets_min": 1122 }, { "epoch": 0.039936102236421724, "grad_norm": 7.699726336060192, "learning_rate": 2.1867881548974945e-06, "loss": 0.883, "loss_nan_ranks": 0, "loss_rank_avg": 0.8025753498077393, "step": 25, "valid_targets_mean": 3127.9, "valid_targets_min": 978 }, { "epoch": 0.04792332268370607, "grad_norm": 5.236211849772423, "learning_rate": 2.642369020501139e-06, "loss": 0.825, "loss_nan_ranks": 0, "loss_rank_avg": 0.7962996959686279, "step": 30, "valid_targets_mean": 2854.4, "valid_targets_min": 1089 }, { "epoch": 0.05591054313099041, "grad_norm": 3.7746117759364175, "learning_rate": 3.0979498861047843e-06, "loss": 0.7731, "loss_nan_ranks": 0, "loss_rank_avg": 0.7613115310668945, "step": 35, "valid_targets_mean": 2395.0, "valid_targets_min": 1120 }, { "epoch": 0.06389776357827476, "grad_norm": 2.169032644755572, "learning_rate": 3.5535307517084285e-06, "loss": 0.7068, "loss_nan_ranks": 0, "loss_rank_avg": 0.7297231554985046, "step": 40, "valid_targets_mean": 2835.4, "valid_targets_min": 1046 }, { "epoch": 0.07188498402555911, "grad_norm": 1.8529712575405926, "learning_rate": 4.009111617312073e-06, "loss": 0.7178, "loss_nan_ranks": 0, "loss_rank_avg": 0.7068992853164673, "step": 45, "valid_targets_mean": 2749.2, "valid_targets_min": 1262 }, { "epoch": 0.07987220447284345, "grad_norm": 1.74129413182321, "learning_rate": 4.464692482915718e-06, "loss": 0.7158, "loss_nan_ranks": 0, "loss_rank_avg": 0.7441062927246094, "step": 50, "valid_targets_mean": 2308.6, "valid_targets_min": 895 }, { "epoch": 0.0878594249201278, "grad_norm": 1.1261969765312332, "learning_rate": 4.920273348519363e-06, "loss": 0.6573, "loss_nan_ranks": 0, "loss_rank_avg": 0.6407957673072815, "step": 55, "valid_targets_mean": 2901.4, "valid_targets_min": 1280 }, { "epoch": 0.09584664536741214, "grad_norm": 1.189556858462003, "learning_rate": 5.375854214123008e-06, "loss": 0.682, "loss_nan_ranks": 0, "loss_rank_avg": 0.6844934821128845, "step": 60, "valid_targets_mean": 2235.0, "valid_targets_min": 1097 }, { "epoch": 0.10383386581469649, "grad_norm": 1.0707090957182381, "learning_rate": 5.831435079726651e-06, "loss": 0.6523, "loss_nan_ranks": 0, "loss_rank_avg": 0.6878713965415955, "step": 65, "valid_targets_mean": 2627.6, "valid_targets_min": 1230 }, { "epoch": 0.11182108626198083, "grad_norm": 1.0142874088661866, "learning_rate": 6.287015945330297e-06, "loss": 0.6362, "loss_nan_ranks": 0, "loss_rank_avg": 0.6870459914207458, "step": 70, "valid_targets_mean": 2840.0, "valid_targets_min": 1380 }, { "epoch": 0.11980830670926518, "grad_norm": 0.8175505785622187, "learning_rate": 6.742596810933942e-06, "loss": 0.643, "loss_nan_ranks": 0, "loss_rank_avg": 0.6377227306365967, "step": 75, "valid_targets_mean": 3428.4, "valid_targets_min": 1015 }, { "epoch": 0.12779552715654952, "grad_norm": 0.9047440311266008, "learning_rate": 7.1981776765375854e-06, "loss": 0.6375, "loss_nan_ranks": 0, "loss_rank_avg": 0.5993684530258179, "step": 80, "valid_targets_mean": 2613.2, "valid_targets_min": 855 }, { "epoch": 0.13578274760383385, "grad_norm": 0.8299903165340285, "learning_rate": 7.65375854214123e-06, "loss": 0.6111, "loss_nan_ranks": 0, "loss_rank_avg": 0.5948533415794373, "step": 85, "valid_targets_mean": 2690.9, "valid_targets_min": 1286 }, { "epoch": 0.14376996805111822, "grad_norm": 0.9198314766136052, "learning_rate": 8.109339407744875e-06, "loss": 0.6151, "loss_nan_ranks": 0, "loss_rank_avg": 0.5966804027557373, "step": 90, "valid_targets_mean": 2349.4, "valid_targets_min": 1028 }, { "epoch": 0.15175718849840256, "grad_norm": 0.7995206251913056, "learning_rate": 8.564920273348521e-06, "loss": 0.5595, "loss_nan_ranks": 0, "loss_rank_avg": 0.47535890340805054, "step": 95, "valid_targets_mean": 2481.7, "valid_targets_min": 1112 }, { "epoch": 0.1597444089456869, "grad_norm": 0.8508182370502543, "learning_rate": 9.020501138952164e-06, "loss": 0.5852, "loss_nan_ranks": 0, "loss_rank_avg": 0.6482516527175903, "step": 100, "valid_targets_mean": 2932.8, "valid_targets_min": 1364 }, { "epoch": 0.16773162939297126, "grad_norm": 0.8203564655537686, "learning_rate": 9.47608200455581e-06, "loss": 0.548, "loss_nan_ranks": 0, "loss_rank_avg": 0.5478312969207764, "step": 105, "valid_targets_mean": 2946.6, "valid_targets_min": 931 }, { "epoch": 0.1757188498402556, "grad_norm": 0.7569799752444644, "learning_rate": 9.931662870159453e-06, "loss": 0.5804, "loss_nan_ranks": 0, "loss_rank_avg": 0.5435867309570312, "step": 110, "valid_targets_mean": 3103.2, "valid_targets_min": 1609 }, { "epoch": 0.18370607028753994, "grad_norm": 0.8900695073471566, "learning_rate": 1.03872437357631e-05, "loss": 0.5534, "loss_nan_ranks": 0, "loss_rank_avg": 0.5765122175216675, "step": 115, "valid_targets_mean": 3199.2, "valid_targets_min": 701 }, { "epoch": 0.19169329073482427, "grad_norm": 0.8583125214810088, "learning_rate": 1.0842824601366744e-05, "loss": 0.5527, "loss_nan_ranks": 0, "loss_rank_avg": 0.537767767906189, "step": 120, "valid_targets_mean": 2467.8, "valid_targets_min": 1100 }, { "epoch": 0.19968051118210864, "grad_norm": 0.7006043396902825, "learning_rate": 1.1298405466970387e-05, "loss": 0.5509, "loss_nan_ranks": 0, "loss_rank_avg": 0.5513736605644226, "step": 125, "valid_targets_mean": 3579.0, "valid_targets_min": 1342 }, { "epoch": 0.20766773162939298, "grad_norm": 0.766820394134251, "learning_rate": 1.1753986332574032e-05, "loss": 0.5702, "loss_nan_ranks": 0, "loss_rank_avg": 0.5789293050765991, "step": 130, "valid_targets_mean": 2847.6, "valid_targets_min": 1180 }, { "epoch": 0.21565495207667731, "grad_norm": 1.5002638242695263, "learning_rate": 1.2209567198177677e-05, "loss": 0.5899, "loss_nan_ranks": 0, "loss_rank_avg": 0.6096343398094177, "step": 135, "valid_targets_mean": 2303.8, "valid_targets_min": 866 }, { "epoch": 0.22364217252396165, "grad_norm": 0.7423434999018708, "learning_rate": 1.2665148063781323e-05, "loss": 0.5697, "loss_nan_ranks": 0, "loss_rank_avg": 0.5750610828399658, "step": 140, "valid_targets_mean": 3315.2, "valid_targets_min": 1237 }, { "epoch": 0.23162939297124602, "grad_norm": 0.8496784328818882, "learning_rate": 1.3120728929384968e-05, "loss": 0.5676, "loss_nan_ranks": 0, "loss_rank_avg": 0.5569379329681396, "step": 145, "valid_targets_mean": 2489.4, "valid_targets_min": 1083 }, { "epoch": 0.23961661341853036, "grad_norm": 0.7627769903145462, "learning_rate": 1.357630979498861e-05, "loss": 0.5495, "loss_nan_ranks": 0, "loss_rank_avg": 0.5773597955703735, "step": 150, "valid_targets_mean": 3161.5, "valid_targets_min": 1192 }, { "epoch": 0.2476038338658147, "grad_norm": 0.8821586946530701, "learning_rate": 1.4031890660592255e-05, "loss": 0.5394, "loss_nan_ranks": 0, "loss_rank_avg": 0.5083107948303223, "step": 155, "valid_targets_mean": 2946.1, "valid_targets_min": 787 }, { "epoch": 0.25559105431309903, "grad_norm": 0.909958221284572, "learning_rate": 1.4487471526195902e-05, "loss": 0.5419, "loss_nan_ranks": 0, "loss_rank_avg": 0.5862777233123779, "step": 160, "valid_targets_mean": 2436.4, "valid_targets_min": 1083 }, { "epoch": 0.26357827476038337, "grad_norm": 0.854377313552898, "learning_rate": 1.4943052391799546e-05, "loss": 0.5346, "loss_nan_ranks": 0, "loss_rank_avg": 0.5437299609184265, "step": 165, "valid_targets_mean": 2534.8, "valid_targets_min": 810 }, { "epoch": 0.2715654952076677, "grad_norm": 0.9103282941916306, "learning_rate": 1.539863325740319e-05, "loss": 0.5074, "loss_nan_ranks": 0, "loss_rank_avg": 0.4946935474872589, "step": 170, "valid_targets_mean": 2139.8, "valid_targets_min": 1156 }, { "epoch": 0.2795527156549521, "grad_norm": 0.88133799748646, "learning_rate": 1.5854214123006836e-05, "loss": 0.5215, "loss_nan_ranks": 0, "loss_rank_avg": 0.5952520370483398, "step": 175, "valid_targets_mean": 2498.9, "valid_targets_min": 957 }, { "epoch": 0.28753993610223644, "grad_norm": 0.6850615122575533, "learning_rate": 1.630979498861048e-05, "loss": 0.5123, "loss_nan_ranks": 0, "loss_rank_avg": 0.4720776677131653, "step": 180, "valid_targets_mean": 3554.1, "valid_targets_min": 1052 }, { "epoch": 0.2955271565495208, "grad_norm": 0.8550204357494533, "learning_rate": 1.6765375854214125e-05, "loss": 0.5473, "loss_nan_ranks": 0, "loss_rank_avg": 0.5485037565231323, "step": 185, "valid_targets_mean": 2786.8, "valid_targets_min": 948 }, { "epoch": 0.3035143769968051, "grad_norm": 0.8206472164048848, "learning_rate": 1.722095671981777e-05, "loss": 0.5584, "loss_nan_ranks": 0, "loss_rank_avg": 0.5042972564697266, "step": 190, "valid_targets_mean": 2728.0, "valid_targets_min": 712 }, { "epoch": 0.31150159744408945, "grad_norm": 0.6728094856065869, "learning_rate": 1.7676537585421415e-05, "loss": 0.5269, "loss_nan_ranks": 0, "loss_rank_avg": 0.5326317548751831, "step": 195, "valid_targets_mean": 3720.7, "valid_targets_min": 1523 }, { "epoch": 0.3194888178913738, "grad_norm": 0.7728618092725199, "learning_rate": 1.813211845102506e-05, "loss": 0.5197, "loss_nan_ranks": 0, "loss_rank_avg": 0.4793850779533386, "step": 200, "valid_targets_mean": 2741.7, "valid_targets_min": 861 }, { "epoch": 0.3274760383386581, "grad_norm": 0.7801842035185508, "learning_rate": 1.8587699316628704e-05, "loss": 0.518, "loss_nan_ranks": 0, "loss_rank_avg": 0.5253409147262573, "step": 205, "valid_targets_mean": 2814.8, "valid_targets_min": 861 }, { "epoch": 0.3354632587859425, "grad_norm": 0.9863154154066794, "learning_rate": 1.904328018223235e-05, "loss": 0.5542, "loss_nan_ranks": 0, "loss_rank_avg": 0.6215020418167114, "step": 210, "valid_targets_mean": 2646.8, "valid_targets_min": 955 }, { "epoch": 0.34345047923322686, "grad_norm": 0.7331588617100306, "learning_rate": 1.9498861047835993e-05, "loss": 0.5255, "loss_nan_ranks": 0, "loss_rank_avg": 0.4908156096935272, "step": 215, "valid_targets_mean": 3356.9, "valid_targets_min": 1352 }, { "epoch": 0.3514376996805112, "grad_norm": 0.8791842141556658, "learning_rate": 1.9954441913439638e-05, "loss": 0.5239, "loss_nan_ranks": 0, "loss_rank_avg": 0.5295369625091553, "step": 220, "valid_targets_mean": 2351.9, "valid_targets_min": 1185 }, { "epoch": 0.35942492012779553, "grad_norm": 0.7787307287825401, "learning_rate": 2.0410022779043283e-05, "loss": 0.4988, "loss_nan_ranks": 0, "loss_rank_avg": 0.48588457703590393, "step": 225, "valid_targets_mean": 2535.1, "valid_targets_min": 1259 }, { "epoch": 0.36741214057507987, "grad_norm": 0.8556036439676711, "learning_rate": 2.0865603644646927e-05, "loss": 0.5863, "loss_nan_ranks": 0, "loss_rank_avg": 0.6629254817962646, "step": 230, "valid_targets_mean": 2723.0, "valid_targets_min": 1005 }, { "epoch": 0.3753993610223642, "grad_norm": 0.8057536275212785, "learning_rate": 2.1321184510250572e-05, "loss": 0.5399, "loss_nan_ranks": 0, "loss_rank_avg": 0.6240401864051819, "step": 235, "valid_targets_mean": 2943.8, "valid_targets_min": 1330 }, { "epoch": 0.38338658146964855, "grad_norm": 0.9850495934806481, "learning_rate": 2.1776765375854217e-05, "loss": 0.5133, "loss_nan_ranks": 0, "loss_rank_avg": 0.49222493171691895, "step": 240, "valid_targets_mean": 1964.6, "valid_targets_min": 946 }, { "epoch": 0.3913738019169329, "grad_norm": 0.8186455781999009, "learning_rate": 2.223234624145786e-05, "loss": 0.5153, "loss_nan_ranks": 0, "loss_rank_avg": 0.5153531432151794, "step": 245, "valid_targets_mean": 2717.8, "valid_targets_min": 1133 }, { "epoch": 0.3993610223642173, "grad_norm": 1.9660992396620858, "learning_rate": 2.2687927107061506e-05, "loss": 0.5278, "loss_nan_ranks": 0, "loss_rank_avg": 0.5080440044403076, "step": 250, "valid_targets_mean": 3080.2, "valid_targets_min": 1306 }, { "epoch": 0.4073482428115016, "grad_norm": 0.6777855096046905, "learning_rate": 2.314350797266515e-05, "loss": 0.5092, "loss_nan_ranks": 0, "loss_rank_avg": 0.45302075147628784, "step": 255, "valid_targets_mean": 3767.1, "valid_targets_min": 1306 }, { "epoch": 0.41533546325878595, "grad_norm": 0.8427065918822899, "learning_rate": 2.3599088838268792e-05, "loss": 0.4911, "loss_nan_ranks": 0, "loss_rank_avg": 0.5029305219650269, "step": 260, "valid_targets_mean": 2818.7, "valid_targets_min": 1464 }, { "epoch": 0.4233226837060703, "grad_norm": 0.7968222858710973, "learning_rate": 2.4054669703872436e-05, "loss": 0.5159, "loss_nan_ranks": 0, "loss_rank_avg": 0.5117211937904358, "step": 265, "valid_targets_mean": 2781.1, "valid_targets_min": 1213 }, { "epoch": 0.43130990415335463, "grad_norm": 0.8271573611997252, "learning_rate": 2.4510250569476085e-05, "loss": 0.5422, "loss_nan_ranks": 0, "loss_rank_avg": 0.4576948583126068, "step": 270, "valid_targets_mean": 2558.8, "valid_targets_min": 1229 }, { "epoch": 0.43929712460063897, "grad_norm": 0.7901461972408579, "learning_rate": 2.496583143507973e-05, "loss": 0.4954, "loss_nan_ranks": 0, "loss_rank_avg": 0.49033161997795105, "step": 275, "valid_targets_mean": 3283.5, "valid_targets_min": 871 }, { "epoch": 0.4472843450479233, "grad_norm": 0.8814296735699261, "learning_rate": 2.5421412300683374e-05, "loss": 0.4931, "loss_nan_ranks": 0, "loss_rank_avg": 0.5419114828109741, "step": 280, "valid_targets_mean": 2600.2, "valid_targets_min": 497 }, { "epoch": 0.45527156549520764, "grad_norm": 0.8843077229773383, "learning_rate": 2.587699316628702e-05, "loss": 0.4964, "loss_nan_ranks": 0, "loss_rank_avg": 0.5407685041427612, "step": 285, "valid_targets_mean": 2370.4, "valid_targets_min": 901 }, { "epoch": 0.46325878594249204, "grad_norm": 1.0771357872311227, "learning_rate": 2.6332574031890663e-05, "loss": 0.5295, "loss_nan_ranks": 0, "loss_rank_avg": 0.6103911995887756, "step": 290, "valid_targets_mean": 2440.1, "valid_targets_min": 1380 }, { "epoch": 0.4712460063897764, "grad_norm": 0.7179319622664404, "learning_rate": 2.6788154897494308e-05, "loss": 0.4741, "loss_nan_ranks": 0, "loss_rank_avg": 0.4417612552642822, "step": 295, "valid_targets_mean": 3418.1, "valid_targets_min": 1392 }, { "epoch": 0.4792332268370607, "grad_norm": 0.714979713777273, "learning_rate": 2.7243735763097953e-05, "loss": 0.5061, "loss_nan_ranks": 0, "loss_rank_avg": 0.44420793652534485, "step": 300, "valid_targets_mean": 3550.5, "valid_targets_min": 1539 }, { "epoch": 0.48722044728434505, "grad_norm": 0.832676511155696, "learning_rate": 2.7699316628701597e-05, "loss": 0.49, "loss_nan_ranks": 0, "loss_rank_avg": 0.5182697772979736, "step": 305, "valid_targets_mean": 2901.4, "valid_targets_min": 1270 }, { "epoch": 0.4952076677316294, "grad_norm": 1.2011451937543158, "learning_rate": 2.815489749430524e-05, "loss": 0.5109, "loss_nan_ranks": 0, "loss_rank_avg": 0.5339452624320984, "step": 310, "valid_targets_mean": 3127.3, "valid_targets_min": 1080 }, { "epoch": 0.5031948881789138, "grad_norm": 1.1011304858781235, "learning_rate": 2.8610478359908883e-05, "loss": 0.489, "loss_nan_ranks": 0, "loss_rank_avg": 0.4957484304904938, "step": 315, "valid_targets_mean": 2123.2, "valid_targets_min": 960 }, { "epoch": 0.5111821086261981, "grad_norm": 0.7518434901268846, "learning_rate": 2.906605922551253e-05, "loss": 0.4972, "loss_nan_ranks": 0, "loss_rank_avg": 0.5477015972137451, "step": 320, "valid_targets_mean": 3466.9, "valid_targets_min": 1186 }, { "epoch": 0.5191693290734825, "grad_norm": 0.818548220458573, "learning_rate": 2.9521640091116176e-05, "loss": 0.5047, "loss_nan_ranks": 0, "loss_rank_avg": 0.4946255087852478, "step": 325, "valid_targets_mean": 2968.8, "valid_targets_min": 873 }, { "epoch": 0.5271565495207667, "grad_norm": 0.9354909961997221, "learning_rate": 2.997722095671982e-05, "loss": 0.4983, "loss_nan_ranks": 0, "loss_rank_avg": 0.5147006511688232, "step": 330, "valid_targets_mean": 2093.4, "valid_targets_min": 811 }, { "epoch": 0.5351437699680511, "grad_norm": 0.8861773466418632, "learning_rate": 3.0432801822323465e-05, "loss": 0.5012, "loss_nan_ranks": 0, "loss_rank_avg": 0.5008596777915955, "step": 335, "valid_targets_mean": 3097.7, "valid_targets_min": 921 }, { "epoch": 0.5431309904153354, "grad_norm": 0.7688169713732055, "learning_rate": 3.088838268792711e-05, "loss": 0.5055, "loss_nan_ranks": 0, "loss_rank_avg": 0.496390700340271, "step": 340, "valid_targets_mean": 3200.6, "valid_targets_min": 1282 }, { "epoch": 0.5511182108626198, "grad_norm": 0.8113792447780495, "learning_rate": 3.1343963553530755e-05, "loss": 0.5209, "loss_nan_ranks": 0, "loss_rank_avg": 0.5141535997390747, "step": 345, "valid_targets_mean": 2751.6, "valid_targets_min": 1031 }, { "epoch": 0.5591054313099042, "grad_norm": 2.1321863058940393, "learning_rate": 3.17995444191344e-05, "loss": 0.4779, "loss_nan_ranks": 0, "loss_rank_avg": 0.5301027297973633, "step": 350, "valid_targets_mean": 2933.4, "valid_targets_min": 1160 }, { "epoch": 0.5670926517571885, "grad_norm": 0.6806494335642181, "learning_rate": 3.2255125284738044e-05, "loss": 0.4775, "loss_nan_ranks": 0, "loss_rank_avg": 0.506610095500946, "step": 355, "valid_targets_mean": 3795.7, "valid_targets_min": 1294 }, { "epoch": 0.5750798722044729, "grad_norm": 0.8467603882079074, "learning_rate": 3.271070615034169e-05, "loss": 0.4982, "loss_nan_ranks": 0, "loss_rank_avg": 0.4562826156616211, "step": 360, "valid_targets_mean": 2606.6, "valid_targets_min": 981 }, { "epoch": 0.5830670926517572, "grad_norm": 0.8022847528326496, "learning_rate": 3.316628701594533e-05, "loss": 0.5121, "loss_nan_ranks": 0, "loss_rank_avg": 0.531557559967041, "step": 365, "valid_targets_mean": 2998.2, "valid_targets_min": 1473 }, { "epoch": 0.5910543130990416, "grad_norm": 0.8556604547740909, "learning_rate": 3.362186788154898e-05, "loss": 0.4987, "loss_nan_ranks": 0, "loss_rank_avg": 0.5079728364944458, "step": 370, "valid_targets_mean": 2428.6, "valid_targets_min": 892 }, { "epoch": 0.5990415335463258, "grad_norm": 0.7394590411511266, "learning_rate": 3.407744874715262e-05, "loss": 0.4861, "loss_nan_ranks": 0, "loss_rank_avg": 0.4963635206222534, "step": 375, "valid_targets_mean": 3267.9, "valid_targets_min": 1407 }, { "epoch": 0.6070287539936102, "grad_norm": 0.6521727148571741, "learning_rate": 3.453302961275627e-05, "loss": 0.5189, "loss_nan_ranks": 0, "loss_rank_avg": 0.48329901695251465, "step": 380, "valid_targets_mean": 3911.4, "valid_targets_min": 849 }, { "epoch": 0.6150159744408946, "grad_norm": 0.8229679295931809, "learning_rate": 3.498861047835991e-05, "loss": 0.4934, "loss_nan_ranks": 0, "loss_rank_avg": 0.4811190366744995, "step": 385, "valid_targets_mean": 2285.9, "valid_targets_min": 826 }, { "epoch": 0.6230031948881789, "grad_norm": 0.9071810840956518, "learning_rate": 3.5444191343963557e-05, "loss": 0.4721, "loss_nan_ranks": 0, "loss_rank_avg": 0.4603239893913269, "step": 390, "valid_targets_mean": 2446.5, "valid_targets_min": 1318 }, { "epoch": 0.6309904153354633, "grad_norm": 0.8673398873329051, "learning_rate": 3.58997722095672e-05, "loss": 0.4829, "loss_nan_ranks": 0, "loss_rank_avg": 0.5173234939575195, "step": 395, "valid_targets_mean": 2453.8, "valid_targets_min": 969 }, { "epoch": 0.6389776357827476, "grad_norm": 0.7684733433083464, "learning_rate": 3.6355353075170846e-05, "loss": 0.5033, "loss_nan_ranks": 0, "loss_rank_avg": 0.5281765460968018, "step": 400, "valid_targets_mean": 2919.4, "valid_targets_min": 920 }, { "epoch": 0.646964856230032, "grad_norm": 0.8185705410175095, "learning_rate": 3.681093394077449e-05, "loss": 0.4779, "loss_nan_ranks": 0, "loss_rank_avg": 0.4623745083808899, "step": 405, "valid_targets_mean": 2701.0, "valid_targets_min": 1169 }, { "epoch": 0.6549520766773163, "grad_norm": 0.7773039011766039, "learning_rate": 3.7266514806378135e-05, "loss": 0.46, "loss_nan_ranks": 0, "loss_rank_avg": 0.486310213804245, "step": 410, "valid_targets_mean": 2514.9, "valid_targets_min": 970 }, { "epoch": 0.6629392971246006, "grad_norm": 0.737226072296739, "learning_rate": 3.772209567198178e-05, "loss": 0.4686, "loss_nan_ranks": 0, "loss_rank_avg": 0.4548845589160919, "step": 415, "valid_targets_mean": 3062.8, "valid_targets_min": 1112 }, { "epoch": 0.670926517571885, "grad_norm": 0.8207102057499368, "learning_rate": 3.8177676537585425e-05, "loss": 0.5013, "loss_nan_ranks": 0, "loss_rank_avg": 0.5302478075027466, "step": 420, "valid_targets_mean": 2693.4, "valid_targets_min": 913 }, { "epoch": 0.6789137380191693, "grad_norm": 0.8145687731562341, "learning_rate": 3.863325740318907e-05, "loss": 0.5151, "loss_nan_ranks": 0, "loss_rank_avg": 0.5070667266845703, "step": 425, "valid_targets_mean": 2775.8, "valid_targets_min": 1168 }, { "epoch": 0.6869009584664537, "grad_norm": 0.8111716683915323, "learning_rate": 3.9088838268792714e-05, "loss": 0.4944, "loss_nan_ranks": 0, "loss_rank_avg": 0.4909268915653229, "step": 430, "valid_targets_mean": 2921.1, "valid_targets_min": 1126 }, { "epoch": 0.694888178913738, "grad_norm": 0.7411546696567747, "learning_rate": 3.954441913439636e-05, "loss": 0.4783, "loss_nan_ranks": 0, "loss_rank_avg": 0.4458876848220825, "step": 435, "valid_targets_mean": 3290.1, "valid_targets_min": 1084 }, { "epoch": 0.7028753993610224, "grad_norm": 0.7518470194155535, "learning_rate": 4e-05, "loss": 0.4812, "loss_nan_ranks": 0, "loss_rank_avg": 0.4502463638782501, "step": 440, "valid_targets_mean": 2823.3, "valid_targets_min": 1108 }, { "epoch": 0.7108626198083067, "grad_norm": 0.7640155259479486, "learning_rate": 3.999984129682125e-05, "loss": 0.4932, "loss_nan_ranks": 0, "loss_rank_avg": 0.46215182542800903, "step": 445, "valid_targets_mean": 2613.8, "valid_targets_min": 960 }, { "epoch": 0.7188498402555911, "grad_norm": 0.7415555019488704, "learning_rate": 3.9999365189803684e-05, "loss": 0.4708, "loss_nan_ranks": 0, "loss_rank_avg": 0.4664982557296753, "step": 450, "valid_targets_mean": 3100.8, "valid_targets_min": 1095 }, { "epoch": 0.7268370607028753, "grad_norm": 0.802377503314035, "learning_rate": 3.9998571686503264e-05, "loss": 0.4866, "loss_nan_ranks": 0, "loss_rank_avg": 0.4585043489933014, "step": 455, "valid_targets_mean": 2264.9, "valid_targets_min": 909 }, { "epoch": 0.7348242811501597, "grad_norm": 0.708085049519949, "learning_rate": 3.9997460799513134e-05, "loss": 0.4845, "loss_nan_ranks": 0, "loss_rank_avg": 0.5432193279266357, "step": 460, "valid_targets_mean": 3839.4, "valid_targets_min": 873 }, { "epoch": 0.7428115015974441, "grad_norm": 0.7879120589505894, "learning_rate": 3.999603254646343e-05, "loss": 0.475, "loss_nan_ranks": 0, "loss_rank_avg": 0.46323227882385254, "step": 465, "valid_targets_mean": 3269.4, "valid_targets_min": 1072 }, { "epoch": 0.7507987220447284, "grad_norm": 0.749075306348792, "learning_rate": 3.9994286950020986e-05, "loss": 0.507, "loss_nan_ranks": 0, "loss_rank_avg": 0.4851936101913452, "step": 470, "valid_targets_mean": 3137.9, "valid_targets_min": 1124 }, { "epoch": 0.7587859424920128, "grad_norm": 0.7129540444830214, "learning_rate": 3.999222403788896e-05, "loss": 0.4729, "loss_nan_ranks": 0, "loss_rank_avg": 0.4908882975578308, "step": 475, "valid_targets_mean": 3526.2, "valid_targets_min": 1146 }, { "epoch": 0.7667731629392971, "grad_norm": 0.73095835831582, "learning_rate": 3.9989843842806435e-05, "loss": 0.4863, "loss_nan_ranks": 0, "loss_rank_avg": 0.43629252910614014, "step": 480, "valid_targets_mean": 3166.7, "valid_targets_min": 1356 }, { "epoch": 0.7747603833865815, "grad_norm": 0.8481950002243562, "learning_rate": 3.998714640254786e-05, "loss": 0.4703, "loss_nan_ranks": 0, "loss_rank_avg": 0.4779198169708252, "step": 485, "valid_targets_mean": 2446.2, "valid_targets_min": 1053 }, { "epoch": 0.7827476038338658, "grad_norm": 0.9252979170092325, "learning_rate": 3.998413175992247e-05, "loss": 0.4909, "loss_nan_ranks": 0, "loss_rank_avg": 0.4803544878959656, "step": 490, "valid_targets_mean": 2121.9, "valid_targets_min": 1006 }, { "epoch": 0.7907348242811502, "grad_norm": 0.9413520178628827, "learning_rate": 3.99807999627736e-05, "loss": 0.5062, "loss_nan_ranks": 0, "loss_rank_avg": 0.5145155191421509, "step": 495, "valid_targets_mean": 2570.1, "valid_targets_min": 1079 }, { "epoch": 0.7987220447284346, "grad_norm": 0.8048047081738046, "learning_rate": 3.997715106397794e-05, "loss": 0.4847, "loss_nan_ranks": 0, "loss_rank_avg": 0.4717975854873657, "step": 500, "valid_targets_mean": 2329.3, "valid_targets_min": 938 }, { "epoch": 0.8067092651757188, "grad_norm": 0.7643728322556019, "learning_rate": 3.997318512144465e-05, "loss": 0.4873, "loss_nan_ranks": 0, "loss_rank_avg": 0.46637722849845886, "step": 505, "valid_targets_mean": 2817.7, "valid_targets_min": 715 }, { "epoch": 0.8146964856230032, "grad_norm": 0.8279624349532135, "learning_rate": 3.9968902198114516e-05, "loss": 0.4673, "loss_nan_ranks": 0, "loss_rank_avg": 0.5180720686912537, "step": 510, "valid_targets_mean": 2913.6, "valid_targets_min": 823 }, { "epoch": 0.8226837060702875, "grad_norm": 0.8109766155806294, "learning_rate": 3.996430236195889e-05, "loss": 0.4805, "loss_nan_ranks": 0, "loss_rank_avg": 0.49160677194595337, "step": 515, "valid_targets_mean": 2462.8, "valid_targets_min": 1046 }, { "epoch": 0.8306709265175719, "grad_norm": 0.7956373398673393, "learning_rate": 3.995938568597864e-05, "loss": 0.4909, "loss_nan_ranks": 0, "loss_rank_avg": 0.42897269129753113, "step": 520, "valid_targets_mean": 2364.6, "valid_targets_min": 1400 }, { "epoch": 0.8386581469648562, "grad_norm": 0.7414841411842699, "learning_rate": 3.995415224820297e-05, "loss": 0.4887, "loss_nan_ranks": 0, "loss_rank_avg": 0.5362697839736938, "step": 525, "valid_targets_mean": 3108.9, "valid_targets_min": 1195 }, { "epoch": 0.8466453674121406, "grad_norm": 0.8317859182220397, "learning_rate": 3.994860213168819e-05, "loss": 0.469, "loss_nan_ranks": 0, "loss_rank_avg": 0.483562171459198, "step": 530, "valid_targets_mean": 2305.6, "valid_targets_min": 1103 }, { "epoch": 0.854632587859425, "grad_norm": 0.8462535217865819, "learning_rate": 3.9942735424516435e-05, "loss": 0.4811, "loss_nan_ranks": 0, "loss_rank_avg": 0.4656353294849396, "step": 535, "valid_targets_mean": 2399.4, "valid_targets_min": 613 }, { "epoch": 0.8626198083067093, "grad_norm": 0.7834889362197252, "learning_rate": 3.9936552219794196e-05, "loss": 0.4826, "loss_nan_ranks": 0, "loss_rank_avg": 0.4877358675003052, "step": 540, "valid_targets_mean": 3244.2, "valid_targets_min": 837 }, { "epoch": 0.8706070287539937, "grad_norm": 0.8102216918022214, "learning_rate": 3.993005261565091e-05, "loss": 0.4716, "loss_nan_ranks": 0, "loss_rank_avg": 0.4835214614868164, "step": 545, "valid_targets_mean": 2657.9, "valid_targets_min": 895 }, { "epoch": 0.8785942492012779, "grad_norm": 0.7484190976431879, "learning_rate": 3.992323671523735e-05, "loss": 0.4861, "loss_nan_ranks": 0, "loss_rank_avg": 0.4827854037284851, "step": 550, "valid_targets_mean": 2936.5, "valid_targets_min": 769 }, { "epoch": 0.8865814696485623, "grad_norm": 0.8298777988018279, "learning_rate": 3.991610462672403e-05, "loss": 0.4842, "loss_nan_ranks": 0, "loss_rank_avg": 0.509543240070343, "step": 555, "valid_targets_mean": 2912.0, "valid_targets_min": 1159 }, { "epoch": 0.8945686900958466, "grad_norm": 0.7034233322649788, "learning_rate": 3.9908656463299456e-05, "loss": 0.4695, "loss_nan_ranks": 0, "loss_rank_avg": 0.4778456389904022, "step": 560, "valid_targets_mean": 3026.8, "valid_targets_min": 1167 }, { "epoch": 0.902555910543131, "grad_norm": 0.7349295369253303, "learning_rate": 3.990089234316835e-05, "loss": 0.4771, "loss_nan_ranks": 0, "loss_rank_avg": 0.42017149925231934, "step": 565, "valid_targets_mean": 2561.4, "valid_targets_min": 1007 }, { "epoch": 0.9105431309904153, "grad_norm": 0.8513539946715051, "learning_rate": 3.989281238954978e-05, "loss": 0.4812, "loss_nan_ranks": 0, "loss_rank_avg": 0.45802587270736694, "step": 570, "valid_targets_mean": 2120.5, "valid_targets_min": 962 }, { "epoch": 0.9185303514376997, "grad_norm": 0.7971530719267699, "learning_rate": 3.9884416730675155e-05, "loss": 0.4671, "loss_nan_ranks": 0, "loss_rank_avg": 0.48669928312301636, "step": 575, "valid_targets_mean": 3067.6, "valid_targets_min": 1125 }, { "epoch": 0.9265175718849841, "grad_norm": 0.7526750754328368, "learning_rate": 3.987570549978626e-05, "loss": 0.4601, "loss_nan_ranks": 0, "loss_rank_avg": 0.4806230962276459, "step": 580, "valid_targets_mean": 2587.2, "valid_targets_min": 1150 }, { "epoch": 0.9345047923322684, "grad_norm": 0.8137737946062722, "learning_rate": 3.986667883513311e-05, "loss": 0.4563, "loss_nan_ranks": 0, "loss_rank_avg": 0.518112301826477, "step": 585, "valid_targets_mean": 2852.7, "valid_targets_min": 1193 }, { "epoch": 0.9424920127795527, "grad_norm": 0.8659103970463817, "learning_rate": 3.985733687997173e-05, "loss": 0.489, "loss_nan_ranks": 0, "loss_rank_avg": 0.5319004058837891, "step": 590, "valid_targets_mean": 2343.2, "valid_targets_min": 1225 }, { "epoch": 0.950479233226837, "grad_norm": 0.7469614351703592, "learning_rate": 3.984767978256192e-05, "loss": 0.4564, "loss_nan_ranks": 0, "loss_rank_avg": 0.4597756266593933, "step": 595, "valid_targets_mean": 2952.0, "valid_targets_min": 1383 }, { "epoch": 0.9584664536741214, "grad_norm": 0.7861886747969548, "learning_rate": 3.983770769616488e-05, "loss": 0.4622, "loss_nan_ranks": 0, "loss_rank_avg": 0.4694702923297882, "step": 600, "valid_targets_mean": 2704.9, "valid_targets_min": 855 }, { "epoch": 0.9664536741214057, "grad_norm": 0.7149924456313416, "learning_rate": 3.9827420779040805e-05, "loss": 0.4772, "loss_nan_ranks": 0, "loss_rank_avg": 0.4691518545150757, "step": 605, "valid_targets_mean": 3017.1, "valid_targets_min": 1070 }, { "epoch": 0.9744408945686901, "grad_norm": 0.6590357190461086, "learning_rate": 3.981681919444633e-05, "loss": 0.4613, "loss_nan_ranks": 0, "loss_rank_avg": 0.416545569896698, "step": 610, "valid_targets_mean": 3355.1, "valid_targets_min": 865 }, { "epoch": 0.9824281150159745, "grad_norm": 0.7704139751683394, "learning_rate": 3.980590311063197e-05, "loss": 0.479, "loss_nan_ranks": 0, "loss_rank_avg": 0.5077451467514038, "step": 615, "valid_targets_mean": 2788.4, "valid_targets_min": 651 }, { "epoch": 0.9904153354632588, "grad_norm": 0.738816152478186, "learning_rate": 3.9794672700839455e-05, "loss": 0.4779, "loss_nan_ranks": 0, "loss_rank_avg": 0.47935396432876587, "step": 620, "valid_targets_mean": 2682.5, "valid_targets_min": 1006 }, { "epoch": 0.9984025559105432, "grad_norm": 0.7573465905776805, "learning_rate": 3.9783128143298945e-05, "loss": 0.4591, "loss_nan_ranks": 0, "loss_rank_avg": 0.5034106969833374, "step": 625, "valid_targets_mean": 2697.0, "valid_targets_min": 878 }, { "epoch": 1.0063897763578276, "grad_norm": 0.7685082899437944, "learning_rate": 3.977126962122625e-05, "loss": 0.4473, "loss_nan_ranks": 0, "loss_rank_avg": 0.4544332027435303, "step": 630, "valid_targets_mean": 2484.2, "valid_targets_min": 1257 }, { "epoch": 1.0143769968051117, "grad_norm": 0.7630287431391214, "learning_rate": 3.975909732281988e-05, "loss": 0.4815, "loss_nan_ranks": 0, "loss_rank_avg": 0.5001740455627441, "step": 635, "valid_targets_mean": 2804.8, "valid_targets_min": 1111 }, { "epoch": 1.0223642172523961, "grad_norm": 0.8349889620121833, "learning_rate": 3.974661144125808e-05, "loss": 0.4379, "loss_nan_ranks": 0, "loss_rank_avg": 0.44968223571777344, "step": 640, "valid_targets_mean": 2246.1, "valid_targets_min": 934 }, { "epoch": 1.0303514376996805, "grad_norm": 0.7289354674087208, "learning_rate": 3.973381217469576e-05, "loss": 0.4177, "loss_nan_ranks": 0, "loss_rank_avg": 0.39167508482933044, "step": 645, "valid_targets_mean": 2778.6, "valid_targets_min": 1312 }, { "epoch": 1.038338658146965, "grad_norm": 0.7610454326773037, "learning_rate": 3.972069972626135e-05, "loss": 0.4489, "loss_nan_ranks": 0, "loss_rank_avg": 0.4945276379585266, "step": 650, "valid_targets_mean": 2881.5, "valid_targets_min": 1154 }, { "epoch": 1.0463258785942493, "grad_norm": 0.7529804157949619, "learning_rate": 3.970727430405357e-05, "loss": 0.4461, "loss_nan_ranks": 0, "loss_rank_avg": 0.4402261972427368, "step": 655, "valid_targets_mean": 3169.2, "valid_targets_min": 881 }, { "epoch": 1.0543130990415335, "grad_norm": 0.7479368522385385, "learning_rate": 3.969353612113815e-05, "loss": 0.4171, "loss_nan_ranks": 0, "loss_rank_avg": 0.45113587379455566, "step": 660, "valid_targets_mean": 2818.9, "valid_targets_min": 904 }, { "epoch": 1.0623003194888179, "grad_norm": 0.7429987740189701, "learning_rate": 3.96794853955444e-05, "loss": 0.4416, "loss_nan_ranks": 0, "loss_rank_avg": 0.3951209783554077, "step": 665, "valid_targets_mean": 2721.9, "valid_targets_min": 855 }, { "epoch": 1.0702875399361023, "grad_norm": 0.6988528547787896, "learning_rate": 3.966512235026182e-05, "loss": 0.4364, "loss_nan_ranks": 0, "loss_rank_avg": 0.44669538736343384, "step": 670, "valid_targets_mean": 3886.9, "valid_targets_min": 970 }, { "epoch": 1.0782747603833867, "grad_norm": 0.7685049413282936, "learning_rate": 3.96504472132365e-05, "loss": 0.4628, "loss_nan_ranks": 0, "loss_rank_avg": 0.46493786573410034, "step": 675, "valid_targets_mean": 2864.7, "valid_targets_min": 912 }, { "epoch": 1.0862619808306708, "grad_norm": 0.7321617108406029, "learning_rate": 3.9635460217367513e-05, "loss": 0.4508, "loss_nan_ranks": 0, "loss_rank_avg": 0.41404807567596436, "step": 680, "valid_targets_mean": 2885.9, "valid_targets_min": 1079 }, { "epoch": 1.0942492012779552, "grad_norm": 0.7592802978135224, "learning_rate": 3.962016160050327e-05, "loss": 0.4482, "loss_nan_ranks": 0, "loss_rank_avg": 0.41572150588035583, "step": 685, "valid_targets_mean": 2479.6, "valid_targets_min": 913 }, { "epoch": 1.1022364217252396, "grad_norm": 0.732817568596785, "learning_rate": 3.960455160543767e-05, "loss": 0.4626, "loss_nan_ranks": 0, "loss_rank_avg": 0.42624184489250183, "step": 690, "valid_targets_mean": 2974.9, "valid_targets_min": 928 }, { "epoch": 1.110223642172524, "grad_norm": 0.76011633776547, "learning_rate": 3.958863047990631e-05, "loss": 0.4283, "loss_nan_ranks": 0, "loss_rank_avg": 0.43110883235931396, "step": 695, "valid_targets_mean": 2901.8, "valid_targets_min": 938 }, { "epoch": 1.1182108626198084, "grad_norm": 0.8431475807189021, "learning_rate": 3.95723984765825e-05, "loss": 0.4612, "loss_nan_ranks": 0, "loss_rank_avg": 0.5132505893707275, "step": 700, "valid_targets_mean": 2484.8, "valid_targets_min": 1412 }, { "epoch": 1.1261980830670926, "grad_norm": 0.9220223660266152, "learning_rate": 3.955585585307329e-05, "loss": 0.46, "loss_nan_ranks": 0, "loss_rank_avg": 0.44615116715431213, "step": 705, "valid_targets_mean": 2291.6, "valid_targets_min": 884 }, { "epoch": 1.134185303514377, "grad_norm": 1.019334003630654, "learning_rate": 3.9539002871915395e-05, "loss": 0.4542, "loss_nan_ranks": 0, "loss_rank_avg": 0.43944239616394043, "step": 710, "valid_targets_mean": 2567.4, "valid_targets_min": 1308 }, { "epoch": 1.1421725239616614, "grad_norm": 0.7795615708622041, "learning_rate": 3.952183980057096e-05, "loss": 0.4325, "loss_nan_ranks": 0, "loss_rank_avg": 0.4104035496711731, "step": 715, "valid_targets_mean": 2444.2, "valid_targets_min": 803 }, { "epoch": 1.1501597444089458, "grad_norm": 0.8468623107296779, "learning_rate": 3.950436691142339e-05, "loss": 0.4401, "loss_nan_ranks": 0, "loss_rank_avg": 0.43115919828414917, "step": 720, "valid_targets_mean": 2466.9, "valid_targets_min": 1406 }, { "epoch": 1.15814696485623, "grad_norm": 0.8529964274281423, "learning_rate": 3.948658448177299e-05, "loss": 0.4524, "loss_nan_ranks": 0, "loss_rank_avg": 0.48739194869995117, "step": 725, "valid_targets_mean": 2443.1, "valid_targets_min": 1168 }, { "epoch": 1.1661341853035143, "grad_norm": 0.7172046757160037, "learning_rate": 3.946849279383258e-05, "loss": 0.4257, "loss_nan_ranks": 0, "loss_rank_avg": 0.3758084774017334, "step": 730, "valid_targets_mean": 2842.2, "valid_targets_min": 1077 }, { "epoch": 1.1741214057507987, "grad_norm": 0.711565411890527, "learning_rate": 3.9450092134722984e-05, "loss": 0.4377, "loss_nan_ranks": 0, "loss_rank_avg": 0.4145118296146393, "step": 735, "valid_targets_mean": 3007.6, "valid_targets_min": 507 }, { "epoch": 1.182108626198083, "grad_norm": 0.8309877125516639, "learning_rate": 3.943138279646853e-05, "loss": 0.4421, "loss_nan_ranks": 0, "loss_rank_avg": 0.46872472763061523, "step": 740, "valid_targets_mean": 2660.7, "valid_targets_min": 818 }, { "epoch": 1.1900958466453675, "grad_norm": 0.8195558428978243, "learning_rate": 3.941236507599234e-05, "loss": 0.4364, "loss_nan_ranks": 0, "loss_rank_avg": 0.4253050982952118, "step": 745, "valid_targets_mean": 2162.1, "valid_targets_min": 877 }, { "epoch": 1.1980830670926517, "grad_norm": 0.7757463661583209, "learning_rate": 3.93930392751117e-05, "loss": 0.4283, "loss_nan_ranks": 0, "loss_rank_avg": 0.41354313492774963, "step": 750, "valid_targets_mean": 2641.2, "valid_targets_min": 1158 }, { "epoch": 1.206070287539936, "grad_norm": 0.8685777071160953, "learning_rate": 3.9373405700533204e-05, "loss": 0.4354, "loss_nan_ranks": 0, "loss_rank_avg": 0.4196351170539856, "step": 755, "valid_targets_mean": 2522.3, "valid_targets_min": 733 }, { "epoch": 1.2140575079872205, "grad_norm": 0.7508846483862592, "learning_rate": 3.935346466384793e-05, "loss": 0.4199, "loss_nan_ranks": 0, "loss_rank_avg": 0.44403281807899475, "step": 760, "valid_targets_mean": 3216.3, "valid_targets_min": 1101 }, { "epoch": 1.2220447284345048, "grad_norm": 0.758240824860655, "learning_rate": 3.933321648152646e-05, "loss": 0.4384, "loss_nan_ranks": 0, "loss_rank_avg": 0.4567496180534363, "step": 765, "valid_targets_mean": 2950.4, "valid_targets_min": 1193 }, { "epoch": 1.230031948881789, "grad_norm": 0.7200839121536595, "learning_rate": 3.931266147491389e-05, "loss": 0.4516, "loss_nan_ranks": 0, "loss_rank_avg": 0.4802227020263672, "step": 770, "valid_targets_mean": 3282.1, "valid_targets_min": 1203 }, { "epoch": 1.2380191693290734, "grad_norm": 0.6572973431050214, "learning_rate": 3.929179997022471e-05, "loss": 0.4278, "loss_nan_ranks": 0, "loss_rank_avg": 0.39114686846733093, "step": 775, "valid_targets_mean": 3843.3, "valid_targets_min": 992 }, { "epoch": 1.2460063897763578, "grad_norm": 0.6844582042432027, "learning_rate": 3.927063229853763e-05, "loss": 0.4535, "loss_nan_ranks": 0, "loss_rank_avg": 0.4484739303588867, "step": 780, "valid_targets_mean": 3771.4, "valid_targets_min": 1028 }, { "epoch": 1.2539936102236422, "grad_norm": 0.7829452545267517, "learning_rate": 3.9249158795790316e-05, "loss": 0.4315, "loss_nan_ranks": 0, "loss_rank_avg": 0.4051206707954407, "step": 785, "valid_targets_mean": 2456.8, "valid_targets_min": 764 }, { "epoch": 1.2619808306709266, "grad_norm": 0.8420722089855658, "learning_rate": 3.9227379802774106e-05, "loss": 0.4634, "loss_nan_ranks": 0, "loss_rank_avg": 0.4935472011566162, "step": 790, "valid_targets_mean": 2295.8, "valid_targets_min": 816 }, { "epoch": 1.269968051118211, "grad_norm": 0.7215521455732657, "learning_rate": 3.920529566512852e-05, "loss": 0.4358, "loss_nan_ranks": 0, "loss_rank_avg": 0.4593965709209442, "step": 795, "valid_targets_mean": 3036.1, "valid_targets_min": 1362 }, { "epoch": 1.2779552715654952, "grad_norm": 0.6783023396300084, "learning_rate": 3.918290673333585e-05, "loss": 0.437, "loss_nan_ranks": 0, "loss_rank_avg": 0.4560937285423279, "step": 800, "valid_targets_mean": 3412.9, "valid_targets_min": 893 }, { "epoch": 1.2859424920127795, "grad_norm": 0.8802145850392343, "learning_rate": 3.916021336271556e-05, "loss": 0.4354, "loss_nan_ranks": 0, "loss_rank_avg": 0.42020413279533386, "step": 805, "valid_targets_mean": 2170.1, "valid_targets_min": 722 }, { "epoch": 1.293929712460064, "grad_norm": 0.8120285437652148, "learning_rate": 3.913721591341867e-05, "loss": 0.4176, "loss_nan_ranks": 0, "loss_rank_avg": 0.41880103945732117, "step": 810, "valid_targets_mean": 2954.5, "valid_targets_min": 1212 }, { "epoch": 1.3019169329073481, "grad_norm": 0.8288104538653214, "learning_rate": 3.9113914750421985e-05, "loss": 0.4255, "loss_nan_ranks": 0, "loss_rank_avg": 0.41077354550361633, "step": 815, "valid_targets_mean": 2509.9, "valid_targets_min": 1417 }, { "epoch": 1.3099041533546325, "grad_norm": 0.8618512146438632, "learning_rate": 3.9090310243522394e-05, "loss": 0.4259, "loss_nan_ranks": 0, "loss_rank_avg": 0.44943004846572876, "step": 820, "valid_targets_mean": 2502.8, "valid_targets_min": 1461 }, { "epoch": 1.317891373801917, "grad_norm": 0.7760318158209316, "learning_rate": 3.90664027673309e-05, "loss": 0.4501, "loss_nan_ranks": 0, "loss_rank_avg": 0.4216914772987366, "step": 825, "valid_targets_mean": 2769.1, "valid_targets_min": 1289 }, { "epoch": 1.3258785942492013, "grad_norm": 0.6906923363443747, "learning_rate": 3.904219270126677e-05, "loss": 0.4191, "loss_nan_ranks": 0, "loss_rank_avg": 0.415194571018219, "step": 830, "valid_targets_mean": 3361.9, "valid_targets_min": 1049 }, { "epoch": 1.3338658146964857, "grad_norm": 0.8174353322181585, "learning_rate": 3.901768042955144e-05, "loss": 0.4324, "loss_nan_ranks": 0, "loss_rank_avg": 0.45407986640930176, "step": 835, "valid_targets_mean": 2556.1, "valid_targets_min": 1003 }, { "epoch": 1.34185303514377, "grad_norm": 0.7692657856870714, "learning_rate": 3.8992866341202446e-05, "loss": 0.4124, "loss_nan_ranks": 0, "loss_rank_avg": 0.393581748008728, "step": 840, "valid_targets_mean": 2292.6, "valid_targets_min": 981 }, { "epoch": 1.3498402555910542, "grad_norm": 0.7721910677108021, "learning_rate": 3.8967750830027277e-05, "loss": 0.4225, "loss_nan_ranks": 0, "loss_rank_avg": 0.43121227622032166, "step": 845, "valid_targets_mean": 2591.4, "valid_targets_min": 1106 }, { "epoch": 1.3578274760383386, "grad_norm": 0.7607761762713008, "learning_rate": 3.894233429461706e-05, "loss": 0.4357, "loss_nan_ranks": 0, "loss_rank_avg": 0.45984774827957153, "step": 850, "valid_targets_mean": 2971.3, "valid_targets_min": 1249 }, { "epoch": 1.365814696485623, "grad_norm": 0.7549358056556162, "learning_rate": 3.89166171383403e-05, "loss": 0.4134, "loss_nan_ranks": 0, "loss_rank_avg": 0.4264622926712036, "step": 855, "valid_targets_mean": 2585.4, "valid_targets_min": 1483 }, { "epoch": 1.3738019169329074, "grad_norm": 0.721426310472384, "learning_rate": 3.889059976933644e-05, "loss": 0.4258, "loss_nan_ranks": 0, "loss_rank_avg": 0.4268583059310913, "step": 860, "valid_targets_mean": 2885.3, "valid_targets_min": 1173 }, { "epoch": 1.3817891373801916, "grad_norm": 0.7720799009636946, "learning_rate": 3.88642826005094e-05, "loss": 0.4505, "loss_nan_ranks": 0, "loss_rank_avg": 0.42852962017059326, "step": 865, "valid_targets_mean": 2731.6, "valid_targets_min": 871 }, { "epoch": 1.389776357827476, "grad_norm": 0.8470631851658071, "learning_rate": 3.883766604952102e-05, "loss": 0.4547, "loss_nan_ranks": 0, "loss_rank_avg": 0.49135443568229675, "step": 870, "valid_targets_mean": 2234.6, "valid_targets_min": 999 }, { "epoch": 1.3977635782747604, "grad_norm": 0.7411779868421573, "learning_rate": 3.8810750538784404e-05, "loss": 0.4435, "loss_nan_ranks": 0, "loss_rank_avg": 0.4041995406150818, "step": 875, "valid_targets_mean": 2670.5, "valid_targets_min": 1122 }, { "epoch": 1.4057507987220448, "grad_norm": 0.7140299672524761, "learning_rate": 3.878353649545728e-05, "loss": 0.4402, "loss_nan_ranks": 0, "loss_rank_avg": 0.435030996799469, "step": 880, "valid_targets_mean": 3004.1, "valid_targets_min": 1197 }, { "epoch": 1.4137380191693292, "grad_norm": 0.7923681119897052, "learning_rate": 3.875602435143517e-05, "loss": 0.4411, "loss_nan_ranks": 0, "loss_rank_avg": 0.3961261510848999, "step": 885, "valid_targets_mean": 2766.9, "valid_targets_min": 862 }, { "epoch": 1.4217252396166133, "grad_norm": 0.7705589230089058, "learning_rate": 3.872821454334453e-05, "loss": 0.4351, "loss_nan_ranks": 0, "loss_rank_avg": 0.4006156921386719, "step": 890, "valid_targets_mean": 2416.2, "valid_targets_min": 1003 }, { "epoch": 1.4297124600638977, "grad_norm": 0.6925517039660947, "learning_rate": 3.870010751253587e-05, "loss": 0.4377, "loss_nan_ranks": 0, "loss_rank_avg": 0.4088160991668701, "step": 895, "valid_targets_mean": 3179.1, "valid_targets_min": 763 }, { "epoch": 1.4376996805111821, "grad_norm": 0.8307106887932786, "learning_rate": 3.867170370507668e-05, "loss": 0.4581, "loss_nan_ranks": 0, "loss_rank_avg": 0.4864905774593353, "step": 900, "valid_targets_mean": 2541.1, "valid_targets_min": 778 }, { "epoch": 1.4456869009584665, "grad_norm": 0.9623816866236481, "learning_rate": 3.8643003571744445e-05, "loss": 0.4486, "loss_nan_ranks": 0, "loss_rank_avg": 0.4354180693626404, "step": 905, "valid_targets_mean": 2225.6, "valid_targets_min": 1063 }, { "epoch": 1.4536741214057507, "grad_norm": 0.7716245831699764, "learning_rate": 3.861400756801938e-05, "loss": 0.4606, "loss_nan_ranks": 0, "loss_rank_avg": 0.4495222568511963, "step": 910, "valid_targets_mean": 3027.4, "valid_targets_min": 919 }, { "epoch": 1.461661341853035, "grad_norm": 0.7484846052853862, "learning_rate": 3.8584716154077286e-05, "loss": 0.4305, "loss_nan_ranks": 0, "loss_rank_avg": 0.4441258907318115, "step": 915, "valid_targets_mean": 3202.1, "valid_targets_min": 1124 }, { "epoch": 1.4696485623003195, "grad_norm": 0.7368859538362733, "learning_rate": 3.855512979478222e-05, "loss": 0.4252, "loss_nan_ranks": 0, "loss_rank_avg": 0.3749830722808838, "step": 920, "valid_targets_mean": 2625.4, "valid_targets_min": 1193 }, { "epoch": 1.4776357827476039, "grad_norm": 0.6049367824225332, "learning_rate": 3.852524895967911e-05, "loss": 0.4246, "loss_nan_ranks": 0, "loss_rank_avg": 0.38308608531951904, "step": 925, "valid_targets_mean": 4036.0, "valid_targets_min": 1111 }, { "epoch": 1.4856230031948883, "grad_norm": 0.7427843372018998, "learning_rate": 3.8495074122986296e-05, "loss": 0.4265, "loss_nan_ranks": 0, "loss_rank_avg": 0.4193194806575775, "step": 930, "valid_targets_mean": 2806.4, "valid_targets_min": 789 }, { "epoch": 1.4936102236421724, "grad_norm": 0.679197562951001, "learning_rate": 3.846460576358804e-05, "loss": 0.4365, "loss_nan_ranks": 0, "loss_rank_avg": 0.44789695739746094, "step": 935, "valid_targets_mean": 3683.1, "valid_targets_min": 1532 }, { "epoch": 1.5015974440894568, "grad_norm": 0.6722746741760623, "learning_rate": 3.843384436502688e-05, "loss": 0.4293, "loss_nan_ranks": 0, "loss_rank_avg": 0.4009643793106079, "step": 940, "valid_targets_mean": 3287.3, "valid_targets_min": 1028 }, { "epoch": 1.5095846645367412, "grad_norm": 0.7368258927731269, "learning_rate": 3.8402790415496e-05, "loss": 0.4549, "loss_nan_ranks": 0, "loss_rank_avg": 0.43784040212631226, "step": 945, "valid_targets_mean": 2733.6, "valid_targets_min": 1148 }, { "epoch": 1.5175718849840254, "grad_norm": 0.7152894771456657, "learning_rate": 3.837144440783144e-05, "loss": 0.4161, "loss_nan_ranks": 0, "loss_rank_avg": 0.44536614418029785, "step": 950, "valid_targets_mean": 3164.2, "valid_targets_min": 1067 }, { "epoch": 1.5255591054313098, "grad_norm": 0.7947534576481916, "learning_rate": 3.833980683950431e-05, "loss": 0.4814, "loss_nan_ranks": 0, "loss_rank_avg": 0.4934665858745575, "step": 955, "valid_targets_mean": 2351.3, "valid_targets_min": 651 }, { "epoch": 1.5335463258785942, "grad_norm": 0.7875282517828147, "learning_rate": 3.8307878212612886e-05, "loss": 0.4418, "loss_nan_ranks": 0, "loss_rank_avg": 0.43938589096069336, "step": 960, "valid_targets_mean": 2303.6, "valid_targets_min": 1131 }, { "epoch": 1.5415335463258786, "grad_norm": 0.5923903169412785, "learning_rate": 3.827565903387461e-05, "loss": 0.4374, "loss_nan_ranks": 0, "loss_rank_avg": 0.41518276929855347, "step": 965, "valid_targets_mean": 4034.9, "valid_targets_min": 1231 }, { "epoch": 1.549520766773163, "grad_norm": 0.8910911155444613, "learning_rate": 3.82431498146181e-05, "loss": 0.4357, "loss_nan_ranks": 0, "loss_rank_avg": 0.4936522841453552, "step": 970, "valid_targets_mean": 2327.3, "valid_targets_min": 834 }, { "epoch": 1.5575079872204474, "grad_norm": 0.6459335309997667, "learning_rate": 3.821035107077499e-05, "loss": 0.4358, "loss_nan_ranks": 0, "loss_rank_avg": 0.41498053073883057, "step": 975, "valid_targets_mean": 3341.9, "valid_targets_min": 1006 }, { "epoch": 1.5654952076677318, "grad_norm": 0.6926152294260767, "learning_rate": 3.817726332287179e-05, "loss": 0.4259, "loss_nan_ranks": 0, "loss_rank_avg": 0.4034827947616577, "step": 980, "valid_targets_mean": 3087.4, "valid_targets_min": 1153 }, { "epoch": 1.573482428115016, "grad_norm": 0.8034994479627938, "learning_rate": 3.814388709602155e-05, "loss": 0.4412, "loss_nan_ranks": 0, "loss_rank_avg": 0.43312889337539673, "step": 985, "valid_targets_mean": 2240.4, "valid_targets_min": 1043 }, { "epoch": 1.5814696485623003, "grad_norm": 0.7989642353413773, "learning_rate": 3.8110222919915626e-05, "loss": 0.4381, "loss_nan_ranks": 0, "loss_rank_avg": 0.4340096414089203, "step": 990, "valid_targets_mean": 2381.8, "valid_targets_min": 791 }, { "epoch": 1.5894568690095847, "grad_norm": 0.6447498747286449, "learning_rate": 3.8076271328815175e-05, "loss": 0.4441, "loss_nan_ranks": 0, "loss_rank_avg": 0.42020028829574585, "step": 995, "valid_targets_mean": 3908.2, "valid_targets_min": 1254 }, { "epoch": 1.5974440894568689, "grad_norm": 0.6380365159848356, "learning_rate": 3.804203286154275e-05, "loss": 0.4065, "loss_nan_ranks": 0, "loss_rank_avg": 0.4114200472831726, "step": 1000, "valid_targets_mean": 3355.1, "valid_targets_min": 1473 }, { "epoch": 1.6054313099041533, "grad_norm": 0.636811929140562, "learning_rate": 3.800750806147371e-05, "loss": 0.4364, "loss_nan_ranks": 0, "loss_rank_avg": 0.4242017865180969, "step": 1005, "valid_targets_mean": 3736.1, "valid_targets_min": 1562 }, { "epoch": 1.6134185303514377, "grad_norm": 0.7542875453304175, "learning_rate": 3.79726974765276e-05, "loss": 0.4566, "loss_nan_ranks": 0, "loss_rank_avg": 0.4269424080848694, "step": 1010, "valid_targets_mean": 3016.4, "valid_targets_min": 848 }, { "epoch": 1.621405750798722, "grad_norm": 0.6894222849805512, "learning_rate": 3.793760165915947e-05, "loss": 0.4412, "loss_nan_ranks": 0, "loss_rank_avg": 0.4064532518386841, "step": 1015, "valid_targets_mean": 3785.7, "valid_targets_min": 737 }, { "epoch": 1.6293929712460065, "grad_norm": 0.7778570976152539, "learning_rate": 3.7902221166351106e-05, "loss": 0.4165, "loss_nan_ranks": 0, "loss_rank_avg": 0.4298957586288452, "step": 1020, "valid_targets_mean": 2434.3, "valid_targets_min": 864 }, { "epoch": 1.6373801916932909, "grad_norm": 0.6857539738494024, "learning_rate": 3.786655655960216e-05, "loss": 0.4267, "loss_nan_ranks": 0, "loss_rank_avg": 0.4040903151035309, "step": 1025, "valid_targets_mean": 2788.6, "valid_targets_min": 1324 }, { "epoch": 1.645367412140575, "grad_norm": 0.7706739406760523, "learning_rate": 3.7830608404921294e-05, "loss": 0.4269, "loss_nan_ranks": 0, "loss_rank_avg": 0.457536906003952, "step": 1030, "valid_targets_mean": 2625.8, "valid_targets_min": 1098 }, { "epoch": 1.6533546325878594, "grad_norm": 0.7189631307182224, "learning_rate": 3.7794377272817144e-05, "loss": 0.4513, "loss_nan_ranks": 0, "loss_rank_avg": 0.4552885591983795, "step": 1035, "valid_targets_mean": 3002.1, "valid_targets_min": 1346 }, { "epoch": 1.6613418530351438, "grad_norm": 0.6939968937775858, "learning_rate": 3.775786373828929e-05, "loss": 0.4401, "loss_nan_ranks": 0, "loss_rank_avg": 0.42244094610214233, "step": 1040, "valid_targets_mean": 3193.0, "valid_targets_min": 1181 }, { "epoch": 1.669329073482428, "grad_norm": 0.8310645339562641, "learning_rate": 3.7721068380819135e-05, "loss": 0.449, "loss_nan_ranks": 0, "loss_rank_avg": 0.4165183901786804, "step": 1045, "valid_targets_mean": 2545.9, "valid_targets_min": 1071 }, { "epoch": 1.6773162939297124, "grad_norm": 0.6767363971798981, "learning_rate": 3.768399178436069e-05, "loss": 0.439, "loss_nan_ranks": 0, "loss_rank_avg": 0.44542649388313293, "step": 1050, "valid_targets_mean": 3308.1, "valid_targets_min": 995 }, { "epoch": 1.6853035143769968, "grad_norm": 0.6972061039612378, "learning_rate": 3.764663453733135e-05, "loss": 0.4617, "loss_nan_ranks": 0, "loss_rank_avg": 0.48311084508895874, "step": 1055, "valid_targets_mean": 3087.3, "valid_targets_min": 1261 }, { "epoch": 1.6932907348242812, "grad_norm": 0.7005302044576569, "learning_rate": 3.7608997232602475e-05, "loss": 0.421, "loss_nan_ranks": 0, "loss_rank_avg": 0.38864031434059143, "step": 1060, "valid_targets_mean": 2687.6, "valid_targets_min": 923 }, { "epoch": 1.7012779552715656, "grad_norm": 0.6895071074838427, "learning_rate": 3.757108046749006e-05, "loss": 0.449, "loss_nan_ranks": 0, "loss_rank_avg": 0.41667845845222473, "step": 1065, "valid_targets_mean": 2960.2, "valid_targets_min": 1043 }, { "epoch": 1.70926517571885, "grad_norm": 0.7256933741627416, "learning_rate": 3.753288484374524e-05, "loss": 0.439, "loss_nan_ranks": 0, "loss_rank_avg": 0.4952039420604706, "step": 1070, "valid_targets_mean": 2882.8, "valid_targets_min": 1440 }, { "epoch": 1.7172523961661343, "grad_norm": 0.7266869951359273, "learning_rate": 3.7494410967544674e-05, "loss": 0.4438, "loss_nan_ranks": 0, "loss_rank_avg": 0.4499083161354065, "step": 1075, "valid_targets_mean": 2684.9, "valid_targets_min": 891 }, { "epoch": 1.7252396166134185, "grad_norm": 0.7287210054336749, "learning_rate": 3.745565944948103e-05, "loss": 0.4326, "loss_nan_ranks": 0, "loss_rank_avg": 0.4443957507610321, "step": 1080, "valid_targets_mean": 3179.3, "valid_targets_min": 1110 }, { "epoch": 1.733226837060703, "grad_norm": 0.7302401962493207, "learning_rate": 3.7416630904553205e-05, "loss": 0.42, "loss_nan_ranks": 0, "loss_rank_avg": 0.3901965618133545, "step": 1085, "valid_targets_mean": 2506.9, "valid_targets_min": 1108 }, { "epoch": 1.741214057507987, "grad_norm": 0.7621719007011174, "learning_rate": 3.737732595215663e-05, "loss": 0.4318, "loss_nan_ranks": 0, "loss_rank_avg": 0.49417999386787415, "step": 1090, "valid_targets_mean": 2648.5, "valid_targets_min": 966 }, { "epoch": 1.7492012779552715, "grad_norm": 0.7488069211998931, "learning_rate": 3.733774521607338e-05, "loss": 0.4237, "loss_nan_ranks": 0, "loss_rank_avg": 0.45603471994400024, "step": 1095, "valid_targets_mean": 2818.9, "valid_targets_min": 1088 }, { "epoch": 1.7571884984025559, "grad_norm": 0.8084202592590568, "learning_rate": 3.729788932446231e-05, "loss": 0.4242, "loss_nan_ranks": 0, "loss_rank_avg": 0.45258504152297974, "step": 1100, "valid_targets_mean": 2080.5, "valid_targets_min": 1112 }, { "epoch": 1.7651757188498403, "grad_norm": 0.6611827236924629, "learning_rate": 3.7257758909849107e-05, "loss": 0.4394, "loss_nan_ranks": 0, "loss_rank_avg": 0.44405344128608704, "step": 1105, "valid_targets_mean": 3858.6, "valid_targets_min": 808 }, { "epoch": 1.7731629392971247, "grad_norm": 0.6162135150058156, "learning_rate": 3.72173546091162e-05, "loss": 0.4372, "loss_nan_ranks": 0, "loss_rank_avg": 0.42961829900741577, "step": 1110, "valid_targets_mean": 3943.2, "valid_targets_min": 1108 }, { "epoch": 1.781150159744409, "grad_norm": 0.7394032295272298, "learning_rate": 3.7176677063492685e-05, "loss": 0.4463, "loss_nan_ranks": 0, "loss_rank_avg": 0.45540672540664673, "step": 1115, "valid_targets_mean": 2557.6, "valid_targets_min": 970 }, { "epoch": 1.7891373801916934, "grad_norm": 0.7739659694704212, "learning_rate": 3.713572691854414e-05, "loss": 0.4132, "loss_nan_ranks": 0, "loss_rank_avg": 0.4244069457054138, "step": 1120, "valid_targets_mean": 2507.1, "valid_targets_min": 912 }, { "epoch": 1.7971246006389776, "grad_norm": 0.7905713199175826, "learning_rate": 3.709450482416239e-05, "loss": 0.4084, "loss_nan_ranks": 0, "loss_rank_avg": 0.4046608805656433, "step": 1125, "valid_targets_mean": 2224.6, "valid_targets_min": 1342 }, { "epoch": 1.805111821086262, "grad_norm": 0.7853975413698725, "learning_rate": 3.7053011434555165e-05, "loss": 0.4181, "loss_nan_ranks": 0, "loss_rank_avg": 0.4040316343307495, "step": 1130, "valid_targets_mean": 2187.2, "valid_targets_min": 949 }, { "epoch": 1.8130990415335462, "grad_norm": 1.5880148849392963, "learning_rate": 3.701124740823575e-05, "loss": 0.4296, "loss_nan_ranks": 0, "loss_rank_avg": 0.4547976553440094, "step": 1135, "valid_targets_mean": 1833.9, "valid_targets_min": 430 }, { "epoch": 1.8210862619808306, "grad_norm": 0.7259644824294608, "learning_rate": 3.696921340801253e-05, "loss": 0.4415, "loss_nan_ranks": 0, "loss_rank_avg": 0.4141627550125122, "step": 1140, "valid_targets_mean": 3010.8, "valid_targets_min": 1068 }, { "epoch": 1.829073482428115, "grad_norm": 0.6763295168488686, "learning_rate": 3.6926910100978444e-05, "loss": 0.4196, "loss_nan_ranks": 0, "loss_rank_avg": 0.4594937860965729, "step": 1145, "valid_targets_mean": 3553.1, "valid_targets_min": 923 }, { "epoch": 1.8370607028753994, "grad_norm": 0.7698782558795708, "learning_rate": 3.688433815850041e-05, "loss": 0.4235, "loss_nan_ranks": 0, "loss_rank_avg": 0.4128667712211609, "step": 1150, "valid_targets_mean": 2459.1, "valid_targets_min": 923 }, { "epoch": 1.8450479233226837, "grad_norm": 0.958655027556145, "learning_rate": 3.68414982562087e-05, "loss": 0.42, "loss_nan_ranks": 0, "loss_rank_avg": 0.4355429410934448, "step": 1155, "valid_targets_mean": 1698.6, "valid_targets_min": 934 }, { "epoch": 1.8530351437699681, "grad_norm": 0.7513635672673216, "learning_rate": 3.679839107398618e-05, "loss": 0.4176, "loss_nan_ranks": 0, "loss_rank_avg": 0.45161160826683044, "step": 1160, "valid_targets_mean": 3201.0, "valid_targets_min": 1142 }, { "epoch": 1.8610223642172525, "grad_norm": 0.7754798547552919, "learning_rate": 3.6755017295957536e-05, "loss": 0.4402, "loss_nan_ranks": 0, "loss_rank_avg": 0.47688138484954834, "step": 1165, "valid_targets_mean": 2819.0, "valid_targets_min": 1346 }, { "epoch": 1.8690095846645367, "grad_norm": 0.7883052596756699, "learning_rate": 3.67113776104784e-05, "loss": 0.424, "loss_nan_ranks": 0, "loss_rank_avg": 0.4371069669723511, "step": 1170, "valid_targets_mean": 2428.7, "valid_targets_min": 1220 }, { "epoch": 1.876996805111821, "grad_norm": 0.6696947561840654, "learning_rate": 3.6667472710124475e-05, "loss": 0.4416, "loss_nan_ranks": 0, "loss_rank_avg": 0.4349396228790283, "step": 1175, "valid_targets_mean": 3369.9, "valid_targets_min": 1130 }, { "epoch": 1.8849840255591053, "grad_norm": 0.8979562437261165, "learning_rate": 3.6623303291680465e-05, "loss": 0.4152, "loss_nan_ranks": 0, "loss_rank_avg": 0.4136584997177124, "step": 1180, "valid_targets_mean": 2837.1, "valid_targets_min": 747 }, { "epoch": 1.8929712460063897, "grad_norm": 0.6747106007234754, "learning_rate": 3.6578870056129086e-05, "loss": 0.4259, "loss_nan_ranks": 0, "loss_rank_avg": 0.39019960165023804, "step": 1185, "valid_targets_mean": 3195.2, "valid_targets_min": 1219 }, { "epoch": 1.900958466453674, "grad_norm": 0.6216752591895326, "learning_rate": 3.653417370863992e-05, "loss": 0.423, "loss_nan_ranks": 0, "loss_rank_avg": 0.41113990545272827, "step": 1190, "valid_targets_mean": 3552.1, "valid_targets_min": 1157 }, { "epoch": 1.9089456869009584, "grad_norm": 0.6107745396982358, "learning_rate": 3.6489214958558206e-05, "loss": 0.4376, "loss_nan_ranks": 0, "loss_rank_avg": 0.4672267436981201, "step": 1195, "valid_targets_mean": 4152.6, "valid_targets_min": 1233 }, { "epoch": 1.9169329073482428, "grad_norm": 0.6564451674349974, "learning_rate": 3.644399451939358e-05, "loss": 0.4168, "loss_nan_ranks": 0, "loss_rank_avg": 0.39774927496910095, "step": 1200, "valid_targets_mean": 2968.9, "valid_targets_min": 1242 }, { "epoch": 1.9249201277955272, "grad_norm": 0.7771431898711396, "learning_rate": 3.639851310880881e-05, "loss": 0.4622, "loss_nan_ranks": 0, "loss_rank_avg": 0.5002536773681641, "step": 1205, "valid_targets_mean": 2619.9, "valid_targets_min": 1063 }, { "epoch": 1.9329073482428116, "grad_norm": 0.7533507907086239, "learning_rate": 3.635277144860834e-05, "loss": 0.4209, "loss_nan_ranks": 0, "loss_rank_avg": 0.4327402710914612, "step": 1210, "valid_targets_mean": 2435.6, "valid_targets_min": 657 }, { "epoch": 1.9408945686900958, "grad_norm": 0.6838599740152425, "learning_rate": 3.630677026472684e-05, "loss": 0.4354, "loss_nan_ranks": 0, "loss_rank_avg": 0.42494964599609375, "step": 1215, "valid_targets_mean": 2926.8, "valid_targets_min": 860 }, { "epoch": 1.9488817891373802, "grad_norm": 0.7046006759588175, "learning_rate": 3.626051028721773e-05, "loss": 0.4446, "loss_nan_ranks": 0, "loss_rank_avg": 0.4118865132331848, "step": 1220, "valid_targets_mean": 2795.1, "valid_targets_min": 740 }, { "epoch": 1.9568690095846646, "grad_norm": 0.7846235878176491, "learning_rate": 3.621399225024156e-05, "loss": 0.4277, "loss_nan_ranks": 0, "loss_rank_avg": 0.4167096018791199, "step": 1225, "valid_targets_mean": 2380.5, "valid_targets_min": 869 }, { "epoch": 1.9648562300319488, "grad_norm": 0.6729799838262991, "learning_rate": 3.616721689205436e-05, "loss": 0.4147, "loss_nan_ranks": 0, "loss_rank_avg": 0.3980925381183624, "step": 1230, "valid_targets_mean": 2988.2, "valid_targets_min": 1022 }, { "epoch": 1.9728434504792332, "grad_norm": 0.7826130416711469, "learning_rate": 3.612018495499594e-05, "loss": 0.4399, "loss_nan_ranks": 0, "loss_rank_avg": 0.42765045166015625, "step": 1235, "valid_targets_mean": 2436.8, "valid_targets_min": 1103 }, { "epoch": 1.9808306709265175, "grad_norm": 0.662773336531969, "learning_rate": 3.6072897185478074e-05, "loss": 0.4131, "loss_nan_ranks": 0, "loss_rank_avg": 0.43413665890693665, "step": 1240, "valid_targets_mean": 3430.6, "valid_targets_min": 1036 }, { "epoch": 1.988817891373802, "grad_norm": 0.6600752452234055, "learning_rate": 3.6025354333972714e-05, "loss": 0.4079, "loss_nan_ranks": 0, "loss_rank_avg": 0.41904622316360474, "step": 1245, "valid_targets_mean": 3193.2, "valid_targets_min": 1213 }, { "epoch": 1.9968051118210863, "grad_norm": 0.7364834761692404, "learning_rate": 3.597755715500002e-05, "loss": 0.4179, "loss_nan_ranks": 0, "loss_rank_avg": 0.4459013342857361, "step": 1250, "valid_targets_mean": 2883.5, "valid_targets_min": 1221 }, { "epoch": 2.0047923322683707, "grad_norm": 0.6757605852428736, "learning_rate": 3.592950640711642e-05, "loss": 0.3716, "loss_nan_ranks": 0, "loss_rank_avg": 0.3445654511451721, "step": 1255, "valid_targets_mean": 2511.2, "valid_targets_min": 1113 }, { "epoch": 2.012779552715655, "grad_norm": 0.7920973856730682, "learning_rate": 3.5881202852902543e-05, "loss": 0.3774, "loss_nan_ranks": 0, "loss_rank_avg": 0.37682023644447327, "step": 1260, "valid_targets_mean": 2531.8, "valid_targets_min": 803 }, { "epoch": 2.0207667731629395, "grad_norm": 0.7084485618774308, "learning_rate": 3.583264725895117e-05, "loss": 0.4095, "loss_nan_ranks": 0, "loss_rank_avg": 0.40177470445632935, "step": 1265, "valid_targets_mean": 3139.1, "valid_targets_min": 722 }, { "epoch": 2.0287539936102235, "grad_norm": 0.8654181955391402, "learning_rate": 3.5783840395854984e-05, "loss": 0.3706, "loss_nan_ranks": 0, "loss_rank_avg": 0.34793633222579956, "step": 1270, "valid_targets_mean": 2136.0, "valid_targets_min": 784 }, { "epoch": 2.036741214057508, "grad_norm": 0.8291615059541649, "learning_rate": 3.5734783038194446e-05, "loss": 0.4007, "loss_nan_ranks": 0, "loss_rank_avg": 0.46559375524520874, "step": 1275, "valid_targets_mean": 2901.5, "valid_targets_min": 1184 }, { "epoch": 2.0447284345047922, "grad_norm": 0.7323741707579677, "learning_rate": 3.5685475964525396e-05, "loss": 0.3937, "loss_nan_ranks": 0, "loss_rank_avg": 0.37584206461906433, "step": 1280, "valid_targets_mean": 3211.1, "valid_targets_min": 957 }, { "epoch": 2.0527156549520766, "grad_norm": 0.7363883381038177, "learning_rate": 3.5635919957366775e-05, "loss": 0.398, "loss_nan_ranks": 0, "loss_rank_avg": 0.41028380393981934, "step": 1285, "valid_targets_mean": 2933.5, "valid_targets_min": 1190 }, { "epoch": 2.060702875399361, "grad_norm": 0.7315517816142877, "learning_rate": 3.558611580318817e-05, "loss": 0.3996, "loss_nan_ranks": 0, "loss_rank_avg": 0.4214468002319336, "step": 1290, "valid_targets_mean": 3097.8, "valid_targets_min": 1193 }, { "epoch": 2.0686900958466454, "grad_norm": 0.7175863284248388, "learning_rate": 3.5536064292397334e-05, "loss": 0.4115, "loss_nan_ranks": 0, "loss_rank_avg": 0.38822758197784424, "step": 1295, "valid_targets_mean": 3118.4, "valid_targets_min": 1089 }, { "epoch": 2.07667731629393, "grad_norm": 0.6909079310550906, "learning_rate": 3.548576621932766e-05, "loss": 0.4088, "loss_nan_ranks": 0, "loss_rank_avg": 0.37539142370224, "step": 1300, "valid_targets_mean": 3059.8, "valid_targets_min": 1378 }, { "epoch": 2.084664536741214, "grad_norm": 0.8341553393326651, "learning_rate": 3.543522238222555e-05, "loss": 0.3994, "loss_nan_ranks": 0, "loss_rank_avg": 0.39283639192581177, "step": 1305, "valid_targets_mean": 2444.9, "valid_targets_min": 733 }, { "epoch": 2.0926517571884986, "grad_norm": 0.7467643791808043, "learning_rate": 3.538443358323777e-05, "loss": 0.3992, "loss_nan_ranks": 0, "loss_rank_avg": 0.4031786322593689, "step": 1310, "valid_targets_mean": 3537.6, "valid_targets_min": 671 }, { "epoch": 2.1006389776357826, "grad_norm": 0.7427721777091812, "learning_rate": 3.5333400628398696e-05, "loss": 0.3946, "loss_nan_ranks": 0, "loss_rank_avg": 0.35075265169143677, "step": 1315, "valid_targets_mean": 3124.6, "valid_targets_min": 1320 }, { "epoch": 2.108626198083067, "grad_norm": 0.723617897881399, "learning_rate": 3.5282124327617556e-05, "loss": 0.3989, "loss_nan_ranks": 0, "loss_rank_avg": 0.4392593502998352, "step": 1320, "valid_targets_mean": 3268.4, "valid_targets_min": 614 }, { "epoch": 2.1166134185303513, "grad_norm": 0.788438144653811, "learning_rate": 3.5230605494665535e-05, "loss": 0.3774, "loss_nan_ranks": 0, "loss_rank_avg": 0.3712785840034485, "step": 1325, "valid_targets_mean": 2644.2, "valid_targets_min": 463 }, { "epoch": 2.1246006389776357, "grad_norm": 0.8022216072730797, "learning_rate": 3.517884494716289e-05, "loss": 0.4069, "loss_nan_ranks": 0, "loss_rank_avg": 0.4960511028766632, "step": 1330, "valid_targets_mean": 3651.8, "valid_targets_min": 836 }, { "epoch": 2.13258785942492, "grad_norm": 0.6925487153270358, "learning_rate": 3.512684350656596e-05, "loss": 0.375, "loss_nan_ranks": 0, "loss_rank_avg": 0.37404677271842957, "step": 1335, "valid_targets_mean": 3246.2, "valid_targets_min": 1109 }, { "epoch": 2.1405750798722045, "grad_norm": 0.8170016680451098, "learning_rate": 3.507460199815414e-05, "loss": 0.407, "loss_nan_ranks": 0, "loss_rank_avg": 0.3906192183494568, "step": 1340, "valid_targets_mean": 2524.4, "valid_targets_min": 1046 }, { "epoch": 2.148562300319489, "grad_norm": 0.8211212957436506, "learning_rate": 3.5022121251016786e-05, "loss": 0.3728, "loss_nan_ranks": 0, "loss_rank_avg": 0.36858224868774414, "step": 1345, "valid_targets_mean": 2289.2, "valid_targets_min": 1063 }, { "epoch": 2.1565495207667733, "grad_norm": 0.7865399000617666, "learning_rate": 3.4969402098040015e-05, "loss": 0.3767, "loss_nan_ranks": 0, "loss_rank_avg": 0.38670629262924194, "step": 1350, "valid_targets_mean": 2472.7, "valid_targets_min": 723 }, { "epoch": 2.1645367412140577, "grad_norm": 0.6781855298456426, "learning_rate": 3.491644537589356e-05, "loss": 0.393, "loss_nan_ranks": 0, "loss_rank_avg": 0.42566969990730286, "step": 1355, "valid_targets_mean": 3834.5, "valid_targets_min": 1217 }, { "epoch": 2.1725239616613417, "grad_norm": 0.7316618715739758, "learning_rate": 3.486325192501743e-05, "loss": 0.3876, "loss_nan_ranks": 0, "loss_rank_avg": 0.34030255675315857, "step": 1360, "valid_targets_mean": 2474.6, "valid_targets_min": 851 }, { "epoch": 2.180511182108626, "grad_norm": 0.780177709972403, "learning_rate": 3.480982258960859e-05, "loss": 0.3992, "loss_nan_ranks": 0, "loss_rank_avg": 0.4071018695831299, "step": 1365, "valid_targets_mean": 2566.9, "valid_targets_min": 1108 }, { "epoch": 2.1884984025559104, "grad_norm": 0.7401670928315446, "learning_rate": 3.47561582176076e-05, "loss": 0.3765, "loss_nan_ranks": 0, "loss_rank_avg": 0.34878408908843994, "step": 1370, "valid_targets_mean": 2431.8, "valid_targets_min": 732 }, { "epoch": 2.196485623003195, "grad_norm": 0.8285074677263214, "learning_rate": 3.470225966068507e-05, "loss": 0.3942, "loss_nan_ranks": 0, "loss_rank_avg": 0.38772809505462646, "step": 1375, "valid_targets_mean": 2775.9, "valid_targets_min": 1309 }, { "epoch": 2.2044728434504792, "grad_norm": 0.6951035757973937, "learning_rate": 3.464812777422826e-05, "loss": 0.3741, "loss_nan_ranks": 0, "loss_rank_avg": 0.33720552921295166, "step": 1380, "valid_targets_mean": 2747.8, "valid_targets_min": 1107 }, { "epoch": 2.2124600638977636, "grad_norm": 0.6933666013886233, "learning_rate": 3.459376341732741e-05, "loss": 0.3755, "loss_nan_ranks": 0, "loss_rank_avg": 0.3822613060474396, "step": 1385, "valid_targets_mean": 3665.7, "valid_targets_min": 1010 }, { "epoch": 2.220447284345048, "grad_norm": 0.844133409567668, "learning_rate": 3.453916745276213e-05, "loss": 0.3849, "loss_nan_ranks": 0, "loss_rank_avg": 0.40487003326416016, "step": 1390, "valid_targets_mean": 2339.1, "valid_targets_min": 1010 }, { "epoch": 2.2284345047923324, "grad_norm": 0.7635668779470315, "learning_rate": 3.4484340746987745e-05, "loss": 0.3745, "loss_nan_ranks": 0, "loss_rank_avg": 0.40360257029533386, "step": 1395, "valid_targets_mean": 3000.1, "valid_targets_min": 617 }, { "epoch": 2.236421725239617, "grad_norm": 0.8939714206815781, "learning_rate": 3.4429284170121494e-05, "loss": 0.3828, "loss_nan_ranks": 0, "loss_rank_avg": 0.39973244071006775, "step": 1400, "valid_targets_mean": 2310.8, "valid_targets_min": 1108 }, { "epoch": 2.244408945686901, "grad_norm": 0.7965029242154419, "learning_rate": 3.4373998595928764e-05, "loss": 0.3769, "loss_nan_ranks": 0, "loss_rank_avg": 0.35486793518066406, "step": 1405, "valid_targets_mean": 2493.4, "valid_targets_min": 1100 }, { "epoch": 2.252396166134185, "grad_norm": 0.8968879107376081, "learning_rate": 3.431848490180919e-05, "loss": 0.385, "loss_nan_ranks": 0, "loss_rank_avg": 0.3879396319389343, "step": 1410, "valid_targets_mean": 1842.8, "valid_targets_min": 641 }, { "epoch": 2.2603833865814695, "grad_norm": 0.6571979135953678, "learning_rate": 3.4262743968782736e-05, "loss": 0.3985, "loss_nan_ranks": 0, "loss_rank_avg": 0.3954229950904846, "step": 1415, "valid_targets_mean": 3515.6, "valid_targets_min": 1404 }, { "epoch": 2.268370607028754, "grad_norm": 0.7277635785906069, "learning_rate": 3.4206776681475737e-05, "loss": 0.366, "loss_nan_ranks": 0, "loss_rank_avg": 0.36266952753067017, "step": 1420, "valid_targets_mean": 2741.3, "valid_targets_min": 1230 }, { "epoch": 2.2763578274760383, "grad_norm": 0.7907521602479675, "learning_rate": 3.415058392810682e-05, "loss": 0.4066, "loss_nan_ranks": 0, "loss_rank_avg": 0.4322172999382019, "step": 1425, "valid_targets_mean": 2997.9, "valid_targets_min": 1321 }, { "epoch": 2.2843450479233227, "grad_norm": 0.8176547611925157, "learning_rate": 3.409416660047286e-05, "loss": 0.3977, "loss_nan_ranks": 0, "loss_rank_avg": 0.3814924955368042, "step": 1430, "valid_targets_mean": 2555.4, "valid_targets_min": 1205 }, { "epoch": 2.292332268370607, "grad_norm": 0.822452014818755, "learning_rate": 3.403752559393477e-05, "loss": 0.3974, "loss_nan_ranks": 0, "loss_rank_avg": 0.4026378393173218, "step": 1435, "valid_targets_mean": 2191.9, "valid_targets_min": 958 }, { "epoch": 2.3003194888178915, "grad_norm": 0.8046031130809067, "learning_rate": 3.398066180740332e-05, "loss": 0.3808, "loss_nan_ranks": 0, "loss_rank_avg": 0.3843550384044647, "step": 1440, "valid_targets_mean": 2522.8, "valid_targets_min": 1101 }, { "epoch": 2.308306709265176, "grad_norm": 0.7274042476803793, "learning_rate": 3.39235761433249e-05, "loss": 0.3742, "loss_nan_ranks": 0, "loss_rank_avg": 0.3560572564601898, "step": 1445, "valid_targets_mean": 2997.4, "valid_targets_min": 970 }, { "epoch": 2.31629392971246, "grad_norm": 0.7942573376789508, "learning_rate": 3.386626950766713e-05, "loss": 0.408, "loss_nan_ranks": 0, "loss_rank_avg": 0.4524349570274353, "step": 1450, "valid_targets_mean": 2827.2, "valid_targets_min": 847 }, { "epoch": 2.3242811501597442, "grad_norm": 0.7144054959460292, "learning_rate": 3.380874280990454e-05, "loss": 0.3819, "loss_nan_ranks": 0, "loss_rank_avg": 0.43069761991500854, "step": 1455, "valid_targets_mean": 2820.1, "valid_targets_min": 815 }, { "epoch": 2.3322683706070286, "grad_norm": 0.7615884351566543, "learning_rate": 3.37509969630041e-05, "loss": 0.3902, "loss_nan_ranks": 0, "loss_rank_avg": 0.3636676073074341, "step": 1460, "valid_targets_mean": 2552.9, "valid_targets_min": 1197 }, { "epoch": 2.340255591054313, "grad_norm": 0.7256710670235811, "learning_rate": 3.369303288341078e-05, "loss": 0.3884, "loss_nan_ranks": 0, "loss_rank_avg": 0.4177743196487427, "step": 1465, "valid_targets_mean": 3103.6, "valid_targets_min": 1031 }, { "epoch": 2.3482428115015974, "grad_norm": 0.7877476651897006, "learning_rate": 3.363485149103292e-05, "loss": 0.3647, "loss_nan_ranks": 0, "loss_rank_avg": 0.35964199900627136, "step": 1470, "valid_targets_mean": 2302.8, "valid_targets_min": 1014 }, { "epoch": 2.356230031948882, "grad_norm": 0.7861951999481999, "learning_rate": 3.357645370922772e-05, "loss": 0.3741, "loss_nan_ranks": 0, "loss_rank_avg": 0.3646368682384491, "step": 1475, "valid_targets_mean": 2470.4, "valid_targets_min": 892 }, { "epoch": 2.364217252396166, "grad_norm": 0.8067034022369052, "learning_rate": 3.351784046478655e-05, "loss": 0.3799, "loss_nan_ranks": 0, "loss_rank_avg": 0.37805867195129395, "step": 1480, "valid_targets_mean": 2684.4, "valid_targets_min": 903 }, { "epoch": 2.3722044728434506, "grad_norm": 0.6891254864220063, "learning_rate": 3.345901268792022e-05, "loss": 0.3801, "loss_nan_ranks": 0, "loss_rank_avg": 0.34303462505340576, "step": 1485, "valid_targets_mean": 2823.6, "valid_targets_min": 1036 }, { "epoch": 2.380191693290735, "grad_norm": 0.6714839482371276, "learning_rate": 3.3399971312244255e-05, "loss": 0.3887, "loss_nan_ranks": 0, "loss_rank_avg": 0.3872262239456177, "step": 1490, "valid_targets_mean": 3700.4, "valid_targets_min": 1165 }, { "epoch": 2.3881789137380194, "grad_norm": 0.7565316440719079, "learning_rate": 3.334071727476406e-05, "loss": 0.4195, "loss_nan_ranks": 0, "loss_rank_avg": 0.4261237680912018, "step": 1495, "valid_targets_mean": 2838.0, "valid_targets_min": 1114 }, { "epoch": 2.3961661341853033, "grad_norm": 0.8114152537250999, "learning_rate": 3.3281251515860035e-05, "loss": 0.395, "loss_nan_ranks": 0, "loss_rank_avg": 0.45717281103134155, "step": 1500, "valid_targets_mean": 2492.4, "valid_targets_min": 951 }, { "epoch": 2.4041533546325877, "grad_norm": 0.6856900658234324, "learning_rate": 3.3221574979272676e-05, "loss": 0.3724, "loss_nan_ranks": 0, "loss_rank_avg": 0.39079922437667847, "step": 1505, "valid_targets_mean": 3183.8, "valid_targets_min": 1362 }, { "epoch": 2.412140575079872, "grad_norm": 0.7703186250399462, "learning_rate": 3.316168861208759e-05, "loss": 0.3763, "loss_nan_ranks": 0, "loss_rank_avg": 0.39759039878845215, "step": 1510, "valid_targets_mean": 2748.0, "valid_targets_min": 1040 }, { "epoch": 2.4201277955271565, "grad_norm": 0.8048967002212241, "learning_rate": 3.310159336472047e-05, "loss": 0.3875, "loss_nan_ranks": 0, "loss_rank_avg": 0.41734617948532104, "step": 1515, "valid_targets_mean": 2613.1, "valid_targets_min": 1191 }, { "epoch": 2.428115015974441, "grad_norm": 0.8314543068705672, "learning_rate": 3.304129019090198e-05, "loss": 0.3908, "loss_nan_ranks": 0, "loss_rank_avg": 0.41389578580856323, "step": 1520, "valid_targets_mean": 2517.2, "valid_targets_min": 891 }, { "epoch": 2.4361022364217253, "grad_norm": 0.6926011452341558, "learning_rate": 3.298078004766267e-05, "loss": 0.3905, "loss_nan_ranks": 0, "loss_rank_avg": 0.37540772557258606, "step": 1525, "valid_targets_mean": 2965.9, "valid_targets_min": 864 }, { "epoch": 2.4440894568690097, "grad_norm": 0.8162573999638001, "learning_rate": 3.292006389531774e-05, "loss": 0.3909, "loss_nan_ranks": 0, "loss_rank_avg": 0.4161120355129242, "step": 1530, "valid_targets_mean": 2317.8, "valid_targets_min": 848 }, { "epoch": 2.452076677316294, "grad_norm": 0.8074891222439363, "learning_rate": 3.2859142697451835e-05, "loss": 0.3772, "loss_nan_ranks": 0, "loss_rank_avg": 0.37793317437171936, "step": 1535, "valid_targets_mean": 2300.7, "valid_targets_min": 944 }, { "epoch": 2.460063897763578, "grad_norm": 0.6859073178237398, "learning_rate": 3.279801742090372e-05, "loss": 0.3817, "loss_nan_ranks": 0, "loss_rank_avg": 0.3530294895172119, "step": 1540, "valid_targets_mean": 2976.5, "valid_targets_min": 1095 }, { "epoch": 2.4680511182108624, "grad_norm": 0.7497080904501119, "learning_rate": 3.2736689035750975e-05, "loss": 0.4002, "loss_nan_ranks": 0, "loss_rank_avg": 0.38208550214767456, "step": 1545, "valid_targets_mean": 2632.4, "valid_targets_min": 1187 }, { "epoch": 2.476038338658147, "grad_norm": 0.7658848802289646, "learning_rate": 3.2675158515294554e-05, "loss": 0.3628, "loss_nan_ranks": 0, "loss_rank_avg": 0.34464403986930847, "step": 1550, "valid_targets_mean": 2718.4, "valid_targets_min": 1097 }, { "epoch": 2.484025559105431, "grad_norm": 0.7295384665652668, "learning_rate": 3.2613426836043386e-05, "loss": 0.3898, "loss_nan_ranks": 0, "loss_rank_avg": 0.40557998418807983, "step": 1555, "valid_targets_mean": 2924.6, "valid_targets_min": 1126 }, { "epoch": 2.4920127795527156, "grad_norm": 0.7865606199528011, "learning_rate": 3.2551494977698844e-05, "loss": 0.3832, "loss_nan_ranks": 0, "loss_rank_avg": 0.3619915246963501, "step": 1560, "valid_targets_mean": 2832.5, "valid_targets_min": 1204 }, { "epoch": 2.5, "grad_norm": 0.7442594029658458, "learning_rate": 3.248936392313921e-05, "loss": 0.3836, "loss_nan_ranks": 0, "loss_rank_avg": 0.3640132546424866, "step": 1565, "valid_targets_mean": 2665.8, "valid_targets_min": 1110 }, { "epoch": 2.5079872204472844, "grad_norm": 0.7749328364765504, "learning_rate": 3.2427034658404056e-05, "loss": 0.374, "loss_nan_ranks": 0, "loss_rank_avg": 0.38298264145851135, "step": 1570, "valid_targets_mean": 2361.2, "valid_targets_min": 895 }, { "epoch": 2.515974440894569, "grad_norm": 0.70714901394141, "learning_rate": 3.236450817267863e-05, "loss": 0.3994, "loss_nan_ranks": 0, "loss_rank_avg": 0.42880868911743164, "step": 1575, "valid_targets_mean": 3301.9, "valid_targets_min": 1134 }, { "epoch": 2.523961661341853, "grad_norm": 0.711423892950476, "learning_rate": 3.230178545827814e-05, "loss": 0.369, "loss_nan_ranks": 0, "loss_rank_avg": 0.3938032388687134, "step": 1580, "valid_targets_mean": 3337.3, "valid_targets_min": 1438 }, { "epoch": 2.5319488817891376, "grad_norm": 0.8058935995764296, "learning_rate": 3.223886751063201e-05, "loss": 0.3766, "loss_nan_ranks": 0, "loss_rank_avg": 0.3802354037761688, "step": 1585, "valid_targets_mean": 2979.3, "valid_targets_min": 944 }, { "epoch": 2.539936102236422, "grad_norm": 0.7118888640775775, "learning_rate": 3.2175755328268054e-05, "loss": 0.374, "loss_nan_ranks": 0, "loss_rank_avg": 0.3789049983024597, "step": 1590, "valid_targets_mean": 2948.6, "valid_targets_min": 1146 }, { "epoch": 2.547923322683706, "grad_norm": 0.7725216659459194, "learning_rate": 3.2112449912796675e-05, "loss": 0.379, "loss_nan_ranks": 0, "loss_rank_avg": 0.4516969919204712, "step": 1595, "valid_targets_mean": 2919.0, "valid_targets_min": 1147 }, { "epoch": 2.5559105431309903, "grad_norm": 0.7527073447886554, "learning_rate": 3.204895226889494e-05, "loss": 0.3986, "loss_nan_ranks": 0, "loss_rank_avg": 0.38789334893226624, "step": 1600, "valid_targets_mean": 2791.0, "valid_targets_min": 1026 }, { "epoch": 2.5638977635782747, "grad_norm": 0.6299428402315908, "learning_rate": 3.1985263404290634e-05, "loss": 0.3749, "loss_nan_ranks": 0, "loss_rank_avg": 0.327023446559906, "step": 1605, "valid_targets_mean": 3438.7, "valid_targets_min": 992 }, { "epoch": 2.571884984025559, "grad_norm": 0.9685044209773557, "learning_rate": 3.19213843297463e-05, "loss": 0.3827, "loss_nan_ranks": 0, "loss_rank_avg": 0.4428490102291107, "step": 1610, "valid_targets_mean": 2068.7, "valid_targets_min": 822 }, { "epoch": 2.5798722044728435, "grad_norm": 1.0295969468634165, "learning_rate": 3.1857316059043144e-05, "loss": 0.3998, "loss_nan_ranks": 0, "loss_rank_avg": 0.4081227779388428, "step": 1615, "valid_targets_mean": 2919.2, "valid_targets_min": 1251 }, { "epoch": 2.587859424920128, "grad_norm": 1.6563488775796265, "learning_rate": 3.1793059608964986e-05, "loss": 0.3901, "loss_nan_ranks": 0, "loss_rank_avg": 0.4232986271381378, "step": 1620, "valid_targets_mean": 3450.8, "valid_targets_min": 1362 }, { "epoch": 2.5958466453674123, "grad_norm": 0.9155041657894906, "learning_rate": 3.172861599928212e-05, "loss": 0.4202, "loss_nan_ranks": 0, "loss_rank_avg": 0.4846240282058716, "step": 1625, "valid_targets_mean": 2145.2, "valid_targets_min": 859 }, { "epoch": 2.6038338658146962, "grad_norm": 0.8120340384610485, "learning_rate": 3.166398625273512e-05, "loss": 0.3737, "loss_nan_ranks": 0, "loss_rank_avg": 0.4154743552207947, "step": 1630, "valid_targets_mean": 2617.1, "valid_targets_min": 1098 }, { "epoch": 2.6118210862619806, "grad_norm": 0.849225033810179, "learning_rate": 3.15991713950186e-05, "loss": 0.4075, "loss_nan_ranks": 0, "loss_rank_avg": 0.4135674238204956, "step": 1635, "valid_targets_mean": 2334.0, "valid_targets_min": 1142 }, { "epoch": 2.619808306709265, "grad_norm": 0.8157392444586056, "learning_rate": 3.153417245476495e-05, "loss": 0.3922, "loss_nan_ranks": 0, "loss_rank_avg": 0.39707255363464355, "step": 1640, "valid_targets_mean": 2494.3, "valid_targets_min": 870 }, { "epoch": 2.6277955271565494, "grad_norm": 0.6334451346931158, "learning_rate": 3.146899046352804e-05, "loss": 0.3636, "loss_nan_ranks": 0, "loss_rank_avg": 0.35084402561187744, "step": 1645, "valid_targets_mean": 3740.7, "valid_targets_min": 1049 }, { "epoch": 2.635782747603834, "grad_norm": 0.7762569328884342, "learning_rate": 3.140362645576676e-05, "loss": 0.3856, "loss_nan_ranks": 0, "loss_rank_avg": 0.37259939312934875, "step": 1650, "valid_targets_mean": 2511.3, "valid_targets_min": 1421 }, { "epoch": 2.643769968051118, "grad_norm": 0.8186237289070231, "learning_rate": 3.133808146882871e-05, "loss": 0.3835, "loss_nan_ranks": 0, "loss_rank_avg": 0.4084286093711853, "step": 1655, "valid_targets_mean": 2329.6, "valid_targets_min": 778 }, { "epoch": 2.6517571884984026, "grad_norm": 0.7125590887289628, "learning_rate": 3.1272356542933654e-05, "loss": 0.3972, "loss_nan_ranks": 0, "loss_rank_avg": 0.3703764081001282, "step": 1660, "valid_targets_mean": 2906.2, "valid_targets_min": 1050 }, { "epoch": 2.659744408945687, "grad_norm": 0.731708037956391, "learning_rate": 3.120645272115707e-05, "loss": 0.3943, "loss_nan_ranks": 0, "loss_rank_avg": 0.4325590431690216, "step": 1665, "valid_targets_mean": 2983.2, "valid_targets_min": 1067 }, { "epoch": 2.6677316293929714, "grad_norm": 0.8035997324197389, "learning_rate": 3.114037104941355e-05, "loss": 0.4001, "loss_nan_ranks": 0, "loss_rank_avg": 0.38742709159851074, "step": 1670, "valid_targets_mean": 2473.9, "valid_targets_min": 1059 }, { "epoch": 2.6757188498402558, "grad_norm": 0.6844167171779404, "learning_rate": 3.1074112576440236e-05, "loss": 0.4075, "loss_nan_ranks": 0, "loss_rank_avg": 0.368588924407959, "step": 1675, "valid_targets_mean": 2882.1, "valid_targets_min": 1749 }, { "epoch": 2.68370607028754, "grad_norm": 0.6163401323400775, "learning_rate": 3.1007678353780154e-05, "loss": 0.3491, "loss_nan_ranks": 0, "loss_rank_avg": 0.32983940839767456, "step": 1680, "valid_targets_mean": 3723.4, "valid_targets_min": 878 }, { "epoch": 2.6916932907348246, "grad_norm": 0.6365023740994403, "learning_rate": 3.094106943576553e-05, "loss": 0.3918, "loss_nan_ranks": 0, "loss_rank_avg": 0.3705146908760071, "step": 1685, "valid_targets_mean": 3389.1, "valid_targets_min": 948 }, { "epoch": 2.6996805111821085, "grad_norm": 0.7475402505642063, "learning_rate": 3.087428687950108e-05, "loss": 0.3958, "loss_nan_ranks": 0, "loss_rank_avg": 0.43426042795181274, "step": 1690, "valid_targets_mean": 2593.7, "valid_targets_min": 1178 }, { "epoch": 2.707667731629393, "grad_norm": 0.7686145007215354, "learning_rate": 3.080733174484719e-05, "loss": 0.3871, "loss_nan_ranks": 0, "loss_rank_avg": 0.4154050350189209, "step": 1695, "valid_targets_mean": 2665.8, "valid_targets_min": 1084 }, { "epoch": 2.7156549520766773, "grad_norm": 0.8563812199578894, "learning_rate": 3.074020509440313e-05, "loss": 0.3829, "loss_nan_ranks": 0, "loss_rank_avg": 0.3860825300216675, "step": 1700, "valid_targets_mean": 2129.1, "valid_targets_min": 879 }, { "epoch": 2.7236421725239617, "grad_norm": 0.75128835829166, "learning_rate": 3.0672907993490183e-05, "loss": 0.3772, "loss_nan_ranks": 0, "loss_rank_avg": 0.4196065366268158, "step": 1705, "valid_targets_mean": 2710.2, "valid_targets_min": 1105 }, { "epoch": 2.731629392971246, "grad_norm": 0.7438973966543126, "learning_rate": 3.060544151013473e-05, "loss": 0.383, "loss_nan_ranks": 0, "loss_rank_avg": 0.38597315549850464, "step": 1710, "valid_targets_mean": 2584.2, "valid_targets_min": 737 }, { "epoch": 2.7396166134185305, "grad_norm": 0.7183303748877556, "learning_rate": 3.053780671505132e-05, "loss": 0.3738, "loss_nan_ranks": 0, "loss_rank_avg": 0.3752416968345642, "step": 1715, "valid_targets_mean": 2927.7, "valid_targets_min": 1360 }, { "epoch": 2.747603833865815, "grad_norm": 0.5587721821728815, "learning_rate": 3.047000468162563e-05, "loss": 0.3964, "loss_nan_ranks": 0, "loss_rank_avg": 0.36852502822875977, "step": 1720, "valid_targets_mean": 4415.8, "valid_targets_min": 848 }, { "epoch": 2.755591054313099, "grad_norm": 0.7912750974825519, "learning_rate": 3.0402036485897496e-05, "loss": 0.4093, "loss_nan_ranks": 0, "loss_rank_avg": 0.3481713533401489, "step": 1725, "valid_targets_mean": 2150.6, "valid_targets_min": 573 }, { "epoch": 2.763578274760383, "grad_norm": 0.7655378909490561, "learning_rate": 3.0333903206543786e-05, "loss": 0.4075, "loss_nan_ranks": 0, "loss_rank_avg": 0.4195517897605896, "step": 1730, "valid_targets_mean": 2745.0, "valid_targets_min": 1068 }, { "epoch": 2.7715654952076676, "grad_norm": 0.7429503561714476, "learning_rate": 3.02656059248613e-05, "loss": 0.3752, "loss_nan_ranks": 0, "loss_rank_avg": 0.38314008712768555, "step": 1735, "valid_targets_mean": 2676.4, "valid_targets_min": 1083 }, { "epoch": 2.779552715654952, "grad_norm": 0.6847140253857491, "learning_rate": 3.0197145724749615e-05, "loss": 0.3835, "loss_nan_ranks": 0, "loss_rank_avg": 0.35597318410873413, "step": 1740, "valid_targets_mean": 2626.1, "valid_targets_min": 907 }, { "epoch": 2.7875399361022364, "grad_norm": 0.7618474409520442, "learning_rate": 3.0128523692693865e-05, "loss": 0.3888, "loss_nan_ranks": 0, "loss_rank_avg": 0.353215754032135, "step": 1745, "valid_targets_mean": 2811.6, "valid_targets_min": 857 }, { "epoch": 2.7955271565495208, "grad_norm": 0.6759274934133018, "learning_rate": 3.005974091774751e-05, "loss": 0.397, "loss_nan_ranks": 0, "loss_rank_avg": 0.39466995000839233, "step": 1750, "valid_targets_mean": 3399.4, "valid_targets_min": 901 }, { "epoch": 2.803514376996805, "grad_norm": 0.6799590705617894, "learning_rate": 2.999079849151505e-05, "loss": 0.399, "loss_nan_ranks": 0, "loss_rank_avg": 0.43251582980155945, "step": 1755, "valid_targets_mean": 3441.4, "valid_targets_min": 1312 }, { "epoch": 2.8115015974440896, "grad_norm": 0.6610130288469123, "learning_rate": 2.992169750813471e-05, "loss": 0.3889, "loss_nan_ranks": 0, "loss_rank_avg": 0.39097756147384644, "step": 1760, "valid_targets_mean": 3311.8, "valid_targets_min": 1011 }, { "epoch": 2.819488817891374, "grad_norm": 0.7671727157019489, "learning_rate": 2.985243906426106e-05, "loss": 0.3821, "loss_nan_ranks": 0, "loss_rank_avg": 0.40966904163360596, "step": 1765, "valid_targets_mean": 2718.1, "valid_targets_min": 995 }, { "epoch": 2.8274760383386583, "grad_norm": 0.6650031120553905, "learning_rate": 2.9783024259047617e-05, "loss": 0.3815, "loss_nan_ranks": 0, "loss_rank_avg": 0.425026535987854, "step": 1770, "valid_targets_mean": 3584.0, "valid_targets_min": 1194 }, { "epoch": 2.8354632587859427, "grad_norm": 0.8517674686517855, "learning_rate": 2.971345419412941e-05, "loss": 0.3923, "loss_nan_ranks": 0, "loss_rank_avg": 0.36157435178756714, "step": 1775, "valid_targets_mean": 2832.7, "valid_targets_min": 1040 }, { "epoch": 2.8434504792332267, "grad_norm": 0.6566982803729622, "learning_rate": 2.964372997360548e-05, "loss": 0.388, "loss_nan_ranks": 0, "loss_rank_avg": 0.33444786071777344, "step": 1780, "valid_targets_mean": 3122.9, "valid_targets_min": 768 }, { "epoch": 2.851437699680511, "grad_norm": 0.7060484582940764, "learning_rate": 2.957385270402137e-05, "loss": 0.3677, "loss_nan_ranks": 0, "loss_rank_avg": 0.37771087884902954, "step": 1785, "valid_targets_mean": 3694.4, "valid_targets_min": 1073 }, { "epoch": 2.8594249201277955, "grad_norm": 0.7198209681558054, "learning_rate": 2.9503823494351565e-05, "loss": 0.3719, "loss_nan_ranks": 0, "loss_rank_avg": 0.3737558126449585, "step": 1790, "valid_targets_mean": 3059.6, "valid_targets_min": 1135 }, { "epoch": 2.86741214057508, "grad_norm": 0.7055818423441181, "learning_rate": 2.9433643455981874e-05, "loss": 0.3988, "loss_nan_ranks": 0, "loss_rank_avg": 0.39843347668647766, "step": 1795, "valid_targets_mean": 3255.6, "valid_targets_min": 927 }, { "epoch": 2.8753993610223643, "grad_norm": 0.7843389401141818, "learning_rate": 2.9363313702691827e-05, "loss": 0.3622, "loss_nan_ranks": 0, "loss_rank_avg": 0.41534000635147095, "step": 1800, "valid_targets_mean": 2498.8, "valid_targets_min": 1019 }, { "epoch": 2.8833865814696487, "grad_norm": 0.6724104574364067, "learning_rate": 2.9292835350636957e-05, "loss": 0.4022, "loss_nan_ranks": 0, "loss_rank_avg": 0.38030463457107544, "step": 1805, "valid_targets_mean": 3430.4, "valid_targets_min": 1112 }, { "epoch": 2.891373801916933, "grad_norm": 0.5916718834917873, "learning_rate": 2.922220951833111e-05, "loss": 0.3808, "loss_nan_ranks": 0, "loss_rank_avg": 0.31356799602508545, "step": 1810, "valid_targets_mean": 3772.6, "valid_targets_min": 951 }, { "epoch": 2.899361022364217, "grad_norm": 0.7654937514668824, "learning_rate": 2.9151437326628706e-05, "loss": 0.3866, "loss_nan_ranks": 0, "loss_rank_avg": 0.3887610137462616, "step": 1815, "valid_targets_mean": 2553.3, "valid_targets_min": 936 }, { "epoch": 2.9073482428115014, "grad_norm": 0.7480115771607395, "learning_rate": 2.908051989870692e-05, "loss": 0.3894, "loss_nan_ranks": 0, "loss_rank_avg": 0.3808180093765259, "step": 1820, "valid_targets_mean": 3117.8, "valid_targets_min": 791 }, { "epoch": 2.915335463258786, "grad_norm": 0.7187356737229668, "learning_rate": 2.9009458360047867e-05, "loss": 0.3829, "loss_nan_ranks": 0, "loss_rank_avg": 0.4151441752910614, "step": 1825, "valid_targets_mean": 2946.7, "valid_targets_min": 1304 }, { "epoch": 2.92332268370607, "grad_norm": 0.6464747283506714, "learning_rate": 2.8938253838420762e-05, "loss": 0.3949, "loss_nan_ranks": 0, "loss_rank_avg": 0.39368531107902527, "step": 1830, "valid_targets_mean": 3852.4, "valid_targets_min": 875 }, { "epoch": 2.9313099041533546, "grad_norm": 0.7244350087292859, "learning_rate": 2.8866907463864006e-05, "loss": 0.378, "loss_nan_ranks": 0, "loss_rank_avg": 0.3935213088989258, "step": 1835, "valid_targets_mean": 2723.6, "valid_targets_min": 988 }, { "epoch": 2.939297124600639, "grad_norm": 0.6851586503030473, "learning_rate": 2.8795420368667225e-05, "loss": 0.3717, "loss_nan_ranks": 0, "loss_rank_avg": 0.41738811135292053, "step": 1840, "valid_targets_mean": 3267.9, "valid_targets_min": 924 }, { "epoch": 2.9472843450479234, "grad_norm": 0.6915563143903232, "learning_rate": 2.8723793687353354e-05, "loss": 0.3893, "loss_nan_ranks": 0, "loss_rank_avg": 0.38308918476104736, "step": 1845, "valid_targets_mean": 3031.2, "valid_targets_min": 974 }, { "epoch": 2.9552715654952078, "grad_norm": 0.6819090921664839, "learning_rate": 2.8652028556660593e-05, "loss": 0.4031, "loss_nan_ranks": 0, "loss_rank_avg": 0.36406490206718445, "step": 1850, "valid_targets_mean": 3324.1, "valid_targets_min": 1575 }, { "epoch": 2.963258785942492, "grad_norm": 0.7719683466940759, "learning_rate": 2.8580126115524373e-05, "loss": 0.3996, "loss_nan_ranks": 0, "loss_rank_avg": 0.38270652294158936, "step": 1855, "valid_targets_mean": 2710.7, "valid_targets_min": 1122 }, { "epoch": 2.9712460063897765, "grad_norm": 0.7584408057005778, "learning_rate": 2.8508087505059302e-05, "loss": 0.3891, "loss_nan_ranks": 0, "loss_rank_avg": 0.40344762802124023, "step": 1860, "valid_targets_mean": 2602.8, "valid_targets_min": 1057 }, { "epoch": 2.979233226837061, "grad_norm": 0.8095860463062092, "learning_rate": 2.843591386854102e-05, "loss": 0.3794, "loss_nan_ranks": 0, "loss_rank_avg": 0.3777475953102112, "step": 1865, "valid_targets_mean": 2237.3, "valid_targets_min": 1016 }, { "epoch": 2.987220447284345, "grad_norm": 0.8139871848333652, "learning_rate": 2.8363606351388068e-05, "loss": 0.4007, "loss_nan_ranks": 0, "loss_rank_avg": 0.3748500943183899, "step": 1870, "valid_targets_mean": 2634.4, "valid_targets_min": 981 }, { "epoch": 2.9952076677316293, "grad_norm": 0.6031621618600853, "learning_rate": 2.829116610114375e-05, "loss": 0.3663, "loss_nan_ranks": 0, "loss_rank_avg": 0.309096097946167, "step": 1875, "valid_targets_mean": 3321.8, "valid_targets_min": 918 }, { "epoch": 3.0031948881789137, "grad_norm": 0.7010853523494205, "learning_rate": 2.821859426745786e-05, "loss": 0.377, "loss_nan_ranks": 0, "loss_rank_avg": 0.3830505609512329, "step": 1880, "valid_targets_mean": 3283.0, "valid_targets_min": 1103 }, { "epoch": 3.011182108626198, "grad_norm": 0.7997009121695763, "learning_rate": 2.8145892002068454e-05, "loss": 0.3306, "loss_nan_ranks": 0, "loss_rank_avg": 0.33155494928359985, "step": 1885, "valid_targets_mean": 2721.9, "valid_targets_min": 1253 }, { "epoch": 3.0191693290734825, "grad_norm": 0.880787133238318, "learning_rate": 2.8073060458783606e-05, "loss": 0.3252, "loss_nan_ranks": 0, "loss_rank_avg": 0.31442296504974365, "step": 1890, "valid_targets_mean": 2083.6, "valid_targets_min": 1019 }, { "epoch": 3.027156549520767, "grad_norm": 0.851278068434791, "learning_rate": 2.8000100793463056e-05, "loss": 0.3341, "loss_nan_ranks": 0, "loss_rank_avg": 0.33716338872909546, "step": 1895, "valid_targets_mean": 2149.1, "valid_targets_min": 971 }, { "epoch": 3.0351437699680512, "grad_norm": 0.7724207654837609, "learning_rate": 2.792701416399988e-05, "loss": 0.3567, "loss_nan_ranks": 0, "loss_rank_avg": 0.37443485856056213, "step": 1900, "valid_targets_mean": 2977.1, "valid_targets_min": 1171 }, { "epoch": 3.0431309904153356, "grad_norm": 0.8292296160816116, "learning_rate": 2.7853801730302134e-05, "loss": 0.3506, "loss_nan_ranks": 0, "loss_rank_avg": 0.33334457874298096, "step": 1905, "valid_targets_mean": 2229.8, "valid_targets_min": 1298 }, { "epoch": 3.0511182108626196, "grad_norm": 0.7738562965360346, "learning_rate": 2.7780464654274396e-05, "loss": 0.3521, "loss_nan_ranks": 0, "loss_rank_avg": 0.34110739827156067, "step": 1910, "valid_targets_mean": 2591.9, "valid_targets_min": 810 }, { "epoch": 3.059105431309904, "grad_norm": 0.7004842336637774, "learning_rate": 2.770700409979938e-05, "loss": 0.3457, "loss_nan_ranks": 0, "loss_rank_avg": 0.2925085723400116, "step": 1915, "valid_targets_mean": 2646.9, "valid_targets_min": 959 }, { "epoch": 3.0670926517571884, "grad_norm": 0.8088128682511053, "learning_rate": 2.7633421232719442e-05, "loss": 0.3457, "loss_nan_ranks": 0, "loss_rank_avg": 0.3746018409729004, "step": 1920, "valid_targets_mean": 2762.9, "valid_targets_min": 497 }, { "epoch": 3.0750798722044728, "grad_norm": 0.6921108063117793, "learning_rate": 2.7559717220818067e-05, "loss": 0.3419, "loss_nan_ranks": 0, "loss_rank_avg": 0.33677250146865845, "step": 1925, "valid_targets_mean": 3465.4, "valid_targets_min": 1438 }, { "epoch": 3.083067092651757, "grad_norm": 0.7792472115673951, "learning_rate": 2.7485893233801366e-05, "loss": 0.3499, "loss_nan_ranks": 0, "loss_rank_avg": 0.3244081139564514, "step": 1930, "valid_targets_mean": 2584.4, "valid_targets_min": 912 }, { "epoch": 3.0910543130990416, "grad_norm": 0.8282891276383806, "learning_rate": 2.7411950443279458e-05, "loss": 0.3555, "loss_nan_ranks": 0, "loss_rank_avg": 0.3384396433830261, "step": 1935, "valid_targets_mean": 2538.3, "valid_targets_min": 1040 }, { "epoch": 3.099041533546326, "grad_norm": 0.7315591962767853, "learning_rate": 2.7337890022747945e-05, "loss": 0.3468, "loss_nan_ranks": 0, "loss_rank_avg": 0.32630831003189087, "step": 1940, "valid_targets_mean": 3223.4, "valid_targets_min": 907 }, { "epoch": 3.1070287539936103, "grad_norm": 0.6369586602339742, "learning_rate": 2.7263713147569243e-05, "loss": 0.3601, "loss_nan_ranks": 0, "loss_rank_avg": 0.34071576595306396, "step": 1945, "valid_targets_mean": 4314.2, "valid_targets_min": 1241 }, { "epoch": 3.1150159744408947, "grad_norm": 0.7067109985051314, "learning_rate": 2.7189420994953945e-05, "loss": 0.3567, "loss_nan_ranks": 0, "loss_rank_avg": 0.37993860244750977, "step": 1950, "valid_targets_mean": 3673.4, "valid_targets_min": 1263 }, { "epoch": 3.123003194888179, "grad_norm": 0.8025979082829126, "learning_rate": 2.7115014743942114e-05, "loss": 0.3525, "loss_nan_ranks": 0, "loss_rank_avg": 0.3262211084365845, "step": 1955, "valid_targets_mean": 2655.9, "valid_targets_min": 1046 }, { "epoch": 3.130990415335463, "grad_norm": 0.6708281987337977, "learning_rate": 2.704049557538461e-05, "loss": 0.3669, "loss_nan_ranks": 0, "loss_rank_avg": 0.34278061985969543, "step": 1960, "valid_targets_mean": 3530.3, "valid_targets_min": 1110 }, { "epoch": 3.1389776357827475, "grad_norm": 0.732176646472642, "learning_rate": 2.696586467192434e-05, "loss": 0.3438, "loss_nan_ranks": 0, "loss_rank_avg": 0.36904671788215637, "step": 1965, "valid_targets_mean": 3570.9, "valid_targets_min": 1321 }, { "epoch": 3.146964856230032, "grad_norm": 0.7557915517558162, "learning_rate": 2.6891123217977448e-05, "loss": 0.3468, "loss_nan_ranks": 0, "loss_rank_avg": 0.3248704969882965, "step": 1970, "valid_targets_mean": 3341.5, "valid_targets_min": 972 }, { "epoch": 3.1549520766773163, "grad_norm": 0.8328040999163244, "learning_rate": 2.681627239971458e-05, "loss": 0.355, "loss_nan_ranks": 0, "loss_rank_avg": 0.33000561594963074, "step": 1975, "valid_targets_mean": 2162.9, "valid_targets_min": 937 }, { "epoch": 3.1629392971246006, "grad_norm": 0.6796313251895518, "learning_rate": 2.6741313405041997e-05, "loss": 0.355, "loss_nan_ranks": 0, "loss_rank_avg": 0.34723204374313354, "step": 1980, "valid_targets_mean": 3633.1, "valid_targets_min": 1367 }, { "epoch": 3.170926517571885, "grad_norm": 0.6915824013782956, "learning_rate": 2.666624742358279e-05, "loss": 0.3424, "loss_nan_ranks": 0, "loss_rank_avg": 0.2982881963253021, "step": 1985, "valid_targets_mean": 3259.9, "valid_targets_min": 1035 }, { "epoch": 3.1789137380191694, "grad_norm": 0.8885716130967903, "learning_rate": 2.659107564665794e-05, "loss": 0.3507, "loss_nan_ranks": 0, "loss_rank_avg": 0.38301947712898254, "step": 1990, "valid_targets_mean": 2289.6, "valid_targets_min": 931 }, { "epoch": 3.186900958466454, "grad_norm": 0.7696659351010584, "learning_rate": 2.6515799267267445e-05, "loss": 0.3543, "loss_nan_ranks": 0, "loss_rank_avg": 0.32373887300491333, "step": 1995, "valid_targets_mean": 2755.4, "valid_targets_min": 1083 }, { "epoch": 3.194888178913738, "grad_norm": 0.666620619178921, "learning_rate": 2.6440419480071366e-05, "loss": 0.3542, "loss_nan_ranks": 0, "loss_rank_avg": 0.33515575528144836, "step": 2000, "valid_targets_mean": 3775.8, "valid_targets_min": 938 }, { "epoch": 3.202875399361022, "grad_norm": 0.8605815354678277, "learning_rate": 2.6364937481370887e-05, "loss": 0.3315, "loss_nan_ranks": 0, "loss_rank_avg": 0.32717159390449524, "step": 2005, "valid_targets_mean": 1861.2, "valid_targets_min": 848 }, { "epoch": 3.2108626198083066, "grad_norm": 0.8139366969767636, "learning_rate": 2.628935446908933e-05, "loss": 0.3432, "loss_nan_ranks": 0, "loss_rank_avg": 0.3549983501434326, "step": 2010, "valid_targets_mean": 2780.7, "valid_targets_min": 924 }, { "epoch": 3.218849840255591, "grad_norm": 0.6178267872235499, "learning_rate": 2.6213671642753124e-05, "loss": 0.3373, "loss_nan_ranks": 0, "loss_rank_avg": 0.27505552768707275, "step": 2015, "valid_targets_mean": 3498.8, "valid_targets_min": 901 }, { "epoch": 3.2268370607028753, "grad_norm": 0.7498197701531762, "learning_rate": 2.6137890203472786e-05, "loss": 0.3437, "loss_nan_ranks": 0, "loss_rank_avg": 0.28516024351119995, "step": 2020, "valid_targets_mean": 2339.2, "valid_targets_min": 1043 }, { "epoch": 3.2348242811501597, "grad_norm": 0.779750885550688, "learning_rate": 2.606201135392383e-05, "loss": 0.3565, "loss_nan_ranks": 0, "loss_rank_avg": 0.32652050256729126, "step": 2025, "valid_targets_mean": 3031.4, "valid_targets_min": 938 }, { "epoch": 3.242811501597444, "grad_norm": 0.8362104239003927, "learning_rate": 2.5986036298327725e-05, "loss": 0.3428, "loss_nan_ranks": 0, "loss_rank_avg": 0.320258229970932, "step": 2030, "valid_targets_mean": 2208.7, "valid_targets_min": 1122 }, { "epoch": 3.2507987220447285, "grad_norm": 0.7593338041815918, "learning_rate": 2.590996624243276e-05, "loss": 0.3248, "loss_nan_ranks": 0, "loss_rank_avg": 0.3281738758087158, "step": 2035, "valid_targets_mean": 2861.4, "valid_targets_min": 1047 }, { "epoch": 3.258785942492013, "grad_norm": 0.738061021392302, "learning_rate": 2.5833802393494897e-05, "loss": 0.3491, "loss_nan_ranks": 0, "loss_rank_avg": 0.37253719568252563, "step": 2040, "valid_targets_mean": 3137.3, "valid_targets_min": 873 }, { "epoch": 3.2667731629392973, "grad_norm": 0.805662472760199, "learning_rate": 2.5757545960258638e-05, "loss": 0.3443, "loss_nan_ranks": 0, "loss_rank_avg": 0.35318508744239807, "step": 2045, "valid_targets_mean": 2663.6, "valid_targets_min": 927 }, { "epoch": 3.2747603833865817, "grad_norm": 0.874774468106856, "learning_rate": 2.5681198152937804e-05, "loss": 0.3528, "loss_nan_ranks": 0, "loss_rank_avg": 0.42066410183906555, "step": 2050, "valid_targets_mean": 2673.9, "valid_targets_min": 1028 }, { "epoch": 3.2827476038338657, "grad_norm": 0.9367992662401398, "learning_rate": 2.5604760183196377e-05, "loss": 0.3364, "loss_nan_ranks": 0, "loss_rank_avg": 0.3702118396759033, "step": 2055, "valid_targets_mean": 2392.5, "valid_targets_min": 732 }, { "epoch": 3.29073482428115, "grad_norm": 0.7835028898995575, "learning_rate": 2.5528233264129228e-05, "loss": 0.3351, "loss_nan_ranks": 0, "loss_rank_avg": 0.34959307312965393, "step": 2060, "valid_targets_mean": 2777.4, "valid_targets_min": 1040 }, { "epoch": 3.2987220447284344, "grad_norm": 0.8490015562097194, "learning_rate": 2.54516186102429e-05, "loss": 0.3585, "loss_nan_ranks": 0, "loss_rank_avg": 0.37757542729377747, "step": 2065, "valid_targets_mean": 2506.2, "valid_targets_min": 1072 }, { "epoch": 3.306709265175719, "grad_norm": 0.829876673769117, "learning_rate": 2.5374917437436294e-05, "loss": 0.3498, "loss_nan_ranks": 0, "loss_rank_avg": 0.3559834957122803, "step": 2070, "valid_targets_mean": 2435.7, "valid_targets_min": 1130 }, { "epoch": 3.3146964856230032, "grad_norm": 0.7782930862626647, "learning_rate": 2.5298130962981403e-05, "loss": 0.3308, "loss_nan_ranks": 0, "loss_rank_avg": 0.32831066846847534, "step": 2075, "valid_targets_mean": 2370.1, "valid_targets_min": 1399 }, { "epoch": 3.3226837060702876, "grad_norm": 0.6821850671644661, "learning_rate": 2.5221260405503985e-05, "loss": 0.3437, "loss_nan_ranks": 0, "loss_rank_avg": 0.3372279405593872, "step": 2080, "valid_targets_mean": 3202.9, "valid_targets_min": 1192 }, { "epoch": 3.330670926517572, "grad_norm": 0.706369945800584, "learning_rate": 2.5144306984964225e-05, "loss": 0.3448, "loss_nan_ranks": 0, "loss_rank_avg": 0.3640979826450348, "step": 2085, "valid_targets_mean": 3496.9, "valid_targets_min": 1220 }, { "epoch": 3.3386581469648564, "grad_norm": 0.6858521053933514, "learning_rate": 2.5067271922637377e-05, "loss": 0.3367, "loss_nan_ranks": 0, "loss_rank_avg": 0.354512482881546, "step": 2090, "valid_targets_mean": 3103.3, "valid_targets_min": 842 }, { "epoch": 3.3466453674121404, "grad_norm": 0.7050974701444196, "learning_rate": 2.499015644109435e-05, "loss": 0.339, "loss_nan_ranks": 0, "loss_rank_avg": 0.340786337852478, "step": 2095, "valid_targets_mean": 3263.6, "valid_targets_min": 1263 }, { "epoch": 3.3546325878594248, "grad_norm": 0.7792547408720658, "learning_rate": 2.491296176418236e-05, "loss": 0.3488, "loss_nan_ranks": 0, "loss_rank_avg": 0.31993260979652405, "step": 2100, "valid_targets_mean": 2408.8, "valid_targets_min": 861 }, { "epoch": 3.362619808306709, "grad_norm": 0.8472394542146415, "learning_rate": 2.4835689117005472e-05, "loss": 0.3526, "loss_nan_ranks": 0, "loss_rank_avg": 0.3624585270881653, "step": 2105, "valid_targets_mean": 2521.1, "valid_targets_min": 1138 }, { "epoch": 3.3706070287539935, "grad_norm": 0.685542276172253, "learning_rate": 2.4758339725905152e-05, "loss": 0.3637, "loss_nan_ranks": 0, "loss_rank_avg": 0.39794886112213135, "step": 2110, "valid_targets_mean": 3648.8, "valid_targets_min": 1537 }, { "epoch": 3.378594249201278, "grad_norm": 0.8289815185367049, "learning_rate": 2.4680914818440823e-05, "loss": 0.3427, "loss_nan_ranks": 0, "loss_rank_avg": 0.3529765009880066, "step": 2115, "valid_targets_mean": 2447.1, "valid_targets_min": 1186 }, { "epoch": 3.3865814696485623, "grad_norm": 0.79580361575995, "learning_rate": 2.4603415623370387e-05, "loss": 0.3688, "loss_nan_ranks": 0, "loss_rank_avg": 0.3427412509918213, "step": 2120, "valid_targets_mean": 2492.4, "valid_targets_min": 1044 }, { "epoch": 3.3945686900958467, "grad_norm": 0.9174018660679429, "learning_rate": 2.4525843370630697e-05, "loss": 0.3371, "loss_nan_ranks": 0, "loss_rank_avg": 0.35740599036216736, "step": 2125, "valid_targets_mean": 2116.4, "valid_targets_min": 743 }, { "epoch": 3.402555910543131, "grad_norm": 0.92058483539087, "learning_rate": 2.4448199291318058e-05, "loss": 0.3518, "loss_nan_ranks": 0, "loss_rank_avg": 0.35286015272140503, "step": 2130, "valid_targets_mean": 2801.2, "valid_targets_min": 871 }, { "epoch": 3.4105431309904155, "grad_norm": 0.786887928884236, "learning_rate": 2.4370484617668707e-05, "loss": 0.3635, "loss_nan_ranks": 0, "loss_rank_avg": 0.33476051688194275, "step": 2135, "valid_targets_mean": 2596.9, "valid_targets_min": 742 }, { "epoch": 3.4185303514377, "grad_norm": 0.7258313848476246, "learning_rate": 2.4292700583039194e-05, "loss": 0.3444, "loss_nan_ranks": 0, "loss_rank_avg": 0.3154415786266327, "step": 2140, "valid_targets_mean": 3060.0, "valid_targets_min": 1183 }, { "epoch": 3.426517571884984, "grad_norm": 0.8298449989955331, "learning_rate": 2.4214848421886893e-05, "loss": 0.3511, "loss_nan_ranks": 0, "loss_rank_avg": 0.39987191557884216, "step": 2145, "valid_targets_mean": 2922.6, "valid_targets_min": 708 }, { "epoch": 3.4345047923322682, "grad_norm": 0.8571042529668489, "learning_rate": 2.4136929369750344e-05, "loss": 0.3624, "loss_nan_ranks": 0, "loss_rank_avg": 0.37515556812286377, "step": 2150, "valid_targets_mean": 2234.4, "valid_targets_min": 763 }, { "epoch": 3.4424920127795526, "grad_norm": 0.69019555021873, "learning_rate": 2.4058944663229672e-05, "loss": 0.3351, "loss_nan_ranks": 0, "loss_rank_avg": 0.341417133808136, "step": 2155, "valid_targets_mean": 3493.2, "valid_targets_min": 1130 }, { "epoch": 3.450479233226837, "grad_norm": 0.7666734882023155, "learning_rate": 2.398089553996696e-05, "loss": 0.3254, "loss_nan_ranks": 0, "loss_rank_avg": 0.3008880019187927, "step": 2160, "valid_targets_mean": 2677.6, "valid_targets_min": 1190 }, { "epoch": 3.4584664536741214, "grad_norm": 0.7843770052937605, "learning_rate": 2.3902783238626604e-05, "loss": 0.3636, "loss_nan_ranks": 0, "loss_rank_avg": 0.34043818712234497, "step": 2165, "valid_targets_mean": 2748.9, "valid_targets_min": 782 }, { "epoch": 3.466453674121406, "grad_norm": 0.8052459554106886, "learning_rate": 2.3824608998875652e-05, "loss": 0.3413, "loss_nan_ranks": 0, "loss_rank_avg": 0.3473026156425476, "step": 2170, "valid_targets_mean": 2772.2, "valid_targets_min": 1174 }, { "epoch": 3.47444089456869, "grad_norm": 0.7451939406088447, "learning_rate": 2.3746374061364138e-05, "loss": 0.3258, "loss_nan_ranks": 0, "loss_rank_avg": 0.29451632499694824, "step": 2175, "valid_targets_mean": 2728.6, "valid_targets_min": 690 }, { "epoch": 3.4824281150159746, "grad_norm": 0.6512980105925289, "learning_rate": 2.3668079667705404e-05, "loss": 0.3495, "loss_nan_ranks": 0, "loss_rank_avg": 0.34157970547676086, "step": 2180, "valid_targets_mean": 3575.4, "valid_targets_min": 1726 }, { "epoch": 3.4904153354632586, "grad_norm": 0.7079499032301315, "learning_rate": 2.3589727060456342e-05, "loss": 0.3521, "loss_nan_ranks": 0, "loss_rank_avg": 0.3626313805580139, "step": 2185, "valid_targets_mean": 3225.8, "valid_targets_min": 1124 }, { "epoch": 3.498402555910543, "grad_norm": 0.7295675412562281, "learning_rate": 2.3511317483097753e-05, "loss": 0.325, "loss_nan_ranks": 0, "loss_rank_avg": 0.3401775658130646, "step": 2190, "valid_targets_mean": 2835.4, "valid_targets_min": 1325 }, { "epoch": 3.5063897763578273, "grad_norm": 0.6970730857646832, "learning_rate": 2.3432852180014548e-05, "loss": 0.3578, "loss_nan_ranks": 0, "loss_rank_avg": 0.32114821672439575, "step": 2195, "valid_targets_mean": 3394.9, "valid_targets_min": 871 }, { "epoch": 3.5143769968051117, "grad_norm": 0.7359279593183425, "learning_rate": 2.3354332396476026e-05, "loss": 0.3304, "loss_nan_ranks": 0, "loss_rank_avg": 0.3173915445804596, "step": 2200, "valid_targets_mean": 2769.9, "valid_targets_min": 817 }, { "epoch": 3.522364217252396, "grad_norm": 0.8670971142439949, "learning_rate": 2.327575937861612e-05, "loss": 0.3273, "loss_nan_ranks": 0, "loss_rank_avg": 0.3821990489959717, "step": 2205, "valid_targets_mean": 2721.3, "valid_targets_min": 1028 }, { "epoch": 3.5303514376996805, "grad_norm": 0.7495600483899891, "learning_rate": 2.3197134373413595e-05, "loss": 0.3565, "loss_nan_ranks": 0, "loss_rank_avg": 0.3791123032569885, "step": 2210, "valid_targets_mean": 2959.6, "valid_targets_min": 963 }, { "epoch": 3.538338658146965, "grad_norm": 0.7631701646338969, "learning_rate": 2.3118458628672272e-05, "loss": 0.345, "loss_nan_ranks": 0, "loss_rank_avg": 0.33027756214141846, "step": 2215, "valid_targets_mean": 2739.8, "valid_targets_min": 1139 }, { "epoch": 3.5463258785942493, "grad_norm": 0.7210960761349475, "learning_rate": 2.3039733393001233e-05, "loss": 0.3456, "loss_nan_ranks": 0, "loss_rank_avg": 0.314005970954895, "step": 2220, "valid_targets_mean": 3064.6, "valid_targets_min": 1529 }, { "epoch": 3.5543130990415337, "grad_norm": 0.7300448411862375, "learning_rate": 2.2960959915794998e-05, "loss": 0.3464, "loss_nan_ranks": 0, "loss_rank_avg": 0.3501545786857605, "step": 2225, "valid_targets_mean": 3272.5, "valid_targets_min": 884 }, { "epoch": 3.562300319488818, "grad_norm": 0.7352570371980378, "learning_rate": 2.2882139447213673e-05, "loss": 0.3466, "loss_nan_ranks": 0, "loss_rank_avg": 0.367412269115448, "step": 2230, "valid_targets_mean": 2964.4, "valid_targets_min": 1122 }, { "epoch": 3.5702875399361025, "grad_norm": 0.7266777124532515, "learning_rate": 2.280327323816317e-05, "loss": 0.372, "loss_nan_ranks": 0, "loss_rank_avg": 0.3345056176185608, "step": 2235, "valid_targets_mean": 3415.9, "valid_targets_min": 1112 }, { "epoch": 3.5782747603833864, "grad_norm": 0.7833280724460969, "learning_rate": 2.2724362540275288e-05, "loss": 0.3541, "loss_nan_ranks": 0, "loss_rank_avg": 0.3198665380477905, "step": 2240, "valid_targets_mean": 2523.6, "valid_targets_min": 723 }, { "epoch": 3.586261980830671, "grad_norm": 0.6515565530417812, "learning_rate": 2.2645408605887882e-05, "loss": 0.3673, "loss_nan_ranks": 0, "loss_rank_avg": 0.3271835446357727, "step": 2245, "valid_targets_mean": 3502.6, "valid_targets_min": 999 }, { "epoch": 3.594249201277955, "grad_norm": 0.7096257136610091, "learning_rate": 2.2566412688025003e-05, "loss": 0.3645, "loss_nan_ranks": 0, "loss_rank_avg": 0.3631103038787842, "step": 2250, "valid_targets_mean": 3502.5, "valid_targets_min": 1024 }, { "epoch": 3.6022364217252396, "grad_norm": 0.9151425698789424, "learning_rate": 2.2487376040376958e-05, "loss": 0.3735, "loss_nan_ranks": 0, "loss_rank_avg": 0.37757572531700134, "step": 2255, "valid_targets_mean": 3347.0, "valid_targets_min": 877 }, { "epoch": 3.610223642172524, "grad_norm": 0.7347384259209934, "learning_rate": 2.240829991728048e-05, "loss": 0.3417, "loss_nan_ranks": 0, "loss_rank_avg": 0.34199997782707214, "step": 2260, "valid_targets_mean": 3051.1, "valid_targets_min": 786 }, { "epoch": 3.6182108626198084, "grad_norm": 0.94549554675444, "learning_rate": 2.2329185573698778e-05, "loss": 0.3339, "loss_nan_ranks": 0, "loss_rank_avg": 0.36203259229660034, "step": 2265, "valid_targets_mean": 2668.2, "valid_targets_min": 811 }, { "epoch": 3.626198083067093, "grad_norm": 0.711777124378337, "learning_rate": 2.225003426520163e-05, "loss": 0.3563, "loss_nan_ranks": 0, "loss_rank_avg": 0.34062519669532776, "step": 2270, "valid_targets_mean": 3257.0, "valid_targets_min": 1230 }, { "epoch": 3.6341853035143767, "grad_norm": 0.8097999383376286, "learning_rate": 2.2170847247945466e-05, "loss": 0.3435, "loss_nan_ranks": 0, "loss_rank_avg": 0.3180551528930664, "step": 2275, "valid_targets_mean": 2292.1, "valid_targets_min": 1108 }, { "epoch": 3.642172523961661, "grad_norm": 0.7944952102142546, "learning_rate": 2.209162577865342e-05, "loss": 0.3608, "loss_nan_ranks": 0, "loss_rank_avg": 0.3482610881328583, "step": 2280, "valid_targets_mean": 2589.2, "valid_targets_min": 1683 }, { "epoch": 3.6501597444089455, "grad_norm": 0.8244274418365245, "learning_rate": 2.201237111459539e-05, "loss": 0.3512, "loss_nan_ranks": 0, "loss_rank_avg": 0.3237827718257904, "step": 2285, "valid_targets_mean": 2413.6, "valid_targets_min": 955 }, { "epoch": 3.65814696485623, "grad_norm": 0.8893899727490636, "learning_rate": 2.193308451356809e-05, "loss": 0.3512, "loss_nan_ranks": 0, "loss_rank_avg": 0.3441276252269745, "step": 2290, "valid_targets_mean": 2140.9, "valid_targets_min": 1085 }, { "epoch": 3.6661341853035143, "grad_norm": 0.7931807861635283, "learning_rate": 2.1853767233875084e-05, "loss": 0.3479, "loss_nan_ranks": 0, "loss_rank_avg": 0.32396748661994934, "step": 2295, "valid_targets_mean": 2703.6, "valid_targets_min": 1040 }, { "epoch": 3.6741214057507987, "grad_norm": 0.7323099605303646, "learning_rate": 2.1774420534306812e-05, "loss": 0.369, "loss_nan_ranks": 0, "loss_rank_avg": 0.37023335695266724, "step": 2300, "valid_targets_mean": 3230.1, "valid_targets_min": 847 }, { "epoch": 3.682108626198083, "grad_norm": 0.8215600687589895, "learning_rate": 2.1695045674120615e-05, "loss": 0.3269, "loss_nan_ranks": 0, "loss_rank_avg": 0.3557538390159607, "step": 2305, "valid_targets_mean": 2377.7, "valid_targets_min": 1184 }, { "epoch": 3.6900958466453675, "grad_norm": 0.8134770011066427, "learning_rate": 2.1615643913020755e-05, "loss": 0.3593, "loss_nan_ranks": 0, "loss_rank_avg": 0.33311760425567627, "step": 2310, "valid_targets_mean": 2857.2, "valid_targets_min": 1311 }, { "epoch": 3.698083067092652, "grad_norm": 0.812226985002325, "learning_rate": 2.1536216511138423e-05, "loss": 0.3628, "loss_nan_ranks": 0, "loss_rank_avg": 0.3659121096134186, "step": 2315, "valid_targets_mean": 2604.5, "valid_targets_min": 1130 }, { "epoch": 3.7060702875399363, "grad_norm": 0.8800310047756553, "learning_rate": 2.145676472901174e-05, "loss": 0.3534, "loss_nan_ranks": 0, "loss_rank_avg": 0.3661636412143707, "step": 2320, "valid_targets_mean": 2165.9, "valid_targets_min": 1010 }, { "epoch": 3.7140575079872207, "grad_norm": 0.7143058958135756, "learning_rate": 2.1377289827565734e-05, "loss": 0.3472, "loss_nan_ranks": 0, "loss_rank_avg": 0.33318227529525757, "step": 2325, "valid_targets_mean": 3463.3, "valid_targets_min": 1056 }, { "epoch": 3.722044728434505, "grad_norm": 0.7011841853877164, "learning_rate": 2.129779306809236e-05, "loss": 0.3478, "loss_nan_ranks": 0, "loss_rank_avg": 0.31508100032806396, "step": 2330, "valid_targets_mean": 2909.1, "valid_targets_min": 876 }, { "epoch": 3.730031948881789, "grad_norm": 0.8357370303330102, "learning_rate": 2.121827571223046e-05, "loss": 0.3559, "loss_nan_ranks": 0, "loss_rank_avg": 0.3638567328453064, "step": 2335, "valid_targets_mean": 2311.0, "valid_targets_min": 747 }, { "epoch": 3.7380191693290734, "grad_norm": 0.8037478490130382, "learning_rate": 2.113873902194575e-05, "loss": 0.3573, "loss_nan_ranks": 0, "loss_rank_avg": 0.37670642137527466, "step": 2340, "valid_targets_mean": 3250.2, "valid_targets_min": 1181 }, { "epoch": 3.746006389776358, "grad_norm": 0.8700223589429951, "learning_rate": 2.1059184259510786e-05, "loss": 0.3657, "loss_nan_ranks": 0, "loss_rank_avg": 0.386318564414978, "step": 2345, "valid_targets_mean": 2267.0, "valid_targets_min": 962 }, { "epoch": 3.753993610223642, "grad_norm": 0.7600210560294047, "learning_rate": 2.0979612687484935e-05, "loss": 0.3502, "loss_nan_ranks": 0, "loss_rank_avg": 0.36681851744651794, "step": 2350, "valid_targets_mean": 2949.6, "valid_targets_min": 1248 }, { "epoch": 3.7619808306709266, "grad_norm": 0.8561255238812737, "learning_rate": 2.0900025568694334e-05, "loss": 0.3649, "loss_nan_ranks": 0, "loss_rank_avg": 0.4018840193748474, "step": 2355, "valid_targets_mean": 2649.2, "valid_targets_min": 834 }, { "epoch": 3.769968051118211, "grad_norm": 0.7901922853076591, "learning_rate": 2.082042416621187e-05, "loss": 0.3481, "loss_nan_ranks": 0, "loss_rank_avg": 0.3670767843723297, "step": 2360, "valid_targets_mean": 2619.1, "valid_targets_min": 855 }, { "epoch": 3.777955271565495, "grad_norm": 0.7216134214426689, "learning_rate": 2.0740809743337095e-05, "loss": 0.3117, "loss_nan_ranks": 0, "loss_rank_avg": 0.3147008419036865, "step": 2365, "valid_targets_mean": 2834.6, "valid_targets_min": 917 }, { "epoch": 3.7859424920127793, "grad_norm": 0.7955391112654346, "learning_rate": 2.0661183563576202e-05, "loss": 0.3525, "loss_nan_ranks": 0, "loss_rank_avg": 0.36277374625205994, "step": 2370, "valid_targets_mean": 2651.1, "valid_targets_min": 988 }, { "epoch": 3.7939297124600637, "grad_norm": 0.772152693083288, "learning_rate": 2.0581546890621986e-05, "loss": 0.3435, "loss_nan_ranks": 0, "loss_rank_avg": 0.33806949853897095, "step": 2375, "valid_targets_mean": 2821.8, "valid_targets_min": 1116 }, { "epoch": 3.801916932907348, "grad_norm": 0.8085716379516211, "learning_rate": 2.0501900988333755e-05, "loss": 0.3453, "loss_nan_ranks": 0, "loss_rank_avg": 0.3489188551902771, "step": 2380, "valid_targets_mean": 2745.3, "valid_targets_min": 430 }, { "epoch": 3.8099041533546325, "grad_norm": 0.6954666725539379, "learning_rate": 2.0422247120717304e-05, "loss": 0.3173, "loss_nan_ranks": 0, "loss_rank_avg": 0.3149593472480774, "step": 2385, "valid_targets_mean": 2903.2, "valid_targets_min": 1232 }, { "epoch": 3.817891373801917, "grad_norm": 0.7492864017320584, "learning_rate": 2.0342586551904824e-05, "loss": 0.3627, "loss_nan_ranks": 0, "loss_rank_avg": 0.33550161123275757, "step": 2390, "valid_targets_mean": 2524.8, "valid_targets_min": 1136 }, { "epoch": 3.8258785942492013, "grad_norm": 0.7379062354051015, "learning_rate": 2.026292054613486e-05, "loss": 0.3554, "loss_nan_ranks": 0, "loss_rank_avg": 0.35174477100372314, "step": 2395, "valid_targets_mean": 3198.4, "valid_targets_min": 1011 }, { "epoch": 3.8338658146964857, "grad_norm": 0.826138505521665, "learning_rate": 2.0183250367732253e-05, "loss": 0.3538, "loss_nan_ranks": 0, "loss_rank_avg": 0.3427872061729431, "step": 2400, "valid_targets_mean": 2487.9, "valid_targets_min": 904 }, { "epoch": 3.84185303514377, "grad_norm": 0.7229382012400196, "learning_rate": 2.0103577281088065e-05, "loss": 0.3653, "loss_nan_ranks": 0, "loss_rank_avg": 0.3543205261230469, "step": 2405, "valid_targets_mean": 3393.3, "valid_targets_min": 836 }, { "epoch": 3.8498402555910545, "grad_norm": 0.7250967838290785, "learning_rate": 2.00239025506395e-05, "loss": 0.3467, "loss_nan_ranks": 0, "loss_rank_avg": 0.32540053129196167, "step": 2410, "valid_targets_mean": 3386.4, "valid_targets_min": 1153 }, { "epoch": 3.857827476038339, "grad_norm": 0.8104290152544857, "learning_rate": 1.9944227440849856e-05, "loss": 0.3532, "loss_nan_ranks": 0, "loss_rank_avg": 0.3654288053512573, "step": 2415, "valid_targets_mean": 2680.6, "valid_targets_min": 1050 }, { "epoch": 3.8658146964856233, "grad_norm": 0.7592811553776619, "learning_rate": 1.9864553216188454e-05, "loss": 0.3425, "loss_nan_ranks": 0, "loss_rank_avg": 0.3243311643600464, "step": 2420, "valid_targets_mean": 2721.1, "valid_targets_min": 1003 }, { "epoch": 3.873801916932907, "grad_norm": 0.8600247524167637, "learning_rate": 1.978488114111057e-05, "loss": 0.3799, "loss_nan_ranks": 0, "loss_rank_avg": 0.3664115369319916, "step": 2425, "valid_targets_mean": 2369.9, "valid_targets_min": 897 }, { "epoch": 3.8817891373801916, "grad_norm": 0.9127949248834691, "learning_rate": 1.970521248003735e-05, "loss": 0.3522, "loss_nan_ranks": 0, "loss_rank_avg": 0.3474576771259308, "step": 2430, "valid_targets_mean": 1944.6, "valid_targets_min": 1207 }, { "epoch": 3.889776357827476, "grad_norm": 0.8067494948013632, "learning_rate": 1.9625548497335783e-05, "loss": 0.3358, "loss_nan_ranks": 0, "loss_rank_avg": 0.33465152978897095, "step": 2435, "valid_targets_mean": 2467.1, "valid_targets_min": 927 }, { "epoch": 3.8977635782747604, "grad_norm": 0.880971732697506, "learning_rate": 1.9545890457298592e-05, "loss": 0.3521, "loss_nan_ranks": 0, "loss_rank_avg": 0.351280152797699, "step": 2440, "valid_targets_mean": 2193.3, "valid_targets_min": 949 }, { "epoch": 3.905750798722045, "grad_norm": 0.8521094362994456, "learning_rate": 1.9466239624124203e-05, "loss": 0.3403, "loss_nan_ranks": 0, "loss_rank_avg": 0.3590460419654846, "step": 2445, "valid_targets_mean": 2435.9, "valid_targets_min": 1120 }, { "epoch": 3.913738019169329, "grad_norm": 0.868802266909435, "learning_rate": 1.938659726189663e-05, "loss": 0.3431, "loss_nan_ranks": 0, "loss_rank_avg": 0.30706340074539185, "step": 2450, "valid_targets_mean": 2211.0, "valid_targets_min": 857 }, { "epoch": 3.9217252396166136, "grad_norm": 0.8259636849763473, "learning_rate": 1.9306964634565505e-05, "loss": 0.327, "loss_nan_ranks": 0, "loss_rank_avg": 0.3763893246650696, "step": 2455, "valid_targets_mean": 2577.2, "valid_targets_min": 1141 }, { "epoch": 3.9297124600638975, "grad_norm": 0.8213105655209398, "learning_rate": 1.9227343005925926e-05, "loss": 0.3341, "loss_nan_ranks": 0, "loss_rank_avg": 0.3701975345611572, "step": 2460, "valid_targets_mean": 2671.8, "valid_targets_min": 1206 }, { "epoch": 3.937699680511182, "grad_norm": 0.7207468257354757, "learning_rate": 1.914773363959845e-05, "loss": 0.3547, "loss_nan_ranks": 0, "loss_rank_avg": 0.3682279586791992, "step": 2465, "valid_targets_mean": 3327.1, "valid_targets_min": 1211 }, { "epoch": 3.9456869009584663, "grad_norm": 0.7740903599176833, "learning_rate": 1.906813779900903e-05, "loss": 0.3399, "loss_nan_ranks": 0, "loss_rank_avg": 0.3290952444076538, "step": 2470, "valid_targets_mean": 2429.8, "valid_targets_min": 1173 }, { "epoch": 3.9536741214057507, "grad_norm": 0.6969816315594596, "learning_rate": 1.8988556747368953e-05, "loss": 0.3328, "loss_nan_ranks": 0, "loss_rank_avg": 0.31143099069595337, "step": 2475, "valid_targets_mean": 3285.7, "valid_targets_min": 901 }, { "epoch": 3.961661341853035, "grad_norm": 0.6900509589111553, "learning_rate": 1.890899174765481e-05, "loss": 0.346, "loss_nan_ranks": 0, "loss_rank_avg": 0.32233577966690063, "step": 2480, "valid_targets_mean": 3132.6, "valid_targets_min": 1216 }, { "epoch": 3.9696485623003195, "grad_norm": 0.7531324107571046, "learning_rate": 1.8829444062588433e-05, "loss": 0.3376, "loss_nan_ranks": 0, "loss_rank_avg": 0.3661973476409912, "step": 2485, "valid_targets_mean": 2683.5, "valid_targets_min": 722 }, { "epoch": 3.977635782747604, "grad_norm": 0.8859610638059474, "learning_rate": 1.8749914954616882e-05, "loss": 0.3484, "loss_nan_ranks": 0, "loss_rank_avg": 0.39797261357307434, "step": 2490, "valid_targets_mean": 2247.5, "valid_targets_min": 920 }, { "epoch": 3.9856230031948883, "grad_norm": 0.727951884939237, "learning_rate": 1.867040568589236e-05, "loss": 0.352, "loss_nan_ranks": 0, "loss_rank_avg": 0.31643036007881165, "step": 2495, "valid_targets_mean": 3139.8, "valid_targets_min": 733 }, { "epoch": 3.9936102236421727, "grad_norm": 0.7051175961125331, "learning_rate": 1.859091751825225e-05, "loss": 0.345, "loss_nan_ranks": 0, "loss_rank_avg": 0.31299465894699097, "step": 2500, "valid_targets_mean": 2929.7, "valid_targets_min": 1181 }, { "epoch": 4.001597444089457, "grad_norm": 0.7836980808537842, "learning_rate": 1.8511451713199038e-05, "loss": 0.337, "loss_nan_ranks": 0, "loss_rank_avg": 0.320000022649765, "step": 2505, "valid_targets_mean": 2379.3, "valid_targets_min": 803 }, { "epoch": 4.0095846645367414, "grad_norm": 0.7784914545094099, "learning_rate": 1.843200953188031e-05, "loss": 0.3029, "loss_nan_ranks": 0, "loss_rank_avg": 0.2952941060066223, "step": 2510, "valid_targets_mean": 3074.2, "valid_targets_min": 1215 }, { "epoch": 4.017571884984026, "grad_norm": 0.7642112879241275, "learning_rate": 1.8352592235068735e-05, "loss": 0.3158, "loss_nan_ranks": 0, "loss_rank_avg": 0.2828487157821655, "step": 2515, "valid_targets_mean": 2811.1, "valid_targets_min": 1026 }, { "epoch": 4.02555910543131, "grad_norm": 0.8934842633384591, "learning_rate": 1.8273201083142056e-05, "loss": 0.3116, "loss_nan_ranks": 0, "loss_rank_avg": 0.3350905179977417, "step": 2520, "valid_targets_mean": 2196.1, "valid_targets_min": 1139 }, { "epoch": 4.033546325878595, "grad_norm": 0.8830460996681451, "learning_rate": 1.8193837336063096e-05, "loss": 0.308, "loss_nan_ranks": 0, "loss_rank_avg": 0.3144967257976532, "step": 2525, "valid_targets_mean": 2362.4, "valid_targets_min": 829 }, { "epoch": 4.041533546325879, "grad_norm": 0.7589694170525213, "learning_rate": 1.8114502253359745e-05, "loss": 0.3235, "loss_nan_ranks": 0, "loss_rank_avg": 0.329261839389801, "step": 2530, "valid_targets_mean": 3463.7, "valid_targets_min": 1162 }, { "epoch": 4.0495207667731625, "grad_norm": 2.6987601954147147, "learning_rate": 1.8035197094104986e-05, "loss": 0.3223, "loss_nan_ranks": 0, "loss_rank_avg": 0.3215765357017517, "step": 2535, "valid_targets_mean": 3010.8, "valid_targets_min": 1144 }, { "epoch": 4.057507987220447, "grad_norm": 0.8913192131103218, "learning_rate": 1.7955923116896908e-05, "loss": 0.344, "loss_nan_ranks": 0, "loss_rank_avg": 0.34397605061531067, "step": 2540, "valid_targets_mean": 2805.3, "valid_targets_min": 916 }, { "epoch": 4.065495207667731, "grad_norm": 0.7455487784175526, "learning_rate": 1.787668157983872e-05, "loss": 0.3207, "loss_nan_ranks": 0, "loss_rank_avg": 0.35729163885116577, "step": 2545, "valid_targets_mean": 3363.3, "valid_targets_min": 1378 }, { "epoch": 4.073482428115016, "grad_norm": 0.7873618036052649, "learning_rate": 1.779747374051881e-05, "loss": 0.3232, "loss_nan_ranks": 0, "loss_rank_avg": 0.31921112537384033, "step": 2550, "valid_targets_mean": 3040.9, "valid_targets_min": 1310 }, { "epoch": 4.0814696485623, "grad_norm": 0.7841123654379275, "learning_rate": 1.7718300855990767e-05, "loss": 0.3238, "loss_nan_ranks": 0, "loss_rank_avg": 0.30261629819869995, "step": 2555, "valid_targets_mean": 2832.1, "valid_targets_min": 1085 }, { "epoch": 4.0894568690095845, "grad_norm": 0.8354232619995942, "learning_rate": 1.7639164182753434e-05, "loss": 0.3073, "loss_nan_ranks": 0, "loss_rank_avg": 0.2939416170120239, "step": 2560, "valid_targets_mean": 2348.6, "valid_targets_min": 851 }, { "epoch": 4.097444089456869, "grad_norm": 0.8279010105207609, "learning_rate": 1.7560064976730967e-05, "loss": 0.3311, "loss_nan_ranks": 0, "loss_rank_avg": 0.2960469722747803, "step": 2565, "valid_targets_mean": 2403.9, "valid_targets_min": 1514 }, { "epoch": 4.105431309904153, "grad_norm": 0.7720855666104548, "learning_rate": 1.7481004493252915e-05, "loss": 0.3124, "loss_nan_ranks": 0, "loss_rank_avg": 0.29527148604393005, "step": 2570, "valid_targets_mean": 3140.0, "valid_targets_min": 1130 }, { "epoch": 4.113418530351438, "grad_norm": 0.8561385263509396, "learning_rate": 1.740198398703428e-05, "loss": 0.3343, "loss_nan_ranks": 0, "loss_rank_avg": 0.3038601875305176, "step": 2575, "valid_targets_mean": 2381.4, "valid_targets_min": 1130 }, { "epoch": 4.121405750798722, "grad_norm": 0.732786585841618, "learning_rate": 1.7323004712155613e-05, "loss": 0.2996, "loss_nan_ranks": 0, "loss_rank_avg": 0.31189507246017456, "step": 2580, "valid_targets_mean": 3734.1, "valid_targets_min": 1187 }, { "epoch": 4.1293929712460065, "grad_norm": 0.7953181249120669, "learning_rate": 1.724406792204312e-05, "loss": 0.3195, "loss_nan_ranks": 0, "loss_rank_avg": 0.3025287389755249, "step": 2585, "valid_targets_mean": 2656.2, "valid_targets_min": 1215 }, { "epoch": 4.137380191693291, "grad_norm": 0.7744633063634144, "learning_rate": 1.7165174869448738e-05, "loss": 0.3083, "loss_nan_ranks": 0, "loss_rank_avg": 0.2929438650608063, "step": 2590, "valid_targets_mean": 2507.7, "valid_targets_min": 1224 }, { "epoch": 4.145367412140575, "grad_norm": 0.7745147678616877, "learning_rate": 1.7086326806430298e-05, "loss": 0.2999, "loss_nan_ranks": 0, "loss_rank_avg": 0.304587721824646, "step": 2595, "valid_targets_mean": 2938.4, "valid_targets_min": 1284 }, { "epoch": 4.15335463258786, "grad_norm": 0.8991912650145979, "learning_rate": 1.7007524984331623e-05, "loss": 0.2882, "loss_nan_ranks": 0, "loss_rank_avg": 0.32008877396583557, "step": 2600, "valid_targets_mean": 2276.9, "valid_targets_min": 988 }, { "epoch": 4.161341853035144, "grad_norm": 0.8738895750174318, "learning_rate": 1.692877065376268e-05, "loss": 0.3149, "loss_nan_ranks": 0, "loss_rank_avg": 0.30264782905578613, "step": 2605, "valid_targets_mean": 2370.2, "valid_targets_min": 971 }, { "epoch": 4.169329073482428, "grad_norm": 0.8046516983143223, "learning_rate": 1.6850065064579724e-05, "loss": 0.319, "loss_nan_ranks": 0, "loss_rank_avg": 0.3758092522621155, "step": 2610, "valid_targets_mean": 2888.1, "valid_targets_min": 1101 }, { "epoch": 4.177316293929713, "grad_norm": 0.7816553623092369, "learning_rate": 1.677140946586548e-05, "loss": 0.315, "loss_nan_ranks": 0, "loss_rank_avg": 0.3018527328968048, "step": 2615, "valid_targets_mean": 3292.1, "valid_targets_min": 823 }, { "epoch": 4.185303514376997, "grad_norm": 0.7701069701455311, "learning_rate": 1.66928051059093e-05, "loss": 0.3062, "loss_nan_ranks": 0, "loss_rank_avg": 0.29624032974243164, "step": 2620, "valid_targets_mean": 3122.0, "valid_targets_min": 1020 }, { "epoch": 4.193290734824281, "grad_norm": 0.8468234652278214, "learning_rate": 1.6614253232187363e-05, "loss": 0.3236, "loss_nan_ranks": 0, "loss_rank_avg": 0.3546920120716095, "step": 2625, "valid_targets_mean": 3006.4, "valid_targets_min": 985 }, { "epoch": 4.201277955271565, "grad_norm": 0.7804812824667207, "learning_rate": 1.6535755091342876e-05, "loss": 0.318, "loss_nan_ranks": 0, "loss_rank_avg": 0.2810975909233093, "step": 2630, "valid_targets_mean": 3003.0, "valid_targets_min": 1330 }, { "epoch": 4.2092651757188495, "grad_norm": 0.8314006980762537, "learning_rate": 1.6457311929166286e-05, "loss": 0.3308, "loss_nan_ranks": 0, "loss_rank_avg": 0.3335530161857605, "step": 2635, "valid_targets_mean": 2748.6, "valid_targets_min": 797 }, { "epoch": 4.217252396166134, "grad_norm": 1.2682211032574355, "learning_rate": 1.637892499057551e-05, "loss": 0.3009, "loss_nan_ranks": 0, "loss_rank_avg": 0.32898035645484924, "step": 2640, "valid_targets_mean": 2015.6, "valid_targets_min": 1038 }, { "epoch": 4.225239616613418, "grad_norm": 0.6756060081334775, "learning_rate": 1.6300595519596177e-05, "loss": 0.3214, "loss_nan_ranks": 0, "loss_rank_avg": 0.3469483256340027, "step": 2645, "valid_targets_mean": 4125.4, "valid_targets_min": 906 }, { "epoch": 4.233226837060703, "grad_norm": 0.830457676846521, "learning_rate": 1.6222324759341897e-05, "loss": 0.318, "loss_nan_ranks": 0, "loss_rank_avg": 0.372150182723999, "step": 2650, "valid_targets_mean": 2774.6, "valid_targets_min": 978 }, { "epoch": 4.241214057507987, "grad_norm": 0.8301772168189655, "learning_rate": 1.6144113951994515e-05, "loss": 0.3055, "loss_nan_ranks": 0, "loss_rank_avg": 0.3426179885864258, "step": 2655, "valid_targets_mean": 2936.2, "valid_targets_min": 1189 }, { "epoch": 4.2492012779552715, "grad_norm": 0.7442017453136883, "learning_rate": 1.60659643387844e-05, "loss": 0.3342, "loss_nan_ranks": 0, "loss_rank_avg": 0.32107579708099365, "step": 2660, "valid_targets_mean": 3388.4, "valid_targets_min": 929 }, { "epoch": 4.257188498402556, "grad_norm": 0.7989995875352693, "learning_rate": 1.5987877159970765e-05, "loss": 0.3218, "loss_nan_ranks": 0, "loss_rank_avg": 0.3555402457714081, "step": 2665, "valid_targets_mean": 2872.1, "valid_targets_min": 1153 }, { "epoch": 4.26517571884984, "grad_norm": 0.9194992318413938, "learning_rate": 1.5909853654821947e-05, "loss": 0.3167, "loss_nan_ranks": 0, "loss_rank_avg": 0.34973281621932983, "step": 2670, "valid_targets_mean": 2280.6, "valid_targets_min": 837 }, { "epoch": 4.273162939297125, "grad_norm": 0.7793815135340966, "learning_rate": 1.583189506159579e-05, "loss": 0.3272, "loss_nan_ranks": 0, "loss_rank_avg": 0.32121002674102783, "step": 2675, "valid_targets_mean": 3233.8, "valid_targets_min": 1172 }, { "epoch": 4.281150159744409, "grad_norm": 0.7419814536244536, "learning_rate": 1.575400261751993e-05, "loss": 0.3045, "loss_nan_ranks": 0, "loss_rank_avg": 0.26411211490631104, "step": 2680, "valid_targets_mean": 2861.4, "valid_targets_min": 888 }, { "epoch": 4.289137380191693, "grad_norm": 0.8190096841902706, "learning_rate": 1.567617755877223e-05, "loss": 0.3196, "loss_nan_ranks": 0, "loss_rank_avg": 0.31602364778518677, "step": 2685, "valid_targets_mean": 3839.0, "valid_targets_min": 737 }, { "epoch": 4.297124600638978, "grad_norm": 0.8513254156626134, "learning_rate": 1.5598421120461106e-05, "loss": 0.324, "loss_nan_ranks": 0, "loss_rank_avg": 0.34726378321647644, "step": 2690, "valid_targets_mean": 3125.2, "valid_targets_min": 1159 }, { "epoch": 4.305111821086262, "grad_norm": 0.8742879239076529, "learning_rate": 1.552073453660595e-05, "loss": 0.3105, "loss_nan_ranks": 0, "loss_rank_avg": 0.2954450249671936, "step": 2695, "valid_targets_mean": 2049.4, "valid_targets_min": 1043 }, { "epoch": 4.313099041533547, "grad_norm": 0.8803976612275924, "learning_rate": 1.5443119040117544e-05, "loss": 0.3157, "loss_nan_ranks": 0, "loss_rank_avg": 0.31700998544692993, "step": 2700, "valid_targets_mean": 2607.2, "valid_targets_min": 1532 }, { "epoch": 4.321086261980831, "grad_norm": 0.7893323019925185, "learning_rate": 1.536557586277849e-05, "loss": 0.3269, "loss_nan_ranks": 0, "loss_rank_avg": 0.3041345477104187, "step": 2705, "valid_targets_mean": 3251.6, "valid_targets_min": 1152 }, { "epoch": 4.329073482428115, "grad_norm": 0.8702685258904816, "learning_rate": 1.5288106235223655e-05, "loss": 0.2964, "loss_nan_ranks": 0, "loss_rank_avg": 0.3005998730659485, "step": 2710, "valid_targets_mean": 2477.4, "valid_targets_min": 853 }, { "epoch": 4.3370607028754, "grad_norm": 0.6841522781915828, "learning_rate": 1.521071138692066e-05, "loss": 0.2959, "loss_nan_ranks": 0, "loss_rank_avg": 0.31260186433792114, "step": 2715, "valid_targets_mean": 3646.8, "valid_targets_min": 1019 }, { "epoch": 4.345047923322683, "grad_norm": 0.8793770134129358, "learning_rate": 1.5133392546150347e-05, "loss": 0.3292, "loss_nan_ranks": 0, "loss_rank_avg": 0.3228303790092468, "step": 2720, "valid_targets_mean": 2257.6, "valid_targets_min": 1119 }, { "epoch": 4.353035143769968, "grad_norm": 0.7356041781956482, "learning_rate": 1.5056150939987303e-05, "loss": 0.3233, "loss_nan_ranks": 0, "loss_rank_avg": 0.2978741526603699, "step": 2725, "valid_targets_mean": 3256.1, "valid_targets_min": 1130 }, { "epoch": 4.361022364217252, "grad_norm": 0.8575488601782734, "learning_rate": 1.4978987794280363e-05, "loss": 0.338, "loss_nan_ranks": 0, "loss_rank_avg": 0.3490545153617859, "step": 2730, "valid_targets_mean": 2729.2, "valid_targets_min": 651 }, { "epoch": 4.3690095846645365, "grad_norm": 0.8487291733521595, "learning_rate": 1.4901904333633179e-05, "loss": 0.3018, "loss_nan_ranks": 0, "loss_rank_avg": 0.3031385540962219, "step": 2735, "valid_targets_mean": 2487.4, "valid_targets_min": 969 }, { "epoch": 4.376996805111821, "grad_norm": 0.822564579116967, "learning_rate": 1.4824901781384777e-05, "loss": 0.3112, "loss_nan_ranks": 0, "loss_rank_avg": 0.2881549894809723, "step": 2740, "valid_targets_mean": 2674.9, "valid_targets_min": 876 }, { "epoch": 4.384984025559105, "grad_norm": 0.869337603970582, "learning_rate": 1.4747981359590138e-05, "loss": 0.3011, "loss_nan_ranks": 0, "loss_rank_avg": 0.3272026777267456, "step": 2745, "valid_targets_mean": 2358.8, "valid_targets_min": 1083 }, { "epoch": 4.39297124600639, "grad_norm": 0.8621433957032326, "learning_rate": 1.4671144289000806e-05, "loss": 0.3022, "loss_nan_ranks": 0, "loss_rank_avg": 0.3270319104194641, "step": 2750, "valid_targets_mean": 2623.6, "valid_targets_min": 1187 }, { "epoch": 4.400958466453674, "grad_norm": 0.7737153035103758, "learning_rate": 1.4594391789045513e-05, "loss": 0.3145, "loss_nan_ranks": 0, "loss_rank_avg": 0.3190346360206604, "step": 2755, "valid_targets_mean": 2979.1, "valid_targets_min": 957 }, { "epoch": 4.4089456869009584, "grad_norm": 0.7196118582656776, "learning_rate": 1.4517725077810835e-05, "loss": 0.285, "loss_nan_ranks": 0, "loss_rank_avg": 0.2696632146835327, "step": 2760, "valid_targets_mean": 3125.1, "valid_targets_min": 1003 }, { "epoch": 4.416932907348243, "grad_norm": 0.6494097240205376, "learning_rate": 1.4441145372021847e-05, "loss": 0.3119, "loss_nan_ranks": 0, "loss_rank_avg": 0.3023773431777954, "step": 2765, "valid_targets_mean": 3835.9, "valid_targets_min": 1076 }, { "epoch": 4.424920127795527, "grad_norm": 0.7789314639253977, "learning_rate": 1.4364653887022831e-05, "loss": 0.3075, "loss_nan_ranks": 0, "loss_rank_avg": 0.32076117396354675, "step": 2770, "valid_targets_mean": 2887.3, "valid_targets_min": 849 }, { "epoch": 4.432907348242812, "grad_norm": 0.8479733674287858, "learning_rate": 1.4288251836757956e-05, "loss": 0.3279, "loss_nan_ranks": 0, "loss_rank_avg": 0.31372612714767456, "step": 2775, "valid_targets_mean": 2776.1, "valid_targets_min": 1171 }, { "epoch": 4.440894568690096, "grad_norm": 0.7510027085556208, "learning_rate": 1.4211940433752052e-05, "loss": 0.308, "loss_nan_ranks": 0, "loss_rank_avg": 0.3128352165222168, "step": 2780, "valid_targets_mean": 3347.7, "valid_targets_min": 1018 }, { "epoch": 4.44888178913738, "grad_norm": 1.0678801727890188, "learning_rate": 1.4135720889091342e-05, "loss": 0.3116, "loss_nan_ranks": 0, "loss_rank_avg": 0.33587950468063354, "step": 2785, "valid_targets_mean": 2601.2, "valid_targets_min": 1071 }, { "epoch": 4.456869009584665, "grad_norm": 0.7024654713140126, "learning_rate": 1.4059594412404227e-05, "loss": 0.3257, "loss_nan_ranks": 0, "loss_rank_avg": 0.28195154666900635, "step": 2790, "valid_targets_mean": 3657.8, "valid_targets_min": 1431 }, { "epoch": 4.464856230031949, "grad_norm": 0.7937537911917101, "learning_rate": 1.3983562211842094e-05, "loss": 0.3259, "loss_nan_ranks": 0, "loss_rank_avg": 0.30999305844306946, "step": 2795, "valid_targets_mean": 3226.8, "valid_targets_min": 1176 }, { "epoch": 4.472843450479234, "grad_norm": 0.8150515310476798, "learning_rate": 1.390762549406013e-05, "loss": 0.3078, "loss_nan_ranks": 0, "loss_rank_avg": 0.33410537242889404, "step": 2800, "valid_targets_mean": 2873.4, "valid_targets_min": 983 }, { "epoch": 4.480830670926517, "grad_norm": 0.7481249885495977, "learning_rate": 1.3831785464198188e-05, "loss": 0.3131, "loss_nan_ranks": 0, "loss_rank_avg": 0.3242833912372589, "step": 2805, "valid_targets_mean": 3249.0, "valid_targets_min": 924 }, { "epoch": 4.488817891373802, "grad_norm": 0.8863393546681068, "learning_rate": 1.3756043325861648e-05, "loss": 0.2866, "loss_nan_ranks": 0, "loss_rank_avg": 0.30686694383621216, "step": 2810, "valid_targets_mean": 2602.9, "valid_targets_min": 1229 }, { "epoch": 4.496805111821086, "grad_norm": 0.8894834385161677, "learning_rate": 1.3680400281102326e-05, "loss": 0.2936, "loss_nan_ranks": 0, "loss_rank_avg": 0.2976420521736145, "step": 2815, "valid_targets_mean": 2074.1, "valid_targets_min": 1041 }, { "epoch": 4.50479233226837, "grad_norm": 0.9310689795086521, "learning_rate": 1.3604857530399378e-05, "loss": 0.3377, "loss_nan_ranks": 0, "loss_rank_avg": 0.40471312403678894, "step": 2820, "valid_targets_mean": 2295.2, "valid_targets_min": 430 }, { "epoch": 4.512779552715655, "grad_norm": 0.7523089341040629, "learning_rate": 1.3529416272640278e-05, "loss": 0.325, "loss_nan_ranks": 0, "loss_rank_avg": 0.2931872308254242, "step": 2825, "valid_targets_mean": 2772.8, "valid_targets_min": 1438 }, { "epoch": 4.520766773162939, "grad_norm": 0.8964434235440402, "learning_rate": 1.3454077705101766e-05, "loss": 0.3297, "loss_nan_ranks": 0, "loss_rank_avg": 0.35491257905960083, "step": 2830, "valid_targets_mean": 2291.6, "valid_targets_min": 857 }, { "epoch": 4.5287539936102235, "grad_norm": 0.7823384694721772, "learning_rate": 1.3378843023430856e-05, "loss": 0.3119, "loss_nan_ranks": 0, "loss_rank_avg": 0.3356529772281647, "step": 2835, "valid_targets_mean": 3122.6, "valid_targets_min": 1283 }, { "epoch": 4.536741214057508, "grad_norm": 0.8162940884992557, "learning_rate": 1.3303713421625864e-05, "loss": 0.3014, "loss_nan_ranks": 0, "loss_rank_avg": 0.30902934074401855, "step": 2840, "valid_targets_mean": 2529.6, "valid_targets_min": 992 }, { "epoch": 4.544728434504792, "grad_norm": 0.7970840712086852, "learning_rate": 1.3228690092017452e-05, "loss": 0.3078, "loss_nan_ranks": 0, "loss_rank_avg": 0.29649817943573, "step": 2845, "valid_targets_mean": 2565.8, "valid_targets_min": 1298 }, { "epoch": 4.552715654952077, "grad_norm": 0.8158566717200522, "learning_rate": 1.3153774225249705e-05, "loss": 0.3194, "loss_nan_ranks": 0, "loss_rank_avg": 0.33489930629730225, "step": 2850, "valid_targets_mean": 2931.1, "valid_targets_min": 1587 }, { "epoch": 4.560702875399361, "grad_norm": 0.9705943358780271, "learning_rate": 1.3078967010261243e-05, "loss": 0.317, "loss_nan_ranks": 0, "loss_rank_avg": 0.36530590057373047, "step": 2855, "valid_targets_mean": 2347.4, "valid_targets_min": 659 }, { "epoch": 4.568690095846645, "grad_norm": 0.867288807597881, "learning_rate": 1.3004269634266357e-05, "loss": 0.3355, "loss_nan_ranks": 0, "loss_rank_avg": 0.3266403079032898, "step": 2860, "valid_targets_mean": 2646.6, "valid_targets_min": 864 }, { "epoch": 4.57667731629393, "grad_norm": 0.85633385349373, "learning_rate": 1.2929683282736135e-05, "loss": 0.309, "loss_nan_ranks": 0, "loss_rank_avg": 0.31155091524124146, "step": 2865, "valid_targets_mean": 2291.2, "valid_targets_min": 1044 }, { "epoch": 4.584664536741214, "grad_norm": 0.8733957612598485, "learning_rate": 1.285520913937969e-05, "loss": 0.3373, "loss_nan_ranks": 0, "loss_rank_avg": 0.3596514165401459, "step": 2870, "valid_targets_mean": 2465.4, "valid_targets_min": 697 }, { "epoch": 4.592651757188499, "grad_norm": 0.8439557548254832, "learning_rate": 1.2780848386125354e-05, "loss": 0.341, "loss_nan_ranks": 0, "loss_rank_avg": 0.3084920644760132, "step": 2875, "valid_targets_mean": 2439.3, "valid_targets_min": 1096 }, { "epoch": 4.600638977635783, "grad_norm": 0.7574914303418859, "learning_rate": 1.2706602203101913e-05, "loss": 0.3158, "loss_nan_ranks": 0, "loss_rank_avg": 0.2827756404876709, "step": 2880, "valid_targets_mean": 2762.9, "valid_targets_min": 860 }, { "epoch": 4.608626198083067, "grad_norm": 0.8187552779251025, "learning_rate": 1.2632471768619894e-05, "loss": 0.3173, "loss_nan_ranks": 0, "loss_rank_avg": 0.3288748860359192, "step": 2885, "valid_targets_mean": 2768.2, "valid_targets_min": 1053 }, { "epoch": 4.616613418530352, "grad_norm": 0.7875128783332611, "learning_rate": 1.255845825915286e-05, "loss": 0.3168, "loss_nan_ranks": 0, "loss_rank_avg": 0.29355835914611816, "step": 2890, "valid_targets_mean": 2613.6, "valid_targets_min": 1075 }, { "epoch": 4.624600638977636, "grad_norm": 0.8034781377355279, "learning_rate": 1.248456284931873e-05, "loss": 0.3117, "loss_nan_ranks": 0, "loss_rank_avg": 0.3028643727302551, "step": 2895, "valid_targets_mean": 2869.2, "valid_targets_min": 1386 }, { "epoch": 4.63258785942492, "grad_norm": 0.7962900798710767, "learning_rate": 1.241078671186115e-05, "loss": 0.3131, "loss_nan_ranks": 0, "loss_rank_avg": 0.346049040555954, "step": 2900, "valid_targets_mean": 2883.4, "valid_targets_min": 1294 }, { "epoch": 4.640575079872205, "grad_norm": 0.8023873273428883, "learning_rate": 1.2337131017630873e-05, "loss": 0.3048, "loss_nan_ranks": 0, "loss_rank_avg": 0.3004358410835266, "step": 2905, "valid_targets_mean": 2556.7, "valid_targets_min": 891 }, { "epoch": 4.6485623003194885, "grad_norm": 0.8977806884389504, "learning_rate": 1.2263596935567175e-05, "loss": 0.3213, "loss_nan_ranks": 0, "loss_rank_avg": 0.32839423418045044, "step": 2910, "valid_targets_mean": 3472.2, "valid_targets_min": 1178 }, { "epoch": 4.656549520766773, "grad_norm": 0.7106582489525565, "learning_rate": 1.2190185632679316e-05, "loss": 0.3118, "loss_nan_ranks": 0, "loss_rank_avg": 0.2885178327560425, "step": 2915, "valid_targets_mean": 3290.6, "valid_targets_min": 912 }, { "epoch": 4.664536741214057, "grad_norm": 0.667191215845006, "learning_rate": 1.2116898274028008e-05, "loss": 0.3185, "loss_nan_ranks": 0, "loss_rank_avg": 0.2748382091522217, "step": 2920, "valid_targets_mean": 4097.6, "valid_targets_min": 1180 }, { "epoch": 4.672523961661342, "grad_norm": 0.8255323403479464, "learning_rate": 1.2043736022706934e-05, "loss": 0.3245, "loss_nan_ranks": 0, "loss_rank_avg": 0.34103143215179443, "step": 2925, "valid_targets_mean": 2534.6, "valid_targets_min": 1061 }, { "epoch": 4.680511182108626, "grad_norm": 1.0630168206337054, "learning_rate": 1.1970700039824271e-05, "loss": 0.3399, "loss_nan_ranks": 0, "loss_rank_avg": 0.3425711989402771, "step": 2930, "valid_targets_mean": 2254.5, "valid_targets_min": 742 }, { "epoch": 4.68849840255591, "grad_norm": 0.8323979797486944, "learning_rate": 1.1897791484484284e-05, "loss": 0.3184, "loss_nan_ranks": 0, "loss_rank_avg": 0.31606024503707886, "step": 2935, "valid_targets_mean": 2571.6, "valid_targets_min": 747 }, { "epoch": 4.696485623003195, "grad_norm": 0.7798233457306829, "learning_rate": 1.182501151376893e-05, "loss": 0.3021, "loss_nan_ranks": 0, "loss_rank_avg": 0.2969059944152832, "step": 2940, "valid_targets_mean": 2631.4, "valid_targets_min": 1289 }, { "epoch": 4.704472843450479, "grad_norm": 0.717355278192079, "learning_rate": 1.1752361282719472e-05, "loss": 0.3141, "loss_nan_ranks": 0, "loss_rank_avg": 0.2805374264717102, "step": 2945, "valid_targets_mean": 3219.2, "valid_targets_min": 1478 }, { "epoch": 4.712460063897764, "grad_norm": 0.8644521598904813, "learning_rate": 1.1679841944318171e-05, "loss": 0.3269, "loss_nan_ranks": 0, "loss_rank_avg": 0.317280113697052, "step": 2950, "valid_targets_mean": 2483.1, "valid_targets_min": 927 }, { "epoch": 4.720447284345048, "grad_norm": 0.8645726435153137, "learning_rate": 1.1607454649469991e-05, "loss": 0.3173, "loss_nan_ranks": 0, "loss_rank_avg": 0.2650579810142517, "step": 2955, "valid_targets_mean": 2288.5, "valid_targets_min": 869 }, { "epoch": 4.728434504792332, "grad_norm": 0.7976688949944475, "learning_rate": 1.1535200546984291e-05, "loss": 0.3142, "loss_nan_ranks": 0, "loss_rank_avg": 0.30540648102760315, "step": 2960, "valid_targets_mean": 2663.8, "valid_targets_min": 1342 }, { "epoch": 4.736421725239617, "grad_norm": 0.8664261433843101, "learning_rate": 1.1463080783556663e-05, "loss": 0.3082, "loss_nan_ranks": 0, "loss_rank_avg": 0.3349177837371826, "step": 2965, "valid_targets_mean": 2668.2, "valid_targets_min": 1079 }, { "epoch": 4.744408945686901, "grad_norm": 0.7406641800839713, "learning_rate": 1.139109650375066e-05, "loss": 0.3318, "loss_nan_ranks": 0, "loss_rank_avg": 0.3015572130680084, "step": 2970, "valid_targets_mean": 3056.8, "valid_targets_min": 1715 }, { "epoch": 4.752396166134186, "grad_norm": 0.857312699295414, "learning_rate": 1.1319248849979705e-05, "loss": 0.3126, "loss_nan_ranks": 0, "loss_rank_avg": 0.35463592410087585, "step": 2975, "valid_targets_mean": 3039.2, "valid_targets_min": 1433 }, { "epoch": 4.76038338658147, "grad_norm": 0.8450913381311652, "learning_rate": 1.1247538962488882e-05, "loss": 0.3274, "loss_nan_ranks": 0, "loss_rank_avg": 0.3202403783798218, "step": 2980, "valid_targets_mean": 2744.7, "valid_targets_min": 901 }, { "epoch": 4.768370607028754, "grad_norm": 0.7830697313162523, "learning_rate": 1.1175967979336913e-05, "loss": 0.3181, "loss_nan_ranks": 0, "loss_rank_avg": 0.3308242857456207, "step": 2985, "valid_targets_mean": 3116.3, "valid_targets_min": 1017 }, { "epoch": 4.776357827476039, "grad_norm": 0.7830125935395612, "learning_rate": 1.1104537036378054e-05, "loss": 0.3144, "loss_nan_ranks": 0, "loss_rank_avg": 0.3096255660057068, "step": 2990, "valid_targets_mean": 3076.9, "valid_targets_min": 1036 }, { "epoch": 4.784345047923322, "grad_norm": 0.8355403682431177, "learning_rate": 1.1033247267244063e-05, "loss": 0.3023, "loss_nan_ranks": 0, "loss_rank_avg": 0.30156558752059937, "step": 2995, "valid_targets_mean": 2738.4, "valid_targets_min": 1026 }, { "epoch": 4.792332268370607, "grad_norm": 0.7250424081419844, "learning_rate": 1.0962099803326257e-05, "loss": 0.313, "loss_nan_ranks": 0, "loss_rank_avg": 0.28947603702545166, "step": 3000, "valid_targets_mean": 3327.1, "valid_targets_min": 931 }, { "epoch": 4.800319488817891, "grad_norm": 0.9386381305034504, "learning_rate": 1.089109577375748e-05, "loss": 0.321, "loss_nan_ranks": 0, "loss_rank_avg": 0.33451300859451294, "step": 3005, "valid_targets_mean": 1926.2, "valid_targets_min": 949 }, { "epoch": 4.8083067092651754, "grad_norm": 0.9607923151156983, "learning_rate": 1.082023630539427e-05, "loss": 0.3235, "loss_nan_ranks": 0, "loss_rank_avg": 0.3341418504714966, "step": 3010, "valid_targets_mean": 2006.8, "valid_targets_min": 944 }, { "epoch": 4.81629392971246, "grad_norm": 0.8329571872141134, "learning_rate": 1.07495225227989e-05, "loss": 0.3236, "loss_nan_ranks": 0, "loss_rank_avg": 0.35894811153411865, "step": 3015, "valid_targets_mean": 2908.5, "valid_targets_min": 887 }, { "epoch": 4.824281150159744, "grad_norm": 0.8370383236843801, "learning_rate": 1.0678955548221595e-05, "loss": 0.3333, "loss_nan_ranks": 0, "loss_rank_avg": 0.3370824456214905, "step": 3020, "valid_targets_mean": 2618.8, "valid_targets_min": 1134 }, { "epoch": 4.832268370607029, "grad_norm": 0.9448990709923799, "learning_rate": 1.0608536501582654e-05, "loss": 0.3193, "loss_nan_ranks": 0, "loss_rank_avg": 0.34659168124198914, "step": 3025, "valid_targets_mean": 2263.4, "valid_targets_min": 1230 }, { "epoch": 4.840255591054313, "grad_norm": 0.8223141685878618, "learning_rate": 1.0538266500454739e-05, "loss": 0.3247, "loss_nan_ranks": 0, "loss_rank_avg": 0.35333919525146484, "step": 3030, "valid_targets_mean": 3194.6, "valid_targets_min": 960 }, { "epoch": 4.848242811501597, "grad_norm": 0.8144903161010786, "learning_rate": 1.0468146660045118e-05, "loss": 0.3077, "loss_nan_ranks": 0, "loss_rank_avg": 0.2987595498561859, "step": 3035, "valid_targets_mean": 2810.4, "valid_targets_min": 681 }, { "epoch": 4.856230031948882, "grad_norm": 0.9075766431749717, "learning_rate": 1.0398178093177928e-05, "loss": 0.3062, "loss_nan_ranks": 0, "loss_rank_avg": 0.3274604380130768, "step": 3040, "valid_targets_mean": 2483.5, "valid_targets_min": 948 }, { "epoch": 4.864217252396166, "grad_norm": 0.7273114917343588, "learning_rate": 1.0328361910276592e-05, "loss": 0.3291, "loss_nan_ranks": 0, "loss_rank_avg": 0.3381314277648926, "step": 3045, "valid_targets_mean": 3621.1, "valid_targets_min": 1769 }, { "epoch": 4.872204472843451, "grad_norm": 0.7820761358000989, "learning_rate": 1.0258699219346091e-05, "loss": 0.3008, "loss_nan_ranks": 0, "loss_rank_avg": 0.27850645780563354, "step": 3050, "valid_targets_mean": 3137.2, "valid_targets_min": 1036 }, { "epoch": 4.880191693290735, "grad_norm": 0.8361404113450691, "learning_rate": 1.0189191125955503e-05, "loss": 0.301, "loss_nan_ranks": 0, "loss_rank_avg": 0.328288197517395, "step": 3055, "valid_targets_mean": 2804.3, "valid_targets_min": 1316 }, { "epoch": 4.888178913738019, "grad_norm": 0.8866370829805829, "learning_rate": 1.0119838733220342e-05, "loss": 0.3223, "loss_nan_ranks": 0, "loss_rank_avg": 0.30976438522338867, "step": 3060, "valid_targets_mean": 2255.0, "valid_targets_min": 1081 }, { "epoch": 4.896166134185304, "grad_norm": 0.7548674340256988, "learning_rate": 1.0050643141785148e-05, "loss": 0.323, "loss_nan_ranks": 0, "loss_rank_avg": 0.296387642621994, "step": 3065, "valid_targets_mean": 2844.9, "valid_targets_min": 1408 }, { "epoch": 4.904153354632588, "grad_norm": 0.8332532662745489, "learning_rate": 9.981605449805933e-06, "loss": 0.3032, "loss_nan_ranks": 0, "loss_rank_avg": 0.2925332188606262, "step": 3070, "valid_targets_mean": 2291.7, "valid_targets_min": 1238 }, { "epoch": 4.912140575079873, "grad_norm": 0.8598926872352152, "learning_rate": 9.912726752932823e-06, "loss": 0.3198, "loss_nan_ranks": 0, "loss_rank_avg": 0.32179611921310425, "step": 3075, "valid_targets_mean": 2410.4, "valid_targets_min": 1110 }, { "epoch": 4.920127795527156, "grad_norm": 0.7424748231440373, "learning_rate": 9.844008144292643e-06, "loss": 0.3215, "loss_nan_ranks": 0, "loss_rank_avg": 0.29315125942230225, "step": 3080, "valid_targets_mean": 3143.2, "valid_targets_min": 1075 }, { "epoch": 4.928115015974441, "grad_norm": 0.9235518733511646, "learning_rate": 9.775450714471537e-06, "loss": 0.3421, "loss_nan_ranks": 0, "loss_rank_avg": 0.3396497070789337, "step": 3085, "valid_targets_mean": 2151.2, "valid_targets_min": 972 }, { "epoch": 4.936102236421725, "grad_norm": 0.6816211371601565, "learning_rate": 9.707055551497734e-06, "loss": 0.3167, "loss_nan_ranks": 0, "loss_rank_avg": 0.29893457889556885, "step": 3090, "valid_targets_mean": 3611.6, "valid_targets_min": 1289 }, { "epoch": 4.944089456869009, "grad_norm": 0.8170219219392088, "learning_rate": 9.638823740824177e-06, "loss": 0.3062, "loss_nan_ranks": 0, "loss_rank_avg": 0.2988799214363098, "step": 3095, "valid_targets_mean": 2490.7, "valid_targets_min": 1019 }, { "epoch": 4.952076677316294, "grad_norm": 0.7458396020996966, "learning_rate": 9.570756365311418e-06, "loss": 0.3027, "loss_nan_ranks": 0, "loss_rank_avg": 0.32337093353271484, "step": 3100, "valid_targets_mean": 3530.2, "valid_targets_min": 1258 }, { "epoch": 4.960063897763578, "grad_norm": 0.7455812050660711, "learning_rate": 9.502854505210326e-06, "loss": 0.3015, "loss_nan_ranks": 0, "loss_rank_avg": 0.3213096857070923, "step": 3105, "valid_targets_mean": 2728.7, "valid_targets_min": 1108 }, { "epoch": 4.968051118210862, "grad_norm": 0.7843594515963668, "learning_rate": 9.435119238145018e-06, "loss": 0.3067, "loss_nan_ranks": 0, "loss_rank_avg": 0.3219505548477173, "step": 3110, "valid_targets_mean": 3162.7, "valid_targets_min": 357 }, { "epoch": 4.976038338658147, "grad_norm": 0.7656830597494546, "learning_rate": 9.367551639095704e-06, "loss": 0.3371, "loss_nan_ranks": 0, "loss_rank_avg": 0.33506011962890625, "step": 3115, "valid_targets_mean": 3141.4, "valid_targets_min": 1192 }, { "epoch": 4.984025559105431, "grad_norm": 0.9724543109745135, "learning_rate": 9.300152780381664e-06, "loss": 0.3199, "loss_nan_ranks": 0, "loss_rank_avg": 0.3792024254798889, "step": 3120, "valid_targets_mean": 2552.1, "valid_targets_min": 875 }, { "epoch": 4.992012779552716, "grad_norm": 0.748363011262852, "learning_rate": 9.232923731644216e-06, "loss": 0.2987, "loss_nan_ranks": 0, "loss_rank_avg": 0.2932063043117523, "step": 3125, "valid_targets_mean": 3223.9, "valid_targets_min": 1187 }, { "epoch": 5.0, "grad_norm": 0.7872370648886844, "learning_rate": 9.16586555982972e-06, "loss": 0.2881, "loss_nan_ranks": 0, "loss_rank_avg": 0.28079310059547424, "step": 3130, "valid_targets_mean": 2799.1, "valid_targets_min": 1113 }, { "epoch": 5.007987220447284, "grad_norm": 0.7939193129172704, "learning_rate": 9.098979329172702e-06, "loss": 0.2822, "loss_nan_ranks": 0, "loss_rank_avg": 0.27301716804504395, "step": 3135, "valid_targets_mean": 2498.5, "valid_targets_min": 732 }, { "epoch": 5.015974440894569, "grad_norm": 0.8161794104869049, "learning_rate": 9.032266101178872e-06, "loss": 0.2785, "loss_nan_ranks": 0, "loss_rank_avg": 0.30852165818214417, "step": 3140, "valid_targets_mean": 2731.8, "valid_targets_min": 857 }, { "epoch": 5.023961661341853, "grad_norm": 0.9254348282198132, "learning_rate": 8.965726934608392e-06, "loss": 0.2954, "loss_nan_ranks": 0, "loss_rank_avg": 0.2905504107475281, "step": 3145, "valid_targets_mean": 2591.9, "valid_targets_min": 913 }, { "epoch": 5.031948881789138, "grad_norm": 0.6971325615014937, "learning_rate": 8.899362885458964e-06, "loss": 0.3092, "loss_nan_ranks": 0, "loss_rank_avg": 0.28469550609588623, "step": 3150, "valid_targets_mean": 3842.1, "valid_targets_min": 990 }, { "epoch": 5.039936102236422, "grad_norm": 0.8228394781114576, "learning_rate": 8.833175006949165e-06, "loss": 0.2833, "loss_nan_ranks": 0, "loss_rank_avg": 0.2873718738555908, "step": 3155, "valid_targets_mean": 2796.2, "valid_targets_min": 690 }, { "epoch": 5.047923322683706, "grad_norm": 0.7756264018207162, "learning_rate": 8.767164349501648e-06, "loss": 0.3061, "loss_nan_ranks": 0, "loss_rank_avg": 0.2786628305912018, "step": 3160, "valid_targets_mean": 3256.9, "valid_targets_min": 1270 }, { "epoch": 5.055910543130991, "grad_norm": 0.9177797446364668, "learning_rate": 8.70133196072654e-06, "loss": 0.2984, "loss_nan_ranks": 0, "loss_rank_avg": 0.31999728083610535, "step": 3165, "valid_targets_mean": 2434.4, "valid_targets_min": 1327 }, { "epoch": 5.063897763578275, "grad_norm": 0.8631163026077268, "learning_rate": 8.63567888540478e-06, "loss": 0.2916, "loss_nan_ranks": 0, "loss_rank_avg": 0.3382035493850708, "step": 3170, "valid_targets_mean": 2910.9, "valid_targets_min": 1067 }, { "epoch": 5.0718849840255595, "grad_norm": 0.8946157821444155, "learning_rate": 8.570206165471535e-06, "loss": 0.3027, "loss_nan_ranks": 0, "loss_rank_avg": 0.2751600742340088, "step": 3175, "valid_targets_mean": 2490.8, "valid_targets_min": 755 }, { "epoch": 5.079872204472843, "grad_norm": 0.8297010600531302, "learning_rate": 8.504914839999691e-06, "loss": 0.2823, "loss_nan_ranks": 0, "loss_rank_avg": 0.27816468477249146, "step": 3180, "valid_targets_mean": 2886.9, "valid_targets_min": 1381 }, { "epoch": 5.087859424920127, "grad_norm": 0.8507115440982196, "learning_rate": 8.439805945183333e-06, "loss": 0.2926, "loss_nan_ranks": 0, "loss_rank_avg": 0.2772366404533386, "step": 3185, "valid_targets_mean": 2524.4, "valid_targets_min": 852 }, { "epoch": 5.095846645367412, "grad_norm": 0.807103384546817, "learning_rate": 8.374880514321318e-06, "loss": 0.2886, "loss_nan_ranks": 0, "loss_rank_avg": 0.27188539505004883, "step": 3190, "valid_targets_mean": 2683.4, "valid_targets_min": 1022 }, { "epoch": 5.103833865814696, "grad_norm": 1.7728666178247663, "learning_rate": 8.310139577800864e-06, "loss": 0.2868, "loss_nan_ranks": 0, "loss_rank_avg": 0.3083685636520386, "step": 3195, "valid_targets_mean": 3117.4, "valid_targets_min": 1083 }, { "epoch": 5.111821086261981, "grad_norm": 0.8170861054810535, "learning_rate": 8.245584163081228e-06, "loss": 0.2957, "loss_nan_ranks": 0, "loss_rank_avg": 0.28269141912460327, "step": 3200, "valid_targets_mean": 3077.5, "valid_targets_min": 1317 }, { "epoch": 5.119808306709265, "grad_norm": 0.9004835635106335, "learning_rate": 8.18121529467735e-06, "loss": 0.2927, "loss_nan_ranks": 0, "loss_rank_avg": 0.3067591190338135, "step": 3205, "valid_targets_mean": 3360.2, "valid_targets_min": 1502 }, { "epoch": 5.127795527156549, "grad_norm": 0.7289161691303735, "learning_rate": 8.117033994143635e-06, "loss": 0.2799, "loss_nan_ranks": 0, "loss_rank_avg": 0.269919216632843, "step": 3210, "valid_targets_mean": 3433.9, "valid_targets_min": 1040 }, { "epoch": 5.135782747603834, "grad_norm": 0.8262371961557731, "learning_rate": 8.053041280057733e-06, "loss": 0.2863, "loss_nan_ranks": 0, "loss_rank_avg": 0.30624669790267944, "step": 3215, "valid_targets_mean": 3221.0, "valid_targets_min": 1568 }, { "epoch": 5.143769968051118, "grad_norm": 0.8907753230016606, "learning_rate": 7.989238168004347e-06, "loss": 0.3004, "loss_nan_ranks": 0, "loss_rank_avg": 0.29566720128059387, "step": 3220, "valid_targets_mean": 2364.5, "valid_targets_min": 964 }, { "epoch": 5.151757188498403, "grad_norm": 0.7773585981365254, "learning_rate": 7.925625670559158e-06, "loss": 0.3173, "loss_nan_ranks": 0, "loss_rank_avg": 0.3160741925239563, "step": 3225, "valid_targets_mean": 3290.5, "valid_targets_min": 816 }, { "epoch": 5.159744408945687, "grad_norm": 0.798268114199115, "learning_rate": 7.862204797272716e-06, "loss": 0.2828, "loss_nan_ranks": 0, "loss_rank_avg": 0.2718545198440552, "step": 3230, "valid_targets_mean": 3023.7, "valid_targets_min": 357 }, { "epoch": 5.167731629392971, "grad_norm": 0.8348325476127518, "learning_rate": 7.798976554654438e-06, "loss": 0.3014, "loss_nan_ranks": 0, "loss_rank_avg": 0.30119389295578003, "step": 3235, "valid_targets_mean": 2845.3, "valid_targets_min": 1075 }, { "epoch": 5.175718849840256, "grad_norm": 0.8607243588387653, "learning_rate": 7.73594194615663e-06, "loss": 0.3021, "loss_nan_ranks": 0, "loss_rank_avg": 0.3085380494594574, "step": 3240, "valid_targets_mean": 3279.1, "valid_targets_min": 1584 }, { "epoch": 5.18370607028754, "grad_norm": 0.8423375550417697, "learning_rate": 7.673101972158572e-06, "loss": 0.2897, "loss_nan_ranks": 0, "loss_rank_avg": 0.27567416429519653, "step": 3245, "valid_targets_mean": 3083.5, "valid_targets_min": 1024 }, { "epoch": 5.1916932907348246, "grad_norm": 0.852032784496535, "learning_rate": 7.610457629950621e-06, "loss": 0.287, "loss_nan_ranks": 0, "loss_rank_avg": 0.31364840269088745, "step": 3250, "valid_targets_mean": 2934.4, "valid_targets_min": 812 }, { "epoch": 5.199680511182109, "grad_norm": 0.893030105220023, "learning_rate": 7.548009913718402e-06, "loss": 0.2944, "loss_nan_ranks": 0, "loss_rank_avg": 0.30386775732040405, "step": 3255, "valid_targets_mean": 2715.1, "valid_targets_min": 876 }, { "epoch": 5.207667731629393, "grad_norm": 0.8002908602580624, "learning_rate": 7.485759814527034e-06, "loss": 0.2828, "loss_nan_ranks": 0, "loss_rank_avg": 0.22816193103790283, "step": 3260, "valid_targets_mean": 2609.4, "valid_targets_min": 873 }, { "epoch": 5.215654952076678, "grad_norm": 0.8435557857370886, "learning_rate": 7.423708320305361e-06, "loss": 0.3042, "loss_nan_ranks": 0, "loss_rank_avg": 0.3217226564884186, "step": 3265, "valid_targets_mean": 3110.6, "valid_targets_min": 958 }, { "epoch": 5.223642172523961, "grad_norm": 0.8017066205902743, "learning_rate": 7.361856415830335e-06, "loss": 0.3095, "loss_nan_ranks": 0, "loss_rank_avg": 0.31609028577804565, "step": 3270, "valid_targets_mean": 3048.7, "valid_targets_min": 1242 }, { "epoch": 5.231629392971246, "grad_norm": 0.7893657441141547, "learning_rate": 7.300205082711336e-06, "loss": 0.3058, "loss_nan_ranks": 0, "loss_rank_avg": 0.28325214982032776, "step": 3275, "valid_targets_mean": 2750.2, "valid_targets_min": 949 }, { "epoch": 5.23961661341853, "grad_norm": 0.819627997431354, "learning_rate": 7.2387552993746204e-06, "loss": 0.3016, "loss_nan_ranks": 0, "loss_rank_avg": 0.3147261440753937, "step": 3280, "valid_targets_mean": 3124.6, "valid_targets_min": 1264 }, { "epoch": 5.247603833865814, "grad_norm": 0.9351538022500683, "learning_rate": 7.177508041047769e-06, "loss": 0.289, "loss_nan_ranks": 0, "loss_rank_avg": 0.2968599200248718, "step": 3285, "valid_targets_mean": 2553.6, "valid_targets_min": 815 }, { "epoch": 5.255591054313099, "grad_norm": 0.7977468970245414, "learning_rate": 7.116464279744262e-06, "loss": 0.2921, "loss_nan_ranks": 0, "loss_rank_avg": 0.29074782133102417, "step": 3290, "valid_targets_mean": 3356.4, "valid_targets_min": 877 }, { "epoch": 5.263578274760383, "grad_norm": 1.0002932413081114, "learning_rate": 7.055624984247977e-06, "loss": 0.3092, "loss_nan_ranks": 0, "loss_rank_avg": 0.29408007860183716, "step": 3295, "valid_targets_mean": 2184.9, "valid_targets_min": 861 }, { "epoch": 5.271565495207668, "grad_norm": 0.8787187369922238, "learning_rate": 6.9949911200978805e-06, "loss": 0.3088, "loss_nan_ranks": 0, "loss_rank_avg": 0.3129739463329315, "step": 3300, "valid_targets_mean": 2784.6, "valid_targets_min": 1331 }, { "epoch": 5.279552715654952, "grad_norm": 0.7688302677974961, "learning_rate": 6.934563649572678e-06, "loss": 0.2987, "loss_nan_ranks": 0, "loss_rank_avg": 0.3016201853752136, "step": 3305, "valid_targets_mean": 3469.8, "valid_targets_min": 974 }, { "epoch": 5.287539936102236, "grad_norm": 0.9959524806904558, "learning_rate": 6.874343531675521e-06, "loss": 0.3028, "loss_nan_ranks": 0, "loss_rank_avg": 0.28774166107177734, "step": 3310, "valid_targets_mean": 2686.1, "valid_targets_min": 1122 }, { "epoch": 5.295527156549521, "grad_norm": 0.7733058351207257, "learning_rate": 6.814331722118837e-06, "loss": 0.2782, "loss_nan_ranks": 0, "loss_rank_avg": 0.26841095089912415, "step": 3315, "valid_targets_mean": 3147.9, "valid_targets_min": 970 }, { "epoch": 5.303514376996805, "grad_norm": 0.9011760987645664, "learning_rate": 6.754529173309112e-06, "loss": 0.2852, "loss_nan_ranks": 0, "loss_rank_avg": 0.30054977536201477, "step": 3320, "valid_targets_mean": 3109.7, "valid_targets_min": 1123 }, { "epoch": 5.31150159744409, "grad_norm": 0.9298325145703232, "learning_rate": 6.694936834331809e-06, "loss": 0.2958, "loss_nan_ranks": 0, "loss_rank_avg": 0.3050529956817627, "step": 3325, "valid_targets_mean": 2623.0, "valid_targets_min": 1197 }, { "epoch": 5.319488817891374, "grad_norm": 1.064260914169855, "learning_rate": 6.635555650936278e-06, "loss": 0.2968, "loss_nan_ranks": 0, "loss_rank_avg": 0.2775145173072815, "step": 3330, "valid_targets_mean": 2871.4, "valid_targets_min": 962 }, { "epoch": 5.327476038338658, "grad_norm": 1.0158736615306445, "learning_rate": 6.576386565520794e-06, "loss": 0.2873, "loss_nan_ranks": 0, "loss_rank_avg": 0.29485511779785156, "step": 3335, "valid_targets_mean": 2650.2, "valid_targets_min": 918 }, { "epoch": 5.335463258785943, "grad_norm": 0.870400658138986, "learning_rate": 6.5174305171175336e-06, "loss": 0.3046, "loss_nan_ranks": 0, "loss_rank_avg": 0.30564117431640625, "step": 3340, "valid_targets_mean": 2673.1, "valid_targets_min": 944 }, { "epoch": 5.343450479233227, "grad_norm": 0.9219545531854473, "learning_rate": 6.458688441377734e-06, "loss": 0.2822, "loss_nan_ranks": 0, "loss_rank_avg": 0.3267873227596283, "step": 3345, "valid_targets_mean": 2452.8, "valid_targets_min": 1007 }, { "epoch": 5.3514376996805115, "grad_norm": 0.8548078329069492, "learning_rate": 6.400161270556817e-06, "loss": 0.2882, "loss_nan_ranks": 0, "loss_rank_avg": 0.32129526138305664, "step": 3350, "valid_targets_mean": 2940.7, "valid_targets_min": 1154 }, { "epoch": 5.359424920127796, "grad_norm": 0.8829397660322249, "learning_rate": 6.341849933499573e-06, "loss": 0.3013, "loss_nan_ranks": 0, "loss_rank_avg": 0.3029319941997528, "step": 3355, "valid_targets_mean": 2987.6, "valid_targets_min": 1235 }, { "epoch": 5.36741214057508, "grad_norm": 0.8530974806686331, "learning_rate": 6.283755355625472e-06, "loss": 0.3018, "loss_nan_ranks": 0, "loss_rank_avg": 0.2870420217514038, "step": 3360, "valid_targets_mean": 2990.7, "valid_targets_min": 1015 }, { "epoch": 5.375399361022364, "grad_norm": 0.9145905408930249, "learning_rate": 6.225878458913917e-06, "loss": 0.2968, "loss_nan_ranks": 0, "loss_rank_avg": 0.2793818414211273, "step": 3365, "valid_targets_mean": 2471.1, "valid_targets_min": 1095 }, { "epoch": 5.383386581469648, "grad_norm": 0.8855698711753888, "learning_rate": 6.168220161889678e-06, "loss": 0.2978, "loss_nan_ranks": 0, "loss_rank_avg": 0.34292152523994446, "step": 3370, "valid_targets_mean": 2997.3, "valid_targets_min": 1237 }, { "epoch": 5.391373801916933, "grad_norm": 0.7349516509123469, "learning_rate": 6.110781379608226e-06, "loss": 0.2765, "loss_nan_ranks": 0, "loss_rank_avg": 0.25433140993118286, "step": 3375, "valid_targets_mean": 3235.3, "valid_targets_min": 1040 }, { "epoch": 5.399361022364217, "grad_norm": 1.0542744110852993, "learning_rate": 6.053563023641318e-06, "loss": 0.3057, "loss_nan_ranks": 0, "loss_rank_avg": 0.38673511147499084, "step": 3380, "valid_targets_mean": 2352.1, "valid_targets_min": 1110 }, { "epoch": 5.407348242811501, "grad_norm": 0.827121547272794, "learning_rate": 5.996566002062439e-06, "loss": 0.2978, "loss_nan_ranks": 0, "loss_rank_avg": 0.31490558385849, "step": 3385, "valid_targets_mean": 2948.4, "valid_targets_min": 1442 }, { "epoch": 5.415335463258786, "grad_norm": 0.8460018479986304, "learning_rate": 5.939791219432442e-06, "loss": 0.2802, "loss_nan_ranks": 0, "loss_rank_avg": 0.29256829619407654, "step": 3390, "valid_targets_mean": 3162.4, "valid_targets_min": 1461 }, { "epoch": 5.42332268370607, "grad_norm": 0.8344660862038872, "learning_rate": 5.8832395767851846e-06, "loss": 0.2932, "loss_nan_ranks": 0, "loss_rank_avg": 0.2993561923503876, "step": 3395, "valid_targets_mean": 2604.9, "valid_targets_min": 1357 }, { "epoch": 5.431309904153355, "grad_norm": 0.9435119676368734, "learning_rate": 5.826911971613198e-06, "loss": 0.2987, "loss_nan_ranks": 0, "loss_rank_avg": 0.2911856174468994, "step": 3400, "valid_targets_mean": 2483.8, "valid_targets_min": 849 }, { "epoch": 5.439297124600639, "grad_norm": 0.8098232349422515, "learning_rate": 5.770809297853495e-06, "loss": 0.283, "loss_nan_ranks": 0, "loss_rank_avg": 0.26919856667518616, "step": 3405, "valid_targets_mean": 2917.8, "valid_targets_min": 960 }, { "epoch": 5.447284345047923, "grad_norm": 0.862605956589078, "learning_rate": 5.714932445873325e-06, "loss": 0.2909, "loss_nan_ranks": 0, "loss_rank_avg": 0.27299582958221436, "step": 3410, "valid_targets_mean": 2560.8, "valid_targets_min": 1041 }, { "epoch": 5.455271565495208, "grad_norm": 0.9020710803465632, "learning_rate": 5.659282302456115e-06, "loss": 0.2831, "loss_nan_ranks": 0, "loss_rank_avg": 0.282878577709198, "step": 3415, "valid_targets_mean": 2509.6, "valid_targets_min": 1406 }, { "epoch": 5.463258785942492, "grad_norm": 0.8669441953326755, "learning_rate": 5.603859750787302e-06, "loss": 0.292, "loss_nan_ranks": 0, "loss_rank_avg": 0.26606321334838867, "step": 3420, "valid_targets_mean": 2598.4, "valid_targets_min": 936 }, { "epoch": 5.4712460063897765, "grad_norm": 0.8752038102537848, "learning_rate": 5.548665670440418e-06, "loss": 0.2874, "loss_nan_ranks": 0, "loss_rank_avg": 0.2888076603412628, "step": 3425, "valid_targets_mean": 2626.9, "valid_targets_min": 1683 }, { "epoch": 5.479233226837061, "grad_norm": 0.8483698839811887, "learning_rate": 5.4937009373630535e-06, "loss": 0.2926, "loss_nan_ranks": 0, "loss_rank_avg": 0.2613609731197357, "step": 3430, "valid_targets_mean": 2517.3, "valid_targets_min": 1131 }, { "epoch": 5.487220447284345, "grad_norm": 0.8034035667215341, "learning_rate": 5.438966423862997e-06, "loss": 0.2841, "loss_nan_ranks": 0, "loss_rank_avg": 0.2635997533798218, "step": 3435, "valid_targets_mean": 3017.4, "valid_targets_min": 1019 }, { "epoch": 5.49520766773163, "grad_norm": 0.8066653273398859, "learning_rate": 5.384462998594384e-06, "loss": 0.2717, "loss_nan_ranks": 0, "loss_rank_avg": 0.26338884234428406, "step": 3440, "valid_targets_mean": 2630.4, "valid_targets_min": 1079 }, { "epoch": 5.503194888178914, "grad_norm": 0.8323232685505498, "learning_rate": 5.330191526543884e-06, "loss": 0.2699, "loss_nan_ranks": 0, "loss_rank_avg": 0.288205087184906, "step": 3445, "valid_targets_mean": 2767.9, "valid_targets_min": 1243 }, { "epoch": 5.511182108626198, "grad_norm": 1.046868167441267, "learning_rate": 5.276152869017028e-06, "loss": 0.3088, "loss_nan_ranks": 0, "loss_rank_avg": 0.35603612661361694, "step": 3450, "valid_targets_mean": 2214.9, "valid_targets_min": 1039 }, { "epoch": 5.519169329073483, "grad_norm": 0.8670390164428484, "learning_rate": 5.22234788362447e-06, "loss": 0.2959, "loss_nan_ranks": 0, "loss_rank_avg": 0.28677263855934143, "step": 3455, "valid_targets_mean": 2610.7, "valid_targets_min": 923 }, { "epoch": 5.527156549520766, "grad_norm": 0.953868413472568, "learning_rate": 5.168777424268454e-06, "loss": 0.298, "loss_nan_ranks": 0, "loss_rank_avg": 0.34387460350990295, "step": 3460, "valid_targets_mean": 2308.2, "valid_targets_min": 1232 }, { "epoch": 5.535143769968051, "grad_norm": 0.8022290889230155, "learning_rate": 5.115442341129171e-06, "loss": 0.2879, "loss_nan_ranks": 0, "loss_rank_avg": 0.288701593875885, "step": 3465, "valid_targets_mean": 3129.0, "valid_targets_min": 870 }, { "epoch": 5.543130990415335, "grad_norm": 0.8115409043956004, "learning_rate": 5.062343480651364e-06, "loss": 0.2875, "loss_nan_ranks": 0, "loss_rank_avg": 0.29845625162124634, "step": 3470, "valid_targets_mean": 2757.8, "valid_targets_min": 876 }, { "epoch": 5.55111821086262, "grad_norm": 0.7835197890738079, "learning_rate": 5.009481685530817e-06, "loss": 0.3047, "loss_nan_ranks": 0, "loss_rank_avg": 0.28913915157318115, "step": 3475, "valid_targets_mean": 3522.1, "valid_targets_min": 1068 }, { "epoch": 5.559105431309904, "grad_norm": 0.7660079313726896, "learning_rate": 4.956857794701026e-06, "loss": 0.2807, "loss_nan_ranks": 0, "loss_rank_avg": 0.2907702624797821, "step": 3480, "valid_targets_mean": 3248.2, "valid_targets_min": 1035 }, { "epoch": 5.567092651757188, "grad_norm": 0.8170731714868842, "learning_rate": 4.904472643319873e-06, "loss": 0.2717, "loss_nan_ranks": 0, "loss_rank_avg": 0.2342405468225479, "step": 3485, "valid_targets_mean": 2918.7, "valid_targets_min": 967 }, { "epoch": 5.575079872204473, "grad_norm": 0.8514738656541708, "learning_rate": 4.852327062756352e-06, "loss": 0.3044, "loss_nan_ranks": 0, "loss_rank_avg": 0.2788478136062622, "step": 3490, "valid_targets_mean": 2642.8, "valid_targets_min": 1083 }, { "epoch": 5.583067092651757, "grad_norm": 0.9142924446585464, "learning_rate": 4.800421880577411e-06, "loss": 0.284, "loss_nan_ranks": 0, "loss_rank_avg": 0.2819330096244812, "step": 3495, "valid_targets_mean": 2215.6, "valid_targets_min": 970 }, { "epoch": 5.5910543130990416, "grad_norm": 0.8351131614292047, "learning_rate": 4.748757920534779e-06, "loss": 0.3139, "loss_nan_ranks": 0, "loss_rank_avg": 0.3117348551750183, "step": 3500, "valid_targets_mean": 2887.9, "valid_targets_min": 1066 }, { "epoch": 5.599041533546326, "grad_norm": 0.878780990253628, "learning_rate": 4.697336002551947e-06, "loss": 0.2836, "loss_nan_ranks": 0, "loss_rank_avg": 0.30660977959632874, "step": 3505, "valid_targets_mean": 2960.4, "valid_targets_min": 1047 }, { "epoch": 5.60702875399361, "grad_norm": 0.9550316046064914, "learning_rate": 4.6461569427110684e-06, "loss": 0.2913, "loss_nan_ranks": 0, "loss_rank_avg": 0.2975427508354187, "step": 3510, "valid_targets_mean": 2113.9, "valid_targets_min": 1039 }, { "epoch": 5.615015974440895, "grad_norm": 0.8614684885214283, "learning_rate": 4.5952215532401146e-06, "loss": 0.2796, "loss_nan_ranks": 0, "loss_rank_avg": 0.2506102919578552, "step": 3515, "valid_targets_mean": 3007.6, "valid_targets_min": 1284 }, { "epoch": 5.623003194888179, "grad_norm": 0.7055162824372356, "learning_rate": 4.544530642499894e-06, "loss": 0.29, "loss_nan_ranks": 0, "loss_rank_avg": 0.2834452688694, "step": 3520, "valid_targets_mean": 3786.9, "valid_targets_min": 1342 }, { "epoch": 5.6309904153354635, "grad_norm": 0.9327473225687424, "learning_rate": 4.4940850149712765e-06, "loss": 0.3034, "loss_nan_ranks": 0, "loss_rank_avg": 0.2986459732055664, "step": 3525, "valid_targets_mean": 2386.1, "valid_targets_min": 1204 }, { "epoch": 5.638977635782748, "grad_norm": 0.8782006771428341, "learning_rate": 4.443885471242418e-06, "loss": 0.3132, "loss_nan_ranks": 0, "loss_rank_avg": 0.31005507707595825, "step": 3530, "valid_targets_mean": 2924.8, "valid_targets_min": 640 }, { "epoch": 5.646964856230032, "grad_norm": 0.9010177674718335, "learning_rate": 4.393932807996017e-06, "loss": 0.2812, "loss_nan_ranks": 0, "loss_rank_avg": 0.31273573637008667, "step": 3535, "valid_targets_mean": 3174.8, "valid_targets_min": 998 }, { "epoch": 5.654952076677317, "grad_norm": 0.9330314923606065, "learning_rate": 4.344227817996735e-06, "loss": 0.2934, "loss_nan_ranks": 0, "loss_rank_avg": 0.2842142581939697, "step": 3540, "valid_targets_mean": 2522.3, "valid_targets_min": 1245 }, { "epoch": 5.6629392971246, "grad_norm": 0.8724285443483777, "learning_rate": 4.294771290078548e-06, "loss": 0.3038, "loss_nan_ranks": 0, "loss_rank_avg": 0.26506611704826355, "step": 3545, "valid_targets_mean": 3159.2, "valid_targets_min": 1330 }, { "epoch": 5.6709265175718855, "grad_norm": 0.8540186381544715, "learning_rate": 4.245564009132293e-06, "loss": 0.2971, "loss_nan_ranks": 0, "loss_rank_avg": 0.3010174036026001, "step": 3550, "valid_targets_mean": 2621.1, "valid_targets_min": 947 }, { "epoch": 5.678913738019169, "grad_norm": 0.8410560464629185, "learning_rate": 4.196606756093138e-06, "loss": 0.2952, "loss_nan_ranks": 0, "loss_rank_avg": 0.27265846729278564, "step": 3555, "valid_targets_mean": 2626.9, "valid_targets_min": 981 }, { "epoch": 5.686900958466453, "grad_norm": 0.8063270462445804, "learning_rate": 4.147900307928268e-06, "loss": 0.2856, "loss_nan_ranks": 0, "loss_rank_avg": 0.302957147359848, "step": 3560, "valid_targets_mean": 3118.4, "valid_targets_min": 883 }, { "epoch": 5.694888178913738, "grad_norm": 0.8910767531567404, "learning_rate": 4.099445437624487e-06, "loss": 0.2975, "loss_nan_ranks": 0, "loss_rank_avg": 0.2881123125553131, "step": 3565, "valid_targets_mean": 2818.1, "valid_targets_min": 1050 }, { "epoch": 5.702875399361022, "grad_norm": 0.9644419826076724, "learning_rate": 4.051242914175995e-06, "loss": 0.2872, "loss_nan_ranks": 0, "loss_rank_avg": 0.3191588819026947, "step": 3570, "valid_targets_mean": 2307.6, "valid_targets_min": 1330 }, { "epoch": 5.710862619808307, "grad_norm": 0.8825281014957341, "learning_rate": 4.003293502572163e-06, "loss": 0.3041, "loss_nan_ranks": 0, "loss_rank_avg": 0.2749369144439697, "step": 3575, "valid_targets_mean": 2434.3, "valid_targets_min": 924 }, { "epoch": 5.718849840255591, "grad_norm": 0.8149662345511066, "learning_rate": 3.955597963785391e-06, "loss": 0.294, "loss_nan_ranks": 0, "loss_rank_avg": 0.30972984433174133, "step": 3580, "valid_targets_mean": 3602.3, "valid_targets_min": 1235 }, { "epoch": 5.726837060702875, "grad_norm": 0.8208308645247685, "learning_rate": 3.908157054759048e-06, "loss": 0.2897, "loss_nan_ranks": 0, "loss_rank_avg": 0.33973070979118347, "step": 3585, "valid_targets_mean": 3309.0, "valid_targets_min": 1474 }, { "epoch": 5.73482428115016, "grad_norm": 1.2817350246441914, "learning_rate": 3.860971528395427e-06, "loss": 0.2985, "loss_nan_ranks": 0, "loss_rank_avg": 0.281210720539093, "step": 3590, "valid_targets_mean": 3072.1, "valid_targets_min": 1051 }, { "epoch": 5.742811501597444, "grad_norm": 0.858260521624848, "learning_rate": 3.814042133543847e-06, "loss": 0.2949, "loss_nan_ranks": 0, "loss_rank_avg": 0.29261261224746704, "step": 3595, "valid_targets_mean": 2800.6, "valid_targets_min": 1520 }, { "epoch": 5.7507987220447285, "grad_norm": 0.8620084879239728, "learning_rate": 3.7673696149887117e-06, "loss": 0.2848, "loss_nan_ranks": 0, "loss_rank_avg": 0.29667365550994873, "step": 3600, "valid_targets_mean": 2740.4, "valid_targets_min": 1116 }, { "epoch": 5.758785942492013, "grad_norm": 0.8265698068500232, "learning_rate": 3.72095471343773e-06, "loss": 0.3026, "loss_nan_ranks": 0, "loss_rank_avg": 0.3263239562511444, "step": 3605, "valid_targets_mean": 3160.9, "valid_targets_min": 1162 }, { "epoch": 5.766773162939297, "grad_norm": 0.9027943191349252, "learning_rate": 3.674798165510136e-06, "loss": 0.3065, "loss_nan_ranks": 0, "loss_rank_avg": 0.34345391392707825, "step": 3610, "valid_targets_mean": 3071.5, "valid_targets_min": 888 }, { "epoch": 5.774760383386582, "grad_norm": 0.836591157500133, "learning_rate": 3.6289007037250244e-06, "loss": 0.3089, "loss_nan_ranks": 0, "loss_rank_avg": 0.26754382252693176, "step": 3615, "valid_targets_mean": 2665.3, "valid_targets_min": 1085 }, { "epoch": 5.782747603833866, "grad_norm": 0.9145676011202615, "learning_rate": 3.5832630564897073e-06, "loss": 0.3092, "loss_nan_ranks": 0, "loss_rank_avg": 0.32892486453056335, "step": 3620, "valid_targets_mean": 2602.9, "valid_targets_min": 769 }, { "epoch": 5.7907348242811505, "grad_norm": 0.7629854921736774, "learning_rate": 3.5378859480881443e-06, "loss": 0.2731, "loss_nan_ranks": 0, "loss_rank_avg": 0.24377216398715973, "step": 3625, "valid_targets_mean": 3199.8, "valid_targets_min": 811 }, { "epoch": 5.798722044728435, "grad_norm": 0.8042286264919823, "learning_rate": 3.492770098669478e-06, "loss": 0.2906, "loss_nan_ranks": 0, "loss_rank_avg": 0.2911136746406555, "step": 3630, "valid_targets_mean": 3393.9, "valid_targets_min": 1265 }, { "epoch": 5.806709265175719, "grad_norm": 0.8369688623613801, "learning_rate": 3.4479162242365717e-06, "loss": 0.269, "loss_nan_ranks": 0, "loss_rank_avg": 0.27095547318458557, "step": 3635, "valid_targets_mean": 2753.4, "valid_targets_min": 1154 }, { "epoch": 5.814696485623003, "grad_norm": 0.8947818480367905, "learning_rate": 3.403325036634679e-06, "loss": 0.2848, "loss_nan_ranks": 0, "loss_rank_avg": 0.27299612760543823, "step": 3640, "valid_targets_mean": 2596.2, "valid_targets_min": 1244 }, { "epoch": 5.822683706070287, "grad_norm": 0.8775169850347424, "learning_rate": 3.3589972435401184e-06, "loss": 0.3042, "loss_nan_ranks": 0, "loss_rank_avg": 0.2821030616760254, "step": 3645, "valid_targets_mean": 2154.2, "valid_targets_min": 927 }, { "epoch": 5.830670926517572, "grad_norm": 0.9187215143961998, "learning_rate": 3.3149335484490553e-06, "loss": 0.3115, "loss_nan_ranks": 0, "loss_rank_avg": 0.30498552322387695, "step": 3650, "valid_targets_mean": 2995.2, "valid_targets_min": 1031 }, { "epoch": 5.838658146964856, "grad_norm": 0.7319498337703215, "learning_rate": 3.2711346506663346e-06, "loss": 0.2828, "loss_nan_ranks": 0, "loss_rank_avg": 0.28768712282180786, "step": 3655, "valid_targets_mean": 3588.6, "valid_targets_min": 2002 }, { "epoch": 5.84664536741214, "grad_norm": 0.8297441398475794, "learning_rate": 3.2276012452943893e-06, "loss": 0.285, "loss_nan_ranks": 0, "loss_rank_avg": 0.2571295499801636, "step": 3660, "valid_targets_mean": 2946.4, "valid_targets_min": 957 }, { "epoch": 5.854632587859425, "grad_norm": 0.9457931068247055, "learning_rate": 3.1843340232222064e-06, "loss": 0.2909, "loss_nan_ranks": 0, "loss_rank_avg": 0.23238760232925415, "step": 3665, "valid_targets_mean": 2739.9, "valid_targets_min": 848 }, { "epoch": 5.862619808306709, "grad_norm": 0.7880116160919101, "learning_rate": 3.1413336711143437e-06, "loss": 0.2838, "loss_nan_ranks": 0, "loss_rank_avg": 0.2589631974697113, "step": 3670, "valid_targets_mean": 3419.8, "valid_targets_min": 1110 }, { "epoch": 5.8706070287539935, "grad_norm": 0.8733165347603803, "learning_rate": 3.0986008714000703e-06, "loss": 0.2806, "loss_nan_ranks": 0, "loss_rank_avg": 0.2866963744163513, "step": 3675, "valid_targets_mean": 2831.0, "valid_targets_min": 1189 }, { "epoch": 5.878594249201278, "grad_norm": 0.9061936948826054, "learning_rate": 3.056136302262489e-06, "loss": 0.286, "loss_nan_ranks": 0, "loss_rank_avg": 0.2790377140045166, "step": 3680, "valid_targets_mean": 2385.3, "valid_targets_min": 995 }, { "epoch": 5.886581469648562, "grad_norm": 0.7744924847924733, "learning_rate": 3.0139406376278212e-06, "loss": 0.2696, "loss_nan_ranks": 0, "loss_rank_avg": 0.23188713192939758, "step": 3685, "valid_targets_mean": 3068.9, "valid_targets_min": 1151 }, { "epoch": 5.894568690095847, "grad_norm": 0.8593959472274256, "learning_rate": 2.972014547154671e-06, "loss": 0.2887, "loss_nan_ranks": 0, "loss_rank_avg": 0.28993451595306396, "step": 3690, "valid_targets_mean": 2661.4, "valid_targets_min": 1105 }, { "epoch": 5.902555910543131, "grad_norm": 0.872637452202428, "learning_rate": 2.930358696223423e-06, "loss": 0.2898, "loss_nan_ranks": 0, "loss_rank_avg": 0.2856522500514984, "step": 3695, "valid_targets_mean": 2584.5, "valid_targets_min": 1043 }, { "epoch": 5.9105431309904155, "grad_norm": 0.7625580478157692, "learning_rate": 2.8889737459256695e-06, "loss": 0.2825, "loss_nan_ranks": 0, "loss_rank_avg": 0.2512621581554413, "step": 3700, "valid_targets_mean": 3041.8, "valid_targets_min": 810 }, { "epoch": 5.9185303514377, "grad_norm": 0.817825382177412, "learning_rate": 2.8478603530537285e-06, "loss": 0.2905, "loss_nan_ranks": 0, "loss_rank_avg": 0.271395742893219, "step": 3705, "valid_targets_mean": 2701.8, "valid_targets_min": 1104 }, { "epoch": 5.926517571884984, "grad_norm": 0.945231408750339, "learning_rate": 2.8070191700902194e-06, "loss": 0.29, "loss_nan_ranks": 0, "loss_rank_avg": 0.3027716875076294, "step": 3710, "valid_targets_mean": 2422.8, "valid_targets_min": 866 }, { "epoch": 5.934504792332269, "grad_norm": 0.9458089413545945, "learning_rate": 2.7664508451976903e-06, "loss": 0.2912, "loss_nan_ranks": 0, "loss_rank_avg": 0.2904042899608612, "step": 3715, "valid_targets_mean": 2483.2, "valid_targets_min": 898 }, { "epoch": 5.942492012779553, "grad_norm": 0.8523965806490982, "learning_rate": 2.726156022208362e-06, "loss": 0.3002, "loss_nan_ranks": 0, "loss_rank_avg": 0.28088122606277466, "step": 3720, "valid_targets_mean": 2949.6, "valid_targets_min": 666 }, { "epoch": 5.950479233226837, "grad_norm": 0.8763501591941483, "learning_rate": 2.6861353406138713e-06, "loss": 0.2908, "loss_nan_ranks": 0, "loss_rank_avg": 0.27324312925338745, "step": 3725, "valid_targets_mean": 2387.6, "valid_targets_min": 895 }, { "epoch": 5.958466453674122, "grad_norm": 0.878634194918592, "learning_rate": 2.646389435555172e-06, "loss": 0.2878, "loss_nan_ranks": 0, "loss_rank_avg": 0.32627028226852417, "step": 3730, "valid_targets_mean": 3211.6, "valid_targets_min": 891 }, { "epoch": 5.966453674121405, "grad_norm": 0.8672653374965403, "learning_rate": 2.6069189378124015e-06, "loss": 0.2995, "loss_nan_ranks": 0, "loss_rank_avg": 0.31162893772125244, "step": 3735, "valid_targets_mean": 2756.2, "valid_targets_min": 1049 }, { "epoch": 5.97444089456869, "grad_norm": 0.9052303395289947, "learning_rate": 2.567724473794908e-06, "loss": 0.3106, "loss_nan_ranks": 0, "loss_rank_avg": 0.3283204436302185, "step": 3740, "valid_targets_mean": 2518.8, "valid_targets_min": 949 }, { "epoch": 5.982428115015974, "grad_norm": 0.9078280494758757, "learning_rate": 2.5288066655312914e-06, "loss": 0.2921, "loss_nan_ranks": 0, "loss_rank_avg": 0.2921939492225647, "step": 3745, "valid_targets_mean": 2445.1, "valid_targets_min": 1158 }, { "epoch": 5.9904153354632586, "grad_norm": 0.9142787916430909, "learning_rate": 2.4901661306595414e-06, "loss": 0.283, "loss_nan_ranks": 0, "loss_rank_avg": 0.3068923354148865, "step": 3750, "valid_targets_mean": 2726.0, "valid_targets_min": 778 }, { "epoch": 5.998402555910543, "grad_norm": 0.8715476605369831, "learning_rate": 2.451803482417234e-06, "loss": 0.3183, "loss_nan_ranks": 0, "loss_rank_avg": 0.3258388340473175, "step": 3755, "valid_targets_mean": 2622.8, "valid_targets_min": 784 }, { "epoch": 6.006389776357827, "grad_norm": 0.8127550034791736, "learning_rate": 2.413719329631785e-06, "loss": 0.291, "loss_nan_ranks": 0, "loss_rank_avg": 0.275146484375, "step": 3760, "valid_targets_mean": 2720.4, "valid_targets_min": 740 }, { "epoch": 6.014376996805112, "grad_norm": 0.8144087631669996, "learning_rate": 2.375914276710811e-06, "loss": 0.2683, "loss_nan_ranks": 0, "loss_rank_avg": 0.2622288167476654, "step": 3765, "valid_targets_mean": 2943.3, "valid_targets_min": 1245 }, { "epoch": 6.022364217252396, "grad_norm": 0.7721698190279348, "learning_rate": 2.338388923632513e-06, "loss": 0.2851, "loss_nan_ranks": 0, "loss_rank_avg": 0.2618906497955322, "step": 3770, "valid_targets_mean": 2792.1, "valid_targets_min": 1287 }, { "epoch": 6.0303514376996805, "grad_norm": 0.8398697731858585, "learning_rate": 2.3011438659361794e-06, "loss": 0.2743, "loss_nan_ranks": 0, "loss_rank_avg": 0.27312394976615906, "step": 3775, "valid_targets_mean": 2793.1, "valid_targets_min": 1555 }, { "epoch": 6.038338658146965, "grad_norm": 0.8567900298455935, "learning_rate": 2.2641796947127114e-06, "loss": 0.2841, "loss_nan_ranks": 0, "loss_rank_avg": 0.28074395656585693, "step": 3780, "valid_targets_mean": 2851.5, "valid_targets_min": 964 }, { "epoch": 6.046325878594249, "grad_norm": 0.923861896817049, "learning_rate": 2.2274969965952553e-06, "loss": 0.3032, "loss_nan_ranks": 0, "loss_rank_avg": 0.32039231061935425, "step": 3785, "valid_targets_mean": 2628.1, "valid_targets_min": 1072 }, { "epoch": 6.054313099041534, "grad_norm": 0.8181909679032574, "learning_rate": 2.1910963537498887e-06, "loss": 0.2645, "loss_nan_ranks": 0, "loss_rank_avg": 0.2667577266693115, "step": 3790, "valid_targets_mean": 2870.7, "valid_targets_min": 1164 }, { "epoch": 6.062300319488818, "grad_norm": 0.8109778169918753, "learning_rate": 2.1549783438663872e-06, "loss": 0.2716, "loss_nan_ranks": 0, "loss_rank_avg": 0.2527042627334595, "step": 3795, "valid_targets_mean": 3018.8, "valid_targets_min": 1043 }, { "epoch": 6.0702875399361025, "grad_norm": 0.8499658360083157, "learning_rate": 2.1191435401490534e-06, "loss": 0.2793, "loss_nan_ranks": 0, "loss_rank_avg": 0.25481629371643066, "step": 3800, "valid_targets_mean": 2641.6, "valid_targets_min": 1046 }, { "epoch": 6.078274760383387, "grad_norm": 0.924864077463184, "learning_rate": 2.0835925113076062e-06, "loss": 0.2764, "loss_nan_ranks": 0, "loss_rank_avg": 0.26144057512283325, "step": 3805, "valid_targets_mean": 2630.7, "valid_targets_min": 1213 }, { "epoch": 6.086261980830671, "grad_norm": 0.8611502725518941, "learning_rate": 2.0483258215481784e-06, "loss": 0.2757, "loss_nan_ranks": 0, "loss_rank_avg": 0.28638124465942383, "step": 3810, "valid_targets_mean": 2681.8, "valid_targets_min": 915 }, { "epoch": 6.094249201277956, "grad_norm": 0.93643148378172, "learning_rate": 2.0133440305643413e-06, "loss": 0.2639, "loss_nan_ranks": 0, "loss_rank_avg": 0.2659624218940735, "step": 3815, "valid_targets_mean": 2374.9, "valid_targets_min": 1264 }, { "epoch": 6.102236421725239, "grad_norm": 0.9094153943052289, "learning_rate": 1.9786476935282463e-06, "loss": 0.2882, "loss_nan_ranks": 0, "loss_rank_avg": 0.29782217741012573, "step": 3820, "valid_targets_mean": 2679.3, "valid_targets_min": 1140 }, { "epoch": 6.110223642172524, "grad_norm": 0.8578921212730504, "learning_rate": 1.944237361081782e-06, "loss": 0.284, "loss_nan_ranks": 0, "loss_rank_avg": 0.30669862031936646, "step": 3825, "valid_targets_mean": 2931.2, "valid_targets_min": 919 }, { "epoch": 6.118210862619808, "grad_norm": 0.8774447171982998, "learning_rate": 1.9101135793278746e-06, "loss": 0.2848, "loss_nan_ranks": 0, "loss_rank_avg": 0.24913069605827332, "step": 3830, "valid_targets_mean": 2745.9, "valid_targets_min": 1024 }, { "epoch": 6.126198083067092, "grad_norm": 0.8198399829117742, "learning_rate": 1.8762768898217732e-06, "loss": 0.2811, "loss_nan_ranks": 0, "loss_rank_avg": 0.2930334806442261, "step": 3835, "valid_targets_mean": 2795.0, "valid_targets_min": 747 }, { "epoch": 6.134185303514377, "grad_norm": 0.6701701605321356, "learning_rate": 1.8427278295625006e-06, "loss": 0.2795, "loss_nan_ranks": 0, "loss_rank_avg": 0.23434777557849884, "step": 3840, "valid_targets_mean": 3436.4, "valid_targets_min": 1204 }, { "epoch": 6.142172523961661, "grad_norm": 1.0174049901842122, "learning_rate": 1.8094669309843161e-06, "loss": 0.2741, "loss_nan_ranks": 0, "loss_rank_avg": 0.28728413581848145, "step": 3845, "valid_targets_mean": 2038.7, "valid_targets_min": 1061 }, { "epoch": 6.1501597444089455, "grad_norm": 0.7377419451238836, "learning_rate": 1.776494721948241e-06, "loss": 0.2656, "loss_nan_ranks": 0, "loss_rank_avg": 0.26700955629348755, "step": 3850, "valid_targets_mean": 3754.7, "valid_targets_min": 1146 }, { "epoch": 6.15814696485623, "grad_norm": 0.8809290165165347, "learning_rate": 1.7438117257337239e-06, "loss": 0.2824, "loss_nan_ranks": 0, "loss_rank_avg": 0.22705921530723572, "step": 3855, "valid_targets_mean": 2662.8, "valid_targets_min": 944 }, { "epoch": 6.166134185303514, "grad_norm": 0.8531110330155715, "learning_rate": 1.7114184610302964e-06, "loss": 0.2828, "loss_nan_ranks": 0, "loss_rank_avg": 0.27642789483070374, "step": 3860, "valid_targets_mean": 3141.9, "valid_targets_min": 1396 }, { "epoch": 6.174121405750799, "grad_norm": 0.7792356842403435, "learning_rate": 1.67931544192937e-06, "loss": 0.2937, "loss_nan_ranks": 0, "loss_rank_avg": 0.26689833402633667, "step": 3865, "valid_targets_mean": 3185.1, "valid_targets_min": 1228 }, { "epoch": 6.182108626198083, "grad_norm": 0.932186250287318, "learning_rate": 1.6475031779160611e-06, "loss": 0.2963, "loss_nan_ranks": 0, "loss_rank_avg": 0.29413291811943054, "step": 3870, "valid_targets_mean": 2828.4, "valid_targets_min": 817 }, { "epoch": 6.1900958466453675, "grad_norm": 0.9999872211296582, "learning_rate": 1.6159821738611192e-06, "loss": 0.2895, "loss_nan_ranks": 0, "loss_rank_avg": 0.3073047697544098, "step": 3875, "valid_targets_mean": 2609.2, "valid_targets_min": 1015 }, { "epoch": 6.198083067092652, "grad_norm": 0.8522969496137042, "learning_rate": 1.5847529300128827e-06, "loss": 0.283, "loss_nan_ranks": 0, "loss_rank_avg": 0.2496946156024933, "step": 3880, "valid_targets_mean": 2715.8, "valid_targets_min": 947 }, { "epoch": 6.206070287539936, "grad_norm": 0.8205921714964237, "learning_rate": 1.5538159419893895e-06, "loss": 0.2835, "loss_nan_ranks": 0, "loss_rank_avg": 0.3144986629486084, "step": 3885, "valid_targets_mean": 3409.3, "valid_targets_min": 1203 }, { "epoch": 6.214057507987221, "grad_norm": 1.0161305576290838, "learning_rate": 1.5231717007704738e-06, "loss": 0.2677, "loss_nan_ranks": 0, "loss_rank_avg": 0.28573137521743774, "step": 3890, "valid_targets_mean": 2113.8, "valid_targets_min": 671 }, { "epoch": 6.222044728434505, "grad_norm": 0.8504064835959527, "learning_rate": 1.4928206926899801e-06, "loss": 0.2834, "loss_nan_ranks": 0, "loss_rank_avg": 0.27324777841567993, "step": 3895, "valid_targets_mean": 2668.8, "valid_targets_min": 876 }, { "epoch": 6.2300319488817895, "grad_norm": 0.8751818535512605, "learning_rate": 1.4627633994280599e-06, "loss": 0.2901, "loss_nan_ranks": 0, "loss_rank_avg": 0.3199600577354431, "step": 3900, "valid_targets_mean": 2899.5, "valid_targets_min": 1095 }, { "epoch": 6.238019169329074, "grad_norm": 0.8728480586187728, "learning_rate": 1.433000298003504e-06, "loss": 0.2879, "loss_nan_ranks": 0, "loss_rank_avg": 0.25064951181411743, "step": 3905, "valid_targets_mean": 3270.7, "valid_targets_min": 1027 }, { "epoch": 6.246006389776358, "grad_norm": 0.7665455493403013, "learning_rate": 1.4035318607662029e-06, "loss": 0.2892, "loss_nan_ranks": 0, "loss_rank_avg": 0.28335410356521606, "step": 3910, "valid_targets_mean": 3683.3, "valid_targets_min": 1096 }, { "epoch": 6.253993610223642, "grad_norm": 0.7720218615283687, "learning_rate": 1.3743585553896144e-06, "loss": 0.2736, "loss_nan_ranks": 0, "loss_rank_avg": 0.29515159130096436, "step": 3915, "valid_targets_mean": 3592.1, "valid_targets_min": 1158 }, { "epoch": 6.261980830670926, "grad_norm": 0.9127307390415227, "learning_rate": 1.345480844863376e-06, "loss": 0.284, "loss_nan_ranks": 0, "loss_rank_avg": 0.280670166015625, "step": 3920, "valid_targets_mean": 2674.4, "valid_targets_min": 1174 }, { "epoch": 6.2699680511182105, "grad_norm": 0.8744155416369218, "learning_rate": 1.316899187485925e-06, "loss": 0.2705, "loss_nan_ranks": 0, "loss_rank_avg": 0.26286551356315613, "step": 3925, "valid_targets_mean": 2467.4, "valid_targets_min": 1295 }, { "epoch": 6.277955271565495, "grad_norm": 1.0050448884691408, "learning_rate": 1.288614036857252e-06, "loss": 0.2907, "loss_nan_ranks": 0, "loss_rank_avg": 0.2835194766521454, "step": 3930, "valid_targets_mean": 2397.7, "valid_targets_min": 613 }, { "epoch": 6.285942492012779, "grad_norm": 1.073465147880673, "learning_rate": 1.260625841871692e-06, "loss": 0.269, "loss_nan_ranks": 0, "loss_rank_avg": 0.30487751960754395, "step": 3935, "valid_targets_mean": 1912.4, "valid_targets_min": 784 }, { "epoch": 6.293929712460064, "grad_norm": 0.9475913607873788, "learning_rate": 1.2329350467107925e-06, "loss": 0.2805, "loss_nan_ranks": 0, "loss_rank_avg": 0.3098008334636688, "step": 3940, "valid_targets_mean": 2448.3, "valid_targets_min": 1050 }, { "epoch": 6.301916932907348, "grad_norm": 0.8134903936892746, "learning_rate": 1.2055420908362781e-06, "loss": 0.2564, "loss_nan_ranks": 0, "loss_rank_avg": 0.2720017433166504, "step": 3945, "valid_targets_mean": 2767.9, "valid_targets_min": 681 }, { "epoch": 6.3099041533546325, "grad_norm": 0.8888924414509212, "learning_rate": 1.1784474089830612e-06, "loss": 0.2941, "loss_nan_ranks": 0, "loss_rank_avg": 0.28785115480422974, "step": 3950, "valid_targets_mean": 2391.2, "valid_targets_min": 1345 }, { "epoch": 6.317891373801917, "grad_norm": 0.86398511760062, "learning_rate": 1.1516514311523607e-06, "loss": 0.2731, "loss_nan_ranks": 0, "loss_rank_avg": 0.3019968271255493, "step": 3955, "valid_targets_mean": 3056.1, "valid_targets_min": 1161 }, { "epoch": 6.325878594249201, "grad_norm": 0.9214178738753978, "learning_rate": 1.1251545826048593e-06, "loss": 0.2789, "loss_nan_ranks": 0, "loss_rank_avg": 0.2911544442176819, "step": 3960, "valid_targets_mean": 2535.8, "valid_targets_min": 938 }, { "epoch": 6.333865814696486, "grad_norm": 0.865667826552045, "learning_rate": 1.098957283853972e-06, "loss": 0.2882, "loss_nan_ranks": 0, "loss_rank_avg": 0.2934360206127167, "step": 3965, "valid_targets_mean": 2922.7, "valid_targets_min": 1151 }, { "epoch": 6.34185303514377, "grad_norm": 0.7197667191842236, "learning_rate": 1.0730599506591476e-06, "loss": 0.2858, "loss_nan_ranks": 0, "loss_rank_avg": 0.2684939503669739, "step": 3970, "valid_targets_mean": 3498.9, "valid_targets_min": 1109 }, { "epoch": 6.3498402555910545, "grad_norm": 1.0547057892528122, "learning_rate": 1.0474629940192994e-06, "loss": 0.2705, "loss_nan_ranks": 0, "loss_rank_avg": 0.28599128127098083, "step": 3975, "valid_targets_mean": 2373.9, "valid_targets_min": 981 }, { "epoch": 6.357827476038339, "grad_norm": 0.7493494299222992, "learning_rate": 1.0221668201662726e-06, "loss": 0.2826, "loss_nan_ranks": 0, "loss_rank_avg": 0.27192163467407227, "step": 3980, "valid_targets_mean": 3340.1, "valid_targets_min": 933 }, { "epoch": 6.365814696485623, "grad_norm": 0.8997567714591271, "learning_rate": 9.971718305583767e-07, "loss": 0.2769, "loss_nan_ranks": 0, "loss_rank_avg": 0.30002540349960327, "step": 3985, "valid_targets_mean": 2738.8, "valid_targets_min": 905 }, { "epoch": 6.373801916932908, "grad_norm": 0.8866650690614957, "learning_rate": 9.724784218740524e-07, "loss": 0.2823, "loss_nan_ranks": 0, "loss_rank_avg": 0.28500303626060486, "step": 3990, "valid_targets_mean": 2653.4, "valid_targets_min": 811 }, { "epoch": 6.381789137380192, "grad_norm": 0.9347856270629038, "learning_rate": 9.480869860055364e-07, "loss": 0.2779, "loss_nan_ranks": 0, "loss_rank_avg": 0.27928462624549866, "step": 3995, "valid_targets_mean": 2648.6, "valid_targets_min": 617 }, { "epoch": 6.389776357827476, "grad_norm": 1.0017367851930086, "learning_rate": 9.239979100526763e-07, "loss": 0.2736, "loss_nan_ranks": 0, "loss_rank_avg": 0.29938584566116333, "step": 4000, "valid_targets_mean": 2246.9, "valid_targets_min": 993 }, { "epoch": 6.397763578274761, "grad_norm": 0.8659652867802654, "learning_rate": 9.002115763167585e-07, "loss": 0.2906, "loss_nan_ranks": 0, "loss_rank_avg": 0.3003730773925781, "step": 4005, "valid_targets_mean": 2882.9, "valid_targets_min": 1010 }, { "epoch": 6.405750798722044, "grad_norm": 0.9034083580157991, "learning_rate": 8.7672836229447e-07, "loss": 0.2764, "loss_nan_ranks": 0, "loss_rank_avg": 0.2945745289325714, "step": 4010, "valid_targets_mean": 2482.9, "valid_targets_min": 1156 }, { "epoch": 6.413738019169329, "grad_norm": 0.8927648422059912, "learning_rate": 8.535486406718684e-07, "loss": 0.2729, "loss_nan_ranks": 0, "loss_rank_avg": 0.2580193877220154, "step": 4015, "valid_targets_mean": 2508.5, "valid_targets_min": 763 }, { "epoch": 6.421725239616613, "grad_norm": 0.9879607023550055, "learning_rate": 8.306727793185132e-07, "loss": 0.2887, "loss_nan_ranks": 0, "loss_rank_avg": 0.2995275557041168, "step": 4020, "valid_targets_mean": 2534.1, "valid_targets_min": 1082 }, { "epoch": 6.4297124600638975, "grad_norm": 0.7936525585301886, "learning_rate": 8.081011412815965e-07, "loss": 0.2817, "loss_nan_ranks": 0, "loss_rank_avg": 0.29689520597457886, "step": 4025, "valid_targets_mean": 4021.8, "valid_targets_min": 1473 }, { "epoch": 6.437699680511182, "grad_norm": 0.8966996505296543, "learning_rate": 7.858340847801815e-07, "loss": 0.2916, "loss_nan_ranks": 0, "loss_rank_avg": 0.32515469193458557, "step": 4030, "valid_targets_mean": 2741.1, "valid_targets_min": 1039 }, { "epoch": 6.445686900958466, "grad_norm": 1.0500500173826224, "learning_rate": 7.638719631995406e-07, "loss": 0.2742, "loss_nan_ranks": 0, "loss_rank_avg": 0.28945955634117126, "step": 4035, "valid_targets_mean": 2265.1, "valid_targets_min": 797 }, { "epoch": 6.453674121405751, "grad_norm": 0.7971219075331492, "learning_rate": 7.422151250855214e-07, "loss": 0.2942, "loss_nan_ranks": 0, "loss_rank_avg": 0.2784157693386078, "step": 4040, "valid_targets_mean": 3321.6, "valid_targets_min": 1364 }, { "epoch": 6.461661341853035, "grad_norm": 0.8249509940299007, "learning_rate": 7.208639141390295e-07, "loss": 0.2888, "loss_nan_ranks": 0, "loss_rank_avg": 0.2764117121696472, "step": 4045, "valid_targets_mean": 2801.1, "valid_targets_min": 1112 }, { "epoch": 6.4696485623003195, "grad_norm": 0.6754399283991835, "learning_rate": 6.998186692105657e-07, "loss": 0.3245, "loss_nan_ranks": 0, "loss_rank_avg": 0.3034869134426117, "step": 4050, "valid_targets_mean": 4446.3, "valid_targets_min": 1249 }, { "epoch": 6.477635782747604, "grad_norm": 0.8541733280528224, "learning_rate": 6.790797242948644e-07, "loss": 0.2811, "loss_nan_ranks": 0, "loss_rank_avg": 0.28104281425476074, "step": 4055, "valid_targets_mean": 2924.0, "valid_targets_min": 1210 }, { "epoch": 6.485623003194888, "grad_norm": 0.8991862823370763, "learning_rate": 6.5864740852557e-07, "loss": 0.2878, "loss_nan_ranks": 0, "loss_rank_avg": 0.29677364230155945, "step": 4060, "valid_targets_mean": 2876.8, "valid_targets_min": 1021 }, { "epoch": 6.493610223642173, "grad_norm": 0.923502088444072, "learning_rate": 6.385220461700248e-07, "loss": 0.296, "loss_nan_ranks": 0, "loss_rank_avg": 0.2582230865955353, "step": 4065, "valid_targets_mean": 2419.9, "valid_targets_min": 1113 }, { "epoch": 6.501597444089457, "grad_norm": 0.8923137741720667, "learning_rate": 6.187039566241337e-07, "loss": 0.2754, "loss_nan_ranks": 0, "loss_rank_avg": 0.29919350147247314, "step": 4070, "valid_targets_mean": 2512.4, "valid_targets_min": 1190 }, { "epoch": 6.5095846645367414, "grad_norm": 0.947003285788988, "learning_rate": 5.99193454407272e-07, "loss": 0.2744, "loss_nan_ranks": 0, "loss_rank_avg": 0.25678086280822754, "step": 4075, "valid_targets_mean": 2908.8, "valid_targets_min": 852 }, { "epoch": 6.517571884984026, "grad_norm": 0.9290365545693675, "learning_rate": 5.799908491573148e-07, "loss": 0.2671, "loss_nan_ranks": 0, "loss_rank_avg": 0.2681635618209839, "step": 4080, "valid_targets_mean": 2875.2, "valid_targets_min": 1035 }, { "epoch": 6.52555910543131, "grad_norm": 0.8055510758263922, "learning_rate": 5.610964456257107e-07, "loss": 0.2822, "loss_nan_ranks": 0, "loss_rank_avg": 0.3032207787036896, "step": 4085, "valid_targets_mean": 3016.1, "valid_targets_min": 860 }, { "epoch": 6.533546325878595, "grad_norm": 0.8661559196905022, "learning_rate": 5.425105436726496e-07, "loss": 0.2812, "loss_nan_ranks": 0, "loss_rank_avg": 0.3192429542541504, "step": 4090, "valid_targets_mean": 3199.2, "valid_targets_min": 1193 }, { "epoch": 6.541533546325878, "grad_norm": 0.8334359620774163, "learning_rate": 5.242334382623004e-07, "loss": 0.2795, "loss_nan_ranks": 0, "loss_rank_avg": 0.2644953727722168, "step": 4095, "valid_targets_mean": 2952.7, "valid_targets_min": 1006 }, { "epoch": 6.549520766773163, "grad_norm": 0.8345711981656436, "learning_rate": 5.062654194581429e-07, "loss": 0.2858, "loss_nan_ranks": 0, "loss_rank_avg": 0.2751539349555969, "step": 4100, "valid_targets_mean": 2936.6, "valid_targets_min": 1057 }, { "epoch": 6.557507987220447, "grad_norm": 0.8249390721549272, "learning_rate": 4.88606772418343e-07, "loss": 0.2711, "loss_nan_ranks": 0, "loss_rank_avg": 0.27628517150878906, "step": 4105, "valid_targets_mean": 3009.9, "valid_targets_min": 1232 }, { "epoch": 6.565495207667731, "grad_norm": 0.8906179256977498, "learning_rate": 4.7125777739123857e-07, "loss": 0.2899, "loss_nan_ranks": 0, "loss_rank_avg": 0.26204580068588257, "step": 4110, "valid_targets_mean": 2616.2, "valid_targets_min": 786 }, { "epoch": 6.573482428115016, "grad_norm": 0.9564767125815427, "learning_rate": 4.54218709710903e-07, "loss": 0.2856, "loss_nan_ranks": 0, "loss_rank_avg": 0.27267003059387207, "step": 4115, "valid_targets_mean": 2530.6, "valid_targets_min": 835 }, { "epoch": 6.5814696485623, "grad_norm": 1.0097256008643347, "learning_rate": 4.374898397927507e-07, "loss": 0.2909, "loss_nan_ranks": 0, "loss_rank_avg": 0.280648410320282, "step": 4120, "valid_targets_mean": 2028.9, "valid_targets_min": 879 }, { "epoch": 6.5894568690095845, "grad_norm": 0.7910653764082966, "learning_rate": 4.210714331292698e-07, "loss": 0.258, "loss_nan_ranks": 0, "loss_rank_avg": 0.25909939408302307, "step": 4125, "valid_targets_mean": 3639.0, "valid_targets_min": 640 }, { "epoch": 6.597444089456869, "grad_norm": 0.8967697560189001, "learning_rate": 4.049637502857895e-07, "loss": 0.2785, "loss_nan_ranks": 0, "loss_rank_avg": 0.31095483899116516, "step": 4130, "valid_targets_mean": 2755.9, "valid_targets_min": 1118 }, { "epoch": 6.605431309904153, "grad_norm": 0.8044131928051629, "learning_rate": 3.8916704689635707e-07, "loss": 0.3011, "loss_nan_ranks": 0, "loss_rank_avg": 0.26935964822769165, "step": 4135, "valid_targets_mean": 3220.1, "valid_targets_min": 715 }, { "epoch": 6.613418530351438, "grad_norm": 0.9486702138753735, "learning_rate": 3.736815736596766e-07, "loss": 0.2782, "loss_nan_ranks": 0, "loss_rank_avg": 0.262970507144928, "step": 4140, "valid_targets_mean": 2247.6, "valid_targets_min": 1247 }, { "epoch": 6.621405750798722, "grad_norm": 0.9444733020979281, "learning_rate": 3.5850757633513424e-07, "loss": 0.276, "loss_nan_ranks": 0, "loss_rank_avg": 0.2954460382461548, "step": 4145, "valid_targets_mean": 2492.8, "valid_targets_min": 960 }, { "epoch": 6.6293929712460065, "grad_norm": 0.8264663607471652, "learning_rate": 3.4364529573888803e-07, "loss": 0.2721, "loss_nan_ranks": 0, "loss_rank_avg": 0.2821193337440491, "step": 4150, "valid_targets_mean": 3666.4, "valid_targets_min": 1362 }, { "epoch": 6.637380191693291, "grad_norm": 0.7883252732780124, "learning_rate": 3.2909496774005344e-07, "loss": 0.267, "loss_nan_ranks": 0, "loss_rank_avg": 0.24705815315246582, "step": 4155, "valid_targets_mean": 3010.6, "valid_targets_min": 760 }, { "epoch": 6.645367412140575, "grad_norm": 0.8581251837834798, "learning_rate": 3.14856823256966e-07, "loss": 0.2673, "loss_nan_ranks": 0, "loss_rank_avg": 0.2624890208244324, "step": 4160, "valid_targets_mean": 2668.6, "valid_targets_min": 1019 }, { "epoch": 6.65335463258786, "grad_norm": 0.8240095528399365, "learning_rate": 3.009310882534999e-07, "loss": 0.2887, "loss_nan_ranks": 0, "loss_rank_avg": 0.29036304354667664, "step": 4165, "valid_targets_mean": 2824.6, "valid_targets_min": 963 }, { "epoch": 6.661341853035144, "grad_norm": 0.7516190273322936, "learning_rate": 2.8731798373550004e-07, "loss": 0.2718, "loss_nan_ranks": 0, "loss_rank_avg": 0.25370168685913086, "step": 4170, "valid_targets_mean": 3306.3, "valid_targets_min": 1047 }, { "epoch": 6.669329073482428, "grad_norm": 0.9547075812225164, "learning_rate": 2.740177257472576e-07, "loss": 0.2878, "loss_nan_ranks": 0, "loss_rank_avg": 0.3222120404243469, "step": 4175, "valid_targets_mean": 2726.6, "valid_targets_min": 1220 }, { "epoch": 6.677316293929713, "grad_norm": 0.9147687950227396, "learning_rate": 2.6103052536810226e-07, "loss": 0.28, "loss_nan_ranks": 0, "loss_rank_avg": 0.2797955274581909, "step": 4180, "valid_targets_mean": 2509.3, "valid_targets_min": 1157 }, { "epoch": 6.685303514376997, "grad_norm": 0.9628729966351203, "learning_rate": 2.4835658870902226e-07, "loss": 0.2845, "loss_nan_ranks": 0, "loss_rank_avg": 0.3168693780899048, "step": 4185, "valid_targets_mean": 2480.8, "valid_targets_min": 891 }, { "epoch": 6.693290734824281, "grad_norm": 0.9351117480178864, "learning_rate": 2.3599611690943158e-07, "loss": 0.2892, "loss_nan_ranks": 0, "loss_rank_avg": 0.3047877848148346, "step": 4190, "valid_targets_mean": 2964.2, "valid_targets_min": 1300 }, { "epoch": 6.701277955271565, "grad_norm": 1.0413196442161707, "learning_rate": 2.2394930613393927e-07, "loss": 0.2694, "loss_nan_ranks": 0, "loss_rank_avg": 0.2819758653640747, "step": 4195, "valid_targets_mean": 2164.5, "valid_targets_min": 881 }, { "epoch": 6.7092651757188495, "grad_norm": 0.8822261803756162, "learning_rate": 2.122163475692629e-07, "loss": 0.3066, "loss_nan_ranks": 0, "loss_rank_avg": 0.3054836392402649, "step": 4200, "valid_targets_mean": 2828.2, "valid_targets_min": 747 }, { "epoch": 6.717252396166134, "grad_norm": 1.3216177064624284, "learning_rate": 2.0079742742118878e-07, "loss": 0.2851, "loss_nan_ranks": 0, "loss_rank_avg": 0.2610338032245636, "step": 4205, "valid_targets_mean": 3650.8, "valid_targets_min": 1250 }, { "epoch": 6.725239616613418, "grad_norm": 0.9383861038544505, "learning_rate": 1.8969272691160334e-07, "loss": 0.2716, "loss_nan_ranks": 0, "loss_rank_avg": 0.30719295144081116, "step": 4210, "valid_targets_mean": 2418.2, "valid_targets_min": 1321 }, { "epoch": 6.733226837060703, "grad_norm": 0.8409922729450794, "learning_rate": 1.789024222756397e-07, "loss": 0.2782, "loss_nan_ranks": 0, "loss_rank_avg": 0.265010803937912, "step": 4215, "valid_targets_mean": 3095.4, "valid_targets_min": 1215 }, { "epoch": 6.741214057507987, "grad_norm": 0.7495800721357617, "learning_rate": 1.6842668475885782e-07, "loss": 0.2866, "loss_nan_ranks": 0, "loss_rank_avg": 0.3141767978668213, "step": 4220, "valid_targets_mean": 4236.1, "valid_targets_min": 1231 }, { "epoch": 6.7492012779552715, "grad_norm": 0.8522557539051201, "learning_rate": 1.582656806145444e-07, "loss": 0.2877, "loss_nan_ranks": 0, "loss_rank_avg": 0.2988400459289551, "step": 4225, "valid_targets_mean": 3127.9, "valid_targets_min": 1049 }, { "epoch": 6.757188498402556, "grad_norm": 0.9893507336164773, "learning_rate": 1.4841957110106388e-07, "loss": 0.2812, "loss_nan_ranks": 0, "loss_rank_avg": 0.28573116660118103, "step": 4230, "valid_targets_mean": 2120.6, "valid_targets_min": 925 }, { "epoch": 6.76517571884984, "grad_norm": 0.9491247142208109, "learning_rate": 1.388885124793049e-07, "loss": 0.2946, "loss_nan_ranks": 0, "loss_rank_avg": 0.31920358538627625, "step": 4235, "valid_targets_mean": 2578.9, "valid_targets_min": 1035 }, { "epoch": 6.773162939297125, "grad_norm": 0.7611128237185949, "learning_rate": 1.2967265601019573e-07, "loss": 0.2865, "loss_nan_ranks": 0, "loss_rank_avg": 0.2846299409866333, "step": 4240, "valid_targets_mean": 3655.2, "valid_targets_min": 1028 }, { "epoch": 6.781150159744409, "grad_norm": 0.9210913647426122, "learning_rate": 1.207721479523105e-07, "loss": 0.2974, "loss_nan_ranks": 0, "loss_rank_avg": 0.35080933570861816, "step": 4245, "valid_targets_mean": 2840.4, "valid_targets_min": 1261 }, { "epoch": 6.789137380191693, "grad_norm": 1.721647903989534, "learning_rate": 1.1218712955954003e-07, "loss": 0.2958, "loss_nan_ranks": 0, "loss_rank_avg": 0.2759488821029663, "step": 4250, "valid_targets_mean": 2726.2, "valid_targets_min": 1174 }, { "epoch": 6.797124600638978, "grad_norm": 0.8118881713456394, "learning_rate": 1.0391773707885578e-07, "loss": 0.2928, "loss_nan_ranks": 0, "loss_rank_avg": 0.3287505507469177, "step": 4255, "valid_targets_mean": 3890.9, "valid_targets_min": 1776 }, { "epoch": 6.805111821086262, "grad_norm": 1.0237761097745328, "learning_rate": 9.596410174814497e-08, "loss": 0.2928, "loss_nan_ranks": 0, "loss_rank_avg": 0.3121640682220459, "step": 4260, "valid_targets_mean": 2273.5, "valid_targets_min": 985 }, { "epoch": 6.813099041533547, "grad_norm": 0.8756144489602926, "learning_rate": 8.83263497941278e-08, "loss": 0.2711, "loss_nan_ranks": 0, "loss_rank_avg": 0.2863563895225525, "step": 4265, "valid_targets_mean": 3378.8, "valid_targets_min": 1177 }, { "epoch": 6.821086261980831, "grad_norm": 0.9055578315212417, "learning_rate": 8.10046024303568e-08, "loss": 0.2796, "loss_nan_ranks": 0, "loss_rank_avg": 0.3192518949508667, "step": 4270, "valid_targets_mean": 2526.4, "valid_targets_min": 866 }, { "epoch": 6.8290734824281145, "grad_norm": 0.828803979329337, "learning_rate": 7.399897585528726e-08, "loss": 0.269, "loss_nan_ranks": 0, "loss_rank_avg": 0.275405615568161, "step": 4275, "valid_targets_mean": 3092.6, "valid_targets_min": 1241 }, { "epoch": 6.8370607028754, "grad_norm": 0.8196124102717052, "learning_rate": 6.730958125044319e-08, "loss": 0.2757, "loss_nan_ranks": 0, "loss_rank_avg": 0.27911484241485596, "step": 4280, "valid_targets_mean": 3558.2, "valid_targets_min": 1120 }, { "epoch": 6.845047923322683, "grad_norm": 0.8901874965419135, "learning_rate": 6.093652477864309e-08, "loss": 0.2778, "loss_nan_ranks": 0, "loss_rank_avg": 0.26097339391708374, "step": 4285, "valid_targets_mean": 3068.0, "valid_targets_min": 1169 }, { "epoch": 6.853035143769968, "grad_norm": 0.8655935287765495, "learning_rate": 5.4879907582316986e-08, "loss": 0.2733, "loss_nan_ranks": 0, "loss_rank_avg": 0.2756623923778534, "step": 4290, "valid_targets_mean": 3080.9, "valid_targets_min": 1257 }, { "epoch": 6.861022364217252, "grad_norm": 0.7648381612652023, "learning_rate": 4.913982578190535e-08, "loss": 0.2739, "loss_nan_ranks": 0, "loss_rank_avg": 0.2539091110229492, "step": 4295, "valid_targets_mean": 3344.6, "valid_targets_min": 1276 }, { "epoch": 6.8690095846645365, "grad_norm": 0.8390658265719673, "learning_rate": 4.3716370474331527e-08, "loss": 0.281, "loss_nan_ranks": 0, "loss_rank_avg": 0.36022868752479553, "step": 4300, "valid_targets_mean": 2998.6, "valid_targets_min": 1162 }, { "epoch": 6.876996805111821, "grad_norm": 0.8055876615636595, "learning_rate": 3.8609627731558405e-08, "loss": 0.2628, "loss_nan_ranks": 0, "loss_rank_avg": 0.24102458357810974, "step": 4305, "valid_targets_mean": 3242.4, "valid_targets_min": 1254 }, { "epoch": 6.884984025559105, "grad_norm": 0.9539831877236683, "learning_rate": 3.381967859920954e-08, "loss": 0.2784, "loss_nan_ranks": 0, "loss_rank_avg": 0.2361864149570465, "step": 4310, "valid_targets_mean": 2221.6, "valid_targets_min": 1262 }, { "epoch": 6.89297124600639, "grad_norm": 0.9029039854454836, "learning_rate": 2.9346599095305685e-08, "loss": 0.2756, "loss_nan_ranks": 0, "loss_rank_avg": 0.3124200999736786, "step": 4315, "valid_targets_mean": 3012.0, "valid_targets_min": 1108 }, { "epoch": 6.900958466453674, "grad_norm": 0.9294252530003244, "learning_rate": 2.5190460209039146e-08, "loss": 0.2994, "loss_nan_ranks": 0, "loss_rank_avg": 0.320919394493103, "step": 4320, "valid_targets_mean": 2418.2, "valid_targets_min": 1051 }, { "epoch": 6.9089456869009584, "grad_norm": 0.8167670634707263, "learning_rate": 2.1351327899656883e-08, "loss": 0.2951, "loss_nan_ranks": 0, "loss_rank_avg": 0.3053489923477173, "step": 4325, "valid_targets_mean": 3051.6, "valid_targets_min": 1233 }, { "epoch": 6.916932907348243, "grad_norm": 0.891874638674044, "learning_rate": 1.782926309540578e-08, "loss": 0.2878, "loss_nan_ranks": 0, "loss_rank_avg": 0.3282131850719452, "step": 4330, "valid_targets_mean": 2809.9, "valid_targets_min": 1303 }, { "epoch": 6.924920127795527, "grad_norm": 0.8436959953986517, "learning_rate": 1.462432169257344e-08, "loss": 0.2854, "loss_nan_ranks": 0, "loss_rank_avg": 0.2719654440879822, "step": 4335, "valid_targets_mean": 3073.7, "valid_targets_min": 1214 }, { "epoch": 6.932907348242812, "grad_norm": 0.8769982264320124, "learning_rate": 1.1736554554604429e-08, "loss": 0.2974, "loss_nan_ranks": 0, "loss_rank_avg": 0.28453394770622253, "step": 4340, "valid_targets_mean": 2600.9, "valid_targets_min": 1517 }, { "epoch": 6.940894568690096, "grad_norm": 0.799917953202752, "learning_rate": 9.166007511274278e-09, "loss": 0.3088, "loss_nan_ranks": 0, "loss_rank_avg": 0.3287510871887207, "step": 4345, "valid_targets_mean": 3648.2, "valid_targets_min": 873 }, { "epoch": 6.94888178913738, "grad_norm": 0.9188207110001246, "learning_rate": 6.912721357985597e-09, "loss": 0.2918, "loss_nan_ranks": 0, "loss_rank_avg": 0.2823947072029114, "step": 4350, "valid_targets_mean": 2750.2, "valid_targets_min": 1078 }, { "epoch": 6.956869009584665, "grad_norm": 0.8966652036625243, "learning_rate": 4.976731855104166e-09, "loss": 0.2733, "loss_nan_ranks": 0, "loss_rank_avg": 0.2613156735897064, "step": 4355, "valid_targets_mean": 2528.8, "valid_targets_min": 909 }, { "epoch": 6.964856230031949, "grad_norm": 0.9156629228599535, "learning_rate": 3.3580697274016028e-09, "loss": 0.2822, "loss_nan_ranks": 0, "loss_rank_avg": 0.30315962433815, "step": 4360, "valid_targets_mean": 2685.6, "valid_targets_min": 1197 }, { "epoch": 6.972843450479234, "grad_norm": 0.7280740965258752, "learning_rate": 2.056760663555757e-09, "loss": 0.2755, "loss_nan_ranks": 0, "loss_rank_avg": 0.2657495141029358, "step": 4365, "valid_targets_mean": 3746.4, "valid_targets_min": 1229 }, { "epoch": 6.980830670926517, "grad_norm": 0.9132105098927803, "learning_rate": 1.0728253157599178e-09, "loss": 0.2854, "loss_nan_ranks": 0, "loss_rank_avg": 0.305087685585022, "step": 4370, "valid_targets_mean": 2696.9, "valid_targets_min": 657 }, { "epoch": 6.988817891373802, "grad_norm": 0.8569350748102568, "learning_rate": 4.062792993786424e-10, "loss": 0.2613, "loss_nan_ranks": 0, "loss_rank_avg": 0.24934561550617218, "step": 4375, "valid_targets_mean": 2357.8, "valid_targets_min": 919 }, { "epoch": 6.996805111821086, "grad_norm": 0.9999686364147095, "learning_rate": 5.7133192707947705e-11, "loss": 0.277, "loss_nan_ranks": 0, "loss_rank_avg": 0.2727892994880676, "step": 4380, "valid_targets_mean": 2353.3, "valid_targets_min": 1390 }, { "epoch": 7.0, "loss_nan_ranks": 0, "loss_rank_avg": 0.24196135997772217, "step": 4382, "total_flos": 881525354463232.0, "train_loss": 0.37171825520364404, "train_runtime": 19745.0516, "train_samples_per_second": 3.548, "train_steps_per_second": 0.222, "valid_targets_mean": 3242.5, "valid_targets_min": 1195 } ], "logging_steps": 5, "max_steps": 4382, "num_input_tokens_seen": 0, "num_train_epochs": 7, "save_steps": 1500, "stateful_callbacks": { "TrainerControl": { "args": { "should_epoch_stop": false, "should_evaluate": false, "should_log": false, "should_save": true, "should_training_stop": true }, "attributes": {} } }, "total_flos": 881525354463232.0, "train_batch_size": 1, "trial_name": null, "trial_params": null }