{ "best_global_step": null, "best_metric": null, "best_model_checkpoint": null, "epoch": 5.0, "eval_steps": 500, "global_step": 1175, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.0042643923240938165, "grad_norm": 2.5366310886513554, "learning_rate": 0.0, "loss": 1.4664, "loss_nan_ranks": 0, "loss_rank_avg": 0.3633503019809723, "step": 1, "valid_targets_mean": 16166.3, "valid_targets_min": 15435 }, { "epoch": 0.008528784648187633, "grad_norm": 2.5801694932581136, "learning_rate": 3.3898305084745766e-07, "loss": 1.4775, "loss_nan_ranks": 0, "loss_rank_avg": 0.43468669056892395, "step": 2, "valid_targets_mean": 16231.4, "valid_targets_min": 15861 }, { "epoch": 0.01279317697228145, "grad_norm": 2.5436827836237237, "learning_rate": 6.779661016949153e-07, "loss": 1.498, "loss_nan_ranks": 0, "loss_rank_avg": 0.32442036271095276, "step": 3, "valid_targets_mean": 12902.7, "valid_targets_min": 9698 }, { "epoch": 0.017057569296375266, "grad_norm": 2.557611495365603, "learning_rate": 1.016949152542373e-06, "loss": 1.5634, "loss_nan_ranks": 0, "loss_rank_avg": 0.38837745785713196, "step": 4, "valid_targets_mean": 16193.7, "valid_targets_min": 15332 }, { "epoch": 0.021321961620469083, "grad_norm": 2.501076169530371, "learning_rate": 1.3559322033898307e-06, "loss": 1.4884, "loss_nan_ranks": 0, "loss_rank_avg": 0.4217827320098877, "step": 5, "valid_targets_mean": 16192.6, "valid_targets_min": 15561 }, { "epoch": 0.0255863539445629, "grad_norm": 2.5083867469645673, "learning_rate": 1.6949152542372882e-06, "loss": 1.4775, "loss_nan_ranks": 0, "loss_rank_avg": 0.33818453550338745, "step": 6, "valid_targets_mean": 14216.8, "valid_targets_min": 11918 }, { "epoch": 0.029850746268656716, "grad_norm": 2.408038285775719, "learning_rate": 2.033898305084746e-06, "loss": 1.4603, "loss_nan_ranks": 0, "loss_rank_avg": 0.44682514667510986, "step": 7, "valid_targets_mean": 15977.0, "valid_targets_min": 14845 }, { "epoch": 0.03411513859275053, "grad_norm": 2.3292454609481386, "learning_rate": 2.372881355932204e-06, "loss": 1.4851, "loss_nan_ranks": 0, "loss_rank_avg": 0.3509920835494995, "step": 8, "valid_targets_mean": 12883.5, "valid_targets_min": 1369 }, { "epoch": 0.03837953091684435, "grad_norm": 1.967700745194145, "learning_rate": 2.7118644067796613e-06, "loss": 1.4199, "loss_nan_ranks": 0, "loss_rank_avg": 0.3503936231136322, "step": 9, "valid_targets_mean": 15800.5, "valid_targets_min": 14349 }, { "epoch": 0.042643923240938165, "grad_norm": 1.8916462786230832, "learning_rate": 3.0508474576271192e-06, "loss": 1.479, "loss_nan_ranks": 0, "loss_rank_avg": 0.43284642696380615, "step": 10, "valid_targets_mean": 16118.9, "valid_targets_min": 15042 }, { "epoch": 0.046908315565031986, "grad_norm": 1.6595343637173545, "learning_rate": 3.3898305084745763e-06, "loss": 1.4307, "loss_nan_ranks": 0, "loss_rank_avg": 0.2499767243862152, "step": 11, "valid_targets_mean": 9185.1, "valid_targets_min": 1758 }, { "epoch": 0.0511727078891258, "grad_norm": 1.5151937956251524, "learning_rate": 3.7288135593220342e-06, "loss": 1.4265, "loss_nan_ranks": 0, "loss_rank_avg": 0.3513546884059906, "step": 12, "valid_targets_mean": 16135.2, "valid_targets_min": 14794 }, { "epoch": 0.05543710021321962, "grad_norm": 1.5292214435231881, "learning_rate": 4.067796610169492e-06, "loss": 1.4258, "loss_nan_ranks": 0, "loss_rank_avg": 0.39262068271636963, "step": 13, "valid_targets_mean": 16090.6, "valid_targets_min": 14826 }, { "epoch": 0.05970149253731343, "grad_norm": 1.393250104462496, "learning_rate": 4.40677966101695e-06, "loss": 1.4146, "loss_nan_ranks": 0, "loss_rank_avg": 0.2585723102092743, "step": 14, "valid_targets_mean": 10057.8, "valid_targets_min": 6101 }, { "epoch": 0.06396588486140725, "grad_norm": 1.1760003188047685, "learning_rate": 4.745762711864408e-06, "loss": 1.4096, "loss_nan_ranks": 0, "loss_rank_avg": 0.38163837790489197, "step": 15, "valid_targets_mean": 16117.9, "valid_targets_min": 14544 }, { "epoch": 0.06823027718550106, "grad_norm": 1.8086044060522266, "learning_rate": 5.084745762711865e-06, "loss": 1.4154, "loss_nan_ranks": 0, "loss_rank_avg": 0.413485050201416, "step": 16, "valid_targets_mean": 16074.6, "valid_targets_min": 14755 }, { "epoch": 0.07249466950959488, "grad_norm": 1.7462651292016687, "learning_rate": 5.423728813559323e-06, "loss": 1.4223, "loss_nan_ranks": 0, "loss_rank_avg": 0.3601645231246948, "step": 17, "valid_targets_mean": 14765.2, "valid_targets_min": 12313 }, { "epoch": 0.0767590618336887, "grad_norm": 1.4910941336606407, "learning_rate": 5.7627118644067805e-06, "loss": 1.3985, "loss_nan_ranks": 0, "loss_rank_avg": 0.3598688840866089, "step": 18, "valid_targets_mean": 16238.3, "valid_targets_min": 15660 }, { "epoch": 0.08102345415778252, "grad_norm": 1.2152389918873905, "learning_rate": 6.1016949152542385e-06, "loss": 1.3569, "loss_nan_ranks": 0, "loss_rank_avg": 0.3777955174446106, "step": 19, "valid_targets_mean": 16181.4, "valid_targets_min": 15422 }, { "epoch": 0.08528784648187633, "grad_norm": 0.9439219563284131, "learning_rate": 6.440677966101695e-06, "loss": 1.4081, "loss_nan_ranks": 0, "loss_rank_avg": 0.3570820689201355, "step": 20, "valid_targets_mean": 15211.0, "valid_targets_min": 13345 }, { "epoch": 0.08955223880597014, "grad_norm": 0.8614841201368815, "learning_rate": 6.779661016949153e-06, "loss": 1.3596, "loss_nan_ranks": 0, "loss_rank_avg": 0.39180970191955566, "step": 21, "valid_targets_mean": 16066.3, "valid_targets_min": 13888 }, { "epoch": 0.09381663113006397, "grad_norm": 0.989712835987842, "learning_rate": 7.1186440677966106e-06, "loss": 1.3796, "loss_nan_ranks": 0, "loss_rank_avg": 0.2866818308830261, "step": 22, "valid_targets_mean": 11589.2, "valid_targets_min": 2526 }, { "epoch": 0.09808102345415778, "grad_norm": 0.8838701674340025, "learning_rate": 7.4576271186440685e-06, "loss": 1.3191, "loss_nan_ranks": 0, "loss_rank_avg": 0.3461511731147766, "step": 23, "valid_targets_mean": 16071.5, "valid_targets_min": 14705 }, { "epoch": 0.1023454157782516, "grad_norm": 0.7102511059049913, "learning_rate": 7.796610169491526e-06, "loss": 1.334, "loss_nan_ranks": 0, "loss_rank_avg": 0.38423407077789307, "step": 24, "valid_targets_mean": 16015.3, "valid_targets_min": 13108 }, { "epoch": 0.10660980810234541, "grad_norm": 0.8200282677360692, "learning_rate": 8.135593220338983e-06, "loss": 1.3382, "loss_nan_ranks": 0, "loss_rank_avg": 0.23730315268039703, "step": 25, "valid_targets_mean": 10277.5, "valid_targets_min": 2154 }, { "epoch": 0.11087420042643924, "grad_norm": 0.7588068868281355, "learning_rate": 8.47457627118644e-06, "loss": 1.3254, "loss_nan_ranks": 0, "loss_rank_avg": 0.360531210899353, "step": 26, "valid_targets_mean": 16022.2, "valid_targets_min": 14908 }, { "epoch": 0.11513859275053305, "grad_norm": 0.6220593529622817, "learning_rate": 8.8135593220339e-06, "loss": 1.3142, "loss_nan_ranks": 0, "loss_rank_avg": 0.35754430294036865, "step": 27, "valid_targets_mean": 16100.3, "valid_targets_min": 13427 }, { "epoch": 0.11940298507462686, "grad_norm": 0.5954017359076195, "learning_rate": 9.152542372881356e-06, "loss": 1.2747, "loss_nan_ranks": 0, "loss_rank_avg": 0.2550112009048462, "step": 28, "valid_targets_mean": 11641.7, "valid_targets_min": 8792 }, { "epoch": 0.12366737739872068, "grad_norm": 0.641528051079028, "learning_rate": 9.491525423728815e-06, "loss": 1.3399, "loss_nan_ranks": 0, "loss_rank_avg": 0.3624398708343506, "step": 29, "valid_targets_mean": 16077.6, "valid_targets_min": 15116 }, { "epoch": 0.1279317697228145, "grad_norm": 0.4920851160355056, "learning_rate": 9.830508474576272e-06, "loss": 1.3, "loss_nan_ranks": 0, "loss_rank_avg": 0.3876349627971649, "step": 30, "valid_targets_mean": 16075.6, "valid_targets_min": 15222 }, { "epoch": 0.13219616204690832, "grad_norm": 0.5222548588184942, "learning_rate": 1.016949152542373e-05, "loss": 1.2629, "loss_nan_ranks": 0, "loss_rank_avg": 0.29042887687683105, "step": 31, "valid_targets_mean": 14641.4, "valid_targets_min": 12602 }, { "epoch": 0.13646055437100213, "grad_norm": 0.5397850083552871, "learning_rate": 1.0508474576271188e-05, "loss": 1.319, "loss_nan_ranks": 0, "loss_rank_avg": 0.3626946806907654, "step": 32, "valid_targets_mean": 16118.6, "valid_targets_min": 14547 }, { "epoch": 0.14072494669509594, "grad_norm": 0.4793360544551292, "learning_rate": 1.0847457627118645e-05, "loss": 1.2598, "loss_nan_ranks": 0, "loss_rank_avg": 0.28542160987854004, "step": 33, "valid_targets_mean": 13292.3, "valid_targets_min": 2298 }, { "epoch": 0.14498933901918976, "grad_norm": 0.45405854099713594, "learning_rate": 1.1186440677966102e-05, "loss": 1.2351, "loss_nan_ranks": 0, "loss_rank_avg": 0.30616092681884766, "step": 34, "valid_targets_mean": 15516.8, "valid_targets_min": 13685 }, { "epoch": 0.14925373134328357, "grad_norm": 0.4319692781535827, "learning_rate": 1.1525423728813561e-05, "loss": 1.2525, "loss_nan_ranks": 0, "loss_rank_avg": 0.3785768747329712, "step": 35, "valid_targets_mean": 16160.1, "valid_targets_min": 15418 }, { "epoch": 0.1535181236673774, "grad_norm": 0.4527662177446445, "learning_rate": 1.1864406779661018e-05, "loss": 1.262, "loss_nan_ranks": 0, "loss_rank_avg": 0.22713381052017212, "step": 36, "valid_targets_mean": 9924.8, "valid_targets_min": 1242 }, { "epoch": 0.15778251599147122, "grad_norm": 0.3765831906436275, "learning_rate": 1.2203389830508477e-05, "loss": 1.2654, "loss_nan_ranks": 0, "loss_rank_avg": 0.30958038568496704, "step": 37, "valid_targets_mean": 16209.8, "valid_targets_min": 15560 }, { "epoch": 0.16204690831556504, "grad_norm": 0.42044497087118887, "learning_rate": 1.2542372881355932e-05, "loss": 1.2353, "loss_nan_ranks": 0, "loss_rank_avg": 0.3550320565700531, "step": 38, "valid_targets_mean": 16175.6, "valid_targets_min": 15189 }, { "epoch": 0.16631130063965885, "grad_norm": 0.39664232457510257, "learning_rate": 1.288135593220339e-05, "loss": 1.287, "loss_nan_ranks": 0, "loss_rank_avg": 0.23336681723594666, "step": 39, "valid_targets_mean": 9991.4, "valid_targets_min": 6726 }, { "epoch": 0.17057569296375266, "grad_norm": 0.39504221280618673, "learning_rate": 1.3220338983050848e-05, "loss": 1.2264, "loss_nan_ranks": 0, "loss_rank_avg": 0.3280348777770996, "step": 40, "valid_targets_mean": 16142.2, "valid_targets_min": 14273 }, { "epoch": 0.17484008528784648, "grad_norm": 0.34053684953238916, "learning_rate": 1.3559322033898305e-05, "loss": 1.2227, "loss_nan_ranks": 0, "loss_rank_avg": 0.33567771315574646, "step": 41, "valid_targets_mean": 16186.6, "valid_targets_min": 14994 }, { "epoch": 0.1791044776119403, "grad_norm": 0.3295620699042012, "learning_rate": 1.3898305084745764e-05, "loss": 1.2683, "loss_nan_ranks": 0, "loss_rank_avg": 0.27557477355003357, "step": 42, "valid_targets_mean": 13378.8, "valid_targets_min": 11254 }, { "epoch": 0.18336886993603413, "grad_norm": 0.3280221166685567, "learning_rate": 1.4237288135593221e-05, "loss": 1.2093, "loss_nan_ranks": 0, "loss_rank_avg": 0.34312349557876587, "step": 43, "valid_targets_mean": 16160.8, "valid_targets_min": 15560 }, { "epoch": 0.18763326226012794, "grad_norm": 0.32067396279656807, "learning_rate": 1.4576271186440678e-05, "loss": 1.1888, "loss_nan_ranks": 0, "loss_rank_avg": 0.31136569380760193, "step": 44, "valid_targets_mean": 16207.8, "valid_targets_min": 14732 }, { "epoch": 0.19189765458422176, "grad_norm": 0.3204956775534723, "learning_rate": 1.4915254237288137e-05, "loss": 1.3217, "loss_nan_ranks": 0, "loss_rank_avg": 0.32411104440689087, "step": 45, "valid_targets_mean": 14813.5, "valid_targets_min": 13169 }, { "epoch": 0.19616204690831557, "grad_norm": 0.31309834097280076, "learning_rate": 1.5254237288135594e-05, "loss": 1.1979, "loss_nan_ranks": 0, "loss_rank_avg": 0.3351410925388336, "step": 46, "valid_targets_mean": 16167.5, "valid_targets_min": 14831 }, { "epoch": 0.20042643923240938, "grad_norm": 0.3062761729865377, "learning_rate": 1.5593220338983053e-05, "loss": 1.2702, "loss_nan_ranks": 0, "loss_rank_avg": 0.2603297829627991, "step": 47, "valid_targets_mean": 11703.6, "valid_targets_min": 3390 }, { "epoch": 0.2046908315565032, "grad_norm": 0.3059044906159298, "learning_rate": 1.593220338983051e-05, "loss": 1.2089, "loss_nan_ranks": 0, "loss_rank_avg": 0.31020739674568176, "step": 48, "valid_targets_mean": 15695.9, "valid_targets_min": 14068 }, { "epoch": 0.208955223880597, "grad_norm": 0.29729679774217543, "learning_rate": 1.6271186440677967e-05, "loss": 1.2575, "loss_nan_ranks": 0, "loss_rank_avg": 0.3794437348842621, "step": 49, "valid_targets_mean": 16029.5, "valid_targets_min": 13688 }, { "epoch": 0.21321961620469082, "grad_norm": 0.28568244337662785, "learning_rate": 1.6610169491525424e-05, "loss": 1.22, "loss_nan_ranks": 0, "loss_rank_avg": 0.17967450618743896, "step": 50, "valid_targets_mean": 7348.0, "valid_targets_min": 1535 }, { "epoch": 0.21748400852878466, "grad_norm": 0.30679422108986126, "learning_rate": 1.694915254237288e-05, "loss": 1.1838, "loss_nan_ranks": 0, "loss_rank_avg": 0.30095893144607544, "step": 51, "valid_targets_mean": 16203.1, "valid_targets_min": 15803 }, { "epoch": 0.22174840085287847, "grad_norm": 0.30903751456062006, "learning_rate": 1.728813559322034e-05, "loss": 1.2364, "loss_nan_ranks": 0, "loss_rank_avg": 0.36445748805999756, "step": 52, "valid_targets_mean": 16132.4, "valid_targets_min": 15171 }, { "epoch": 0.2260127931769723, "grad_norm": 0.2734644653742701, "learning_rate": 1.76271186440678e-05, "loss": 1.2401, "loss_nan_ranks": 0, "loss_rank_avg": 0.2611805200576782, "step": 53, "valid_targets_mean": 12511.2, "valid_targets_min": 10082 }, { "epoch": 0.2302771855010661, "grad_norm": 0.296167365405311, "learning_rate": 1.7966101694915256e-05, "loss": 1.2035, "loss_nan_ranks": 0, "loss_rank_avg": 0.33024922013282776, "step": 54, "valid_targets_mean": 16137.9, "valid_targets_min": 14934 }, { "epoch": 0.2345415778251599, "grad_norm": 0.2857314835724685, "learning_rate": 1.8305084745762713e-05, "loss": 1.2213, "loss_nan_ranks": 0, "loss_rank_avg": 0.36636629700660706, "step": 55, "valid_targets_mean": 16097.3, "valid_targets_min": 15345 }, { "epoch": 0.23880597014925373, "grad_norm": 0.30832952787337065, "learning_rate": 1.864406779661017e-05, "loss": 1.2059, "loss_nan_ranks": 0, "loss_rank_avg": 0.2799396216869354, "step": 56, "valid_targets_mean": 14551.7, "valid_targets_min": 12631 }, { "epoch": 0.24307036247334754, "grad_norm": 0.2742963507475523, "learning_rate": 1.898305084745763e-05, "loss": 1.2492, "loss_nan_ranks": 0, "loss_rank_avg": 0.33785948157310486, "step": 57, "valid_targets_mean": 15843.4, "valid_targets_min": 9286 }, { "epoch": 0.24733475479744135, "grad_norm": 0.3353292347627481, "learning_rate": 1.9322033898305087e-05, "loss": 1.1739, "loss_nan_ranks": 0, "loss_rank_avg": 0.30091214179992676, "step": 58, "valid_targets_mean": 13183.4, "valid_targets_min": 2731 }, { "epoch": 0.2515991471215352, "grad_norm": 0.28940885000192057, "learning_rate": 1.9661016949152545e-05, "loss": 1.2328, "loss_nan_ranks": 0, "loss_rank_avg": 0.3025071620941162, "step": 59, "valid_targets_mean": 15810.2, "valid_targets_min": 14420 }, { "epoch": 0.255863539445629, "grad_norm": 0.3158097390368932, "learning_rate": 2e-05, "loss": 1.1723, "loss_nan_ranks": 0, "loss_rank_avg": 0.34030646085739136, "step": 60, "valid_targets_mean": 16229.3, "valid_targets_min": 15657 }, { "epoch": 0.2601279317697228, "grad_norm": 0.3421290994544124, "learning_rate": 2.033898305084746e-05, "loss": 1.2155, "loss_nan_ranks": 0, "loss_rank_avg": 0.2056933045387268, "step": 61, "valid_targets_mean": 8622.5, "valid_targets_min": 1160 }, { "epoch": 0.26439232409381663, "grad_norm": 0.2840875671625852, "learning_rate": 2.0677966101694916e-05, "loss": 1.2035, "loss_nan_ranks": 0, "loss_rank_avg": 0.3078186511993408, "step": 62, "valid_targets_mean": 16106.1, "valid_targets_min": 14943 }, { "epoch": 0.26865671641791045, "grad_norm": 0.36023223069817156, "learning_rate": 2.1016949152542376e-05, "loss": 1.1707, "loss_nan_ranks": 0, "loss_rank_avg": 0.34042203426361084, "step": 63, "valid_targets_mean": 16136.8, "valid_targets_min": 15314 }, { "epoch": 0.27292110874200426, "grad_norm": 0.3230768382997439, "learning_rate": 2.1355932203389833e-05, "loss": 1.2295, "loss_nan_ranks": 0, "loss_rank_avg": 0.2322762906551361, "step": 64, "valid_targets_mean": 10336.6, "valid_targets_min": 5623 }, { "epoch": 0.2771855010660981, "grad_norm": 0.3201591381046788, "learning_rate": 2.169491525423729e-05, "loss": 1.1718, "loss_nan_ranks": 0, "loss_rank_avg": 0.3034995496273041, "step": 65, "valid_targets_mean": 16176.8, "valid_targets_min": 15278 }, { "epoch": 0.2814498933901919, "grad_norm": 0.3665430118978998, "learning_rate": 2.2033898305084748e-05, "loss": 1.162, "loss_nan_ranks": 0, "loss_rank_avg": 0.35378801822662354, "step": 66, "valid_targets_mean": 16186.6, "valid_targets_min": 15380 }, { "epoch": 0.2857142857142857, "grad_norm": 0.29217465033844975, "learning_rate": 2.2372881355932205e-05, "loss": 1.206, "loss_nan_ranks": 0, "loss_rank_avg": 0.2516692280769348, "step": 67, "valid_targets_mean": 12693.9, "valid_targets_min": 10543 }, { "epoch": 0.2899786780383795, "grad_norm": 0.411568614568208, "learning_rate": 2.2711864406779665e-05, "loss": 1.1956, "loss_nan_ranks": 0, "loss_rank_avg": 0.3390015661716461, "step": 68, "valid_targets_mean": 16133.4, "valid_targets_min": 15452 }, { "epoch": 0.2942430703624733, "grad_norm": 0.34592991350624464, "learning_rate": 2.3050847457627122e-05, "loss": 1.1607, "loss_nan_ranks": 0, "loss_rank_avg": 0.3600677251815796, "step": 69, "valid_targets_mean": 16142.4, "valid_targets_min": 15328 }, { "epoch": 0.29850746268656714, "grad_norm": 0.4123090858740144, "learning_rate": 2.338983050847458e-05, "loss": 1.2265, "loss_nan_ranks": 0, "loss_rank_avg": 0.28057190775871277, "step": 70, "valid_targets_mean": 14594.2, "valid_targets_min": 13086 }, { "epoch": 0.302771855010661, "grad_norm": 0.4890966579587274, "learning_rate": 2.3728813559322036e-05, "loss": 1.1575, "loss_nan_ranks": 0, "loss_rank_avg": 0.3367359936237335, "step": 71, "valid_targets_mean": 16185.4, "valid_targets_min": 15260 }, { "epoch": 0.3070362473347548, "grad_norm": 0.4147372197442472, "learning_rate": 2.406779661016949e-05, "loss": 1.2517, "loss_nan_ranks": 0, "loss_rank_avg": 0.253772497177124, "step": 72, "valid_targets_mean": 11549.2, "valid_targets_min": 1417 }, { "epoch": 0.31130063965884863, "grad_norm": 0.3466568226950996, "learning_rate": 2.4406779661016954e-05, "loss": 1.2116, "loss_nan_ranks": 0, "loss_rank_avg": 0.3072333335876465, "step": 73, "valid_targets_mean": 16113.0, "valid_targets_min": 13998 }, { "epoch": 0.31556503198294245, "grad_norm": 0.42271407097276814, "learning_rate": 2.474576271186441e-05, "loss": 1.1922, "loss_nan_ranks": 0, "loss_rank_avg": 0.31899935007095337, "step": 74, "valid_targets_mean": 16215.8, "valid_targets_min": 15958 }, { "epoch": 0.31982942430703626, "grad_norm": 0.4615831928578139, "learning_rate": 2.5084745762711865e-05, "loss": 1.2115, "loss_nan_ranks": 0, "loss_rank_avg": 0.17871591448783875, "step": 75, "valid_targets_mean": 8364.3, "valid_targets_min": 2376 }, { "epoch": 0.32409381663113007, "grad_norm": 0.4916646150801305, "learning_rate": 2.5423728813559322e-05, "loss": 1.1658, "loss_nan_ranks": 0, "loss_rank_avg": 0.3067433834075928, "step": 76, "valid_targets_mean": 16091.7, "valid_targets_min": 14826 }, { "epoch": 0.3283582089552239, "grad_norm": 0.3818058190469012, "learning_rate": 2.576271186440678e-05, "loss": 1.1853, "loss_nan_ranks": 0, "loss_rank_avg": 0.34559395909309387, "step": 77, "valid_targets_mean": 16167.6, "valid_targets_min": 15351 }, { "epoch": 0.3326226012793177, "grad_norm": 0.5328297519583807, "learning_rate": 2.610169491525424e-05, "loss": 1.1718, "loss_nan_ranks": 0, "loss_rank_avg": 0.23474229872226715, "step": 78, "valid_targets_mean": 12202.2, "valid_targets_min": 8376 }, { "epoch": 0.3368869936034115, "grad_norm": 0.4530723381013144, "learning_rate": 2.6440677966101696e-05, "loss": 1.1892, "loss_nan_ranks": 0, "loss_rank_avg": 0.31477317214012146, "step": 79, "valid_targets_mean": 16147.0, "valid_targets_min": 15397 }, { "epoch": 0.3411513859275053, "grad_norm": 0.37980374625899643, "learning_rate": 2.6779661016949153e-05, "loss": 1.1893, "loss_nan_ranks": 0, "loss_rank_avg": 0.34435707330703735, "step": 80, "valid_targets_mean": 16172.6, "valid_targets_min": 14636 }, { "epoch": 0.34541577825159914, "grad_norm": 0.443903919371291, "learning_rate": 2.711864406779661e-05, "loss": 1.2273, "loss_nan_ranks": 0, "loss_rank_avg": 0.2900157868862152, "step": 81, "valid_targets_mean": 14128.0, "valid_targets_min": 10472 }, { "epoch": 0.34968017057569295, "grad_norm": 0.42006078121550716, "learning_rate": 2.7457627118644068e-05, "loss": 1.1602, "loss_nan_ranks": 0, "loss_rank_avg": 0.34231239557266235, "step": 82, "valid_targets_mean": 16067.8, "valid_targets_min": 15370 }, { "epoch": 0.35394456289978676, "grad_norm": 0.4771362126592886, "learning_rate": 2.7796610169491528e-05, "loss": 1.1927, "loss_nan_ranks": 0, "loss_rank_avg": 0.29910576343536377, "step": 83, "valid_targets_mean": 13262.2, "valid_targets_min": 2435 }, { "epoch": 0.3582089552238806, "grad_norm": 0.5188342182814704, "learning_rate": 2.8135593220338985e-05, "loss": 1.1403, "loss_nan_ranks": 0, "loss_rank_avg": 0.2677900195121765, "step": 84, "valid_targets_mean": 15934.3, "valid_targets_min": 14185 }, { "epoch": 0.3624733475479744, "grad_norm": 0.44679103859423375, "learning_rate": 2.8474576271186442e-05, "loss": 1.2264, "loss_nan_ranks": 0, "loss_rank_avg": 0.36229631304740906, "step": 85, "valid_targets_mean": 16101.3, "valid_targets_min": 14897 }, { "epoch": 0.36673773987206826, "grad_norm": 0.5537923610373594, "learning_rate": 2.88135593220339e-05, "loss": 1.221, "loss_nan_ranks": 0, "loss_rank_avg": 0.2012385129928589, "step": 86, "valid_targets_mean": 9425.7, "valid_targets_min": 1851 }, { "epoch": 0.37100213219616207, "grad_norm": 0.40877363516574183, "learning_rate": 2.9152542372881356e-05, "loss": 1.1826, "loss_nan_ranks": 0, "loss_rank_avg": 0.3085198998451233, "step": 87, "valid_targets_mean": 16128.9, "valid_targets_min": 15263 }, { "epoch": 0.3752665245202559, "grad_norm": 0.531131956607798, "learning_rate": 2.9491525423728817e-05, "loss": 1.1847, "loss_nan_ranks": 0, "loss_rank_avg": 0.3547207713127136, "step": 88, "valid_targets_mean": 16217.1, "valid_targets_min": 15697 }, { "epoch": 0.3795309168443497, "grad_norm": 0.4821539701368115, "learning_rate": 2.9830508474576274e-05, "loss": 1.1545, "loss_nan_ranks": 0, "loss_rank_avg": 0.20888623595237732, "step": 89, "valid_targets_mean": 10271.9, "valid_targets_min": 5871 }, { "epoch": 0.3837953091684435, "grad_norm": 0.44479347429852767, "learning_rate": 3.016949152542373e-05, "loss": 1.195, "loss_nan_ranks": 0, "loss_rank_avg": 0.3040030598640442, "step": 90, "valid_targets_mean": 16159.1, "valid_targets_min": 15337 }, { "epoch": 0.3880597014925373, "grad_norm": 0.49611777623662034, "learning_rate": 3.0508474576271188e-05, "loss": 1.1665, "loss_nan_ranks": 0, "loss_rank_avg": 0.36148935556411743, "step": 91, "valid_targets_mean": 16088.1, "valid_targets_min": 14827 }, { "epoch": 0.39232409381663114, "grad_norm": 0.47030432730526317, "learning_rate": 3.084745762711865e-05, "loss": 1.2088, "loss_nan_ranks": 0, "loss_rank_avg": 0.27276670932769775, "step": 92, "valid_targets_mean": 13574.6, "valid_targets_min": 10444 }, { "epoch": 0.39658848614072495, "grad_norm": 0.45488608147303355, "learning_rate": 3.1186440677966106e-05, "loss": 1.1785, "loss_nan_ranks": 0, "loss_rank_avg": 0.33878713846206665, "step": 93, "valid_targets_mean": 16158.7, "valid_targets_min": 15460 }, { "epoch": 0.40085287846481876, "grad_norm": 0.485936892703445, "learning_rate": 3.152542372881356e-05, "loss": 1.1511, "loss_nan_ranks": 0, "loss_rank_avg": 0.34667015075683594, "step": 94, "valid_targets_mean": 16128.6, "valid_targets_min": 13927 }, { "epoch": 0.4051172707889126, "grad_norm": 0.39962744663044864, "learning_rate": 3.186440677966102e-05, "loss": 1.1833, "loss_nan_ranks": 0, "loss_rank_avg": 0.29390081763267517, "step": 95, "valid_targets_mean": 15844.7, "valid_targets_min": 14737 }, { "epoch": 0.4093816631130064, "grad_norm": 0.4535828391796072, "learning_rate": 3.2203389830508473e-05, "loss": 1.2341, "loss_nan_ranks": 0, "loss_rank_avg": 0.3389269709587097, "step": 96, "valid_targets_mean": 16087.4, "valid_targets_min": 13635 }, { "epoch": 0.4136460554371002, "grad_norm": 0.4208222066539856, "learning_rate": 3.2542372881355934e-05, "loss": 1.1837, "loss_nan_ranks": 0, "loss_rank_avg": 0.23698459565639496, "step": 97, "valid_targets_mean": 10771.6, "valid_targets_min": 1136 }, { "epoch": 0.417910447761194, "grad_norm": 0.6033426037267763, "learning_rate": 3.2881355932203394e-05, "loss": 1.1683, "loss_nan_ranks": 0, "loss_rank_avg": 0.29125797748565674, "step": 98, "valid_targets_mean": 15845.2, "valid_targets_min": 14972 }, { "epoch": 0.42217484008528783, "grad_norm": 0.6430996304411255, "learning_rate": 3.322033898305085e-05, "loss": 1.1804, "loss_nan_ranks": 0, "loss_rank_avg": 0.3551673889160156, "step": 99, "valid_targets_mean": 16180.6, "valid_targets_min": 15678 }, { "epoch": 0.42643923240938164, "grad_norm": 0.565665763179061, "learning_rate": 3.355932203389831e-05, "loss": 1.1789, "loss_nan_ranks": 0, "loss_rank_avg": 0.19581037759780884, "step": 100, "valid_targets_mean": 8886.4, "valid_targets_min": 2484 }, { "epoch": 0.43070362473347545, "grad_norm": 0.5396605416088711, "learning_rate": 3.389830508474576e-05, "loss": 1.1322, "loss_nan_ranks": 0, "loss_rank_avg": 0.27528661489486694, "step": 101, "valid_targets_mean": 16190.2, "valid_targets_min": 15322 }, { "epoch": 0.4349680170575693, "grad_norm": 0.872782047618966, "learning_rate": 3.423728813559322e-05, "loss": 1.1835, "loss_nan_ranks": 0, "loss_rank_avg": 0.3470345437526703, "step": 102, "valid_targets_mean": 16177.2, "valid_targets_min": 15635 }, { "epoch": 0.43923240938166314, "grad_norm": 1.0278755291690116, "learning_rate": 3.457627118644068e-05, "loss": 1.1275, "loss_nan_ranks": 0, "loss_rank_avg": 0.23301859200000763, "step": 103, "valid_targets_mean": 12241.3, "valid_targets_min": 9421 }, { "epoch": 0.44349680170575695, "grad_norm": 0.7125446740464207, "learning_rate": 3.491525423728814e-05, "loss": 1.1447, "loss_nan_ranks": 0, "loss_rank_avg": 0.29817789793014526, "step": 104, "valid_targets_mean": 16131.7, "valid_targets_min": 15263 }, { "epoch": 0.44776119402985076, "grad_norm": 0.5563012628453976, "learning_rate": 3.52542372881356e-05, "loss": 1.1743, "loss_nan_ranks": 0, "loss_rank_avg": 0.3532581329345703, "step": 105, "valid_targets_mean": 15808.0, "valid_targets_min": 5994 }, { "epoch": 0.4520255863539446, "grad_norm": 0.5790943913836976, "learning_rate": 3.559322033898305e-05, "loss": 1.2051, "loss_nan_ranks": 0, "loss_rank_avg": 0.2807878851890564, "step": 106, "valid_targets_mean": 14647.7, "valid_targets_min": 12782 }, { "epoch": 0.4562899786780384, "grad_norm": 0.44736003462007023, "learning_rate": 3.593220338983051e-05, "loss": 1.1903, "loss_nan_ranks": 0, "loss_rank_avg": 0.3288416862487793, "step": 107, "valid_targets_mean": 16161.3, "valid_targets_min": 15446 }, { "epoch": 0.4605543710021322, "grad_norm": 0.5622289779961762, "learning_rate": 3.627118644067797e-05, "loss": 1.1981, "loss_nan_ranks": 0, "loss_rank_avg": 0.28626295924186707, "step": 108, "valid_targets_mean": 12701.5, "valid_targets_min": 755 }, { "epoch": 0.464818763326226, "grad_norm": 0.6298643931105169, "learning_rate": 3.6610169491525426e-05, "loss": 1.1212, "loss_nan_ranks": 0, "loss_rank_avg": 0.27614328265190125, "step": 109, "valid_targets_mean": 15305.1, "valid_targets_min": 13189 }, { "epoch": 0.4690831556503198, "grad_norm": 0.5185621603579966, "learning_rate": 3.6949152542372886e-05, "loss": 1.1703, "loss_nan_ranks": 0, "loss_rank_avg": 0.33316150307655334, "step": 110, "valid_targets_mean": 16089.3, "valid_targets_min": 13573 }, { "epoch": 0.47334754797441364, "grad_norm": 0.42559122357589, "learning_rate": 3.728813559322034e-05, "loss": 1.2036, "loss_nan_ranks": 0, "loss_rank_avg": 0.19938254356384277, "step": 111, "valid_targets_mean": 9455.9, "valid_targets_min": 1155 }, { "epoch": 0.47761194029850745, "grad_norm": 0.547538253832718, "learning_rate": 3.76271186440678e-05, "loss": 1.1543, "loss_nan_ranks": 0, "loss_rank_avg": 0.2797814905643463, "step": 112, "valid_targets_mean": 16189.5, "valid_targets_min": 14479 }, { "epoch": 0.48187633262260127, "grad_norm": 0.4953749309045982, "learning_rate": 3.796610169491526e-05, "loss": 1.1223, "loss_nan_ranks": 0, "loss_rank_avg": 0.3203335404396057, "step": 113, "valid_targets_mean": 16139.4, "valid_targets_min": 15023 }, { "epoch": 0.4861407249466951, "grad_norm": 0.5008062729973279, "learning_rate": 3.8305084745762714e-05, "loss": 1.1945, "loss_nan_ranks": 0, "loss_rank_avg": 0.20449399948120117, "step": 114, "valid_targets_mean": 10739.7, "valid_targets_min": 4961 }, { "epoch": 0.4904051172707889, "grad_norm": 0.5386560071865651, "learning_rate": 3.8644067796610175e-05, "loss": 1.1995, "loss_nan_ranks": 0, "loss_rank_avg": 0.3071936368942261, "step": 115, "valid_targets_mean": 16131.4, "valid_targets_min": 15295 }, { "epoch": 0.4946695095948827, "grad_norm": 0.40711995591176553, "learning_rate": 3.898305084745763e-05, "loss": 1.1794, "loss_nan_ranks": 0, "loss_rank_avg": 0.35818758606910706, "step": 116, "valid_targets_mean": 16016.1, "valid_targets_min": 14837 }, { "epoch": 0.4989339019189765, "grad_norm": 0.5473817794095149, "learning_rate": 3.932203389830509e-05, "loss": 1.1484, "loss_nan_ranks": 0, "loss_rank_avg": 0.22010652720928192, "step": 117, "valid_targets_mean": 12074.7, "valid_targets_min": 9259 }, { "epoch": 0.5031982942430704, "grad_norm": 0.5549393845209296, "learning_rate": 3.966101694915255e-05, "loss": 1.2017, "loss_nan_ranks": 0, "loss_rank_avg": 0.33431297540664673, "step": 118, "valid_targets_mean": 16067.9, "valid_targets_min": 13427 }, { "epoch": 0.5074626865671642, "grad_norm": 0.5146152133859702, "learning_rate": 4e-05, "loss": 1.1359, "loss_nan_ranks": 0, "loss_rank_avg": 0.32214197516441345, "step": 119, "valid_targets_mean": 15887.3, "valid_targets_min": 4483 }, { "epoch": 0.511727078891258, "grad_norm": 0.6228833876090004, "learning_rate": 3.999991166161585e-05, "loss": 1.1709, "loss_nan_ranks": 0, "loss_rank_avg": 0.2574143409729004, "step": 120, "valid_targets_mean": 15023.2, "valid_targets_min": 12822 }, { "epoch": 0.5159914712153518, "grad_norm": 0.6342331737079137, "learning_rate": 3.999964664724376e-05, "loss": 1.1309, "loss_nan_ranks": 0, "loss_rank_avg": 0.33971458673477173, "step": 121, "valid_targets_mean": 16139.8, "valid_targets_min": 15345 }, { "epoch": 0.5202558635394456, "grad_norm": 0.7094986485415746, "learning_rate": 3.999920495922483e-05, "loss": 1.1437, "loss_nan_ranks": 0, "loss_rank_avg": 0.20790129899978638, "step": 122, "valid_targets_mean": 10948.9, "valid_targets_min": 2964 }, { "epoch": 0.5245202558635395, "grad_norm": 0.7145033987132133, "learning_rate": 3.999858660146085e-05, "loss": 1.1595, "loss_nan_ranks": 0, "loss_rank_avg": 0.29542362689971924, "step": 123, "valid_targets_mean": 16067.6, "valid_targets_min": 13788 }, { "epoch": 0.5287846481876333, "grad_norm": 0.7457689773326728, "learning_rate": 3.999779157941431e-05, "loss": 1.1707, "loss_nan_ranks": 0, "loss_rank_avg": 0.3226638734340668, "step": 124, "valid_targets_mean": 16100.9, "valid_targets_min": 14446 }, { "epoch": 0.5330490405117271, "grad_norm": 0.5239696778473059, "learning_rate": 3.99968199001083e-05, "loss": 1.132, "loss_nan_ranks": 0, "loss_rank_avg": 0.17688265442848206, "step": 125, "valid_targets_mean": 8757.8, "valid_targets_min": 1946 }, { "epoch": 0.5373134328358209, "grad_norm": 0.6724127021853642, "learning_rate": 3.999567157212646e-05, "loss": 1.1538, "loss_nan_ranks": 0, "loss_rank_avg": 0.29729247093200684, "step": 126, "valid_targets_mean": 16084.3, "valid_targets_min": 15180 }, { "epoch": 0.5415778251599147, "grad_norm": 0.5970809000359247, "learning_rate": 3.9994346605612955e-05, "loss": 1.1575, "loss_nan_ranks": 0, "loss_rank_avg": 0.3342553675174713, "step": 127, "valid_targets_mean": 16168.2, "valid_targets_min": 15465 }, { "epoch": 0.5458422174840085, "grad_norm": 0.6500359122095334, "learning_rate": 3.999284501227232e-05, "loss": 1.1443, "loss_nan_ranks": 0, "loss_rank_avg": 0.22495630383491516, "step": 128, "valid_targets_mean": 11782.7, "valid_targets_min": 8043 }, { "epoch": 0.5501066098081023, "grad_norm": 0.5131778839895256, "learning_rate": 3.9991166805369393e-05, "loss": 1.1667, "loss_nan_ranks": 0, "loss_rank_avg": 0.31228113174438477, "step": 129, "valid_targets_mean": 16157.4, "valid_targets_min": 15459 }, { "epoch": 0.5543710021321961, "grad_norm": 0.6887330054802512, "learning_rate": 3.9989311999729166e-05, "loss": 1.1831, "loss_nan_ranks": 0, "loss_rank_avg": 0.33670181035995483, "step": 130, "valid_targets_mean": 16114.2, "valid_targets_min": 14385 }, { "epoch": 0.55863539445629, "grad_norm": 0.754673773153781, "learning_rate": 3.99872806117367e-05, "loss": 1.1204, "loss_nan_ranks": 0, "loss_rank_avg": 0.2688842713832855, "step": 131, "valid_targets_mean": 14860.6, "valid_targets_min": 13129 }, { "epoch": 0.5628997867803838, "grad_norm": 0.6456491151478851, "learning_rate": 3.998507265933696e-05, "loss": 1.1058, "loss_nan_ranks": 0, "loss_rank_avg": 0.2996610403060913, "step": 132, "valid_targets_mean": 15748.8, "valid_targets_min": 2605 }, { "epoch": 0.5671641791044776, "grad_norm": 0.7739595345647093, "learning_rate": 3.9982688162034624e-05, "loss": 1.1461, "loss_nan_ranks": 0, "loss_rank_avg": 0.2546170949935913, "step": 133, "valid_targets_mean": 13342.2, "valid_targets_min": 2588 }, { "epoch": 0.5714285714285714, "grad_norm": 0.9331641630918175, "learning_rate": 3.998012714089397e-05, "loss": 1.14, "loss_nan_ranks": 0, "loss_rank_avg": 0.28307855129241943, "step": 134, "valid_targets_mean": 15889.0, "valid_targets_min": 14972 }, { "epoch": 0.5756929637526652, "grad_norm": 0.9902818305571806, "learning_rate": 3.997738961853863e-05, "loss": 1.1315, "loss_nan_ranks": 0, "loss_rank_avg": 0.3365092873573303, "step": 135, "valid_targets_mean": 16079.2, "valid_targets_min": 14609 }, { "epoch": 0.579957356076759, "grad_norm": 0.8715174096943445, "learning_rate": 3.9974475619151445e-05, "loss": 1.1013, "loss_nan_ranks": 0, "loss_rank_avg": 0.1926274299621582, "step": 136, "valid_targets_mean": 11098.3, "valid_targets_min": 4124 }, { "epoch": 0.5842217484008528, "grad_norm": 0.5818454793871639, "learning_rate": 3.997138516847422e-05, "loss": 1.0952, "loss_nan_ranks": 0, "loss_rank_avg": 0.2703971266746521, "step": 137, "valid_targets_mean": 16150.4, "valid_targets_min": 15263 }, { "epoch": 0.5884861407249466, "grad_norm": 0.5206090871135683, "learning_rate": 3.9968118293807476e-05, "loss": 1.1584, "loss_nan_ranks": 0, "loss_rank_avg": 0.36197149753570557, "step": 138, "valid_targets_mean": 16076.4, "valid_targets_min": 15001 }, { "epoch": 0.5927505330490405, "grad_norm": 0.47851414710060025, "learning_rate": 3.996467502401028e-05, "loss": 1.156, "loss_nan_ranks": 0, "loss_rank_avg": 0.2182786762714386, "step": 139, "valid_targets_mean": 10867.7, "valid_targets_min": 7289 }, { "epoch": 0.5970149253731343, "grad_norm": 0.5229917474490419, "learning_rate": 3.9961055389499904e-05, "loss": 1.1422, "loss_nan_ranks": 0, "loss_rank_avg": 0.301999032497406, "step": 140, "valid_targets_mean": 16133.0, "valid_targets_min": 14726 }, { "epoch": 0.6012793176972282, "grad_norm": 0.4640175563151738, "learning_rate": 3.995725942225162e-05, "loss": 1.1762, "loss_nan_ranks": 0, "loss_rank_avg": 0.34188324213027954, "step": 141, "valid_targets_mean": 16148.1, "valid_targets_min": 15478 }, { "epoch": 0.605543710021322, "grad_norm": 0.653443767069592, "learning_rate": 3.995328715579839e-05, "loss": 1.1606, "loss_nan_ranks": 0, "loss_rank_avg": 0.27668648958206177, "step": 142, "valid_targets_mean": 13650.9, "valid_targets_min": 11524 }, { "epoch": 0.6098081023454158, "grad_norm": 0.4986487612919465, "learning_rate": 3.994913862523058e-05, "loss": 1.1816, "loss_nan_ranks": 0, "loss_rank_avg": 0.3264992833137512, "step": 143, "valid_targets_mean": 16144.9, "valid_targets_min": 14836 }, { "epoch": 0.6140724946695096, "grad_norm": 0.5588149612000367, "learning_rate": 3.9944813867195624e-05, "loss": 1.1544, "loss_nan_ranks": 0, "loss_rank_avg": 0.30848005414009094, "step": 144, "valid_targets_mean": 16204.7, "valid_targets_min": 15523 }, { "epoch": 0.6183368869936035, "grad_norm": 0.7453941380994512, "learning_rate": 3.9940312919897744e-05, "loss": 1.084, "loss_nan_ranks": 0, "loss_rank_avg": 0.25924232602119446, "step": 145, "valid_targets_mean": 15518.0, "valid_targets_min": 13968 }, { "epoch": 0.6226012793176973, "grad_norm": 0.5464420276850471, "learning_rate": 3.993563582309759e-05, "loss": 1.0965, "loss_nan_ranks": 0, "loss_rank_avg": 0.31063953042030334, "step": 146, "valid_targets_mean": 16188.8, "valid_targets_min": 15135 }, { "epoch": 0.6268656716417911, "grad_norm": 0.42469028732271724, "learning_rate": 3.993078261811186e-05, "loss": 1.1803, "loss_nan_ranks": 0, "loss_rank_avg": 0.23097334802150726, "step": 147, "valid_targets_mean": 10491.1, "valid_targets_min": 1680 }, { "epoch": 0.6311300639658849, "grad_norm": 0.5478065261122042, "learning_rate": 3.9925753347813e-05, "loss": 1.1282, "loss_nan_ranks": 0, "loss_rank_avg": 0.265234112739563, "step": 148, "valid_targets_mean": 15896.2, "valid_targets_min": 14353 }, { "epoch": 0.6353944562899787, "grad_norm": 0.5043516530535429, "learning_rate": 3.992054805662876e-05, "loss": 1.1885, "loss_nan_ranks": 0, "loss_rank_avg": 0.3632124662399292, "step": 149, "valid_targets_mean": 16139.4, "valid_targets_min": 15325 }, { "epoch": 0.6396588486140725, "grad_norm": 0.4865290796482085, "learning_rate": 3.991516679054185e-05, "loss": 1.1321, "loss_nan_ranks": 0, "loss_rank_avg": 0.15352267026901245, "step": 150, "valid_targets_mean": 7331.1, "valid_targets_min": 1086 }, { "epoch": 0.6439232409381663, "grad_norm": 0.4746388637360173, "learning_rate": 3.9909609597089496e-05, "loss": 1.0899, "loss_nan_ranks": 0, "loss_rank_avg": 0.2732847332954407, "step": 151, "valid_targets_mean": 16209.2, "valid_targets_min": 15437 }, { "epoch": 0.6481876332622601, "grad_norm": 0.5814090165743458, "learning_rate": 3.9903876525363055e-05, "loss": 1.2186, "loss_nan_ranks": 0, "loss_rank_avg": 0.37276649475097656, "step": 152, "valid_targets_mean": 15970.0, "valid_targets_min": 15153 }, { "epoch": 0.652452025586354, "grad_norm": 0.47405089117198984, "learning_rate": 3.989796762600755e-05, "loss": 1.1468, "loss_nan_ranks": 0, "loss_rank_avg": 0.23082441091537476, "step": 153, "valid_targets_mean": 12333.0, "valid_targets_min": 7440 }, { "epoch": 0.6567164179104478, "grad_norm": 0.5802677001801227, "learning_rate": 3.9891882951221246e-05, "loss": 1.1678, "loss_nan_ranks": 0, "loss_rank_avg": 0.297301709651947, "step": 154, "valid_targets_mean": 16176.9, "valid_targets_min": 15348 }, { "epoch": 0.6609808102345416, "grad_norm": 0.4830864833929257, "learning_rate": 3.988562255475518e-05, "loss": 1.1887, "loss_nan_ranks": 0, "loss_rank_avg": 0.3305373191833496, "step": 155, "valid_targets_mean": 16113.9, "valid_targets_min": 15057 }, { "epoch": 0.6652452025586354, "grad_norm": 0.5582433112020596, "learning_rate": 3.987918649191268e-05, "loss": 1.1626, "loss_nan_ranks": 0, "loss_rank_avg": 0.30254873633384705, "step": 156, "valid_targets_mean": 15849.1, "valid_targets_min": 14908 }, { "epoch": 0.6695095948827292, "grad_norm": 0.5375408464387431, "learning_rate": 3.987257481954888e-05, "loss": 1.0919, "loss_nan_ranks": 0, "loss_rank_avg": 0.3167189955711365, "step": 157, "valid_targets_mean": 16035.5, "valid_targets_min": 13635 }, { "epoch": 0.673773987206823, "grad_norm": 0.45790634920349066, "learning_rate": 3.9865787596070236e-05, "loss": 1.1224, "loss_nan_ranks": 0, "loss_rank_avg": 0.2649564743041992, "step": 158, "valid_targets_mean": 13319.5, "valid_targets_min": 1947 }, { "epoch": 0.6780383795309168, "grad_norm": 0.4764551363056651, "learning_rate": 3.9858824881433975e-05, "loss": 1.1808, "loss_nan_ranks": 0, "loss_rank_avg": 0.2935394048690796, "step": 159, "valid_targets_mean": 15898.2, "valid_targets_min": 14591 }, { "epoch": 0.6823027718550106, "grad_norm": 0.5022076446019287, "learning_rate": 3.9851686737147585e-05, "loss": 1.1168, "loss_nan_ranks": 0, "loss_rank_avg": 0.31322112679481506, "step": 160, "valid_targets_mean": 16092.8, "valid_targets_min": 14793 }, { "epoch": 0.6865671641791045, "grad_norm": 0.5018966263143605, "learning_rate": 3.9844373226268305e-05, "loss": 1.1379, "loss_nan_ranks": 0, "loss_rank_avg": 0.19624844193458557, "step": 161, "valid_targets_mean": 8096.2, "valid_targets_min": 1500 }, { "epoch": 0.6908315565031983, "grad_norm": 0.42890520031468626, "learning_rate": 3.983688441340249e-05, "loss": 1.1309, "loss_nan_ranks": 0, "loss_rank_avg": 0.2715575098991394, "step": 162, "valid_targets_mean": 16160.3, "valid_targets_min": 15572 }, { "epoch": 0.6950959488272921, "grad_norm": 0.6118186311739395, "learning_rate": 3.98292203647051e-05, "loss": 1.1715, "loss_nan_ranks": 0, "loss_rank_avg": 0.33360719680786133, "step": 163, "valid_targets_mean": 16126.5, "valid_targets_min": 15564 }, { "epoch": 0.6993603411513859, "grad_norm": 0.48975314855537266, "learning_rate": 3.982138114787912e-05, "loss": 1.1766, "loss_nan_ranks": 0, "loss_rank_avg": 0.18657957017421722, "step": 164, "valid_targets_mean": 10036.9, "valid_targets_min": 3346 }, { "epoch": 0.7036247334754797, "grad_norm": 0.4611278946702579, "learning_rate": 3.98133668321749e-05, "loss": 1.1189, "loss_nan_ranks": 0, "loss_rank_avg": 0.2684292197227478, "step": 165, "valid_targets_mean": 16222.7, "valid_targets_min": 15436 }, { "epoch": 0.7078891257995735, "grad_norm": 0.4698326366462607, "learning_rate": 3.980517748838963e-05, "loss": 1.093, "loss_nan_ranks": 0, "loss_rank_avg": 0.302453875541687, "step": 166, "valid_targets_mean": 16143.4, "valid_targets_min": 13886 }, { "epoch": 0.7121535181236673, "grad_norm": 0.6089019650141191, "learning_rate": 3.979681318886664e-05, "loss": 1.1503, "loss_nan_ranks": 0, "loss_rank_avg": 0.2620971202850342, "step": 167, "valid_targets_mean": 13617.7, "valid_targets_min": 11839 }, { "epoch": 0.7164179104477612, "grad_norm": 0.6121308914161944, "learning_rate": 3.978827400749481e-05, "loss": 1.1294, "loss_nan_ranks": 0, "loss_rank_avg": 0.3074718713760376, "step": 168, "valid_targets_mean": 16190.0, "valid_targets_min": 15712 }, { "epoch": 0.720682302771855, "grad_norm": 0.4181329572456291, "learning_rate": 3.977956001970788e-05, "loss": 1.0923, "loss_nan_ranks": 0, "loss_rank_avg": 0.316328227519989, "step": 169, "valid_targets_mean": 16177.5, "valid_targets_min": 15165 }, { "epoch": 0.7249466950959488, "grad_norm": 0.3820694759598411, "learning_rate": 3.977067130248381e-05, "loss": 1.1247, "loss_nan_ranks": 0, "loss_rank_avg": 0.2775130271911621, "step": 170, "valid_targets_mean": 16127.6, "valid_targets_min": 15280 }, { "epoch": 0.7292110874200426, "grad_norm": 0.42918885224199965, "learning_rate": 3.9761607934344095e-05, "loss": 1.1151, "loss_nan_ranks": 0, "loss_rank_avg": 0.3212129473686218, "step": 171, "valid_targets_mean": 16080.7, "valid_targets_min": 14124 }, { "epoch": 0.7334754797441365, "grad_norm": 0.38146809378376195, "learning_rate": 3.975236999535306e-05, "loss": 1.1169, "loss_nan_ranks": 0, "loss_rank_avg": 0.2378343939781189, "step": 172, "valid_targets_mean": 10701.9, "valid_targets_min": 1268 }, { "epoch": 0.7377398720682303, "grad_norm": 0.398396946713863, "learning_rate": 3.974295756711717e-05, "loss": 1.1167, "loss_nan_ranks": 0, "loss_rank_avg": 0.2819068729877472, "step": 173, "valid_targets_mean": 16045.4, "valid_targets_min": 15437 }, { "epoch": 0.7420042643923241, "grad_norm": 0.5961222558082274, "learning_rate": 3.9733370732784296e-05, "loss": 1.1651, "loss_nan_ranks": 0, "loss_rank_avg": 0.30488142371177673, "step": 174, "valid_targets_mean": 16151.0, "valid_targets_min": 14351 }, { "epoch": 0.746268656716418, "grad_norm": 0.5021411112013566, "learning_rate": 3.972360957704298e-05, "loss": 1.1145, "loss_nan_ranks": 0, "loss_rank_avg": 0.18337294459342957, "step": 175, "valid_targets_mean": 8556.6, "valid_targets_min": 1158 }, { "epoch": 0.7505330490405118, "grad_norm": 0.32592792574295393, "learning_rate": 3.97136741861217e-05, "loss": 1.1762, "loss_nan_ranks": 0, "loss_rank_avg": 0.2854708135128021, "step": 176, "valid_targets_mean": 16134.4, "valid_targets_min": 14897 }, { "epoch": 0.7547974413646056, "grad_norm": 0.4732969959201329, "learning_rate": 3.970356464778808e-05, "loss": 1.1243, "loss_nan_ranks": 0, "loss_rank_avg": 0.3042914867401123, "step": 177, "valid_targets_mean": 16085.6, "valid_targets_min": 12492 }, { "epoch": 0.7590618336886994, "grad_norm": 0.47942982862373595, "learning_rate": 3.969328105134817e-05, "loss": 1.1127, "loss_nan_ranks": 0, "loss_rank_avg": 0.22245652973651886, "step": 178, "valid_targets_mean": 11892.4, "valid_targets_min": 9743 }, { "epoch": 0.7633262260127932, "grad_norm": 0.357596810395852, "learning_rate": 3.9682823487645584e-05, "loss": 1.1982, "loss_nan_ranks": 0, "loss_rank_avg": 0.35377755761146545, "step": 179, "valid_targets_mean": 15843.5, "valid_targets_min": 13927 }, { "epoch": 0.767590618336887, "grad_norm": 0.536182510954731, "learning_rate": 3.9672192049060745e-05, "loss": 1.1299, "loss_nan_ranks": 0, "loss_rank_avg": 0.2949283719062805, "step": 180, "valid_targets_mean": 16161.1, "valid_targets_min": 14871 }, { "epoch": 0.7718550106609808, "grad_norm": 0.5883409953635337, "learning_rate": 3.966138682951008e-05, "loss": 1.1181, "loss_nan_ranks": 0, "loss_rank_avg": 0.2617324888706207, "step": 181, "valid_targets_mean": 15097.6, "valid_targets_min": 12384 }, { "epoch": 0.7761194029850746, "grad_norm": 0.44943437576431317, "learning_rate": 3.9650407924445147e-05, "loss": 1.1358, "loss_nan_ranks": 0, "loss_rank_avg": 0.302264928817749, "step": 182, "valid_targets_mean": 15968.6, "valid_targets_min": 9799 }, { "epoch": 0.7803837953091685, "grad_norm": 0.348496876382619, "learning_rate": 3.963925543085181e-05, "loss": 1.1741, "loss_nan_ranks": 0, "loss_rank_avg": 0.2787725031375885, "step": 183, "valid_targets_mean": 13224.8, "valid_targets_min": 2180 }, { "epoch": 0.7846481876332623, "grad_norm": 0.5040058663611126, "learning_rate": 3.96279294472494e-05, "loss": 1.1152, "loss_nan_ranks": 0, "loss_rank_avg": 0.2726561427116394, "step": 184, "valid_targets_mean": 16042.3, "valid_targets_min": 15121 }, { "epoch": 0.7889125799573561, "grad_norm": 0.4983532852453396, "learning_rate": 3.961643007368984e-05, "loss": 1.0954, "loss_nan_ranks": 0, "loss_rank_avg": 0.3302464783191681, "step": 185, "valid_targets_mean": 16088.2, "valid_targets_min": 15153 }, { "epoch": 0.7931769722814499, "grad_norm": 0.3970225467932824, "learning_rate": 3.960475741175671e-05, "loss": 1.1351, "loss_nan_ranks": 0, "loss_rank_avg": 0.18872615694999695, "step": 186, "valid_targets_mean": 10063.5, "valid_targets_min": 1284 }, { "epoch": 0.7974413646055437, "grad_norm": 0.3378836915461822, "learning_rate": 3.959291156456444e-05, "loss": 1.1136, "loss_nan_ranks": 0, "loss_rank_avg": 0.2803310751914978, "step": 187, "valid_targets_mean": 16124.9, "valid_targets_min": 14690 }, { "epoch": 0.8017057569296375, "grad_norm": 0.35346936929216877, "learning_rate": 3.9580892636757334e-05, "loss": 1.1666, "loss_nan_ranks": 0, "loss_rank_avg": 0.34958887100219727, "step": 188, "valid_targets_mean": 16013.7, "valid_targets_min": 13414 }, { "epoch": 0.8059701492537313, "grad_norm": 0.3533808674922251, "learning_rate": 3.9568700734508645e-05, "loss": 1.1105, "loss_nan_ranks": 0, "loss_rank_avg": 0.198248952627182, "step": 189, "valid_targets_mean": 9630.3, "valid_targets_min": 4230 }, { "epoch": 0.8102345415778252, "grad_norm": 0.3223232955392409, "learning_rate": 3.955633596551967e-05, "loss": 1.1622, "loss_nan_ranks": 0, "loss_rank_avg": 0.2920791506767273, "step": 190, "valid_targets_mean": 16130.3, "valid_targets_min": 15217 }, { "epoch": 0.814498933901919, "grad_norm": 0.37818416609817124, "learning_rate": 3.9543798439018776e-05, "loss": 1.1361, "loss_nan_ranks": 0, "loss_rank_avg": 0.33160802721977234, "step": 191, "valid_targets_mean": 16100.2, "valid_targets_min": 15121 }, { "epoch": 0.8187633262260128, "grad_norm": 0.36234404052990765, "learning_rate": 3.953108826576046e-05, "loss": 1.139, "loss_nan_ranks": 0, "loss_rank_avg": 0.2630240023136139, "step": 192, "valid_targets_mean": 13192.3, "valid_targets_min": 10124 }, { "epoch": 0.8230277185501066, "grad_norm": 0.3496189221525795, "learning_rate": 3.9518205558024334e-05, "loss": 1.1019, "loss_nan_ranks": 0, "loss_rank_avg": 0.3344437777996063, "step": 193, "valid_targets_mean": 16110.0, "valid_targets_min": 15222 }, { "epoch": 0.8272921108742004, "grad_norm": 0.3247000167494858, "learning_rate": 3.9505150429614154e-05, "loss": 1.0864, "loss_nan_ranks": 0, "loss_rank_avg": 0.32415539026260376, "step": 194, "valid_targets_mean": 16157.9, "valid_targets_min": 15195 }, { "epoch": 0.8315565031982942, "grad_norm": 0.3707009591283196, "learning_rate": 3.949192299585681e-05, "loss": 1.1231, "loss_nan_ranks": 0, "loss_rank_avg": 0.28162047266960144, "step": 195, "valid_targets_mean": 15813.3, "valid_targets_min": 14450 }, { "epoch": 0.835820895522388, "grad_norm": 0.3701248794721312, "learning_rate": 3.9478523373601325e-05, "loss": 1.1892, "loss_nan_ranks": 0, "loss_rank_avg": 0.34016382694244385, "step": 196, "valid_targets_mean": 15987.5, "valid_targets_min": 14241 }, { "epoch": 0.8400852878464818, "grad_norm": 0.41382661620814537, "learning_rate": 3.946495168121778e-05, "loss": 1.1448, "loss_nan_ranks": 0, "loss_rank_avg": 0.2231186181306839, "step": 197, "valid_targets_mean": 10847.8, "valid_targets_min": 793 }, { "epoch": 0.8443496801705757, "grad_norm": 0.3912544164406225, "learning_rate": 3.9451208038596325e-05, "loss": 1.1034, "loss_nan_ranks": 0, "loss_rank_avg": 0.2738224267959595, "step": 198, "valid_targets_mean": 15738.3, "valid_targets_min": 14685 }, { "epoch": 0.8486140724946695, "grad_norm": 0.37275760589482754, "learning_rate": 3.943729256714608e-05, "loss": 1.0951, "loss_nan_ranks": 0, "loss_rank_avg": 0.33501487970352173, "step": 199, "valid_targets_mean": 16183.1, "valid_targets_min": 15737 }, { "epoch": 0.8528784648187633, "grad_norm": 0.3523981647759341, "learning_rate": 3.942320538979408e-05, "loss": 1.1474, "loss_nan_ranks": 0, "loss_rank_avg": 0.1693504899740219, "step": 200, "valid_targets_mean": 7677.2, "valid_targets_min": 2065 }, { "epoch": 0.8571428571428571, "grad_norm": 0.38769471517671245, "learning_rate": 3.9408946630984144e-05, "loss": 1.1976, "loss_nan_ranks": 0, "loss_rank_avg": 0.3229611814022064, "step": 201, "valid_targets_mean": 16004.1, "valid_targets_min": 12492 }, { "epoch": 0.8614072494669509, "grad_norm": 0.4029174334792178, "learning_rate": 3.939451641667587e-05, "loss": 1.1066, "loss_nan_ranks": 0, "loss_rank_avg": 0.3232455253601074, "step": 202, "valid_targets_mean": 16134.0, "valid_targets_min": 14956 }, { "epoch": 0.8656716417910447, "grad_norm": 0.3945056161774726, "learning_rate": 3.937991487434342e-05, "loss": 1.0754, "loss_nan_ranks": 0, "loss_rank_avg": 0.19846779108047485, "step": 203, "valid_targets_mean": 11952.2, "valid_targets_min": 9228 }, { "epoch": 0.8699360341151386, "grad_norm": 0.3911566718594917, "learning_rate": 3.9365142132974484e-05, "loss": 1.1028, "loss_nan_ranks": 0, "loss_rank_avg": 0.27967995405197144, "step": 204, "valid_targets_mean": 16192.1, "valid_targets_min": 15300 }, { "epoch": 0.8742004264392325, "grad_norm": 0.3960299479310709, "learning_rate": 3.935019832306905e-05, "loss": 1.198, "loss_nan_ranks": 0, "loss_rank_avg": 0.3388521373271942, "step": 205, "valid_targets_mean": 16104.9, "valid_targets_min": 15016 }, { "epoch": 0.8784648187633263, "grad_norm": 0.379226669898679, "learning_rate": 3.933508357663832e-05, "loss": 1.1316, "loss_nan_ranks": 0, "loss_rank_avg": 0.2571180462837219, "step": 206, "valid_targets_mean": 14878.7, "valid_targets_min": 13210 }, { "epoch": 0.8827292110874201, "grad_norm": 0.309941973007609, "learning_rate": 3.9319798027203544e-05, "loss": 1.0723, "loss_nan_ranks": 0, "loss_rank_avg": 0.3000110983848572, "step": 207, "valid_targets_mean": 16179.5, "valid_targets_min": 15250 }, { "epoch": 0.8869936034115139, "grad_norm": 0.3590551775559692, "learning_rate": 3.930434180979478e-05, "loss": 1.1104, "loss_nan_ranks": 0, "loss_rank_avg": 0.27522504329681396, "step": 208, "valid_targets_mean": 13244.8, "valid_targets_min": 979 }, { "epoch": 0.8912579957356077, "grad_norm": 0.3794972767149023, "learning_rate": 3.928871506094975e-05, "loss": 1.0999, "loss_nan_ranks": 0, "loss_rank_avg": 0.27033573389053345, "step": 209, "valid_targets_mean": 15530.1, "valid_targets_min": 14077 }, { "epoch": 0.8955223880597015, "grad_norm": 0.3468110890945256, "learning_rate": 3.927291791871264e-05, "loss": 1.1048, "loss_nan_ranks": 0, "loss_rank_avg": 0.3237696886062622, "step": 210, "valid_targets_mean": 16145.0, "valid_targets_min": 15408 }, { "epoch": 0.8997867803837953, "grad_norm": 0.28612789274214856, "learning_rate": 3.925695052263284e-05, "loss": 1.1222, "loss_nan_ranks": 0, "loss_rank_avg": 0.19704505801200867, "step": 211, "valid_targets_mean": 9302.1, "valid_targets_min": 2002 }, { "epoch": 0.9040511727078892, "grad_norm": 0.37829699375162723, "learning_rate": 3.924081301376375e-05, "loss": 1.1534, "loss_nan_ranks": 0, "loss_rank_avg": 0.2830193042755127, "step": 212, "valid_targets_mean": 16123.4, "valid_targets_min": 15464 }, { "epoch": 0.908315565031983, "grad_norm": 0.41084813490365696, "learning_rate": 3.9224505534661525e-05, "loss": 1.1657, "loss_nan_ranks": 0, "loss_rank_avg": 0.3296535611152649, "step": 213, "valid_targets_mean": 16164.3, "valid_targets_min": 15414 }, { "epoch": 0.9125799573560768, "grad_norm": 0.3448857418337144, "learning_rate": 3.92080282293838e-05, "loss": 1.1359, "loss_nan_ranks": 0, "loss_rank_avg": 0.21162542700767517, "step": 214, "valid_targets_mean": 11598.8, "valid_targets_min": 6923 }, { "epoch": 0.9168443496801706, "grad_norm": 0.4216988848704001, "learning_rate": 3.9191381243488417e-05, "loss": 1.119, "loss_nan_ranks": 0, "loss_rank_avg": 0.2782018184661865, "step": 215, "valid_targets_mean": 16140.2, "valid_targets_min": 15054 }, { "epoch": 0.9211087420042644, "grad_norm": 0.4520192538398874, "learning_rate": 3.9174564724032167e-05, "loss": 1.1101, "loss_nan_ranks": 0, "loss_rank_avg": 0.3245173990726471, "step": 216, "valid_targets_mean": 16168.6, "valid_targets_min": 15492 }, { "epoch": 0.9253731343283582, "grad_norm": 0.5445990650271554, "learning_rate": 3.9157578819569455e-05, "loss": 1.1074, "loss_nan_ranks": 0, "loss_rank_avg": 0.23481634259223938, "step": 217, "valid_targets_mean": 13440.2, "valid_targets_min": 11543 }, { "epoch": 0.929637526652452, "grad_norm": 0.5450244324043093, "learning_rate": 3.9140423680151036e-05, "loss": 1.1147, "loss_nan_ranks": 0, "loss_rank_avg": 0.30909502506256104, "step": 218, "valid_targets_mean": 16076.0, "valid_targets_min": 14699 }, { "epoch": 0.9339019189765458, "grad_norm": 0.3585828701583468, "learning_rate": 3.9123099457322625e-05, "loss": 1.1154, "loss_nan_ranks": 0, "loss_rank_avg": 0.3166894316673279, "step": 219, "valid_targets_mean": 16097.1, "valid_targets_min": 14737 }, { "epoch": 0.9381663113006397, "grad_norm": 0.3698144959370942, "learning_rate": 3.9105606304123605e-05, "loss": 1.1456, "loss_nan_ranks": 0, "loss_rank_avg": 0.2708337604999542, "step": 220, "valid_targets_mean": 14339.8, "valid_targets_min": 12604 }, { "epoch": 0.9424307036247335, "grad_norm": 0.43891439561975154, "learning_rate": 3.908794437508567e-05, "loss": 1.1189, "loss_nan_ranks": 0, "loss_rank_avg": 0.3262331485748291, "step": 221, "valid_targets_mean": 16064.1, "valid_targets_min": 14428 }, { "epoch": 0.9466950959488273, "grad_norm": 0.396764810157014, "learning_rate": 3.907011382623145e-05, "loss": 1.1524, "loss_nan_ranks": 0, "loss_rank_avg": 0.23768097162246704, "step": 222, "valid_targets_mean": 10776.3, "valid_targets_min": 1379 }, { "epoch": 0.9509594882729211, "grad_norm": 0.3808667174396742, "learning_rate": 3.905211481507313e-05, "loss": 1.0704, "loss_nan_ranks": 0, "loss_rank_avg": 0.2573968470096588, "step": 223, "valid_targets_mean": 16155.4, "valid_targets_min": 14394 }, { "epoch": 0.9552238805970149, "grad_norm": 0.34271746822127364, "learning_rate": 3.903394750061106e-05, "loss": 1.0411, "loss_nan_ranks": 0, "loss_rank_avg": 0.2858397662639618, "step": 224, "valid_targets_mean": 16217.8, "valid_targets_min": 15574 }, { "epoch": 0.9594882729211087, "grad_norm": 0.4090699476429991, "learning_rate": 3.9015612043332375e-05, "loss": 1.1108, "loss_nan_ranks": 0, "loss_rank_avg": 0.15227608382701874, "step": 225, "valid_targets_mean": 7463.5, "valid_targets_min": 1267 }, { "epoch": 0.9637526652452025, "grad_norm": 0.4330402554544449, "learning_rate": 3.8997108605209535e-05, "loss": 1.1013, "loss_nan_ranks": 0, "loss_rank_avg": 0.26998600363731384, "step": 226, "valid_targets_mean": 16178.3, "valid_targets_min": 15368 }, { "epoch": 0.9680170575692963, "grad_norm": 0.3674055145879997, "learning_rate": 3.897843734969891e-05, "loss": 1.0907, "loss_nan_ranks": 0, "loss_rank_avg": 0.3121291697025299, "step": 227, "valid_targets_mean": 16218.0, "valid_targets_min": 15492 }, { "epoch": 0.9722814498933902, "grad_norm": 0.3443785580263128, "learning_rate": 3.895959844173937e-05, "loss": 1.1083, "loss_nan_ranks": 0, "loss_rank_avg": 0.20776158571243286, "step": 228, "valid_targets_mean": 11823.1, "valid_targets_min": 9219 }, { "epoch": 0.976545842217484, "grad_norm": 0.5250278239914289, "learning_rate": 3.8940592047750774e-05, "loss": 1.1067, "loss_nan_ranks": 0, "loss_rank_avg": 0.2968442142009735, "step": 229, "valid_targets_mean": 16117.2, "valid_targets_min": 14958 }, { "epoch": 0.9808102345415778, "grad_norm": 0.47342613018347207, "learning_rate": 3.892141833563255e-05, "loss": 1.1474, "loss_nan_ranks": 0, "loss_rank_avg": 0.3667376935482025, "step": 230, "valid_targets_mean": 16062.8, "valid_targets_min": 15242 }, { "epoch": 0.9850746268656716, "grad_norm": 0.4334492194409921, "learning_rate": 3.8902077474762155e-05, "loss": 1.0568, "loss_nan_ranks": 0, "loss_rank_avg": 0.22673600912094116, "step": 231, "valid_targets_mean": 13741.2, "valid_targets_min": 11500 }, { "epoch": 0.9893390191897654, "grad_norm": 0.38506194972597113, "learning_rate": 3.888256963599364e-05, "loss": 1.1959, "loss_nan_ranks": 0, "loss_rank_avg": 0.3469485938549042, "step": 232, "valid_targets_mean": 16078.0, "valid_targets_min": 14904 }, { "epoch": 0.9936034115138592, "grad_norm": 0.45946627720688377, "learning_rate": 3.886289499165609e-05, "loss": 1.1409, "loss_nan_ranks": 0, "loss_rank_avg": 0.27444905042648315, "step": 233, "valid_targets_mean": 13027.3, "valid_targets_min": 1521 }, { "epoch": 0.997867803837953, "grad_norm": 0.37072479002064795, "learning_rate": 3.884305371555215e-05, "loss": 1.1578, "loss_nan_ranks": 0, "loss_rank_avg": 0.30341586470603943, "step": 234, "valid_targets_mean": 15647.9, "valid_targets_min": 14103 }, { "epoch": 1.0, "grad_norm": 0.3713655362758878, "learning_rate": 3.882304598295643e-05, "loss": 1.164, "loss_nan_ranks": 0, "loss_rank_avg": 0.5115901827812195, "step": 235, "valid_targets_mean": 9944.1, "valid_targets_min": 578 }, { "epoch": 1.004264392324094, "grad_norm": 0.492828062086341, "learning_rate": 3.880287197061402e-05, "loss": 1.1026, "loss_nan_ranks": 0, "loss_rank_avg": 0.28225335478782654, "step": 236, "valid_targets_mean": 16134.4, "valid_targets_min": 15417 }, { "epoch": 1.0085287846481876, "grad_norm": 0.48528813108169805, "learning_rate": 3.878253185673888e-05, "loss": 1.1163, "loss_nan_ranks": 0, "loss_rank_avg": 0.34507322311401367, "step": 237, "valid_targets_mean": 16085.3, "valid_targets_min": 15115 }, { "epoch": 1.0127931769722816, "grad_norm": 0.4657002193996111, "learning_rate": 3.876202582101229e-05, "loss": 1.119, "loss_nan_ranks": 0, "loss_rank_avg": 0.22333009541034698, "step": 238, "valid_targets_mean": 11956.3, "valid_targets_min": 8620 }, { "epoch": 1.0170575692963753, "grad_norm": 0.5797505215217232, "learning_rate": 3.874135404458125e-05, "loss": 1.1085, "loss_nan_ranks": 0, "loss_rank_avg": 0.30123043060302734, "step": 239, "valid_targets_mean": 16189.2, "valid_targets_min": 15410 }, { "epoch": 1.0213219616204692, "grad_norm": 0.5565920299930178, "learning_rate": 3.8720516710056905e-05, "loss": 1.115, "loss_nan_ranks": 0, "loss_rank_avg": 0.3295617699623108, "step": 240, "valid_targets_mean": 16079.0, "valid_targets_min": 14919 }, { "epoch": 1.0255863539445629, "grad_norm": 0.46016269563519424, "learning_rate": 3.8699514001512885e-05, "loss": 1.1288, "loss_nan_ranks": 0, "loss_rank_avg": 0.2568991780281067, "step": 241, "valid_targets_mean": 14073.2, "valid_targets_min": 12010 }, { "epoch": 1.0298507462686568, "grad_norm": 0.45864038975323523, "learning_rate": 3.867834610448374e-05, "loss": 1.0814, "loss_nan_ranks": 0, "loss_rank_avg": 0.31548625230789185, "step": 242, "valid_targets_mean": 16126.4, "valid_targets_min": 15263 }, { "epoch": 1.0341151385927505, "grad_norm": 0.40278729122913604, "learning_rate": 3.865701320596324e-05, "loss": 1.117, "loss_nan_ranks": 0, "loss_rank_avg": 0.24541878700256348, "step": 243, "valid_targets_mean": 13054.0, "valid_targets_min": 1882 }, { "epoch": 1.0383795309168444, "grad_norm": 0.4100179953102017, "learning_rate": 3.863551549440277e-05, "loss": 1.1184, "loss_nan_ranks": 0, "loss_rank_avg": 0.27249300479888916, "step": 244, "valid_targets_mean": 15801.2, "valid_targets_min": 14436 }, { "epoch": 1.0426439232409381, "grad_norm": 0.5075800018498047, "learning_rate": 3.861385315970964e-05, "loss": 1.1045, "loss_nan_ranks": 0, "loss_rank_avg": 0.2811691164970398, "step": 245, "valid_targets_mean": 16140.1, "valid_targets_min": 14444 }, { "epoch": 1.046908315565032, "grad_norm": 0.421480437018899, "learning_rate": 3.859202639324542e-05, "loss": 1.0968, "loss_nan_ranks": 0, "loss_rank_avg": 0.19223734736442566, "step": 246, "valid_targets_mean": 10079.0, "valid_targets_min": 1025 }, { "epoch": 1.0511727078891258, "grad_norm": 0.42648584594833727, "learning_rate": 3.8570035387824214e-05, "loss": 1.101, "loss_nan_ranks": 0, "loss_rank_avg": 0.2835865020751953, "step": 247, "valid_targets_mean": 16107.3, "valid_targets_min": 15290 }, { "epoch": 1.0554371002132197, "grad_norm": 0.44244263245684756, "learning_rate": 3.8547880337711036e-05, "loss": 1.1155, "loss_nan_ranks": 0, "loss_rank_avg": 0.32503050565719604, "step": 248, "valid_targets_mean": 16154.4, "valid_targets_min": 15031 }, { "epoch": 1.0597014925373134, "grad_norm": 0.5157379647358489, "learning_rate": 3.8525561438620016e-05, "loss": 1.0586, "loss_nan_ranks": 0, "loss_rank_avg": 0.18939271569252014, "step": 249, "valid_targets_mean": 10379.2, "valid_targets_min": 6997 }, { "epoch": 1.0639658848614073, "grad_norm": 0.4449900776791044, "learning_rate": 3.850307888771269e-05, "loss": 1.073, "loss_nan_ranks": 0, "loss_rank_avg": 0.2888108193874359, "step": 250, "valid_targets_mean": 16118.5, "valid_targets_min": 14698 }, { "epoch": 1.068230277185501, "grad_norm": 0.48149873655188175, "learning_rate": 3.848043288359629e-05, "loss": 1.1492, "loss_nan_ranks": 0, "loss_rank_avg": 0.35437071323394775, "step": 251, "valid_targets_mean": 16145.3, "valid_targets_min": 15417 }, { "epoch": 1.072494669509595, "grad_norm": 0.4859386612268441, "learning_rate": 3.8457623626321944e-05, "loss": 1.1038, "loss_nan_ranks": 0, "loss_rank_avg": 0.2482079416513443, "step": 252, "valid_targets_mean": 13666.4, "valid_targets_min": 11928 }, { "epoch": 1.0767590618336886, "grad_norm": 0.3906169267825302, "learning_rate": 3.843465131738296e-05, "loss": 1.0505, "loss_nan_ranks": 0, "loss_rank_avg": 0.29448628425598145, "step": 253, "valid_targets_mean": 16168.5, "valid_targets_min": 15367 }, { "epoch": 1.0810234541577826, "grad_norm": 0.46947961764436325, "learning_rate": 3.8411516159713e-05, "loss": 1.1048, "loss_nan_ranks": 0, "loss_rank_avg": 0.33546367287635803, "step": 254, "valid_targets_mean": 16058.3, "valid_targets_min": 15122 }, { "epoch": 1.0852878464818763, "grad_norm": 0.46691663929706273, "learning_rate": 3.838821835768431e-05, "loss": 1.0998, "loss_nan_ranks": 0, "loss_rank_avg": 0.2541680634021759, "step": 255, "valid_targets_mean": 14634.8, "valid_targets_min": 12318 }, { "epoch": 1.0895522388059702, "grad_norm": 0.3703812856992591, "learning_rate": 3.83647581171059e-05, "loss": 1.0719, "loss_nan_ranks": 0, "loss_rank_avg": 0.2811293601989746, "step": 256, "valid_targets_mean": 16229.5, "valid_targets_min": 15678 }, { "epoch": 1.0938166311300639, "grad_norm": 0.3996476088742633, "learning_rate": 3.8341135645221744e-05, "loss": 1.1548, "loss_nan_ranks": 0, "loss_rank_avg": 0.2120198756456375, "step": 257, "valid_targets_mean": 10198.9, "valid_targets_min": 1521 }, { "epoch": 1.0980810234541578, "grad_norm": 0.4111239192875592, "learning_rate": 3.831735115070895e-05, "loss": 1.1119, "loss_nan_ranks": 0, "loss_rank_avg": 0.2730482220649719, "step": 258, "valid_targets_mean": 15648.3, "valid_targets_min": 14587 }, { "epoch": 1.1023454157782515, "grad_norm": 0.40793417859239417, "learning_rate": 3.8293404843675904e-05, "loss": 1.0701, "loss_nan_ranks": 0, "loss_rank_avg": 0.3305908441543579, "step": 259, "valid_targets_mean": 16135.6, "valid_targets_min": 15231 }, { "epoch": 1.1066098081023454, "grad_norm": 0.4148453446560916, "learning_rate": 3.8269296935660395e-05, "loss": 1.1264, "loss_nan_ranks": 0, "loss_rank_avg": 0.15724597871303558, "step": 260, "valid_targets_mean": 7092.5, "valid_targets_min": 808 }, { "epoch": 1.1108742004264391, "grad_norm": 0.3969229604496845, "learning_rate": 3.82450276396278e-05, "loss": 1.0551, "loss_nan_ranks": 0, "loss_rank_avg": 0.26030534505844116, "step": 261, "valid_targets_mean": 16152.0, "valid_targets_min": 14548 }, { "epoch": 1.115138592750533, "grad_norm": 0.42210203028372206, "learning_rate": 3.822059716996916e-05, "loss": 1.0822, "loss_nan_ranks": 0, "loss_rank_avg": 0.29231420159339905, "step": 262, "valid_targets_mean": 16084.3, "valid_targets_min": 11563 }, { "epoch": 1.1194029850746268, "grad_norm": 0.4689989288485153, "learning_rate": 3.819600574249929e-05, "loss": 1.0943, "loss_nan_ranks": 0, "loss_rank_avg": 0.22371648252010345, "step": 263, "valid_targets_mean": 12894.8, "valid_targets_min": 10816 }, { "epoch": 1.1236673773987207, "grad_norm": 0.4556738705049439, "learning_rate": 3.817125357445489e-05, "loss": 1.1106, "loss_nan_ranks": 0, "loss_rank_avg": 0.2985258102416992, "step": 264, "valid_targets_mean": 16128.0, "valid_targets_min": 15288 }, { "epoch": 1.1279317697228146, "grad_norm": 0.3800765405485939, "learning_rate": 3.814634088449261e-05, "loss": 1.0971, "loss_nan_ranks": 0, "loss_rank_avg": 0.30357831716537476, "step": 265, "valid_targets_mean": 16191.3, "valid_targets_min": 15360 }, { "epoch": 1.1321961620469083, "grad_norm": 0.4833962669327678, "learning_rate": 3.812126789268712e-05, "loss": 1.0661, "loss_nan_ranks": 0, "loss_rank_avg": 0.2506658434867859, "step": 266, "valid_targets_mean": 13714.1, "valid_targets_min": 10885 }, { "epoch": 1.136460554371002, "grad_norm": 0.518902812754926, "learning_rate": 3.80960348205292e-05, "loss": 1.0766, "loss_nan_ranks": 0, "loss_rank_avg": 0.30003392696380615, "step": 267, "valid_targets_mean": 16230.6, "valid_targets_min": 14726 }, { "epoch": 1.140724946695096, "grad_norm": 0.462341573969094, "learning_rate": 3.807064189092372e-05, "loss": 1.115, "loss_nan_ranks": 0, "loss_rank_avg": 0.258874773979187, "step": 268, "valid_targets_mean": 12928.8, "valid_targets_min": 578 }, { "epoch": 1.1449893390191899, "grad_norm": 0.35268494216191165, "learning_rate": 3.804508932818771e-05, "loss": 1.0729, "loss_nan_ranks": 0, "loss_rank_avg": 0.2675431966781616, "step": 269, "valid_targets_mean": 15937.6, "valid_targets_min": 14274 }, { "epoch": 1.1492537313432836, "grad_norm": 0.5517836141192989, "learning_rate": 3.801937735804838e-05, "loss": 1.0772, "loss_nan_ranks": 0, "loss_rank_avg": 0.31933826208114624, "step": 270, "valid_targets_mean": 16088.9, "valid_targets_min": 14394 }, { "epoch": 1.1535181236673775, "grad_norm": 0.5323326988029511, "learning_rate": 3.799350620764114e-05, "loss": 1.1669, "loss_nan_ranks": 0, "loss_rank_avg": 0.2066635638475418, "step": 271, "valid_targets_mean": 9558.3, "valid_targets_min": 1284 }, { "epoch": 1.1577825159914712, "grad_norm": 0.45852592023556543, "learning_rate": 3.7967476105507535e-05, "loss": 1.0728, "loss_nan_ranks": 0, "loss_rank_avg": 0.2466944456100464, "step": 272, "valid_targets_mean": 16074.0, "valid_targets_min": 15120 }, { "epoch": 1.1620469083155651, "grad_norm": 0.52730269806394, "learning_rate": 3.7941287281593284e-05, "loss": 1.1183, "loss_nan_ranks": 0, "loss_rank_avg": 0.3480404019355774, "step": 273, "valid_targets_mean": 16051.9, "valid_targets_min": 14958 }, { "epoch": 1.1663113006396588, "grad_norm": 0.5317950143572628, "learning_rate": 3.7914939967246227e-05, "loss": 1.1104, "loss_nan_ranks": 0, "loss_rank_avg": 0.19135290384292603, "step": 274, "valid_targets_mean": 10320.2, "valid_targets_min": 4592 }, { "epoch": 1.1705756929637527, "grad_norm": 0.47104182647424275, "learning_rate": 3.7888434395214285e-05, "loss": 1.0645, "loss_nan_ranks": 0, "loss_rank_avg": 0.2776111364364624, "step": 275, "valid_targets_mean": 16176.9, "valid_targets_min": 15525 }, { "epoch": 1.1748400852878464, "grad_norm": 0.5015585288642224, "learning_rate": 3.786177079964339e-05, "loss": 1.1372, "loss_nan_ranks": 0, "loss_rank_avg": 0.34761297702789307, "step": 276, "valid_targets_mean": 15977.2, "valid_targets_min": 12151 }, { "epoch": 1.1791044776119404, "grad_norm": 0.46156337605426656, "learning_rate": 3.783494941607544e-05, "loss": 1.0778, "loss_nan_ranks": 0, "loss_rank_avg": 0.24728554487228394, "step": 277, "valid_targets_mean": 14817.6, "valid_targets_min": 12394 }, { "epoch": 1.183368869936034, "grad_norm": 0.5663761071799178, "learning_rate": 3.780797048144621e-05, "loss": 1.0673, "loss_nan_ranks": 0, "loss_rank_avg": 0.29986995458602905, "step": 278, "valid_targets_mean": 16170.4, "valid_targets_min": 15476 }, { "epoch": 1.187633262260128, "grad_norm": 0.4937926180202986, "learning_rate": 3.7780834234083236e-05, "loss": 1.0691, "loss_nan_ranks": 0, "loss_rank_avg": 0.29886218905448914, "step": 279, "valid_targets_mean": 16205.1, "valid_targets_min": 15621 }, { "epoch": 1.1918976545842217, "grad_norm": 0.5114978702997742, "learning_rate": 3.775354091370376e-05, "loss": 1.129, "loss_nan_ranks": 0, "loss_rank_avg": 0.26027584075927734, "step": 280, "valid_targets_mean": 15438.3, "valid_targets_min": 13444 }, { "epoch": 1.1961620469083156, "grad_norm": 0.44901505238938466, "learning_rate": 3.772609076141255e-05, "loss": 1.0729, "loss_nan_ranks": 0, "loss_rank_avg": 0.3146480619907379, "step": 281, "valid_targets_mean": 16119.0, "valid_targets_min": 15507 }, { "epoch": 1.2004264392324093, "grad_norm": 0.4209579614378078, "learning_rate": 3.769848401969982e-05, "loss": 1.1076, "loss_nan_ranks": 0, "loss_rank_avg": 0.21626295149326324, "step": 282, "valid_targets_mean": 10172.0, "valid_targets_min": 1340 }, { "epoch": 1.2046908315565032, "grad_norm": 0.3888087959337898, "learning_rate": 3.767072093243907e-05, "loss": 1.1623, "loss_nan_ranks": 0, "loss_rank_avg": 0.2947539985179901, "step": 283, "valid_targets_mean": 15828.4, "valid_targets_min": 14460 }, { "epoch": 1.208955223880597, "grad_norm": 0.34764295291226055, "learning_rate": 3.7642801744884915e-05, "loss": 1.0957, "loss_nan_ranks": 0, "loss_rank_avg": 0.29402148723602295, "step": 284, "valid_targets_mean": 16200.7, "valid_targets_min": 15297 }, { "epoch": 1.2132196162046909, "grad_norm": 0.292454378743343, "learning_rate": 3.761472670367096e-05, "loss": 1.0746, "loss_nan_ranks": 0, "loss_rank_avg": 0.17497391998767853, "step": 285, "valid_targets_mean": 9475.9, "valid_targets_min": 1947 }, { "epoch": 1.2174840085287846, "grad_norm": 0.428465132297418, "learning_rate": 3.758649605680758e-05, "loss": 1.1034, "loss_nan_ranks": 0, "loss_rank_avg": 0.28571125864982605, "step": 286, "valid_targets_mean": 16135.3, "valid_targets_min": 15278 }, { "epoch": 1.2217484008528785, "grad_norm": 0.35353654724450573, "learning_rate": 3.755811005367974e-05, "loss": 1.1299, "loss_nan_ranks": 0, "loss_rank_avg": 0.34899359941482544, "step": 287, "valid_targets_mean": 15927.2, "valid_targets_min": 13538 }, { "epoch": 1.2260127931769722, "grad_norm": 0.32107825889625696, "learning_rate": 3.752956894504481e-05, "loss": 1.0786, "loss_nan_ranks": 0, "loss_rank_avg": 0.21786460280418396, "step": 288, "valid_targets_mean": 12555.1, "valid_targets_min": 10326 }, { "epoch": 1.2302771855010661, "grad_norm": 0.4011903267761661, "learning_rate": 3.750087298303033e-05, "loss": 1.086, "loss_nan_ranks": 0, "loss_rank_avg": 0.26555633544921875, "step": 289, "valid_targets_mean": 16137.8, "valid_targets_min": 12492 }, { "epoch": 1.2345415778251598, "grad_norm": 0.4140800310411746, "learning_rate": 3.7472022421131795e-05, "loss": 1.09, "loss_nan_ranks": 0, "loss_rank_avg": 0.3115846812725067, "step": 290, "valid_targets_mean": 16206.4, "valid_targets_min": 15481 }, { "epoch": 1.2388059701492538, "grad_norm": 0.3342400344520096, "learning_rate": 3.7443017514210406e-05, "loss": 1.1209, "loss_nan_ranks": 0, "loss_rank_avg": 0.25025108456611633, "step": 291, "valid_targets_mean": 14772.3, "valid_targets_min": 12576 }, { "epoch": 1.2430703624733475, "grad_norm": 0.4193850159643592, "learning_rate": 3.7413858518490825e-05, "loss": 1.0596, "loss_nan_ranks": 0, "loss_rank_avg": 0.30145931243896484, "step": 292, "valid_targets_mean": 16124.6, "valid_targets_min": 14727 }, { "epoch": 1.2473347547974414, "grad_norm": 0.3428033141851263, "learning_rate": 3.7384545691558895e-05, "loss": 1.1054, "loss_nan_ranks": 0, "loss_rank_avg": 0.2986433506011963, "step": 293, "valid_targets_mean": 12797.4, "valid_targets_min": 1628 }, { "epoch": 1.251599147121535, "grad_norm": 0.46779767077850404, "learning_rate": 3.735507929235941e-05, "loss": 1.0796, "loss_nan_ranks": 0, "loss_rank_avg": 0.28899234533309937, "step": 294, "valid_targets_mean": 15906.0, "valid_targets_min": 14468 }, { "epoch": 1.255863539445629, "grad_norm": 0.3279641154358886, "learning_rate": 3.732545958119378e-05, "loss": 1.0802, "loss_nan_ranks": 0, "loss_rank_avg": 0.3267977833747864, "step": 295, "valid_targets_mean": 16134.5, "valid_targets_min": 15264 }, { "epoch": 1.260127931769723, "grad_norm": 0.32806455507915105, "learning_rate": 3.729568681971774e-05, "loss": 1.0908, "loss_nan_ranks": 0, "loss_rank_avg": 0.19333700835704803, "step": 296, "valid_targets_mean": 9574.0, "valid_targets_min": 2245 }, { "epoch": 1.2643923240938166, "grad_norm": 0.32374524860685283, "learning_rate": 3.726576127093905e-05, "loss": 1.0493, "loss_nan_ranks": 0, "loss_rank_avg": 0.2695855498313904, "step": 297, "valid_targets_mean": 16036.6, "valid_targets_min": 13771 }, { "epoch": 1.2686567164179103, "grad_norm": 0.33439627193487537, "learning_rate": 3.7235683199215177e-05, "loss": 1.0988, "loss_nan_ranks": 0, "loss_rank_avg": 0.3584269881248474, "step": 298, "valid_targets_mean": 16034.9, "valid_targets_min": 13226 }, { "epoch": 1.2729211087420043, "grad_norm": 0.3364668190663482, "learning_rate": 3.7205452870250944e-05, "loss": 1.0891, "loss_nan_ranks": 0, "loss_rank_avg": 0.20322629809379578, "step": 299, "valid_targets_mean": 11007.0, "valid_targets_min": 5744 }, { "epoch": 1.2771855010660982, "grad_norm": 0.3283276606591826, "learning_rate": 3.7175070551096204e-05, "loss": 1.0611, "loss_nan_ranks": 0, "loss_rank_avg": 0.2728656530380249, "step": 300, "valid_targets_mean": 16107.3, "valid_targets_min": 14275 }, { "epoch": 1.2814498933901919, "grad_norm": 0.3410129571670106, "learning_rate": 3.7144536510143436e-05, "loss": 1.0794, "loss_nan_ranks": 0, "loss_rank_avg": 0.312499463558197, "step": 301, "valid_targets_mean": 16167.8, "valid_targets_min": 15391 }, { "epoch": 1.2857142857142856, "grad_norm": 0.33178138136357144, "learning_rate": 3.711385101712544e-05, "loss": 1.088, "loss_nan_ranks": 0, "loss_rank_avg": 0.2378830462694168, "step": 302, "valid_targets_mean": 13015.2, "valid_targets_min": 10716 }, { "epoch": 1.2899786780383795, "grad_norm": 0.3052471145988171, "learning_rate": 3.708301434311289e-05, "loss": 1.0735, "loss_nan_ranks": 0, "loss_rank_avg": 0.3335162103176117, "step": 303, "valid_targets_mean": 16074.2, "valid_targets_min": 15513 }, { "epoch": 1.2942430703624734, "grad_norm": 0.3837352985797052, "learning_rate": 3.7052026760511996e-05, "loss": 1.0981, "loss_nan_ranks": 0, "loss_rank_avg": 0.33790653944015503, "step": 304, "valid_targets_mean": 16062.2, "valid_targets_min": 15222 }, { "epoch": 1.2985074626865671, "grad_norm": 0.3321958535826849, "learning_rate": 3.7020888543062046e-05, "loss": 1.1241, "loss_nan_ranks": 0, "loss_rank_avg": 0.28074121475219727, "step": 305, "valid_targets_mean": 15560.0, "valid_targets_min": 7641 }, { "epoch": 1.302771855010661, "grad_norm": 0.3501961919464328, "learning_rate": 3.6989599965833024e-05, "loss": 1.0766, "loss_nan_ranks": 0, "loss_rank_avg": 0.2851867377758026, "step": 306, "valid_targets_mean": 16099.2, "valid_targets_min": 13108 }, { "epoch": 1.3070362473347548, "grad_norm": 0.2955366487957757, "learning_rate": 3.695816130522317e-05, "loss": 1.0946, "loss_nan_ranks": 0, "loss_rank_avg": 0.22300812602043152, "step": 307, "valid_targets_mean": 11237.3, "valid_targets_min": 1669 }, { "epoch": 1.3113006396588487, "grad_norm": 0.325132523785184, "learning_rate": 3.692657283895651e-05, "loss": 1.0553, "loss_nan_ranks": 0, "loss_rank_avg": 0.2740810215473175, "step": 308, "valid_targets_mean": 16148.6, "valid_targets_min": 15513 }, { "epoch": 1.3155650319829424, "grad_norm": 0.3924334579310958, "learning_rate": 3.689483484608048e-05, "loss": 1.0616, "loss_nan_ranks": 0, "loss_rank_avg": 0.30613797903060913, "step": 309, "valid_targets_mean": 16065.3, "valid_targets_min": 13956 }, { "epoch": 1.3198294243070363, "grad_norm": 0.3701546337432741, "learning_rate": 3.6862947606963364e-05, "loss": 1.0866, "loss_nan_ranks": 0, "loss_rank_avg": 0.1709344983100891, "step": 310, "valid_targets_mean": 8786.3, "valid_targets_min": 979 }, { "epoch": 1.32409381663113, "grad_norm": 0.3069231801232966, "learning_rate": 3.6830911403291885e-05, "loss": 1.0579, "loss_nan_ranks": 0, "loss_rank_avg": 0.26452311873435974, "step": 311, "valid_targets_mean": 16189.7, "valid_targets_min": 15573 }, { "epoch": 1.328358208955224, "grad_norm": 0.37555960792372617, "learning_rate": 3.679872651806869e-05, "loss": 1.0453, "loss_nan_ranks": 0, "loss_rank_avg": 0.30860525369644165, "step": 312, "valid_targets_mean": 16043.3, "valid_targets_min": 13998 }, { "epoch": 1.3326226012793176, "grad_norm": 0.3570150907119278, "learning_rate": 3.676639323560986e-05, "loss": 1.0489, "loss_nan_ranks": 0, "loss_rank_avg": 0.21335217356681824, "step": 313, "valid_targets_mean": 11691.9, "valid_targets_min": 8218 }, { "epoch": 1.3368869936034116, "grad_norm": 0.3495179049936286, "learning_rate": 3.6733911841542365e-05, "loss": 1.0771, "loss_nan_ranks": 0, "loss_rank_avg": 0.2860753536224365, "step": 314, "valid_targets_mean": 16156.4, "valid_targets_min": 15261 }, { "epoch": 1.3411513859275053, "grad_norm": 0.314152802186107, "learning_rate": 3.6701282622801626e-05, "loss": 1.1131, "loss_nan_ranks": 0, "loss_rank_avg": 0.34913378953933716, "step": 315, "valid_targets_mean": 16031.2, "valid_targets_min": 14724 }, { "epoch": 1.3454157782515992, "grad_norm": 0.3525399586735576, "learning_rate": 3.666850586762886e-05, "loss": 1.0882, "loss_nan_ranks": 0, "loss_rank_avg": 0.26787278056144714, "step": 316, "valid_targets_mean": 15082.3, "valid_targets_min": 12379 }, { "epoch": 1.349680170575693, "grad_norm": 0.35426346625897037, "learning_rate": 3.663558186556863e-05, "loss": 1.0944, "loss_nan_ranks": 0, "loss_rank_avg": 0.3138875365257263, "step": 317, "valid_targets_mean": 16143.6, "valid_targets_min": 15422 }, { "epoch": 1.3539445628997868, "grad_norm": 0.329789873292349, "learning_rate": 3.660251090746627e-05, "loss": 1.1292, "loss_nan_ranks": 0, "loss_rank_avg": 0.27487125992774963, "step": 318, "valid_targets_mean": 13230.5, "valid_targets_min": 2050 }, { "epoch": 1.3582089552238805, "grad_norm": 0.3254671506286237, "learning_rate": 3.656929328546526e-05, "loss": 1.104, "loss_nan_ranks": 0, "loss_rank_avg": 0.2868189811706543, "step": 319, "valid_targets_mean": 15947.4, "valid_targets_min": 14844 }, { "epoch": 1.3624733475479744, "grad_norm": 0.37585500252720244, "learning_rate": 3.653592929300471e-05, "loss": 1.1131, "loss_nan_ranks": 0, "loss_rank_avg": 0.3040839731693268, "step": 320, "valid_targets_mean": 16161.1, "valid_targets_min": 15333 }, { "epoch": 1.3667377398720681, "grad_norm": 0.3427210209211445, "learning_rate": 3.650241922481675e-05, "loss": 1.0733, "loss_nan_ranks": 0, "loss_rank_avg": 0.1861184984445572, "step": 321, "valid_targets_mean": 9992.6, "valid_targets_min": 2412 }, { "epoch": 1.371002132196162, "grad_norm": 0.3384349571500406, "learning_rate": 3.6468763376923886e-05, "loss": 1.068, "loss_nan_ranks": 0, "loss_rank_avg": 0.2832762598991394, "step": 322, "valid_targets_mean": 16080.6, "valid_targets_min": 15212 }, { "epoch": 1.375266524520256, "grad_norm": 0.3681645742819213, "learning_rate": 3.6434962046636464e-05, "loss": 1.0953, "loss_nan_ranks": 0, "loss_rank_avg": 0.32412612438201904, "step": 323, "valid_targets_mean": 16106.3, "valid_targets_min": 15153 }, { "epoch": 1.3795309168443497, "grad_norm": 0.38460123447575495, "learning_rate": 3.6401015532549957e-05, "loss": 1.1213, "loss_nan_ranks": 0, "loss_rank_avg": 0.21516337990760803, "step": 324, "valid_targets_mean": 10360.2, "valid_targets_min": 7125 }, { "epoch": 1.3837953091684434, "grad_norm": 0.3220307097756737, "learning_rate": 3.6366924134542386e-05, "loss": 1.0624, "loss_nan_ranks": 0, "loss_rank_avg": 0.289733350276947, "step": 325, "valid_targets_mean": 16060.8, "valid_targets_min": 13555 }, { "epoch": 1.3880597014925373, "grad_norm": 0.3669520161660149, "learning_rate": 3.633268815377166e-05, "loss": 1.0962, "loss_nan_ranks": 0, "loss_rank_avg": 0.3282416760921478, "step": 326, "valid_targets_mean": 16054.6, "valid_targets_min": 14273 }, { "epoch": 1.3923240938166312, "grad_norm": 0.33768050522683196, "learning_rate": 3.6298307892672895e-05, "loss": 1.0716, "loss_nan_ranks": 0, "loss_rank_avg": 0.23629745841026306, "step": 327, "valid_targets_mean": 14108.6, "valid_targets_min": 11744 }, { "epoch": 1.396588486140725, "grad_norm": 0.31959918290802164, "learning_rate": 3.626378365495577e-05, "loss": 1.1137, "loss_nan_ranks": 0, "loss_rank_avg": 0.29224511981010437, "step": 328, "valid_targets_mean": 16144.3, "valid_targets_min": 15182 }, { "epoch": 1.4008528784648187, "grad_norm": 0.3584955638744689, "learning_rate": 3.622911574560181e-05, "loss": 1.0662, "loss_nan_ranks": 0, "loss_rank_avg": 0.3278372585773468, "step": 329, "valid_targets_mean": 16119.1, "valid_targets_min": 14732 }, { "epoch": 1.4051172707889126, "grad_norm": 0.3551164253468689, "learning_rate": 3.6194304470861744e-05, "loss": 1.1081, "loss_nan_ranks": 0, "loss_rank_avg": 0.2731977701187134, "step": 330, "valid_targets_mean": 15151.9, "valid_targets_min": 13814 }, { "epoch": 1.4093816631130065, "grad_norm": 0.33384857656040146, "learning_rate": 3.615935013825272e-05, "loss": 1.107, "loss_nan_ranks": 0, "loss_rank_avg": 0.30953341722488403, "step": 331, "valid_targets_mean": 16155.7, "valid_targets_min": 15560 }, { "epoch": 1.4136460554371002, "grad_norm": 0.3465598489468695, "learning_rate": 3.612425305655569e-05, "loss": 1.0806, "loss_nan_ranks": 0, "loss_rank_avg": 0.22017063200473785, "step": 332, "valid_targets_mean": 10614.2, "valid_targets_min": 1489 }, { "epoch": 1.417910447761194, "grad_norm": 0.37042791165061556, "learning_rate": 3.6089013535812593e-05, "loss": 1.0543, "loss_nan_ranks": 0, "loss_rank_avg": 0.2671017348766327, "step": 333, "valid_targets_mean": 16140.9, "valid_targets_min": 15217 }, { "epoch": 1.4221748400852878, "grad_norm": 0.32387094747577067, "learning_rate": 3.6053631887323656e-05, "loss": 1.0887, "loss_nan_ranks": 0, "loss_rank_avg": 0.3278307616710663, "step": 334, "valid_targets_mean": 16096.1, "valid_targets_min": 14473 }, { "epoch": 1.4264392324093818, "grad_norm": 0.3699947447682408, "learning_rate": 3.601810842364465e-05, "loss": 1.1212, "loss_nan_ranks": 0, "loss_rank_avg": 0.1788579821586609, "step": 335, "valid_targets_mean": 8554.1, "valid_targets_min": 618 }, { "epoch": 1.4307036247334755, "grad_norm": 0.32886822517451314, "learning_rate": 3.598244345858412e-05, "loss": 1.1056, "loss_nan_ranks": 0, "loss_rank_avg": 0.2595828175544739, "step": 336, "valid_targets_mean": 16153.3, "valid_targets_min": 15042 }, { "epoch": 1.4349680170575694, "grad_norm": 0.3523255078156776, "learning_rate": 3.594663730720059e-05, "loss": 1.0832, "loss_nan_ranks": 0, "loss_rank_avg": 0.31492581963539124, "step": 337, "valid_targets_mean": 16167.1, "valid_targets_min": 15032 }, { "epoch": 1.439232409381663, "grad_norm": 0.3705392055125923, "learning_rate": 3.591069028579982e-05, "loss": 1.0987, "loss_nan_ranks": 0, "loss_rank_avg": 0.22190961241722107, "step": 338, "valid_targets_mean": 12233.7, "valid_targets_min": 8961 }, { "epoch": 1.443496801705757, "grad_norm": 0.3047525795134772, "learning_rate": 3.5874602711931994e-05, "loss": 1.1007, "loss_nan_ranks": 0, "loss_rank_avg": 0.2945648431777954, "step": 339, "valid_targets_mean": 16054.2, "valid_targets_min": 15148 }, { "epoch": 1.4477611940298507, "grad_norm": 0.34833144896778817, "learning_rate": 3.5838374904388904e-05, "loss": 1.0703, "loss_nan_ranks": 0, "loss_rank_avg": 0.32256120443344116, "step": 340, "valid_targets_mean": 16200.9, "valid_targets_min": 15576 }, { "epoch": 1.4520255863539446, "grad_norm": 0.33905394371438524, "learning_rate": 3.580200718320115e-05, "loss": 1.0949, "loss_nan_ranks": 0, "loss_rank_avg": 0.25068533420562744, "step": 341, "valid_targets_mean": 15703.2, "valid_targets_min": 12835 }, { "epoch": 1.4562899786780383, "grad_norm": 0.36592609151750577, "learning_rate": 3.576549986963531e-05, "loss": 1.0774, "loss_nan_ranks": 0, "loss_rank_avg": 0.3194271922111511, "step": 342, "valid_targets_mean": 16056.5, "valid_targets_min": 14789 }, { "epoch": 1.4605543710021323, "grad_norm": 0.35390446845440837, "learning_rate": 3.5728853286191075e-05, "loss": 1.0643, "loss_nan_ranks": 0, "loss_rank_avg": 0.2540942132472992, "step": 343, "valid_targets_mean": 12879.8, "valid_targets_min": 1242 }, { "epoch": 1.464818763326226, "grad_norm": 0.2755780659749987, "learning_rate": 3.5692067756598465e-05, "loss": 1.0582, "loss_nan_ranks": 0, "loss_rank_avg": 0.26042819023132324, "step": 344, "valid_targets_mean": 16118.8, "valid_targets_min": 15426 }, { "epoch": 1.4690831556503199, "grad_norm": 0.38020197667496863, "learning_rate": 3.5655143605814885e-05, "loss": 1.0941, "loss_nan_ranks": 0, "loss_rank_avg": 0.2965239882469177, "step": 345, "valid_targets_mean": 15897.9, "valid_targets_min": 9286 }, { "epoch": 1.4733475479744136, "grad_norm": 0.2901011570573045, "learning_rate": 3.561808116002232e-05, "loss": 1.0811, "loss_nan_ranks": 0, "loss_rank_avg": 0.19708998501300812, "step": 346, "valid_targets_mean": 10358.7, "valid_targets_min": 2096 }, { "epoch": 1.4776119402985075, "grad_norm": 0.275342451326057, "learning_rate": 3.5580880746624444e-05, "loss": 1.0537, "loss_nan_ranks": 0, "loss_rank_avg": 0.24683061242103577, "step": 347, "valid_targets_mean": 16129.1, "valid_targets_min": 15180 }, { "epoch": 1.4818763326226012, "grad_norm": 0.312505048766249, "learning_rate": 3.5543542694243685e-05, "loss": 1.1107, "loss_nan_ranks": 0, "loss_rank_avg": 0.3103181719779968, "step": 348, "valid_targets_mean": 16167.1, "valid_targets_min": 15444 }, { "epoch": 1.4861407249466951, "grad_norm": 0.29880209782535827, "learning_rate": 3.5506067332718355e-05, "loss": 1.0879, "loss_nan_ranks": 0, "loss_rank_avg": 0.21556365489959717, "step": 349, "valid_targets_mean": 10549.6, "valid_targets_min": 6923 }, { "epoch": 1.4904051172707888, "grad_norm": 0.3366257575023693, "learning_rate": 3.546845499309976e-05, "loss": 1.0783, "loss_nan_ranks": 0, "loss_rank_avg": 0.27540475130081177, "step": 350, "valid_targets_mean": 16196.4, "valid_targets_min": 15446 }, { "epoch": 1.4946695095948828, "grad_norm": 0.2949817898380746, "learning_rate": 3.5430706007649225e-05, "loss": 1.0752, "loss_nan_ranks": 0, "loss_rank_avg": 0.3441014289855957, "step": 351, "valid_targets_mean": 16196.4, "valid_targets_min": 15577 }, { "epoch": 1.4989339019189765, "grad_norm": 0.33561416621297063, "learning_rate": 3.539282070983518e-05, "loss": 1.0948, "loss_nan_ranks": 0, "loss_rank_avg": 0.24721038341522217, "step": 352, "valid_targets_mean": 13119.6, "valid_targets_min": 10183 }, { "epoch": 1.5031982942430704, "grad_norm": 0.33633932267657934, "learning_rate": 3.535479943433023e-05, "loss": 1.1638, "loss_nan_ranks": 0, "loss_rank_avg": 0.3473033607006073, "step": 353, "valid_targets_mean": 15859.2, "valid_targets_min": 14337 }, { "epoch": 1.5074626865671643, "grad_norm": 0.30291988931748776, "learning_rate": 3.5316642517008184e-05, "loss": 1.0757, "loss_nan_ranks": 0, "loss_rank_avg": 0.30852532386779785, "step": 354, "valid_targets_mean": 16225.0, "valid_targets_min": 15717 }, { "epoch": 1.511727078891258, "grad_norm": 0.35609152737731914, "learning_rate": 3.5278350294941074e-05, "loss": 1.0929, "loss_nan_ranks": 0, "loss_rank_avg": 0.281000018119812, "step": 355, "valid_targets_mean": 15363.8, "valid_targets_min": 13266 }, { "epoch": 1.5159914712153517, "grad_norm": 0.3753461112007819, "learning_rate": 3.523992310639622e-05, "loss": 1.0561, "loss_nan_ranks": 0, "loss_rank_avg": 0.2891591191291809, "step": 356, "valid_targets_mean": 16191.6, "valid_targets_min": 15466 }, { "epoch": 1.5202558635394456, "grad_norm": 0.3055423589980571, "learning_rate": 3.5201361290833165e-05, "loss": 1.0817, "loss_nan_ranks": 0, "loss_rank_avg": 0.2250066101551056, "step": 357, "valid_targets_mean": 11349.5, "valid_targets_min": 1359 }, { "epoch": 1.5245202558635396, "grad_norm": 0.34286072931150735, "learning_rate": 3.516266518890079e-05, "loss": 1.066, "loss_nan_ranks": 0, "loss_rank_avg": 0.2844963073730469, "step": 358, "valid_targets_mean": 16115.3, "valid_targets_min": 14702 }, { "epoch": 1.5287846481876333, "grad_norm": 0.3449248650441334, "learning_rate": 3.512383514243419e-05, "loss": 1.0596, "loss_nan_ranks": 0, "loss_rank_avg": 0.2860240340232849, "step": 359, "valid_targets_mean": 16163.1, "valid_targets_min": 14547 }, { "epoch": 1.533049040511727, "grad_norm": 0.3771111536637937, "learning_rate": 3.5084871494451716e-05, "loss": 1.0225, "loss_nan_ranks": 0, "loss_rank_avg": 0.1857428401708603, "step": 360, "valid_targets_mean": 9576.8, "valid_targets_min": 1522 }, { "epoch": 1.537313432835821, "grad_norm": 0.3018932724883368, "learning_rate": 3.5045774589151955e-05, "loss": 1.0808, "loss_nan_ranks": 0, "loss_rank_avg": 0.2678816318511963, "step": 361, "valid_targets_mean": 15993.7, "valid_targets_min": 10506 }, { "epoch": 1.5415778251599148, "grad_norm": 0.40558509955640737, "learning_rate": 3.500654477191064e-05, "loss": 1.112, "loss_nan_ranks": 0, "loss_rank_avg": 0.34176117181777954, "step": 362, "valid_targets_mean": 15984.2, "valid_targets_min": 14307 }, { "epoch": 1.5458422174840085, "grad_norm": 0.43847114516949215, "learning_rate": 3.496718238927764e-05, "loss": 1.0905, "loss_nan_ranks": 0, "loss_rank_avg": 0.19546037912368774, "step": 363, "valid_targets_mean": 10465.0, "valid_targets_min": 6740 }, { "epoch": 1.5501066098081022, "grad_norm": 0.355769107924039, "learning_rate": 3.492768778897388e-05, "loss": 1.0736, "loss_nan_ranks": 0, "loss_rank_avg": 0.2820717692375183, "step": 364, "valid_targets_mean": 16167.3, "valid_targets_min": 14513 }, { "epoch": 1.5543710021321961, "grad_norm": 0.4284452026174569, "learning_rate": 3.4888061319888276e-05, "loss": 1.1042, "loss_nan_ranks": 0, "loss_rank_avg": 0.3305700421333313, "step": 365, "valid_targets_mean": 16124.3, "valid_targets_min": 15263 }, { "epoch": 1.55863539445629, "grad_norm": 0.4382707341244304, "learning_rate": 3.484830333207466e-05, "loss": 1.0999, "loss_nan_ranks": 0, "loss_rank_avg": 0.24906116724014282, "step": 366, "valid_targets_mean": 13535.5, "valid_targets_min": 11622 }, { "epoch": 1.5628997867803838, "grad_norm": 0.3455333246727441, "learning_rate": 3.4808414176748666e-05, "loss": 1.0576, "loss_nan_ranks": 0, "loss_rank_avg": 0.2977335751056671, "step": 367, "valid_targets_mean": 16211.1, "valid_targets_min": 15301 }, { "epoch": 1.5671641791044775, "grad_norm": 0.40729051659063775, "learning_rate": 3.476839420628466e-05, "loss": 1.0815, "loss_nan_ranks": 0, "loss_rank_avg": 0.2757585346698761, "step": 368, "valid_targets_mean": 13357.7, "valid_targets_min": 1733 }, { "epoch": 1.5714285714285714, "grad_norm": 0.4306050253331128, "learning_rate": 3.472824377421257e-05, "loss": 1.0562, "loss_nan_ranks": 0, "loss_rank_avg": 0.2567337155342102, "step": 369, "valid_targets_mean": 15113.8, "valid_targets_min": 13189 }, { "epoch": 1.5756929637526653, "grad_norm": 0.340921039883713, "learning_rate": 3.4687963235214845e-05, "loss": 1.0906, "loss_nan_ranks": 0, "loss_rank_avg": 0.3353586792945862, "step": 370, "valid_targets_mean": 16135.2, "valid_targets_min": 15576 }, { "epoch": 1.579957356076759, "grad_norm": 0.352901062487588, "learning_rate": 3.464755294512325e-05, "loss": 1.0873, "loss_nan_ranks": 0, "loss_rank_avg": 0.1842219978570938, "step": 371, "valid_targets_mean": 8529.3, "valid_targets_min": 1895 }, { "epoch": 1.5842217484008527, "grad_norm": 0.3252571700975914, "learning_rate": 3.4607013260915765e-05, "loss": 1.0876, "loss_nan_ranks": 0, "loss_rank_avg": 0.2786511480808258, "step": 372, "valid_targets_mean": 16116.1, "valid_targets_min": 14467 }, { "epoch": 1.5884861407249466, "grad_norm": 0.32289879581539677, "learning_rate": 3.4566344540713404e-05, "loss": 1.0283, "loss_nan_ranks": 0, "loss_rank_avg": 0.283419132232666, "step": 373, "valid_targets_mean": 16224.1, "valid_targets_min": 15168 }, { "epoch": 1.5927505330490406, "grad_norm": 0.2898095739507456, "learning_rate": 3.452554714377706e-05, "loss": 1.0681, "loss_nan_ranks": 0, "loss_rank_avg": 0.2174898087978363, "step": 374, "valid_targets_mean": 11231.9, "valid_targets_min": 7068 }, { "epoch": 1.5970149253731343, "grad_norm": 0.32701686595227597, "learning_rate": 3.448462143050436e-05, "loss": 1.0558, "loss_nan_ranks": 0, "loss_rank_avg": 0.28061437606811523, "step": 375, "valid_targets_mean": 15767.3, "valid_targets_min": 9286 }, { "epoch": 1.6012793176972282, "grad_norm": 0.3273263196787299, "learning_rate": 3.4443567762426444e-05, "loss": 1.1019, "loss_nan_ranks": 0, "loss_rank_avg": 0.31637561321258545, "step": 376, "valid_targets_mean": 16184.6, "valid_targets_min": 15606 }, { "epoch": 1.6055437100213221, "grad_norm": 0.28906601817080585, "learning_rate": 3.440238650220477e-05, "loss": 1.0381, "loss_nan_ranks": 0, "loss_rank_avg": 0.223393052816391, "step": 377, "valid_targets_mean": 13476.9, "valid_targets_min": 11755 }, { "epoch": 1.6098081023454158, "grad_norm": 0.35312103375959536, "learning_rate": 3.4361078013627945e-05, "loss": 1.048, "loss_nan_ranks": 0, "loss_rank_avg": 0.28802990913391113, "step": 378, "valid_targets_mean": 16131.5, "valid_targets_min": 15301 }, { "epoch": 1.6140724946695095, "grad_norm": 0.3752371927643447, "learning_rate": 3.4319642661608474e-05, "loss": 1.1179, "loss_nan_ranks": 0, "loss_rank_avg": 0.3004334568977356, "step": 379, "valid_targets_mean": 16156.4, "valid_targets_min": 15345 }, { "epoch": 1.6183368869936035, "grad_norm": 0.32696956300360913, "learning_rate": 3.427808081217957e-05, "loss": 1.102, "loss_nan_ranks": 0, "loss_rank_avg": 0.2737543284893036, "step": 380, "valid_targets_mean": 15046.2, "valid_targets_min": 10805 }, { "epoch": 1.6226012793176974, "grad_norm": 0.32425215210692304, "learning_rate": 3.423639283249189e-05, "loss": 1.0783, "loss_nan_ranks": 0, "loss_rank_avg": 0.2964897155761719, "step": 381, "valid_targets_mean": 16231.2, "valid_targets_min": 15531 }, { "epoch": 1.626865671641791, "grad_norm": 0.3425598006408661, "learning_rate": 3.419457909081032e-05, "loss": 1.0768, "loss_nan_ranks": 0, "loss_rank_avg": 0.23575259745121002, "step": 382, "valid_targets_mean": 10985.6, "valid_targets_min": 1923 }, { "epoch": 1.6311300639658848, "grad_norm": 0.34150364485281803, "learning_rate": 3.415263995651069e-05, "loss": 1.111, "loss_nan_ranks": 0, "loss_rank_avg": 0.28503063321113586, "step": 383, "valid_targets_mean": 15444.5, "valid_targets_min": 13058 }, { "epoch": 1.6353944562899787, "grad_norm": 0.26306448756733036, "learning_rate": 3.411057580007653e-05, "loss": 1.0587, "loss_nan_ranks": 0, "loss_rank_avg": 0.31446677446365356, "step": 384, "valid_targets_mean": 16178.7, "valid_targets_min": 15572 }, { "epoch": 1.6396588486140726, "grad_norm": 0.3965336853796899, "learning_rate": 3.4068386993095806e-05, "loss": 1.0459, "loss_nan_ranks": 0, "loss_rank_avg": 0.16267594695091248, "step": 385, "valid_targets_mean": 8596.7, "valid_targets_min": 2213 }, { "epoch": 1.6439232409381663, "grad_norm": 0.3169819070461087, "learning_rate": 3.402607390825762e-05, "loss": 1.0559, "loss_nan_ranks": 0, "loss_rank_avg": 0.24213969707489014, "step": 386, "valid_targets_mean": 16232.5, "valid_targets_min": 15539 }, { "epoch": 1.64818763326226, "grad_norm": 0.30538475252532604, "learning_rate": 3.398363691934894e-05, "loss": 1.0899, "loss_nan_ranks": 0, "loss_rank_avg": 0.33324548602104187, "step": 387, "valid_targets_mean": 16060.8, "valid_targets_min": 15033 }, { "epoch": 1.652452025586354, "grad_norm": 0.3569751677678015, "learning_rate": 3.3941076401251244e-05, "loss": 1.089, "loss_nan_ranks": 0, "loss_rank_avg": 0.1977802813053131, "step": 388, "valid_targets_mean": 11657.1, "valid_targets_min": 9535 }, { "epoch": 1.6567164179104479, "grad_norm": 0.3676226867999698, "learning_rate": 3.3898392729937295e-05, "loss": 1.0538, "loss_nan_ranks": 0, "loss_rank_avg": 0.2911812961101532, "step": 389, "valid_targets_mean": 16162.9, "valid_targets_min": 15023 }, { "epoch": 1.6609808102345416, "grad_norm": 0.28999735215403477, "learning_rate": 3.385558628246774e-05, "loss": 1.1031, "loss_nan_ranks": 0, "loss_rank_avg": 0.31773680448532104, "step": 390, "valid_targets_mean": 16113.8, "valid_targets_min": 15576 }, { "epoch": 1.6652452025586353, "grad_norm": 0.31093356074677225, "learning_rate": 3.381265743698781e-05, "loss": 1.0782, "loss_nan_ranks": 0, "loss_rank_avg": 0.2374432384967804, "step": 391, "valid_targets_mean": 14455.2, "valid_targets_min": 12866 }, { "epoch": 1.6695095948827292, "grad_norm": 0.35211344055285015, "learning_rate": 3.3769606572724e-05, "loss": 1.0542, "loss_nan_ranks": 0, "loss_rank_avg": 0.2905210852622986, "step": 392, "valid_targets_mean": 16126.9, "valid_targets_min": 14699 }, { "epoch": 1.6737739872068231, "grad_norm": 0.33113775807720236, "learning_rate": 3.3726434069980686e-05, "loss": 1.0381, "loss_nan_ranks": 0, "loss_rank_avg": 0.2336466759443283, "step": 393, "valid_targets_mean": 12935.7, "valid_targets_min": 1379 }, { "epoch": 1.6780383795309168, "grad_norm": 0.34400941915401295, "learning_rate": 3.368314031013678e-05, "loss": 1.0792, "loss_nan_ranks": 0, "loss_rank_avg": 0.26921963691711426, "step": 394, "valid_targets_mean": 16041.7, "valid_targets_min": 14053 }, { "epoch": 1.6823027718550105, "grad_norm": 0.35946946376014055, "learning_rate": 3.363972567564236e-05, "loss": 1.0771, "loss_nan_ranks": 0, "loss_rank_avg": 0.29747501015663147, "step": 395, "valid_targets_mean": 16214.8, "valid_targets_min": 15371 }, { "epoch": 1.6865671641791045, "grad_norm": 0.3554906035816403, "learning_rate": 3.35961905500153e-05, "loss": 1.099, "loss_nan_ranks": 0, "loss_rank_avg": 0.18330803513526917, "step": 396, "valid_targets_mean": 8966.2, "valid_targets_min": 2017 }, { "epoch": 1.6908315565031984, "grad_norm": 0.3216736094709334, "learning_rate": 3.3552535317837855e-05, "loss": 1.1295, "loss_nan_ranks": 0, "loss_rank_avg": 0.28136104345321655, "step": 397, "valid_targets_mean": 15754.8, "valid_targets_min": 13899 }, { "epoch": 1.695095948827292, "grad_norm": 0.3400173672246051, "learning_rate": 3.35087603647533e-05, "loss": 1.0812, "loss_nan_ranks": 0, "loss_rank_avg": 0.322651207447052, "step": 398, "valid_targets_mean": 16187.2, "valid_targets_min": 15624 }, { "epoch": 1.6993603411513858, "grad_norm": 0.34927667719012767, "learning_rate": 3.346486607746249e-05, "loss": 1.0958, "loss_nan_ranks": 0, "loss_rank_avg": 0.16751596331596375, "step": 399, "valid_targets_mean": 9466.9, "valid_targets_min": 4761 }, { "epoch": 1.7036247334754797, "grad_norm": 0.3022943680117074, "learning_rate": 3.342085284372047e-05, "loss": 1.0973, "loss_nan_ranks": 0, "loss_rank_avg": 0.3175053596496582, "step": 400, "valid_targets_mean": 16054.5, "valid_targets_min": 15525 }, { "epoch": 1.7078891257995736, "grad_norm": 0.35250167872229066, "learning_rate": 3.337672105233303e-05, "loss": 1.0742, "loss_nan_ranks": 0, "loss_rank_avg": 0.29572397470474243, "step": 401, "valid_targets_mean": 16123.2, "valid_targets_min": 14638 }, { "epoch": 1.7121535181236673, "grad_norm": 0.3732899225473128, "learning_rate": 3.3332471093153296e-05, "loss": 1.1069, "loss_nan_ranks": 0, "loss_rank_avg": 0.22419768571853638, "step": 402, "valid_targets_mean": 13257.8, "valid_targets_min": 10153 }, { "epoch": 1.716417910447761, "grad_norm": 0.32688882568803734, "learning_rate": 3.3288103357078244e-05, "loss": 1.1048, "loss_nan_ranks": 0, "loss_rank_avg": 0.30736756324768066, "step": 403, "valid_targets_mean": 16162.8, "valid_targets_min": 15337 }, { "epoch": 1.720682302771855, "grad_norm": 0.3331310863968516, "learning_rate": 3.324361823604529e-05, "loss": 1.0879, "loss_nan_ranks": 0, "loss_rank_avg": 0.33133578300476074, "step": 404, "valid_targets_mean": 16163.1, "valid_targets_min": 15308 }, { "epoch": 1.724946695095949, "grad_norm": 0.35818787168114613, "learning_rate": 3.319901612302881e-05, "loss": 1.0842, "loss_nan_ranks": 0, "loss_rank_avg": 0.26041942834854126, "step": 405, "valid_targets_mean": 15849.7, "valid_targets_min": 14606 }, { "epoch": 1.7292110874200426, "grad_norm": 0.4007074600786429, "learning_rate": 3.315429741203666e-05, "loss": 1.0603, "loss_nan_ranks": 0, "loss_rank_avg": 0.27965423464775085, "step": 406, "valid_targets_mean": 16208.5, "valid_targets_min": 15536 }, { "epoch": 1.7334754797441365, "grad_norm": 0.3203604311420045, "learning_rate": 3.3109462498106705e-05, "loss": 1.0399, "loss_nan_ranks": 0, "loss_rank_avg": 0.20618872344493866, "step": 407, "valid_targets_mean": 11185.1, "valid_targets_min": 1926 }, { "epoch": 1.7377398720682304, "grad_norm": 0.3333080315095021, "learning_rate": 3.306451177730333e-05, "loss": 1.0416, "loss_nan_ranks": 0, "loss_rank_avg": 0.2642345428466797, "step": 408, "valid_targets_mean": 15921.4, "valid_targets_min": 15152 }, { "epoch": 1.7420042643923241, "grad_norm": 0.3843812441465554, "learning_rate": 3.301944564671394e-05, "loss": 1.0927, "loss_nan_ranks": 0, "loss_rank_avg": 0.3201923966407776, "step": 409, "valid_targets_mean": 16101.6, "valid_targets_min": 13635 }, { "epoch": 1.7462686567164178, "grad_norm": 0.32315567146113006, "learning_rate": 3.297426450444546e-05, "loss": 1.0773, "loss_nan_ranks": 0, "loss_rank_avg": 0.18927864730358124, "step": 410, "valid_targets_mean": 10622.0, "valid_targets_min": 2749 }, { "epoch": 1.7505330490405118, "grad_norm": 0.2968381836926156, "learning_rate": 3.292896874962078e-05, "loss": 1.0479, "loss_nan_ranks": 0, "loss_rank_avg": 0.2641192376613617, "step": 411, "valid_targets_mean": 16163.8, "valid_targets_min": 14690 }, { "epoch": 1.7547974413646057, "grad_norm": 0.3352633067258525, "learning_rate": 3.2883558782375294e-05, "loss": 1.0779, "loss_nan_ranks": 0, "loss_rank_avg": 0.29602476954460144, "step": 412, "valid_targets_mean": 16117.5, "valid_targets_min": 13635 }, { "epoch": 1.7590618336886994, "grad_norm": 0.28476969110178263, "learning_rate": 3.283803500385332e-05, "loss": 1.0934, "loss_nan_ranks": 0, "loss_rank_avg": 0.22423139214515686, "step": 413, "valid_targets_mean": 12500.9, "valid_targets_min": 9491 }, { "epoch": 1.763326226012793, "grad_norm": 0.30474507510851556, "learning_rate": 3.2792397816204546e-05, "loss": 1.0923, "loss_nan_ranks": 0, "loss_rank_avg": 0.29216915369033813, "step": 414, "valid_targets_mean": 16139.3, "valid_targets_min": 15077 }, { "epoch": 1.767590618336887, "grad_norm": 0.2888866831703543, "learning_rate": 3.2746647622580524e-05, "loss": 1.0929, "loss_nan_ranks": 0, "loss_rank_avg": 0.3108062148094177, "step": 415, "valid_targets_mean": 16148.9, "valid_targets_min": 15485 }, { "epoch": 1.771855010660981, "grad_norm": 0.32915338022522184, "learning_rate": 3.270078482713106e-05, "loss": 1.0337, "loss_nan_ranks": 0, "loss_rank_avg": 0.23528018593788147, "step": 416, "valid_targets_mean": 14075.5, "valid_targets_min": 11572 }, { "epoch": 1.7761194029850746, "grad_norm": 0.30919496917968614, "learning_rate": 3.265480983500069e-05, "loss": 1.063, "loss_nan_ranks": 0, "loss_rank_avg": 0.30584001541137695, "step": 417, "valid_targets_mean": 16051.5, "valid_targets_min": 13927 }, { "epoch": 1.7803837953091683, "grad_norm": 0.3441949263098652, "learning_rate": 3.260872305232507e-05, "loss": 1.041, "loss_nan_ranks": 0, "loss_rank_avg": 0.25926971435546875, "step": 418, "valid_targets_mean": 13168.9, "valid_targets_min": 2225 }, { "epoch": 1.7846481876332623, "grad_norm": 0.36423291496651444, "learning_rate": 3.256252488622738e-05, "loss": 1.0468, "loss_nan_ranks": 0, "loss_rank_avg": 0.24720856547355652, "step": 419, "valid_targets_mean": 16116.3, "valid_targets_min": 13473 }, { "epoch": 1.7889125799573562, "grad_norm": 0.4247004875254001, "learning_rate": 3.251621574481475e-05, "loss": 1.0639, "loss_nan_ranks": 0, "loss_rank_avg": 0.29388993978500366, "step": 420, "valid_targets_mean": 16112.0, "valid_targets_min": 14287 }, { "epoch": 1.79317697228145, "grad_norm": 0.29766378137701294, "learning_rate": 3.246979603717467e-05, "loss": 1.1038, "loss_nan_ranks": 0, "loss_rank_avg": 0.20671671628952026, "step": 421, "valid_targets_mean": 10187.9, "valid_targets_min": 1240 }, { "epoch": 1.7974413646055436, "grad_norm": 0.40271557718751394, "learning_rate": 3.242326617337133e-05, "loss": 1.0478, "loss_nan_ranks": 0, "loss_rank_avg": 0.2497304528951645, "step": 422, "valid_targets_mean": 16181.6, "valid_targets_min": 14875 }, { "epoch": 1.8017057569296375, "grad_norm": 0.3782484850120709, "learning_rate": 3.2376626564442016e-05, "loss": 1.0654, "loss_nan_ranks": 0, "loss_rank_avg": 0.31483617424964905, "step": 423, "valid_targets_mean": 16183.7, "valid_targets_min": 15121 }, { "epoch": 1.8059701492537314, "grad_norm": 0.30649531604027724, "learning_rate": 3.2329877622393515e-05, "loss": 1.0504, "loss_nan_ranks": 0, "loss_rank_avg": 0.2193414866924286, "step": 424, "valid_targets_mean": 11132.9, "valid_targets_min": 7632 }, { "epoch": 1.8102345415778252, "grad_norm": 0.35448072761495, "learning_rate": 3.228301976019841e-05, "loss": 1.1135, "loss_nan_ranks": 0, "loss_rank_avg": 0.291428804397583, "step": 425, "valid_targets_mean": 16018.5, "valid_targets_min": 14821 }, { "epoch": 1.8144989339019189, "grad_norm": 0.3390792473030516, "learning_rate": 3.22360533917915e-05, "loss": 1.0773, "loss_nan_ranks": 0, "loss_rank_avg": 0.2975163459777832, "step": 426, "valid_targets_mean": 16201.6, "valid_targets_min": 15221 }, { "epoch": 1.8187633262260128, "grad_norm": 0.3147806679424687, "learning_rate": 3.218897893206608e-05, "loss": 1.0406, "loss_nan_ranks": 0, "loss_rank_avg": 0.2215021848678589, "step": 427, "valid_targets_mean": 13069.1, "valid_targets_min": 8831 }, { "epoch": 1.8230277185501067, "grad_norm": 0.36019990325979584, "learning_rate": 3.2141796796870335e-05, "loss": 1.0823, "loss_nan_ranks": 0, "loss_rank_avg": 0.2969133257865906, "step": 428, "valid_targets_mean": 16014.8, "valid_targets_min": 13788 }, { "epoch": 1.8272921108742004, "grad_norm": 0.2981772660966227, "learning_rate": 3.2094507403003614e-05, "loss": 1.0768, "loss_nan_ranks": 0, "loss_rank_avg": 0.31634145975112915, "step": 429, "valid_targets_mean": 16206.0, "valid_targets_min": 15778 }, { "epoch": 1.831556503198294, "grad_norm": 0.3562159773344419, "learning_rate": 3.2047111168212785e-05, "loss": 1.1017, "loss_nan_ranks": 0, "loss_rank_avg": 0.2830113470554352, "step": 430, "valid_targets_mean": 15181.8, "valid_targets_min": 13169 }, { "epoch": 1.835820895522388, "grad_norm": 0.3462357812701073, "learning_rate": 3.1999608511188524e-05, "loss": 1.0453, "loss_nan_ranks": 0, "loss_rank_avg": 0.28061801195144653, "step": 431, "valid_targets_mean": 16113.2, "valid_targets_min": 13828 }, { "epoch": 1.840085287846482, "grad_norm": 0.2712904109633026, "learning_rate": 3.1951999851561625e-05, "loss": 1.1287, "loss_nan_ranks": 0, "loss_rank_avg": 0.2145303189754486, "step": 432, "valid_targets_mean": 11254.6, "valid_targets_min": 1974 }, { "epoch": 1.8443496801705757, "grad_norm": 0.3372878988948171, "learning_rate": 3.190428560989931e-05, "loss": 1.0754, "loss_nan_ranks": 0, "loss_rank_avg": 0.269620805978775, "step": 433, "valid_targets_mean": 15552.6, "valid_targets_min": 14147 }, { "epoch": 1.8486140724946694, "grad_norm": 0.33502781437527734, "learning_rate": 3.185646620770146e-05, "loss": 1.0554, "loss_nan_ranks": 0, "loss_rank_avg": 0.3428090810775757, "step": 434, "valid_targets_mean": 16115.7, "valid_targets_min": 15331 }, { "epoch": 1.8528784648187633, "grad_norm": 0.32083840655486917, "learning_rate": 3.180854206739696e-05, "loss": 1.1193, "loss_nan_ranks": 0, "loss_rank_avg": 0.15823984146118164, "step": 435, "valid_targets_mean": 7300.2, "valid_targets_min": 1215 }, { "epoch": 1.8571428571428572, "grad_norm": 0.3655942212180277, "learning_rate": 3.176051361233991e-05, "loss": 1.0793, "loss_nan_ranks": 0, "loss_rank_avg": 0.27045610547065735, "step": 436, "valid_targets_mean": 16174.1, "valid_targets_min": 15414 }, { "epoch": 1.861407249466951, "grad_norm": 0.37573240088501814, "learning_rate": 3.171238126680594e-05, "loss": 1.0503, "loss_nan_ranks": 0, "loss_rank_avg": 0.29048848152160645, "step": 437, "valid_targets_mean": 16202.2, "valid_targets_min": 15560 }, { "epoch": 1.8656716417910446, "grad_norm": 0.352557840532509, "learning_rate": 3.166414545598839e-05, "loss": 1.0993, "loss_nan_ranks": 0, "loss_rank_avg": 0.23219341039657593, "step": 438, "valid_targets_mean": 12580.4, "valid_targets_min": 10074 }, { "epoch": 1.8699360341151388, "grad_norm": 0.40604007958968985, "learning_rate": 3.161580660599464e-05, "loss": 1.0707, "loss_nan_ranks": 0, "loss_rank_avg": 0.27523332834243774, "step": 439, "valid_targets_mean": 15703.7, "valid_targets_min": 4778 }, { "epoch": 1.8742004264392325, "grad_norm": 0.3578916382684771, "learning_rate": 3.1567365143842264e-05, "loss": 1.0602, "loss_nan_ranks": 0, "loss_rank_avg": 0.3120695650577545, "step": 440, "valid_targets_mean": 16157.0, "valid_targets_min": 15368 }, { "epoch": 1.8784648187633262, "grad_norm": 0.29322622999687875, "learning_rate": 3.1518821497455326e-05, "loss": 1.0661, "loss_nan_ranks": 0, "loss_rank_avg": 0.22893603146076202, "step": 441, "valid_targets_mean": 13424.1, "valid_targets_min": 11379 }, { "epoch": 1.88272921108742, "grad_norm": 0.36915524627767804, "learning_rate": 3.147017609566054e-05, "loss": 1.0954, "loss_nan_ranks": 0, "loss_rank_avg": 0.3331189453601837, "step": 442, "valid_targets_mean": 16049.3, "valid_targets_min": 14702 }, { "epoch": 1.886993603411514, "grad_norm": 0.25054962444606416, "learning_rate": 3.142142936818353e-05, "loss": 1.0737, "loss_nan_ranks": 0, "loss_rank_avg": 0.25321656465530396, "step": 443, "valid_targets_mean": 13397.8, "valid_targets_min": 2017 }, { "epoch": 1.8912579957356077, "grad_norm": 0.3509714430545398, "learning_rate": 3.137258174564501e-05, "loss": 1.1309, "loss_nan_ranks": 0, "loss_rank_avg": 0.27710413932800293, "step": 444, "valid_targets_mean": 16007.1, "valid_targets_min": 15085 }, { "epoch": 1.8955223880597014, "grad_norm": 0.35482602042188444, "learning_rate": 3.1323633659556986e-05, "loss": 1.0238, "loss_nan_ranks": 0, "loss_rank_avg": 0.2886030673980713, "step": 445, "valid_targets_mean": 16240.1, "valid_targets_min": 15762 }, { "epoch": 1.8997867803837953, "grad_norm": 0.26773049702383594, "learning_rate": 3.127458554231894e-05, "loss": 1.1115, "loss_nan_ranks": 0, "loss_rank_avg": 0.1944742053747177, "step": 446, "valid_targets_mean": 9927.9, "valid_targets_min": 2329 }, { "epoch": 1.9040511727078893, "grad_norm": 0.3483780481045023, "learning_rate": 3.122543782721402e-05, "loss": 1.0928, "loss_nan_ranks": 0, "loss_rank_avg": 0.27462565898895264, "step": 447, "valid_targets_mean": 16032.5, "valid_targets_min": 15102 }, { "epoch": 1.908315565031983, "grad_norm": 0.3368829130798326, "learning_rate": 3.1176190948405194e-05, "loss": 1.0736, "loss_nan_ranks": 0, "loss_rank_avg": 0.34951770305633545, "step": 448, "valid_targets_mean": 16119.2, "valid_targets_min": 15712 }, { "epoch": 1.9125799573560767, "grad_norm": 0.30268057780648044, "learning_rate": 3.112684534093142e-05, "loss": 1.0877, "loss_nan_ranks": 0, "loss_rank_avg": 0.19990648329257965, "step": 449, "valid_targets_mean": 10913.1, "valid_targets_min": 6367 }, { "epoch": 1.9168443496801706, "grad_norm": 0.30358006933130305, "learning_rate": 3.107740144070385e-05, "loss": 1.0234, "loss_nan_ranks": 0, "loss_rank_avg": 0.2891259789466858, "step": 450, "valid_targets_mean": 16040.9, "valid_targets_min": 13080 }, { "epoch": 1.9211087420042645, "grad_norm": 0.3628808145609311, "learning_rate": 3.102785968450188e-05, "loss": 1.0428, "loss_nan_ranks": 0, "loss_rank_avg": 0.3000900149345398, "step": 451, "valid_targets_mean": 16137.6, "valid_targets_min": 15228 }, { "epoch": 1.9253731343283582, "grad_norm": 0.2764530866126593, "learning_rate": 3.09782205099694e-05, "loss": 1.1202, "loss_nan_ranks": 0, "loss_rank_avg": 0.2544265389442444, "step": 452, "valid_targets_mean": 13191.7, "valid_targets_min": 10839 }, { "epoch": 1.929637526652452, "grad_norm": 0.28797232262388883, "learning_rate": 3.092848435561084e-05, "loss": 1.0382, "loss_nan_ranks": 0, "loss_rank_avg": 0.28947630524635315, "step": 453, "valid_targets_mean": 16126.2, "valid_targets_min": 14702 }, { "epoch": 1.9339019189765458, "grad_norm": 0.31616751921565583, "learning_rate": 3.0878651660787376e-05, "loss": 1.0735, "loss_nan_ranks": 0, "loss_rank_avg": 0.2999494671821594, "step": 454, "valid_targets_mean": 16165.5, "valid_targets_min": 14997 }, { "epoch": 1.9381663113006398, "grad_norm": 0.26746073217550403, "learning_rate": 3.082872286571295e-05, "loss": 1.061, "loss_nan_ranks": 0, "loss_rank_avg": 0.2623918652534485, "step": 455, "valid_targets_mean": 14387.2, "valid_targets_min": 12697 }, { "epoch": 1.9424307036247335, "grad_norm": 0.2840271608173446, "learning_rate": 3.077869841145049e-05, "loss": 1.0563, "loss_nan_ranks": 0, "loss_rank_avg": 0.30360060930252075, "step": 456, "valid_targets_mean": 16208.8, "valid_targets_min": 15627 }, { "epoch": 1.9466950959488272, "grad_norm": 0.28298849548309235, "learning_rate": 3.0728578739907934e-05, "loss": 1.1073, "loss_nan_ranks": 0, "loss_rank_avg": 0.2182055413722992, "step": 457, "valid_targets_mean": 10413.9, "valid_targets_min": 2491 }, { "epoch": 1.950959488272921, "grad_norm": 0.267402368213611, "learning_rate": 3.067836429383437e-05, "loss": 1.0376, "loss_nan_ranks": 0, "loss_rank_avg": 0.2391853779554367, "step": 458, "valid_targets_mean": 16266.1, "valid_targets_min": 16019 }, { "epoch": 1.955223880597015, "grad_norm": 0.27519623772632346, "learning_rate": 3.062805551681609e-05, "loss": 1.078, "loss_nan_ranks": 0, "loss_rank_avg": 0.3138701915740967, "step": 459, "valid_targets_mean": 16080.7, "valid_targets_min": 14943 }, { "epoch": 1.9594882729211087, "grad_norm": 0.3412396846851224, "learning_rate": 3.057765285327271e-05, "loss": 1.1299, "loss_nan_ranks": 0, "loss_rank_avg": 0.13240568339824677, "step": 460, "valid_targets_mean": 6411.7, "valid_targets_min": 2004 }, { "epoch": 1.9637526652452024, "grad_norm": 0.27637519468535493, "learning_rate": 3.0527156748453214e-05, "loss": 1.0246, "loss_nan_ranks": 0, "loss_rank_avg": 0.2705056965351105, "step": 461, "valid_targets_mean": 16094.2, "valid_targets_min": 13927 }, { "epoch": 1.9680170575692963, "grad_norm": 0.2491017774469789, "learning_rate": 3.047656764843203e-05, "loss": 1.1089, "loss_nan_ranks": 0, "loss_rank_avg": 0.31651365756988525, "step": 462, "valid_targets_mean": 16166.5, "valid_targets_min": 15218 }, { "epoch": 1.9722814498933903, "grad_norm": 0.2898466387677518, "learning_rate": 3.0425886000105094e-05, "loss": 1.043, "loss_nan_ranks": 0, "loss_rank_avg": 0.2042815089225769, "step": 463, "valid_targets_mean": 12991.4, "valid_targets_min": 11115 }, { "epoch": 1.976545842217484, "grad_norm": 0.24076807322050023, "learning_rate": 3.0375112251185892e-05, "loss": 1.0471, "loss_nan_ranks": 0, "loss_rank_avg": 0.28346341848373413, "step": 464, "valid_targets_mean": 16167.2, "valid_targets_min": 15368 }, { "epoch": 1.9808102345415777, "grad_norm": 0.2987602021633277, "learning_rate": 3.0324246850201527e-05, "loss": 1.1343, "loss_nan_ranks": 0, "loss_rank_avg": 0.3213338851928711, "step": 465, "valid_targets_mean": 16105.9, "valid_targets_min": 15564 }, { "epoch": 1.9850746268656716, "grad_norm": 0.2728017482563389, "learning_rate": 3.0273290246488732e-05, "loss": 1.0956, "loss_nan_ranks": 0, "loss_rank_avg": 0.25564104318618774, "step": 466, "valid_targets_mean": 15038.5, "valid_targets_min": 13132 }, { "epoch": 1.9893390191897655, "grad_norm": 0.27178003591024674, "learning_rate": 3.0222242890189904e-05, "loss": 1.1019, "loss_nan_ranks": 0, "loss_rank_avg": 0.3196239471435547, "step": 467, "valid_targets_mean": 16099.2, "valid_targets_min": 15195 }, { "epoch": 1.9936034115138592, "grad_norm": 0.2960811264621479, "learning_rate": 3.017110523224914e-05, "loss": 1.0748, "loss_nan_ranks": 0, "loss_rank_avg": 0.243838369846344, "step": 468, "valid_targets_mean": 13108.7, "valid_targets_min": 1500 }, { "epoch": 1.997867803837953, "grad_norm": 0.2900638231868673, "learning_rate": 3.011987772440825e-05, "loss": 1.1061, "loss_nan_ranks": 0, "loss_rank_avg": 0.269381582736969, "step": 469, "valid_targets_mean": 15314.6, "valid_targets_min": 13039 }, { "epoch": 2.0, "grad_norm": 0.368934520127521, "learning_rate": 3.006856081920277e-05, "loss": 1.0759, "loss_nan_ranks": 0, "loss_rank_avg": 0.4675736427307129, "step": 470, "valid_targets_mean": 10737.9, "valid_targets_min": 1562 }, { "epoch": 2.0042643923240937, "grad_norm": 0.3552345026600377, "learning_rate": 3.001715496995793e-05, "loss": 1.0287, "loss_nan_ranks": 0, "loss_rank_avg": 0.2579972743988037, "step": 471, "valid_targets_mean": 16126.5, "valid_targets_min": 15300 }, { "epoch": 2.008528784648188, "grad_norm": 0.39123834746131897, "learning_rate": 2.9965660630784715e-05, "loss": 1.0687, "loss_nan_ranks": 0, "loss_rank_avg": 0.31611669063568115, "step": 472, "valid_targets_mean": 16121.2, "valid_targets_min": 14702 }, { "epoch": 2.0127931769722816, "grad_norm": 0.41374695875844714, "learning_rate": 2.9914078256575782e-05, "loss": 1.0199, "loss_nan_ranks": 0, "loss_rank_avg": 0.19053825736045837, "step": 473, "valid_targets_mean": 11766.6, "valid_targets_min": 7044 }, { "epoch": 2.0170575692963753, "grad_norm": 0.40073365553126444, "learning_rate": 2.9862408303001492e-05, "loss": 1.0289, "loss_nan_ranks": 0, "loss_rank_avg": 0.2865005135536194, "step": 474, "valid_targets_mean": 16154.8, "valid_targets_min": 15606 }, { "epoch": 2.021321961620469, "grad_norm": 0.46584459230727177, "learning_rate": 2.9810651226505875e-05, "loss": 1.0107, "loss_nan_ranks": 0, "loss_rank_avg": 0.29241612553596497, "step": 475, "valid_targets_mean": 16143.0, "valid_targets_min": 14917 }, { "epoch": 2.025586353944563, "grad_norm": 0.40495999614766015, "learning_rate": 2.9758807484302566e-05, "loss": 1.0117, "loss_nan_ranks": 0, "loss_rank_avg": 0.22781220078468323, "step": 476, "valid_targets_mean": 14726.9, "valid_targets_min": 13072 }, { "epoch": 2.029850746268657, "grad_norm": 0.34368125435399516, "learning_rate": 2.9706877534370822e-05, "loss": 1.0104, "loss_nan_ranks": 0, "loss_rank_avg": 0.2631028890609741, "step": 477, "valid_targets_mean": 16200.3, "valid_targets_min": 15042 }, { "epoch": 2.0341151385927505, "grad_norm": 0.4136824421856256, "learning_rate": 2.965486183545142e-05, "loss": 1.0937, "loss_nan_ranks": 0, "loss_rank_avg": 0.24957922101020813, "step": 478, "valid_targets_mean": 13077.4, "valid_targets_min": 1630 }, { "epoch": 2.038379530916844, "grad_norm": 0.3581098227344428, "learning_rate": 2.9602760847042645e-05, "loss": 1.0235, "loss_nan_ranks": 0, "loss_rank_avg": 0.24706491827964783, "step": 479, "valid_targets_mean": 15628.0, "valid_targets_min": 14094 }, { "epoch": 2.0426439232409384, "grad_norm": 0.3287300126568842, "learning_rate": 2.955057502939621e-05, "loss": 1.0477, "loss_nan_ranks": 0, "loss_rank_avg": 0.2831410765647888, "step": 480, "valid_targets_mean": 16204.5, "valid_targets_min": 15520 }, { "epoch": 2.046908315565032, "grad_norm": 0.36544509127089886, "learning_rate": 2.9498304843513193e-05, "loss": 1.0476, "loss_nan_ranks": 0, "loss_rank_avg": 0.16354572772979736, "step": 481, "valid_targets_mean": 8899.1, "valid_targets_min": 1392 }, { "epoch": 2.0511727078891258, "grad_norm": 0.29290892374778665, "learning_rate": 2.9445950751139957e-05, "loss": 0.9926, "loss_nan_ranks": 0, "loss_rank_avg": 0.25088614225387573, "step": 482, "valid_targets_mean": 16143.0, "valid_targets_min": 15153 }, { "epoch": 2.0554371002132195, "grad_norm": 0.3413415806747987, "learning_rate": 2.939351321476412e-05, "loss": 1.0442, "loss_nan_ranks": 0, "loss_rank_avg": 0.3098033368587494, "step": 483, "valid_targets_mean": 16180.8, "valid_targets_min": 15538 }, { "epoch": 2.0597014925373136, "grad_norm": 0.3477262822317496, "learning_rate": 2.9340992697610393e-05, "loss": 1.1174, "loss_nan_ranks": 0, "loss_rank_avg": 0.23189440369606018, "step": 484, "valid_targets_mean": 12631.6, "valid_targets_min": 7725 }, { "epoch": 2.0639658848614073, "grad_norm": 0.25626551753147225, "learning_rate": 2.9288389663636537e-05, "loss": 1.0595, "loss_nan_ranks": 0, "loss_rank_avg": 0.2773468494415283, "step": 485, "valid_targets_mean": 16057.7, "valid_targets_min": 14555 }, { "epoch": 2.068230277185501, "grad_norm": 0.2975738669309161, "learning_rate": 2.923570457752925e-05, "loss": 0.9844, "loss_nan_ranks": 0, "loss_rank_avg": 0.2952193021774292, "step": 486, "valid_targets_mean": 16159.5, "valid_targets_min": 15168 }, { "epoch": 2.0724946695095947, "grad_norm": 0.3185341360493201, "learning_rate": 2.9182937904700078e-05, "loss": 1.0428, "loss_nan_ranks": 0, "loss_rank_avg": 0.23297083377838135, "step": 487, "valid_targets_mean": 13743.6, "valid_targets_min": 11030 }, { "epoch": 2.076759061833689, "grad_norm": 0.33249335218498505, "learning_rate": 2.9130090111281278e-05, "loss": 1.0131, "loss_nan_ranks": 0, "loss_rank_avg": 0.27144575119018555, "step": 488, "valid_targets_mean": 16219.4, "valid_targets_min": 15554 }, { "epoch": 2.0810234541577826, "grad_norm": 0.2996105345731296, "learning_rate": 2.9077161664121722e-05, "loss": 1.0553, "loss_nan_ranks": 0, "loss_rank_avg": 0.3078475892543793, "step": 489, "valid_targets_mean": 16029.9, "valid_targets_min": 15168 }, { "epoch": 2.0852878464818763, "grad_norm": 0.368268651082118, "learning_rate": 2.902415303078275e-05, "loss": 1.0256, "loss_nan_ranks": 0, "loss_rank_avg": 0.23868870735168457, "step": 490, "valid_targets_mean": 15594.2, "valid_targets_min": 13709 }, { "epoch": 2.08955223880597, "grad_norm": 0.3316811583389926, "learning_rate": 2.8971064679534072e-05, "loss": 1.0153, "loss_nan_ranks": 0, "loss_rank_avg": 0.2731947600841522, "step": 491, "valid_targets_mean": 16149.3, "valid_targets_min": 15057 }, { "epoch": 2.093816631130064, "grad_norm": 0.3417240842034942, "learning_rate": 2.8917897079349604e-05, "loss": 1.0379, "loss_nan_ranks": 0, "loss_rank_avg": 0.2092648297548294, "step": 492, "valid_targets_mean": 10589.6, "valid_targets_min": 2052 }, { "epoch": 2.098081023454158, "grad_norm": 0.40376931007632894, "learning_rate": 2.8864650699903336e-05, "loss": 1.0248, "loss_nan_ranks": 0, "loss_rank_avg": 0.2569881081581116, "step": 493, "valid_targets_mean": 15575.6, "valid_targets_min": 12875 }, { "epoch": 2.1023454157782515, "grad_norm": 0.30769674885232867, "learning_rate": 2.881132601156518e-05, "loss": 1.0579, "loss_nan_ranks": 0, "loss_rank_avg": 0.3187497854232788, "step": 494, "valid_targets_mean": 16201.0, "valid_targets_min": 15588 }, { "epoch": 2.106609808102345, "grad_norm": 0.33552517299223356, "learning_rate": 2.8757923485396805e-05, "loss": 1.0356, "loss_nan_ranks": 0, "loss_rank_avg": 0.15743032097816467, "step": 495, "valid_targets_mean": 8183.4, "valid_targets_min": 1761 }, { "epoch": 2.1108742004264394, "grad_norm": 0.3424571034637037, "learning_rate": 2.8704443593147517e-05, "loss": 1.0719, "loss_nan_ranks": 0, "loss_rank_avg": 0.27219459414482117, "step": 496, "valid_targets_mean": 16106.9, "valid_targets_min": 15525 }, { "epoch": 2.115138592750533, "grad_norm": 0.2808950772476962, "learning_rate": 2.8650886807250024e-05, "loss": 1.0675, "loss_nan_ranks": 0, "loss_rank_avg": 0.3192838728427887, "step": 497, "valid_targets_mean": 16090.3, "valid_targets_min": 14394 }, { "epoch": 2.1194029850746268, "grad_norm": 0.37199865580909014, "learning_rate": 2.8597253600816332e-05, "loss": 1.0764, "loss_nan_ranks": 0, "loss_rank_avg": 0.2070493996143341, "step": 498, "valid_targets_mean": 11938.5, "valid_targets_min": 10146 }, { "epoch": 2.1236673773987205, "grad_norm": 0.3091647855511728, "learning_rate": 2.8543544447633517e-05, "loss": 1.0565, "loss_nan_ranks": 0, "loss_rank_avg": 0.2848047614097595, "step": 499, "valid_targets_mean": 16117.8, "valid_targets_min": 14547 }, { "epoch": 2.1279317697228146, "grad_norm": 0.4360073570883157, "learning_rate": 2.8489759822159558e-05, "loss": 1.1129, "loss_nan_ranks": 0, "loss_rank_avg": 0.3340121805667877, "step": 500, "valid_targets_mean": 16178.9, "valid_targets_min": 15565 }, { "epoch": 2.1321961620469083, "grad_norm": 0.35047972464084715, "learning_rate": 2.843590019951914e-05, "loss": 1.0502, "loss_nan_ranks": 0, "loss_rank_avg": 0.22108137607574463, "step": 501, "valid_targets_mean": 13181.2, "valid_targets_min": 11593 }, { "epoch": 2.136460554371002, "grad_norm": 0.40037840006291353, "learning_rate": 2.838196605549948e-05, "loss": 1.0656, "loss_nan_ranks": 0, "loss_rank_avg": 0.31084370613098145, "step": 502, "valid_targets_mean": 16180.7, "valid_targets_min": 15667 }, { "epoch": 2.140724946695096, "grad_norm": 0.3146422639655215, "learning_rate": 2.8327957866546082e-05, "loss": 1.107, "loss_nan_ranks": 0, "loss_rank_avg": 0.25872519612312317, "step": 503, "valid_targets_mean": 12895.1, "valid_targets_min": 755 }, { "epoch": 2.14498933901919, "grad_norm": 0.36862933115455493, "learning_rate": 2.8273876109758568e-05, "loss": 1.0786, "loss_nan_ranks": 0, "loss_rank_avg": 0.26297274231910706, "step": 504, "valid_targets_mean": 15436.5, "valid_targets_min": 14157 }, { "epoch": 2.1492537313432836, "grad_norm": 0.361459762761618, "learning_rate": 2.8219721262886427e-05, "loss": 1.0455, "loss_nan_ranks": 0, "loss_rank_avg": 0.31806501746177673, "step": 505, "valid_targets_mean": 16037.3, "valid_targets_min": 13211 }, { "epoch": 2.1535181236673773, "grad_norm": 0.2864709994302262, "learning_rate": 2.816549380432483e-05, "loss": 1.0265, "loss_nan_ranks": 0, "loss_rank_avg": 0.18135976791381836, "step": 506, "valid_targets_mean": 9544.8, "valid_targets_min": 1763 }, { "epoch": 2.1577825159914714, "grad_norm": 0.3350310583584809, "learning_rate": 2.8111194213110386e-05, "loss": 1.0286, "loss_nan_ranks": 0, "loss_rank_avg": 0.2634314298629761, "step": 507, "valid_targets_mean": 15868.5, "valid_targets_min": 9799 }, { "epoch": 2.162046908315565, "grad_norm": 0.3255526769969389, "learning_rate": 2.805682296891691e-05, "loss": 1.074, "loss_nan_ranks": 0, "loss_rank_avg": 0.3196669816970825, "step": 508, "valid_targets_mean": 16133.4, "valid_targets_min": 15537 }, { "epoch": 2.166311300639659, "grad_norm": 0.32487336416940715, "learning_rate": 2.8002380552051186e-05, "loss": 1.0715, "loss_nan_ranks": 0, "loss_rank_avg": 0.16130326688289642, "step": 509, "valid_targets_mean": 9578.0, "valid_targets_min": 5674 }, { "epoch": 2.1705756929637525, "grad_norm": 0.32268877543461205, "learning_rate": 2.7947867443448728e-05, "loss": 1.0267, "loss_nan_ranks": 0, "loss_rank_avg": 0.2731488049030304, "step": 510, "valid_targets_mean": 16089.0, "valid_targets_min": 14444 }, { "epoch": 2.1748400852878467, "grad_norm": 0.320456670152423, "learning_rate": 2.789328412466953e-05, "loss": 1.0742, "loss_nan_ranks": 0, "loss_rank_avg": 0.29730743169784546, "step": 511, "valid_targets_mean": 16163.5, "valid_targets_min": 15222 }, { "epoch": 2.1791044776119404, "grad_norm": 0.3321709887681174, "learning_rate": 2.7838631077893813e-05, "loss": 1.0546, "loss_nan_ranks": 0, "loss_rank_avg": 0.21399202942848206, "step": 512, "valid_targets_mean": 12320.2, "valid_targets_min": 10472 }, { "epoch": 2.183368869936034, "grad_norm": 0.39115337491407043, "learning_rate": 2.7783908785917753e-05, "loss": 1.0746, "loss_nan_ranks": 0, "loss_rank_avg": 0.30008408427238464, "step": 513, "valid_targets_mean": 16060.1, "valid_targets_min": 14908 }, { "epoch": 2.1876332622601278, "grad_norm": 0.3092000821820992, "learning_rate": 2.7729117732149244e-05, "loss": 1.0625, "loss_nan_ranks": 0, "loss_rank_avg": 0.2982850670814514, "step": 514, "valid_targets_mean": 15956.0, "valid_targets_min": 12151 }, { "epoch": 2.191897654584222, "grad_norm": 0.39058023646491175, "learning_rate": 2.7674258400603587e-05, "loss": 1.043, "loss_nan_ranks": 0, "loss_rank_avg": 0.2451504021883011, "step": 515, "valid_targets_mean": 14654.4, "valid_targets_min": 12701 }, { "epoch": 2.1961620469083156, "grad_norm": 0.37207685669025975, "learning_rate": 2.761933127589927e-05, "loss": 1.0718, "loss_nan_ranks": 0, "loss_rank_avg": 0.2868039608001709, "step": 516, "valid_targets_mean": 16187.1, "valid_targets_min": 15153 }, { "epoch": 2.2004264392324093, "grad_norm": 0.3478055090012624, "learning_rate": 2.7564336843253633e-05, "loss": 1.0367, "loss_nan_ranks": 0, "loss_rank_avg": 0.20308353006839752, "step": 517, "valid_targets_mean": 11016.9, "valid_targets_min": 1500 }, { "epoch": 2.204690831556503, "grad_norm": 0.2834140615062104, "learning_rate": 2.7509275588478606e-05, "loss": 1.0648, "loss_nan_ranks": 0, "loss_rank_avg": 0.2778732180595398, "step": 518, "valid_targets_mean": 16131.2, "valid_targets_min": 15565 }, { "epoch": 2.208955223880597, "grad_norm": 0.35932831920478553, "learning_rate": 2.7454147997976404e-05, "loss": 1.0134, "loss_nan_ranks": 0, "loss_rank_avg": 0.2866620421409607, "step": 519, "valid_targets_mean": 16204.6, "valid_targets_min": 15596 }, { "epoch": 2.213219616204691, "grad_norm": 0.2839057580653145, "learning_rate": 2.7398954558735272e-05, "loss": 1.0505, "loss_nan_ranks": 0, "loss_rank_avg": 0.1549297571182251, "step": 520, "valid_targets_mean": 8753.9, "valid_targets_min": 2749 }, { "epoch": 2.2174840085287846, "grad_norm": 0.37158603632443654, "learning_rate": 2.7343695758325125e-05, "loss": 1.0292, "loss_nan_ranks": 0, "loss_rank_avg": 0.2592717111110687, "step": 521, "valid_targets_mean": 16047.2, "valid_targets_min": 15012 }, { "epoch": 2.2217484008528783, "grad_norm": 0.3434129611890377, "learning_rate": 2.7288372084893282e-05, "loss": 1.0267, "loss_nan_ranks": 0, "loss_rank_avg": 0.2959210276603699, "step": 522, "valid_targets_mean": 16112.9, "valid_targets_min": 14609 }, { "epoch": 2.2260127931769724, "grad_norm": 0.28134739630779465, "learning_rate": 2.7232984027160126e-05, "loss": 1.037, "loss_nan_ranks": 0, "loss_rank_avg": 0.22468724846839905, "step": 523, "valid_targets_mean": 12362.7, "valid_targets_min": 10008 }, { "epoch": 2.230277185501066, "grad_norm": 0.3786459000817747, "learning_rate": 2.7177532074414822e-05, "loss": 1.0744, "loss_nan_ranks": 0, "loss_rank_avg": 0.29006755352020264, "step": 524, "valid_targets_mean": 16111.7, "valid_targets_min": 14958 }, { "epoch": 2.23454157782516, "grad_norm": 0.31526672316574644, "learning_rate": 2.712201671651094e-05, "loss": 1.0374, "loss_nan_ranks": 0, "loss_rank_avg": 0.3149791359901428, "step": 525, "valid_targets_mean": 16096.5, "valid_targets_min": 13688 }, { "epoch": 2.2388059701492535, "grad_norm": 0.3251796622007667, "learning_rate": 2.7066438443862205e-05, "loss": 1.0949, "loss_nan_ranks": 0, "loss_rank_avg": 0.26117759943008423, "step": 526, "valid_targets_mean": 13684.5, "valid_targets_min": 11557 }, { "epoch": 2.2430703624733477, "grad_norm": 0.3571788387924515, "learning_rate": 2.701079774743808e-05, "loss": 1.0497, "loss_nan_ranks": 0, "loss_rank_avg": 0.31474095582962036, "step": 527, "valid_targets_mean": 16176.9, "valid_targets_min": 15185 }, { "epoch": 2.2473347547974414, "grad_norm": 0.31126045337404046, "learning_rate": 2.6955095118759496e-05, "loss": 1.1136, "loss_nan_ranks": 0, "loss_rank_avg": 0.2477262169122696, "step": 528, "valid_targets_mean": 13108.9, "valid_targets_min": 2016 }, { "epoch": 2.251599147121535, "grad_norm": 0.3704432931191125, "learning_rate": 2.689933104989447e-05, "loss": 1.0356, "loss_nan_ranks": 0, "loss_rank_avg": 0.2543630599975586, "step": 529, "valid_targets_mean": 15346.7, "valid_targets_min": 14049 }, { "epoch": 2.2558635394456292, "grad_norm": 0.2890683538315524, "learning_rate": 2.6843506033453777e-05, "loss": 1.0919, "loss_nan_ranks": 0, "loss_rank_avg": 0.3212983012199402, "step": 530, "valid_targets_mean": 15995.2, "valid_targets_min": 13688 }, { "epoch": 2.260127931769723, "grad_norm": 0.3612846459506985, "learning_rate": 2.6787620562586587e-05, "loss": 1.048, "loss_nan_ranks": 0, "loss_rank_avg": 0.172796368598938, "step": 531, "valid_targets_mean": 9370.6, "valid_targets_min": 3012 }, { "epoch": 2.2643923240938166, "grad_norm": 0.2753181517426568, "learning_rate": 2.673167513097613e-05, "loss": 0.9943, "loss_nan_ranks": 0, "loss_rank_avg": 0.23673027753829956, "step": 532, "valid_targets_mean": 16198.4, "valid_targets_min": 15665 }, { "epoch": 2.2686567164179103, "grad_norm": 0.3283853477750083, "learning_rate": 2.6675670232835297e-05, "loss": 1.0375, "loss_nan_ranks": 0, "loss_rank_avg": 0.29759296774864197, "step": 533, "valid_targets_mean": 16011.2, "valid_targets_min": 13427 }, { "epoch": 2.272921108742004, "grad_norm": 0.31579501674451577, "learning_rate": 2.661960636290231e-05, "loss": 1.052, "loss_nan_ranks": 0, "loss_rank_avg": 0.18113857507705688, "step": 534, "valid_targets_mean": 10492.3, "valid_targets_min": 5775 }, { "epoch": 2.277185501066098, "grad_norm": 0.32463975391375466, "learning_rate": 2.6563484016436346e-05, "loss": 1.056, "loss_nan_ranks": 0, "loss_rank_avg": 0.27056264877319336, "step": 535, "valid_targets_mean": 16125.0, "valid_targets_min": 15091 }, { "epoch": 2.281449893390192, "grad_norm": 0.30961628810230585, "learning_rate": 2.6507303689213143e-05, "loss": 1.0926, "loss_nan_ranks": 0, "loss_rank_avg": 0.29040077328681946, "step": 536, "valid_targets_mean": 16207.7, "valid_targets_min": 15562 }, { "epoch": 2.2857142857142856, "grad_norm": 0.30310963051771506, "learning_rate": 2.6451065877520634e-05, "loss": 1.0289, "loss_nan_ranks": 0, "loss_rank_avg": 0.2182932049036026, "step": 537, "valid_targets_mean": 13124.1, "valid_targets_min": 10613 }, { "epoch": 2.2899786780383797, "grad_norm": 0.2783552318907119, "learning_rate": 2.639477107815455e-05, "loss": 1.0857, "loss_nan_ranks": 0, "loss_rank_avg": 0.29935818910598755, "step": 538, "valid_targets_mean": 16085.9, "valid_targets_min": 15042 }, { "epoch": 2.2942430703624734, "grad_norm": 0.3031273792078499, "learning_rate": 2.633841978841406e-05, "loss": 1.0427, "loss_nan_ranks": 0, "loss_rank_avg": 0.3005887567996979, "step": 539, "valid_targets_mean": 16127.8, "valid_targets_min": 14446 }, { "epoch": 2.298507462686567, "grad_norm": 0.26682988538100505, "learning_rate": 2.6282012506097347e-05, "loss": 0.9944, "loss_nan_ranks": 0, "loss_rank_avg": 0.2365766316652298, "step": 540, "valid_targets_mean": 14421.1, "valid_targets_min": 12694 }, { "epoch": 2.302771855010661, "grad_norm": 0.2989830647187291, "learning_rate": 2.622554972949724e-05, "loss": 1.07, "loss_nan_ranks": 0, "loss_rank_avg": 0.2973644733428955, "step": 541, "valid_targets_mean": 16063.4, "valid_targets_min": 14259 }, { "epoch": 2.307036247334755, "grad_norm": 0.3320158283938759, "learning_rate": 2.6169031957396778e-05, "loss": 1.0506, "loss_nan_ranks": 0, "loss_rank_avg": 0.21213622391223907, "step": 542, "valid_targets_mean": 11104.2, "valid_targets_min": 2564 }, { "epoch": 2.3113006396588487, "grad_norm": 0.24704517072991675, "learning_rate": 2.611245968906482e-05, "loss": 1.0956, "loss_nan_ranks": 0, "loss_rank_avg": 0.28201478719711304, "step": 543, "valid_targets_mean": 15902.0, "valid_targets_min": 13609 }, { "epoch": 2.3155650319829424, "grad_norm": 0.29276197236011303, "learning_rate": 2.605583342425165e-05, "loss": 0.9868, "loss_nan_ranks": 0, "loss_rank_avg": 0.27429062128067017, "step": 544, "valid_targets_mean": 16183.0, "valid_targets_min": 15463 }, { "epoch": 2.319829424307036, "grad_norm": 0.2729037664782278, "learning_rate": 2.5999153663184546e-05, "loss": 1.0622, "loss_nan_ranks": 0, "loss_rank_avg": 0.17813602089881897, "step": 545, "valid_targets_mean": 9009.8, "valid_targets_min": 1284 }, { "epoch": 2.3240938166311302, "grad_norm": 0.2798009780695239, "learning_rate": 2.594242090656335e-05, "loss": 1.0542, "loss_nan_ranks": 0, "loss_rank_avg": 0.2451293170452118, "step": 546, "valid_targets_mean": 16194.9, "valid_targets_min": 14875 }, { "epoch": 2.328358208955224, "grad_norm": 0.3141975194679562, "learning_rate": 2.5885635655556075e-05, "loss": 1.0407, "loss_nan_ranks": 0, "loss_rank_avg": 0.28895652294158936, "step": 547, "valid_targets_mean": 16138.1, "valid_targets_min": 14550 }, { "epoch": 2.3326226012793176, "grad_norm": 0.26163605590717465, "learning_rate": 2.5828798411794443e-05, "loss": 1.0783, "loss_nan_ranks": 0, "loss_rank_avg": 0.22583462297916412, "step": 548, "valid_targets_mean": 12317.6, "valid_targets_min": 8720 }, { "epoch": 2.3368869936034113, "grad_norm": 0.31763720417289987, "learning_rate": 2.5771909677369484e-05, "loss": 1.0127, "loss_nan_ranks": 0, "loss_rank_avg": 0.2829974889755249, "step": 549, "valid_targets_mean": 16203.8, "valid_targets_min": 15058 }, { "epoch": 2.3411513859275055, "grad_norm": 0.3056235028373722, "learning_rate": 2.571496995482709e-05, "loss": 1.0358, "loss_nan_ranks": 0, "loss_rank_avg": 0.2864728569984436, "step": 550, "valid_targets_mean": 16102.8, "valid_targets_min": 14826 }, { "epoch": 2.345415778251599, "grad_norm": 0.2863509643615744, "learning_rate": 2.565797974716357e-05, "loss": 0.9894, "loss_nan_ranks": 0, "loss_rank_avg": 0.2198735773563385, "step": 551, "valid_targets_mean": 13737.8, "valid_targets_min": 11566 }, { "epoch": 2.349680170575693, "grad_norm": 0.3540898427883017, "learning_rate": 2.5600939557821205e-05, "loss": 1.0639, "loss_nan_ranks": 0, "loss_rank_avg": 0.31675875186920166, "step": 552, "valid_targets_mean": 16058.5, "valid_targets_min": 14649 }, { "epoch": 2.3539445628997866, "grad_norm": 0.30587327840171247, "learning_rate": 2.5543849890683813e-05, "loss": 1.041, "loss_nan_ranks": 0, "loss_rank_avg": 0.259478896856308, "step": 553, "valid_targets_mean": 13189.4, "valid_targets_min": 3578 }, { "epoch": 2.3582089552238807, "grad_norm": 0.26927479797465537, "learning_rate": 2.548671125007229e-05, "loss": 1.0295, "loss_nan_ranks": 0, "loss_rank_avg": 0.24672149121761322, "step": 554, "valid_targets_mean": 15325.0, "valid_targets_min": 13465 }, { "epoch": 2.3624733475479744, "grad_norm": 0.35359364585088576, "learning_rate": 2.5429524140740155e-05, "loss": 1.0446, "loss_nan_ranks": 0, "loss_rank_avg": 0.29348552227020264, "step": 555, "valid_targets_mean": 16192.3, "valid_targets_min": 15636 }, { "epoch": 2.366737739872068, "grad_norm": 0.2755949486919777, "learning_rate": 2.537228906786908e-05, "loss": 1.0759, "loss_nan_ranks": 0, "loss_rank_avg": 0.16546456515789032, "step": 556, "valid_targets_mean": 8583.2, "valid_targets_min": 1277 }, { "epoch": 2.3710021321961623, "grad_norm": 0.3417479182549748, "learning_rate": 2.5315006537064473e-05, "loss": 1.0346, "loss_nan_ranks": 0, "loss_rank_avg": 0.27253687381744385, "step": 557, "valid_targets_mean": 16119.8, "valid_targets_min": 15222 }, { "epoch": 2.375266524520256, "grad_norm": 0.26979098561187287, "learning_rate": 2.5257677054350927e-05, "loss": 1.0451, "loss_nan_ranks": 0, "loss_rank_avg": 0.3248399794101715, "step": 558, "valid_targets_mean": 16112.5, "valid_targets_min": 13427 }, { "epoch": 2.3795309168443497, "grad_norm": 0.2908440350974731, "learning_rate": 2.5200301126167857e-05, "loss": 1.0183, "loss_nan_ranks": 0, "loss_rank_avg": 0.1952691376209259, "step": 559, "valid_targets_mean": 11318.0, "valid_targets_min": 7978 }, { "epoch": 2.3837953091684434, "grad_norm": 0.3078098175009307, "learning_rate": 2.514287925936492e-05, "loss": 1.0268, "loss_nan_ranks": 0, "loss_rank_avg": 0.2714043855667114, "step": 560, "valid_targets_mean": 16124.8, "valid_targets_min": 14702 }, { "epoch": 2.388059701492537, "grad_norm": 0.28078401099422134, "learning_rate": 2.5085411961197626e-05, "loss": 1.0382, "loss_nan_ranks": 0, "loss_rank_avg": 0.3055068850517273, "step": 561, "valid_targets_mean": 16119.8, "valid_targets_min": 15507 }, { "epoch": 2.3923240938166312, "grad_norm": 0.29354290379337106, "learning_rate": 2.502789973932278e-05, "loss": 1.0541, "loss_nan_ranks": 0, "loss_rank_avg": 0.23758560419082642, "step": 562, "valid_targets_mean": 13217.6, "valid_targets_min": 9927 }, { "epoch": 2.396588486140725, "grad_norm": 0.3126625252447049, "learning_rate": 2.4970343101794073e-05, "loss": 1.0578, "loss_nan_ranks": 0, "loss_rank_avg": 0.29068368673324585, "step": 563, "valid_targets_mean": 16146.4, "valid_targets_min": 15545 }, { "epoch": 2.4008528784648187, "grad_norm": 0.3034641047561609, "learning_rate": 2.4912742557057538e-05, "loss": 1.0254, "loss_nan_ranks": 0, "loss_rank_avg": 0.2866404056549072, "step": 564, "valid_targets_mean": 16232.5, "valid_targets_min": 15938 }, { "epoch": 2.405117270788913, "grad_norm": 0.3849857823998909, "learning_rate": 2.485509861394708e-05, "loss": 1.0408, "loss_nan_ranks": 0, "loss_rank_avg": 0.25188344717025757, "step": 565, "valid_targets_mean": 15403.8, "valid_targets_min": 13098 }, { "epoch": 2.4093816631130065, "grad_norm": 0.2917300569778498, "learning_rate": 2.4797411781679975e-05, "loss": 1.0334, "loss_nan_ranks": 0, "loss_rank_avg": 0.29883241653442383, "step": 566, "valid_targets_mean": 16083.7, "valid_targets_min": 13883 }, { "epoch": 2.4136460554371, "grad_norm": 0.3346796905024958, "learning_rate": 2.473968256985238e-05, "loss": 1.0992, "loss_nan_ranks": 0, "loss_rank_avg": 0.2282615453004837, "step": 567, "valid_targets_mean": 11219.6, "valid_targets_min": 2899 }, { "epoch": 2.417910447761194, "grad_norm": 0.26051979425264027, "learning_rate": 2.4681911488434825e-05, "loss": 0.9763, "loss_nan_ranks": 0, "loss_rank_avg": 0.23321135342121124, "step": 568, "valid_targets_mean": 16104.4, "valid_targets_min": 14771 }, { "epoch": 2.4221748400852876, "grad_norm": 0.38129667322859684, "learning_rate": 2.4624099047767702e-05, "loss": 1.0098, "loss_nan_ranks": 0, "loss_rank_avg": 0.30090954899787903, "step": 569, "valid_targets_mean": 16132.6, "valid_targets_min": 13886 }, { "epoch": 2.4264392324093818, "grad_norm": 0.2604040577862216, "learning_rate": 2.4566245758556787e-05, "loss": 1.0388, "loss_nan_ranks": 0, "loss_rank_avg": 0.18206843733787537, "step": 570, "valid_targets_mean": 9096.2, "valid_targets_min": 2044 }, { "epoch": 2.4307036247334755, "grad_norm": 0.32823939336311225, "learning_rate": 2.4508352131868664e-05, "loss": 1.0308, "loss_nan_ranks": 0, "loss_rank_avg": 0.2432955950498581, "step": 571, "valid_targets_mean": 16176.6, "valid_targets_min": 14769 }, { "epoch": 2.434968017057569, "grad_norm": 0.2935285323392409, "learning_rate": 2.445041867912629e-05, "loss": 1.0949, "loss_nan_ranks": 0, "loss_rank_avg": 0.31023919582366943, "step": 572, "valid_targets_mean": 16152.8, "valid_targets_min": 15180 }, { "epoch": 2.4392324093816633, "grad_norm": 0.29705761968405225, "learning_rate": 2.439244591210443e-05, "loss": 1.0378, "loss_nan_ranks": 0, "loss_rank_avg": 0.22531543672084808, "step": 573, "valid_targets_mean": 12206.7, "valid_targets_min": 8908 }, { "epoch": 2.443496801705757, "grad_norm": 0.33119219679210354, "learning_rate": 2.4334434342925133e-05, "loss": 1.0412, "loss_nan_ranks": 0, "loss_rank_avg": 0.2790338099002838, "step": 574, "valid_targets_mean": 16198.4, "valid_targets_min": 15622 }, { "epoch": 2.4477611940298507, "grad_norm": 0.2628526445996163, "learning_rate": 2.4276384484053227e-05, "loss": 1.103, "loss_nan_ranks": 0, "loss_rank_avg": 0.30810728669166565, "step": 575, "valid_targets_mean": 16086.4, "valid_targets_min": 15153 }, { "epoch": 2.4520255863539444, "grad_norm": 0.3636611140247231, "learning_rate": 2.4218296848291795e-05, "loss": 1.0571, "loss_nan_ranks": 0, "loss_rank_avg": 0.2677125036716461, "step": 576, "valid_targets_mean": 14360.7, "valid_targets_min": 12313 }, { "epoch": 2.4562899786780386, "grad_norm": 0.27541640733521017, "learning_rate": 2.4160171948777603e-05, "loss": 1.0158, "loss_nan_ranks": 0, "loss_rank_avg": 0.28583091497421265, "step": 577, "valid_targets_mean": 16193.1, "valid_targets_min": 15374 }, { "epoch": 2.4605543710021323, "grad_norm": 0.28867613165733325, "learning_rate": 2.410201029897665e-05, "loss": 1.0913, "loss_nan_ranks": 0, "loss_rank_avg": 0.2489250898361206, "step": 578, "valid_targets_mean": 12682.9, "valid_targets_min": 1240 }, { "epoch": 2.464818763326226, "grad_norm": 0.2920196335006851, "learning_rate": 2.4043812412679532e-05, "loss": 1.0545, "loss_nan_ranks": 0, "loss_rank_avg": 0.2607208490371704, "step": 579, "valid_targets_mean": 14894.9, "valid_targets_min": 13767 }, { "epoch": 2.4690831556503197, "grad_norm": 0.2521489707227015, "learning_rate": 2.3985578803996985e-05, "loss": 1.0264, "loss_nan_ranks": 0, "loss_rank_avg": 0.2972157299518585, "step": 580, "valid_targets_mean": 16157.9, "valid_targets_min": 14275 }, { "epoch": 2.473347547974414, "grad_norm": 0.299043517373016, "learning_rate": 2.392730998735529e-05, "loss": 1.0499, "loss_nan_ranks": 0, "loss_rank_avg": 0.17381398379802704, "step": 581, "valid_targets_mean": 10229.2, "valid_targets_min": 1759 }, { "epoch": 2.4776119402985075, "grad_norm": 0.27413297037766, "learning_rate": 2.3869006477491755e-05, "loss": 1.0934, "loss_nan_ranks": 0, "loss_rank_avg": 0.281957745552063, "step": 582, "valid_targets_mean": 15959.8, "valid_targets_min": 13835 }, { "epoch": 2.481876332622601, "grad_norm": 0.27270978121053446, "learning_rate": 2.381066878945017e-05, "loss": 1.0005, "loss_nan_ranks": 0, "loss_rank_avg": 0.29876717925071716, "step": 583, "valid_targets_mean": 16156.6, "valid_targets_min": 15054 }, { "epoch": 2.486140724946695, "grad_norm": 0.2651931261771279, "learning_rate": 2.3752297438576257e-05, "loss": 1.0479, "loss_nan_ranks": 0, "loss_rank_avg": 0.18752694129943848, "step": 584, "valid_targets_mean": 10441.4, "valid_targets_min": 7074 }, { "epoch": 2.490405117270789, "grad_norm": 0.23564039562850964, "learning_rate": 2.3693892940513074e-05, "loss": 1.0593, "loss_nan_ranks": 0, "loss_rank_avg": 0.2778427004814148, "step": 585, "valid_targets_mean": 16191.9, "valid_targets_min": 15389 }, { "epoch": 2.4946695095948828, "grad_norm": 0.2414011698937567, "learning_rate": 2.3635455811196536e-05, "loss": 1.0473, "loss_nan_ranks": 0, "loss_rank_avg": 0.3203165531158447, "step": 586, "valid_targets_mean": 16169.7, "valid_targets_min": 15678 }, { "epoch": 2.4989339019189765, "grad_norm": 0.2670451356339994, "learning_rate": 2.3576986566850796e-05, "loss": 1.058, "loss_nan_ranks": 0, "loss_rank_avg": 0.2431665062904358, "step": 587, "valid_targets_mean": 13982.8, "valid_targets_min": 11677 }, { "epoch": 2.50319829424307, "grad_norm": 0.2555070879578905, "learning_rate": 2.351848572398371e-05, "loss": 0.9892, "loss_nan_ranks": 0, "loss_rank_avg": 0.2670406103134155, "step": 588, "valid_targets_mean": 16228.9, "valid_targets_min": 15674 }, { "epoch": 2.5074626865671643, "grad_norm": 0.272956121938524, "learning_rate": 2.3459953799382276e-05, "loss": 1.0058, "loss_nan_ranks": 0, "loss_rank_avg": 0.28342461585998535, "step": 589, "valid_targets_mean": 16192.3, "valid_targets_min": 15222 }, { "epoch": 2.511727078891258, "grad_norm": 0.2778901562741278, "learning_rate": 2.3401391310108054e-05, "loss": 1.0117, "loss_nan_ranks": 0, "loss_rank_avg": 0.25146615505218506, "step": 590, "valid_targets_mean": 15235.8, "valid_targets_min": 10805 }, { "epoch": 2.5159914712153517, "grad_norm": 0.28858163538064635, "learning_rate": 2.3342798773492602e-05, "loss": 1.0093, "loss_nan_ranks": 0, "loss_rank_avg": 0.27801817655563354, "step": 591, "valid_targets_mean": 16150.8, "valid_targets_min": 14997 }, { "epoch": 2.520255863539446, "grad_norm": 0.29292018521548724, "learning_rate": 2.328417670713294e-05, "loss": 1.0332, "loss_nan_ranks": 0, "loss_rank_avg": 0.2068709135055542, "step": 592, "valid_targets_mean": 10595.8, "valid_targets_min": 1383 }, { "epoch": 2.5245202558635396, "grad_norm": 0.2578187511591653, "learning_rate": 2.3225525628886918e-05, "loss": 1.0435, "loss_nan_ranks": 0, "loss_rank_avg": 0.25130176544189453, "step": 593, "valid_targets_mean": 16091.4, "valid_targets_min": 15167 }, { "epoch": 2.5287846481876333, "grad_norm": 0.27303874490141483, "learning_rate": 2.3166846056868687e-05, "loss": 1.0582, "loss_nan_ranks": 0, "loss_rank_avg": 0.3334190249443054, "step": 594, "valid_targets_mean": 15568.4, "valid_targets_min": 2605 }, { "epoch": 2.533049040511727, "grad_norm": 0.25870877325527797, "learning_rate": 2.31081385094441e-05, "loss": 1.0387, "loss_nan_ranks": 0, "loss_rank_avg": 0.15699400007724762, "step": 595, "valid_targets_mean": 8344.5, "valid_targets_min": 717 }, { "epoch": 2.5373134328358207, "grad_norm": 0.24477176242002976, "learning_rate": 2.304940350522615e-05, "loss": 1.0552, "loss_nan_ranks": 0, "loss_rank_avg": 0.2562256157398224, "step": 596, "valid_targets_mean": 16130.5, "valid_targets_min": 14384 }, { "epoch": 2.541577825159915, "grad_norm": 0.2692001623707129, "learning_rate": 2.299064156307037e-05, "loss": 1.0373, "loss_nan_ranks": 0, "loss_rank_avg": 0.30675721168518066, "step": 597, "valid_targets_mean": 16067.1, "valid_targets_min": 14103 }, { "epoch": 2.5458422174840085, "grad_norm": 0.2500888984021968, "learning_rate": 2.2931853202070275e-05, "loss": 1.0624, "loss_nan_ranks": 0, "loss_rank_avg": 0.22056426107883453, "step": 598, "valid_targets_mean": 13112.9, "valid_targets_min": 9219 }, { "epoch": 2.550106609808102, "grad_norm": 0.25852515386306235, "learning_rate": 2.2873038941552724e-05, "loss": 0.9908, "loss_nan_ranks": 0, "loss_rank_avg": 0.2784058153629303, "step": 599, "valid_targets_mean": 16142.3, "valid_targets_min": 13573 }, { "epoch": 2.5543710021321964, "grad_norm": 0.3256240388119314, "learning_rate": 2.2814199301073412e-05, "loss": 1.0716, "loss_nan_ranks": 0, "loss_rank_avg": 0.3061351776123047, "step": 600, "valid_targets_mean": 16099.6, "valid_targets_min": 13080 }, { "epoch": 2.55863539445629, "grad_norm": 0.23178965477142577, "learning_rate": 2.27553348004122e-05, "loss": 1.0725, "loss_nan_ranks": 0, "loss_rank_avg": 0.2541932761669159, "step": 601, "valid_targets_mean": 14181.0, "valid_targets_min": 11734 }, { "epoch": 2.5628997867803838, "grad_norm": 0.29686777150066457, "learning_rate": 2.2696445959568577e-05, "loss": 1.0465, "loss_nan_ranks": 0, "loss_rank_avg": 0.3028012216091156, "step": 602, "valid_targets_mean": 16122.7, "valid_targets_min": 15319 }, { "epoch": 2.5671641791044775, "grad_norm": 0.23765180354060697, "learning_rate": 2.2637533298757064e-05, "loss": 1.0579, "loss_nan_ranks": 0, "loss_rank_avg": 0.24337582290172577, "step": 603, "valid_targets_mean": 13220.1, "valid_targets_min": 2036 }, { "epoch": 2.571428571428571, "grad_norm": 0.2782471466241931, "learning_rate": 2.2578597338402567e-05, "loss": 1.0428, "loss_nan_ranks": 0, "loss_rank_avg": 0.2604105472564697, "step": 604, "valid_targets_mean": 16067.2, "valid_targets_min": 14862 }, { "epoch": 2.5756929637526653, "grad_norm": 0.23032037185955748, "learning_rate": 2.2519638599135844e-05, "loss": 1.0983, "loss_nan_ranks": 0, "loss_rank_avg": 0.28923940658569336, "step": 605, "valid_targets_mean": 16087.8, "valid_targets_min": 14331 }, { "epoch": 2.579957356076759, "grad_norm": 0.2684594483983001, "learning_rate": 2.2460657601788875e-05, "loss": 1.0366, "loss_nan_ranks": 0, "loss_rank_avg": 0.18617041409015656, "step": 606, "valid_targets_mean": 9125.1, "valid_targets_min": 1895 }, { "epoch": 2.5842217484008527, "grad_norm": 0.232317126831534, "learning_rate": 2.2401654867390256e-05, "loss": 1.032, "loss_nan_ranks": 0, "loss_rank_avg": 0.23461005091667175, "step": 607, "valid_targets_mean": 16230.6, "valid_targets_min": 15761 }, { "epoch": 2.588486140724947, "grad_norm": 0.2813001202797154, "learning_rate": 2.2342630917160605e-05, "loss": 1.0525, "loss_nan_ranks": 0, "loss_rank_avg": 0.31943753361701965, "step": 608, "valid_targets_mean": 16008.2, "valid_targets_min": 12492 }, { "epoch": 2.5927505330490406, "grad_norm": 0.2602911096217211, "learning_rate": 2.2283586272507975e-05, "loss": 1.0367, "loss_nan_ranks": 0, "loss_rank_avg": 0.20762485265731812, "step": 609, "valid_targets_mean": 12059.9, "valid_targets_min": 7841 }, { "epoch": 2.5970149253731343, "grad_norm": 0.2631319658641279, "learning_rate": 2.2224521455023193e-05, "loss": 1.0351, "loss_nan_ranks": 0, "loss_rank_avg": 0.27428776025772095, "step": 610, "valid_targets_mean": 16181.1, "valid_targets_min": 15563 }, { "epoch": 2.6012793176972284, "grad_norm": 0.3101522318161875, "learning_rate": 2.216543698647534e-05, "loss": 1.0351, "loss_nan_ranks": 0, "loss_rank_avg": 0.3216131031513214, "step": 611, "valid_targets_mean": 16136.7, "valid_targets_min": 14943 }, { "epoch": 2.605543710021322, "grad_norm": 0.23841926854456202, "learning_rate": 2.210633338880704e-05, "loss": 1.0672, "loss_nan_ranks": 0, "loss_rank_avg": 0.23634910583496094, "step": 612, "valid_targets_mean": 13411.0, "valid_targets_min": 11613 }, { "epoch": 2.609808102345416, "grad_norm": 0.3422990747125992, "learning_rate": 2.204721118412994e-05, "loss": 1.063, "loss_nan_ranks": 0, "loss_rank_avg": 0.3301277160644531, "step": 613, "valid_targets_mean": 16006.3, "valid_targets_min": 15028 }, { "epoch": 2.6140724946695095, "grad_norm": 0.2443735209147375, "learning_rate": 2.1988070894720037e-05, "loss": 1.0509, "loss_nan_ranks": 0, "loss_rank_avg": 0.30868402123451233, "step": 614, "valid_targets_mean": 16166.3, "valid_targets_min": 15389 }, { "epoch": 2.6183368869936032, "grad_norm": 0.2769791836864251, "learning_rate": 2.192891304301309e-05, "loss": 1.071, "loss_nan_ranks": 0, "loss_rank_avg": 0.24009822309017181, "step": 615, "valid_targets_mean": 14385.6, "valid_targets_min": 12637 }, { "epoch": 2.6226012793176974, "grad_norm": 0.2463937911425666, "learning_rate": 2.18697381516e-05, "loss": 1.0466, "loss_nan_ranks": 0, "loss_rank_avg": 0.29944130778312683, "step": 616, "valid_targets_mean": 16184.0, "valid_targets_min": 15614 }, { "epoch": 2.626865671641791, "grad_norm": 0.2625493187358278, "learning_rate": 2.181054674322221e-05, "loss": 1.0306, "loss_nan_ranks": 0, "loss_rank_avg": 0.19397038221359253, "step": 617, "valid_targets_mean": 10109.2, "valid_targets_min": 1733 }, { "epoch": 2.631130063965885, "grad_norm": 0.26131036300015253, "learning_rate": 2.1751339340767043e-05, "loss": 0.9939, "loss_nan_ranks": 0, "loss_rank_avg": 0.26601845026016235, "step": 618, "valid_targets_mean": 16138.7, "valid_targets_min": 14734 }, { "epoch": 2.635394456289979, "grad_norm": 0.27251382003765656, "learning_rate": 2.169211646726313e-05, "loss": 1.0788, "loss_nan_ranks": 0, "loss_rank_avg": 0.3152587115764618, "step": 619, "valid_targets_mean": 16145.5, "valid_targets_min": 15576 }, { "epoch": 2.6396588486140726, "grad_norm": 0.28166028840154184, "learning_rate": 2.163287864587576e-05, "loss": 1.0437, "loss_nan_ranks": 0, "loss_rank_avg": 0.15223997831344604, "step": 620, "valid_targets_mean": 8127.2, "valid_targets_min": 2379 }, { "epoch": 2.6439232409381663, "grad_norm": 0.2702402182533795, "learning_rate": 2.157362639990229e-05, "loss": 0.9963, "loss_nan_ranks": 0, "loss_rank_avg": 0.25352510809898376, "step": 621, "valid_targets_mean": 16050.8, "valid_targets_min": 14159 }, { "epoch": 2.64818763326226, "grad_norm": 0.2770114802483943, "learning_rate": 2.151436025276747e-05, "loss": 1.0471, "loss_nan_ranks": 0, "loss_rank_avg": 0.3116888403892517, "step": 622, "valid_targets_mean": 16133.9, "valid_targets_min": 13934 }, { "epoch": 2.6524520255863537, "grad_norm": 0.2764848889031583, "learning_rate": 2.145508072801888e-05, "loss": 1.0769, "loss_nan_ranks": 0, "loss_rank_avg": 0.2531043589115143, "step": 623, "valid_targets_mean": 13166.8, "valid_targets_min": 9709 }, { "epoch": 2.656716417910448, "grad_norm": 0.2516592344298666, "learning_rate": 2.1395788349322256e-05, "loss": 1.0671, "loss_nan_ranks": 0, "loss_rank_avg": 0.27907490730285645, "step": 624, "valid_targets_mean": 16132.4, "valid_targets_min": 14394 }, { "epoch": 2.6609808102345416, "grad_norm": 0.31791207712989383, "learning_rate": 2.133648364045689e-05, "loss": 1.0399, "loss_nan_ranks": 0, "loss_rank_avg": 0.3172053098678589, "step": 625, "valid_targets_mean": 16104.8, "valid_targets_min": 14688 }, { "epoch": 2.6652452025586353, "grad_norm": 0.23359854517165743, "learning_rate": 2.1277167125310996e-05, "loss": 1.0454, "loss_nan_ranks": 0, "loss_rank_avg": 0.2476862370967865, "step": 626, "valid_targets_mean": 15302.1, "valid_targets_min": 13615 }, { "epoch": 2.6695095948827294, "grad_norm": 0.2967447305403079, "learning_rate": 2.1217839327877098e-05, "loss": 1.0464, "loss_nan_ranks": 0, "loss_rank_avg": 0.2926100194454193, "step": 627, "valid_targets_mean": 16166.6, "valid_targets_min": 15148 }, { "epoch": 2.673773987206823, "grad_norm": 0.24300960387242868, "learning_rate": 2.1158500772247352e-05, "loss": 1.0539, "loss_nan_ranks": 0, "loss_rank_avg": 0.26239803433418274, "step": 628, "valid_targets_mean": 13016.6, "valid_targets_min": 1533 }, { "epoch": 2.678038379530917, "grad_norm": 0.2794531726229126, "learning_rate": 2.1099151982608985e-05, "loss": 1.0742, "loss_nan_ranks": 0, "loss_rank_avg": 0.2824642062187195, "step": 629, "valid_targets_mean": 15976.4, "valid_targets_min": 14810 }, { "epoch": 2.6823027718550105, "grad_norm": 0.2583131390220038, "learning_rate": 2.1039793483239607e-05, "loss": 1.0682, "loss_nan_ranks": 0, "loss_rank_avg": 0.3015969395637512, "step": 630, "valid_targets_mean": 16166.0, "valid_targets_min": 15282 }, { "epoch": 2.6865671641791042, "grad_norm": 0.2406239146234153, "learning_rate": 2.0980425798502616e-05, "loss": 1.021, "loss_nan_ranks": 0, "loss_rank_avg": 0.1628062129020691, "step": 631, "valid_targets_mean": 8038.8, "valid_targets_min": 1420 }, { "epoch": 2.6908315565031984, "grad_norm": 0.2634618094704433, "learning_rate": 2.092104945284255e-05, "loss": 1.0157, "loss_nan_ranks": 0, "loss_rank_avg": 0.24490898847579956, "step": 632, "valid_targets_mean": 15944.4, "valid_targets_min": 14420 }, { "epoch": 2.695095948827292, "grad_norm": 0.2513490052749398, "learning_rate": 2.0861664970780434e-05, "loss": 1.0376, "loss_nan_ranks": 0, "loss_rank_avg": 0.3211136758327484, "step": 633, "valid_targets_mean": 16005.0, "valid_targets_min": 12680 }, { "epoch": 2.699360341151386, "grad_norm": 0.23777199420967957, "learning_rate": 2.08022728769092e-05, "loss": 1.0514, "loss_nan_ranks": 0, "loss_rank_avg": 0.19891712069511414, "step": 634, "valid_targets_mean": 10561.3, "valid_targets_min": 6389 }, { "epoch": 2.70362473347548, "grad_norm": 0.22784442937559377, "learning_rate": 2.0742873695889005e-05, "loss": 1.0733, "loss_nan_ranks": 0, "loss_rank_avg": 0.2798650860786438, "step": 635, "valid_targets_mean": 16137.4, "valid_targets_min": 15187 }, { "epoch": 2.7078891257995736, "grad_norm": 0.2578640629204441, "learning_rate": 2.0683467952442626e-05, "loss": 1.0577, "loss_nan_ranks": 0, "loss_rank_avg": 0.3054782748222351, "step": 636, "valid_targets_mean": 16199.2, "valid_targets_min": 15333 }, { "epoch": 2.7121535181236673, "grad_norm": 0.23590469762852542, "learning_rate": 2.0624056171350785e-05, "loss": 1.0577, "loss_nan_ranks": 0, "loss_rank_avg": 0.2311520129442215, "step": 637, "valid_targets_mean": 13013.5, "valid_targets_min": 10913 }, { "epoch": 2.716417910447761, "grad_norm": 0.24606557103992302, "learning_rate": 2.0564638877447566e-05, "loss": 0.9992, "loss_nan_ranks": 0, "loss_rank_avg": 0.2815939784049988, "step": 638, "valid_targets_mean": 16089.1, "valid_targets_min": 15225 }, { "epoch": 2.7206823027718547, "grad_norm": 0.2648957939437123, "learning_rate": 2.0505216595615742e-05, "loss": 1.1097, "loss_nan_ranks": 0, "loss_rank_avg": 0.32964062690734863, "step": 639, "valid_targets_mean": 16108.9, "valid_targets_min": 14793 }, { "epoch": 2.724946695095949, "grad_norm": 0.21696403842331907, "learning_rate": 2.044578985078215e-05, "loss": 1.0646, "loss_nan_ranks": 0, "loss_rank_avg": 0.2445964217185974, "step": 640, "valid_targets_mean": 15094.3, "valid_targets_min": 13211 }, { "epoch": 2.7292110874200426, "grad_norm": 0.2686175393069833, "learning_rate": 2.0386359167913046e-05, "loss": 1.0648, "loss_nan_ranks": 0, "loss_rank_avg": 0.3203163743019104, "step": 641, "valid_targets_mean": 16148.0, "valid_targets_min": 15288 }, { "epoch": 2.7334754797441363, "grad_norm": 0.23381083889228563, "learning_rate": 2.0326925072009485e-05, "loss": 1.0857, "loss_nan_ranks": 0, "loss_rank_avg": 0.18711988627910614, "step": 642, "valid_targets_mean": 10481.8, "valid_targets_min": 1219 }, { "epoch": 2.7377398720682304, "grad_norm": 0.24796603748809626, "learning_rate": 2.0267488088102657e-05, "loss": 1.0849, "loss_nan_ranks": 0, "loss_rank_avg": 0.25230154395103455, "step": 643, "valid_targets_mean": 15958.4, "valid_targets_min": 15228 }, { "epoch": 2.742004264392324, "grad_norm": 0.25484572893188645, "learning_rate": 2.0208048741249288e-05, "loss": 0.9915, "loss_nan_ranks": 0, "loss_rank_avg": 0.29769226908683777, "step": 644, "valid_targets_mean": 16206.8, "valid_targets_min": 15398 }, { "epoch": 2.746268656716418, "grad_norm": 0.21276746285567366, "learning_rate": 2.014860755652695e-05, "loss": 1.0248, "loss_nan_ranks": 0, "loss_rank_avg": 0.1710774004459381, "step": 645, "valid_targets_mean": 9416.3, "valid_targets_min": 979 }, { "epoch": 2.750533049040512, "grad_norm": 0.2333199165638852, "learning_rate": 2.0089165059029477e-05, "loss": 1.0624, "loss_nan_ranks": 0, "loss_rank_avg": 0.24201640486717224, "step": 646, "valid_targets_mean": 16177.7, "valid_targets_min": 14460 }, { "epoch": 2.7547974413646057, "grad_norm": 0.2135880074160673, "learning_rate": 2.0029721773862277e-05, "loss": 1.0362, "loss_nan_ranks": 0, "loss_rank_avg": 0.30199944972991943, "step": 647, "valid_targets_mean": 15917.4, "valid_targets_min": 9299 }, { "epoch": 2.7590618336886994, "grad_norm": 0.2362137019123995, "learning_rate": 1.997027822613773e-05, "loss": 1.0104, "loss_nan_ranks": 0, "loss_rank_avg": 0.2068403959274292, "step": 648, "valid_targets_mean": 12600.8, "valid_targets_min": 9289 }, { "epoch": 2.763326226012793, "grad_norm": 0.21479351229165758, "learning_rate": 1.9910834940970533e-05, "loss": 1.0881, "loss_nan_ranks": 0, "loss_rank_avg": 0.30875372886657715, "step": 649, "valid_targets_mean": 16163.2, "valid_targets_min": 15488 }, { "epoch": 2.767590618336887, "grad_norm": 0.2549516060520758, "learning_rate": 1.985139244347305e-05, "loss": 1.0175, "loss_nan_ranks": 0, "loss_rank_avg": 0.28148266673088074, "step": 650, "valid_targets_mean": 16152.5, "valid_targets_min": 14851 }, { "epoch": 2.771855010660981, "grad_norm": 0.2291803277727466, "learning_rate": 1.979195125875072e-05, "loss": 1.0532, "loss_nan_ranks": 0, "loss_rank_avg": 0.24805381894111633, "step": 651, "valid_targets_mean": 14425.4, "valid_targets_min": 12081 }, { "epoch": 2.7761194029850746, "grad_norm": 0.2784673614966153, "learning_rate": 1.9732511911897353e-05, "loss": 1.0534, "loss_nan_ranks": 0, "loss_rank_avg": 0.29927659034729004, "step": 652, "valid_targets_mean": 16109.8, "valid_targets_min": 14956 }, { "epoch": 2.7803837953091683, "grad_norm": 0.2665693367529166, "learning_rate": 1.9673074927990525e-05, "loss": 1.054, "loss_nan_ranks": 0, "loss_rank_avg": 0.2553492784500122, "step": 653, "valid_targets_mean": 12686.2, "valid_targets_min": 1160 }, { "epoch": 2.7846481876332625, "grad_norm": 0.258366490540349, "learning_rate": 1.9613640832086957e-05, "loss": 1.0174, "loss_nan_ranks": 0, "loss_rank_avg": 0.2649986743927002, "step": 654, "valid_targets_mean": 16176.4, "valid_targets_min": 15720 }, { "epoch": 2.788912579957356, "grad_norm": 0.27182690784206887, "learning_rate": 1.9554210149217855e-05, "loss": 1.0149, "loss_nan_ranks": 0, "loss_rank_avg": 0.2867087125778198, "step": 655, "valid_targets_mean": 16022.2, "valid_targets_min": 13473 }, { "epoch": 2.79317697228145, "grad_norm": 0.26722859528629267, "learning_rate": 1.9494783404384265e-05, "loss": 1.0539, "loss_nan_ranks": 0, "loss_rank_avg": 0.20252707600593567, "step": 656, "valid_targets_mean": 9653.7, "valid_targets_min": 1158 }, { "epoch": 2.7974413646055436, "grad_norm": 0.2316912477336916, "learning_rate": 1.9435361122552437e-05, "loss": 0.9846, "loss_nan_ranks": 0, "loss_rank_avg": 0.24132490158081055, "step": 657, "valid_targets_mean": 16161.2, "valid_targets_min": 14851 }, { "epoch": 2.8017057569296373, "grad_norm": 0.25748752302717803, "learning_rate": 1.9375943828649215e-05, "loss": 1.0607, "loss_nan_ranks": 0, "loss_rank_avg": 0.29179710149765015, "step": 658, "valid_targets_mean": 16125.6, "valid_targets_min": 14877 }, { "epoch": 2.8059701492537314, "grad_norm": 0.25746042952829756, "learning_rate": 1.9316532047557378e-05, "loss": 1.0235, "loss_nan_ranks": 0, "loss_rank_avg": 0.19404509663581848, "step": 659, "valid_targets_mean": 11347.2, "valid_targets_min": 7388 }, { "epoch": 2.810234541577825, "grad_norm": 0.2302939992167745, "learning_rate": 1.9257126304110998e-05, "loss": 1.031, "loss_nan_ranks": 0, "loss_rank_avg": 0.27259528636932373, "step": 660, "valid_targets_mean": 16103.5, "valid_targets_min": 15242 }, { "epoch": 2.814498933901919, "grad_norm": 0.25198259548480473, "learning_rate": 1.919772712309081e-05, "loss": 1.0209, "loss_nan_ranks": 0, "loss_rank_avg": 0.2935293912887573, "step": 661, "valid_targets_mean": 16163.3, "valid_targets_min": 15198 }, { "epoch": 2.818763326226013, "grad_norm": 0.2200286922289353, "learning_rate": 1.9138335029219572e-05, "loss": 1.0536, "loss_nan_ranks": 0, "loss_rank_avg": 0.23220394551753998, "step": 662, "valid_targets_mean": 13117.1, "valid_targets_min": 11573 }, { "epoch": 2.8230277185501067, "grad_norm": 0.23440034064219098, "learning_rate": 1.9078950547157458e-05, "loss": 1.0368, "loss_nan_ranks": 0, "loss_rank_avg": 0.2831166684627533, "step": 663, "valid_targets_mean": 16066.2, "valid_targets_min": 13927 }, { "epoch": 2.8272921108742004, "grad_norm": 0.2183113289524723, "learning_rate": 1.9019574201497387e-05, "loss": 1.0857, "loss_nan_ranks": 0, "loss_rank_avg": 0.33316051959991455, "step": 664, "valid_targets_mean": 16098.2, "valid_targets_min": 14646 }, { "epoch": 2.831556503198294, "grad_norm": 0.22078950062464048, "learning_rate": 1.8960206516760396e-05, "loss": 1.0492, "loss_nan_ranks": 0, "loss_rank_avg": 0.25347208976745605, "step": 665, "valid_targets_mean": 15457.3, "valid_targets_min": 14161 }, { "epoch": 2.835820895522388, "grad_norm": 0.2134148999740181, "learning_rate": 1.890084801739102e-05, "loss": 0.9944, "loss_nan_ranks": 0, "loss_rank_avg": 0.27177226543426514, "step": 666, "valid_targets_mean": 16156.0, "valid_targets_min": 15128 }, { "epoch": 2.840085287846482, "grad_norm": 0.22257594579115064, "learning_rate": 1.884149922775265e-05, "loss": 1.0345, "loss_nan_ranks": 0, "loss_rank_avg": 0.21412542462348938, "step": 667, "valid_targets_mean": 11165.4, "valid_targets_min": 2031 }, { "epoch": 2.8443496801705757, "grad_norm": 0.21178683195544276, "learning_rate": 1.878216067212291e-05, "loss": 1.0247, "loss_nan_ranks": 0, "loss_rank_avg": 0.25402650237083435, "step": 668, "valid_targets_mean": 15901.6, "valid_targets_min": 14526 }, { "epoch": 2.8486140724946694, "grad_norm": 0.25074264951872627, "learning_rate": 1.8722832874689007e-05, "loss": 1.0656, "loss_nan_ranks": 0, "loss_rank_avg": 0.28927081823349, "step": 669, "valid_targets_mean": 16190.7, "valid_targets_min": 15714 }, { "epoch": 2.8528784648187635, "grad_norm": 0.23287240870568066, "learning_rate": 1.8663516359543123e-05, "loss": 1.0172, "loss_nan_ranks": 0, "loss_rank_avg": 0.14716637134552002, "step": 670, "valid_targets_mean": 8172.2, "valid_targets_min": 1215 }, { "epoch": 2.857142857142857, "grad_norm": 0.23950131807780825, "learning_rate": 1.860421165067775e-05, "loss": 1.0239, "loss_nan_ranks": 0, "loss_rank_avg": 0.2460516393184662, "step": 671, "valid_targets_mean": 16181.2, "valid_targets_min": 15380 }, { "epoch": 2.861407249466951, "grad_norm": 0.23157562595418954, "learning_rate": 1.8544919271981125e-05, "loss": 1.0617, "loss_nan_ranks": 0, "loss_rank_avg": 0.31192123889923096, "step": 672, "valid_targets_mean": 16093.1, "valid_targets_min": 14929 }, { "epoch": 2.8656716417910446, "grad_norm": 0.22833207374850398, "learning_rate": 1.8485639747232535e-05, "loss": 1.035, "loss_nan_ranks": 0, "loss_rank_avg": 0.22791972756385803, "step": 673, "valid_targets_mean": 12507.3, "valid_targets_min": 10158 }, { "epoch": 2.8699360341151388, "grad_norm": 0.24941293281250398, "learning_rate": 1.8426373600097723e-05, "loss": 1.1083, "loss_nan_ranks": 0, "loss_rank_avg": 0.2764943838119507, "step": 674, "valid_targets_mean": 16078.8, "valid_targets_min": 13788 }, { "epoch": 2.8742004264392325, "grad_norm": 0.22245905457862583, "learning_rate": 1.836712135412424e-05, "loss": 1.0315, "loss_nan_ranks": 0, "loss_rank_avg": 0.29476335644721985, "step": 675, "valid_targets_mean": 16158.5, "valid_targets_min": 14904 }, { "epoch": 2.878464818763326, "grad_norm": 0.2527922980176215, "learning_rate": 1.8307883532736878e-05, "loss": 1.0229, "loss_nan_ranks": 0, "loss_rank_avg": 0.23116479814052582, "step": 676, "valid_targets_mean": 14858.4, "valid_targets_min": 12939 }, { "epoch": 2.88272921108742, "grad_norm": 0.22475933770657133, "learning_rate": 1.8248660659232964e-05, "loss": 1.0149, "loss_nan_ranks": 0, "loss_rank_avg": 0.29866713285446167, "step": 677, "valid_targets_mean": 16104.2, "valid_targets_min": 15187 }, { "epoch": 2.886993603411514, "grad_norm": 0.231273821884454, "learning_rate": 1.8189453256777798e-05, "loss": 1.0114, "loss_nan_ranks": 0, "loss_rank_avg": 0.25470566749572754, "step": 678, "valid_targets_mean": 13330.7, "valid_targets_min": 1100 }, { "epoch": 2.8912579957356077, "grad_norm": 0.23910386595968475, "learning_rate": 1.8130261848399996e-05, "loss": 1.0467, "loss_nan_ranks": 0, "loss_rank_avg": 0.2502293288707733, "step": 679, "valid_targets_mean": 15772.3, "valid_targets_min": 14001 }, { "epoch": 2.8955223880597014, "grad_norm": 0.22121884183094487, "learning_rate": 1.8071086956986916e-05, "loss": 1.0073, "loss_nan_ranks": 0, "loss_rank_avg": 0.3032669723033905, "step": 680, "valid_targets_mean": 16085.4, "valid_targets_min": 14479 }, { "epoch": 2.8997867803837956, "grad_norm": 0.24253258088598406, "learning_rate": 1.8011929105279967e-05, "loss": 1.041, "loss_nan_ranks": 0, "loss_rank_avg": 0.15033088624477386, "step": 681, "valid_targets_mean": 8402.1, "valid_targets_min": 1075 }, { "epoch": 2.9040511727078893, "grad_norm": 0.20793563860463674, "learning_rate": 1.795278881587007e-05, "loss": 1.0471, "loss_nan_ranks": 0, "loss_rank_avg": 0.2602580785751343, "step": 682, "valid_targets_mean": 16153.5, "valid_targets_min": 15636 }, { "epoch": 2.908315565031983, "grad_norm": 0.21533915056637562, "learning_rate": 1.7893666611192962e-05, "loss": 1.0346, "loss_nan_ranks": 0, "loss_rank_avg": 0.2978869080543518, "step": 683, "valid_targets_mean": 16154.4, "valid_targets_min": 15505 }, { "epoch": 2.9125799573560767, "grad_norm": 0.20511026387766632, "learning_rate": 1.783456301352467e-05, "loss": 1.0781, "loss_nan_ranks": 0, "loss_rank_avg": 0.18348674476146698, "step": 684, "valid_targets_mean": 10106.0, "valid_targets_min": 4326 }, { "epoch": 2.9168443496801704, "grad_norm": 0.21034257392870168, "learning_rate": 1.7775478544976813e-05, "loss": 1.0677, "loss_nan_ranks": 0, "loss_rank_avg": 0.2854713201522827, "step": 685, "valid_targets_mean": 16062.8, "valid_targets_min": 14365 }, { "epoch": 2.9211087420042645, "grad_norm": 0.21266707523484377, "learning_rate": 1.7716413727492035e-05, "loss": 1.0752, "loss_nan_ranks": 0, "loss_rank_avg": 0.32130110263824463, "step": 686, "valid_targets_mean": 16094.8, "valid_targets_min": 14920 }, { "epoch": 2.925373134328358, "grad_norm": 0.21812191169716444, "learning_rate": 1.7657369082839392e-05, "loss": 1.0722, "loss_nan_ranks": 0, "loss_rank_avg": 0.23229658603668213, "step": 687, "valid_targets_mean": 13003.5, "valid_targets_min": 10625 }, { "epoch": 2.929637526652452, "grad_norm": 0.2162686524716888, "learning_rate": 1.7598345132609747e-05, "loss": 1.0324, "loss_nan_ranks": 0, "loss_rank_avg": 0.28563833236694336, "step": 688, "valid_targets_mean": 16220.6, "valid_targets_min": 15582 }, { "epoch": 2.933901918976546, "grad_norm": 0.22879288653799318, "learning_rate": 1.7539342398211132e-05, "loss": 1.0593, "loss_nan_ranks": 0, "loss_rank_avg": 0.32399559020996094, "step": 689, "valid_targets_mean": 16127.6, "valid_targets_min": 15595 }, { "epoch": 2.9381663113006398, "grad_norm": 0.2302506984015126, "learning_rate": 1.748036140086416e-05, "loss": 1.0494, "loss_nan_ranks": 0, "loss_rank_avg": 0.260400652885437, "step": 690, "valid_targets_mean": 15390.4, "valid_targets_min": 14171 }, { "epoch": 2.9424307036247335, "grad_norm": 0.21850318614421996, "learning_rate": 1.742140266159744e-05, "loss": 1.0286, "loss_nan_ranks": 0, "loss_rank_avg": 0.2908626198768616, "step": 691, "valid_targets_mean": 16097.5, "valid_targets_min": 15042 }, { "epoch": 2.946695095948827, "grad_norm": 0.2298053216214348, "learning_rate": 1.7362466701242943e-05, "loss": 1.0351, "loss_nan_ranks": 0, "loss_rank_avg": 0.2131451517343521, "step": 692, "valid_targets_mean": 11418.3, "valid_targets_min": 2707 }, { "epoch": 2.950959488272921, "grad_norm": 0.2133637637780579, "learning_rate": 1.7303554040431426e-05, "loss": 1.0485, "loss_nan_ranks": 0, "loss_rank_avg": 0.2517058253288269, "step": 693, "valid_targets_mean": 16096.1, "valid_targets_min": 13929 }, { "epoch": 2.955223880597015, "grad_norm": 0.2485989853614221, "learning_rate": 1.7244665199587812e-05, "loss": 1.0689, "loss_nan_ranks": 0, "loss_rank_avg": 0.2812129557132721, "step": 694, "valid_targets_mean": 16215.6, "valid_targets_min": 15674 }, { "epoch": 2.9594882729211087, "grad_norm": 0.21752076241663548, "learning_rate": 1.7185800698926594e-05, "loss": 1.0718, "loss_nan_ranks": 0, "loss_rank_avg": 0.16977828741073608, "step": 695, "valid_targets_mean": 9167.3, "valid_targets_min": 2370 }, { "epoch": 2.9637526652452024, "grad_norm": 0.20427771557408353, "learning_rate": 1.7126961058447276e-05, "loss": 1.0792, "loss_nan_ranks": 0, "loss_rank_avg": 0.27761727571487427, "step": 696, "valid_targets_mean": 16013.3, "valid_targets_min": 14420 }, { "epoch": 2.9680170575692966, "grad_norm": 0.23787771224554388, "learning_rate": 1.706814679792973e-05, "loss": 1.0605, "loss_nan_ranks": 0, "loss_rank_avg": 0.27882838249206543, "step": 697, "valid_targets_mean": 16093.7, "valid_targets_min": 13108 }, { "epoch": 2.9722814498933903, "grad_norm": 0.2233058393397929, "learning_rate": 1.7009358436929632e-05, "loss": 1.0598, "loss_nan_ranks": 0, "loss_rank_avg": 0.2286585420370102, "step": 698, "valid_targets_mean": 12394.0, "valid_targets_min": 9653 }, { "epoch": 2.976545842217484, "grad_norm": 0.23102733923169372, "learning_rate": 1.6950596494773855e-05, "loss": 1.091, "loss_nan_ranks": 0, "loss_rank_avg": 0.30752837657928467, "step": 699, "valid_targets_mean": 16081.6, "valid_targets_min": 14632 }, { "epoch": 2.9808102345415777, "grad_norm": 0.21524273504458513, "learning_rate": 1.6891861490555906e-05, "loss": 0.9983, "loss_nan_ranks": 0, "loss_rank_avg": 0.2923296093940735, "step": 700, "valid_targets_mean": 16114.5, "valid_targets_min": 15221 }, { "epoch": 2.9850746268656714, "grad_norm": 0.21635269462461057, "learning_rate": 1.683315394313132e-05, "loss": 1.0638, "loss_nan_ranks": 0, "loss_rank_avg": 0.24893790483474731, "step": 701, "valid_targets_mean": 14577.7, "valid_targets_min": 12869 }, { "epoch": 2.9893390191897655, "grad_norm": 0.23777660105141393, "learning_rate": 1.677447437111309e-05, "loss": 1.0082, "loss_nan_ranks": 0, "loss_rank_avg": 0.2949479818344116, "step": 702, "valid_targets_mean": 16146.8, "valid_targets_min": 15427 }, { "epoch": 2.9936034115138592, "grad_norm": 0.2313537698655914, "learning_rate": 1.671582329286707e-05, "loss": 1.0479, "loss_nan_ranks": 0, "loss_rank_avg": 0.23207740485668182, "step": 703, "valid_targets_mean": 12671.8, "valid_targets_min": 1334 }, { "epoch": 2.997867803837953, "grad_norm": 0.2370830165882117, "learning_rate": 1.66572012265074e-05, "loss": 1.0403, "loss_nan_ranks": 0, "loss_rank_avg": 0.2588110566139221, "step": 704, "valid_targets_mean": 15686.2, "valid_targets_min": 14947 }, { "epoch": 3.0, "grad_norm": 0.2916023608705293, "learning_rate": 1.6598608689891953e-05, "loss": 1.003, "loss_nan_ranks": 0, "loss_rank_avg": 0.47874170541763306, "step": 705, "valid_targets_mean": 11341.6, "valid_targets_min": 3066 }, { "epoch": 3.0042643923240937, "grad_norm": 0.22546620007126184, "learning_rate": 1.654004620061773e-05, "loss": 1.0221, "loss_nan_ranks": 0, "loss_rank_avg": 0.2473573088645935, "step": 706, "valid_targets_mean": 16072.4, "valid_targets_min": 14698 }, { "epoch": 3.008528784648188, "grad_norm": 0.24435078478549777, "learning_rate": 1.6481514276016297e-05, "loss": 1.0196, "loss_nan_ranks": 0, "loss_rank_avg": 0.26537612080574036, "step": 707, "valid_targets_mean": 16044.9, "valid_targets_min": 11563 }, { "epoch": 3.0127931769722816, "grad_norm": 0.21816044935934423, "learning_rate": 1.6423013433149207e-05, "loss": 1.0045, "loss_nan_ranks": 0, "loss_rank_avg": 0.21564412117004395, "step": 708, "valid_targets_mean": 13379.7, "valid_targets_min": 10328 }, { "epoch": 3.0170575692963753, "grad_norm": 0.23232216206932588, "learning_rate": 1.636454418880347e-05, "loss": 1.0164, "loss_nan_ranks": 0, "loss_rank_avg": 0.2604576647281647, "step": 709, "valid_targets_mean": 16162.3, "valid_targets_min": 15122 }, { "epoch": 3.021321961620469, "grad_norm": 0.2340541867037144, "learning_rate": 1.630610705948693e-05, "loss": 1.0107, "loss_nan_ranks": 0, "loss_rank_avg": 0.2890893816947937, "step": 710, "valid_targets_mean": 16157.8, "valid_targets_min": 15578 }, { "epoch": 3.025586353944563, "grad_norm": 0.22984553170284047, "learning_rate": 1.6247702561423753e-05, "loss": 1.0195, "loss_nan_ranks": 0, "loss_rank_avg": 0.2258562445640564, "step": 711, "valid_targets_mean": 13078.1, "valid_targets_min": 11469 }, { "epoch": 3.029850746268657, "grad_norm": 0.22706069554415406, "learning_rate": 1.6189331210549828e-05, "loss": 1.0563, "loss_nan_ranks": 0, "loss_rank_avg": 0.3094644248485565, "step": 712, "valid_targets_mean": 16113.1, "valid_targets_min": 15270 }, { "epoch": 3.0341151385927505, "grad_norm": 0.2517273448178296, "learning_rate": 1.613099352250825e-05, "loss": 1.0505, "loss_nan_ranks": 0, "loss_rank_avg": 0.2539500594139099, "step": 713, "valid_targets_mean": 13016.7, "valid_targets_min": 1369 }, { "epoch": 3.038379530916844, "grad_norm": 0.24724247646042918, "learning_rate": 1.6072690012644717e-05, "loss": 1.0232, "loss_nan_ranks": 0, "loss_rank_avg": 0.24730217456817627, "step": 714, "valid_targets_mean": 16104.4, "valid_targets_min": 14551 }, { "epoch": 3.0426439232409384, "grad_norm": 0.22341197798882587, "learning_rate": 1.6014421196003022e-05, "loss": 0.9959, "loss_nan_ranks": 0, "loss_rank_avg": 0.27211296558380127, "step": 715, "valid_targets_mean": 16228.6, "valid_targets_min": 15711 }, { "epoch": 3.046908315565032, "grad_norm": 0.2372792533087285, "learning_rate": 1.5956187587320468e-05, "loss": 1.0163, "loss_nan_ranks": 0, "loss_rank_avg": 0.1803392767906189, "step": 716, "valid_targets_mean": 10309.6, "valid_targets_min": 1344 }, { "epoch": 3.0511727078891258, "grad_norm": 0.2246449853128541, "learning_rate": 1.5897989701023355e-05, "loss": 1.0308, "loss_nan_ranks": 0, "loss_rank_avg": 0.26668739318847656, "step": 717, "valid_targets_mean": 16109.7, "valid_targets_min": 14769 }, { "epoch": 3.0554371002132195, "grad_norm": 0.22388036653405088, "learning_rate": 1.58398280512224e-05, "loss": 1.0403, "loss_nan_ranks": 0, "loss_rank_avg": 0.29415494203567505, "step": 718, "valid_targets_mean": 15781.9, "valid_targets_min": 4778 }, { "epoch": 3.0597014925373136, "grad_norm": 0.2166445618932895, "learning_rate": 1.5781703151708215e-05, "loss": 1.0193, "loss_nan_ranks": 0, "loss_rank_avg": 0.1880883276462555, "step": 719, "valid_targets_mean": 10639.8, "valid_targets_min": 4800 }, { "epoch": 3.0639658848614073, "grad_norm": 0.2341552816551429, "learning_rate": 1.5723615515946773e-05, "loss": 1.0522, "loss_nan_ranks": 0, "loss_rank_avg": 0.27435302734375, "step": 720, "valid_targets_mean": 16126.2, "valid_targets_min": 15410 }, { "epoch": 3.068230277185501, "grad_norm": 0.22436101078864107, "learning_rate": 1.5665565657074874e-05, "loss": 1.0562, "loss_nan_ranks": 0, "loss_rank_avg": 0.31322503089904785, "step": 721, "valid_targets_mean": 16086.5, "valid_targets_min": 14307 }, { "epoch": 3.0724946695095947, "grad_norm": 0.2327080346340859, "learning_rate": 1.560755408789558e-05, "loss": 1.0112, "loss_nan_ranks": 0, "loss_rank_avg": 0.22447748482227325, "step": 722, "valid_targets_mean": 14448.2, "valid_targets_min": 12279 }, { "epoch": 3.076759061833689, "grad_norm": 0.21443885865740964, "learning_rate": 1.5549581320873715e-05, "loss": 1.0388, "loss_nan_ranks": 0, "loss_rank_avg": 0.2837938070297241, "step": 723, "valid_targets_mean": 16100.5, "valid_targets_min": 14460 }, { "epoch": 3.0810234541577826, "grad_norm": 0.22515220337257996, "learning_rate": 1.5491647868131343e-05, "loss": 1.0702, "loss_nan_ranks": 0, "loss_rank_avg": 0.28435924649238586, "step": 724, "valid_targets_mean": 16215.7, "valid_targets_min": 15372 }, { "epoch": 3.0852878464818763, "grad_norm": 0.217034946809235, "learning_rate": 1.5433754241443223e-05, "loss": 1.0092, "loss_nan_ranks": 0, "loss_rank_avg": 0.23863840103149414, "step": 725, "valid_targets_mean": 15597.2, "valid_targets_min": 13274 }, { "epoch": 3.08955223880597, "grad_norm": 0.23567098500537823, "learning_rate": 1.53759009522323e-05, "loss": 1.0144, "loss_nan_ranks": 0, "loss_rank_avg": 0.2680036425590515, "step": 726, "valid_targets_mean": 16214.7, "valid_targets_min": 15574 }, { "epoch": 3.093816631130064, "grad_norm": 0.23150148218193378, "learning_rate": 1.5318088511565185e-05, "loss": 0.9811, "loss_nan_ranks": 0, "loss_rank_avg": 0.20448531210422516, "step": 727, "valid_targets_mean": 11884.8, "valid_targets_min": 1898 }, { "epoch": 3.098081023454158, "grad_norm": 0.24963689320764465, "learning_rate": 1.5260317430147627e-05, "loss": 0.9949, "loss_nan_ranks": 0, "loss_rank_avg": 0.23797962069511414, "step": 728, "valid_targets_mean": 15739.9, "valid_targets_min": 13414 }, { "epoch": 3.1023454157782515, "grad_norm": 0.23523132452561607, "learning_rate": 1.5202588218320024e-05, "loss": 1.0148, "loss_nan_ranks": 0, "loss_rank_avg": 0.28550830483436584, "step": 729, "valid_targets_mean": 16185.2, "valid_targets_min": 15222 }, { "epoch": 3.106609808102345, "grad_norm": 0.2300225672707401, "learning_rate": 1.5144901386052924e-05, "loss": 0.985, "loss_nan_ranks": 0, "loss_rank_avg": 0.14239609241485596, "step": 730, "valid_targets_mean": 8392.7, "valid_targets_min": 1158 }, { "epoch": 3.1108742004264394, "grad_norm": 0.22194726120343725, "learning_rate": 1.5087257442942467e-05, "loss": 1.0368, "loss_nan_ranks": 0, "loss_rank_avg": 0.2581402063369751, "step": 731, "valid_targets_mean": 16164.5, "valid_targets_min": 15163 }, { "epoch": 3.115138592750533, "grad_norm": 0.21659593022650356, "learning_rate": 1.502965689820593e-05, "loss": 1.0126, "loss_nan_ranks": 0, "loss_rank_avg": 0.2931985855102539, "step": 732, "valid_targets_mean": 16121.2, "valid_targets_min": 15579 }, { "epoch": 3.1194029850746268, "grad_norm": 0.1979214228996395, "learning_rate": 1.4972100260677222e-05, "loss": 1.0678, "loss_nan_ranks": 0, "loss_rank_avg": 0.203348308801651, "step": 733, "valid_targets_mean": 12018.5, "valid_targets_min": 6953 }, { "epoch": 3.1236673773987205, "grad_norm": 0.2141897771266866, "learning_rate": 1.4914588038802383e-05, "loss": 1.0256, "loss_nan_ranks": 0, "loss_rank_avg": 0.2846953868865967, "step": 734, "valid_targets_mean": 16149.8, "valid_targets_min": 15222 }, { "epoch": 3.1279317697228146, "grad_norm": 0.22134730992124976, "learning_rate": 1.4857120740635084e-05, "loss": 1.0357, "loss_nan_ranks": 0, "loss_rank_avg": 0.308135986328125, "step": 735, "valid_targets_mean": 16092.7, "valid_targets_min": 14058 }, { "epoch": 3.1321961620469083, "grad_norm": 0.21199663364784577, "learning_rate": 1.4799698873832153e-05, "loss": 1.0532, "loss_nan_ranks": 0, "loss_rank_avg": 0.25040268898010254, "step": 736, "valid_targets_mean": 14434.2, "valid_targets_min": 12077 }, { "epoch": 3.136460554371002, "grad_norm": 0.22408687687739112, "learning_rate": 1.4742322945649073e-05, "loss": 0.9979, "loss_nan_ranks": 0, "loss_rank_avg": 0.28990089893341064, "step": 737, "valid_targets_mean": 16217.7, "valid_targets_min": 15808 }, { "epoch": 3.140724946695096, "grad_norm": 0.22090528353836641, "learning_rate": 1.4684993462935532e-05, "loss": 0.9881, "loss_nan_ranks": 0, "loss_rank_avg": 0.2285807728767395, "step": 738, "valid_targets_mean": 13375.1, "valid_targets_min": 1759 }, { "epoch": 3.14498933901919, "grad_norm": 0.21227037281282393, "learning_rate": 1.462771093213092e-05, "loss": 1.0113, "loss_nan_ranks": 0, "loss_rank_avg": 0.2540406584739685, "step": 739, "valid_targets_mean": 15798.1, "valid_targets_min": 13840 }, { "epoch": 3.1492537313432836, "grad_norm": 0.22645562879511819, "learning_rate": 1.4570475859259856e-05, "loss": 0.9978, "loss_nan_ranks": 0, "loss_rank_avg": 0.28150904178619385, "step": 740, "valid_targets_mean": 16178.0, "valid_targets_min": 15576 }, { "epoch": 3.1535181236673773, "grad_norm": 0.2553953055802415, "learning_rate": 1.4513288749927714e-05, "loss": 0.9978, "loss_nan_ranks": 0, "loss_rank_avg": 0.1643623411655426, "step": 741, "valid_targets_mean": 9426.2, "valid_targets_min": 2154 }, { "epoch": 3.1577825159914714, "grad_norm": 0.21553654472222183, "learning_rate": 1.4456150109316192e-05, "loss": 1.024, "loss_nan_ranks": 0, "loss_rank_avg": 0.26102060079574585, "step": 742, "valid_targets_mean": 16006.3, "valid_targets_min": 14473 }, { "epoch": 3.162046908315565, "grad_norm": 0.24417735632997145, "learning_rate": 1.4399060442178798e-05, "loss": 0.947, "loss_nan_ranks": 0, "loss_rank_avg": 0.28816813230514526, "step": 743, "valid_targets_mean": 16178.9, "valid_targets_min": 15476 }, { "epoch": 3.166311300639659, "grad_norm": 0.22991537644479015, "learning_rate": 1.4342020252836437e-05, "loss": 1.0389, "loss_nan_ranks": 0, "loss_rank_avg": 0.19212383031845093, "step": 744, "valid_targets_mean": 10538.3, "valid_targets_min": 6177 }, { "epoch": 3.1705756929637525, "grad_norm": 0.22349717871874022, "learning_rate": 1.4285030045172913e-05, "loss": 1.0197, "loss_nan_ranks": 0, "loss_rank_avg": 0.26045793294906616, "step": 745, "valid_targets_mean": 16127.6, "valid_targets_min": 14124 }, { "epoch": 3.1748400852878467, "grad_norm": 0.21543348222421577, "learning_rate": 1.422809032263052e-05, "loss": 1.0468, "loss_nan_ranks": 0, "loss_rank_avg": 0.28180545568466187, "step": 746, "valid_targets_mean": 16165.9, "valid_targets_min": 15366 }, { "epoch": 3.1791044776119404, "grad_norm": 0.20075036785144845, "learning_rate": 1.4171201588205566e-05, "loss": 1.0547, "loss_nan_ranks": 0, "loss_rank_avg": 0.244021475315094, "step": 747, "valid_targets_mean": 13604.9, "valid_targets_min": 10519 }, { "epoch": 3.183368869936034, "grad_norm": 0.20359529763623488, "learning_rate": 1.4114364344443935e-05, "loss": 0.9755, "loss_nan_ranks": 0, "loss_rank_avg": 0.26434558629989624, "step": 748, "valid_targets_mean": 16148.0, "valid_targets_min": 13688 }, { "epoch": 3.1876332622601278, "grad_norm": 0.206317596580328, "learning_rate": 1.4057579093436653e-05, "loss": 1.019, "loss_nan_ranks": 0, "loss_rank_avg": 0.2964480519294739, "step": 749, "valid_targets_mean": 16185.6, "valid_targets_min": 15616 }, { "epoch": 3.191897654584222, "grad_norm": 0.19965426313624246, "learning_rate": 1.400084633681546e-05, "loss": 1.0369, "loss_nan_ranks": 0, "loss_rank_avg": 0.25970005989074707, "step": 750, "valid_targets_mean": 15437.9, "valid_targets_min": 13886 }, { "epoch": 3.1961620469083156, "grad_norm": 0.1931550450078641, "learning_rate": 1.3944166575748355e-05, "loss": 0.9745, "loss_nan_ranks": 0, "loss_rank_avg": 0.27987536787986755, "step": 751, "valid_targets_mean": 16108.0, "valid_targets_min": 15148 }, { "epoch": 3.2004264392324093, "grad_norm": 0.2285498671414749, "learning_rate": 1.3887540310935187e-05, "loss": 1.0267, "loss_nan_ranks": 0, "loss_rank_avg": 0.19410404562950134, "step": 752, "valid_targets_mean": 10666.6, "valid_targets_min": 1758 }, { "epoch": 3.204690831556503, "grad_norm": 0.1950207609526711, "learning_rate": 1.3830968042603226e-05, "loss": 1.0083, "loss_nan_ranks": 0, "loss_rank_avg": 0.2649402618408203, "step": 753, "valid_targets_mean": 15740.0, "valid_targets_min": 14420 }, { "epoch": 3.208955223880597, "grad_norm": 0.23761770896996695, "learning_rate": 1.3774450270502762e-05, "loss": 0.9949, "loss_nan_ranks": 0, "loss_rank_avg": 0.31608280539512634, "step": 754, "valid_targets_mean": 16115.1, "valid_targets_min": 14966 }, { "epoch": 3.213219616204691, "grad_norm": 0.22083848523624852, "learning_rate": 1.3717987493902656e-05, "loss": 1.0205, "loss_nan_ranks": 0, "loss_rank_avg": 0.14785869419574738, "step": 755, "valid_targets_mean": 8256.4, "valid_targets_min": 1725 }, { "epoch": 3.2174840085287846, "grad_norm": 0.2271481305402101, "learning_rate": 1.3661580211585947e-05, "loss": 1.0203, "loss_nan_ranks": 0, "loss_rank_avg": 0.2505563497543335, "step": 756, "valid_targets_mean": 16184.0, "valid_targets_min": 14698 }, { "epoch": 3.2217484008528783, "grad_norm": 0.23538681792469754, "learning_rate": 1.3605228921845457e-05, "loss": 1.0205, "loss_nan_ranks": 0, "loss_rank_avg": 0.30578216910362244, "step": 757, "valid_targets_mean": 16165.3, "valid_targets_min": 15239 }, { "epoch": 3.2260127931769724, "grad_norm": 0.23014469470104712, "learning_rate": 1.3548934122479373e-05, "loss": 1.0558, "loss_nan_ranks": 0, "loss_rank_avg": 0.20352551341056824, "step": 758, "valid_targets_mean": 11775.9, "valid_targets_min": 8991 }, { "epoch": 3.230277185501066, "grad_norm": 0.23398942351829313, "learning_rate": 1.349269631078686e-05, "loss": 1.0173, "loss_nan_ranks": 0, "loss_rank_avg": 0.27417778968811035, "step": 759, "valid_targets_mean": 16214.9, "valid_targets_min": 15357 }, { "epoch": 3.23454157782516, "grad_norm": 0.23487663215223234, "learning_rate": 1.3436515983563659e-05, "loss": 1.0685, "loss_nan_ranks": 0, "loss_rank_avg": 0.3089166283607483, "step": 760, "valid_targets_mean": 16046.1, "valid_targets_min": 15157 }, { "epoch": 3.2388059701492535, "grad_norm": 0.22707354630172036, "learning_rate": 1.3380393637097692e-05, "loss": 0.9868, "loss_nan_ranks": 0, "loss_rank_avg": 0.24889841675758362, "step": 761, "valid_targets_mean": 14222.7, "valid_targets_min": 12022 }, { "epoch": 3.2430703624733477, "grad_norm": 0.2250444800568611, "learning_rate": 1.3324329767164708e-05, "loss": 1.0181, "loss_nan_ranks": 0, "loss_rank_avg": 0.2840118408203125, "step": 762, "valid_targets_mean": 16097.0, "valid_targets_min": 13888 }, { "epoch": 3.2473347547974414, "grad_norm": 0.2180264015784957, "learning_rate": 1.3268324869023878e-05, "loss": 0.9988, "loss_nan_ranks": 0, "loss_rank_avg": 0.2439872920513153, "step": 763, "valid_targets_mean": 13022.2, "valid_targets_min": 1535 }, { "epoch": 3.251599147121535, "grad_norm": 0.20409803688058786, "learning_rate": 1.3212379437413421e-05, "loss": 1.0638, "loss_nan_ranks": 0, "loss_rank_avg": 0.266012966632843, "step": 764, "valid_targets_mean": 15528.1, "valid_targets_min": 14452 }, { "epoch": 3.2558635394456292, "grad_norm": 0.2228089775488321, "learning_rate": 1.3156493966546236e-05, "loss": 1.0167, "loss_nan_ranks": 0, "loss_rank_avg": 0.28855788707733154, "step": 765, "valid_targets_mean": 16141.7, "valid_targets_min": 14987 }, { "epoch": 3.260127931769723, "grad_norm": 0.23085883706791083, "learning_rate": 1.3100668950105534e-05, "loss": 1.0809, "loss_nan_ranks": 0, "loss_rank_avg": 0.19959942996501923, "step": 766, "valid_targets_mean": 10493.4, "valid_targets_min": 2195 }, { "epoch": 3.2643923240938166, "grad_norm": 0.19998322552016268, "learning_rate": 1.3044904881240507e-05, "loss": 1.0014, "loss_nan_ranks": 0, "loss_rank_avg": 0.2537648677825928, "step": 767, "valid_targets_mean": 16092.9, "valid_targets_min": 15480 }, { "epoch": 3.2686567164179103, "grad_norm": 0.2288404706980349, "learning_rate": 1.2989202252561926e-05, "loss": 1.0208, "loss_nan_ranks": 0, "loss_rank_avg": 0.3139684796333313, "step": 768, "valid_targets_mean": 16164.0, "valid_targets_min": 15618 }, { "epoch": 3.272921108742004, "grad_norm": 0.23154431096127515, "learning_rate": 1.2933561556137806e-05, "loss": 0.9937, "loss_nan_ranks": 0, "loss_rank_avg": 0.20685717463493347, "step": 769, "valid_targets_mean": 11801.2, "valid_targets_min": 9058 }, { "epoch": 3.277185501066098, "grad_norm": 0.238643564108478, "learning_rate": 1.2877983283489062e-05, "loss": 1.0106, "loss_nan_ranks": 0, "loss_rank_avg": 0.26336807012557983, "step": 770, "valid_targets_mean": 16097.4, "valid_targets_min": 14732 }, { "epoch": 3.281449893390192, "grad_norm": 0.210463166838876, "learning_rate": 1.2822467925585186e-05, "loss": 1.0258, "loss_nan_ranks": 0, "loss_rank_avg": 0.28999316692352295, "step": 771, "valid_targets_mean": 16153.3, "valid_targets_min": 15217 }, { "epoch": 3.2857142857142856, "grad_norm": 0.21515324831546198, "learning_rate": 1.2767015972839879e-05, "loss": 0.9892, "loss_nan_ranks": 0, "loss_rank_avg": 0.21576184034347534, "step": 772, "valid_targets_mean": 13491.8, "valid_targets_min": 11383 }, { "epoch": 3.2899786780383797, "grad_norm": 0.19718742065687034, "learning_rate": 1.2711627915106728e-05, "loss": 1.0051, "loss_nan_ranks": 0, "loss_rank_avg": 0.28501254320144653, "step": 773, "valid_targets_mean": 16005.6, "valid_targets_min": 9286 }, { "epoch": 3.2942430703624734, "grad_norm": 0.20931056590488556, "learning_rate": 1.2656304241674877e-05, "loss": 0.9973, "loss_nan_ranks": 0, "loss_rank_avg": 0.3030652105808258, "step": 774, "valid_targets_mean": 16154.3, "valid_targets_min": 15623 }, { "epoch": 3.298507462686567, "grad_norm": 0.1864644163173028, "learning_rate": 1.2601045441264734e-05, "loss": 0.9799, "loss_nan_ranks": 0, "loss_rank_avg": 0.24769797921180725, "step": 775, "valid_targets_mean": 15966.1, "valid_targets_min": 14649 }, { "epoch": 3.302771855010661, "grad_norm": 0.21175345768619538, "learning_rate": 1.2545852002023599e-05, "loss": 0.9942, "loss_nan_ranks": 0, "loss_rank_avg": 0.30079352855682373, "step": 776, "valid_targets_mean": 16077.0, "valid_targets_min": 14795 }, { "epoch": 3.307036247334755, "grad_norm": 0.23951421924454977, "learning_rate": 1.2490724411521406e-05, "loss": 1.0185, "loss_nan_ranks": 0, "loss_rank_avg": 0.20463250577449799, "step": 777, "valid_targets_mean": 11349.3, "valid_targets_min": 1500 }, { "epoch": 3.3113006396588487, "grad_norm": 0.2266010059067405, "learning_rate": 1.243566315674637e-05, "loss": 1.0384, "loss_nan_ranks": 0, "loss_rank_avg": 0.26843178272247314, "step": 778, "valid_targets_mean": 15895.2, "valid_targets_min": 14853 }, { "epoch": 3.3155650319829424, "grad_norm": 0.21876189679359032, "learning_rate": 1.238066872410073e-05, "loss": 0.9662, "loss_nan_ranks": 0, "loss_rank_avg": 0.2956579923629761, "step": 779, "valid_targets_mean": 16154.4, "valid_targets_min": 15042 }, { "epoch": 3.319829424307036, "grad_norm": 0.224276681573692, "learning_rate": 1.2325741599396418e-05, "loss": 0.9855, "loss_nan_ranks": 0, "loss_rank_avg": 0.13216564059257507, "step": 780, "valid_targets_mean": 7354.0, "valid_targets_min": 2380 }, { "epoch": 3.3240938166311302, "grad_norm": 0.19662079347142808, "learning_rate": 1.2270882267850765e-05, "loss": 1.0673, "loss_nan_ranks": 0, "loss_rank_avg": 0.2683402895927429, "step": 781, "valid_targets_mean": 16123.9, "valid_targets_min": 15331 }, { "epoch": 3.328358208955224, "grad_norm": 0.20498062466960942, "learning_rate": 1.2216091214082248e-05, "loss": 1.0287, "loss_nan_ranks": 0, "loss_rank_avg": 0.28701385855674744, "step": 782, "valid_targets_mean": 16087.6, "valid_targets_min": 13835 }, { "epoch": 3.3326226012793176, "grad_norm": 0.22236633186009508, "learning_rate": 1.2161368922106192e-05, "loss": 1.0277, "loss_nan_ranks": 0, "loss_rank_avg": 0.1911384016275406, "step": 783, "valid_targets_mean": 11460.7, "valid_targets_min": 8049 }, { "epoch": 3.3368869936034113, "grad_norm": 0.20791046573398056, "learning_rate": 1.2106715875330475e-05, "loss": 1.05, "loss_nan_ranks": 0, "loss_rank_avg": 0.2731104791164398, "step": 784, "valid_targets_mean": 16209.4, "valid_targets_min": 15350 }, { "epoch": 3.3411513859275055, "grad_norm": 0.21261925120846067, "learning_rate": 1.2052132556551275e-05, "loss": 1.0367, "loss_nan_ranks": 0, "loss_rank_avg": 0.2992277145385742, "step": 785, "valid_targets_mean": 16167.2, "valid_targets_min": 15730 }, { "epoch": 3.345415778251599, "grad_norm": 0.216522475968083, "learning_rate": 1.1997619447948814e-05, "loss": 1.0697, "loss_nan_ranks": 0, "loss_rank_avg": 0.24031764268875122, "step": 786, "valid_targets_mean": 13789.7, "valid_targets_min": 11708 }, { "epoch": 3.349680170575693, "grad_norm": 0.20962862955449657, "learning_rate": 1.1943177031083094e-05, "loss": 1.0053, "loss_nan_ranks": 0, "loss_rank_avg": 0.2922288179397583, "step": 787, "valid_targets_mean": 16186.4, "valid_targets_min": 14810 }, { "epoch": 3.3539445628997866, "grad_norm": 0.20784049608898483, "learning_rate": 1.1888805786889621e-05, "loss": 1.0411, "loss_nan_ranks": 0, "loss_rank_avg": 0.26215359568595886, "step": 788, "valid_targets_mean": 13417.4, "valid_targets_min": 3667 }, { "epoch": 3.3582089552238807, "grad_norm": 0.19438778955082836, "learning_rate": 1.183450619567518e-05, "loss": 1.0037, "loss_nan_ranks": 0, "loss_rank_avg": 0.25706902146339417, "step": 789, "valid_targets_mean": 15748.0, "valid_targets_min": 13975 }, { "epoch": 3.3624733475479744, "grad_norm": 0.18480593385926, "learning_rate": 1.1780278737113581e-05, "loss": 1.0402, "loss_nan_ranks": 0, "loss_rank_avg": 0.2852016091346741, "step": 790, "valid_targets_mean": 15791.8, "valid_targets_min": 5994 }, { "epoch": 3.366737739872068, "grad_norm": 0.19045874412467398, "learning_rate": 1.1726123890241439e-05, "loss": 0.9975, "loss_nan_ranks": 0, "loss_rank_avg": 0.1702101230621338, "step": 791, "valid_targets_mean": 9803.9, "valid_targets_min": 1575 }, { "epoch": 3.3710021321961623, "grad_norm": 0.18142250180118896, "learning_rate": 1.1672042133453925e-05, "loss": 1.0138, "loss_nan_ranks": 0, "loss_rank_avg": 0.24327364563941956, "step": 792, "valid_targets_mean": 16135.9, "valid_targets_min": 15270 }, { "epoch": 3.375266524520256, "grad_norm": 0.18976083835973934, "learning_rate": 1.1618033944500527e-05, "loss": 0.9981, "loss_nan_ranks": 0, "loss_rank_avg": 0.3210751414299011, "step": 793, "valid_targets_mean": 16139.2, "valid_targets_min": 15361 }, { "epoch": 3.3795309168443497, "grad_norm": 0.19818634585506895, "learning_rate": 1.1564099800480864e-05, "loss": 1.048, "loss_nan_ranks": 0, "loss_rank_avg": 0.19776135683059692, "step": 794, "valid_targets_mean": 11481.5, "valid_targets_min": 6068 }, { "epoch": 3.3837953091684434, "grad_norm": 0.19760424713484523, "learning_rate": 1.151024017784045e-05, "loss": 1.0054, "loss_nan_ranks": 0, "loss_rank_avg": 0.24625568091869354, "step": 795, "valid_targets_mean": 16202.7, "valid_targets_min": 15135 }, { "epoch": 3.388059701492537, "grad_norm": 0.21328717602610783, "learning_rate": 1.1456455552366488e-05, "loss": 1.043, "loss_nan_ranks": 0, "loss_rank_avg": 0.3155757486820221, "step": 796, "valid_targets_mean": 16132.7, "valid_targets_min": 14783 }, { "epoch": 3.3923240938166312, "grad_norm": 0.18428037676198075, "learning_rate": 1.1402746399183671e-05, "loss": 1.0136, "loss_nan_ranks": 0, "loss_rank_avg": 0.24852502346038818, "step": 797, "valid_targets_mean": 13810.4, "valid_targets_min": 11194 }, { "epoch": 3.396588486140725, "grad_norm": 0.19469315419306438, "learning_rate": 1.1349113192749986e-05, "loss": 1.0325, "loss_nan_ranks": 0, "loss_rank_avg": 0.27724477648735046, "step": 798, "valid_targets_mean": 16136.4, "valid_targets_min": 13927 }, { "epoch": 3.4008528784648187, "grad_norm": 0.19335058306425573, "learning_rate": 1.1295556406852488e-05, "loss": 1.0257, "loss_nan_ranks": 0, "loss_rank_avg": 0.2919307351112366, "step": 799, "valid_targets_mean": 16118.9, "valid_targets_min": 15147 }, { "epoch": 3.405117270788913, "grad_norm": 0.17514958145184512, "learning_rate": 1.1242076514603201e-05, "loss": 1.0816, "loss_nan_ranks": 0, "loss_rank_avg": 0.25642216205596924, "step": 800, "valid_targets_mean": 14175.8, "valid_targets_min": 12875 }, { "epoch": 3.4093816631130065, "grad_norm": 0.20228613416602578, "learning_rate": 1.1188673988434831e-05, "loss": 1.0399, "loss_nan_ranks": 0, "loss_rank_avg": 0.3179895281791687, "step": 801, "valid_targets_mean": 16137.8, "valid_targets_min": 15389 }, { "epoch": 3.4136460554371, "grad_norm": 0.18851992182694163, "learning_rate": 1.1135349300096667e-05, "loss": 1.0053, "loss_nan_ranks": 0, "loss_rank_avg": 0.2002144306898117, "step": 802, "valid_targets_mean": 10829.2, "valid_targets_min": 1238 }, { "epoch": 3.417910447761194, "grad_norm": 0.19124496378036196, "learning_rate": 1.1082102920650397e-05, "loss": 1.0102, "loss_nan_ranks": 0, "loss_rank_avg": 0.2536805272102356, "step": 803, "valid_targets_mean": 16158.3, "valid_targets_min": 15109 }, { "epoch": 3.4221748400852876, "grad_norm": 0.22587700464345187, "learning_rate": 1.102893532046593e-05, "loss": 1.0389, "loss_nan_ranks": 0, "loss_rank_avg": 0.2835776209831238, "step": 804, "valid_targets_mean": 16059.1, "valid_targets_min": 14384 }, { "epoch": 3.4264392324093818, "grad_norm": 0.19199882848957545, "learning_rate": 1.0975846969217258e-05, "loss": 1.0246, "loss_nan_ranks": 0, "loss_rank_avg": 0.1586105227470398, "step": 805, "valid_targets_mean": 8455.3, "valid_targets_min": 578 }, { "epoch": 3.4307036247334755, "grad_norm": 0.19052360147803976, "learning_rate": 1.092283833587829e-05, "loss": 1.0397, "loss_nan_ranks": 0, "loss_rank_avg": 0.25331923365592957, "step": 806, "valid_targets_mean": 16085.5, "valid_targets_min": 14929 }, { "epoch": 3.434968017057569, "grad_norm": 0.2022605935609196, "learning_rate": 1.086990988871873e-05, "loss": 1.0609, "loss_nan_ranks": 0, "loss_rank_avg": 0.29131874442100525, "step": 807, "valid_targets_mean": 16047.4, "valid_targets_min": 13080 }, { "epoch": 3.4392324093816633, "grad_norm": 0.1901835998943412, "learning_rate": 1.0817062095299929e-05, "loss": 1.0441, "loss_nan_ranks": 0, "loss_rank_avg": 0.18520936369895935, "step": 808, "valid_targets_mean": 11042.4, "valid_targets_min": 7440 }, { "epoch": 3.443496801705757, "grad_norm": 0.20070764647087036, "learning_rate": 1.0764295422470755e-05, "loss": 1.0013, "loss_nan_ranks": 0, "loss_rank_avg": 0.2895042896270752, "step": 809, "valid_targets_mean": 16087.7, "valid_targets_min": 13211 }, { "epoch": 3.4477611940298507, "grad_norm": 0.1878010136021189, "learning_rate": 1.0711610336363477e-05, "loss": 1.0257, "loss_nan_ranks": 0, "loss_rank_avg": 0.30274391174316406, "step": 810, "valid_targets_mean": 16093.6, "valid_targets_min": 14556 }, { "epoch": 3.4520255863539444, "grad_norm": 0.17667053615946723, "learning_rate": 1.065900730238961e-05, "loss": 1.0249, "loss_nan_ranks": 0, "loss_rank_avg": 0.23889347910881042, "step": 811, "valid_targets_mean": 14490.8, "valid_targets_min": 12326 }, { "epoch": 3.4562899786780386, "grad_norm": 0.18797859932961541, "learning_rate": 1.0606486785235879e-05, "loss": 0.9799, "loss_nan_ranks": 0, "loss_rank_avg": 0.28064554929733276, "step": 812, "valid_targets_mean": 16143.8, "valid_targets_min": 14907 }, { "epoch": 3.4605543710021323, "grad_norm": 0.1885835078230724, "learning_rate": 1.0554049248860045e-05, "loss": 1.0568, "loss_nan_ranks": 0, "loss_rank_avg": 0.25304943323135376, "step": 813, "valid_targets_mean": 12887.4, "valid_targets_min": 1961 }, { "epoch": 3.464818763326226, "grad_norm": 0.19425937698400536, "learning_rate": 1.0501695156486819e-05, "loss": 1.0567, "loss_nan_ranks": 0, "loss_rank_avg": 0.2560194432735443, "step": 814, "valid_targets_mean": 15759.6, "valid_targets_min": 11287 }, { "epoch": 3.4690831556503197, "grad_norm": 0.2009073306626454, "learning_rate": 1.0449424970603796e-05, "loss": 0.9965, "loss_nan_ranks": 0, "loss_rank_avg": 0.265529990196228, "step": 815, "valid_targets_mean": 16230.9, "valid_targets_min": 15773 }, { "epoch": 3.473347547974414, "grad_norm": 0.19160044921213984, "learning_rate": 1.0397239152957356e-05, "loss": 1.0171, "loss_nan_ranks": 0, "loss_rank_avg": 0.16818805038928986, "step": 816, "valid_targets_mean": 9027.7, "valid_targets_min": 1228 }, { "epoch": 3.4776119402985075, "grad_norm": 0.20133406216973854, "learning_rate": 1.034513816454858e-05, "loss": 1.0378, "loss_nan_ranks": 0, "loss_rank_avg": 0.25717800855636597, "step": 817, "valid_targets_mean": 16111.5, "valid_targets_min": 15042 }, { "epoch": 3.481876332622601, "grad_norm": 0.20058057382990999, "learning_rate": 1.0293122465629186e-05, "loss": 1.0049, "loss_nan_ranks": 0, "loss_rank_avg": 0.28611189126968384, "step": 818, "valid_targets_mean": 16084.9, "valid_targets_min": 13788 }, { "epoch": 3.486140724946695, "grad_norm": 0.21471526294953153, "learning_rate": 1.0241192515697432e-05, "loss": 1.011, "loss_nan_ranks": 0, "loss_rank_avg": 0.20527414977550507, "step": 819, "valid_targets_mean": 12038.9, "valid_targets_min": 7752 }, { "epoch": 3.490405117270789, "grad_norm": 0.18698327284105212, "learning_rate": 1.0189348773494135e-05, "loss": 1.024, "loss_nan_ranks": 0, "loss_rank_avg": 0.27734407782554626, "step": 820, "valid_targets_mean": 16122.8, "valid_targets_min": 15219 }, { "epoch": 3.4946695095948828, "grad_norm": 0.1936151742736665, "learning_rate": 1.0137591696998514e-05, "loss": 1.0267, "loss_nan_ranks": 0, "loss_rank_avg": 0.3137998580932617, "step": 821, "valid_targets_mean": 16039.4, "valid_targets_min": 15167 }, { "epoch": 3.4989339019189765, "grad_norm": 0.23242629979557722, "learning_rate": 1.0085921743424225e-05, "loss": 1.0271, "loss_nan_ranks": 0, "loss_rank_avg": 0.22472453117370605, "step": 822, "valid_targets_mean": 13571.1, "valid_targets_min": 11707 }, { "epoch": 3.50319829424307, "grad_norm": 0.18107341012796876, "learning_rate": 1.0034339369215288e-05, "loss": 1.0324, "loss_nan_ranks": 0, "loss_rank_avg": 0.28194552659988403, "step": 823, "valid_targets_mean": 16043.7, "valid_targets_min": 13934 }, { "epoch": 3.5074626865671643, "grad_norm": 0.19598860481753452, "learning_rate": 9.982845030042068e-06, "loss": 1.0656, "loss_nan_ranks": 0, "loss_rank_avg": 0.33745408058166504, "step": 824, "valid_targets_mean": 16131.1, "valid_targets_min": 15258 }, { "epoch": 3.511727078891258, "grad_norm": 0.19947657391724366, "learning_rate": 9.931439180797237e-06, "loss": 1.0218, "loss_nan_ranks": 0, "loss_rank_avg": 0.22845852375030518, "step": 825, "valid_targets_mean": 14083.7, "valid_targets_min": 12058 }, { "epoch": 3.5159914712153517, "grad_norm": 0.19144720106478683, "learning_rate": 9.880122275591752e-06, "loss": 1.0479, "loss_nan_ranks": 0, "loss_rank_avg": 0.2947565019130707, "step": 826, "valid_targets_mean": 16235.3, "valid_targets_min": 15869 }, { "epoch": 3.520255863539446, "grad_norm": 0.2078277408605803, "learning_rate": 9.828894767750865e-06, "loss": 1.0607, "loss_nan_ranks": 0, "loss_rank_avg": 0.20672515034675598, "step": 827, "valid_targets_mean": 10532.3, "valid_targets_min": 793 }, { "epoch": 3.5245202558635396, "grad_norm": 0.19751630348586982, "learning_rate": 9.777757109810102e-06, "loss": 1.0312, "loss_nan_ranks": 0, "loss_rank_avg": 0.2553499937057495, "step": 828, "valid_targets_mean": 16077.7, "valid_targets_min": 15153 }, { "epoch": 3.5287846481876333, "grad_norm": 0.19658509693876208, "learning_rate": 9.726709753511275e-06, "loss": 1.0715, "loss_nan_ranks": 0, "loss_rank_avg": 0.29346132278442383, "step": 829, "valid_targets_mean": 16147.0, "valid_targets_min": 15263 }, { "epoch": 3.533049040511727, "grad_norm": 0.20929693034454866, "learning_rate": 9.675753149798474e-06, "loss": 1.0262, "loss_nan_ranks": 0, "loss_rank_avg": 0.1624056100845337, "step": 830, "valid_targets_mean": 9455.6, "valid_targets_min": 1075 }, { "epoch": 3.5373134328358207, "grad_norm": 0.18635446379853654, "learning_rate": 9.624887748814118e-06, "loss": 1.0308, "loss_nan_ranks": 0, "loss_rank_avg": 0.24756374955177307, "step": 831, "valid_targets_mean": 16233.1, "valid_targets_min": 15409 }, { "epoch": 3.541577825159915, "grad_norm": 0.21157734136180095, "learning_rate": 9.574113999894909e-06, "loss": 1.0297, "loss_nan_ranks": 0, "loss_rank_avg": 0.274283230304718, "step": 832, "valid_targets_mean": 16230.2, "valid_targets_min": 14917 }, { "epoch": 3.5458422174840085, "grad_norm": 0.20909402716707864, "learning_rate": 9.523432351567979e-06, "loss": 1.0222, "loss_nan_ranks": 0, "loss_rank_avg": 0.20221446454524994, "step": 833, "valid_targets_mean": 12193.7, "valid_targets_min": 9042 }, { "epoch": 3.550106609808102, "grad_norm": 0.2126134326170871, "learning_rate": 9.472843251546792e-06, "loss": 1.0422, "loss_nan_ranks": 0, "loss_rank_avg": 0.3187773823738098, "step": 834, "valid_targets_mean": 16074.3, "valid_targets_min": 14705 }, { "epoch": 3.5543710021321964, "grad_norm": 0.2248429864051284, "learning_rate": 9.422347146727294e-06, "loss": 1.017, "loss_nan_ranks": 0, "loss_rank_avg": 0.2925642430782318, "step": 835, "valid_targets_mean": 16097.2, "valid_targets_min": 14702 }, { "epoch": 3.55863539445629, "grad_norm": 0.19764809114586646, "learning_rate": 9.371944483183912e-06, "loss": 1.0199, "loss_nan_ranks": 0, "loss_rank_avg": 0.24568304419517517, "step": 836, "valid_targets_mean": 13546.5, "valid_targets_min": 11766 }, { "epoch": 3.5628997867803838, "grad_norm": 0.19852269613513113, "learning_rate": 9.321635706165635e-06, "loss": 1.0502, "loss_nan_ranks": 0, "loss_rank_avg": 0.2961001396179199, "step": 837, "valid_targets_mean": 16135.5, "valid_targets_min": 15091 }, { "epoch": 3.5671641791044775, "grad_norm": 0.22539551639713004, "learning_rate": 9.271421260092075e-06, "loss": 1.0581, "loss_nan_ranks": 0, "loss_rank_avg": 0.2696417272090912, "step": 838, "valid_targets_mean": 12912.3, "valid_targets_min": 1400 }, { "epoch": 3.571428571428571, "grad_norm": 0.17369169122057854, "learning_rate": 9.221301588549519e-06, "loss": 1.0186, "loss_nan_ranks": 0, "loss_rank_avg": 0.25950783491134644, "step": 839, "valid_targets_mean": 15765.0, "valid_targets_min": 14646 }, { "epoch": 3.5756929637526653, "grad_norm": 0.19826394949704745, "learning_rate": 9.171277134287057e-06, "loss": 1.0423, "loss_nan_ranks": 0, "loss_rank_avg": 0.28724998235702515, "step": 840, "valid_targets_mean": 16137.4, "valid_targets_min": 14841 }, { "epoch": 3.579957356076759, "grad_norm": 0.22605116372463568, "learning_rate": 9.121348339212634e-06, "loss": 1.0514, "loss_nan_ranks": 0, "loss_rank_avg": 0.19209089875221252, "step": 841, "valid_targets_mean": 11219.8, "valid_targets_min": 3007 }, { "epoch": 3.5842217484008527, "grad_norm": 0.18985231179138834, "learning_rate": 9.07151564438916e-06, "loss": 1.0271, "loss_nan_ranks": 0, "loss_rank_avg": 0.26109862327575684, "step": 842, "valid_targets_mean": 15881.8, "valid_targets_min": 15016 }, { "epoch": 3.588486140724947, "grad_norm": 0.19525270465200253, "learning_rate": 9.021779490030611e-06, "loss": 1.0068, "loss_nan_ranks": 0, "loss_rank_avg": 0.29757362604141235, "step": 843, "valid_targets_mean": 16168.9, "valid_targets_min": 15515 }, { "epoch": 3.5927505330490406, "grad_norm": 0.20273161279088872, "learning_rate": 8.972140315498119e-06, "loss": 0.9891, "loss_nan_ranks": 0, "loss_rank_avg": 0.1628081500530243, "step": 844, "valid_targets_mean": 9614.0, "valid_targets_min": 3748 }, { "epoch": 3.5970149253731343, "grad_norm": 0.17829706313717747, "learning_rate": 8.922598559296154e-06, "loss": 0.9995, "loss_nan_ranks": 0, "loss_rank_avg": 0.26611262559890747, "step": 845, "valid_targets_mean": 16162.2, "valid_targets_min": 15506 }, { "epoch": 3.6012793176972284, "grad_norm": 0.21027782800390699, "learning_rate": 8.873154659068582e-06, "loss": 0.9777, "loss_nan_ranks": 0, "loss_rank_avg": 0.27415943145751953, "step": 846, "valid_targets_mean": 16113.0, "valid_targets_min": 14547 }, { "epoch": 3.605543710021322, "grad_norm": 0.1933481346322796, "learning_rate": 8.823809051594816e-06, "loss": 1.0405, "loss_nan_ranks": 0, "loss_rank_avg": 0.2183433175086975, "step": 847, "valid_targets_mean": 13214.4, "valid_targets_min": 11479 }, { "epoch": 3.609808102345416, "grad_norm": 0.1911863955607189, "learning_rate": 8.774562172785988e-06, "loss": 1.0198, "loss_nan_ranks": 0, "loss_rank_avg": 0.27938979864120483, "step": 848, "valid_targets_mean": 16196.8, "valid_targets_min": 15650 }, { "epoch": 3.6140724946695095, "grad_norm": 0.1996827380897634, "learning_rate": 8.725414457681063e-06, "loss": 1.0721, "loss_nan_ranks": 0, "loss_rank_avg": 0.31652724742889404, "step": 849, "valid_targets_mean": 16141.3, "valid_targets_min": 15560 }, { "epoch": 3.6183368869936032, "grad_norm": 0.18875838410836185, "learning_rate": 8.676366340443017e-06, "loss": 1.0259, "loss_nan_ranks": 0, "loss_rank_avg": 0.23282839357852936, "step": 850, "valid_targets_mean": 15714.5, "valid_targets_min": 13969 }, { "epoch": 3.6226012793176974, "grad_norm": 0.1922747408101709, "learning_rate": 8.627418254355e-06, "loss": 0.9953, "loss_nan_ranks": 0, "loss_rank_avg": 0.2925228476524353, "step": 851, "valid_targets_mean": 16100.1, "valid_targets_min": 14702 }, { "epoch": 3.626865671641791, "grad_norm": 0.1871926147470615, "learning_rate": 8.578570631816474e-06, "loss": 0.9884, "loss_nan_ranks": 0, "loss_rank_avg": 0.1962984800338745, "step": 852, "valid_targets_mean": 10805.0, "valid_targets_min": 1647 }, { "epoch": 3.631130063965885, "grad_norm": 0.18840256973106104, "learning_rate": 8.529823904339472e-06, "loss": 1.0003, "loss_nan_ranks": 0, "loss_rank_avg": 0.26471132040023804, "step": 853, "valid_targets_mean": 16080.2, "valid_targets_min": 14810 }, { "epoch": 3.635394456289979, "grad_norm": 0.19166828194360724, "learning_rate": 8.481178502544684e-06, "loss": 0.98, "loss_nan_ranks": 0, "loss_rank_avg": 0.2843315899372101, "step": 854, "valid_targets_mean": 16059.2, "valid_targets_min": 13226 }, { "epoch": 3.6396588486140726, "grad_norm": 0.19558513955706905, "learning_rate": 8.43263485615774e-06, "loss": 1.0439, "loss_nan_ranks": 0, "loss_rank_avg": 0.1629284918308258, "step": 855, "valid_targets_mean": 8378.9, "valid_targets_min": 1276 }, { "epoch": 3.6439232409381663, "grad_norm": 0.18871230748742543, "learning_rate": 8.384193394005372e-06, "loss": 1.0378, "loss_nan_ranks": 0, "loss_rank_avg": 0.25322186946868896, "step": 856, "valid_targets_mean": 16128.1, "valid_targets_min": 14943 }, { "epoch": 3.64818763326226, "grad_norm": 0.19849367481773825, "learning_rate": 8.33585454401161e-06, "loss": 1.0521, "loss_nan_ranks": 0, "loss_rank_avg": 0.32179251313209534, "step": 857, "valid_targets_mean": 16055.6, "valid_targets_min": 15389 }, { "epoch": 3.6524520255863537, "grad_norm": 0.18765256209710596, "learning_rate": 8.287618733194073e-06, "loss": 1.029, "loss_nan_ranks": 0, "loss_rank_avg": 0.21054477989673615, "step": 858, "valid_targets_mean": 12071.9, "valid_targets_min": 9257 }, { "epoch": 3.656716417910448, "grad_norm": 0.193326982284514, "learning_rate": 8.239486387660096e-06, "loss": 0.9993, "loss_nan_ranks": 0, "loss_rank_avg": 0.29164233803749084, "step": 859, "valid_targets_mean": 16002.4, "valid_targets_min": 14544 }, { "epoch": 3.6609808102345416, "grad_norm": 0.20503274346576894, "learning_rate": 8.191457932603052e-06, "loss": 0.9978, "loss_nan_ranks": 0, "loss_rank_avg": 0.3028004765510559, "step": 860, "valid_targets_mean": 16125.6, "valid_targets_min": 14765 }, { "epoch": 3.6652452025586353, "grad_norm": 0.20103325130745195, "learning_rate": 8.143533792298545e-06, "loss": 1.0762, "loss_nan_ranks": 0, "loss_rank_avg": 0.25633686780929565, "step": 861, "valid_targets_mean": 15072.8, "valid_targets_min": 13354 }, { "epoch": 3.6695095948827294, "grad_norm": 0.19253920882400277, "learning_rate": 8.095714390100698e-06, "loss": 1.0125, "loss_nan_ranks": 0, "loss_rank_avg": 0.25641998648643494, "step": 862, "valid_targets_mean": 16131.2, "valid_targets_min": 13888 }, { "epoch": 3.673773987206823, "grad_norm": 0.20352579026745357, "learning_rate": 8.048000148438375e-06, "loss": 1.0594, "loss_nan_ranks": 0, "loss_rank_avg": 0.2648036777973175, "step": 863, "valid_targets_mean": 13058.5, "valid_targets_min": 1185 }, { "epoch": 3.678038379530917, "grad_norm": 0.19639948915191724, "learning_rate": 8.000391488811485e-06, "loss": 1.015, "loss_nan_ranks": 0, "loss_rank_avg": 0.25266677141189575, "step": 864, "valid_targets_mean": 15782.9, "valid_targets_min": 15070 }, { "epoch": 3.6823027718550105, "grad_norm": 0.19386053477890763, "learning_rate": 7.952888831787215e-06, "loss": 1.0346, "loss_nan_ranks": 0, "loss_rank_avg": 0.2928309738636017, "step": 865, "valid_targets_mean": 16152.8, "valid_targets_min": 14904 }, { "epoch": 3.6865671641791042, "grad_norm": 0.19745476342088736, "learning_rate": 7.905492596996391e-06, "loss": 0.9991, "loss_nan_ranks": 0, "loss_rank_avg": 0.1756155639886856, "step": 866, "valid_targets_mean": 9315.6, "valid_targets_min": 979 }, { "epoch": 3.6908315565031984, "grad_norm": 0.20138153016069346, "learning_rate": 7.858203203129668e-06, "loss": 1.0574, "loss_nan_ranks": 0, "loss_rank_avg": 0.26242029666900635, "step": 867, "valid_targets_mean": 16006.4, "valid_targets_min": 14911 }, { "epoch": 3.695095948827292, "grad_norm": 0.19412757800945293, "learning_rate": 7.811021067933919e-06, "loss": 1.0214, "loss_nan_ranks": 0, "loss_rank_avg": 0.2751907706260681, "step": 868, "valid_targets_mean": 16138.8, "valid_targets_min": 14951 }, { "epoch": 3.699360341151386, "grad_norm": 0.21012497339785624, "learning_rate": 7.763946608208504e-06, "loss": 1.0114, "loss_nan_ranks": 0, "loss_rank_avg": 0.20527902245521545, "step": 869, "valid_targets_mean": 11099.1, "valid_targets_min": 7003 }, { "epoch": 3.70362473347548, "grad_norm": 0.19117367793417456, "learning_rate": 7.716980239801588e-06, "loss": 1.0112, "loss_nan_ranks": 0, "loss_rank_avg": 0.28386640548706055, "step": 870, "valid_targets_mean": 16065.7, "valid_targets_min": 14908 }, { "epoch": 3.7078891257995736, "grad_norm": 0.19692586454539995, "learning_rate": 7.670122377606495e-06, "loss": 1.0628, "loss_nan_ranks": 0, "loss_rank_avg": 0.3160354495048523, "step": 871, "valid_targets_mean": 16118.9, "valid_targets_min": 15290 }, { "epoch": 3.7121535181236673, "grad_norm": 0.1909097750601415, "learning_rate": 7.623373435557988e-06, "loss": 1.0436, "loss_nan_ranks": 0, "loss_rank_avg": 0.24374912679195404, "step": 872, "valid_targets_mean": 13757.4, "valid_targets_min": 11218 }, { "epoch": 3.716417910447761, "grad_norm": 0.20030508106272105, "learning_rate": 7.5767338266286775e-06, "loss": 1.0006, "loss_nan_ranks": 0, "loss_rank_avg": 0.28267043828964233, "step": 873, "valid_targets_mean": 16168.4, "valid_targets_min": 14830 }, { "epoch": 3.7206823027718547, "grad_norm": 0.20812341049975572, "learning_rate": 7.530203962825331e-06, "loss": 1.0316, "loss_nan_ranks": 0, "loss_rank_avg": 0.30265045166015625, "step": 874, "valid_targets_mean": 16155.6, "valid_targets_min": 15464 }, { "epoch": 3.724946695095949, "grad_norm": 0.18360113210996984, "learning_rate": 7.483784255185249e-06, "loss": 1.0431, "loss_nan_ranks": 0, "loss_rank_avg": 0.23530153930187225, "step": 875, "valid_targets_mean": 14721.8, "valid_targets_min": 12209 }, { "epoch": 3.7292110874200426, "grad_norm": 0.20221222455542814, "learning_rate": 7.437475113772632e-06, "loss": 1.0017, "loss_nan_ranks": 0, "loss_rank_avg": 0.2918761372566223, "step": 876, "valid_targets_mean": 16160.6, "valid_targets_min": 15234 }, { "epoch": 3.7334754797441363, "grad_norm": 0.18530134539495166, "learning_rate": 7.391276947674932e-06, "loss": 1.0165, "loss_nan_ranks": 0, "loss_rank_avg": 0.21132834255695343, "step": 877, "valid_targets_mean": 11079.2, "valid_targets_min": 1520 }, { "epoch": 3.7377398720682304, "grad_norm": 0.21377599326496985, "learning_rate": 7.345190164999307e-06, "loss": 1.007, "loss_nan_ranks": 0, "loss_rank_avg": 0.24113556742668152, "step": 878, "valid_targets_mean": 15988.7, "valid_targets_min": 14889 }, { "epoch": 3.742004264392324, "grad_norm": 0.18807427523413936, "learning_rate": 7.299215172868947e-06, "loss": 1.0029, "loss_nan_ranks": 0, "loss_rank_avg": 0.3014865517616272, "step": 879, "valid_targets_mean": 16100.1, "valid_targets_min": 15198 }, { "epoch": 3.746268656716418, "grad_norm": 0.17169001499638226, "learning_rate": 7.2533523774194865e-06, "loss": 0.9928, "loss_nan_ranks": 0, "loss_rank_avg": 0.15240547060966492, "step": 880, "valid_targets_mean": 8749.8, "valid_targets_min": 1971 }, { "epoch": 3.750533049040512, "grad_norm": 0.1679285384728096, "learning_rate": 7.2076021837954616e-06, "loss": 0.9577, "loss_nan_ranks": 0, "loss_rank_avg": 0.24019278585910797, "step": 881, "valid_targets_mean": 16235.8, "valid_targets_min": 15737 }, { "epoch": 3.7547974413646057, "grad_norm": 0.19434300770296428, "learning_rate": 7.161964996146689e-06, "loss": 0.9948, "loss_nan_ranks": 0, "loss_rank_avg": 0.28557753562927246, "step": 882, "valid_targets_mean": 16172.3, "valid_targets_min": 15386 }, { "epoch": 3.7590618336886994, "grad_norm": 0.17407388837457433, "learning_rate": 7.116441217624708e-06, "loss": 1.0277, "loss_nan_ranks": 0, "loss_rank_avg": 0.20178121328353882, "step": 883, "valid_targets_mean": 11656.7, "valid_targets_min": 7621 }, { "epoch": 3.763326226012793, "grad_norm": 0.18193248717461616, "learning_rate": 7.071031250379228e-06, "loss": 0.998, "loss_nan_ranks": 0, "loss_rank_avg": 0.2768580913543701, "step": 884, "valid_targets_mean": 16177.2, "valid_targets_min": 15576 }, { "epoch": 3.767590618336887, "grad_norm": 0.18181519483778066, "learning_rate": 7.0257354955545466e-06, "loss": 1.0266, "loss_nan_ranks": 0, "loss_rank_avg": 0.2880393862724304, "step": 885, "valid_targets_mean": 16203.8, "valid_targets_min": 15219 }, { "epoch": 3.771855010660981, "grad_norm": 0.17358900056666338, "learning_rate": 6.980554353286066e-06, "loss": 0.9932, "loss_nan_ranks": 0, "loss_rank_avg": 0.24835087358951569, "step": 886, "valid_targets_mean": 14070.1, "valid_targets_min": 12079 }, { "epoch": 3.7761194029850746, "grad_norm": 0.1969409285627566, "learning_rate": 6.935488222696676e-06, "loss": 1.0337, "loss_nan_ranks": 0, "loss_rank_avg": 0.294018030166626, "step": 887, "valid_targets_mean": 16149.6, "valid_targets_min": 15401 }, { "epoch": 3.7803837953091683, "grad_norm": 0.1790611891295005, "learning_rate": 6.890537501893302e-06, "loss": 1.0152, "loss_nan_ranks": 0, "loss_rank_avg": 0.23835018277168274, "step": 888, "valid_targets_mean": 12633.7, "valid_targets_min": 618 }, { "epoch": 3.7846481876332625, "grad_norm": 0.17338948935102383, "learning_rate": 6.845702587963352e-06, "loss": 1.047, "loss_nan_ranks": 0, "loss_rank_avg": 0.25005704164505005, "step": 889, "valid_targets_mean": 15490.9, "valid_targets_min": 13898 }, { "epoch": 3.788912579957356, "grad_norm": 0.17636192922700825, "learning_rate": 6.800983876971192e-06, "loss": 0.967, "loss_nan_ranks": 0, "loss_rank_avg": 0.277923047542572, "step": 890, "valid_targets_mean": 16048.4, "valid_targets_min": 13573 }, { "epoch": 3.79317697228145, "grad_norm": 0.19529875362281152, "learning_rate": 6.756381763954718e-06, "loss": 1.0392, "loss_nan_ranks": 0, "loss_rank_avg": 0.1701369434595108, "step": 891, "valid_targets_mean": 9984.5, "valid_targets_min": 1676 }, { "epoch": 3.7974413646055436, "grad_norm": 0.1719459899710793, "learning_rate": 6.7118966429217645e-06, "loss": 1.0305, "loss_nan_ranks": 0, "loss_rank_avg": 0.25571155548095703, "step": 892, "valid_targets_mean": 15897.7, "valid_targets_min": 15188 }, { "epoch": 3.8017057569296373, "grad_norm": 0.19200006643367323, "learning_rate": 6.667528906846714e-06, "loss": 1.0152, "loss_nan_ranks": 0, "loss_rank_avg": 0.30839601159095764, "step": 893, "valid_targets_mean": 16174.7, "valid_targets_min": 15665 }, { "epoch": 3.8059701492537314, "grad_norm": 0.17799336332146048, "learning_rate": 6.623278947666974e-06, "loss": 1.0596, "loss_nan_ranks": 0, "loss_rank_avg": 0.19059264659881592, "step": 894, "valid_targets_mean": 10780.8, "valid_targets_min": 6697 }, { "epoch": 3.810234541577825, "grad_norm": 0.18003393409064003, "learning_rate": 6.579147156279538e-06, "loss": 1.017, "loss_nan_ranks": 0, "loss_rank_avg": 0.24897435307502747, "step": 895, "valid_targets_mean": 16181.2, "valid_targets_min": 14287 }, { "epoch": 3.814498933901919, "grad_norm": 0.18280328337121599, "learning_rate": 6.535133922537513e-06, "loss": 1.0184, "loss_nan_ranks": 0, "loss_rank_avg": 0.27476099133491516, "step": 896, "valid_targets_mean": 16171.2, "valid_targets_min": 15437 }, { "epoch": 3.818763326226013, "grad_norm": 0.18875212290983107, "learning_rate": 6.491239635246709e-06, "loss": 1.029, "loss_nan_ranks": 0, "loss_rank_avg": 0.2043631672859192, "step": 897, "valid_targets_mean": 13337.2, "valid_targets_min": 10600 }, { "epoch": 3.8230277185501067, "grad_norm": 0.1804494494953742, "learning_rate": 6.447464682162143e-06, "loss": 1.0278, "loss_nan_ranks": 0, "loss_rank_avg": 0.28921037912368774, "step": 898, "valid_targets_mean": 16177.3, "valid_targets_min": 15404 }, { "epoch": 3.8272921108742004, "grad_norm": 0.19211175028697716, "learning_rate": 6.403809449984704e-06, "loss": 1.0163, "loss_nan_ranks": 0, "loss_rank_avg": 0.2918737530708313, "step": 899, "valid_targets_mean": 16179.9, "valid_targets_min": 15636 }, { "epoch": 3.831556503198294, "grad_norm": 0.1765273759141979, "learning_rate": 6.3602743243576405e-06, "loss": 1.0557, "loss_nan_ranks": 0, "loss_rank_avg": 0.2659085690975189, "step": 900, "valid_targets_mean": 15050.4, "valid_targets_min": 12744 }, { "epoch": 3.835820895522388, "grad_norm": 0.17748639822638573, "learning_rate": 6.316859689863222e-06, "loss": 1.0028, "loss_nan_ranks": 0, "loss_rank_avg": 0.2765544056892395, "step": 901, "valid_targets_mean": 16103.3, "valid_targets_min": 14365 }, { "epoch": 3.840085287846482, "grad_norm": 0.17420461378371643, "learning_rate": 6.273565930019316e-06, "loss": 1.0172, "loss_nan_ranks": 0, "loss_rank_avg": 0.19079825282096863, "step": 902, "valid_targets_mean": 9851.0, "valid_targets_min": 1680 }, { "epoch": 3.8443496801705757, "grad_norm": 0.16560599770246665, "learning_rate": 6.230393427276e-06, "loss": 0.9984, "loss_nan_ranks": 0, "loss_rank_avg": 0.2510971128940582, "step": 903, "valid_targets_mean": 16164.2, "valid_targets_min": 15371 }, { "epoch": 3.8486140724946694, "grad_norm": 0.1792965626692126, "learning_rate": 6.187342563012198e-06, "loss": 0.9932, "loss_nan_ranks": 0, "loss_rank_avg": 0.2955405116081238, "step": 904, "valid_targets_mean": 16153.7, "valid_targets_min": 15258 }, { "epoch": 3.8528784648187635, "grad_norm": 0.17574840664926, "learning_rate": 6.144413717532269e-06, "loss": 0.985, "loss_nan_ranks": 0, "loss_rank_avg": 0.1359398365020752, "step": 905, "valid_targets_mean": 7781.8, "valid_targets_min": 1738 }, { "epoch": 3.857142857142857, "grad_norm": 0.16345377393674543, "learning_rate": 6.1016072700627106e-06, "loss": 1.0492, "loss_nan_ranks": 0, "loss_rank_avg": 0.2529211640357971, "step": 906, "valid_targets_mean": 16108.3, "valid_targets_min": 14821 }, { "epoch": 3.861407249466951, "grad_norm": 0.16703781468036705, "learning_rate": 6.058923598748756e-06, "loss": 1.0049, "loss_nan_ranks": 0, "loss_rank_avg": 0.27441149950027466, "step": 907, "valid_targets_mean": 16135.9, "valid_targets_min": 15182 }, { "epoch": 3.8656716417910446, "grad_norm": 0.18499862087725924, "learning_rate": 6.016363080651066e-06, "loss": 1.0129, "loss_nan_ranks": 0, "loss_rank_avg": 0.22376945614814758, "step": 908, "valid_targets_mean": 12611.5, "valid_targets_min": 9636 }, { "epoch": 3.8699360341151388, "grad_norm": 0.18549970597241158, "learning_rate": 5.973926091742386e-06, "loss": 1.0333, "loss_nan_ranks": 0, "loss_rank_avg": 0.2838277816772461, "step": 909, "valid_targets_mean": 15943.4, "valid_targets_min": 11336 }, { "epoch": 3.8742004264392325, "grad_norm": 0.18280157811663325, "learning_rate": 5.931613006904196e-06, "loss": 0.9666, "loss_nan_ranks": 0, "loss_rank_avg": 0.27379751205444336, "step": 910, "valid_targets_mean": 16215.7, "valid_targets_min": 15773 }, { "epoch": 3.878464818763326, "grad_norm": 0.1670060683446909, "learning_rate": 5.889424199923473e-06, "loss": 1.0194, "loss_nan_ranks": 0, "loss_rank_avg": 0.2533782124519348, "step": 911, "valid_targets_mean": 15084.9, "valid_targets_min": 13687 }, { "epoch": 3.88272921108742, "grad_norm": 0.17872960329716236, "learning_rate": 5.847360043489318e-06, "loss": 1.0414, "loss_nan_ranks": 0, "loss_rank_avg": 0.27177613973617554, "step": 912, "valid_targets_mean": 16055.0, "valid_targets_min": 13080 }, { "epoch": 3.886993603411514, "grad_norm": 0.18737262682718556, "learning_rate": 5.805420909189683e-06, "loss": 0.9968, "loss_nan_ranks": 0, "loss_rank_avg": 0.23658359050750732, "step": 913, "valid_targets_mean": 12997.0, "valid_targets_min": 1489 }, { "epoch": 3.8912579957356077, "grad_norm": 0.19688812946072382, "learning_rate": 5.7636071675081076e-06, "loss": 1.0155, "loss_nan_ranks": 0, "loss_rank_avg": 0.2453310787677765, "step": 914, "valid_targets_mean": 15195.4, "valid_targets_min": 13288 }, { "epoch": 3.8955223880597014, "grad_norm": 0.1801164773199151, "learning_rate": 5.721919187820431e-06, "loss": 1.0186, "loss_nan_ranks": 0, "loss_rank_avg": 0.30522605776786804, "step": 915, "valid_targets_mean": 16162.2, "valid_targets_min": 14786 }, { "epoch": 3.8997867803837956, "grad_norm": 0.20184345060283754, "learning_rate": 5.6803573383915265e-06, "loss": 1.0158, "loss_nan_ranks": 0, "loss_rank_avg": 0.16402074694633484, "step": 916, "valid_targets_mean": 8992.8, "valid_targets_min": 2237 }, { "epoch": 3.9040511727078893, "grad_norm": 0.19429181652200073, "learning_rate": 5.638921986372064e-06, "loss": 1.051, "loss_nan_ranks": 0, "loss_rank_avg": 0.25736844539642334, "step": 917, "valid_targets_mean": 16127.8, "valid_targets_min": 15305 }, { "epoch": 3.908315565031983, "grad_norm": 0.17669068878546865, "learning_rate": 5.5976134977952315e-06, "loss": 1.0119, "loss_nan_ranks": 0, "loss_rank_avg": 0.2880447506904602, "step": 918, "valid_targets_mean": 16123.2, "valid_targets_min": 15121 }, { "epoch": 3.9125799573560767, "grad_norm": 0.17299784357769227, "learning_rate": 5.556432237573564e-06, "loss": 1.0279, "loss_nan_ranks": 0, "loss_rank_avg": 0.2095554769039154, "step": 919, "valid_targets_mean": 11376.9, "valid_targets_min": 7337 }, { "epoch": 3.9168443496801704, "grad_norm": 0.16934613260599296, "learning_rate": 5.5153785694956416e-06, "loss": 0.9933, "loss_nan_ranks": 0, "loss_rank_avg": 0.2432553768157959, "step": 920, "valid_targets_mean": 16196.0, "valid_targets_min": 15345 }, { "epoch": 3.9211087420042645, "grad_norm": 0.18745002576395378, "learning_rate": 5.474452856222942e-06, "loss": 1.0192, "loss_nan_ranks": 0, "loss_rank_avg": 0.3223433494567871, "step": 921, "valid_targets_mean": 15823.3, "valid_targets_min": 4778 }, { "epoch": 3.925373134328358, "grad_norm": 0.16413131624487595, "learning_rate": 5.433655459286611e-06, "loss": 1.0356, "loss_nan_ranks": 0, "loss_rank_avg": 0.23510609567165375, "step": 922, "valid_targets_mean": 13433.8, "valid_targets_min": 9965 }, { "epoch": 3.929637526652452, "grad_norm": 0.17157667668614518, "learning_rate": 5.392986739084238e-06, "loss": 1.0416, "loss_nan_ranks": 0, "loss_rank_avg": 0.28263452649116516, "step": 923, "valid_targets_mean": 16122.8, "valid_targets_min": 15294 }, { "epoch": 3.933901918976546, "grad_norm": 0.18312844983042084, "learning_rate": 5.352447054876755e-06, "loss": 1.0217, "loss_nan_ranks": 0, "loss_rank_avg": 0.2850250005722046, "step": 924, "valid_targets_mean": 16221.2, "valid_targets_min": 15261 }, { "epoch": 3.9381663113006398, "grad_norm": 0.1730633555170915, "learning_rate": 5.31203676478516e-06, "loss": 1.0177, "loss_nan_ranks": 0, "loss_rank_avg": 0.2412496656179428, "step": 925, "valid_targets_mean": 14959.6, "valid_targets_min": 12523 }, { "epoch": 3.9424307036247335, "grad_norm": 0.18254919910899342, "learning_rate": 5.271756225787434e-06, "loss": 1.0219, "loss_nan_ranks": 0, "loss_rank_avg": 0.3025828003883362, "step": 926, "valid_targets_mean": 16134.2, "valid_targets_min": 15345 }, { "epoch": 3.946695095948827, "grad_norm": 0.18547006293160873, "learning_rate": 5.231605793715348e-06, "loss": 1.0402, "loss_nan_ranks": 0, "loss_rank_avg": 0.20674429833889008, "step": 927, "valid_targets_mean": 10423.7, "valid_targets_min": 1155 }, { "epoch": 3.950959488272921, "grad_norm": 0.17483882087778208, "learning_rate": 5.191585823251335e-06, "loss": 1.0086, "loss_nan_ranks": 0, "loss_rank_avg": 0.2677437663078308, "step": 928, "valid_targets_mean": 15745.4, "valid_targets_min": 12492 }, { "epoch": 3.955223880597015, "grad_norm": 0.18340491692906996, "learning_rate": 5.151696667925348e-06, "loss": 1.0196, "loss_nan_ranks": 0, "loss_rank_avg": 0.30543091893196106, "step": 929, "valid_targets_mean": 15883.8, "valid_targets_min": 9286 }, { "epoch": 3.9594882729211087, "grad_norm": 0.17353634019809588, "learning_rate": 5.111938680111732e-06, "loss": 1.0082, "loss_nan_ranks": 0, "loss_rank_avg": 0.15605176985263824, "step": 930, "valid_targets_mean": 8194.7, "valid_targets_min": 2514 }, { "epoch": 3.9637526652452024, "grad_norm": 0.16013301608797142, "learning_rate": 5.072312211026125e-06, "loss": 0.9481, "loss_nan_ranks": 0, "loss_rank_avg": 0.23745262622833252, "step": 931, "valid_targets_mean": 16183.0, "valid_targets_min": 15263 }, { "epoch": 3.9680170575692966, "grad_norm": 0.18752852307138054, "learning_rate": 5.032817610722369e-06, "loss": 1.0416, "loss_nan_ranks": 0, "loss_rank_avg": 0.28059718012809753, "step": 932, "valid_targets_mean": 16226.6, "valid_targets_min": 15460 }, { "epoch": 3.9722814498933903, "grad_norm": 0.16759127501176574, "learning_rate": 4.993455228089366e-06, "loss": 0.98, "loss_nan_ranks": 0, "loss_rank_avg": 0.1952660083770752, "step": 933, "valid_targets_mean": 12267.8, "valid_targets_min": 9004 }, { "epoch": 3.976545842217484, "grad_norm": 0.16670340148359164, "learning_rate": 4.954225410848048e-06, "loss": 1.0271, "loss_nan_ranks": 0, "loss_rank_avg": 0.2915708124637604, "step": 934, "valid_targets_mean": 16006.9, "valid_targets_min": 13688 }, { "epoch": 3.9808102345415777, "grad_norm": 0.1799964499560203, "learning_rate": 4.915128505548284e-06, "loss": 1.0526, "loss_nan_ranks": 0, "loss_rank_avg": 0.29275304079055786, "step": 935, "valid_targets_mean": 16135.8, "valid_targets_min": 14460 }, { "epoch": 3.9850746268656714, "grad_norm": 0.17170353398696742, "learning_rate": 4.8761648575658145e-06, "loss": 0.9824, "loss_nan_ranks": 0, "loss_rank_avg": 0.22930490970611572, "step": 936, "valid_targets_mean": 14490.9, "valid_targets_min": 12290 }, { "epoch": 3.9893390191897655, "grad_norm": 0.17908275507086058, "learning_rate": 4.837334811099217e-06, "loss": 1.041, "loss_nan_ranks": 0, "loss_rank_avg": 0.3175300657749176, "step": 937, "valid_targets_mean": 16084.7, "valid_targets_min": 14795 }, { "epoch": 3.9936034115138592, "grad_norm": 0.16982624399836438, "learning_rate": 4.7986387091668365e-06, "loss": 1.0495, "loss_nan_ranks": 0, "loss_rank_avg": 0.244386225938797, "step": 938, "valid_targets_mean": 13311.0, "valid_targets_min": 1753 }, { "epoch": 3.997867803837953, "grad_norm": 0.17348971376797556, "learning_rate": 4.760076893603791e-06, "loss": 0.9879, "loss_nan_ranks": 0, "loss_rank_avg": 0.24180036783218384, "step": 939, "valid_targets_mean": 16049.2, "valid_targets_min": 15191 }, { "epoch": 4.0, "grad_norm": 0.25328745288321697, "learning_rate": 4.721649705058926e-06, "loss": 0.9824, "loss_nan_ranks": 0, "loss_rank_avg": 0.4427715837955475, "step": 940, "valid_targets_mean": 11319.7, "valid_targets_min": 1545 }, { "epoch": 4.004264392324094, "grad_norm": 0.17162594790757177, "learning_rate": 4.683357482991819e-06, "loss": 0.9659, "loss_nan_ranks": 0, "loss_rank_avg": 0.2455882728099823, "step": 941, "valid_targets_mean": 16066.7, "valid_targets_min": 14483 }, { "epoch": 4.008528784648187, "grad_norm": 0.18660661591121844, "learning_rate": 4.645200565669776e-06, "loss": 1.0174, "loss_nan_ranks": 0, "loss_rank_avg": 0.3127480745315552, "step": 942, "valid_targets_mean": 16023.8, "valid_targets_min": 14103 }, { "epoch": 4.0127931769722816, "grad_norm": 0.1797699085533669, "learning_rate": 4.607179290164823e-06, "loss": 1.0181, "loss_nan_ranks": 0, "loss_rank_avg": 0.21285849809646606, "step": 943, "valid_targets_mean": 13279.5, "valid_targets_min": 10443 }, { "epoch": 4.017057569296376, "grad_norm": 0.1815782872447276, "learning_rate": 4.569293992350783e-06, "loss": 0.9927, "loss_nan_ranks": 0, "loss_rank_avg": 0.26089972257614136, "step": 944, "valid_targets_mean": 16190.7, "valid_targets_min": 14904 }, { "epoch": 4.021321961620469, "grad_norm": 0.18902901787261803, "learning_rate": 4.531545006900244e-06, "loss": 1.0005, "loss_nan_ranks": 0, "loss_rank_avg": 0.29636943340301514, "step": 945, "valid_targets_mean": 16119.8, "valid_targets_min": 15234 }, { "epoch": 4.025586353944563, "grad_norm": 0.16917585233331373, "learning_rate": 4.493932667281646e-06, "loss": 1.0045, "loss_nan_ranks": 0, "loss_rank_avg": 0.2362777590751648, "step": 946, "valid_targets_mean": 14883.1, "valid_targets_min": 12676 }, { "epoch": 4.029850746268656, "grad_norm": 0.17323089731676028, "learning_rate": 4.456457305756321e-06, "loss": 1.0169, "loss_nan_ranks": 0, "loss_rank_avg": 0.29187196493148804, "step": 947, "valid_targets_mean": 16098.3, "valid_targets_min": 15263 }, { "epoch": 4.0341151385927505, "grad_norm": 0.17607985421245612, "learning_rate": 4.419119253375557e-06, "loss": 1.0203, "loss_nan_ranks": 0, "loss_rank_avg": 0.2674245834350586, "step": 948, "valid_targets_mean": 12999.3, "valid_targets_min": 2666 }, { "epoch": 4.038379530916845, "grad_norm": 0.197620639593689, "learning_rate": 4.381918839977675e-06, "loss": 1.0165, "loss_nan_ranks": 0, "loss_rank_avg": 0.25065767765045166, "step": 949, "valid_targets_mean": 15620.4, "valid_targets_min": 13538 }, { "epoch": 4.042643923240938, "grad_norm": 0.19309410606119287, "learning_rate": 4.344856394185122e-06, "loss": 0.9905, "loss_nan_ranks": 0, "loss_rank_avg": 0.3093436360359192, "step": 950, "valid_targets_mean": 16151.6, "valid_targets_min": 15414 }, { "epoch": 4.046908315565032, "grad_norm": 0.17737637616480462, "learning_rate": 4.307932243401538e-06, "loss": 1.0561, "loss_nan_ranks": 0, "loss_rank_avg": 0.17596712708473206, "step": 951, "valid_targets_mean": 9453.4, "valid_targets_min": 1451 }, { "epoch": 4.051172707889126, "grad_norm": 0.15964671170178713, "learning_rate": 4.271146713808927e-06, "loss": 0.9751, "loss_nan_ranks": 0, "loss_rank_avg": 0.24877549707889557, "step": 952, "valid_targets_mean": 16083.6, "valid_targets_min": 13226 }, { "epoch": 4.0554371002132195, "grad_norm": 0.17690684966733292, "learning_rate": 4.234500130364698e-06, "loss": 1.0566, "loss_nan_ranks": 0, "loss_rank_avg": 0.31012070178985596, "step": 953, "valid_targets_mean": 16129.1, "valid_targets_min": 15302 }, { "epoch": 4.059701492537314, "grad_norm": 0.16959319370168027, "learning_rate": 4.197992816798851e-06, "loss": 0.9986, "loss_nan_ranks": 0, "loss_rank_avg": 0.16628019511699677, "step": 954, "valid_targets_mean": 10084.4, "valid_targets_min": 5271 }, { "epoch": 4.063965884861407, "grad_norm": 0.17645660091887394, "learning_rate": 4.161625095611101e-06, "loss": 1.0102, "loss_nan_ranks": 0, "loss_rank_avg": 0.2812536358833313, "step": 955, "valid_targets_mean": 16028.5, "valid_targets_min": 14444 }, { "epoch": 4.068230277185501, "grad_norm": 0.18743764773437324, "learning_rate": 4.125397288068007e-06, "loss": 1.0075, "loss_nan_ranks": 0, "loss_rank_avg": 0.295288622379303, "step": 956, "valid_targets_mean": 16037.3, "valid_targets_min": 15042 }, { "epoch": 4.072494669509595, "grad_norm": 0.16311422806532486, "learning_rate": 4.089309714200187e-06, "loss": 1.0173, "loss_nan_ranks": 0, "loss_rank_avg": 0.2155115008354187, "step": 957, "valid_targets_mean": 12814.3, "valid_targets_min": 10793 }, { "epoch": 4.076759061833688, "grad_norm": 0.17008518119709745, "learning_rate": 4.0533626927994185e-06, "loss": 1.0294, "loss_nan_ranks": 0, "loss_rank_avg": 0.2760984003543854, "step": 958, "valid_targets_mean": 16213.8, "valid_targets_min": 15779 }, { "epoch": 4.081023454157783, "grad_norm": 0.17203247691720971, "learning_rate": 4.017556541415888e-06, "loss": 1.0215, "loss_nan_ranks": 0, "loss_rank_avg": 0.2968873381614685, "step": 959, "valid_targets_mean": 16128.7, "valid_targets_min": 15225 }, { "epoch": 4.085287846481877, "grad_norm": 0.15759084987503583, "learning_rate": 3.981891576355352e-06, "loss": 1.033, "loss_nan_ranks": 0, "loss_rank_avg": 0.23213127255439758, "step": 960, "valid_targets_mean": 14446.7, "valid_targets_min": 12362 }, { "epoch": 4.08955223880597, "grad_norm": 0.16464042746741422, "learning_rate": 3.946368112676346e-06, "loss": 0.9613, "loss_nan_ranks": 0, "loss_rank_avg": 0.2920254170894623, "step": 961, "valid_targets_mean": 16109.6, "valid_targets_min": 15314 }, { "epoch": 4.093816631130064, "grad_norm": 0.17425631840044417, "learning_rate": 3.9109864641874166e-06, "loss": 0.9768, "loss_nan_ranks": 0, "loss_rank_avg": 0.19915470480918884, "step": 962, "valid_targets_mean": 11302.1, "valid_targets_min": 1971 }, { "epoch": 4.098081023454157, "grad_norm": 0.16209513754356383, "learning_rate": 3.875746943444316e-06, "loss": 1.0004, "loss_nan_ranks": 0, "loss_rank_avg": 0.26291438937187195, "step": 963, "valid_targets_mean": 14906.4, "valid_targets_min": 13182 }, { "epoch": 4.1023454157782515, "grad_norm": 0.17081354223050138, "learning_rate": 3.840649861747278e-06, "loss": 1.0001, "loss_nan_ranks": 0, "loss_rank_avg": 0.29953575134277344, "step": 964, "valid_targets_mean": 16189.0, "valid_targets_min": 15541 }, { "epoch": 4.106609808102346, "grad_norm": 0.1677930354720929, "learning_rate": 3.8056955291382667e-06, "loss": 1.0416, "loss_nan_ranks": 0, "loss_rank_avg": 0.15104900300502777, "step": 965, "valid_targets_mean": 8370.9, "valid_targets_min": 1779 }, { "epoch": 4.110874200426439, "grad_norm": 0.16354509231928108, "learning_rate": 3.7708842543981928e-06, "loss": 1.0102, "loss_nan_ranks": 0, "loss_rank_avg": 0.2592680752277374, "step": 966, "valid_targets_mean": 16096.9, "valid_targets_min": 15058 }, { "epoch": 4.115138592750533, "grad_norm": 0.16447018627054752, "learning_rate": 3.736216345044237e-06, "loss": 0.9855, "loss_nan_ranks": 0, "loss_rank_avg": 0.3046714961528778, "step": 967, "valid_targets_mean": 16148.6, "valid_targets_min": 15180 }, { "epoch": 4.119402985074627, "grad_norm": 0.17326586136059488, "learning_rate": 3.7016921073271084e-06, "loss": 1.0408, "loss_nan_ranks": 0, "loss_rank_avg": 0.21079136431217194, "step": 968, "valid_targets_mean": 12434.7, "valid_targets_min": 9731 }, { "epoch": 4.1236673773987205, "grad_norm": 0.15867633625313174, "learning_rate": 3.6673118462283453e-06, "loss": 1.0082, "loss_nan_ranks": 0, "loss_rank_avg": 0.25667932629585266, "step": 969, "valid_targets_mean": 16190.2, "valid_targets_min": 15606 }, { "epoch": 4.127931769722815, "grad_norm": 0.17485078203246107, "learning_rate": 3.6330758654576227e-06, "loss": 0.9784, "loss_nan_ranks": 0, "loss_rank_avg": 0.2849656343460083, "step": 970, "valid_targets_mean": 16164.5, "valid_targets_min": 14793 }, { "epoch": 4.132196162046908, "grad_norm": 0.15447506956117477, "learning_rate": 3.598984467450055e-06, "loss": 1.0411, "loss_nan_ranks": 0, "loss_rank_avg": 0.2483430951833725, "step": 971, "valid_targets_mean": 14369.9, "valid_targets_min": 12092 }, { "epoch": 4.136460554371002, "grad_norm": 0.17016881271259185, "learning_rate": 3.565037953363546e-06, "loss": 1.0143, "loss_nan_ranks": 0, "loss_rank_avg": 0.2875226140022278, "step": 972, "valid_targets_mean": 16104.4, "valid_targets_min": 15148 }, { "epoch": 4.140724946695096, "grad_norm": 0.17959212116223483, "learning_rate": 3.5312366230761154e-06, "loss": 1.0354, "loss_nan_ranks": 0, "loss_rank_avg": 0.23283183574676514, "step": 973, "valid_targets_mean": 13172.6, "valid_targets_min": 3256 }, { "epoch": 4.144989339019189, "grad_norm": 0.15432162678640157, "learning_rate": 3.497580775183258e-06, "loss": 0.9921, "loss_nan_ranks": 0, "loss_rank_avg": 0.25189337134361267, "step": 974, "valid_targets_mean": 15601.2, "valid_targets_min": 14121 }, { "epoch": 4.149253731343284, "grad_norm": 0.1634454106505598, "learning_rate": 3.464070706995295e-06, "loss": 1.0218, "loss_nan_ranks": 0, "loss_rank_avg": 0.3254646956920624, "step": 975, "valid_targets_mean": 16042.2, "valid_targets_min": 14897 }, { "epoch": 4.153518123667378, "grad_norm": 0.1708252383415284, "learning_rate": 3.4307067145347417e-06, "loss": 1.038, "loss_nan_ranks": 0, "loss_rank_avg": 0.18007853627204895, "step": 976, "valid_targets_mean": 8586.8, "valid_targets_min": 1768 }, { "epoch": 4.157782515991471, "grad_norm": 0.1542398896632874, "learning_rate": 3.397489092533739e-06, "loss": 1.0342, "loss_nan_ranks": 0, "loss_rank_avg": 0.2551620900630951, "step": 977, "valid_targets_mean": 16131.9, "valid_targets_min": 15537 }, { "epoch": 4.162046908315565, "grad_norm": 0.18247902007514508, "learning_rate": 3.364418134431371e-06, "loss": 1.0482, "loss_nan_ranks": 0, "loss_rank_avg": 0.3169439136981964, "step": 978, "valid_targets_mean": 16057.0, "valid_targets_min": 15080 }, { "epoch": 4.166311300639659, "grad_norm": 0.16694802259065614, "learning_rate": 3.331494132371149e-06, "loss": 0.9846, "loss_nan_ranks": 0, "loss_rank_avg": 0.18681488931179047, "step": 979, "valid_targets_mean": 10399.8, "valid_targets_min": 5144 }, { "epoch": 4.1705756929637525, "grad_norm": 0.16907813619908482, "learning_rate": 3.2987173771983816e-06, "loss": 1.0193, "loss_nan_ranks": 0, "loss_rank_avg": 0.26041150093078613, "step": 980, "valid_targets_mean": 16078.6, "valid_targets_min": 14547 }, { "epoch": 4.174840085287847, "grad_norm": 0.1770777712940949, "learning_rate": 3.266088158457634e-06, "loss": 0.9868, "loss_nan_ranks": 0, "loss_rank_avg": 0.3240050673484802, "step": 981, "valid_targets_mean": 16150.1, "valid_targets_min": 15327 }, { "epoch": 4.17910447761194, "grad_norm": 0.15912496641507942, "learning_rate": 3.233606764390147e-06, "loss": 1.0079, "loss_nan_ranks": 0, "loss_rank_avg": 0.24741700291633606, "step": 982, "valid_targets_mean": 14295.7, "valid_targets_min": 11896 }, { "epoch": 4.183368869936034, "grad_norm": 0.16265146944586914, "learning_rate": 3.2012734819313127e-06, "loss": 0.9714, "loss_nan_ranks": 0, "loss_rank_avg": 0.27438461780548096, "step": 983, "valid_targets_mean": 16193.6, "valid_targets_min": 15576 }, { "epoch": 4.187633262260128, "grad_norm": 0.16083598802712898, "learning_rate": 3.1690885967081187e-06, "loss": 1.0139, "loss_nan_ranks": 0, "loss_rank_avg": 0.30279818177223206, "step": 984, "valid_targets_mean": 16187.3, "valid_targets_min": 15688 }, { "epoch": 4.1918976545842215, "grad_norm": 0.14979200671170342, "learning_rate": 3.1370523930366393e-06, "loss": 1.0096, "loss_nan_ranks": 0, "loss_rank_avg": 0.232590913772583, "step": 985, "valid_targets_mean": 15108.0, "valid_targets_min": 13057 }, { "epoch": 4.196162046908316, "grad_norm": 0.17621147779251822, "learning_rate": 3.105165153919525e-06, "loss": 1.0543, "loss_nan_ranks": 0, "loss_rank_avg": 0.3233955502510071, "step": 986, "valid_targets_mean": 16057.4, "valid_targets_min": 13080 }, { "epoch": 4.20042643923241, "grad_norm": 0.1756035801626048, "learning_rate": 3.073427161043492e-06, "loss": 1.0446, "loss_nan_ranks": 0, "loss_rank_avg": 0.19718195497989655, "step": 987, "valid_targets_mean": 10671.0, "valid_targets_min": 1160 }, { "epoch": 4.204690831556503, "grad_norm": 0.1658033352673812, "learning_rate": 3.0418386947768463e-06, "loss": 1.0348, "loss_nan_ranks": 0, "loss_rank_avg": 0.2562304735183716, "step": 988, "valid_targets_mean": 15663.9, "valid_targets_min": 13837 }, { "epoch": 4.208955223880597, "grad_norm": 0.1682898687908902, "learning_rate": 3.01040003416698e-06, "loss": 1.0535, "loss_nan_ranks": 0, "loss_rank_avg": 0.3200420141220093, "step": 989, "valid_targets_mean": 16049.9, "valid_targets_min": 14594 }, { "epoch": 4.21321961620469, "grad_norm": 0.16795589651540707, "learning_rate": 2.97911145693796e-06, "loss": 0.9836, "loss_nan_ranks": 0, "loss_rank_avg": 0.15380680561065674, "step": 990, "valid_targets_mean": 8766.8, "valid_targets_min": 1535 }, { "epoch": 4.217484008528785, "grad_norm": 0.15635899916733167, "learning_rate": 2.947973239488009e-06, "loss": 1.0194, "loss_nan_ranks": 0, "loss_rank_avg": 0.25666990876197815, "step": 991, "valid_targets_mean": 16073.6, "valid_targets_min": 13538 }, { "epoch": 4.221748400852879, "grad_norm": 0.18479556506671047, "learning_rate": 2.91698565688711e-06, "loss": 1.0424, "loss_nan_ranks": 0, "loss_rank_avg": 0.3063018321990967, "step": 992, "valid_targets_mean": 16132.2, "valid_targets_min": 15545 }, { "epoch": 4.226012793176972, "grad_norm": 0.16647450476412914, "learning_rate": 2.886148982874566e-06, "loss": 0.9808, "loss_nan_ranks": 0, "loss_rank_avg": 0.1856815069913864, "step": 993, "valid_targets_mean": 12287.9, "valid_targets_min": 10321 }, { "epoch": 4.230277185501066, "grad_norm": 0.1650596049711428, "learning_rate": 2.8554634898565668e-06, "loss": 1.0019, "loss_nan_ranks": 0, "loss_rank_avg": 0.27796709537506104, "step": 994, "valid_targets_mean": 16178.9, "valid_targets_min": 15636 }, { "epoch": 4.23454157782516, "grad_norm": 0.1809480512413989, "learning_rate": 2.824929448903806e-06, "loss": 0.9823, "loss_nan_ranks": 0, "loss_rank_avg": 0.28689736127853394, "step": 995, "valid_targets_mean": 16156.2, "valid_targets_min": 14699 }, { "epoch": 4.2388059701492535, "grad_norm": 0.15370745546883308, "learning_rate": 2.794547129749059e-06, "loss": 0.9896, "loss_nan_ranks": 0, "loss_rank_avg": 0.23388049006462097, "step": 996, "valid_targets_mean": 14443.9, "valid_targets_min": 12790 }, { "epoch": 4.243070362473348, "grad_norm": 0.16203382511484396, "learning_rate": 2.7643168007848255e-06, "loss": 0.9708, "loss_nan_ranks": 0, "loss_rank_avg": 0.27245384454727173, "step": 997, "valid_targets_mean": 16089.3, "valid_targets_min": 15042 }, { "epoch": 4.247334754797441, "grad_norm": 0.16967353030673493, "learning_rate": 2.734238729060956e-06, "loss": 1.0114, "loss_nan_ranks": 0, "loss_rank_avg": 0.20903266966342926, "step": 998, "valid_targets_mean": 13288.2, "valid_targets_min": 1630 }, { "epoch": 4.251599147121535, "grad_norm": 0.168705045038412, "learning_rate": 2.7043131802822653e-06, "loss": 1.0119, "loss_nan_ranks": 0, "loss_rank_avg": 0.257682740688324, "step": 999, "valid_targets_mean": 15930.2, "valid_targets_min": 14795 }, { "epoch": 4.255863539445629, "grad_norm": 0.19231465994332417, "learning_rate": 2.674540418806222e-06, "loss": 1.0501, "loss_nan_ranks": 0, "loss_rank_avg": 0.3070492744445801, "step": 1000, "valid_targets_mean": 16080.7, "valid_targets_min": 14917 }, { "epoch": 4.2601279317697225, "grad_norm": 0.1710007863233519, "learning_rate": 2.6449207076405857e-06, "loss": 1.0332, "loss_nan_ranks": 0, "loss_rank_avg": 0.18669047951698303, "step": 1001, "valid_targets_mean": 9100.4, "valid_targets_min": 1545 }, { "epoch": 4.264392324093817, "grad_norm": 0.16262781178453378, "learning_rate": 2.6154543084411035e-06, "loss": 0.9947, "loss_nan_ranks": 0, "loss_rank_avg": 0.23665502667427063, "step": 1002, "valid_targets_mean": 16176.8, "valid_targets_min": 15348 }, { "epoch": 4.268656716417911, "grad_norm": 0.17595307243521127, "learning_rate": 2.5861414815091834e-06, "loss": 1.0022, "loss_nan_ranks": 0, "loss_rank_avg": 0.29712724685668945, "step": 1003, "valid_targets_mean": 16140.2, "valid_targets_min": 14907 }, { "epoch": 4.272921108742004, "grad_norm": 0.15446894931777008, "learning_rate": 2.5569824857895987e-06, "loss": 0.9775, "loss_nan_ranks": 0, "loss_rank_avg": 0.15721696615219116, "step": 1004, "valid_targets_mean": 10518.3, "valid_targets_min": 5601 }, { "epoch": 4.277185501066098, "grad_norm": 0.16471914325864995, "learning_rate": 2.5279775788682083e-06, "loss": 0.9857, "loss_nan_ranks": 0, "loss_rank_avg": 0.25779882073402405, "step": 1005, "valid_targets_mean": 16179.2, "valid_targets_min": 15505 }, { "epoch": 4.281449893390192, "grad_norm": 0.16593655371423804, "learning_rate": 2.499127016969671e-06, "loss": 1.0034, "loss_nan_ranks": 0, "loss_rank_avg": 0.3106514811515808, "step": 1006, "valid_targets_mean": 16071.4, "valid_targets_min": 14103 }, { "epoch": 4.285714285714286, "grad_norm": 0.15988426257142174, "learning_rate": 2.4704310549551934e-06, "loss": 1.0443, "loss_nan_ranks": 0, "loss_rank_avg": 0.2495417445898056, "step": 1007, "valid_targets_mean": 15003.7, "valid_targets_min": 12787 }, { "epoch": 4.28997867803838, "grad_norm": 0.1649193232476725, "learning_rate": 2.441889946320266e-06, "loss": 0.9922, "loss_nan_ranks": 0, "loss_rank_avg": 0.27028751373291016, "step": 1008, "valid_targets_mean": 16140.7, "valid_targets_min": 15389 }, { "epoch": 4.294243070362473, "grad_norm": 0.16539209263258192, "learning_rate": 2.4135039431924233e-06, "loss": 1.0159, "loss_nan_ranks": 0, "loss_rank_avg": 0.3285196125507355, "step": 1009, "valid_targets_mean": 16154.0, "valid_targets_min": 15556 }, { "epoch": 4.298507462686567, "grad_norm": 0.15009629164504895, "learning_rate": 2.3852732963290426e-06, "loss": 0.9767, "loss_nan_ranks": 0, "loss_rank_avg": 0.22692888975143433, "step": 1010, "valid_targets_mean": 15455.0, "valid_targets_min": 13975 }, { "epoch": 4.302771855010661, "grad_norm": 0.17494261785315382, "learning_rate": 2.3571982551150853e-06, "loss": 1.0086, "loss_nan_ranks": 0, "loss_rank_avg": 0.2918718755245209, "step": 1011, "valid_targets_mean": 16222.7, "valid_targets_min": 15806 }, { "epoch": 4.3070362473347545, "grad_norm": 0.16531887286752694, "learning_rate": 2.329279067560937e-06, "loss": 1.018, "loss_nan_ranks": 0, "loss_rank_avg": 0.19952315092086792, "step": 1012, "valid_targets_mean": 11263.8, "valid_targets_min": 2852 }, { "epoch": 4.311300639658849, "grad_norm": 0.15243334089024038, "learning_rate": 2.301515980300182e-06, "loss": 0.9703, "loss_nan_ranks": 0, "loss_rank_avg": 0.24621377885341644, "step": 1013, "valid_targets_mean": 15904.6, "valid_targets_min": 14269 }, { "epoch": 4.315565031982943, "grad_norm": 0.1696156362286878, "learning_rate": 2.2739092385874527e-06, "loss": 1.0225, "loss_nan_ranks": 0, "loss_rank_avg": 0.31331756711006165, "step": 1014, "valid_targets_mean": 15890.2, "valid_targets_min": 13080 }, { "epoch": 4.319829424307036, "grad_norm": 0.16944189227686046, "learning_rate": 2.2464590862962443e-06, "loss": 1.0715, "loss_nan_ranks": 0, "loss_rank_avg": 0.15785104036331177, "step": 1015, "valid_targets_mean": 9874.5, "valid_targets_min": 1763 }, { "epoch": 4.32409381663113, "grad_norm": 0.15163721169159744, "learning_rate": 2.219165765916769e-06, "loss": 0.9763, "loss_nan_ranks": 0, "loss_rank_avg": 0.25100529193878174, "step": 1016, "valid_targets_mean": 16141.7, "valid_targets_min": 15225 }, { "epoch": 4.3283582089552235, "grad_norm": 0.16139062458464656, "learning_rate": 2.192029518553798e-06, "loss": 1.0176, "loss_nan_ranks": 0, "loss_rank_avg": 0.27301234006881714, "step": 1017, "valid_targets_mean": 16163.5, "valid_targets_min": 15023 }, { "epoch": 4.332622601279318, "grad_norm": 0.16698422619677605, "learning_rate": 2.165050583924566e-06, "loss": 1.0073, "loss_nan_ranks": 0, "loss_rank_avg": 0.17534929513931274, "step": 1018, "valid_targets_mean": 10685.0, "valid_targets_min": 8089 }, { "epoch": 4.336886993603412, "grad_norm": 0.15697779416050714, "learning_rate": 2.1382292003566163e-06, "loss": 0.9786, "loss_nan_ranks": 0, "loss_rank_avg": 0.26187610626220703, "step": 1019, "valid_targets_mean": 16124.3, "valid_targets_min": 14958 }, { "epoch": 4.341151385927505, "grad_norm": 0.16866112206724562, "learning_rate": 2.1115656047857213e-06, "loss": 1.0342, "loss_nan_ranks": 0, "loss_rank_avg": 0.31126171350479126, "step": 1020, "valid_targets_mean": 16112.7, "valid_targets_min": 14259 }, { "epoch": 4.345415778251599, "grad_norm": 0.15065213807725636, "learning_rate": 2.0850600327537806e-06, "loss": 1.0104, "loss_nan_ranks": 0, "loss_rank_avg": 0.22538825869560242, "step": 1021, "valid_targets_mean": 14805.6, "valid_targets_min": 12847 }, { "epoch": 4.349680170575693, "grad_norm": 0.16502741819996938, "learning_rate": 2.058712718406719e-06, "loss": 0.9824, "loss_nan_ranks": 0, "loss_rank_avg": 0.26563185453414917, "step": 1022, "valid_targets_mean": 16220.5, "valid_targets_min": 15492 }, { "epoch": 4.353944562899787, "grad_norm": 0.1573403450572898, "learning_rate": 2.032523894492471e-06, "loss": 0.9938, "loss_nan_ranks": 0, "loss_rank_avg": 0.2223053276538849, "step": 1023, "valid_targets_mean": 13809.1, "valid_targets_min": 1400 }, { "epoch": 4.358208955223881, "grad_norm": 0.15014771494971305, "learning_rate": 2.0064937923588634e-06, "loss": 0.9892, "loss_nan_ranks": 0, "loss_rank_avg": 0.24883639812469482, "step": 1024, "valid_targets_mean": 15233.9, "valid_targets_min": 13301 }, { "epoch": 4.362473347547974, "grad_norm": 0.17815349436266908, "learning_rate": 1.9806226419516195e-06, "loss": 1.0345, "loss_nan_ranks": 0, "loss_rank_avg": 0.33343401551246643, "step": 1025, "valid_targets_mean": 16119.5, "valid_targets_min": 15337 }, { "epoch": 4.366737739872068, "grad_norm": 0.1571520268395417, "learning_rate": 1.954910671812298e-06, "loss": 0.9604, "loss_nan_ranks": 0, "loss_rank_avg": 0.16843195259571075, "step": 1026, "valid_targets_mean": 10671.9, "valid_targets_min": 1922 }, { "epoch": 4.371002132196162, "grad_norm": 0.1600877305624945, "learning_rate": 1.9293581090762894e-06, "loss": 0.9774, "loss_nan_ranks": 0, "loss_rank_avg": 0.25779786705970764, "step": 1027, "valid_targets_mean": 16111.6, "valid_targets_min": 15024 }, { "epoch": 4.3752665245202556, "grad_norm": 0.1640378891646234, "learning_rate": 1.9039651794708058e-06, "loss": 1.0046, "loss_nan_ranks": 0, "loss_rank_avg": 0.30417150259017944, "step": 1028, "valid_targets_mean": 16166.4, "valid_targets_min": 15153 }, { "epoch": 4.37953091684435, "grad_norm": 0.1592978210094137, "learning_rate": 1.8787321073128817e-06, "loss": 1.0003, "loss_nan_ranks": 0, "loss_rank_avg": 0.1675044298171997, "step": 1029, "valid_targets_mean": 10813.5, "valid_targets_min": 7229 }, { "epoch": 4.383795309168444, "grad_norm": 0.15196142418764982, "learning_rate": 1.8536591155073958e-06, "loss": 1.0349, "loss_nan_ranks": 0, "loss_rank_avg": 0.26272517442703247, "step": 1030, "valid_targets_mean": 16132.2, "valid_targets_min": 13998 }, { "epoch": 4.388059701492537, "grad_norm": 0.16137244722688085, "learning_rate": 1.8287464255451181e-06, "loss": 1.0366, "loss_nan_ranks": 0, "loss_rank_avg": 0.31955209374427795, "step": 1031, "valid_targets_mean": 16103.5, "valid_targets_min": 15221 }, { "epoch": 4.392324093816631, "grad_norm": 0.1560253877137604, "learning_rate": 1.803994257500714e-06, "loss": 1.0578, "loss_nan_ranks": 0, "loss_rank_avg": 0.22638271749019623, "step": 1032, "valid_targets_mean": 12657.4, "valid_targets_min": 10184 }, { "epoch": 4.396588486140725, "grad_norm": 0.1592937648378557, "learning_rate": 1.7794028300308474e-06, "loss": 0.97, "loss_nan_ranks": 0, "loss_rank_avg": 0.27584147453308105, "step": 1033, "valid_targets_mean": 16116.2, "valid_targets_min": 14473 }, { "epoch": 4.400852878464819, "grad_norm": 0.15663526905175879, "learning_rate": 1.7549723603722003e-06, "loss": 0.9841, "loss_nan_ranks": 0, "loss_rank_avg": 0.26768210530281067, "step": 1034, "valid_targets_mean": 16112.7, "valid_targets_min": 13108 }, { "epoch": 4.405117270788913, "grad_norm": 0.15097542648465498, "learning_rate": 1.730703064339605e-06, "loss": 1.0184, "loss_nan_ranks": 0, "loss_rank_avg": 0.2370276004076004, "step": 1035, "valid_targets_mean": 15234.6, "valid_targets_min": 13039 }, { "epoch": 4.409381663113006, "grad_norm": 0.16244715692164918, "learning_rate": 1.7065951563241022e-06, "loss": 1.013, "loss_nan_ranks": 0, "loss_rank_avg": 0.2689659297466278, "step": 1036, "valid_targets_mean": 16181.4, "valid_targets_min": 15559 }, { "epoch": 4.4136460554371, "grad_norm": 0.15813153445282555, "learning_rate": 1.682648849291051e-06, "loss": 1.0179, "loss_nan_ranks": 0, "loss_rank_avg": 0.20376157760620117, "step": 1037, "valid_targets_mean": 11859.0, "valid_targets_min": 1729 }, { "epoch": 4.417910447761194, "grad_norm": 0.1510387947396715, "learning_rate": 1.6588643547782579e-06, "loss": 0.9837, "loss_nan_ranks": 0, "loss_rank_avg": 0.26324427127838135, "step": 1038, "valid_targets_mean": 16072.0, "valid_targets_min": 14287 }, { "epoch": 4.422174840085288, "grad_norm": 0.1631530373592602, "learning_rate": 1.6352418828941052e-06, "loss": 1.021, "loss_nan_ranks": 0, "loss_rank_avg": 0.30005693435668945, "step": 1039, "valid_targets_mean": 16157.0, "valid_targets_min": 15147 }, { "epoch": 4.426439232409382, "grad_norm": 0.1653269557190585, "learning_rate": 1.6117816423156952e-06, "loss": 1.0062, "loss_nan_ranks": 0, "loss_rank_avg": 0.1579434871673584, "step": 1040, "valid_targets_mean": 8889.2, "valid_targets_min": 2228 }, { "epoch": 4.430703624733475, "grad_norm": 0.14601140512061164, "learning_rate": 1.5884838402870029e-06, "loss": 0.9856, "loss_nan_ranks": 0, "loss_rank_avg": 0.24858561158180237, "step": 1041, "valid_targets_mean": 15932.7, "valid_targets_min": 9286 }, { "epoch": 4.434968017057569, "grad_norm": 0.1592912536183881, "learning_rate": 1.5653486826170384e-06, "loss": 1.01, "loss_nan_ranks": 0, "loss_rank_avg": 0.284557580947876, "step": 1042, "valid_targets_mean": 16150.2, "valid_targets_min": 14556 }, { "epoch": 4.439232409381663, "grad_norm": 0.14634296882098108, "learning_rate": 1.5423763736780583e-06, "loss": 0.9726, "loss_nan_ranks": 0, "loss_rank_avg": 0.19540275633335114, "step": 1043, "valid_targets_mean": 11303.3, "valid_targets_min": 8757 }, { "epoch": 4.443496801705757, "grad_norm": 0.1606028911978746, "learning_rate": 1.5195671164037173e-06, "loss": 1.0075, "loss_nan_ranks": 0, "loss_rank_avg": 0.26238173246383667, "step": 1044, "valid_targets_mean": 16184.0, "valid_targets_min": 15290 }, { "epoch": 4.447761194029851, "grad_norm": 0.15880887563413223, "learning_rate": 1.496921112287315e-06, "loss": 1.0156, "loss_nan_ranks": 0, "loss_rank_avg": 0.28872594237327576, "step": 1045, "valid_targets_mean": 16116.8, "valid_targets_min": 14479 }, { "epoch": 4.452025586353945, "grad_norm": 0.1503886439979893, "learning_rate": 1.4744385613799894e-06, "loss": 0.991, "loss_nan_ranks": 0, "loss_rank_avg": 0.23140674829483032, "step": 1046, "valid_targets_mean": 15366.7, "valid_targets_min": 14043 }, { "epoch": 4.456289978678038, "grad_norm": 0.15398807665192815, "learning_rate": 1.4521196622889644e-06, "loss": 1.0175, "loss_nan_ranks": 0, "loss_rank_avg": 0.28529155254364014, "step": 1047, "valid_targets_mean": 16143.6, "valid_targets_min": 15408 }, { "epoch": 4.460554371002132, "grad_norm": 0.15846972825741604, "learning_rate": 1.4299646121757892e-06, "loss": 0.9533, "loss_nan_ranks": 0, "loss_rank_avg": 0.21494928002357483, "step": 1048, "valid_targets_mean": 12775.2, "valid_targets_min": 1665 }, { "epoch": 4.464818763326226, "grad_norm": 0.14883790923907791, "learning_rate": 1.4079736067545912e-06, "loss": 1.0303, "loss_nan_ranks": 0, "loss_rank_avg": 0.26430243253707886, "step": 1049, "valid_targets_mean": 15916.8, "valid_targets_min": 13208 }, { "epoch": 4.46908315565032, "grad_norm": 0.15949849865118698, "learning_rate": 1.3861468402903634e-06, "loss": 1.0528, "loss_nan_ranks": 0, "loss_rank_avg": 0.3019446134567261, "step": 1050, "valid_targets_mean": 15767.2, "valid_targets_min": 7641 }, { "epoch": 4.473347547974414, "grad_norm": 0.16006328824608898, "learning_rate": 1.3644845055972322e-06, "loss": 1.0067, "loss_nan_ranks": 0, "loss_rank_avg": 0.17121657729148865, "step": 1051, "valid_targets_mean": 9511.8, "valid_targets_min": 1923 }, { "epoch": 4.477611940298507, "grad_norm": 0.1520066722967756, "learning_rate": 1.3429867940367626e-06, "loss": 1.0094, "loss_nan_ranks": 0, "loss_rank_avg": 0.25051623582839966, "step": 1052, "valid_targets_mean": 16088.7, "valid_targets_min": 14698 }, { "epoch": 4.481876332622601, "grad_norm": 0.15543351987099552, "learning_rate": 1.321653895516264e-06, "loss": 1.058, "loss_nan_ranks": 0, "loss_rank_avg": 0.3083563446998596, "step": 1053, "valid_targets_mean": 16089.3, "valid_targets_min": 14313 }, { "epoch": 4.486140724946695, "grad_norm": 0.15500162373470328, "learning_rate": 1.3004859984871199e-06, "loss": 1.0584, "loss_nan_ranks": 0, "loss_rank_avg": 0.1911185383796692, "step": 1054, "valid_targets_mean": 10396.3, "valid_targets_min": 6721 }, { "epoch": 4.490405117270789, "grad_norm": 0.15723817636653856, "learning_rate": 1.279483289943102e-06, "loss": 1.0568, "loss_nan_ranks": 0, "loss_rank_avg": 0.262037068605423, "step": 1055, "valid_targets_mean": 16159.7, "valid_targets_min": 15182 }, { "epoch": 4.494669509594883, "grad_norm": 0.16006229679549797, "learning_rate": 1.2586459554187558e-06, "loss": 0.9644, "loss_nan_ranks": 0, "loss_rank_avg": 0.28707319498062134, "step": 1056, "valid_targets_mean": 16055.6, "valid_targets_min": 11563 }, { "epoch": 4.498933901918977, "grad_norm": 0.14334699676474721, "learning_rate": 1.2379741789877175e-06, "loss": 0.9871, "loss_nan_ranks": 0, "loss_rank_avg": 0.2111390084028244, "step": 1057, "valid_targets_mean": 13391.1, "valid_targets_min": 11725 }, { "epoch": 4.50319829424307, "grad_norm": 0.1530149837424847, "learning_rate": 1.2174681432611245e-06, "loss": 1.0221, "loss_nan_ranks": 0, "loss_rank_avg": 0.3102961480617523, "step": 1058, "valid_targets_mean": 16118.4, "valid_targets_min": 15359 }, { "epoch": 4.507462686567164, "grad_norm": 0.1666265526562195, "learning_rate": 1.1971280293859811e-06, "loss": 1.0477, "loss_nan_ranks": 0, "loss_rank_avg": 0.2946819067001343, "step": 1059, "valid_targets_mean": 16146.3, "valid_targets_min": 15305 }, { "epoch": 4.5117270788912585, "grad_norm": 0.1457230775806161, "learning_rate": 1.17695401704357e-06, "loss": 1.0072, "loss_nan_ranks": 0, "loss_rank_avg": 0.25192567706108093, "step": 1060, "valid_targets_mean": 15245.5, "valid_targets_min": 13728 }, { "epoch": 4.515991471215352, "grad_norm": 0.1620480528171536, "learning_rate": 1.1569462844478552e-06, "loss": 0.9563, "loss_nan_ranks": 0, "loss_rank_avg": 0.2645701766014099, "step": 1061, "valid_targets_mean": 16195.4, "valid_targets_min": 15305 }, { "epoch": 4.520255863539446, "grad_norm": 0.16142683707754352, "learning_rate": 1.1371050083439107e-06, "loss": 1.0315, "loss_nan_ranks": 0, "loss_rank_avg": 0.19992002844810486, "step": 1062, "valid_targets_mean": 10561.4, "valid_targets_min": 1369 }, { "epoch": 4.524520255863539, "grad_norm": 0.14622862418070282, "learning_rate": 1.1174303640063622e-06, "loss": 1.0269, "loss_nan_ranks": 0, "loss_rank_avg": 0.2594802975654602, "step": 1063, "valid_targets_mean": 16008.1, "valid_targets_min": 15016 }, { "epoch": 4.528784648187633, "grad_norm": 0.1582067915541115, "learning_rate": 1.097922525237849e-06, "loss": 0.9584, "loss_nan_ranks": 0, "loss_rank_avg": 0.27360403537750244, "step": 1064, "valid_targets_mean": 16250.7, "valid_targets_min": 15657 }, { "epoch": 4.533049040511727, "grad_norm": 0.15399864010070974, "learning_rate": 1.078581664367455e-06, "loss": 1.0058, "loss_nan_ranks": 0, "loss_rank_avg": 0.1768619269132614, "step": 1065, "valid_targets_mean": 9856.1, "valid_targets_min": 1136 }, { "epoch": 4.537313432835821, "grad_norm": 0.15167944596731006, "learning_rate": 1.0594079522492274e-06, "loss": 0.9306, "loss_nan_ranks": 0, "loss_rank_avg": 0.25108233094215393, "step": 1066, "valid_targets_mean": 16141.2, "valid_targets_min": 14841 }, { "epoch": 4.541577825159915, "grad_norm": 0.16155044487851364, "learning_rate": 1.040401558260633e-06, "loss": 1.0514, "loss_nan_ranks": 0, "loss_rank_avg": 0.29427772760391235, "step": 1067, "valid_targets_mean": 16152.6, "valid_targets_min": 15628 }, { "epoch": 4.545842217484008, "grad_norm": 0.1608449787433378, "learning_rate": 1.0215626503010911e-06, "loss": 1.032, "loss_nan_ranks": 0, "loss_rank_avg": 0.21294349431991577, "step": 1068, "valid_targets_mean": 12159.6, "valid_targets_min": 10098 }, { "epoch": 4.550106609808102, "grad_norm": 0.14555507264167167, "learning_rate": 1.002891394790475e-06, "loss": 1.0014, "loss_nan_ranks": 0, "loss_rank_avg": 0.27116233110427856, "step": 1069, "valid_targets_mean": 16114.3, "valid_targets_min": 15154 }, { "epoch": 4.554371002132196, "grad_norm": 0.15514665887054913, "learning_rate": 9.843879566676273e-07, "loss": 1.0051, "loss_nan_ranks": 0, "loss_rank_avg": 0.2847168445587158, "step": 1070, "valid_targets_mean": 16146.2, "valid_targets_min": 15081 }, { "epoch": 4.55863539445629, "grad_norm": 0.14935522772969523, "learning_rate": 9.660524993889386e-07, "loss": 1.0106, "loss_nan_ranks": 0, "loss_rank_avg": 0.22059902548789978, "step": 1071, "valid_targets_mean": 14322.9, "valid_targets_min": 12453 }, { "epoch": 4.562899786780384, "grad_norm": 0.1508180934872635, "learning_rate": 9.478851849268733e-07, "loss": 0.9695, "loss_nan_ranks": 0, "loss_rank_avg": 0.26452839374542236, "step": 1072, "valid_targets_mean": 16183.2, "valid_targets_min": 15361 }, { "epoch": 4.567164179104478, "grad_norm": 0.15771190777876098, "learning_rate": 9.298861737685527e-07, "loss": 0.9916, "loss_nan_ranks": 0, "loss_rank_avg": 0.22417476773262024, "step": 1073, "valid_targets_mean": 13273.8, "valid_targets_min": 1961 }, { "epoch": 4.571428571428571, "grad_norm": 0.14841479834324803, "learning_rate": 9.120556249143341e-07, "loss": 1.0185, "loss_nan_ranks": 0, "loss_rank_avg": 0.2562493681907654, "step": 1074, "valid_targets_mean": 15460.6, "valid_targets_min": 13041 }, { "epoch": 4.575692963752665, "grad_norm": 0.15977629857912234, "learning_rate": 8.943936958763988e-07, "loss": 1.0483, "loss_nan_ranks": 0, "loss_rank_avg": 0.3335935175418854, "step": 1075, "valid_targets_mean": 16153.5, "valid_targets_min": 15474 }, { "epoch": 4.5799573560767595, "grad_norm": 0.16477286952064188, "learning_rate": 8.769005426773836e-07, "loss": 1.0093, "loss_nan_ranks": 0, "loss_rank_avg": 0.15570859611034393, "step": 1076, "valid_targets_mean": 8296.6, "valid_targets_min": 1759 }, { "epoch": 4.584221748400853, "grad_norm": 0.14398661458138798, "learning_rate": 8.595763198489714e-07, "loss": 0.991, "loss_nan_ranks": 0, "loss_rank_avg": 0.25216251611709595, "step": 1077, "valid_targets_mean": 15818.3, "valid_targets_min": 7637 }, { "epoch": 4.588486140724947, "grad_norm": 0.15797679062016337, "learning_rate": 8.42421180430546e-07, "loss": 1.0011, "loss_nan_ranks": 0, "loss_rank_avg": 0.2939158082008362, "step": 1078, "valid_targets_mean": 16082.0, "valid_targets_min": 14558 }, { "epoch": 4.59275053304904, "grad_norm": 0.15853786185199106, "learning_rate": 8.254352759678386e-07, "loss": 1.0096, "loss_nan_ranks": 0, "loss_rank_avg": 0.1950775682926178, "step": 1079, "valid_targets_mean": 10988.8, "valid_targets_min": 7524 }, { "epoch": 4.597014925373134, "grad_norm": 0.15315161643048186, "learning_rate": 8.086187565115877e-07, "loss": 1.0579, "loss_nan_ranks": 0, "loss_rank_avg": 0.27116912603378296, "step": 1080, "valid_targets_mean": 16105.0, "valid_targets_min": 14248 }, { "epoch": 4.601279317697228, "grad_norm": 0.15729652259472846, "learning_rate": 7.919717706162067e-07, "loss": 1.0249, "loss_nan_ranks": 0, "loss_rank_avg": 0.289058119058609, "step": 1081, "valid_targets_mean": 16170.6, "valid_targets_min": 15348 }, { "epoch": 4.605543710021322, "grad_norm": 0.15299507799822196, "learning_rate": 7.754944653384777e-07, "loss": 0.9961, "loss_nan_ranks": 0, "loss_rank_avg": 0.2105131447315216, "step": 1082, "valid_targets_mean": 13349.8, "valid_targets_min": 10099 }, { "epoch": 4.609808102345416, "grad_norm": 0.15991928398901403, "learning_rate": 7.591869862362534e-07, "loss": 1.0078, "loss_nan_ranks": 0, "loss_rank_avg": 0.26621466875076294, "step": 1083, "valid_targets_mean": 16033.9, "valid_targets_min": 13427 }, { "epoch": 4.61407249466951, "grad_norm": 0.15354881551455993, "learning_rate": 7.430494773671682e-07, "loss": 0.9676, "loss_nan_ranks": 0, "loss_rank_avg": 0.30778414011001587, "step": 1084, "valid_targets_mean": 16172.6, "valid_targets_min": 15109 }, { "epoch": 4.618336886993603, "grad_norm": 0.1743479691706049, "learning_rate": 7.270820812873714e-07, "loss": 1.0087, "loss_nan_ranks": 0, "loss_rank_avg": 0.2505803108215332, "step": 1085, "valid_targets_mean": 14830.2, "valid_targets_min": 12981 }, { "epoch": 4.622601279317697, "grad_norm": 0.15448738581055893, "learning_rate": 7.112849390502563e-07, "loss": 0.9816, "loss_nan_ranks": 0, "loss_rank_avg": 0.26799455285072327, "step": 1086, "valid_targets_mean": 16209.5, "valid_targets_min": 15350 }, { "epoch": 4.6268656716417915, "grad_norm": 0.15706645950649392, "learning_rate": 6.956581902052306e-07, "loss": 1.0225, "loss_nan_ranks": 0, "loss_rank_avg": 0.20473934710025787, "step": 1087, "valid_targets_mean": 11744.4, "valid_targets_min": 2102 }, { "epoch": 4.631130063965885, "grad_norm": 0.143365373014936, "learning_rate": 6.802019727964593e-07, "loss": 0.9888, "loss_nan_ranks": 0, "loss_rank_avg": 0.2392513006925583, "step": 1088, "valid_targets_mean": 16153.6, "valid_targets_min": 15511 }, { "epoch": 4.635394456289979, "grad_norm": 0.15945068466229714, "learning_rate": 6.64916423361679e-07, "loss": 1.0181, "loss_nan_ranks": 0, "loss_rank_avg": 0.2937304973602295, "step": 1089, "valid_targets_mean": 16096.2, "valid_targets_min": 15122 }, { "epoch": 4.639658848614072, "grad_norm": 0.1591581081828491, "learning_rate": 6.498016769309567e-07, "loss": 1.0082, "loss_nan_ranks": 0, "loss_rank_avg": 0.1473933458328247, "step": 1090, "valid_targets_mean": 8071.3, "valid_targets_min": 2493 }, { "epoch": 4.643923240938166, "grad_norm": 0.13705684735753473, "learning_rate": 6.348578670255224e-07, "loss": 1.0004, "loss_nan_ranks": 0, "loss_rank_avg": 0.2415798306465149, "step": 1091, "valid_targets_mean": 16186.2, "valid_targets_min": 15270 }, { "epoch": 4.6481876332622605, "grad_norm": 0.14894995926384885, "learning_rate": 6.200851256565799e-07, "loss": 1.0026, "loss_nan_ranks": 0, "loss_rank_avg": 0.29065680503845215, "step": 1092, "valid_targets_mean": 15866.9, "valid_targets_min": 5993 }, { "epoch": 4.652452025586354, "grad_norm": 0.14628259051610237, "learning_rate": 6.054835833241357e-07, "loss": 0.9657, "loss_nan_ranks": 0, "loss_rank_avg": 0.20221902430057526, "step": 1093, "valid_targets_mean": 13206.6, "valid_targets_min": 10096 }, { "epoch": 4.656716417910448, "grad_norm": 0.1465313831298571, "learning_rate": 5.910533690158593e-07, "loss": 1.0124, "loss_nan_ranks": 0, "loss_rank_avg": 0.25688618421554565, "step": 1094, "valid_targets_mean": 16232.6, "valid_targets_min": 15734 }, { "epoch": 4.660980810234541, "grad_norm": 0.14879824830331395, "learning_rate": 5.767946102059307e-07, "loss": 0.9861, "loss_nan_ranks": 0, "loss_rank_avg": 0.276365727186203, "step": 1095, "valid_targets_mean": 16205.2, "valid_targets_min": 15637 }, { "epoch": 4.665245202558635, "grad_norm": 0.14986577980104723, "learning_rate": 5.627074328539173e-07, "loss": 1.0086, "loss_nan_ranks": 0, "loss_rank_avg": 0.22488278150558472, "step": 1096, "valid_targets_mean": 13320.2, "valid_targets_min": 11667 }, { "epoch": 4.669509594882729, "grad_norm": 0.15263641354366045, "learning_rate": 5.487919614036741e-07, "loss": 1.0345, "loss_nan_ranks": 0, "loss_rank_avg": 0.2853548526763916, "step": 1097, "valid_targets_mean": 16139.1, "valid_targets_min": 14753 }, { "epoch": 4.673773987206823, "grad_norm": 0.15304900679796296, "learning_rate": 5.350483187822231e-07, "loss": 1.03, "loss_nan_ranks": 0, "loss_rank_avg": 0.25601962208747864, "step": 1098, "valid_targets_mean": 12700.3, "valid_targets_min": 1472 }, { "epoch": 4.678038379530917, "grad_norm": 0.13864305612866518, "learning_rate": 5.214766263986848e-07, "loss": 1.0247, "loss_nan_ranks": 0, "loss_rank_avg": 0.2643899917602539, "step": 1099, "valid_targets_mean": 15921.6, "valid_targets_min": 15264 }, { "epoch": 4.682302771855011, "grad_norm": 0.1585008120687658, "learning_rate": 5.080770041431926e-07, "loss": 0.9869, "loss_nan_ranks": 0, "loss_rank_avg": 0.2867545485496521, "step": 1100, "valid_targets_mean": 16070.0, "valid_targets_min": 13688 }, { "epoch": 4.686567164179104, "grad_norm": 0.15796797836556023, "learning_rate": 4.948495703858492e-07, "loss": 0.9744, "loss_nan_ranks": 0, "loss_rank_avg": 0.14525067806243896, "step": 1101, "valid_targets_mean": 8999.8, "valid_targets_min": 1416 }, { "epoch": 4.690831556503198, "grad_norm": 0.14332859110714966, "learning_rate": 4.81794441975667e-07, "loss": 1.0161, "loss_nan_ranks": 0, "loss_rank_avg": 0.26003924012184143, "step": 1102, "valid_targets_mean": 16092.8, "valid_targets_min": 14994 }, { "epoch": 4.6950959488272925, "grad_norm": 0.1627151240096481, "learning_rate": 4.689117342395388e-07, "loss": 0.9894, "loss_nan_ranks": 0, "loss_rank_avg": 0.27263838052749634, "step": 1103, "valid_targets_mean": 16196.6, "valid_targets_min": 15475 }, { "epoch": 4.699360341151386, "grad_norm": 0.15728636158959014, "learning_rate": 4.5620156098122204e-07, "loss": 1.0145, "loss_nan_ranks": 0, "loss_rank_avg": 0.19399403035640717, "step": 1104, "valid_targets_mean": 10582.8, "valid_targets_min": 5279 }, { "epoch": 4.70362473347548, "grad_norm": 0.14868122226793565, "learning_rate": 4.4366403448033334e-07, "loss": 1.024, "loss_nan_ranks": 0, "loss_rank_avg": 0.25753432512283325, "step": 1105, "valid_targets_mean": 16152.5, "valid_targets_min": 15082 }, { "epoch": 4.707889125799573, "grad_norm": 0.1556625193647965, "learning_rate": 4.3129926549136057e-07, "loss": 1.0442, "loss_nan_ranks": 0, "loss_rank_avg": 0.2863929867744446, "step": 1106, "valid_targets_mean": 16147.2, "valid_targets_min": 15112 }, { "epoch": 4.712153518123667, "grad_norm": 0.14446145619265383, "learning_rate": 4.191073632426701e-07, "loss": 0.9751, "loss_nan_ranks": 0, "loss_rank_avg": 0.21357882022857666, "step": 1107, "valid_targets_mean": 13378.2, "valid_targets_min": 10566 }, { "epoch": 4.7164179104477615, "grad_norm": 0.16206675648159802, "learning_rate": 4.0708843543555643e-07, "loss": 0.9997, "loss_nan_ranks": 0, "loss_rank_avg": 0.2900570034980774, "step": 1108, "valid_targets_mean": 15993.5, "valid_targets_min": 10506 }, { "epoch": 4.720682302771855, "grad_norm": 0.15101141923399938, "learning_rate": 3.95242588243292e-07, "loss": 0.9856, "loss_nan_ranks": 0, "loss_rank_avg": 0.2901330888271332, "step": 1109, "valid_targets_mean": 16143.4, "valid_targets_min": 15280 }, { "epoch": 4.724946695095949, "grad_norm": 0.14621637188831488, "learning_rate": 3.8356992631017e-07, "loss": 1.0324, "loss_nan_ranks": 0, "loss_rank_avg": 0.23136021196842194, "step": 1110, "valid_targets_mean": 15238.5, "valid_targets_min": 13159 }, { "epoch": 4.729211087420042, "grad_norm": 0.1524386161010507, "learning_rate": 3.720705527506008e-07, "loss": 1.0195, "loss_nan_ranks": 0, "loss_rank_avg": 0.30147069692611694, "step": 1111, "valid_targets_mean": 16091.4, "valid_targets_min": 14723 }, { "epoch": 4.733475479744136, "grad_norm": 0.1619679827146892, "learning_rate": 3.60744569148197e-07, "loss": 1.066, "loss_nan_ranks": 0, "loss_rank_avg": 0.20357254147529602, "step": 1112, "valid_targets_mean": 11411.5, "valid_targets_min": 2225 }, { "epoch": 4.73773987206823, "grad_norm": 0.14349005246341898, "learning_rate": 3.4959207555485873e-07, "loss": 1.0372, "loss_nan_ranks": 0, "loss_rank_avg": 0.27663302421569824, "step": 1113, "valid_targets_mean": 15943.1, "valid_targets_min": 14159 }, { "epoch": 4.742004264392325, "grad_norm": 0.16716344154424714, "learning_rate": 3.3861317048992317e-07, "loss": 1.04, "loss_nan_ranks": 0, "loss_rank_avg": 0.3008594214916229, "step": 1114, "valid_targets_mean": 16178.0, "valid_targets_min": 15181 }, { "epoch": 4.746268656716418, "grad_norm": 0.14277538969640619, "learning_rate": 3.278079509392562e-07, "loss": 0.97, "loss_nan_ranks": 0, "loss_rank_avg": 0.17491425573825836, "step": 1115, "valid_targets_mean": 9657.3, "valid_targets_min": 3062 }, { "epoch": 4.750533049040512, "grad_norm": 0.1411692924943566, "learning_rate": 3.171765123544224e-07, "loss": 1.0159, "loss_nan_ranks": 0, "loss_rank_avg": 0.25507792830467224, "step": 1116, "valid_targets_mean": 16089.0, "valid_targets_min": 13436 }, { "epoch": 4.754797441364605, "grad_norm": 0.15818532876299207, "learning_rate": 3.06718948651834e-07, "loss": 1.0006, "loss_nan_ranks": 0, "loss_rank_avg": 0.2846674919128418, "step": 1117, "valid_targets_mean": 16174.9, "valid_targets_min": 15128 }, { "epoch": 4.759061833688699, "grad_norm": 0.14543713743713674, "learning_rate": 2.964353522119168e-07, "loss": 1.0132, "loss_nan_ranks": 0, "loss_rank_avg": 0.2241479456424713, "step": 1118, "valid_targets_mean": 13306.7, "valid_targets_min": 11186 }, { "epoch": 4.7633262260127935, "grad_norm": 0.15406571881357786, "learning_rate": 2.863258138783032e-07, "loss": 1.0327, "loss_nan_ranks": 0, "loss_rank_avg": 0.29350900650024414, "step": 1119, "valid_targets_mean": 16107.2, "valid_targets_min": 15308 }, { "epoch": 4.767590618336887, "grad_norm": 0.1454041308304772, "learning_rate": 2.7639042295702245e-07, "loss": 0.9931, "loss_nan_ranks": 0, "loss_rank_avg": 0.2819235026836395, "step": 1120, "valid_targets_mean": 16163.9, "valid_targets_min": 15717 }, { "epoch": 4.771855010660981, "grad_norm": 0.14077932344598632, "learning_rate": 2.666292672157056e-07, "loss": 0.9905, "loss_nan_ranks": 0, "loss_rank_avg": 0.23407378792762756, "step": 1121, "valid_targets_mean": 15291.8, "valid_targets_min": 13903 }, { "epoch": 4.776119402985074, "grad_norm": 0.1608947735935997, "learning_rate": 2.570424328828325e-07, "loss": 1.01, "loss_nan_ranks": 0, "loss_rank_avg": 0.2588140070438385, "step": 1122, "valid_targets_mean": 16229.8, "valid_targets_min": 15610 }, { "epoch": 4.780383795309168, "grad_norm": 0.15743473018186965, "learning_rate": 2.4763000464694377e-07, "loss": 1.0033, "loss_nan_ranks": 0, "loss_rank_avg": 0.23125317692756653, "step": 1123, "valid_targets_mean": 12867.4, "valid_targets_min": 1501 }, { "epoch": 4.7846481876332625, "grad_norm": 0.14635899385747156, "learning_rate": 2.383920656559102e-07, "loss": 1.0252, "loss_nan_ranks": 0, "loss_rank_avg": 0.2757848799228668, "step": 1124, "valid_targets_mean": 15862.7, "valid_targets_min": 14853 }, { "epoch": 4.788912579957356, "grad_norm": 0.15057907442569857, "learning_rate": 2.2932869751619568e-07, "loss": 0.983, "loss_nan_ranks": 0, "loss_rank_avg": 0.2796521782875061, "step": 1125, "valid_targets_mean": 16139.7, "valid_targets_min": 14793 }, { "epoch": 4.79317697228145, "grad_norm": 0.15462099524501327, "learning_rate": 2.2043998029212643e-07, "loss": 1.0425, "loss_nan_ranks": 0, "loss_rank_avg": 0.19477930665016174, "step": 1126, "valid_targets_mean": 10342.5, "valid_targets_min": 1758 }, { "epoch": 4.797441364605544, "grad_norm": 0.14428333450435837, "learning_rate": 2.1172599250519398e-07, "loss": 0.998, "loss_nan_ranks": 0, "loss_rank_avg": 0.23206013441085815, "step": 1127, "valid_targets_mean": 16088.4, "valid_targets_min": 14763 }, { "epoch": 4.801705756929637, "grad_norm": 0.15760507966173962, "learning_rate": 2.0318681113336013e-07, "loss": 1.0299, "loss_nan_ranks": 0, "loss_rank_avg": 0.2897353768348694, "step": 1128, "valid_targets_mean": 16119.7, "valid_targets_min": 14736 }, { "epoch": 4.8059701492537314, "grad_norm": 0.14776221098452197, "learning_rate": 1.9482251161037302e-07, "loss": 0.9977, "loss_nan_ranks": 0, "loss_rank_avg": 0.1809859275817871, "step": 1129, "valid_targets_mean": 9719.4, "valid_targets_min": 5689 }, { "epoch": 4.810234541577826, "grad_norm": 0.14661112551393696, "learning_rate": 1.866331678251032e-07, "loss": 1.0252, "loss_nan_ranks": 0, "loss_rank_avg": 0.2804567217826843, "step": 1130, "valid_targets_mean": 16003.1, "valid_targets_min": 13828 }, { "epoch": 4.814498933901919, "grad_norm": 0.14900277046790783, "learning_rate": 1.7861885212088869e-07, "loss": 0.9969, "loss_nan_ranks": 0, "loss_rank_avg": 0.28320544958114624, "step": 1131, "valid_targets_mean": 15943.6, "valid_targets_min": 13414 }, { "epoch": 4.818763326226013, "grad_norm": 0.14358657341847153, "learning_rate": 1.7077963529490204e-07, "loss": 0.9993, "loss_nan_ranks": 0, "loss_rank_avg": 0.21058914065361023, "step": 1132, "valid_targets_mean": 13237.8, "valid_targets_min": 10666 }, { "epoch": 4.823027718550106, "grad_norm": 0.1503311290624774, "learning_rate": 1.6311558659751535e-07, "loss": 0.9778, "loss_nan_ranks": 0, "loss_rank_avg": 0.2585322856903076, "step": 1133, "valid_targets_mean": 16197.3, "valid_targets_min": 14919 }, { "epoch": 4.8272921108742, "grad_norm": 0.15520941024351134, "learning_rate": 1.5562677373169855e-07, "loss": 1.0642, "loss_nan_ranks": 0, "loss_rank_avg": 0.31580662727355957, "step": 1134, "valid_targets_mean": 15890.8, "valid_targets_min": 11287 }, { "epoch": 4.8315565031982945, "grad_norm": 0.14840007430449761, "learning_rate": 1.483132628524131e-07, "loss": 1.0291, "loss_nan_ranks": 0, "loss_rank_avg": 0.24786341190338135, "step": 1135, "valid_targets_mean": 14563.6, "valid_targets_min": 12694 }, { "epoch": 4.835820895522388, "grad_norm": 0.15658968069087506, "learning_rate": 1.4117511856603262e-07, "loss": 1.0482, "loss_nan_ranks": 0, "loss_rank_avg": 0.30078184604644775, "step": 1136, "valid_targets_mean": 16095.4, "valid_targets_min": 15282 }, { "epoch": 4.840085287846482, "grad_norm": 0.15285312174229707, "learning_rate": 1.342124039297721e-07, "loss": 1.0314, "loss_nan_ranks": 0, "loss_rank_avg": 0.19714577496051788, "step": 1137, "valid_targets_mean": 10712.7, "valid_targets_min": 983 }, { "epoch": 4.844349680170575, "grad_norm": 0.14167262709410533, "learning_rate": 1.2742518045112396e-07, "loss": 1.0354, "loss_nan_ranks": 0, "loss_rank_avg": 0.2605418562889099, "step": 1138, "valid_targets_mean": 15546.0, "valid_targets_min": 14178 }, { "epoch": 4.848614072494669, "grad_norm": 0.15674575697411522, "learning_rate": 1.2081350808732518e-07, "loss": 1.0282, "loss_nan_ranks": 0, "loss_rank_avg": 0.31616824865341187, "step": 1139, "valid_targets_mean": 16119.0, "valid_targets_min": 15332 }, { "epoch": 4.8528784648187635, "grad_norm": 0.15423989041611458, "learning_rate": 1.143774452448243e-07, "loss": 1.0315, "loss_nan_ranks": 0, "loss_rank_avg": 0.16706404089927673, "step": 1140, "valid_targets_mean": 9525.8, "valid_targets_min": 4937 }, { "epoch": 4.857142857142857, "grad_norm": 0.14447090658394057, "learning_rate": 1.0811704877875528e-07, "loss": 0.9732, "loss_nan_ranks": 0, "loss_rank_avg": 0.24503830075263977, "step": 1141, "valid_targets_mean": 16191.3, "valid_targets_min": 15163 }, { "epoch": 4.861407249466951, "grad_norm": 0.1615026471556301, "learning_rate": 1.0203237399245336e-07, "loss": 1.0181, "loss_nan_ranks": 0, "loss_rank_avg": 0.28254231810569763, "step": 1142, "valid_targets_mean": 16124.7, "valid_targets_min": 15328 }, { "epoch": 4.865671641791045, "grad_norm": 0.14928773912115367, "learning_rate": 9.612347463694882e-08, "loss": 1.0314, "loss_nan_ranks": 0, "loss_rank_avg": 0.19812950491905212, "step": 1143, "valid_targets_mean": 12115.9, "valid_targets_min": 9191 }, { "epoch": 4.869936034115138, "grad_norm": 0.15010321527120785, "learning_rate": 9.039040291050738e-08, "loss": 0.9814, "loss_nan_ranks": 0, "loss_rank_avg": 0.2673875689506531, "step": 1144, "valid_targets_mean": 16236.7, "valid_targets_min": 15773 }, { "epoch": 4.8742004264392325, "grad_norm": 0.15861682212571024, "learning_rate": 8.483320945815499e-08, "loss": 1.0056, "loss_nan_ranks": 0, "loss_rank_avg": 0.2802891731262207, "step": 1145, "valid_targets_mean": 16165.2, "valid_targets_min": 14819 }, { "epoch": 4.878464818763327, "grad_norm": 0.13882421330125413, "learning_rate": 7.945194337124262e-08, "loss": 1.0089, "loss_nan_ranks": 0, "loss_rank_avg": 0.2199188768863678, "step": 1146, "valid_targets_mean": 14201.6, "valid_targets_min": 11573 }, { "epoch": 4.88272921108742, "grad_norm": 0.1470938082355776, "learning_rate": 7.424665218700444e-08, "loss": 1.0122, "loss_nan_ranks": 0, "loss_rank_avg": 0.2924698293209076, "step": 1147, "valid_targets_mean": 16140.8, "valid_targets_min": 15359 }, { "epoch": 4.886993603411514, "grad_norm": 0.14990143490007027, "learning_rate": 6.921738188814254e-08, "loss": 0.9767, "loss_nan_ranks": 0, "loss_rank_avg": 0.2214415818452835, "step": 1148, "valid_targets_mean": 13035.8, "valid_targets_min": 2380 }, { "epoch": 4.891257995735607, "grad_norm": 0.14054548406236866, "learning_rate": 6.436417690241614e-08, "loss": 0.9932, "loss_nan_ranks": 0, "loss_rank_avg": 0.27612608671188354, "step": 1149, "valid_targets_mean": 15234.4, "valid_targets_min": 13564 }, { "epoch": 4.895522388059701, "grad_norm": 0.15582504420991788, "learning_rate": 5.968708010225532e-08, "loss": 0.949, "loss_nan_ranks": 0, "loss_rank_avg": 0.27208343148231506, "step": 1150, "valid_targets_mean": 16216.5, "valid_targets_min": 15713 }, { "epoch": 4.899786780383796, "grad_norm": 0.15383698638285176, "learning_rate": 5.518613280437901e-08, "loss": 1.0332, "loss_nan_ranks": 0, "loss_rank_avg": 0.17712029814720154, "step": 1151, "valid_targets_mean": 9263.9, "valid_targets_min": 930 }, { "epoch": 4.904051172707889, "grad_norm": 0.1421412073915396, "learning_rate": 5.0861374769426433e-08, "loss": 1.0092, "loss_nan_ranks": 0, "loss_rank_avg": 0.26269394159317017, "step": 1152, "valid_targets_mean": 15946.3, "valid_targets_min": 14850 }, { "epoch": 4.908315565031983, "grad_norm": 0.1600097468312609, "learning_rate": 4.671284420161071e-08, "loss": 1.0605, "loss_nan_ranks": 0, "loss_rank_avg": 0.32577964663505554, "step": 1153, "valid_targets_mean": 15997.7, "valid_targets_min": 14732 }, { "epoch": 4.912579957356077, "grad_norm": 0.15738714930436676, "learning_rate": 4.274057774838136e-08, "loss": 1.0205, "loss_nan_ranks": 0, "loss_rank_avg": 0.18098321557044983, "step": 1154, "valid_targets_mean": 10754.5, "valid_targets_min": 7226 }, { "epoch": 4.91684434968017, "grad_norm": 0.14450740335662998, "learning_rate": 3.894461050010012e-08, "loss": 1.0047, "loss_nan_ranks": 0, "loss_rank_avg": 0.27671700716018677, "step": 1155, "valid_targets_mean": 16053.7, "valid_targets_min": 15223 }, { "epoch": 4.9211087420042645, "grad_norm": 0.15489667907035298, "learning_rate": 3.5324975989725615e-08, "loss": 0.9844, "loss_nan_ranks": 0, "loss_rank_avg": 0.30148401856422424, "step": 1156, "valid_targets_mean": 16156.8, "valid_targets_min": 15596 }, { "epoch": 4.925373134328359, "grad_norm": 0.14276493452378128, "learning_rate": 3.188170619252473e-08, "loss": 0.9553, "loss_nan_ranks": 0, "loss_rank_avg": 0.20629984140396118, "step": 1157, "valid_targets_mean": 12721.6, "valid_targets_min": 10683 }, { "epoch": 4.929637526652452, "grad_norm": 0.1499066761403792, "learning_rate": 2.8614831525786147e-08, "loss": 0.9996, "loss_nan_ranks": 0, "loss_rank_avg": 0.26819825172424316, "step": 1158, "valid_targets_mean": 16143.8, "valid_targets_min": 14124 }, { "epoch": 4.933901918976546, "grad_norm": 0.1546352831828286, "learning_rate": 2.552438084855613e-08, "loss": 1.0172, "loss_nan_ranks": 0, "loss_rank_avg": 0.29075586795806885, "step": 1159, "valid_targets_mean": 16117.7, "valid_targets_min": 14424 }, { "epoch": 4.938166311300639, "grad_norm": 0.14296264281771326, "learning_rate": 2.2610381461372068e-08, "loss": 1.0429, "loss_nan_ranks": 0, "loss_rank_avg": 0.27615079283714294, "step": 1160, "valid_targets_mean": 15388.0, "valid_targets_min": 13731 }, { "epoch": 4.9424307036247335, "grad_norm": 0.1486321420613884, "learning_rate": 1.987285910603598e-08, "loss": 0.9986, "loss_nan_ranks": 0, "loss_rank_avg": 0.29423749446868896, "step": 1161, "valid_targets_mean": 16165.4, "valid_targets_min": 15308 }, { "epoch": 4.946695095948828, "grad_norm": 0.1549221284940577, "learning_rate": 1.7311837965379164e-08, "loss": 0.9956, "loss_nan_ranks": 0, "loss_rank_avg": 0.19188982248306274, "step": 1162, "valid_targets_mean": 10865.3, "valid_targets_min": 1443 }, { "epoch": 4.950959488272921, "grad_norm": 0.14892217565418125, "learning_rate": 1.4927340663046798e-08, "loss": 1.0422, "loss_nan_ranks": 0, "loss_rank_avg": 0.26834145188331604, "step": 1163, "valid_targets_mean": 16131.4, "valid_targets_min": 14555 }, { "epoch": 4.955223880597015, "grad_norm": 0.1517686797669809, "learning_rate": 1.2719388263300325e-08, "loss": 1.0194, "loss_nan_ranks": 0, "loss_rank_avg": 0.2813887596130371, "step": 1164, "valid_targets_mean": 16143.4, "valid_targets_min": 15234 }, { "epoch": 4.959488272921108, "grad_norm": 0.15087023278229247, "learning_rate": 1.0688000270839827e-08, "loss": 1.0049, "loss_nan_ranks": 0, "loss_rank_avg": 0.17231392860412598, "step": 1165, "valid_targets_mean": 9892.4, "valid_targets_min": 1676 }, { "epoch": 4.963752665245202, "grad_norm": 0.14010312630125438, "learning_rate": 8.833194630615271e-09, "loss": 1.0094, "loss_nan_ranks": 0, "loss_rank_avg": 0.25139176845550537, "step": 1166, "valid_targets_mean": 16117.2, "valid_targets_min": 14248 }, { "epoch": 4.968017057569297, "grad_norm": 0.14920848498253594, "learning_rate": 7.154987727682194e-09, "loss": 0.9357, "loss_nan_ranks": 0, "loss_rank_avg": 0.2747774124145508, "step": 1167, "valid_targets_mean": 16177.2, "valid_targets_min": 15498 }, { "epoch": 4.97228144989339, "grad_norm": 0.14459040867917233, "learning_rate": 5.6533943870462625e-09, "loss": 1.0106, "loss_nan_ranks": 0, "loss_rank_avg": 0.20723284780979156, "step": 1168, "valid_targets_mean": 12527.4, "valid_targets_min": 9734 }, { "epoch": 4.976545842217484, "grad_norm": 0.14742734957961473, "learning_rate": 4.328427873541152e-09, "loss": 1.0015, "loss_nan_ranks": 0, "loss_rank_avg": 0.24740174412727356, "step": 1169, "valid_targets_mean": 16187.4, "valid_targets_min": 15278 }, { "epoch": 4.980810234541578, "grad_norm": 0.1569923184042177, "learning_rate": 3.1800998917086432e-09, "loss": 1.0297, "loss_nan_ranks": 0, "loss_rank_avg": 0.2794538736343384, "step": 1170, "valid_targets_mean": 16146.8, "valid_targets_min": 15337 }, { "epoch": 4.985074626865671, "grad_norm": 0.14694235426435637, "learning_rate": 2.2084205856920393e-09, "loss": 1.02, "loss_nan_ranks": 0, "loss_rank_avg": 0.22485260665416718, "step": 1171, "valid_targets_mean": 14174.9, "valid_targets_min": 11882 }, { "epoch": 4.9893390191897655, "grad_norm": 0.1503276282480094, "learning_rate": 1.4133985391473482e-09, "loss": 1.0201, "loss_nan_ranks": 0, "loss_rank_avg": 0.2849038541316986, "step": 1172, "valid_targets_mean": 16147.8, "valid_targets_min": 14958 }, { "epoch": 4.99360341151386, "grad_norm": 0.15542866475604034, "learning_rate": 7.950407751722288e-10, "loss": 1.0032, "loss_nan_ranks": 0, "loss_rank_avg": 0.25908148288726807, "step": 1173, "valid_targets_mean": 12998.6, "valid_targets_min": 1158 }, { "epoch": 4.997867803837953, "grad_norm": 0.1441501696307319, "learning_rate": 3.5335275624159835e-10, "loss": 1.0496, "loss_nan_ranks": 0, "loss_rank_avg": 0.24824313819408417, "step": 1174, "valid_targets_mean": 15772.4, "valid_targets_min": 14853 }, { "epoch": 5.0, "grad_norm": 0.22893672755573746, "learning_rate": 8.833838415212014e-11, "loss": 1.0091, "loss_nan_ranks": 0, "loss_rank_avg": 0.4849323630332947, "step": 1175, "valid_targets_mean": 11353.3, "valid_targets_min": 2084 }, { "epoch": 5.0, "loss_nan_ranks": 0, "loss_rank_avg": 0.4849323630332947, "step": 1175, "total_flos": 1940656491724800.0, "train_loss": 1.0709928606926127, "train_runtime": 5219.2407, "train_samples_per_second": 28.74, "train_steps_per_second": 0.225, "valid_targets_mean": 11353.3, "valid_targets_min": 2084 } ], "logging_steps": 1, "max_steps": 1175, "num_input_tokens_seen": 0, "num_train_epochs": 5, "save_steps": 500, "stateful_callbacks": { "TrainerControl": { "args": { "should_epoch_stop": false, "should_evaluate": false, "should_log": false, "should_save": true, "should_training_stop": true }, "attributes": {} } }, "total_flos": 1940656491724800.0, "train_batch_size": 1, "trial_name": null, "trial_params": null }