{ "best_global_step": null, "best_metric": null, "best_model_checkpoint": null, "epoch": 7.0, "eval_steps": 500, "global_step": 4326, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.008090614886731391, "grad_norm": 27.459321741406143, "learning_rate": 3.695150115473441e-07, "loss": 0.9065, "loss_nan_ranks": 0, "loss_rank_avg": 0.9109030961990356, "step": 5, "valid_targets_mean": 3808.2, "valid_targets_min": 426 }, { "epoch": 0.016181229773462782, "grad_norm": 28.139176144208395, "learning_rate": 8.314087759815243e-07, "loss": 0.896, "loss_nan_ranks": 0, "loss_rank_avg": 0.9023652672767639, "step": 10, "valid_targets_mean": 3801.5, "valid_targets_min": 1847 }, { "epoch": 0.024271844660194174, "grad_norm": 25.93354792492918, "learning_rate": 1.2933025404157046e-06, "loss": 0.8805, "loss_nan_ranks": 0, "loss_rank_avg": 0.8771004676818848, "step": 15, "valid_targets_mean": 3371.9, "valid_targets_min": 419 }, { "epoch": 0.032362459546925564, "grad_norm": 17.810433239456163, "learning_rate": 1.7551963048498846e-06, "loss": 0.7848, "loss_nan_ranks": 0, "loss_rank_avg": 0.7335680723190308, "step": 20, "valid_targets_mean": 3780.7, "valid_targets_min": 725 }, { "epoch": 0.040453074433656956, "grad_norm": 11.26352797874236, "learning_rate": 2.217090069284065e-06, "loss": 0.7078, "loss_nan_ranks": 0, "loss_rank_avg": 0.70474773645401, "step": 25, "valid_targets_mean": 3891.1, "valid_targets_min": 1957 }, { "epoch": 0.04854368932038835, "grad_norm": 5.655520832965064, "learning_rate": 2.678983833718245e-06, "loss": 0.6187, "loss_nan_ranks": 0, "loss_rank_avg": 0.5794852375984192, "step": 30, "valid_targets_mean": 3575.2, "valid_targets_min": 855 }, { "epoch": 0.05663430420711974, "grad_norm": 3.1011900466301516, "learning_rate": 3.1408775981524254e-06, "loss": 0.5928, "loss_nan_ranks": 0, "loss_rank_avg": 0.568791925907135, "step": 35, "valid_targets_mean": 3848.1, "valid_targets_min": 462 }, { "epoch": 0.06472491909385113, "grad_norm": 1.8794850275863664, "learning_rate": 3.6027713625866056e-06, "loss": 0.5507, "loss_nan_ranks": 0, "loss_rank_avg": 0.5347862839698792, "step": 40, "valid_targets_mean": 3735.5, "valid_targets_min": 778 }, { "epoch": 0.07281553398058252, "grad_norm": 1.6933093485589523, "learning_rate": 4.064665127020786e-06, "loss": 0.5209, "loss_nan_ranks": 0, "loss_rank_avg": 0.5246684551239014, "step": 45, "valid_targets_mean": 3173.0, "valid_targets_min": 448 }, { "epoch": 0.08090614886731391, "grad_norm": 1.3451241482911473, "learning_rate": 4.526558891454966e-06, "loss": 0.5153, "loss_nan_ranks": 0, "loss_rank_avg": 0.5409998893737793, "step": 50, "valid_targets_mean": 3681.6, "valid_targets_min": 1298 }, { "epoch": 0.0889967637540453, "grad_norm": 0.9951670347910555, "learning_rate": 4.988452655889146e-06, "loss": 0.4808, "loss_nan_ranks": 0, "loss_rank_avg": 0.49074310064315796, "step": 55, "valid_targets_mean": 4001.4, "valid_targets_min": 1226 }, { "epoch": 0.0970873786407767, "grad_norm": 0.9366809742158559, "learning_rate": 5.450346420323326e-06, "loss": 0.4683, "loss_nan_ranks": 0, "loss_rank_avg": 0.4610210657119751, "step": 60, "valid_targets_mean": 3441.2, "valid_targets_min": 451 }, { "epoch": 0.10517799352750809, "grad_norm": 0.8147959249499319, "learning_rate": 5.912240184757506e-06, "loss": 0.444, "loss_nan_ranks": 0, "loss_rank_avg": 0.43035197257995605, "step": 65, "valid_targets_mean": 3823.9, "valid_targets_min": 433 }, { "epoch": 0.11326860841423948, "grad_norm": 0.7676476543138736, "learning_rate": 6.374133949191687e-06, "loss": 0.4545, "loss_nan_ranks": 0, "loss_rank_avg": 0.4499027132987976, "step": 70, "valid_targets_mean": 3687.8, "valid_targets_min": 706 }, { "epoch": 0.12135922330097088, "grad_norm": 0.7061949661440534, "learning_rate": 6.836027713625867e-06, "loss": 0.4295, "loss_nan_ranks": 0, "loss_rank_avg": 0.4421675205230713, "step": 75, "valid_targets_mean": 4411.3, "valid_targets_min": 2975 }, { "epoch": 0.12944983818770225, "grad_norm": 0.6513122781968413, "learning_rate": 7.297921478060047e-06, "loss": 0.4279, "loss_nan_ranks": 0, "loss_rank_avg": 0.43355122208595276, "step": 80, "valid_targets_mean": 4360.9, "valid_targets_min": 2906 }, { "epoch": 0.13754045307443366, "grad_norm": 1.0234423222827205, "learning_rate": 7.759815242494227e-06, "loss": 0.4077, "loss_nan_ranks": 0, "loss_rank_avg": 0.4059848189353943, "step": 85, "valid_targets_mean": 3950.6, "valid_targets_min": 1915 }, { "epoch": 0.14563106796116504, "grad_norm": 0.6393770994585668, "learning_rate": 8.221709006928407e-06, "loss": 0.404, "loss_nan_ranks": 0, "loss_rank_avg": 0.4126480221748352, "step": 90, "valid_targets_mean": 3699.2, "valid_targets_min": 465 }, { "epoch": 0.15372168284789645, "grad_norm": 0.6009758856614545, "learning_rate": 8.683602771362586e-06, "loss": 0.3888, "loss_nan_ranks": 0, "loss_rank_avg": 0.37331610918045044, "step": 95, "valid_targets_mean": 4251.8, "valid_targets_min": 535 }, { "epoch": 0.16181229773462782, "grad_norm": 0.6411212665967604, "learning_rate": 9.145496535796767e-06, "loss": 0.3838, "loss_nan_ranks": 0, "loss_rank_avg": 0.37150484323501587, "step": 100, "valid_targets_mean": 3675.9, "valid_targets_min": 613 }, { "epoch": 0.16990291262135923, "grad_norm": 0.6094648920085912, "learning_rate": 9.607390300230948e-06, "loss": 0.3689, "loss_nan_ranks": 0, "loss_rank_avg": 0.3679890036582947, "step": 105, "valid_targets_mean": 4052.5, "valid_targets_min": 428 }, { "epoch": 0.1779935275080906, "grad_norm": 0.6714933928137066, "learning_rate": 1.0069284064665128e-05, "loss": 0.3778, "loss_nan_ranks": 0, "loss_rank_avg": 0.39726799726486206, "step": 110, "valid_targets_mean": 3751.6, "valid_targets_min": 1619 }, { "epoch": 0.18608414239482202, "grad_norm": 0.6885921268773545, "learning_rate": 1.0531177829099309e-05, "loss": 0.3789, "loss_nan_ranks": 0, "loss_rank_avg": 0.36161985993385315, "step": 115, "valid_targets_mean": 3398.1, "valid_targets_min": 958 }, { "epoch": 0.1941747572815534, "grad_norm": 0.6786362718946853, "learning_rate": 1.0993071593533488e-05, "loss": 0.3512, "loss_nan_ranks": 0, "loss_rank_avg": 0.3428874611854553, "step": 120, "valid_targets_mean": 2924.1, "valid_targets_min": 967 }, { "epoch": 0.2022653721682848, "grad_norm": 0.5847017454839042, "learning_rate": 1.1454965357967669e-05, "loss": 0.356, "loss_nan_ranks": 0, "loss_rank_avg": 0.38618525862693787, "step": 125, "valid_targets_mean": 4299.1, "valid_targets_min": 1861 }, { "epoch": 0.21035598705501618, "grad_norm": 0.6176988756110413, "learning_rate": 1.1916859122401848e-05, "loss": 0.3454, "loss_nan_ranks": 0, "loss_rank_avg": 0.35746678709983826, "step": 130, "valid_targets_mean": 3582.0, "valid_targets_min": 968 }, { "epoch": 0.21844660194174756, "grad_norm": 0.6868618523160048, "learning_rate": 1.237875288683603e-05, "loss": 0.3448, "loss_nan_ranks": 0, "loss_rank_avg": 0.34397560358047485, "step": 135, "valid_targets_mean": 3697.5, "valid_targets_min": 686 }, { "epoch": 0.22653721682847897, "grad_norm": 0.5948797006890421, "learning_rate": 1.284064665127021e-05, "loss": 0.345, "loss_nan_ranks": 0, "loss_rank_avg": 0.32718050479888916, "step": 140, "valid_targets_mean": 3896.3, "valid_targets_min": 2104 }, { "epoch": 0.23462783171521034, "grad_norm": 0.5529849234577984, "learning_rate": 1.3302540415704388e-05, "loss": 0.3417, "loss_nan_ranks": 0, "loss_rank_avg": 0.35815680027008057, "step": 145, "valid_targets_mean": 4403.2, "valid_targets_min": 2975 }, { "epoch": 0.24271844660194175, "grad_norm": 0.7558788212006664, "learning_rate": 1.3764434180138568e-05, "loss": 0.3451, "loss_nan_ranks": 0, "loss_rank_avg": 0.34972795844078064, "step": 150, "valid_targets_mean": 3551.3, "valid_targets_min": 1597 }, { "epoch": 0.25080906148867316, "grad_norm": 0.556839697232855, "learning_rate": 1.4226327944572749e-05, "loss": 0.3542, "loss_nan_ranks": 0, "loss_rank_avg": 0.31378552317619324, "step": 155, "valid_targets_mean": 3750.6, "valid_targets_min": 800 }, { "epoch": 0.2588996763754045, "grad_norm": 0.6341317824410588, "learning_rate": 1.468822170900693e-05, "loss": 0.3403, "loss_nan_ranks": 0, "loss_rank_avg": 0.34858211874961853, "step": 160, "valid_targets_mean": 3940.8, "valid_targets_min": 2064 }, { "epoch": 0.2669902912621359, "grad_norm": 0.5957011932092419, "learning_rate": 1.5150115473441109e-05, "loss": 0.3434, "loss_nan_ranks": 0, "loss_rank_avg": 0.32572871446609497, "step": 165, "valid_targets_mean": 3897.5, "valid_targets_min": 1732 }, { "epoch": 0.2750809061488673, "grad_norm": 0.6068605911979195, "learning_rate": 1.561200923787529e-05, "loss": 0.3472, "loss_nan_ranks": 0, "loss_rank_avg": 0.32489800453186035, "step": 170, "valid_targets_mean": 4304.5, "valid_targets_min": 1617 }, { "epoch": 0.28317152103559873, "grad_norm": 0.6959522324597113, "learning_rate": 1.607390300230947e-05, "loss": 0.3271, "loss_nan_ranks": 0, "loss_rank_avg": 0.3342089056968689, "step": 175, "valid_targets_mean": 3460.9, "valid_targets_min": 405 }, { "epoch": 0.2912621359223301, "grad_norm": 0.6993033966832811, "learning_rate": 1.653579676674365e-05, "loss": 0.3322, "loss_nan_ranks": 0, "loss_rank_avg": 0.3438107371330261, "step": 180, "valid_targets_mean": 3719.4, "valid_targets_min": 672 }, { "epoch": 0.2993527508090615, "grad_norm": 0.6054454798783228, "learning_rate": 1.699769053117783e-05, "loss": 0.3315, "loss_nan_ranks": 0, "loss_rank_avg": 0.3246925473213196, "step": 185, "valid_targets_mean": 3983.6, "valid_targets_min": 2354 }, { "epoch": 0.3074433656957929, "grad_norm": 0.6024947392151053, "learning_rate": 1.7459584295612013e-05, "loss": 0.3277, "loss_nan_ranks": 0, "loss_rank_avg": 0.34920066595077515, "step": 190, "valid_targets_mean": 4179.0, "valid_targets_min": 2225 }, { "epoch": 0.3155339805825243, "grad_norm": 0.5881601386489697, "learning_rate": 1.792147806004619e-05, "loss": 0.3097, "loss_nan_ranks": 0, "loss_rank_avg": 0.30888259410858154, "step": 195, "valid_targets_mean": 3780.8, "valid_targets_min": 522 }, { "epoch": 0.32362459546925565, "grad_norm": 0.6804460855209646, "learning_rate": 1.838337182448037e-05, "loss": 0.3132, "loss_nan_ranks": 0, "loss_rank_avg": 0.3233288526535034, "step": 200, "valid_targets_mean": 3176.1, "valid_targets_min": 579 }, { "epoch": 0.33171521035598706, "grad_norm": 0.641730901873238, "learning_rate": 1.8845265588914552e-05, "loss": 0.3274, "loss_nan_ranks": 0, "loss_rank_avg": 0.3117061257362366, "step": 205, "valid_targets_mean": 3649.1, "valid_targets_min": 1236 }, { "epoch": 0.33980582524271846, "grad_norm": 0.627739058134076, "learning_rate": 1.9307159353348733e-05, "loss": 0.3216, "loss_nan_ranks": 0, "loss_rank_avg": 0.3217557370662689, "step": 210, "valid_targets_mean": 3684.2, "valid_targets_min": 377 }, { "epoch": 0.3478964401294498, "grad_norm": 0.6743803896335775, "learning_rate": 1.976905311778291e-05, "loss": 0.3311, "loss_nan_ranks": 0, "loss_rank_avg": 0.363000750541687, "step": 215, "valid_targets_mean": 3696.2, "valid_targets_min": 451 }, { "epoch": 0.3559870550161812, "grad_norm": 0.6503092166966725, "learning_rate": 2.0230946882217092e-05, "loss": 0.3092, "loss_nan_ranks": 0, "loss_rank_avg": 0.3128376305103302, "step": 220, "valid_targets_mean": 3296.0, "valid_targets_min": 1104 }, { "epoch": 0.3640776699029126, "grad_norm": 0.6460762248227256, "learning_rate": 2.0692840646651273e-05, "loss": 0.3111, "loss_nan_ranks": 0, "loss_rank_avg": 0.31550925970077515, "step": 225, "valid_targets_mean": 3500.8, "valid_targets_min": 430 }, { "epoch": 0.37216828478964403, "grad_norm": 0.6602639443938337, "learning_rate": 2.115473441108545e-05, "loss": 0.3168, "loss_nan_ranks": 0, "loss_rank_avg": 0.31277865171432495, "step": 230, "valid_targets_mean": 2942.6, "valid_targets_min": 480 }, { "epoch": 0.3802588996763754, "grad_norm": 0.6503964007795302, "learning_rate": 2.1616628175519635e-05, "loss": 0.287, "loss_nan_ranks": 0, "loss_rank_avg": 0.27533742785453796, "step": 235, "valid_targets_mean": 3215.6, "valid_targets_min": 418 }, { "epoch": 0.3883495145631068, "grad_norm": 0.6456014703726483, "learning_rate": 2.2078521939953813e-05, "loss": 0.2934, "loss_nan_ranks": 0, "loss_rank_avg": 0.29455316066741943, "step": 240, "valid_targets_mean": 3503.1, "valid_targets_min": 470 }, { "epoch": 0.3964401294498382, "grad_norm": 0.6050471441367182, "learning_rate": 2.2540415704387994e-05, "loss": 0.2985, "loss_nan_ranks": 0, "loss_rank_avg": 0.3035230338573456, "step": 245, "valid_targets_mean": 3800.3, "valid_targets_min": 1457 }, { "epoch": 0.4045307443365696, "grad_norm": 0.5739221439490244, "learning_rate": 2.3002309468822172e-05, "loss": 0.305, "loss_nan_ranks": 0, "loss_rank_avg": 0.3035668730735779, "step": 250, "valid_targets_mean": 4172.5, "valid_targets_min": 2005 }, { "epoch": 0.41262135922330095, "grad_norm": 0.6573809007717452, "learning_rate": 2.346420323325635e-05, "loss": 0.2987, "loss_nan_ranks": 0, "loss_rank_avg": 0.33286434412002563, "step": 255, "valid_targets_mean": 3657.9, "valid_targets_min": 410 }, { "epoch": 0.42071197411003236, "grad_norm": 0.621214006304506, "learning_rate": 2.3926096997690534e-05, "loss": 0.296, "loss_nan_ranks": 0, "loss_rank_avg": 0.27294284105300903, "step": 260, "valid_targets_mean": 3487.0, "valid_targets_min": 718 }, { "epoch": 0.42880258899676377, "grad_norm": 0.6194570084768386, "learning_rate": 2.438799076212471e-05, "loss": 0.3068, "loss_nan_ranks": 0, "loss_rank_avg": 0.28968545794487, "step": 265, "valid_targets_mean": 4048.9, "valid_targets_min": 259 }, { "epoch": 0.4368932038834951, "grad_norm": 0.6123508382890656, "learning_rate": 2.4849884526558893e-05, "loss": 0.2987, "loss_nan_ranks": 0, "loss_rank_avg": 0.2817320227622986, "step": 270, "valid_targets_mean": 3786.6, "valid_targets_min": 957 }, { "epoch": 0.4449838187702265, "grad_norm": 0.6349448992907608, "learning_rate": 2.5311778290993074e-05, "loss": 0.2875, "loss_nan_ranks": 0, "loss_rank_avg": 0.2887231409549713, "step": 275, "valid_targets_mean": 3590.3, "valid_targets_min": 691 }, { "epoch": 0.45307443365695793, "grad_norm": 0.6041395356484386, "learning_rate": 2.5773672055427255e-05, "loss": 0.3107, "loss_nan_ranks": 0, "loss_rank_avg": 0.30666863918304443, "step": 280, "valid_targets_mean": 3870.8, "valid_targets_min": 481 }, { "epoch": 0.46116504854368934, "grad_norm": 0.6423139569561586, "learning_rate": 2.6235565819861432e-05, "loss": 0.292, "loss_nan_ranks": 0, "loss_rank_avg": 0.30878114700317383, "step": 285, "valid_targets_mean": 3677.9, "valid_targets_min": 605 }, { "epoch": 0.4692556634304207, "grad_norm": 0.5950734204281998, "learning_rate": 2.6697459584295617e-05, "loss": 0.2948, "loss_nan_ranks": 0, "loss_rank_avg": 0.27899283170700073, "step": 290, "valid_targets_mean": 3649.2, "valid_targets_min": 504 }, { "epoch": 0.4773462783171521, "grad_norm": 0.6370745562989614, "learning_rate": 2.7159353348729794e-05, "loss": 0.2971, "loss_nan_ranks": 0, "loss_rank_avg": 0.29412591457366943, "step": 295, "valid_targets_mean": 3545.8, "valid_targets_min": 454 }, { "epoch": 0.4854368932038835, "grad_norm": 1.92659801088735, "learning_rate": 2.7621247113163975e-05, "loss": 0.2825, "loss_nan_ranks": 0, "loss_rank_avg": 0.25594255328178406, "step": 300, "valid_targets_mean": 3757.3, "valid_targets_min": 1286 }, { "epoch": 0.4935275080906149, "grad_norm": 0.6375789687289607, "learning_rate": 2.8083140877598153e-05, "loss": 0.2849, "loss_nan_ranks": 0, "loss_rank_avg": 0.2897154986858368, "step": 305, "valid_targets_mean": 3368.8, "valid_targets_min": 460 }, { "epoch": 0.5016181229773463, "grad_norm": 0.6781242545223203, "learning_rate": 2.8545034642032338e-05, "loss": 0.2903, "loss_nan_ranks": 0, "loss_rank_avg": 0.30849897861480713, "step": 310, "valid_targets_mean": 3861.2, "valid_targets_min": 1085 }, { "epoch": 0.5097087378640777, "grad_norm": 0.5620898167135456, "learning_rate": 2.9006928406466515e-05, "loss": 0.3025, "loss_nan_ranks": 0, "loss_rank_avg": 0.29005423188209534, "step": 315, "valid_targets_mean": 3949.1, "valid_targets_min": 1506 }, { "epoch": 0.517799352750809, "grad_norm": 0.6011594540412086, "learning_rate": 2.9468822170900696e-05, "loss": 0.2882, "loss_nan_ranks": 0, "loss_rank_avg": 0.24850499629974365, "step": 320, "valid_targets_mean": 3461.3, "valid_targets_min": 579 }, { "epoch": 0.5258899676375405, "grad_norm": 0.5667335774154261, "learning_rate": 2.9930715935334874e-05, "loss": 0.2824, "loss_nan_ranks": 0, "loss_rank_avg": 0.28869470953941345, "step": 325, "valid_targets_mean": 3888.8, "valid_targets_min": 427 }, { "epoch": 0.5339805825242718, "grad_norm": 0.6018602985123674, "learning_rate": 3.0392609699769055e-05, "loss": 0.2745, "loss_nan_ranks": 0, "loss_rank_avg": 0.25187310576438904, "step": 330, "valid_targets_mean": 3572.2, "valid_targets_min": 416 }, { "epoch": 0.5420711974110033, "grad_norm": 0.5530170018702698, "learning_rate": 3.0854503464203236e-05, "loss": 0.3014, "loss_nan_ranks": 0, "loss_rank_avg": 0.3016529679298401, "step": 335, "valid_targets_mean": 4167.5, "valid_targets_min": 605 }, { "epoch": 0.5501618122977346, "grad_norm": 0.5683688168773894, "learning_rate": 3.131639722863742e-05, "loss": 0.2959, "loss_nan_ranks": 0, "loss_rank_avg": 0.2862555980682373, "step": 340, "valid_targets_mean": 4065.1, "valid_targets_min": 490 }, { "epoch": 0.558252427184466, "grad_norm": 0.6422148617718519, "learning_rate": 3.17782909930716e-05, "loss": 0.2764, "loss_nan_ranks": 0, "loss_rank_avg": 0.2575664222240448, "step": 345, "valid_targets_mean": 3347.6, "valid_targets_min": 1490 }, { "epoch": 0.5663430420711975, "grad_norm": 0.6028555328769979, "learning_rate": 3.224018475750577e-05, "loss": 0.2794, "loss_nan_ranks": 0, "loss_rank_avg": 0.2789534628391266, "step": 350, "valid_targets_mean": 3205.9, "valid_targets_min": 514 }, { "epoch": 0.5744336569579288, "grad_norm": 0.703646722775362, "learning_rate": 3.270207852193996e-05, "loss": 0.2937, "loss_nan_ranks": 0, "loss_rank_avg": 0.29907727241516113, "step": 355, "valid_targets_mean": 3719.6, "valid_targets_min": 1032 }, { "epoch": 0.5825242718446602, "grad_norm": 0.686644747611541, "learning_rate": 3.3163972286374135e-05, "loss": 0.2907, "loss_nan_ranks": 0, "loss_rank_avg": 0.2848784625530243, "step": 360, "valid_targets_mean": 3759.4, "valid_targets_min": 1201 }, { "epoch": 0.5906148867313916, "grad_norm": 0.6324843088148043, "learning_rate": 3.3625866050808316e-05, "loss": 0.2979, "loss_nan_ranks": 0, "loss_rank_avg": 0.3301808834075928, "step": 365, "valid_targets_mean": 3985.0, "valid_targets_min": 559 }, { "epoch": 0.598705501618123, "grad_norm": 0.6657889896899425, "learning_rate": 3.40877598152425e-05, "loss": 0.2801, "loss_nan_ranks": 0, "loss_rank_avg": 0.2617691159248352, "step": 370, "valid_targets_mean": 3649.1, "valid_targets_min": 862 }, { "epoch": 0.6067961165048543, "grad_norm": 0.7044977758301637, "learning_rate": 3.454965357967668e-05, "loss": 0.2833, "loss_nan_ranks": 0, "loss_rank_avg": 0.28061506152153015, "step": 375, "valid_targets_mean": 3758.7, "valid_targets_min": 1980 }, { "epoch": 0.6148867313915858, "grad_norm": 0.5793210298303975, "learning_rate": 3.501154734411086e-05, "loss": 0.2817, "loss_nan_ranks": 0, "loss_rank_avg": 0.28702807426452637, "step": 380, "valid_targets_mean": 3827.2, "valid_targets_min": 703 }, { "epoch": 0.6229773462783171, "grad_norm": 0.6428205927219847, "learning_rate": 3.547344110854504e-05, "loss": 0.265, "loss_nan_ranks": 0, "loss_rank_avg": 0.2545207738876343, "step": 385, "valid_targets_mean": 3273.9, "valid_targets_min": 738 }, { "epoch": 0.6310679611650486, "grad_norm": 0.591271300160177, "learning_rate": 3.5935334872979214e-05, "loss": 0.2965, "loss_nan_ranks": 0, "loss_rank_avg": 0.28500238060951233, "step": 390, "valid_targets_mean": 3836.4, "valid_targets_min": 533 }, { "epoch": 0.63915857605178, "grad_norm": 0.5988205344788338, "learning_rate": 3.63972286374134e-05, "loss": 0.2982, "loss_nan_ranks": 0, "loss_rank_avg": 0.3076947331428528, "step": 395, "valid_targets_mean": 3890.5, "valid_targets_min": 877 }, { "epoch": 0.6472491909385113, "grad_norm": 0.5508624611045605, "learning_rate": 3.6859122401847576e-05, "loss": 0.2804, "loss_nan_ranks": 0, "loss_rank_avg": 0.27103567123413086, "step": 400, "valid_targets_mean": 3915.4, "valid_targets_min": 420 }, { "epoch": 0.6553398058252428, "grad_norm": 0.5985040648059813, "learning_rate": 3.732101616628176e-05, "loss": 0.2737, "loss_nan_ranks": 0, "loss_rank_avg": 0.2661280333995819, "step": 405, "valid_targets_mean": 3904.9, "valid_targets_min": 1350 }, { "epoch": 0.6634304207119741, "grad_norm": 0.5990129213673812, "learning_rate": 3.778290993071594e-05, "loss": 0.2839, "loss_nan_ranks": 0, "loss_rank_avg": 0.26289594173431396, "step": 410, "valid_targets_mean": 3605.1, "valid_targets_min": 840 }, { "epoch": 0.6715210355987055, "grad_norm": 0.6190982488306185, "learning_rate": 3.824480369515012e-05, "loss": 0.2935, "loss_nan_ranks": 0, "loss_rank_avg": 0.31816816329956055, "step": 415, "valid_targets_mean": 3736.1, "valid_targets_min": 427 }, { "epoch": 0.6796116504854369, "grad_norm": 0.5654861961445968, "learning_rate": 3.87066974595843e-05, "loss": 0.285, "loss_nan_ranks": 0, "loss_rank_avg": 0.29399573802948, "step": 420, "valid_targets_mean": 4115.8, "valid_targets_min": 2051 }, { "epoch": 0.6877022653721683, "grad_norm": 0.6733368871549665, "learning_rate": 3.9168591224018475e-05, "loss": 0.2795, "loss_nan_ranks": 0, "loss_rank_avg": 0.269350528717041, "step": 425, "valid_targets_mean": 3661.5, "valid_targets_min": 446 }, { "epoch": 0.6957928802588996, "grad_norm": 0.5881509692853332, "learning_rate": 3.963048498845266e-05, "loss": 0.2812, "loss_nan_ranks": 0, "loss_rank_avg": 0.3111186623573303, "step": 430, "valid_targets_mean": 3747.9, "valid_targets_min": 1335 }, { "epoch": 0.7038834951456311, "grad_norm": 0.6653833282495153, "learning_rate": 3.999999348775225e-05, "loss": 0.2742, "loss_nan_ranks": 0, "loss_rank_avg": 0.2823415696620941, "step": 435, "valid_targets_mean": 3997.1, "valid_targets_min": 2126 }, { "epoch": 0.7119741100323624, "grad_norm": 0.5650668386347658, "learning_rate": 3.9999765559526296e-05, "loss": 0.2696, "loss_nan_ranks": 0, "loss_rank_avg": 0.2572442591190338, "step": 440, "valid_targets_mean": 4013.0, "valid_targets_min": 2021 }, { "epoch": 0.7200647249190939, "grad_norm": 0.5389309645168817, "learning_rate": 3.999921202315374e-05, "loss": 0.2799, "loss_nan_ranks": 0, "loss_rank_avg": 0.28636130690574646, "step": 445, "valid_targets_mean": 4386.1, "valid_targets_min": 2956 }, { "epoch": 0.7281553398058253, "grad_norm": 0.6194102937241955, "learning_rate": 3.9998332887646504e-05, "loss": 0.269, "loss_nan_ranks": 0, "loss_rank_avg": 0.2838453948497772, "step": 450, "valid_targets_mean": 3617.1, "valid_targets_min": 598 }, { "epoch": 0.7362459546925566, "grad_norm": 0.5816499043205773, "learning_rate": 3.999712816731743e-05, "loss": 0.2634, "loss_nan_ranks": 0, "loss_rank_avg": 0.25679758191108704, "step": 455, "valid_targets_mean": 3520.3, "valid_targets_min": 1240 }, { "epoch": 0.7443365695792881, "grad_norm": 0.579241211012032, "learning_rate": 3.999559788178009e-05, "loss": 0.2818, "loss_nan_ranks": 0, "loss_rank_avg": 0.29625752568244934, "step": 460, "valid_targets_mean": 3625.7, "valid_targets_min": 451 }, { "epoch": 0.7524271844660194, "grad_norm": 0.5909898166135259, "learning_rate": 3.999374205594845e-05, "loss": 0.2723, "loss_nan_ranks": 0, "loss_rank_avg": 0.26413339376449585, "step": 465, "valid_targets_mean": 3644.6, "valid_targets_min": 313 }, { "epoch": 0.7605177993527508, "grad_norm": 0.5693299452079705, "learning_rate": 3.999156072003646e-05, "loss": 0.2814, "loss_nan_ranks": 0, "loss_rank_avg": 0.2781625986099243, "step": 470, "valid_targets_mean": 3661.7, "valid_targets_min": 1014 }, { "epoch": 0.7686084142394822, "grad_norm": 0.5919226456235103, "learning_rate": 3.9989053909557576e-05, "loss": 0.2776, "loss_nan_ranks": 0, "loss_rank_avg": 0.29603859782218933, "step": 475, "valid_targets_mean": 3722.9, "valid_targets_min": 1030 }, { "epoch": 0.7766990291262136, "grad_norm": 0.5943887354321051, "learning_rate": 3.998622166532417e-05, "loss": 0.2729, "loss_nan_ranks": 0, "loss_rank_avg": 0.2638964056968689, "step": 480, "valid_targets_mean": 4079.6, "valid_targets_min": 1751 }, { "epoch": 0.7847896440129449, "grad_norm": 0.711842012876838, "learning_rate": 3.998306403344688e-05, "loss": 0.265, "loss_nan_ranks": 0, "loss_rank_avg": 0.26152002811431885, "step": 485, "valid_targets_mean": 3510.2, "valid_targets_min": 786 }, { "epoch": 0.7928802588996764, "grad_norm": 0.5734682192660957, "learning_rate": 3.997958106533383e-05, "loss": 0.2831, "loss_nan_ranks": 0, "loss_rank_avg": 0.2649049758911133, "step": 490, "valid_targets_mean": 3927.6, "valid_targets_min": 716 }, { "epoch": 0.8009708737864077, "grad_norm": 0.5361986202564702, "learning_rate": 3.997577281768982e-05, "loss": 0.2606, "loss_nan_ranks": 0, "loss_rank_avg": 0.2324935793876648, "step": 495, "valid_targets_mean": 3626.5, "valid_targets_min": 1365 }, { "epoch": 0.8090614886731392, "grad_norm": 0.5122712699333561, "learning_rate": 3.997163935251543e-05, "loss": 0.2933, "loss_nan_ranks": 0, "loss_rank_avg": 0.27357301115989685, "step": 500, "valid_targets_mean": 4106.0, "valid_targets_min": 2489 }, { "epoch": 0.8171521035598706, "grad_norm": 0.6066344337324161, "learning_rate": 3.996718073710591e-05, "loss": 0.2671, "loss_nan_ranks": 0, "loss_rank_avg": 0.27873921394348145, "step": 505, "valid_targets_mean": 3503.3, "valid_targets_min": 1526 }, { "epoch": 0.8252427184466019, "grad_norm": 0.5284961700363339, "learning_rate": 3.9962397044050206e-05, "loss": 0.2747, "loss_nan_ranks": 0, "loss_rank_avg": 0.2654161751270294, "step": 510, "valid_targets_mean": 3800.1, "valid_targets_min": 640 }, { "epoch": 0.8333333333333334, "grad_norm": 0.621823217819916, "learning_rate": 3.99572883512297e-05, "loss": 0.2678, "loss_nan_ranks": 0, "loss_rank_avg": 0.27369263768196106, "step": 515, "valid_targets_mean": 3488.2, "valid_targets_min": 1050 }, { "epoch": 0.8414239482200647, "grad_norm": 0.5267599319786561, "learning_rate": 3.9951854741816954e-05, "loss": 0.2728, "loss_nan_ranks": 0, "loss_rank_avg": 0.2734227776527405, "step": 520, "valid_targets_mean": 3832.6, "valid_targets_min": 481 }, { "epoch": 0.8495145631067961, "grad_norm": 0.6257107494353524, "learning_rate": 3.99460963042744e-05, "loss": 0.2693, "loss_nan_ranks": 0, "loss_rank_avg": 0.28572967648506165, "step": 525, "valid_targets_mean": 3736.1, "valid_targets_min": 668 }, { "epoch": 0.8576051779935275, "grad_norm": 1.2714399983105327, "learning_rate": 3.994001313235283e-05, "loss": 0.2936, "loss_nan_ranks": 0, "loss_rank_avg": 0.282131552696228, "step": 530, "valid_targets_mean": 3938.2, "valid_targets_min": 1085 }, { "epoch": 0.8656957928802589, "grad_norm": 0.5806714978099429, "learning_rate": 3.993360532508993e-05, "loss": 0.2718, "loss_nan_ranks": 0, "loss_rank_avg": 0.2508247494697571, "step": 535, "valid_targets_mean": 3894.8, "valid_targets_min": 1526 }, { "epoch": 0.8737864077669902, "grad_norm": 0.5581090898685672, "learning_rate": 3.9926872986808626e-05, "loss": 0.2638, "loss_nan_ranks": 0, "loss_rank_avg": 0.24472543597221375, "step": 540, "valid_targets_mean": 3818.2, "valid_targets_min": 1048 }, { "epoch": 0.8818770226537217, "grad_norm": 0.602578818433595, "learning_rate": 3.991981622711542e-05, "loss": 0.2752, "loss_nan_ranks": 0, "loss_rank_avg": 0.27875274419784546, "step": 545, "valid_targets_mean": 3362.0, "valid_targets_min": 451 }, { "epoch": 0.889967637540453, "grad_norm": 0.6000853415599751, "learning_rate": 3.991243516089859e-05, "loss": 0.2792, "loss_nan_ranks": 0, "loss_rank_avg": 0.28475719690322876, "step": 550, "valid_targets_mean": 3562.8, "valid_targets_min": 494 }, { "epoch": 0.8980582524271845, "grad_norm": 0.6045079118077683, "learning_rate": 3.9904729908326295e-05, "loss": 0.254, "loss_nan_ranks": 0, "loss_rank_avg": 0.2536866366863251, "step": 555, "valid_targets_mean": 3200.2, "valid_targets_min": 441 }, { "epoch": 0.9061488673139159, "grad_norm": 0.5385268237514557, "learning_rate": 3.989670059484465e-05, "loss": 0.2616, "loss_nan_ranks": 0, "loss_rank_avg": 0.25445741415023804, "step": 560, "valid_targets_mean": 3636.5, "valid_targets_min": 471 }, { "epoch": 0.9142394822006472, "grad_norm": 0.569538684495337, "learning_rate": 3.98883473511757e-05, "loss": 0.2682, "loss_nan_ranks": 0, "loss_rank_avg": 0.259962797164917, "step": 565, "valid_targets_mean": 3567.1, "valid_targets_min": 405 }, { "epoch": 0.9223300970873787, "grad_norm": 0.605779218415475, "learning_rate": 3.987967031331523e-05, "loss": 0.2738, "loss_nan_ranks": 0, "loss_rank_avg": 0.27796828746795654, "step": 570, "valid_targets_mean": 3790.8, "valid_targets_min": 1266 }, { "epoch": 0.93042071197411, "grad_norm": 0.5218505117582313, "learning_rate": 3.987066962253063e-05, "loss": 0.2725, "loss_nan_ranks": 0, "loss_rank_avg": 0.26819664239883423, "step": 575, "valid_targets_mean": 4475.1, "valid_targets_min": 2968 }, { "epoch": 0.9385113268608414, "grad_norm": 0.5475939469674147, "learning_rate": 3.9861345425358506e-05, "loss": 0.2532, "loss_nan_ranks": 0, "loss_rank_avg": 0.2616320252418518, "step": 580, "valid_targets_mean": 3786.9, "valid_targets_min": 1797 }, { "epoch": 0.9466019417475728, "grad_norm": 0.5842375761808629, "learning_rate": 3.985169787360238e-05, "loss": 0.2576, "loss_nan_ranks": 0, "loss_rank_avg": 0.2507282793521881, "step": 585, "valid_targets_mean": 3231.1, "valid_targets_min": 875 }, { "epoch": 0.9546925566343042, "grad_norm": 0.5858929733036307, "learning_rate": 3.984172712433016e-05, "loss": 0.2638, "loss_nan_ranks": 0, "loss_rank_avg": 0.26595237851142883, "step": 590, "valid_targets_mean": 3756.8, "valid_targets_min": 432 }, { "epoch": 0.9627831715210357, "grad_norm": 0.562817714467397, "learning_rate": 3.983143333987161e-05, "loss": 0.2726, "loss_nan_ranks": 0, "loss_rank_avg": 0.2702093720436096, "step": 595, "valid_targets_mean": 3892.1, "valid_targets_min": 885 }, { "epoch": 0.970873786407767, "grad_norm": 0.5674781126145693, "learning_rate": 3.98208166878157e-05, "loss": 0.2665, "loss_nan_ranks": 0, "loss_rank_avg": 0.24162045121192932, "step": 600, "valid_targets_mean": 3564.8, "valid_targets_min": 662 }, { "epoch": 0.9789644012944984, "grad_norm": 0.6062685894488582, "learning_rate": 3.9809877341007865e-05, "loss": 0.2622, "loss_nan_ranks": 0, "loss_rank_avg": 0.25364941358566284, "step": 605, "valid_targets_mean": 3195.0, "valid_targets_min": 462 }, { "epoch": 0.9870550161812298, "grad_norm": 0.5787698953603837, "learning_rate": 3.979861547754723e-05, "loss": 0.2605, "loss_nan_ranks": 0, "loss_rank_avg": 0.2575009763240814, "step": 610, "valid_targets_mean": 3920.9, "valid_targets_min": 1737 }, { "epoch": 0.9951456310679612, "grad_norm": 0.5410984656955982, "learning_rate": 3.9787031280783665e-05, "loss": 0.2589, "loss_nan_ranks": 0, "loss_rank_avg": 0.24462872743606567, "step": 615, "valid_targets_mean": 3699.8, "valid_targets_min": 370 }, { "epoch": 1.0032362459546926, "grad_norm": 0.5559196648009831, "learning_rate": 3.977512493931482e-05, "loss": 0.2556, "loss_nan_ranks": 0, "loss_rank_avg": 0.22372806072235107, "step": 620, "valid_targets_mean": 3276.6, "valid_targets_min": 1253 }, { "epoch": 1.0113268608414239, "grad_norm": 0.562287316511375, "learning_rate": 3.976289664698305e-05, "loss": 0.262, "loss_nan_ranks": 0, "loss_rank_avg": 0.25618696212768555, "step": 625, "valid_targets_mean": 3868.9, "valid_targets_min": 1350 }, { "epoch": 1.0194174757281553, "grad_norm": 0.5369177782487862, "learning_rate": 3.9750346602872275e-05, "loss": 0.2524, "loss_nan_ranks": 0, "loss_rank_avg": 0.2368406504392624, "step": 630, "valid_targets_mean": 3707.1, "valid_targets_min": 671 }, { "epoch": 1.0275080906148868, "grad_norm": 0.5804008703361665, "learning_rate": 3.973747501130473e-05, "loss": 0.2578, "loss_nan_ranks": 0, "loss_rank_avg": 0.25358450412750244, "step": 635, "valid_targets_mean": 4052.9, "valid_targets_min": 468 }, { "epoch": 1.035598705501618, "grad_norm": 0.605778216509064, "learning_rate": 3.97242820818376e-05, "loss": 0.2365, "loss_nan_ranks": 0, "loss_rank_avg": 0.2552924156188965, "step": 640, "valid_targets_mean": 3504.3, "valid_targets_min": 422 }, { "epoch": 1.0436893203883495, "grad_norm": 0.5654932430709362, "learning_rate": 3.9710768029259695e-05, "loss": 0.2521, "loss_nan_ranks": 0, "loss_rank_avg": 0.2729843854904175, "step": 645, "valid_targets_mean": 3681.1, "valid_targets_min": 770 }, { "epoch": 1.051779935275081, "grad_norm": 0.7172757360142547, "learning_rate": 3.9696933073587864e-05, "loss": 0.257, "loss_nan_ranks": 0, "loss_rank_avg": 0.27672040462493896, "step": 650, "valid_targets_mean": 3507.8, "valid_targets_min": 957 }, { "epoch": 1.0598705501618122, "grad_norm": 0.5607347532030501, "learning_rate": 3.9682777440063455e-05, "loss": 0.2424, "loss_nan_ranks": 0, "loss_rank_avg": 0.24472706019878387, "step": 655, "valid_targets_mean": 3917.8, "valid_targets_min": 2470 }, { "epoch": 1.0679611650485437, "grad_norm": 0.5387121591142974, "learning_rate": 3.9668301359148655e-05, "loss": 0.2609, "loss_nan_ranks": 0, "loss_rank_avg": 0.31839385628700256, "step": 660, "valid_targets_mean": 4574.2, "valid_targets_min": 1939 }, { "epoch": 1.0760517799352751, "grad_norm": 0.4738915321475537, "learning_rate": 3.965350506652272e-05, "loss": 0.2386, "loss_nan_ranks": 0, "loss_rank_avg": 0.22641263902187347, "step": 665, "valid_targets_mean": 4143.0, "valid_targets_min": 896 }, { "epoch": 1.0841423948220066, "grad_norm": 0.673765362529483, "learning_rate": 3.963838880307815e-05, "loss": 0.2409, "loss_nan_ranks": 0, "loss_rank_avg": 0.253450870513916, "step": 670, "valid_targets_mean": 3418.4, "valid_targets_min": 513 }, { "epoch": 1.0922330097087378, "grad_norm": 0.592144514072726, "learning_rate": 3.962295281491674e-05, "loss": 0.2521, "loss_nan_ranks": 0, "loss_rank_avg": 0.22054757177829742, "step": 675, "valid_targets_mean": 3311.9, "valid_targets_min": 1647 }, { "epoch": 1.1003236245954693, "grad_norm": 0.5462311520114211, "learning_rate": 3.960719735334562e-05, "loss": 0.2413, "loss_nan_ranks": 0, "loss_rank_avg": 0.25668200850486755, "step": 680, "valid_targets_mean": 4145.4, "valid_targets_min": 1357 }, { "epoch": 1.1084142394822007, "grad_norm": 0.5596472621487413, "learning_rate": 3.959112267487314e-05, "loss": 0.2522, "loss_nan_ranks": 0, "loss_rank_avg": 0.2636863589286804, "step": 685, "valid_targets_mean": 3808.9, "valid_targets_min": 2280 }, { "epoch": 1.116504854368932, "grad_norm": 0.5925165742724042, "learning_rate": 3.957472904120467e-05, "loss": 0.2457, "loss_nan_ranks": 0, "loss_rank_avg": 0.2322475016117096, "step": 690, "valid_targets_mean": 3328.8, "valid_targets_min": 536 }, { "epoch": 1.1245954692556634, "grad_norm": 0.7318667286756769, "learning_rate": 3.955801671923837e-05, "loss": 0.2438, "loss_nan_ranks": 0, "loss_rank_avg": 0.2675679326057434, "step": 695, "valid_targets_mean": 3433.7, "valid_targets_min": 630 }, { "epoch": 1.132686084142395, "grad_norm": 0.5473167172657988, "learning_rate": 3.954098598106084e-05, "loss": 0.2441, "loss_nan_ranks": 0, "loss_rank_avg": 0.26063698530197144, "step": 700, "valid_targets_mean": 3818.1, "valid_targets_min": 718 }, { "epoch": 1.1407766990291262, "grad_norm": 0.5634978237369443, "learning_rate": 3.952363710394269e-05, "loss": 0.2473, "loss_nan_ranks": 0, "loss_rank_avg": 0.25784575939178467, "step": 705, "valid_targets_mean": 3970.0, "valid_targets_min": 1100 }, { "epoch": 1.1488673139158576, "grad_norm": 0.5655594345426586, "learning_rate": 3.9505970370334015e-05, "loss": 0.2485, "loss_nan_ranks": 0, "loss_rank_avg": 0.25309622287750244, "step": 710, "valid_targets_mean": 3924.2, "valid_targets_min": 1172 }, { "epoch": 1.156957928802589, "grad_norm": 0.5075142775296616, "learning_rate": 3.94879860678598e-05, "loss": 0.2538, "loss_nan_ranks": 0, "loss_rank_avg": 0.22384929656982422, "step": 715, "valid_targets_mean": 3865.6, "valid_targets_min": 1426 }, { "epoch": 1.1650485436893203, "grad_norm": 0.5601883688914359, "learning_rate": 3.9469684489315256e-05, "loss": 0.2473, "loss_nan_ranks": 0, "loss_rank_avg": 0.2752339243888855, "step": 720, "valid_targets_mean": 4222.7, "valid_targets_min": 2497 }, { "epoch": 1.1731391585760518, "grad_norm": 0.5134594549264883, "learning_rate": 3.945106593266102e-05, "loss": 0.2474, "loss_nan_ranks": 0, "loss_rank_avg": 0.2594758868217468, "step": 725, "valid_targets_mean": 4206.9, "valid_targets_min": 1984 }, { "epoch": 1.1812297734627832, "grad_norm": 0.5798021779182408, "learning_rate": 3.943213070101834e-05, "loss": 0.245, "loss_nan_ranks": 0, "loss_rank_avg": 0.2584797143936157, "step": 730, "valid_targets_mean": 3489.6, "valid_targets_min": 463 }, { "epoch": 1.1893203883495145, "grad_norm": 0.5348245496682883, "learning_rate": 3.941287910266411e-05, "loss": 0.2397, "loss_nan_ranks": 0, "loss_rank_avg": 0.23523803055286407, "step": 735, "valid_targets_mean": 3916.9, "valid_targets_min": 423 }, { "epoch": 1.197411003236246, "grad_norm": 0.5847494410182235, "learning_rate": 3.9393311451025865e-05, "loss": 0.2443, "loss_nan_ranks": 0, "loss_rank_avg": 0.26313185691833496, "step": 740, "valid_targets_mean": 3422.8, "valid_targets_min": 471 }, { "epoch": 1.2055016181229774, "grad_norm": 0.5715879469688606, "learning_rate": 3.937342806467668e-05, "loss": 0.2357, "loss_nan_ranks": 0, "loss_rank_avg": 0.24966466426849365, "step": 745, "valid_targets_mean": 3915.3, "valid_targets_min": 1299 }, { "epoch": 1.2135922330097086, "grad_norm": 0.5433469085571423, "learning_rate": 3.935322926732998e-05, "loss": 0.238, "loss_nan_ranks": 0, "loss_rank_avg": 0.234421506524086, "step": 750, "valid_targets_mean": 4102.1, "valid_targets_min": 1597 }, { "epoch": 1.22168284789644, "grad_norm": 0.5868454178512109, "learning_rate": 3.933271538783427e-05, "loss": 0.2483, "loss_nan_ranks": 0, "loss_rank_avg": 0.27477163076400757, "step": 755, "valid_targets_mean": 3842.6, "valid_targets_min": 662 }, { "epoch": 1.2297734627831716, "grad_norm": 0.6436982098810824, "learning_rate": 3.931188676016777e-05, "loss": 0.2408, "loss_nan_ranks": 0, "loss_rank_avg": 0.2649001479148865, "step": 760, "valid_targets_mean": 3557.1, "valid_targets_min": 463 }, { "epoch": 1.237864077669903, "grad_norm": 0.6131515769175564, "learning_rate": 3.9290743723433e-05, "loss": 0.253, "loss_nan_ranks": 0, "loss_rank_avg": 0.2513100206851959, "step": 765, "valid_targets_mean": 3496.9, "valid_targets_min": 428 }, { "epoch": 1.2459546925566343, "grad_norm": 0.6865052077576037, "learning_rate": 3.926928662185126e-05, "loss": 0.2445, "loss_nan_ranks": 0, "loss_rank_avg": 0.2739570140838623, "step": 770, "valid_targets_mean": 3481.2, "valid_targets_min": 418 }, { "epoch": 1.2540453074433657, "grad_norm": 0.5799644871312117, "learning_rate": 3.924751580475698e-05, "loss": 0.2472, "loss_nan_ranks": 0, "loss_rank_avg": 0.2648698687553406, "step": 775, "valid_targets_mean": 3644.6, "valid_targets_min": 910 }, { "epoch": 1.262135922330097, "grad_norm": 0.5318310447138261, "learning_rate": 3.922543162659209e-05, "loss": 0.2289, "loss_nan_ranks": 0, "loss_rank_avg": 0.20989498496055603, "step": 780, "valid_targets_mean": 3411.7, "valid_targets_min": 1369 }, { "epoch": 1.2702265372168284, "grad_norm": 0.5814600954030472, "learning_rate": 3.9203034446900224e-05, "loss": 0.2394, "loss_nan_ranks": 0, "loss_rank_avg": 0.24911276996135712, "step": 785, "valid_targets_mean": 3388.5, "valid_targets_min": 1085 }, { "epoch": 1.27831715210356, "grad_norm": 0.5206654650887855, "learning_rate": 3.918032463032086e-05, "loss": 0.2635, "loss_nan_ranks": 0, "loss_rank_avg": 0.2422664314508438, "step": 790, "valid_targets_mean": 3730.7, "valid_targets_min": 1009 }, { "epoch": 1.2864077669902914, "grad_norm": 0.5964049859480364, "learning_rate": 3.9157302546583406e-05, "loss": 0.2338, "loss_nan_ranks": 0, "loss_rank_avg": 0.2198229730129242, "step": 795, "valid_targets_mean": 3327.1, "valid_targets_min": 877 }, { "epoch": 1.2944983818770226, "grad_norm": 0.6407156866162471, "learning_rate": 3.913396857050115e-05, "loss": 0.2557, "loss_nan_ranks": 0, "loss_rank_avg": 0.2676980495452881, "step": 800, "valid_targets_mean": 3686.9, "valid_targets_min": 330 }, { "epoch": 1.302588996763754, "grad_norm": 0.5372612492899006, "learning_rate": 3.911032308196518e-05, "loss": 0.2372, "loss_nan_ranks": 0, "loss_rank_avg": 0.21625232696533203, "step": 805, "valid_targets_mean": 3276.7, "valid_targets_min": 471 }, { "epoch": 1.3106796116504853, "grad_norm": 0.500246673496057, "learning_rate": 3.9086366465938194e-05, "loss": 0.2441, "loss_nan_ranks": 0, "loss_rank_avg": 0.22332966327667236, "step": 810, "valid_targets_mean": 4221.2, "valid_targets_min": 1014 }, { "epoch": 1.3187702265372168, "grad_norm": 0.5393069350727855, "learning_rate": 3.906209911244823e-05, "loss": 0.2328, "loss_nan_ranks": 0, "loss_rank_avg": 0.2488965392112732, "step": 815, "valid_targets_mean": 3860.0, "valid_targets_min": 1522 }, { "epoch": 1.3268608414239482, "grad_norm": 0.558283313672063, "learning_rate": 3.903752141658232e-05, "loss": 0.2412, "loss_nan_ranks": 0, "loss_rank_avg": 0.24360036849975586, "step": 820, "valid_targets_mean": 3291.6, "valid_targets_min": 450 }, { "epoch": 1.3349514563106797, "grad_norm": 0.527247168235714, "learning_rate": 3.9012633778480054e-05, "loss": 0.2345, "loss_nan_ranks": 0, "loss_rank_avg": 0.23953786492347717, "step": 825, "valid_targets_mean": 3723.9, "valid_targets_min": 624 }, { "epoch": 1.343042071197411, "grad_norm": 0.5365474363809069, "learning_rate": 3.8987436603327064e-05, "loss": 0.2405, "loss_nan_ranks": 0, "loss_rank_avg": 0.2417599856853485, "step": 830, "valid_targets_mean": 3770.5, "valid_targets_min": 496 }, { "epoch": 1.3511326860841424, "grad_norm": 0.627416131833293, "learning_rate": 3.896193030134844e-05, "loss": 0.24, "loss_nan_ranks": 0, "loss_rank_avg": 0.21616961061954498, "step": 835, "valid_targets_mean": 3342.2, "valid_targets_min": 377 }, { "epoch": 1.3592233009708738, "grad_norm": 0.5201944735490818, "learning_rate": 3.893611528780204e-05, "loss": 0.2458, "loss_nan_ranks": 0, "loss_rank_avg": 0.24615398049354553, "step": 840, "valid_targets_mean": 4086.8, "valid_targets_min": 2711 }, { "epoch": 1.367313915857605, "grad_norm": 0.49258839979449737, "learning_rate": 3.890999198297171e-05, "loss": 0.2345, "loss_nan_ranks": 0, "loss_rank_avg": 0.23036456108093262, "step": 845, "valid_targets_mean": 4122.5, "valid_targets_min": 1744 }, { "epoch": 1.3754045307443366, "grad_norm": 0.5777476229346971, "learning_rate": 3.888356081216049e-05, "loss": 0.2449, "loss_nan_ranks": 0, "loss_rank_avg": 0.24178913235664368, "step": 850, "valid_targets_mean": 3572.0, "valid_targets_min": 523 }, { "epoch": 1.383495145631068, "grad_norm": 0.6128443853720431, "learning_rate": 3.8856822205683646e-05, "loss": 0.2397, "loss_nan_ranks": 0, "loss_rank_avg": 0.2308482676744461, "step": 855, "valid_targets_mean": 2943.4, "valid_targets_min": 427 }, { "epoch": 1.3915857605177995, "grad_norm": 0.5764652601903296, "learning_rate": 3.882977659886169e-05, "loss": 0.2436, "loss_nan_ranks": 0, "loss_rank_avg": 0.25092625617980957, "step": 860, "valid_targets_mean": 3776.6, "valid_targets_min": 1586 }, { "epoch": 1.3996763754045307, "grad_norm": 0.5072175975075331, "learning_rate": 3.8802424432013283e-05, "loss": 0.2405, "loss_nan_ranks": 0, "loss_rank_avg": 0.2366875559091568, "step": 865, "valid_targets_mean": 4086.3, "valid_targets_min": 1855 }, { "epoch": 1.4077669902912622, "grad_norm": 0.5559560078057603, "learning_rate": 3.8774766150448055e-05, "loss": 0.2404, "loss_nan_ranks": 0, "loss_rank_avg": 0.25183963775634766, "step": 870, "valid_targets_mean": 3595.1, "valid_targets_min": 454 }, { "epoch": 1.4158576051779934, "grad_norm": 0.5350029401989669, "learning_rate": 3.874680220445938e-05, "loss": 0.2315, "loss_nan_ranks": 0, "loss_rank_avg": 0.22824493050575256, "step": 875, "valid_targets_mean": 3540.8, "valid_targets_min": 579 }, { "epoch": 1.4239482200647249, "grad_norm": 0.5447669496074694, "learning_rate": 3.871853304931701e-05, "loss": 0.2437, "loss_nan_ranks": 0, "loss_rank_avg": 0.23308587074279785, "step": 880, "valid_targets_mean": 3631.0, "valid_targets_min": 1014 }, { "epoch": 1.4320388349514563, "grad_norm": 0.5411709921199677, "learning_rate": 3.8689959145259725e-05, "loss": 0.2306, "loss_nan_ranks": 0, "loss_rank_avg": 0.25159168243408203, "step": 885, "valid_targets_mean": 4113.1, "valid_targets_min": 950 }, { "epoch": 1.4401294498381878, "grad_norm": 0.5729522085372347, "learning_rate": 3.866108095748776e-05, "loss": 0.2436, "loss_nan_ranks": 0, "loss_rank_avg": 0.24209068715572357, "step": 890, "valid_targets_mean": 3630.1, "valid_targets_min": 985 }, { "epoch": 1.448220064724919, "grad_norm": 0.9115507641863799, "learning_rate": 3.863189895615529e-05, "loss": 0.2375, "loss_nan_ranks": 0, "loss_rank_avg": 0.24850182235240936, "step": 895, "valid_targets_mean": 3811.0, "valid_targets_min": 1259 }, { "epoch": 1.4563106796116505, "grad_norm": 0.5308936337618426, "learning_rate": 3.8602413616362745e-05, "loss": 0.2445, "loss_nan_ranks": 0, "loss_rank_avg": 0.2650480270385742, "step": 900, "valid_targets_mean": 4117.1, "valid_targets_min": 485 }, { "epoch": 1.4644012944983817, "grad_norm": 0.589828834343643, "learning_rate": 3.85726254181491e-05, "loss": 0.2326, "loss_nan_ranks": 0, "loss_rank_avg": 0.25212791562080383, "step": 905, "valid_targets_mean": 3238.6, "valid_targets_min": 615 }, { "epoch": 1.4724919093851132, "grad_norm": 0.5452549763443945, "learning_rate": 3.8542534846484055e-05, "loss": 0.2268, "loss_nan_ranks": 0, "loss_rank_avg": 0.23172008991241455, "step": 910, "valid_targets_mean": 4015.4, "valid_targets_min": 1840 }, { "epoch": 1.4805825242718447, "grad_norm": 0.488860349833199, "learning_rate": 3.8512142391260085e-05, "loss": 0.2333, "loss_nan_ranks": 0, "loss_rank_avg": 0.21231934428215027, "step": 915, "valid_targets_mean": 3872.8, "valid_targets_min": 1818 }, { "epoch": 1.4886731391585761, "grad_norm": 0.5579335354336327, "learning_rate": 3.848144854728457e-05, "loss": 0.2362, "loss_nan_ranks": 0, "loss_rank_avg": 0.2260228395462036, "step": 920, "valid_targets_mean": 3835.0, "valid_targets_min": 522 }, { "epoch": 1.4967637540453074, "grad_norm": 0.5381713237133415, "learning_rate": 3.8450453814271636e-05, "loss": 0.2418, "loss_nan_ranks": 0, "loss_rank_avg": 0.2695598900318146, "step": 925, "valid_targets_mean": 3745.8, "valid_targets_min": 269 }, { "epoch": 1.5048543689320388, "grad_norm": 0.5004455221868256, "learning_rate": 3.8419158696834075e-05, "loss": 0.2359, "loss_nan_ranks": 0, "loss_rank_avg": 0.2213108390569687, "step": 930, "valid_targets_mean": 3773.2, "valid_targets_min": 374 }, { "epoch": 1.51294498381877, "grad_norm": 0.5946986799926913, "learning_rate": 3.8387563704475124e-05, "loss": 0.2441, "loss_nan_ranks": 0, "loss_rank_avg": 0.25130200386047363, "step": 935, "valid_targets_mean": 3319.4, "valid_targets_min": 349 }, { "epoch": 1.5210355987055015, "grad_norm": 0.554915642632707, "learning_rate": 3.835566935158015e-05, "loss": 0.241, "loss_nan_ranks": 0, "loss_rank_avg": 0.2504206895828247, "step": 940, "valid_targets_mean": 4108.0, "valid_targets_min": 538 }, { "epoch": 1.529126213592233, "grad_norm": 0.6107974094646808, "learning_rate": 3.8323476157408315e-05, "loss": 0.245, "loss_nan_ranks": 0, "loss_rank_avg": 0.2469642460346222, "step": 945, "valid_targets_mean": 3444.4, "valid_targets_min": 405 }, { "epoch": 1.5372168284789645, "grad_norm": 0.48014681884612614, "learning_rate": 3.8290984646084056e-05, "loss": 0.2243, "loss_nan_ranks": 0, "loss_rank_avg": 0.21410520374774933, "step": 950, "valid_targets_mean": 3711.6, "valid_targets_min": 1014 }, { "epoch": 1.545307443365696, "grad_norm": 0.5852050304300088, "learning_rate": 3.825819534658862e-05, "loss": 0.2318, "loss_nan_ranks": 0, "loss_rank_avg": 0.2539462745189667, "step": 955, "valid_targets_mean": 3593.4, "valid_targets_min": 494 }, { "epoch": 1.5533980582524272, "grad_norm": 0.5324836100311932, "learning_rate": 3.822510879275142e-05, "loss": 0.229, "loss_nan_ranks": 0, "loss_rank_avg": 0.2364928424358368, "step": 960, "valid_targets_mean": 4131.8, "valid_targets_min": 749 }, { "epoch": 1.5614886731391586, "grad_norm": 0.5478699189171505, "learning_rate": 3.8191725523241346e-05, "loss": 0.2431, "loss_nan_ranks": 0, "loss_rank_avg": 0.2546507716178894, "step": 965, "valid_targets_mean": 3874.2, "valid_targets_min": 810 }, { "epoch": 1.5695792880258899, "grad_norm": 0.5661577436107965, "learning_rate": 3.8158046081557986e-05, "loss": 0.24, "loss_nan_ranks": 0, "loss_rank_avg": 0.24910283088684082, "step": 970, "valid_targets_mean": 3499.5, "valid_targets_min": 433 }, { "epoch": 1.5776699029126213, "grad_norm": 0.5514241647506224, "learning_rate": 3.812407101602281e-05, "loss": 0.2295, "loss_nan_ranks": 0, "loss_rank_avg": 0.2755923271179199, "step": 975, "valid_targets_mean": 4040.9, "valid_targets_min": 1763 }, { "epoch": 1.5857605177993528, "grad_norm": 0.5112749027291317, "learning_rate": 3.808980087977019e-05, "loss": 0.2346, "loss_nan_ranks": 0, "loss_rank_avg": 0.22368744015693665, "step": 980, "valid_targets_mean": 3874.2, "valid_targets_min": 1686 }, { "epoch": 1.5938511326860842, "grad_norm": 0.5289695797679198, "learning_rate": 3.8055236230738456e-05, "loss": 0.2386, "loss_nan_ranks": 0, "loss_rank_avg": 0.2390768676996231, "step": 985, "valid_targets_mean": 3974.6, "valid_targets_min": 503 }, { "epoch": 1.6019417475728155, "grad_norm": 0.5705928004093642, "learning_rate": 3.8020377631660756e-05, "loss": 0.246, "loss_nan_ranks": 0, "loss_rank_avg": 0.2246730476617813, "step": 990, "valid_targets_mean": 3101.2, "valid_targets_min": 377 }, { "epoch": 1.610032362459547, "grad_norm": 0.7386498116488778, "learning_rate": 3.7985225650055956e-05, "loss": 0.243, "loss_nan_ranks": 0, "loss_rank_avg": 0.2365446835756302, "step": 995, "valid_targets_mean": 3654.5, "valid_targets_min": 370 }, { "epoch": 1.6181229773462782, "grad_norm": 0.5552219499272047, "learning_rate": 3.794978085821933e-05, "loss": 0.2346, "loss_nan_ranks": 0, "loss_rank_avg": 0.251254141330719, "step": 1000, "valid_targets_mean": 3474.9, "valid_targets_min": 419 }, { "epoch": 1.6262135922330097, "grad_norm": 0.5607678761522751, "learning_rate": 3.7914043833213294e-05, "loss": 0.2303, "loss_nan_ranks": 0, "loss_rank_avg": 0.2405933141708374, "step": 1005, "valid_targets_mean": 3489.9, "valid_targets_min": 834 }, { "epoch": 1.6343042071197411, "grad_norm": 0.5527801381980166, "learning_rate": 3.787801515685799e-05, "loss": 0.2368, "loss_nan_ranks": 0, "loss_rank_avg": 0.2157033085823059, "step": 1010, "valid_targets_mean": 3482.9, "valid_targets_min": 1790 }, { "epoch": 1.6423948220064726, "grad_norm": 0.5352962063119632, "learning_rate": 3.7841695415721826e-05, "loss": 0.2308, "loss_nan_ranks": 0, "loss_rank_avg": 0.24081295728683472, "step": 1015, "valid_targets_mean": 4187.8, "valid_targets_min": 470 }, { "epoch": 1.650485436893204, "grad_norm": 0.5789057849731076, "learning_rate": 3.78050852011119e-05, "loss": 0.2387, "loss_nan_ranks": 0, "loss_rank_avg": 0.25976818799972534, "step": 1020, "valid_targets_mean": 3401.8, "valid_targets_min": 957 }, { "epoch": 1.6585760517799353, "grad_norm": 0.4954056092036578, "learning_rate": 3.776818510906442e-05, "loss": 0.2179, "loss_nan_ranks": 0, "loss_rank_avg": 0.23031404614448547, "step": 1025, "valid_targets_mean": 4148.9, "valid_targets_min": 2287 }, { "epoch": 1.6666666666666665, "grad_norm": 0.6286314409012811, "learning_rate": 3.773099574033495e-05, "loss": 0.2334, "loss_nan_ranks": 0, "loss_rank_avg": 0.23707111179828644, "step": 1030, "valid_targets_mean": 3307.8, "valid_targets_min": 672 }, { "epoch": 1.674757281553398, "grad_norm": 0.6553707458396025, "learning_rate": 3.7693517700388655e-05, "loss": 0.2301, "loss_nan_ranks": 0, "loss_rank_avg": 0.23486413061618805, "step": 1035, "valid_targets_mean": 4047.2, "valid_targets_min": 800 }, { "epoch": 1.6828478964401294, "grad_norm": 0.5934097873043159, "learning_rate": 3.765575159939045e-05, "loss": 0.2404, "loss_nan_ranks": 0, "loss_rank_avg": 0.2771807610988617, "step": 1040, "valid_targets_mean": 3773.2, "valid_targets_min": 507 }, { "epoch": 1.690938511326861, "grad_norm": 0.5378081205172018, "learning_rate": 3.761769805219505e-05, "loss": 0.2302, "loss_nan_ranks": 0, "loss_rank_avg": 0.22613410651683807, "step": 1045, "valid_targets_mean": 3719.8, "valid_targets_min": 1457 }, { "epoch": 1.6990291262135924, "grad_norm": 0.520359262056707, "learning_rate": 3.757935767833696e-05, "loss": 0.2311, "loss_nan_ranks": 0, "loss_rank_avg": 0.22133636474609375, "step": 1050, "valid_targets_mean": 3763.7, "valid_targets_min": 456 }, { "epoch": 1.7071197411003236, "grad_norm": 0.5008194986466029, "learning_rate": 3.7540731102020405e-05, "loss": 0.2326, "loss_nan_ranks": 0, "loss_rank_avg": 0.22984489798545837, "step": 1055, "valid_targets_mean": 3929.0, "valid_targets_min": 909 }, { "epoch": 1.715210355987055, "grad_norm": 0.5838525301390869, "learning_rate": 3.7501818952109156e-05, "loss": 0.2403, "loss_nan_ranks": 0, "loss_rank_avg": 0.22893069684505463, "step": 1060, "valid_targets_mean": 3512.1, "valid_targets_min": 739 }, { "epoch": 1.7233009708737863, "grad_norm": 1.3176771422050513, "learning_rate": 3.746262186211629e-05, "loss": 0.2381, "loss_nan_ranks": 0, "loss_rank_avg": 0.24603205919265747, "step": 1065, "valid_targets_mean": 3416.9, "valid_targets_min": 480 }, { "epoch": 1.7313915857605178, "grad_norm": 0.49404756439683184, "learning_rate": 3.742314047019386e-05, "loss": 0.2368, "loss_nan_ranks": 0, "loss_rank_avg": 0.22380509972572327, "step": 1070, "valid_targets_mean": 3805.4, "valid_targets_min": 259 }, { "epoch": 1.7394822006472492, "grad_norm": 0.5236273776513967, "learning_rate": 3.7383375419122565e-05, "loss": 0.2263, "loss_nan_ranks": 0, "loss_rank_avg": 0.21787169575691223, "step": 1075, "valid_targets_mean": 3729.4, "valid_targets_min": 549 }, { "epoch": 1.7475728155339807, "grad_norm": 0.5366758234665157, "learning_rate": 3.734332735630121e-05, "loss": 0.2295, "loss_nan_ranks": 0, "loss_rank_avg": 0.22697246074676514, "step": 1080, "valid_targets_mean": 3726.1, "valid_targets_min": 460 }, { "epoch": 1.755663430420712, "grad_norm": 0.5880569909763975, "learning_rate": 3.730299693373622e-05, "loss": 0.2369, "loss_nan_ranks": 0, "loss_rank_avg": 0.24402067065238953, "step": 1085, "valid_targets_mean": 3389.1, "valid_targets_min": 551 }, { "epoch": 1.7637540453074434, "grad_norm": 0.5732738836935737, "learning_rate": 3.7262384808031004e-05, "loss": 0.2386, "loss_nan_ranks": 0, "loss_rank_avg": 0.23770153522491455, "step": 1090, "valid_targets_mean": 3941.0, "valid_targets_min": 2001 }, { "epoch": 1.7718446601941746, "grad_norm": 0.5790818828962175, "learning_rate": 3.722149164037525e-05, "loss": 0.2328, "loss_nan_ranks": 0, "loss_rank_avg": 0.2508291006088257, "step": 1095, "valid_targets_mean": 3566.1, "valid_targets_min": 872 }, { "epoch": 1.779935275080906, "grad_norm": 0.5588093189627107, "learning_rate": 3.718031809653419e-05, "loss": 0.2316, "loss_nan_ranks": 0, "loss_rank_avg": 0.2560824155807495, "step": 1100, "valid_targets_mean": 4033.4, "valid_targets_min": 1396 }, { "epoch": 1.7880258899676376, "grad_norm": 0.5358396313208293, "learning_rate": 3.713886484683776e-05, "loss": 0.2271, "loss_nan_ranks": 0, "loss_rank_avg": 0.2311561405658722, "step": 1105, "valid_targets_mean": 3314.1, "valid_targets_min": 372 }, { "epoch": 1.796116504854369, "grad_norm": 0.5222906484183111, "learning_rate": 3.7097132566169644e-05, "loss": 0.2446, "loss_nan_ranks": 0, "loss_rank_avg": 0.2244446873664856, "step": 1110, "valid_targets_mean": 3713.9, "valid_targets_min": 599 }, { "epoch": 1.8042071197411005, "grad_norm": 0.5719814501478453, "learning_rate": 3.7055121933956344e-05, "loss": 0.233, "loss_nan_ranks": 0, "loss_rank_avg": 0.24464090168476105, "step": 1115, "valid_targets_mean": 3385.4, "valid_targets_min": 1076 }, { "epoch": 1.8122977346278317, "grad_norm": 0.49942174241821524, "learning_rate": 3.7012833634156074e-05, "loss": 0.2284, "loss_nan_ranks": 0, "loss_rank_avg": 0.21926362812519073, "step": 1120, "valid_targets_mean": 3780.5, "valid_targets_min": 1138 }, { "epoch": 1.820388349514563, "grad_norm": 0.5236595180717353, "learning_rate": 3.6970268355247664e-05, "loss": 0.2257, "loss_nan_ranks": 0, "loss_rank_avg": 0.23075798153877258, "step": 1125, "valid_targets_mean": 4367.0, "valid_targets_min": 2408 }, { "epoch": 1.8284789644012944, "grad_norm": 0.512201160936164, "learning_rate": 3.6927426790219296e-05, "loss": 0.2275, "loss_nan_ranks": 0, "loss_rank_avg": 0.22904011607170105, "step": 1130, "valid_targets_mean": 3974.8, "valid_targets_min": 430 }, { "epoch": 1.8365695792880259, "grad_norm": 0.5421531914600399, "learning_rate": 3.6884309636557294e-05, "loss": 0.2289, "loss_nan_ranks": 0, "loss_rank_avg": 0.23919343948364258, "step": 1135, "valid_targets_mean": 4035.8, "valid_targets_min": 613 }, { "epoch": 1.8446601941747574, "grad_norm": 0.5030012800087369, "learning_rate": 3.6840917596234706e-05, "loss": 0.2294, "loss_nan_ranks": 0, "loss_rank_avg": 0.21478207409381866, "step": 1140, "valid_targets_mean": 3792.1, "valid_targets_min": 1940 }, { "epoch": 1.8527508090614888, "grad_norm": 0.4942511653414622, "learning_rate": 3.67972513756999e-05, "loss": 0.2313, "loss_nan_ranks": 0, "loss_rank_avg": 0.22776880860328674, "step": 1145, "valid_targets_mean": 4292.5, "valid_targets_min": 3142 }, { "epoch": 1.86084142394822, "grad_norm": 0.5531908060139232, "learning_rate": 3.675331168586507e-05, "loss": 0.2469, "loss_nan_ranks": 0, "loss_rank_avg": 0.2260960340499878, "step": 1150, "valid_targets_mean": 3819.9, "valid_targets_min": 2287 }, { "epoch": 1.8689320388349513, "grad_norm": 0.5470369953036037, "learning_rate": 3.670909924209464e-05, "loss": 0.2228, "loss_nan_ranks": 0, "loss_rank_avg": 0.2212294042110443, "step": 1155, "valid_targets_mean": 3313.6, "valid_targets_min": 1344 }, { "epoch": 1.8770226537216828, "grad_norm": 0.6663201618271906, "learning_rate": 3.666461476419366e-05, "loss": 0.2394, "loss_nan_ranks": 0, "loss_rank_avg": 0.22908449172973633, "step": 1160, "valid_targets_mean": 3906.2, "valid_targets_min": 1558 }, { "epoch": 1.8851132686084142, "grad_norm": 0.5574954468183086, "learning_rate": 3.6619858976396024e-05, "loss": 0.2272, "loss_nan_ranks": 0, "loss_rank_avg": 0.2327789068222046, "step": 1165, "valid_targets_mean": 3522.2, "valid_targets_min": 431 }, { "epoch": 1.8932038834951457, "grad_norm": 0.5620174972243343, "learning_rate": 3.657483260735274e-05, "loss": 0.2472, "loss_nan_ranks": 0, "loss_rank_avg": 0.24146509170532227, "step": 1170, "valid_targets_mean": 3762.1, "valid_targets_min": 488 }, { "epoch": 1.9012944983818771, "grad_norm": 0.5361897984263154, "learning_rate": 3.652953639012001e-05, "loss": 0.2321, "loss_nan_ranks": 0, "loss_rank_avg": 0.23045086860656738, "step": 1175, "valid_targets_mean": 3549.8, "valid_targets_min": 599 }, { "epoch": 1.9093851132686084, "grad_norm": 0.5229274187192743, "learning_rate": 3.648397106214737e-05, "loss": 0.2347, "loss_nan_ranks": 0, "loss_rank_avg": 0.23464813828468323, "step": 1180, "valid_targets_mean": 3790.5, "valid_targets_min": 509 }, { "epoch": 1.9174757281553398, "grad_norm": 0.5543253937763715, "learning_rate": 3.6438137365265605e-05, "loss": 0.2289, "loss_nan_ranks": 0, "loss_rank_avg": 0.2228466123342514, "step": 1185, "valid_targets_mean": 3626.7, "valid_targets_min": 1124 }, { "epoch": 1.925566343042071, "grad_norm": 0.529511456822995, "learning_rate": 3.639203604567471e-05, "loss": 0.227, "loss_nan_ranks": 0, "loss_rank_avg": 0.24794839322566986, "step": 1190, "valid_targets_mean": 3834.1, "valid_targets_min": 1399 }, { "epoch": 1.9336569579288025, "grad_norm": 0.531993228725407, "learning_rate": 3.634566785393175e-05, "loss": 0.2383, "loss_nan_ranks": 0, "loss_rank_avg": 0.25982001423835754, "step": 1195, "valid_targets_mean": 4059.9, "valid_targets_min": 436 }, { "epoch": 1.941747572815534, "grad_norm": 0.5265102733273151, "learning_rate": 3.629903354493863e-05, "loss": 0.232, "loss_nan_ranks": 0, "loss_rank_avg": 0.2254936546087265, "step": 1200, "valid_targets_mean": 3641.8, "valid_targets_min": 364 }, { "epoch": 1.9498381877022655, "grad_norm": 0.501456617132805, "learning_rate": 3.625213387792979e-05, "loss": 0.2327, "loss_nan_ranks": 0, "loss_rank_avg": 0.2376459538936615, "step": 1205, "valid_targets_mean": 4138.9, "valid_targets_min": 816 }, { "epoch": 1.9579288025889967, "grad_norm": 0.5764064629638148, "learning_rate": 3.620496961645986e-05, "loss": 0.2295, "loss_nan_ranks": 0, "loss_rank_avg": 0.2591501772403717, "step": 1210, "valid_targets_mean": 3676.3, "valid_targets_min": 1492 }, { "epoch": 1.9660194174757282, "grad_norm": 0.5031251840065841, "learning_rate": 3.615754152839122e-05, "loss": 0.2292, "loss_nan_ranks": 0, "loss_rank_avg": 0.22879642248153687, "step": 1215, "valid_targets_mean": 4046.3, "valid_targets_min": 2065 }, { "epoch": 1.9741100323624594, "grad_norm": 0.5059144405997464, "learning_rate": 3.610985038588153e-05, "loss": 0.2236, "loss_nan_ranks": 0, "loss_rank_avg": 0.19675277173519135, "step": 1220, "valid_targets_mean": 3762.8, "valid_targets_min": 1268 }, { "epoch": 1.9822006472491909, "grad_norm": 0.5147056567182494, "learning_rate": 3.606189696537112e-05, "loss": 0.2272, "loss_nan_ranks": 0, "loss_rank_avg": 0.22215335071086884, "step": 1225, "valid_targets_mean": 4182.2, "valid_targets_min": 2542 }, { "epoch": 1.9902912621359223, "grad_norm": 0.4962653381732891, "learning_rate": 3.601368204757034e-05, "loss": 0.2187, "loss_nan_ranks": 0, "loss_rank_avg": 0.21097412705421448, "step": 1230, "valid_targets_mean": 4162.3, "valid_targets_min": 1656 }, { "epoch": 1.9983818770226538, "grad_norm": 0.577252598785239, "learning_rate": 3.596520641744691e-05, "loss": 0.2244, "loss_nan_ranks": 0, "loss_rank_avg": 0.23722471296787262, "step": 1235, "valid_targets_mean": 3291.0, "valid_targets_min": 454 }, { "epoch": 2.0064724919093853, "grad_norm": 0.4993415945161253, "learning_rate": 3.591647086421308e-05, "loss": 0.2137, "loss_nan_ranks": 0, "loss_rank_avg": 0.21230442821979523, "step": 1240, "valid_targets_mean": 3964.4, "valid_targets_min": 2176 }, { "epoch": 2.0145631067961167, "grad_norm": 0.5966427219749822, "learning_rate": 3.586747618131281e-05, "loss": 0.2045, "loss_nan_ranks": 0, "loss_rank_avg": 0.23013052344322205, "step": 1245, "valid_targets_mean": 3509.5, "valid_targets_min": 478 }, { "epoch": 2.0226537216828477, "grad_norm": 0.5074745492260596, "learning_rate": 3.581822316640884e-05, "loss": 0.1965, "loss_nan_ranks": 0, "loss_rank_avg": 0.18717864155769348, "step": 1250, "valid_targets_mean": 3663.1, "valid_targets_min": 1630 }, { "epoch": 2.030744336569579, "grad_norm": 0.5173949946365176, "learning_rate": 3.5768712621369724e-05, "loss": 0.1974, "loss_nan_ranks": 0, "loss_rank_avg": 0.18645232915878296, "step": 1255, "valid_targets_mean": 3951.8, "valid_targets_min": 1333 }, { "epoch": 2.0388349514563107, "grad_norm": 0.5448045943609541, "learning_rate": 3.571894535225674e-05, "loss": 0.1983, "loss_nan_ranks": 0, "loss_rank_avg": 0.1799754500389099, "step": 1260, "valid_targets_mean": 3515.6, "valid_targets_min": 775 }, { "epoch": 2.046925566343042, "grad_norm": 0.5746768972560183, "learning_rate": 3.566892216931081e-05, "loss": 0.2061, "loss_nan_ranks": 0, "loss_rank_avg": 0.19511979818344116, "step": 1265, "valid_targets_mean": 3279.9, "valid_targets_min": 551 }, { "epoch": 2.0550161812297736, "grad_norm": 0.5648116924397264, "learning_rate": 3.561864388693926e-05, "loss": 0.2071, "loss_nan_ranks": 0, "loss_rank_avg": 0.2113444060087204, "step": 1270, "valid_targets_mean": 3652.9, "valid_targets_min": 1138 }, { "epoch": 2.063106796116505, "grad_norm": 0.5516073010997726, "learning_rate": 3.556811132370261e-05, "loss": 0.2095, "loss_nan_ranks": 0, "loss_rank_avg": 0.20847252011299133, "step": 1275, "valid_targets_mean": 3552.1, "valid_targets_min": 499 }, { "epoch": 2.071197411003236, "grad_norm": 0.7203895860407499, "learning_rate": 3.551732530230123e-05, "loss": 0.2194, "loss_nan_ranks": 0, "loss_rank_avg": 0.21450018882751465, "step": 1280, "valid_targets_mean": 3142.6, "valid_targets_min": 470 }, { "epoch": 2.0792880258899675, "grad_norm": 0.8756711994922913, "learning_rate": 3.54662866495619e-05, "loss": 0.2029, "loss_nan_ranks": 0, "loss_rank_avg": 0.18415921926498413, "step": 1285, "valid_targets_mean": 3720.0, "valid_targets_min": 1326 }, { "epoch": 2.087378640776699, "grad_norm": 0.5096759527620363, "learning_rate": 3.5414996196424435e-05, "loss": 0.2088, "loss_nan_ranks": 0, "loss_rank_avg": 0.18555939197540283, "step": 1290, "valid_targets_mean": 3764.2, "valid_targets_min": 533 }, { "epoch": 2.0954692556634305, "grad_norm": 0.5196043558651653, "learning_rate": 3.536345477792809e-05, "loss": 0.211, "loss_nan_ranks": 0, "loss_rank_avg": 0.21714207530021667, "step": 1295, "valid_targets_mean": 4167.4, "valid_targets_min": 1319 }, { "epoch": 2.103559870550162, "grad_norm": 0.5198619298874421, "learning_rate": 3.5311663233197984e-05, "loss": 0.1999, "loss_nan_ranks": 0, "loss_rank_avg": 0.21272701025009155, "step": 1300, "valid_targets_mean": 3971.4, "valid_targets_min": 2091 }, { "epoch": 2.1116504854368934, "grad_norm": 0.5928562565695267, "learning_rate": 3.525962240543144e-05, "loss": 0.2152, "loss_nan_ranks": 0, "loss_rank_avg": 0.22063596546649933, "step": 1305, "valid_targets_mean": 3416.7, "valid_targets_min": 607 }, { "epoch": 2.1197411003236244, "grad_norm": 0.5216255221584896, "learning_rate": 3.520733314188429e-05, "loss": 0.2193, "loss_nan_ranks": 0, "loss_rank_avg": 0.21724799275398254, "step": 1310, "valid_targets_mean": 4127.8, "valid_targets_min": 2446 }, { "epoch": 2.127831715210356, "grad_norm": 0.5474600583613157, "learning_rate": 3.515479629385699e-05, "loss": 0.2075, "loss_nan_ranks": 0, "loss_rank_avg": 0.20810237526893616, "step": 1315, "valid_targets_mean": 3830.8, "valid_targets_min": 834 }, { "epoch": 2.1359223300970873, "grad_norm": 0.48930392242915055, "learning_rate": 3.5102012716680875e-05, "loss": 0.1991, "loss_nan_ranks": 0, "loss_rank_avg": 0.19523948431015015, "step": 1320, "valid_targets_mean": 4223.8, "valid_targets_min": 2806 }, { "epoch": 2.144012944983819, "grad_norm": 0.5866244137062765, "learning_rate": 3.504898326970414e-05, "loss": 0.21, "loss_nan_ranks": 0, "loss_rank_avg": 0.200786292552948, "step": 1325, "valid_targets_mean": 3740.6, "valid_targets_min": 479 }, { "epoch": 2.1521035598705502, "grad_norm": 0.546507028724296, "learning_rate": 3.499570881627791e-05, "loss": 0.2036, "loss_nan_ranks": 0, "loss_rank_avg": 0.20447948575019836, "step": 1330, "valid_targets_mean": 4271.7, "valid_targets_min": 2185 }, { "epoch": 2.1601941747572817, "grad_norm": 0.5501111945463919, "learning_rate": 3.494219022374215e-05, "loss": 0.1963, "loss_nan_ranks": 0, "loss_rank_avg": 0.17158368229866028, "step": 1335, "valid_targets_mean": 3503.9, "valid_targets_min": 1555 }, { "epoch": 2.168284789644013, "grad_norm": 0.5332981963079229, "learning_rate": 3.4888428363411564e-05, "loss": 0.2126, "loss_nan_ranks": 0, "loss_rank_avg": 0.2065584659576416, "step": 1340, "valid_targets_mean": 3692.7, "valid_targets_min": 1725 }, { "epoch": 2.176375404530744, "grad_norm": 0.5227522173533274, "learning_rate": 3.48344241105614e-05, "loss": 0.2054, "loss_nan_ranks": 0, "loss_rank_avg": 0.17856690287590027, "step": 1345, "valid_targets_mean": 3659.4, "valid_targets_min": 428 }, { "epoch": 2.1844660194174756, "grad_norm": 0.5249981570603643, "learning_rate": 3.478017834441319e-05, "loss": 0.203, "loss_nan_ranks": 0, "loss_rank_avg": 0.2090633660554886, "step": 1350, "valid_targets_mean": 3779.1, "valid_targets_min": 1938 }, { "epoch": 2.192556634304207, "grad_norm": 0.5704929170229348, "learning_rate": 3.472569194812045e-05, "loss": 0.2067, "loss_nan_ranks": 0, "loss_rank_avg": 0.20181623101234436, "step": 1355, "valid_targets_mean": 3276.9, "valid_targets_min": 469 }, { "epoch": 2.2006472491909386, "grad_norm": 0.5588805782852425, "learning_rate": 3.467096580875432e-05, "loss": 0.2205, "loss_nan_ranks": 0, "loss_rank_avg": 0.22426563501358032, "step": 1360, "valid_targets_mean": 3875.8, "valid_targets_min": 1872 }, { "epoch": 2.20873786407767, "grad_norm": 0.5509007102722255, "learning_rate": 3.4616000817289076e-05, "loss": 0.2017, "loss_nan_ranks": 0, "loss_rank_avg": 0.19825254380702972, "step": 1365, "valid_targets_mean": 3587.5, "valid_targets_min": 503 }, { "epoch": 2.2168284789644015, "grad_norm": 0.5222770840734019, "learning_rate": 3.456079786858766e-05, "loss": 0.1953, "loss_nan_ranks": 0, "loss_rank_avg": 0.18225571513175964, "step": 1370, "valid_targets_mean": 3472.8, "valid_targets_min": 421 }, { "epoch": 2.2249190938511325, "grad_norm": 0.5335762760883815, "learning_rate": 3.450535786138709e-05, "loss": 0.2062, "loss_nan_ranks": 0, "loss_rank_avg": 0.2157287895679474, "step": 1375, "valid_targets_mean": 4006.0, "valid_targets_min": 810 }, { "epoch": 2.233009708737864, "grad_norm": 0.5911174264119916, "learning_rate": 3.4449681698283856e-05, "loss": 0.2241, "loss_nan_ranks": 0, "loss_rank_avg": 0.22825801372528076, "step": 1380, "valid_targets_mean": 3319.5, "valid_targets_min": 433 }, { "epoch": 2.2411003236245954, "grad_norm": 0.5582155327413821, "learning_rate": 3.4393770285719196e-05, "loss": 0.2028, "loss_nan_ranks": 0, "loss_rank_avg": 0.18830609321594238, "step": 1385, "valid_targets_mean": 3346.9, "valid_targets_min": 409 }, { "epoch": 2.249190938511327, "grad_norm": 0.5048820994486662, "learning_rate": 3.433762453396434e-05, "loss": 0.2062, "loss_nan_ranks": 0, "loss_rank_avg": 0.18742072582244873, "step": 1390, "valid_targets_mean": 4147.5, "valid_targets_min": 456 }, { "epoch": 2.2572815533980584, "grad_norm": 0.5410154491099326, "learning_rate": 3.4281245357105726e-05, "loss": 0.2033, "loss_nan_ranks": 0, "loss_rank_avg": 0.20132315158843994, "step": 1395, "valid_targets_mean": 3883.0, "valid_targets_min": 1641 }, { "epoch": 2.26537216828479, "grad_norm": 0.5709057031867241, "learning_rate": 3.4224633673030074e-05, "loss": 0.2069, "loss_nan_ranks": 0, "loss_rank_avg": 0.20349285006523132, "step": 1400, "valid_targets_mean": 3687.4, "valid_targets_min": 1259 }, { "epoch": 2.273462783171521, "grad_norm": 0.5195581585764436, "learning_rate": 3.416779040340945e-05, "loss": 0.2041, "loss_nan_ranks": 0, "loss_rank_avg": 0.18851682543754578, "step": 1405, "valid_targets_mean": 3685.3, "valid_targets_min": 547 }, { "epoch": 2.2815533980582523, "grad_norm": 0.6363313435467606, "learning_rate": 3.4110716473686305e-05, "loss": 0.2, "loss_nan_ranks": 0, "loss_rank_avg": 0.2130783498287201, "step": 1410, "valid_targets_mean": 3862.9, "valid_targets_min": 479 }, { "epoch": 2.2896440129449838, "grad_norm": 0.5643587316981776, "learning_rate": 3.405341281305835e-05, "loss": 0.1994, "loss_nan_ranks": 0, "loss_rank_avg": 0.18532046675682068, "step": 1415, "valid_targets_mean": 3771.4, "valid_targets_min": 1340 }, { "epoch": 2.2977346278317152, "grad_norm": 0.6002935838348056, "learning_rate": 3.3995880354463444e-05, "loss": 0.1981, "loss_nan_ranks": 0, "loss_rank_avg": 0.19355767965316772, "step": 1420, "valid_targets_mean": 3108.6, "valid_targets_min": 457 }, { "epoch": 2.3058252427184467, "grad_norm": 0.6594173942377517, "learning_rate": 3.393812003456444e-05, "loss": 0.1975, "loss_nan_ranks": 0, "loss_rank_avg": 0.1892772614955902, "step": 1425, "valid_targets_mean": 3523.7, "valid_targets_min": 419 }, { "epoch": 2.313915857605178, "grad_norm": 0.5392073312759366, "learning_rate": 3.3880132793733896e-05, "loss": 0.2049, "loss_nan_ranks": 0, "loss_rank_avg": 0.17127923667430878, "step": 1430, "valid_targets_mean": 3360.4, "valid_targets_min": 909 }, { "epoch": 2.3220064724919096, "grad_norm": 0.6041744216730695, "learning_rate": 3.382191957603878e-05, "loss": 0.209, "loss_nan_ranks": 0, "loss_rank_avg": 0.21991001069545746, "step": 1435, "valid_targets_mean": 3557.8, "valid_targets_min": 1446 }, { "epoch": 2.3300970873786406, "grad_norm": 0.5036421334771191, "learning_rate": 3.376348132922509e-05, "loss": 0.2048, "loss_nan_ranks": 0, "loss_rank_avg": 0.19798916578292847, "step": 1440, "valid_targets_mean": 4315.9, "valid_targets_min": 3091 }, { "epoch": 2.338187702265372, "grad_norm": 0.5210163872616127, "learning_rate": 3.3704819004702444e-05, "loss": 0.2142, "loss_nan_ranks": 0, "loss_rank_avg": 0.19083701074123383, "step": 1445, "valid_targets_mean": 3990.8, "valid_targets_min": 1812 }, { "epoch": 2.3462783171521036, "grad_norm": 0.5382923205946923, "learning_rate": 3.364593355752857e-05, "loss": 0.2155, "loss_nan_ranks": 0, "loss_rank_avg": 0.22279268503189087, "step": 1450, "valid_targets_mean": 4153.6, "valid_targets_min": 2749 }, { "epoch": 2.354368932038835, "grad_norm": 0.5690802179863486, "learning_rate": 3.358682594639379e-05, "loss": 0.2003, "loss_nan_ranks": 0, "loss_rank_avg": 0.21023952960968018, "step": 1455, "valid_targets_mean": 4108.8, "valid_targets_min": 422 }, { "epoch": 2.3624595469255665, "grad_norm": 0.5587521088638144, "learning_rate": 3.3527497133605345e-05, "loss": 0.2032, "loss_nan_ranks": 0, "loss_rank_avg": 0.21760553121566772, "step": 1460, "valid_targets_mean": 4084.8, "valid_targets_min": 2096 }, { "epoch": 2.3705501618122975, "grad_norm": 0.6327920191794262, "learning_rate": 3.346794808507182e-05, "loss": 0.1995, "loss_nan_ranks": 0, "loss_rank_avg": 0.19593237340450287, "step": 1465, "valid_targets_mean": 3724.5, "valid_targets_min": 460 }, { "epoch": 2.378640776699029, "grad_norm": 0.5243331783837871, "learning_rate": 3.340817977028732e-05, "loss": 0.2065, "loss_nan_ranks": 0, "loss_rank_avg": 0.1890985071659088, "step": 1470, "valid_targets_mean": 3856.2, "valid_targets_min": 1060 }, { "epoch": 2.3867313915857604, "grad_norm": 0.6002411735204223, "learning_rate": 3.3348193162315786e-05, "loss": 0.2013, "loss_nan_ranks": 0, "loss_rank_avg": 0.21150943636894226, "step": 1475, "valid_targets_mean": 3088.4, "valid_targets_min": 426 }, { "epoch": 2.394822006472492, "grad_norm": 0.6149693570960357, "learning_rate": 3.3287989237775064e-05, "loss": 0.2047, "loss_nan_ranks": 0, "loss_rank_avg": 0.20418787002563477, "step": 1480, "valid_targets_mean": 3793.6, "valid_targets_min": 1215 }, { "epoch": 2.4029126213592233, "grad_norm": 0.5452824529033008, "learning_rate": 3.322756897682106e-05, "loss": 0.2027, "loss_nan_ranks": 0, "loss_rank_avg": 0.19814196228981018, "step": 1485, "valid_targets_mean": 3985.6, "valid_targets_min": 1819 }, { "epoch": 2.411003236245955, "grad_norm": 0.5481539653642269, "learning_rate": 3.3166933363131765e-05, "loss": 0.1931, "loss_nan_ranks": 0, "loss_rank_avg": 0.18332578241825104, "step": 1490, "valid_targets_mean": 3920.4, "valid_targets_min": 313 }, { "epoch": 2.4190938511326863, "grad_norm": 0.5389343062157606, "learning_rate": 3.310608338389124e-05, "loss": 0.204, "loss_nan_ranks": 0, "loss_rank_avg": 0.19974827766418457, "step": 1495, "valid_targets_mean": 4036.6, "valid_targets_min": 712 }, { "epoch": 2.4271844660194173, "grad_norm": 0.5611663097998205, "learning_rate": 3.304502002977355e-05, "loss": 0.205, "loss_nan_ranks": 0, "loss_rank_avg": 0.18663233518600464, "step": 1500, "valid_targets_mean": 4147.1, "valid_targets_min": 2026 }, { "epoch": 2.4352750809061487, "grad_norm": 0.5505208094874494, "learning_rate": 3.2983744294926614e-05, "loss": 0.205, "loss_nan_ranks": 0, "loss_rank_avg": 0.20405398309230804, "step": 1505, "valid_targets_mean": 3872.2, "valid_targets_min": 535 }, { "epoch": 2.44336569579288, "grad_norm": 0.7012874764369187, "learning_rate": 3.292225717695606e-05, "loss": 0.2087, "loss_nan_ranks": 0, "loss_rank_avg": 0.2327345907688141, "step": 1510, "valid_targets_mean": 3637.6, "valid_targets_min": 313 }, { "epoch": 2.4514563106796117, "grad_norm": 1.1024977498248867, "learning_rate": 3.286055967690894e-05, "loss": 0.2161, "loss_nan_ranks": 0, "loss_rank_avg": 0.21150124073028564, "step": 1515, "valid_targets_mean": 4220.2, "valid_targets_min": 3011 }, { "epoch": 2.459546925566343, "grad_norm": 0.7097144552349174, "learning_rate": 3.279865279925748e-05, "loss": 0.2051, "loss_nan_ranks": 0, "loss_rank_avg": 0.20087671279907227, "step": 1520, "valid_targets_mean": 3596.6, "valid_targets_min": 1667 }, { "epoch": 2.4676375404530746, "grad_norm": 0.6102242644893953, "learning_rate": 3.273653755188265e-05, "loss": 0.2071, "loss_nan_ranks": 0, "loss_rank_avg": 0.21528849005699158, "step": 1525, "valid_targets_mean": 3797.2, "valid_targets_min": 1174 }, { "epoch": 2.475728155339806, "grad_norm": 0.5996789804839444, "learning_rate": 3.267421494605786e-05, "loss": 0.1994, "loss_nan_ranks": 0, "loss_rank_avg": 0.2003488689661026, "step": 1530, "valid_targets_mean": 3306.8, "valid_targets_min": 330 }, { "epoch": 2.483818770226537, "grad_norm": 0.5539684053989401, "learning_rate": 3.261168599643239e-05, "loss": 0.2146, "loss_nan_ranks": 0, "loss_rank_avg": 0.19859477877616882, "step": 1535, "valid_targets_mean": 3921.0, "valid_targets_min": 1528 }, { "epoch": 2.4919093851132685, "grad_norm": 0.5800147569212741, "learning_rate": 3.254895172101495e-05, "loss": 0.2057, "loss_nan_ranks": 0, "loss_rank_avg": 0.20788471400737762, "step": 1540, "valid_targets_mean": 3650.2, "valid_targets_min": 1779 }, { "epoch": 2.5, "grad_norm": 0.5444327898653049, "learning_rate": 3.248601314115709e-05, "loss": 0.2042, "loss_nan_ranks": 0, "loss_rank_avg": 0.19758197665214539, "step": 1545, "valid_targets_mean": 3911.5, "valid_targets_min": 1092 }, { "epoch": 2.5080906148867315, "grad_norm": 0.5585959818809851, "learning_rate": 3.2422871281536504e-05, "loss": 0.2023, "loss_nan_ranks": 0, "loss_rank_avg": 0.20119929313659668, "step": 1550, "valid_targets_mean": 3706.0, "valid_targets_min": 391 }, { "epoch": 2.516181229773463, "grad_norm": 0.5786946765486497, "learning_rate": 3.235952717014046e-05, "loss": 0.1966, "loss_nan_ranks": 0, "loss_rank_avg": 0.18431814014911652, "step": 1555, "valid_targets_mean": 3852.7, "valid_targets_min": 1344 }, { "epoch": 2.524271844660194, "grad_norm": 0.722163694671597, "learning_rate": 3.229598183824897e-05, "loss": 0.2027, "loss_nan_ranks": 0, "loss_rank_avg": 0.19687601923942566, "step": 1560, "valid_targets_mean": 3535.8, "valid_targets_min": 377 }, { "epoch": 2.5323624595469254, "grad_norm": 0.5945221722717067, "learning_rate": 3.223223632041806e-05, "loss": 0.1972, "loss_nan_ranks": 0, "loss_rank_avg": 0.19220665097236633, "step": 1565, "valid_targets_mean": 3312.9, "valid_targets_min": 1484 }, { "epoch": 2.540453074433657, "grad_norm": 0.5463852945973736, "learning_rate": 3.216829165446288e-05, "loss": 0.2014, "loss_nan_ranks": 0, "loss_rank_avg": 0.20611058175563812, "step": 1570, "valid_targets_mean": 3802.0, "valid_targets_min": 997 }, { "epoch": 2.5485436893203883, "grad_norm": 0.5992106420260478, "learning_rate": 3.210414888144085e-05, "loss": 0.2119, "loss_nan_ranks": 0, "loss_rank_avg": 0.2046264111995697, "step": 1575, "valid_targets_mean": 3380.8, "valid_targets_min": 480 }, { "epoch": 2.55663430420712, "grad_norm": 0.5425409151257213, "learning_rate": 3.203980904563467e-05, "loss": 0.2031, "loss_nan_ranks": 0, "loss_rank_avg": 0.19060689210891724, "step": 1580, "valid_targets_mean": 4033.8, "valid_targets_min": 1890 }, { "epoch": 2.5647249190938513, "grad_norm": 0.5481719828708285, "learning_rate": 3.1975273194535365e-05, "loss": 0.2059, "loss_nan_ranks": 0, "loss_rank_avg": 0.17384769022464752, "step": 1585, "valid_targets_mean": 3420.6, "valid_targets_min": 422 }, { "epoch": 2.5728155339805827, "grad_norm": 0.5535876172620676, "learning_rate": 3.191054237882519e-05, "loss": 0.1992, "loss_nan_ranks": 0, "loss_rank_avg": 0.20850872993469238, "step": 1590, "valid_targets_mean": 3588.6, "valid_targets_min": 330 }, { "epoch": 2.5809061488673137, "grad_norm": 0.5799991839791976, "learning_rate": 3.1845617652360556e-05, "loss": 0.2066, "loss_nan_ranks": 0, "loss_rank_avg": 0.204398050904274, "step": 1595, "valid_targets_mean": 3439.6, "valid_targets_min": 957 }, { "epoch": 2.588996763754045, "grad_norm": 0.5277347822812265, "learning_rate": 3.178050007215483e-05, "loss": 0.207, "loss_nan_ranks": 0, "loss_rank_avg": 0.1802809089422226, "step": 1600, "valid_targets_mean": 3597.8, "valid_targets_min": 409 }, { "epoch": 2.5970873786407767, "grad_norm": 0.5922385180939794, "learning_rate": 3.171519069836118e-05, "loss": 0.1975, "loss_nan_ranks": 0, "loss_rank_avg": 0.20629601180553436, "step": 1605, "valid_targets_mean": 3622.6, "valid_targets_min": 1991 }, { "epoch": 2.605177993527508, "grad_norm": 0.5880468064461831, "learning_rate": 3.1649690594255265e-05, "loss": 0.2017, "loss_nan_ranks": 0, "loss_rank_avg": 0.19900715351104736, "step": 1610, "valid_targets_mean": 3396.1, "valid_targets_min": 572 }, { "epoch": 2.6132686084142396, "grad_norm": 0.5697903771803728, "learning_rate": 3.1584000826217974e-05, "loss": 0.1984, "loss_nan_ranks": 0, "loss_rank_avg": 0.18581387400627136, "step": 1615, "valid_targets_mean": 3602.9, "valid_targets_min": 1060 }, { "epoch": 2.6213592233009706, "grad_norm": 0.6018213495545038, "learning_rate": 3.151812246371802e-05, "loss": 0.1943, "loss_nan_ranks": 0, "loss_rank_avg": 0.18213129043579102, "step": 1620, "valid_targets_mean": 3693.2, "valid_targets_min": 1311 }, { "epoch": 2.6294498381877025, "grad_norm": 0.5772009351308939, "learning_rate": 3.145205657929454e-05, "loss": 0.1989, "loss_nan_ranks": 0, "loss_rank_avg": 0.20195090770721436, "step": 1625, "valid_targets_mean": 3644.8, "valid_targets_min": 480 }, { "epoch": 2.6375404530744335, "grad_norm": 0.5878583193941402, "learning_rate": 3.1385804248539665e-05, "loss": 0.2139, "loss_nan_ranks": 0, "loss_rank_avg": 0.2117636501789093, "step": 1630, "valid_targets_mean": 3500.8, "valid_targets_min": 793 }, { "epoch": 2.645631067961165, "grad_norm": 0.561998252403094, "learning_rate": 3.131936655008097e-05, "loss": 0.2035, "loss_nan_ranks": 0, "loss_rank_avg": 0.21909379959106445, "step": 1635, "valid_targets_mean": 4789.3, "valid_targets_min": 2141 }, { "epoch": 2.6537216828478964, "grad_norm": 0.6250002374027832, "learning_rate": 3.125274456556392e-05, "loss": 0.2083, "loss_nan_ranks": 0, "loss_rank_avg": 0.21586726605892181, "step": 1640, "valid_targets_mean": 3864.6, "valid_targets_min": 441 }, { "epoch": 2.661812297734628, "grad_norm": 0.6877067793902955, "learning_rate": 3.1185939379634274e-05, "loss": 0.2058, "loss_nan_ranks": 0, "loss_rank_avg": 0.2070537805557251, "step": 1645, "valid_targets_mean": 3693.6, "valid_targets_min": 1004 }, { "epoch": 2.6699029126213594, "grad_norm": 0.5200491955654815, "learning_rate": 3.111895207992042e-05, "loss": 0.2095, "loss_nan_ranks": 0, "loss_rank_avg": 0.1959010660648346, "step": 1650, "valid_targets_mean": 4079.2, "valid_targets_min": 465 }, { "epoch": 2.6779935275080904, "grad_norm": 0.5326594070559258, "learning_rate": 3.1051783757015686e-05, "loss": 0.1937, "loss_nan_ranks": 0, "loss_rank_avg": 0.18363815546035767, "step": 1655, "valid_targets_mean": 4011.5, "valid_targets_min": 597 }, { "epoch": 2.686084142394822, "grad_norm": 0.5389554367064366, "learning_rate": 3.098443550446051e-05, "loss": 0.2006, "loss_nan_ranks": 0, "loss_rank_avg": 0.209175705909729, "step": 1660, "valid_targets_mean": 4220.7, "valid_targets_min": 2153 }, { "epoch": 2.6941747572815533, "grad_norm": 0.5459696709484382, "learning_rate": 3.0916908418724765e-05, "loss": 0.1971, "loss_nan_ranks": 0, "loss_rank_avg": 0.18107455968856812, "step": 1665, "valid_targets_mean": 3520.8, "valid_targets_min": 974 }, { "epoch": 2.7022653721682848, "grad_norm": 0.5798237314369729, "learning_rate": 3.0849203599189776e-05, "loss": 0.2044, "loss_nan_ranks": 0, "loss_rank_avg": 0.20543158054351807, "step": 1670, "valid_targets_mean": 3632.6, "valid_targets_min": 703 }, { "epoch": 2.7103559870550162, "grad_norm": 0.5316270837678921, "learning_rate": 3.0781322148130514e-05, "loss": 0.2248, "loss_nan_ranks": 0, "loss_rank_avg": 0.20163953304290771, "step": 1675, "valid_targets_mean": 3576.5, "valid_targets_min": 815 }, { "epoch": 2.7184466019417477, "grad_norm": 0.4904568873109919, "learning_rate": 3.071326517069761e-05, "loss": 0.2015, "loss_nan_ranks": 0, "loss_rank_avg": 0.1812264323234558, "step": 1680, "valid_targets_mean": 4223.2, "valid_targets_min": 2104 }, { "epoch": 2.726537216828479, "grad_norm": 0.5354083648536498, "learning_rate": 3.064503377489936e-05, "loss": 0.2016, "loss_nan_ranks": 0, "loss_rank_avg": 0.20075714588165283, "step": 1685, "valid_targets_mean": 3889.9, "valid_targets_min": 1032 }, { "epoch": 2.73462783171521, "grad_norm": 0.5820578665530104, "learning_rate": 3.0576629071583704e-05, "loss": 0.1991, "loss_nan_ranks": 0, "loss_rank_avg": 0.22076207399368286, "step": 1690, "valid_targets_mean": 3753.3, "valid_targets_min": 1575 }, { "epoch": 2.7427184466019416, "grad_norm": 0.60823767625081, "learning_rate": 3.0508052174420132e-05, "loss": 0.1976, "loss_nan_ranks": 0, "loss_rank_avg": 0.21139661967754364, "step": 1695, "valid_targets_mean": 3182.8, "valid_targets_min": 418 }, { "epoch": 2.750809061488673, "grad_norm": 0.5396414265678104, "learning_rate": 3.0439304199881543e-05, "loss": 0.1957, "loss_nan_ranks": 0, "loss_rank_avg": 0.19884394109249115, "step": 1700, "valid_targets_mean": 3960.8, "valid_targets_min": 444 }, { "epoch": 2.7588996763754046, "grad_norm": 0.6318198192740533, "learning_rate": 3.03703862672261e-05, "loss": 0.1971, "loss_nan_ranks": 0, "loss_rank_avg": 0.2142893671989441, "step": 1705, "valid_targets_mean": 3710.0, "valid_targets_min": 958 }, { "epoch": 2.766990291262136, "grad_norm": 0.5118804639309135, "learning_rate": 3.030129949847895e-05, "loss": 0.2, "loss_nan_ranks": 0, "loss_rank_avg": 0.19666945934295654, "step": 1710, "valid_targets_mean": 4017.2, "valid_targets_min": 1524 }, { "epoch": 2.775080906148867, "grad_norm": 0.5233752971594281, "learning_rate": 3.023204501841403e-05, "loss": 0.2028, "loss_nan_ranks": 0, "loss_rank_avg": 0.1879742294549942, "step": 1715, "valid_targets_mean": 3730.5, "valid_targets_min": 411 }, { "epoch": 2.783171521035599, "grad_norm": 0.5545239643662999, "learning_rate": 3.01626239545357e-05, "loss": 0.2032, "loss_nan_ranks": 0, "loss_rank_avg": 0.21372893452644348, "step": 1720, "valid_targets_mean": 3842.9, "valid_targets_min": 615 }, { "epoch": 2.79126213592233, "grad_norm": 0.5296179785533861, "learning_rate": 3.00930374370604e-05, "loss": 0.198, "loss_nan_ranks": 0, "loss_rank_avg": 0.17748533189296722, "step": 1725, "valid_targets_mean": 3760.2, "valid_targets_min": 1638 }, { "epoch": 2.7993527508090614, "grad_norm": 0.5915432116224574, "learning_rate": 3.002328659889826e-05, "loss": 0.1891, "loss_nan_ranks": 0, "loss_rank_avg": 0.1959744095802307, "step": 1730, "valid_targets_mean": 3509.1, "valid_targets_min": 1201 }, { "epoch": 2.807443365695793, "grad_norm": 0.5095307798896164, "learning_rate": 2.995337257563466e-05, "loss": 0.1905, "loss_nan_ranks": 0, "loss_rank_avg": 0.18040308356285095, "step": 1735, "valid_targets_mean": 4305.2, "valid_targets_min": 3091 }, { "epoch": 2.8155339805825244, "grad_norm": 0.6272482204481657, "learning_rate": 2.9883296505511704e-05, "loss": 0.1931, "loss_nan_ranks": 0, "loss_rank_avg": 0.19337265193462372, "step": 1740, "valid_targets_mean": 3533.1, "valid_targets_min": 534 }, { "epoch": 2.823624595469256, "grad_norm": 0.5315105215288927, "learning_rate": 2.981305952940973e-05, "loss": 0.1996, "loss_nan_ranks": 0, "loss_rank_avg": 0.18375645577907562, "step": 1745, "valid_targets_mean": 4295.6, "valid_targets_min": 2906 }, { "epoch": 2.831715210355987, "grad_norm": 0.5351373135111939, "learning_rate": 2.9742662790828732e-05, "loss": 0.1961, "loss_nan_ranks": 0, "loss_rank_avg": 0.18155202269554138, "step": 1750, "valid_targets_mean": 3872.8, "valid_targets_min": 718 }, { "epoch": 2.8398058252427183, "grad_norm": 0.5882867567839128, "learning_rate": 2.9672107435869727e-05, "loss": 0.196, "loss_nan_ranks": 0, "loss_rank_avg": 0.20388536155223846, "step": 1755, "valid_targets_mean": 3398.5, "valid_targets_min": 397 }, { "epoch": 2.8478964401294498, "grad_norm": 0.5166204472764317, "learning_rate": 2.9601394613216086e-05, "loss": 0.1972, "loss_nan_ranks": 0, "loss_rank_avg": 0.1891598403453827, "step": 1760, "valid_targets_mean": 3952.1, "valid_targets_min": 471 }, { "epoch": 2.855987055016181, "grad_norm": 0.495203793195684, "learning_rate": 2.953052547411487e-05, "loss": 0.1983, "loss_nan_ranks": 0, "loss_rank_avg": 0.19284304976463318, "step": 1765, "valid_targets_mean": 4468.9, "valid_targets_min": 3669 }, { "epoch": 2.8640776699029127, "grad_norm": 0.5707255444123573, "learning_rate": 2.9459501172358046e-05, "loss": 0.1986, "loss_nan_ranks": 0, "loss_rank_avg": 0.19373999536037445, "step": 1770, "valid_targets_mean": 4088.8, "valid_targets_min": 1916 }, { "epoch": 2.872168284789644, "grad_norm": 0.603965037928362, "learning_rate": 2.9388322864263747e-05, "loss": 0.2012, "loss_nan_ranks": 0, "loss_rank_avg": 0.2008977234363556, "step": 1775, "valid_targets_mean": 3390.8, "valid_targets_min": 397 }, { "epoch": 2.8802588996763756, "grad_norm": 0.6153412854635089, "learning_rate": 2.9316991708657382e-05, "loss": 0.1937, "loss_nan_ranks": 0, "loss_rank_avg": 0.19763140380382538, "step": 1780, "valid_targets_mean": 3698.1, "valid_targets_min": 442 }, { "epoch": 2.8883495145631066, "grad_norm": 0.5740792099777532, "learning_rate": 2.924550886685285e-05, "loss": 0.1971, "loss_nan_ranks": 0, "loss_rank_avg": 0.21043045818805695, "step": 1785, "valid_targets_mean": 3918.6, "valid_targets_min": 451 }, { "epoch": 2.896440129449838, "grad_norm": 0.5205108968750519, "learning_rate": 2.917387550263357e-05, "loss": 0.1984, "loss_nan_ranks": 0, "loss_rank_avg": 0.19361340999603271, "step": 1790, "valid_targets_mean": 4294.6, "valid_targets_min": 1695 }, { "epoch": 2.9045307443365695, "grad_norm": 0.5515212654195533, "learning_rate": 2.9102092782233563e-05, "loss": 0.197, "loss_nan_ranks": 0, "loss_rank_avg": 0.19037625193595886, "step": 1795, "valid_targets_mean": 3688.1, "valid_targets_min": 672 }, { "epoch": 2.912621359223301, "grad_norm": 0.5966136509189564, "learning_rate": 2.9030161874318455e-05, "loss": 0.202, "loss_nan_ranks": 0, "loss_rank_avg": 0.21651627123355865, "step": 1800, "valid_targets_mean": 3206.2, "valid_targets_min": 463 }, { "epoch": 2.9207119741100325, "grad_norm": 0.6501703618729953, "learning_rate": 2.895808394996644e-05, "loss": 0.2087, "loss_nan_ranks": 0, "loss_rank_avg": 0.20761127769947052, "step": 1805, "valid_targets_mean": 3975.1, "valid_targets_min": 721 }, { "epoch": 2.9288025889967635, "grad_norm": 0.5679104463871691, "learning_rate": 2.8885860182649263e-05, "loss": 0.2075, "loss_nan_ranks": 0, "loss_rank_avg": 0.19638538360595703, "step": 1810, "valid_targets_mean": 3561.3, "valid_targets_min": 478 }, { "epoch": 2.9368932038834954, "grad_norm": 0.6224037383738494, "learning_rate": 2.881349174821305e-05, "loss": 0.199, "loss_nan_ranks": 0, "loss_rank_avg": 0.22906172275543213, "step": 1815, "valid_targets_mean": 3815.6, "valid_targets_min": 269 }, { "epoch": 2.9449838187702264, "grad_norm": 0.5687126118661141, "learning_rate": 2.8740979824859194e-05, "loss": 0.1914, "loss_nan_ranks": 0, "loss_rank_avg": 0.18152084946632385, "step": 1820, "valid_targets_mean": 3180.0, "valid_targets_min": 445 }, { "epoch": 2.953074433656958, "grad_norm": 0.5633436924003058, "learning_rate": 2.8668325593125192e-05, "loss": 0.1853, "loss_nan_ranks": 0, "loss_rank_avg": 0.19939512014389038, "step": 1825, "valid_targets_mean": 3791.1, "valid_targets_min": 599 }, { "epoch": 2.9611650485436893, "grad_norm": 0.5634935052804328, "learning_rate": 2.8595530235865397e-05, "loss": 0.2043, "loss_nan_ranks": 0, "loss_rank_avg": 0.20533940196037292, "step": 1830, "valid_targets_mean": 3936.6, "valid_targets_min": 775 }, { "epoch": 2.969255663430421, "grad_norm": 0.5169570794160626, "learning_rate": 2.8522594938231755e-05, "loss": 0.1933, "loss_nan_ranks": 0, "loss_rank_avg": 0.1793152093887329, "step": 1835, "valid_targets_mean": 4222.0, "valid_targets_min": 2249 }, { "epoch": 2.9773462783171523, "grad_norm": 0.5914192243747182, "learning_rate": 2.8449520887654558e-05, "loss": 0.2152, "loss_nan_ranks": 0, "loss_rank_avg": 0.23565539717674255, "step": 1840, "valid_targets_mean": 3811.9, "valid_targets_min": 606 }, { "epoch": 2.9854368932038833, "grad_norm": 0.5042664015367552, "learning_rate": 2.8376309273823047e-05, "loss": 0.2021, "loss_nan_ranks": 0, "loss_rank_avg": 0.2007623314857483, "step": 1845, "valid_targets_mean": 4263.4, "valid_targets_min": 2313 }, { "epoch": 2.9935275080906147, "grad_norm": 0.5391052395522601, "learning_rate": 2.8302961288666094e-05, "loss": 0.1948, "loss_nan_ranks": 0, "loss_rank_avg": 0.1861807405948639, "step": 1850, "valid_targets_mean": 4023.2, "valid_targets_min": 1822 }, { "epoch": 3.001618122977346, "grad_norm": 0.5919409123484987, "learning_rate": 2.8229478126332766e-05, "loss": 0.1958, "loss_nan_ranks": 0, "loss_rank_avg": 0.1760110855102539, "step": 1855, "valid_targets_mean": 4402.6, "valid_targets_min": 2340 }, { "epoch": 3.0097087378640777, "grad_norm": 0.6049776201529414, "learning_rate": 2.815586098317291e-05, "loss": 0.1743, "loss_nan_ranks": 0, "loss_rank_avg": 0.18497231602668762, "step": 1860, "valid_targets_mean": 4040.8, "valid_targets_min": 752 }, { "epoch": 3.017799352750809, "grad_norm": 0.5632642899702008, "learning_rate": 2.8082111057717655e-05, "loss": 0.177, "loss_nan_ranks": 0, "loss_rank_avg": 0.16407430171966553, "step": 1865, "valid_targets_mean": 3755.1, "valid_targets_min": 2032 }, { "epoch": 3.0258899676375406, "grad_norm": 0.5813140896256607, "learning_rate": 2.8008229550659883e-05, "loss": 0.1786, "loss_nan_ranks": 0, "loss_rank_avg": 0.17744824290275574, "step": 1870, "valid_targets_mean": 3664.5, "valid_targets_min": 1030 }, { "epoch": 3.033980582524272, "grad_norm": 0.5670865086302852, "learning_rate": 2.793421766483474e-05, "loss": 0.1674, "loss_nan_ranks": 0, "loss_rank_avg": 0.155634805560112, "step": 1875, "valid_targets_mean": 3756.2, "valid_targets_min": 2223 }, { "epoch": 3.042071197411003, "grad_norm": 0.5823101361167331, "learning_rate": 2.7860076605199995e-05, "loss": 0.1658, "loss_nan_ranks": 0, "loss_rank_avg": 0.16646599769592285, "step": 1880, "valid_targets_mean": 3607.3, "valid_targets_min": 1695 }, { "epoch": 3.0501618122977345, "grad_norm": 0.8908406522912229, "learning_rate": 2.7785807578816448e-05, "loss": 0.1706, "loss_nan_ranks": 0, "loss_rank_avg": 0.17764373123645782, "step": 1885, "valid_targets_mean": 3329.0, "valid_targets_min": 269 }, { "epoch": 3.058252427184466, "grad_norm": 0.66787286744631, "learning_rate": 2.7711411794828274e-05, "loss": 0.1854, "loss_nan_ranks": 0, "loss_rank_avg": 0.17671708762645721, "step": 1890, "valid_targets_mean": 3682.6, "valid_targets_min": 786 }, { "epoch": 3.0663430420711975, "grad_norm": 1.713966990953561, "learning_rate": 2.7636890464443333e-05, "loss": 0.1764, "loss_nan_ranks": 0, "loss_rank_avg": 0.1910078227519989, "step": 1895, "valid_targets_mean": 3873.7, "valid_targets_min": 2165 }, { "epoch": 3.074433656957929, "grad_norm": 0.5994989410802046, "learning_rate": 2.756224480091347e-05, "loss": 0.1782, "loss_nan_ranks": 0, "loss_rank_avg": 0.17505040764808655, "step": 1900, "valid_targets_mean": 3232.8, "valid_targets_min": 481 }, { "epoch": 3.0825242718446604, "grad_norm": 0.5795213439206806, "learning_rate": 2.7487476019514726e-05, "loss": 0.1725, "loss_nan_ranks": 0, "loss_rank_avg": 0.17841529846191406, "step": 1905, "valid_targets_mean": 3820.4, "valid_targets_min": 634 }, { "epoch": 3.0906148867313914, "grad_norm": 0.630803442604153, "learning_rate": 2.74125853375276e-05, "loss": 0.1664, "loss_nan_ranks": 0, "loss_rank_avg": 0.1717372089624405, "step": 1910, "valid_targets_mean": 3442.6, "valid_targets_min": 488 }, { "epoch": 3.098705501618123, "grad_norm": 0.5607447512719843, "learning_rate": 2.7337573974217177e-05, "loss": 0.1682, "loss_nan_ranks": 0, "loss_rank_avg": 0.18259483575820923, "step": 1915, "valid_targets_mean": 4125.4, "valid_targets_min": 2164 }, { "epoch": 3.1067961165048543, "grad_norm": 0.5173894268282134, "learning_rate": 2.726244315081334e-05, "loss": 0.1783, "loss_nan_ranks": 0, "loss_rank_avg": 0.1611001193523407, "step": 1920, "valid_targets_mean": 3982.5, "valid_targets_min": 605 }, { "epoch": 3.114886731391586, "grad_norm": 0.5917839297779477, "learning_rate": 2.718719409049082e-05, "loss": 0.1731, "loss_nan_ranks": 0, "loss_rank_avg": 0.15416556596755981, "step": 1925, "valid_targets_mean": 4123.0, "valid_targets_min": 2318 }, { "epoch": 3.1229773462783172, "grad_norm": 0.5712043686830873, "learning_rate": 2.711182801834933e-05, "loss": 0.1707, "loss_nan_ranks": 0, "loss_rank_avg": 0.15566003322601318, "step": 1930, "valid_targets_mean": 3407.0, "valid_targets_min": 499 }, { "epoch": 3.1310679611650487, "grad_norm": 0.5813335365274586, "learning_rate": 2.7036346161393617e-05, "loss": 0.1831, "loss_nan_ranks": 0, "loss_rank_avg": 0.19251751899719238, "step": 1935, "valid_targets_mean": 3737.6, "valid_targets_min": 1389 }, { "epoch": 3.1391585760517797, "grad_norm": 0.7481785553939617, "learning_rate": 2.696074974851346e-05, "loss": 0.1725, "loss_nan_ranks": 0, "loss_rank_avg": 0.18153071403503418, "step": 1940, "valid_targets_mean": 3754.9, "valid_targets_min": 1889 }, { "epoch": 3.147249190938511, "grad_norm": 0.6364983099115371, "learning_rate": 2.688504001046367e-05, "loss": 0.1776, "loss_nan_ranks": 0, "loss_rank_avg": 0.17164380848407745, "step": 1945, "valid_targets_mean": 3317.8, "valid_targets_min": 1357 }, { "epoch": 3.1553398058252426, "grad_norm": 0.5736813602974871, "learning_rate": 2.6809218179844085e-05, "loss": 0.1702, "loss_nan_ranks": 0, "loss_rank_avg": 0.17162342369556427, "step": 1950, "valid_targets_mean": 3369.4, "valid_targets_min": 397 }, { "epoch": 3.163430420711974, "grad_norm": 0.6226569121757463, "learning_rate": 2.6733285491079453e-05, "loss": 0.1771, "loss_nan_ranks": 0, "loss_rank_avg": 0.19535747170448303, "step": 1955, "valid_targets_mean": 4032.9, "valid_targets_min": 1219 }, { "epoch": 3.1715210355987056, "grad_norm": 0.6020916586272426, "learning_rate": 2.6657243180399373e-05, "loss": 0.1849, "loss_nan_ranks": 0, "loss_rank_avg": 0.19260089099407196, "step": 1960, "valid_targets_mean": 3971.1, "valid_targets_min": 507 }, { "epoch": 3.179611650485437, "grad_norm": 0.5228726712361733, "learning_rate": 2.658109248581814e-05, "loss": 0.1806, "loss_nan_ranks": 0, "loss_rank_avg": 0.16513675451278687, "step": 1965, "valid_targets_mean": 4421.4, "valid_targets_min": 2181 }, { "epoch": 3.1877022653721685, "grad_norm": 0.6756728849384417, "learning_rate": 2.650483464711462e-05, "loss": 0.1649, "loss_nan_ranks": 0, "loss_rank_avg": 0.19772417843341827, "step": 1970, "valid_targets_mean": 3761.0, "valid_targets_min": 834 }, { "epoch": 3.1957928802588995, "grad_norm": 0.5713446845470945, "learning_rate": 2.6428470905812047e-05, "loss": 0.1676, "loss_nan_ranks": 0, "loss_rank_avg": 0.17231231927871704, "step": 1975, "valid_targets_mean": 3961.8, "valid_targets_min": 391 }, { "epoch": 3.203883495145631, "grad_norm": 0.5742649893192334, "learning_rate": 2.6352002505157802e-05, "loss": 0.1703, "loss_nan_ranks": 0, "loss_rank_avg": 0.17857617139816284, "step": 1980, "valid_targets_mean": 3959.9, "valid_targets_min": 456 }, { "epoch": 3.2119741100323624, "grad_norm": 0.5570549296210755, "learning_rate": 2.6275430690103188e-05, "loss": 0.1716, "loss_nan_ranks": 0, "loss_rank_avg": 0.16560588777065277, "step": 1985, "valid_targets_mean": 3895.8, "valid_targets_min": 462 }, { "epoch": 3.220064724919094, "grad_norm": 0.6784253073209046, "learning_rate": 2.6198756707283153e-05, "loss": 0.1747, "loss_nan_ranks": 0, "loss_rank_avg": 0.20054873824119568, "step": 1990, "valid_targets_mean": 3521.2, "valid_targets_min": 984 }, { "epoch": 3.2281553398058254, "grad_norm": 0.5829948937510232, "learning_rate": 2.612198180499601e-05, "loss": 0.1735, "loss_nan_ranks": 0, "loss_rank_avg": 0.1702016144990921, "step": 1995, "valid_targets_mean": 4062.2, "valid_targets_min": 1310 }, { "epoch": 3.236245954692557, "grad_norm": 0.6454144281714788, "learning_rate": 2.604510723318309e-05, "loss": 0.1774, "loss_nan_ranks": 0, "loss_rank_avg": 0.19506880640983582, "step": 2000, "valid_targets_mean": 3623.4, "valid_targets_min": 289 }, { "epoch": 3.244336569579288, "grad_norm": 0.6449676332877781, "learning_rate": 2.5968134243408405e-05, "loss": 0.1741, "loss_nan_ranks": 0, "loss_rank_avg": 0.17631593346595764, "step": 2005, "valid_targets_mean": 3297.8, "valid_targets_min": 444 }, { "epoch": 3.2524271844660193, "grad_norm": 0.5997971315950034, "learning_rate": 2.5891064088838278e-05, "loss": 0.1792, "loss_nan_ranks": 0, "loss_rank_avg": 0.17917688190937042, "step": 2010, "valid_targets_mean": 3738.5, "valid_targets_min": 1014 }, { "epoch": 3.2605177993527508, "grad_norm": 0.5492504542337715, "learning_rate": 2.5813898024220912e-05, "loss": 0.1652, "loss_nan_ranks": 0, "loss_rank_avg": 0.1532193124294281, "step": 2015, "valid_targets_mean": 4056.2, "valid_targets_min": 1876 }, { "epoch": 3.2686084142394822, "grad_norm": 0.6096358205706522, "learning_rate": 2.573663730586601e-05, "loss": 0.1797, "loss_nan_ranks": 0, "loss_rank_avg": 0.17237809300422668, "step": 2020, "valid_targets_mean": 3330.9, "valid_targets_min": 495 }, { "epoch": 3.2766990291262137, "grad_norm": 0.5783520220955675, "learning_rate": 2.5659283191624277e-05, "loss": 0.182, "loss_nan_ranks": 0, "loss_rank_avg": 0.1740003228187561, "step": 2025, "valid_targets_mean": 4061.6, "valid_targets_min": 1840 }, { "epoch": 3.284789644012945, "grad_norm": 0.6089773249005341, "learning_rate": 2.5581836940866967e-05, "loss": 0.1744, "loss_nan_ranks": 0, "loss_rank_avg": 0.15423806011676788, "step": 2030, "valid_targets_mean": 3516.4, "valid_targets_min": 706 }, { "epoch": 3.292880258899676, "grad_norm": 0.6155420560621121, "learning_rate": 2.550429981446537e-05, "loss": 0.1678, "loss_nan_ranks": 0, "loss_rank_avg": 0.1603637933731079, "step": 2035, "valid_targets_mean": 3189.5, "valid_targets_min": 731 }, { "epoch": 3.3009708737864076, "grad_norm": 0.5640533692970745, "learning_rate": 2.542667307477027e-05, "loss": 0.1696, "loss_nan_ranks": 0, "loss_rank_avg": 0.16283290088176727, "step": 2040, "valid_targets_mean": 3909.0, "valid_targets_min": 1231 }, { "epoch": 3.309061488673139, "grad_norm": 0.705469954007443, "learning_rate": 2.534895798559144e-05, "loss": 0.1643, "loss_nan_ranks": 0, "loss_rank_avg": 0.1684490144252777, "step": 2045, "valid_targets_mean": 2735.7, "valid_targets_min": 463 }, { "epoch": 3.3171521035598706, "grad_norm": 0.5321890260336842, "learning_rate": 2.527115581217702e-05, "loss": 0.1682, "loss_nan_ranks": 0, "loss_rank_avg": 0.15115907788276672, "step": 2050, "valid_targets_mean": 3915.1, "valid_targets_min": 1589 }, { "epoch": 3.325242718446602, "grad_norm": 0.6319090887888136, "learning_rate": 2.5193267821192914e-05, "loss": 0.174, "loss_nan_ranks": 0, "loss_rank_avg": 0.1694541871547699, "step": 2055, "valid_targets_mean": 3444.1, "valid_targets_min": 313 }, { "epoch": 3.3333333333333335, "grad_norm": 0.6041257377819086, "learning_rate": 2.5115295280702222e-05, "loss": 0.1759, "loss_nan_ranks": 0, "loss_rank_avg": 0.177719846367836, "step": 2060, "valid_targets_mean": 3456.6, "valid_targets_min": 1040 }, { "epoch": 3.341423948220065, "grad_norm": 0.6358966333325975, "learning_rate": 2.5037239460144534e-05, "loss": 0.1806, "loss_nan_ranks": 0, "loss_rank_avg": 0.17559629678726196, "step": 2065, "valid_targets_mean": 3449.5, "valid_targets_min": 718 }, { "epoch": 3.349514563106796, "grad_norm": 0.5906966992314931, "learning_rate": 2.4959101630315315e-05, "loss": 0.1741, "loss_nan_ranks": 0, "loss_rank_avg": 0.19974157214164734, "step": 2070, "valid_targets_mean": 4124.6, "valid_targets_min": 377 }, { "epoch": 3.3576051779935274, "grad_norm": 0.5645320929874551, "learning_rate": 2.4880883063345157e-05, "loss": 0.1658, "loss_nan_ranks": 0, "loss_rank_avg": 0.15666401386260986, "step": 2075, "valid_targets_mean": 3943.2, "valid_targets_min": 2646 }, { "epoch": 3.365695792880259, "grad_norm": 0.640752643762248, "learning_rate": 2.480258503267912e-05, "loss": 0.1774, "loss_nan_ranks": 0, "loss_rank_avg": 0.16370724141597748, "step": 2080, "valid_targets_mean": 3595.3, "valid_targets_min": 473 }, { "epoch": 3.3737864077669903, "grad_norm": 0.6051795750412866, "learning_rate": 2.472420881305599e-05, "loss": 0.1652, "loss_nan_ranks": 0, "loss_rank_avg": 0.16652750968933105, "step": 2085, "valid_targets_mean": 3438.4, "valid_targets_min": 249 }, { "epoch": 3.381877022653722, "grad_norm": 0.56914949365543, "learning_rate": 2.4645755680487497e-05, "loss": 0.1648, "loss_nan_ranks": 0, "loss_rank_avg": 0.15044154226779938, "step": 2090, "valid_targets_mean": 3443.5, "valid_targets_min": 803 }, { "epoch": 3.389967637540453, "grad_norm": 0.6078709562725402, "learning_rate": 2.4567226912237566e-05, "loss": 0.1681, "loss_nan_ranks": 0, "loss_rank_avg": 0.18583205342292786, "step": 2095, "valid_targets_mean": 3916.0, "valid_targets_min": 2345 }, { "epoch": 3.3980582524271843, "grad_norm": 0.632101264354982, "learning_rate": 2.4488623786801523e-05, "loss": 0.1836, "loss_nan_ranks": 0, "loss_rank_avg": 0.18830320239067078, "step": 2100, "valid_targets_mean": 3117.6, "valid_targets_min": 386 }, { "epoch": 3.4061488673139158, "grad_norm": 0.5952149912286673, "learning_rate": 2.4409947583885272e-05, "loss": 0.172, "loss_nan_ranks": 0, "loss_rank_avg": 0.15162335336208344, "step": 2105, "valid_targets_mean": 3879.4, "valid_targets_min": 1340 }, { "epoch": 3.414239482200647, "grad_norm": 0.5796451186001909, "learning_rate": 2.4331199584384448e-05, "loss": 0.1742, "loss_nan_ranks": 0, "loss_rank_avg": 0.17198210954666138, "step": 2110, "valid_targets_mean": 4103.7, "valid_targets_min": 579 }, { "epoch": 3.4223300970873787, "grad_norm": 0.5465540090675008, "learning_rate": 2.425238107036359e-05, "loss": 0.1789, "loss_nan_ranks": 0, "loss_rank_avg": 0.14355331659317017, "step": 2115, "valid_targets_mean": 4076.2, "valid_targets_min": 2289 }, { "epoch": 3.43042071197411, "grad_norm": 0.594717506650347, "learning_rate": 2.4173493325035255e-05, "loss": 0.1724, "loss_nan_ranks": 0, "loss_rank_avg": 0.18043139576911926, "step": 2120, "valid_targets_mean": 3892.8, "valid_targets_min": 443 }, { "epoch": 3.4385113268608416, "grad_norm": 0.5419410813351541, "learning_rate": 2.4094537632739126e-05, "loss": 0.1745, "loss_nan_ranks": 0, "loss_rank_avg": 0.16672024130821228, "step": 2125, "valid_targets_mean": 4480.9, "valid_targets_min": 462 }, { "epoch": 3.4466019417475726, "grad_norm": 0.6037829229049166, "learning_rate": 2.40155152789211e-05, "loss": 0.1724, "loss_nan_ranks": 0, "loss_rank_avg": 0.17883463203907013, "step": 2130, "valid_targets_mean": 3816.6, "valid_targets_min": 1345 }, { "epoch": 3.454692556634304, "grad_norm": 0.5647817759923721, "learning_rate": 2.3936427550112375e-05, "loss": 0.1779, "loss_nan_ranks": 0, "loss_rank_avg": 0.17558303475379944, "step": 2135, "valid_targets_mean": 3933.2, "valid_targets_min": 1142 }, { "epoch": 3.4627831715210355, "grad_norm": 0.6313512858911249, "learning_rate": 2.3857275733908476e-05, "loss": 0.1714, "loss_nan_ranks": 0, "loss_rank_avg": 0.17078541219234467, "step": 2140, "valid_targets_mean": 3346.6, "valid_targets_min": 494 }, { "epoch": 3.470873786407767, "grad_norm": 0.5891762304651471, "learning_rate": 2.377806111894832e-05, "loss": 0.1662, "loss_nan_ranks": 0, "loss_rank_avg": 0.15590104460716248, "step": 2145, "valid_targets_mean": 3573.3, "valid_targets_min": 966 }, { "epoch": 3.4789644012944985, "grad_norm": 0.6482887954040247, "learning_rate": 2.3698784994893214e-05, "loss": 0.1687, "loss_nan_ranks": 0, "loss_rank_avg": 0.16722315549850464, "step": 2150, "valid_targets_mean": 3687.2, "valid_targets_min": 473 }, { "epoch": 3.48705501618123, "grad_norm": 0.6128863861838072, "learning_rate": 2.3619448652405885e-05, "loss": 0.1665, "loss_nan_ranks": 0, "loss_rank_avg": 0.15946364402770996, "step": 2155, "valid_targets_mean": 3502.8, "valid_targets_min": 421 }, { "epoch": 3.4951456310679614, "grad_norm": 0.5765896527856256, "learning_rate": 2.3540053383129458e-05, "loss": 0.1754, "loss_nan_ranks": 0, "loss_rank_avg": 0.188400000333786, "step": 2160, "valid_targets_mean": 3874.4, "valid_targets_min": 547 }, { "epoch": 3.5032362459546924, "grad_norm": 0.5859054394697829, "learning_rate": 2.346060047966638e-05, "loss": 0.1655, "loss_nan_ranks": 0, "loss_rank_avg": 0.1690550446510315, "step": 2165, "valid_targets_mean": 4166.0, "valid_targets_min": 1667 }, { "epoch": 3.511326860841424, "grad_norm": 0.7036463701667274, "learning_rate": 2.3381091235557475e-05, "loss": 0.1742, "loss_nan_ranks": 0, "loss_rank_avg": 0.1957768201828003, "step": 2170, "valid_targets_mean": 3727.4, "valid_targets_min": 1747 }, { "epoch": 3.5194174757281553, "grad_norm": 0.5916107265381505, "learning_rate": 2.330152694526077e-05, "loss": 0.1739, "loss_nan_ranks": 0, "loss_rank_avg": 0.1751423478126526, "step": 2175, "valid_targets_mean": 3770.8, "valid_targets_min": 1953 }, { "epoch": 3.527508090614887, "grad_norm": 0.593608794686705, "learning_rate": 2.322190890413053e-05, "loss": 0.1869, "loss_nan_ranks": 0, "loss_rank_avg": 0.18094240128993988, "step": 2180, "valid_targets_mean": 4127.8, "valid_targets_min": 2488 }, { "epoch": 3.5355987055016183, "grad_norm": 0.5654915385772826, "learning_rate": 2.3142238408396076e-05, "loss": 0.1762, "loss_nan_ranks": 0, "loss_rank_avg": 0.14299830794334412, "step": 2185, "valid_targets_mean": 3797.2, "valid_targets_min": 1422 }, { "epoch": 3.5436893203883493, "grad_norm": 0.6289935817923777, "learning_rate": 2.3062516755140733e-05, "loss": 0.1793, "loss_nan_ranks": 0, "loss_rank_avg": 0.17214451730251312, "step": 2190, "valid_targets_mean": 3183.4, "valid_targets_min": 718 }, { "epoch": 3.551779935275081, "grad_norm": 0.597140353068917, "learning_rate": 2.2982745242280716e-05, "loss": 0.1661, "loss_nan_ranks": 0, "loss_rank_avg": 0.16503599286079407, "step": 2195, "valid_targets_mean": 3889.6, "valid_targets_min": 654 }, { "epoch": 3.559870550161812, "grad_norm": 0.5994193806365925, "learning_rate": 2.290292516854396e-05, "loss": 0.17, "loss_nan_ranks": 0, "loss_rank_avg": 0.18332546949386597, "step": 2200, "valid_targets_mean": 3912.4, "valid_targets_min": 683 }, { "epoch": 3.5679611650485437, "grad_norm": 0.6642282116127255, "learning_rate": 2.2823057833449013e-05, "loss": 0.1663, "loss_nan_ranks": 0, "loss_rank_avg": 0.18105272948741913, "step": 2205, "valid_targets_mean": 3320.1, "valid_targets_min": 523 }, { "epoch": 3.576051779935275, "grad_norm": 0.6015323897456493, "learning_rate": 2.274314453728386e-05, "loss": 0.1742, "loss_nan_ranks": 0, "loss_rank_avg": 0.1692677140235901, "step": 2210, "valid_targets_mean": 3614.8, "valid_targets_min": 374 }, { "epoch": 3.5841423948220066, "grad_norm": 0.6537271526172133, "learning_rate": 2.2663186581084777e-05, "loss": 0.1739, "loss_nan_ranks": 0, "loss_rank_avg": 0.20455987751483917, "step": 2215, "valid_targets_mean": 3651.8, "valid_targets_min": 842 }, { "epoch": 3.592233009708738, "grad_norm": 0.6232084648287293, "learning_rate": 2.258318526661511e-05, "loss": 0.1807, "loss_nan_ranks": 0, "loss_rank_avg": 0.16232970356941223, "step": 2220, "valid_targets_mean": 3327.6, "valid_targets_min": 749 }, { "epoch": 3.600323624595469, "grad_norm": 0.6296326256388624, "learning_rate": 2.250314189634412e-05, "loss": 0.1699, "loss_nan_ranks": 0, "loss_rank_avg": 0.19072610139846802, "step": 2225, "valid_targets_mean": 4073.9, "valid_targets_min": 2199 }, { "epoch": 3.6084142394822005, "grad_norm": 0.6449233967179974, "learning_rate": 2.2423057773425745e-05, "loss": 0.1746, "loss_nan_ranks": 0, "loss_rank_avg": 0.1651957631111145, "step": 2230, "valid_targets_mean": 3022.1, "valid_targets_min": 434 }, { "epoch": 3.616504854368932, "grad_norm": 0.6559395560780564, "learning_rate": 2.2342934201677422e-05, "loss": 0.1675, "loss_nan_ranks": 0, "loss_rank_avg": 0.17878469824790955, "step": 2235, "valid_targets_mean": 3622.1, "valid_targets_min": 516 }, { "epoch": 3.6245954692556634, "grad_norm": 0.6173129941768686, "learning_rate": 2.2262772485558814e-05, "loss": 0.1695, "loss_nan_ranks": 0, "loss_rank_avg": 0.18011218309402466, "step": 2240, "valid_targets_mean": 3820.5, "valid_targets_min": 1903 }, { "epoch": 3.632686084142395, "grad_norm": 0.5753461959712433, "learning_rate": 2.218257393015062e-05, "loss": 0.1756, "loss_nan_ranks": 0, "loss_rank_avg": 0.1866929829120636, "step": 2245, "valid_targets_mean": 4092.4, "valid_targets_min": 391 }, { "epoch": 3.6407766990291264, "grad_norm": 0.5728173710154111, "learning_rate": 2.2102339841133285e-05, "loss": 0.1708, "loss_nan_ranks": 0, "loss_rank_avg": 0.1651284098625183, "step": 2250, "valid_targets_mean": 3805.8, "valid_targets_min": 1586 }, { "epoch": 3.648867313915858, "grad_norm": 0.5916078253429511, "learning_rate": 2.2022071524765786e-05, "loss": 0.1646, "loss_nan_ranks": 0, "loss_rank_avg": 0.149724543094635, "step": 2255, "valid_targets_mean": 3961.8, "valid_targets_min": 2621 }, { "epoch": 3.656957928802589, "grad_norm": 0.6744997056371559, "learning_rate": 2.1941770287864315e-05, "loss": 0.1804, "loss_nan_ranks": 0, "loss_rank_avg": 0.19032660126686096, "step": 2260, "valid_targets_mean": 3410.2, "valid_targets_min": 453 }, { "epoch": 3.6650485436893203, "grad_norm": 0.6195720257754521, "learning_rate": 2.1861437437781045e-05, "loss": 0.1681, "loss_nan_ranks": 0, "loss_rank_avg": 0.1680455058813095, "step": 2265, "valid_targets_mean": 3784.2, "valid_targets_min": 702 }, { "epoch": 3.6731391585760518, "grad_norm": 0.672887046130233, "learning_rate": 2.1781074282382834e-05, "loss": 0.1716, "loss_nan_ranks": 0, "loss_rank_avg": 0.1819503754377365, "step": 2270, "valid_targets_mean": 3372.5, "valid_targets_min": 790 }, { "epoch": 3.6812297734627832, "grad_norm": 0.6776193321599489, "learning_rate": 2.170068213002992e-05, "loss": 0.1748, "loss_nan_ranks": 0, "loss_rank_avg": 0.18788284063339233, "step": 2275, "valid_targets_mean": 3483.5, "valid_targets_min": 419 }, { "epoch": 3.6893203883495147, "grad_norm": 0.6052000663341688, "learning_rate": 2.1620262289554628e-05, "loss": 0.1683, "loss_nan_ranks": 0, "loss_rank_avg": 0.1812586486339569, "step": 2280, "valid_targets_mean": 3708.8, "valid_targets_min": 1630 }, { "epoch": 3.6974110032362457, "grad_norm": 0.661641976363746, "learning_rate": 2.1539816070240062e-05, "loss": 0.1728, "loss_nan_ranks": 0, "loss_rank_avg": 0.19451472163200378, "step": 2285, "valid_targets_mean": 3528.8, "valid_targets_min": 456 }, { "epoch": 3.705501618122977, "grad_norm": 0.5930807874788253, "learning_rate": 2.1459344781798807e-05, "loss": 0.1716, "loss_nan_ranks": 0, "loss_rank_avg": 0.15635108947753906, "step": 2290, "valid_targets_mean": 4005.1, "valid_targets_min": 402 }, { "epoch": 3.7135922330097086, "grad_norm": 0.6112149905774165, "learning_rate": 2.1378849734351565e-05, "loss": 0.1821, "loss_nan_ranks": 0, "loss_rank_avg": 0.162587970495224, "step": 2295, "valid_targets_mean": 3795.4, "valid_targets_min": 2380 }, { "epoch": 3.72168284789644, "grad_norm": 0.6057359622968203, "learning_rate": 2.1298332238405856e-05, "loss": 0.1693, "loss_nan_ranks": 0, "loss_rank_avg": 0.17883029580116272, "step": 2300, "valid_targets_mean": 4006.3, "valid_targets_min": 1048 }, { "epoch": 3.7297734627831716, "grad_norm": 0.6144431941266508, "learning_rate": 2.1217793604834687e-05, "loss": 0.168, "loss_nan_ranks": 0, "loss_rank_avg": 0.17724230885505676, "step": 2305, "valid_targets_mean": 4024.4, "valid_targets_min": 2274 }, { "epoch": 3.737864077669903, "grad_norm": 0.6057468889256321, "learning_rate": 2.1137235144855177e-05, "loss": 0.1732, "loss_nan_ranks": 0, "loss_rank_avg": 0.15354929864406586, "step": 2310, "valid_targets_mean": 3366.8, "valid_targets_min": 475 }, { "epoch": 3.7459546925566345, "grad_norm": 0.6053175336946324, "learning_rate": 2.1056658170007247e-05, "loss": 0.1656, "loss_nan_ranks": 0, "loss_rank_avg": 0.17170631885528564, "step": 2315, "valid_targets_mean": 3616.9, "valid_targets_min": 428 }, { "epoch": 3.7540453074433655, "grad_norm": 0.6213868430128134, "learning_rate": 2.0976063992132252e-05, "loss": 0.162, "loss_nan_ranks": 0, "loss_rank_avg": 0.1570182740688324, "step": 2320, "valid_targets_mean": 3374.6, "valid_targets_min": 650 }, { "epoch": 3.762135922330097, "grad_norm": 0.7286560834537692, "learning_rate": 2.0895453923351613e-05, "loss": 0.1664, "loss_nan_ranks": 0, "loss_rank_avg": 0.20686554908752441, "step": 2325, "valid_targets_mean": 3858.3, "valid_targets_min": 613 }, { "epoch": 3.7702265372168284, "grad_norm": 0.6560663109735195, "learning_rate": 2.0814829276045465e-05, "loss": 0.1751, "loss_nan_ranks": 0, "loss_rank_avg": 0.18524110317230225, "step": 2330, "valid_targets_mean": 3464.4, "valid_targets_min": 1675 }, { "epoch": 3.77831715210356, "grad_norm": 0.6254622237386656, "learning_rate": 2.0734191362831294e-05, "loss": 0.1636, "loss_nan_ranks": 0, "loss_rank_avg": 0.16618870198726654, "step": 2335, "valid_targets_mean": 3355.0, "valid_targets_min": 460 }, { "epoch": 3.7864077669902914, "grad_norm": 0.5906343788820818, "learning_rate": 2.0653541496542566e-05, "loss": 0.1705, "loss_nan_ranks": 0, "loss_rank_avg": 0.17420311272144318, "step": 2340, "valid_targets_mean": 4128.1, "valid_targets_min": 3301 }, { "epoch": 3.794498381877023, "grad_norm": 0.6495213062678279, "learning_rate": 2.0572880990207343e-05, "loss": 0.1757, "loss_nan_ranks": 0, "loss_rank_avg": 0.1777752935886383, "step": 2345, "valid_targets_mean": 3703.5, "valid_targets_min": 431 }, { "epoch": 3.8025889967637543, "grad_norm": 0.6281322531518733, "learning_rate": 2.049221115702692e-05, "loss": 0.1547, "loss_nan_ranks": 0, "loss_rank_avg": 0.1519239991903305, "step": 2350, "valid_targets_mean": 3610.2, "valid_targets_min": 1169 }, { "epoch": 3.8106796116504853, "grad_norm": 0.6161485822405318, "learning_rate": 2.0411533310354433e-05, "loss": 0.1738, "loss_nan_ranks": 0, "loss_rank_avg": 0.15030154585838318, "step": 2355, "valid_targets_mean": 4126.1, "valid_targets_min": 1810 }, { "epoch": 3.8187702265372168, "grad_norm": 0.5757629774093376, "learning_rate": 2.0330848763673484e-05, "loss": 0.1637, "loss_nan_ranks": 0, "loss_rank_avg": 0.15009431540966034, "step": 2360, "valid_targets_mean": 3805.3, "valid_targets_min": 1449 }, { "epoch": 3.8268608414239482, "grad_norm": 0.5666043552752347, "learning_rate": 2.0250158830576764e-05, "loss": 0.1632, "loss_nan_ranks": 0, "loss_rank_avg": 0.14444783329963684, "step": 2365, "valid_targets_mean": 4227.1, "valid_targets_min": 682 }, { "epoch": 3.8349514563106797, "grad_norm": 0.6061569302969273, "learning_rate": 2.0169464824744636e-05, "loss": 0.1747, "loss_nan_ranks": 0, "loss_rank_avg": 0.1677263081073761, "step": 2370, "valid_targets_mean": 3836.5, "valid_targets_min": 413 }, { "epoch": 3.843042071197411, "grad_norm": 0.6299856336138258, "learning_rate": 2.0088768059923795e-05, "loss": 0.1728, "loss_nan_ranks": 0, "loss_rank_avg": 0.18110263347625732, "step": 2375, "valid_targets_mean": 3476.6, "valid_targets_min": 1588 }, { "epoch": 3.851132686084142, "grad_norm": 0.6644952355917083, "learning_rate": 2.0008069849905847e-05, "loss": 0.1816, "loss_nan_ranks": 0, "loss_rank_avg": 0.18871355056762695, "step": 2380, "valid_targets_mean": 3636.7, "valid_targets_min": 436 }, { "epoch": 3.8592233009708736, "grad_norm": 0.6650438404888883, "learning_rate": 1.9927371508505915e-05, "loss": 0.1747, "loss_nan_ranks": 0, "loss_rank_avg": 0.1898743063211441, "step": 2385, "valid_targets_mean": 3361.4, "valid_targets_min": 601 }, { "epoch": 3.867313915857605, "grad_norm": 0.6480640499016951, "learning_rate": 1.984667434954126e-05, "loss": 0.1782, "loss_nan_ranks": 0, "loss_rank_avg": 0.17341741919517517, "step": 2390, "valid_targets_mean": 3357.9, "valid_targets_min": 432 }, { "epoch": 3.8754045307443366, "grad_norm": 0.6704594696673299, "learning_rate": 1.9765979686809912e-05, "loss": 0.1724, "loss_nan_ranks": 0, "loss_rank_avg": 0.16611242294311523, "step": 2395, "valid_targets_mean": 3253.0, "valid_targets_min": 496 }, { "epoch": 3.883495145631068, "grad_norm": 0.5941524325792283, "learning_rate": 1.968528883406925e-05, "loss": 0.1579, "loss_nan_ranks": 0, "loss_rank_avg": 0.16716042160987854, "step": 2400, "valid_targets_mean": 4301.2, "valid_targets_min": 1379 }, { "epoch": 3.8915857605177995, "grad_norm": 0.6006935814066899, "learning_rate": 1.9604603105014616e-05, "loss": 0.1671, "loss_nan_ranks": 0, "loss_rank_avg": 0.16704756021499634, "step": 2405, "valid_targets_mean": 3946.9, "valid_targets_min": 2249 }, { "epoch": 3.899676375404531, "grad_norm": 0.6642684578913485, "learning_rate": 1.9523923813257957e-05, "loss": 0.167, "loss_nan_ranks": 0, "loss_rank_avg": 0.161843404173851, "step": 2410, "valid_targets_mean": 3472.9, "valid_targets_min": 459 }, { "epoch": 3.907766990291262, "grad_norm": 0.5724065210606161, "learning_rate": 1.9443252272306384e-05, "loss": 0.1581, "loss_nan_ranks": 0, "loss_rank_avg": 0.17966113984584808, "step": 2415, "valid_targets_mean": 4337.2, "valid_targets_min": 1683 }, { "epoch": 3.9158576051779934, "grad_norm": 0.6194183255977415, "learning_rate": 1.9362589795540852e-05, "loss": 0.1741, "loss_nan_ranks": 0, "loss_rank_avg": 0.16092973947525024, "step": 2420, "valid_targets_mean": 3506.6, "valid_targets_min": 770 }, { "epoch": 3.923948220064725, "grad_norm": 0.6219635655220017, "learning_rate": 1.9281937696194723e-05, "loss": 0.1713, "loss_nan_ranks": 0, "loss_rank_avg": 0.17510530352592468, "step": 2425, "valid_targets_mean": 3865.4, "valid_targets_min": 1030 }, { "epoch": 3.9320388349514563, "grad_norm": 0.6231486842433605, "learning_rate": 1.9201297287332428e-05, "loss": 0.1645, "loss_nan_ranks": 0, "loss_rank_avg": 0.16570451855659485, "step": 2430, "valid_targets_mean": 3851.4, "valid_targets_min": 374 }, { "epoch": 3.940129449838188, "grad_norm": 0.7102714071978097, "learning_rate": 1.912066988182806e-05, "loss": 0.1785, "loss_nan_ranks": 0, "loss_rank_avg": 0.1856686770915985, "step": 2435, "valid_targets_mean": 3550.0, "valid_targets_min": 1528 }, { "epoch": 3.948220064724919, "grad_norm": 0.6300878458902386, "learning_rate": 1.9040056792344005e-05, "loss": 0.1713, "loss_nan_ranks": 0, "loss_rank_avg": 0.1716354787349701, "step": 2440, "valid_targets_mean": 3878.1, "valid_targets_min": 1171 }, { "epoch": 3.9563106796116507, "grad_norm": 0.5406998255380289, "learning_rate": 1.8959459331309576e-05, "loss": 0.165, "loss_nan_ranks": 0, "loss_rank_avg": 0.1490856409072876, "step": 2445, "valid_targets_mean": 4219.6, "valid_targets_min": 2389 }, { "epoch": 3.9644012944983817, "grad_norm": 0.6750562788965354, "learning_rate": 1.8878878810899653e-05, "loss": 0.1678, "loss_nan_ranks": 0, "loss_rank_avg": 0.16222772002220154, "step": 2450, "valid_targets_mean": 3240.6, "valid_targets_min": 506 }, { "epoch": 3.972491909385113, "grad_norm": 0.6453126907074695, "learning_rate": 1.8798316543013317e-05, "loss": 0.1683, "loss_nan_ranks": 0, "loss_rank_avg": 0.18792478740215302, "step": 2455, "valid_targets_mean": 3656.6, "valid_targets_min": 449 }, { "epoch": 3.9805825242718447, "grad_norm": 0.6466575183901547, "learning_rate": 1.8717773839252477e-05, "loss": 0.1745, "loss_nan_ranks": 0, "loss_rank_avg": 0.17349807918071747, "step": 2460, "valid_targets_mean": 4207.3, "valid_targets_min": 1258 }, { "epoch": 3.988673139158576, "grad_norm": 0.5677694171684091, "learning_rate": 1.8637252010900515e-05, "loss": 0.1623, "loss_nan_ranks": 0, "loss_rank_avg": 0.14839619398117065, "step": 2465, "valid_targets_mean": 3616.2, "valid_targets_min": 369 }, { "epoch": 3.9967637540453076, "grad_norm": 0.5817112797352827, "learning_rate": 1.8556752368900972e-05, "loss": 0.163, "loss_nan_ranks": 0, "loss_rank_avg": 0.15644389390945435, "step": 2470, "valid_targets_mean": 4212.1, "valid_targets_min": 598 }, { "epoch": 4.004854368932039, "grad_norm": 0.5838872954552842, "learning_rate": 1.8476276223836177e-05, "loss": 0.1516, "loss_nan_ranks": 0, "loss_rank_avg": 0.1359456181526184, "step": 2475, "valid_targets_mean": 3580.9, "valid_targets_min": 460 }, { "epoch": 4.0129449838187705, "grad_norm": 0.6181440361500631, "learning_rate": 1.8395824885905898e-05, "loss": 0.1483, "loss_nan_ranks": 0, "loss_rank_avg": 0.15484167635440826, "step": 2480, "valid_targets_mean": 4019.4, "valid_targets_min": 1593 }, { "epoch": 4.0210355987055015, "grad_norm": 0.6311832020407332, "learning_rate": 1.8315399664906062e-05, "loss": 0.1449, "loss_nan_ranks": 0, "loss_rank_avg": 0.1441861242055893, "step": 2485, "valid_targets_mean": 3870.4, "valid_targets_min": 1748 }, { "epoch": 4.029126213592233, "grad_norm": 0.6857583489532473, "learning_rate": 1.823500187020735e-05, "loss": 0.1505, "loss_nan_ranks": 0, "loss_rank_avg": 0.1345384567975998, "step": 2490, "valid_targets_mean": 3765.9, "valid_targets_min": 1322 }, { "epoch": 4.0372168284789645, "grad_norm": 0.7113640655797298, "learning_rate": 1.815463281073396e-05, "loss": 0.1502, "loss_nan_ranks": 0, "loss_rank_avg": 0.1583227813243866, "step": 2495, "valid_targets_mean": 3249.9, "valid_targets_min": 539 }, { "epoch": 4.0453074433656955, "grad_norm": 0.662581106462447, "learning_rate": 1.8074293794942262e-05, "loss": 0.143, "loss_nan_ranks": 0, "loss_rank_avg": 0.1287870854139328, "step": 2500, "valid_targets_mean": 3816.8, "valid_targets_min": 926 }, { "epoch": 4.053398058252427, "grad_norm": 0.5793919248054356, "learning_rate": 1.7993986130799477e-05, "loss": 0.1451, "loss_nan_ranks": 0, "loss_rank_avg": 0.1330222338438034, "step": 2505, "valid_targets_mean": 4338.5, "valid_targets_min": 2365 }, { "epoch": 4.061488673139158, "grad_norm": 0.6078390592693177, "learning_rate": 1.7913711125762435e-05, "loss": 0.1569, "loss_nan_ranks": 0, "loss_rank_avg": 0.1425902545452118, "step": 2510, "valid_targets_mean": 4566.3, "valid_targets_min": 2815 }, { "epoch": 4.06957928802589, "grad_norm": 0.8150168677382256, "learning_rate": 1.7833470086756214e-05, "loss": 0.1505, "loss_nan_ranks": 0, "loss_rank_avg": 0.14174199104309082, "step": 2515, "valid_targets_mean": 3431.4, "valid_targets_min": 780 }, { "epoch": 4.077669902912621, "grad_norm": 0.670471952566526, "learning_rate": 1.7753264320152934e-05, "loss": 0.1526, "loss_nan_ranks": 0, "loss_rank_avg": 0.15361058712005615, "step": 2520, "valid_targets_mean": 3481.4, "valid_targets_min": 816 }, { "epoch": 4.085760517799352, "grad_norm": 0.6021110394444014, "learning_rate": 1.7673095131750454e-05, "loss": 0.1513, "loss_nan_ranks": 0, "loss_rank_avg": 0.14771947264671326, "step": 2525, "valid_targets_mean": 3895.3, "valid_targets_min": 370 }, { "epoch": 4.093851132686084, "grad_norm": 0.6313198974033982, "learning_rate": 1.759296382675112e-05, "loss": 0.1446, "loss_nan_ranks": 0, "loss_rank_avg": 0.13901178538799286, "step": 2530, "valid_targets_mean": 3643.3, "valid_targets_min": 562 }, { "epoch": 4.101941747572815, "grad_norm": 1.115383670240578, "learning_rate": 1.7512871709740515e-05, "loss": 0.1382, "loss_nan_ranks": 0, "loss_rank_avg": 0.14427712559700012, "step": 2535, "valid_targets_mean": 3357.8, "valid_targets_min": 1258 }, { "epoch": 4.110032362459547, "grad_norm": 0.5945728257795431, "learning_rate": 1.743282008466619e-05, "loss": 0.1424, "loss_nan_ranks": 0, "loss_rank_avg": 0.13450026512145996, "step": 2540, "valid_targets_mean": 3983.9, "valid_targets_min": 2594 }, { "epoch": 4.118122977346278, "grad_norm": 0.6485166896234807, "learning_rate": 1.7352810254816498e-05, "loss": 0.1538, "loss_nan_ranks": 0, "loss_rank_avg": 0.1662842035293579, "step": 2545, "valid_targets_mean": 3923.2, "valid_targets_min": 691 }, { "epoch": 4.12621359223301, "grad_norm": 0.6534762301883935, "learning_rate": 1.727284352279934e-05, "loss": 0.1533, "loss_nan_ranks": 0, "loss_rank_avg": 0.13402123749256134, "step": 2550, "valid_targets_mean": 3921.8, "valid_targets_min": 2214 }, { "epoch": 4.134304207119741, "grad_norm": 0.6786977646467098, "learning_rate": 1.7192921190520936e-05, "loss": 0.1496, "loss_nan_ranks": 0, "loss_rank_avg": 0.14459103345870972, "step": 2555, "valid_targets_mean": 4039.2, "valid_targets_min": 1643 }, { "epoch": 4.142394822006472, "grad_norm": 0.6573301423442405, "learning_rate": 1.7113044559164657e-05, "loss": 0.145, "loss_nan_ranks": 0, "loss_rank_avg": 0.15165367722511292, "step": 2560, "valid_targets_mean": 3763.1, "valid_targets_min": 622 }, { "epoch": 4.150485436893204, "grad_norm": 0.6621324780494194, "learning_rate": 1.7033214929169847e-05, "loss": 0.1512, "loss_nan_ranks": 0, "loss_rank_avg": 0.14901897311210632, "step": 2565, "valid_targets_mean": 3928.9, "valid_targets_min": 2003 }, { "epoch": 4.158576051779935, "grad_norm": 0.649660750750346, "learning_rate": 1.695343360021064e-05, "loss": 0.1412, "loss_nan_ranks": 0, "loss_rank_avg": 0.14463084936141968, "step": 2570, "valid_targets_mean": 4004.2, "valid_targets_min": 1628 }, { "epoch": 4.166666666666667, "grad_norm": 0.6870184255662538, "learning_rate": 1.6873701871174782e-05, "loss": 0.1524, "loss_nan_ranks": 0, "loss_rank_avg": 0.14344152808189392, "step": 2575, "valid_targets_mean": 3691.4, "valid_targets_min": 621 }, { "epoch": 4.174757281553398, "grad_norm": 0.6505329392557849, "learning_rate": 1.6794021040142534e-05, "loss": 0.1439, "loss_nan_ranks": 0, "loss_rank_avg": 0.1347620189189911, "step": 2580, "valid_targets_mean": 3929.4, "valid_targets_min": 953 }, { "epoch": 4.18284789644013, "grad_norm": 0.7350776506050503, "learning_rate": 1.6714392404365467e-05, "loss": 0.1382, "loss_nan_ranks": 0, "loss_rank_avg": 0.15007461607456207, "step": 2585, "valid_targets_mean": 4382.9, "valid_targets_min": 2220 }, { "epoch": 4.190938511326861, "grad_norm": 0.754225049943721, "learning_rate": 1.6634817260245417e-05, "loss": 0.1483, "loss_nan_ranks": 0, "loss_rank_avg": 0.16796696186065674, "step": 2590, "valid_targets_mean": 3107.8, "valid_targets_min": 451 }, { "epoch": 4.199029126213592, "grad_norm": 0.651272931082461, "learning_rate": 1.655529690331332e-05, "loss": 0.146, "loss_nan_ranks": 0, "loss_rank_avg": 0.1237691193819046, "step": 2595, "valid_targets_mean": 3806.5, "valid_targets_min": 909 }, { "epoch": 4.207119741100324, "grad_norm": 0.6508181443890371, "learning_rate": 1.6475832628208165e-05, "loss": 0.1416, "loss_nan_ranks": 0, "loss_rank_avg": 0.13523957133293152, "step": 2600, "valid_targets_mean": 3647.2, "valid_targets_min": 957 }, { "epoch": 4.215210355987055, "grad_norm": 0.7227632839629261, "learning_rate": 1.6396425728655874e-05, "loss": 0.1464, "loss_nan_ranks": 0, "loss_rank_avg": 0.1514357030391693, "step": 2605, "valid_targets_mean": 3626.4, "valid_targets_min": 536 }, { "epoch": 4.223300970873787, "grad_norm": 0.6640700426495993, "learning_rate": 1.6317077497448278e-05, "loss": 0.1466, "loss_nan_ranks": 0, "loss_rank_avg": 0.1584387570619583, "step": 2610, "valid_targets_mean": 3992.6, "valid_targets_min": 451 }, { "epoch": 4.231391585760518, "grad_norm": 0.8556463930160811, "learning_rate": 1.6237789226422033e-05, "loss": 0.1442, "loss_nan_ranks": 0, "loss_rank_avg": 0.14512553811073303, "step": 2615, "valid_targets_mean": 3118.4, "valid_targets_min": 428 }, { "epoch": 4.239482200647249, "grad_norm": 0.7077309518646648, "learning_rate": 1.6158562206437634e-05, "loss": 0.1549, "loss_nan_ranks": 0, "loss_rank_avg": 0.14674773812294006, "step": 2620, "valid_targets_mean": 3484.4, "valid_targets_min": 349 }, { "epoch": 4.247572815533981, "grad_norm": 0.6862643174407498, "learning_rate": 1.6079397727358345e-05, "loss": 0.155, "loss_nan_ranks": 0, "loss_rank_avg": 0.17743253707885742, "step": 2625, "valid_targets_mean": 3890.9, "valid_targets_min": 1035 }, { "epoch": 4.255663430420712, "grad_norm": 0.6813524473623369, "learning_rate": 1.6000297078029256e-05, "loss": 0.1436, "loss_nan_ranks": 0, "loss_rank_avg": 0.15772217512130737, "step": 2630, "valid_targets_mean": 4023.1, "valid_targets_min": 533 }, { "epoch": 4.263754045307444, "grad_norm": 0.6563813142401669, "learning_rate": 1.5921261546256236e-05, "loss": 0.1459, "loss_nan_ranks": 0, "loss_rank_avg": 0.12581901252269745, "step": 2635, "valid_targets_mean": 3186.6, "valid_targets_min": 946 }, { "epoch": 4.271844660194175, "grad_norm": 0.679061048016753, "learning_rate": 1.5842292418785026e-05, "loss": 0.1412, "loss_nan_ranks": 0, "loss_rank_avg": 0.13736608624458313, "step": 2640, "valid_targets_mean": 3609.4, "valid_targets_min": 826 }, { "epoch": 4.2799352750809065, "grad_norm": 0.6955635366220325, "learning_rate": 1.5763390981280258e-05, "loss": 0.1328, "loss_nan_ranks": 0, "loss_rank_avg": 0.13078239560127258, "step": 2645, "valid_targets_mean": 3810.5, "valid_targets_min": 1642 }, { "epoch": 4.288025889967638, "grad_norm": 0.6710216957754729, "learning_rate": 1.568455851830453e-05, "loss": 0.1439, "loss_nan_ranks": 0, "loss_rank_avg": 0.1374095380306244, "step": 2650, "valid_targets_mean": 3627.3, "valid_targets_min": 1344 }, { "epoch": 4.296116504854369, "grad_norm": 0.6781973790355561, "learning_rate": 1.5605796313297502e-05, "loss": 0.143, "loss_nan_ranks": 0, "loss_rank_avg": 0.14508819580078125, "step": 2655, "valid_targets_mean": 3500.6, "valid_targets_min": 426 }, { "epoch": 4.3042071197411005, "grad_norm": 0.7376450559475305, "learning_rate": 1.552710564855498e-05, "loss": 0.1504, "loss_nan_ranks": 0, "loss_rank_avg": 0.1402195245027542, "step": 2660, "valid_targets_mean": 3175.8, "valid_targets_min": 449 }, { "epoch": 4.3122977346278315, "grad_norm": 0.7192468794992135, "learning_rate": 1.5448487805208047e-05, "loss": 0.1495, "loss_nan_ranks": 0, "loss_rank_avg": 0.14955146610736847, "step": 2665, "valid_targets_mean": 3211.4, "valid_targets_min": 269 }, { "epoch": 4.320388349514563, "grad_norm": 0.6228075319720846, "learning_rate": 1.5369944063202228e-05, "loss": 0.1371, "loss_nan_ranks": 0, "loss_rank_avg": 0.1207929328083992, "step": 2670, "valid_targets_mean": 3558.4, "valid_targets_min": 499 }, { "epoch": 4.328478964401294, "grad_norm": 0.7485342397517419, "learning_rate": 1.529147570127663e-05, "loss": 0.1536, "loss_nan_ranks": 0, "loss_rank_avg": 0.14952194690704346, "step": 2675, "valid_targets_mean": 3660.6, "valid_targets_min": 790 }, { "epoch": 4.336569579288026, "grad_norm": 0.6931771759253382, "learning_rate": 1.5213083996943124e-05, "loss": 0.1375, "loss_nan_ranks": 0, "loss_rank_avg": 0.1318070888519287, "step": 2680, "valid_targets_mean": 3454.6, "valid_targets_min": 522 }, { "epoch": 4.344660194174757, "grad_norm": 0.6979626156230478, "learning_rate": 1.5134770226465533e-05, "loss": 0.1478, "loss_nan_ranks": 0, "loss_rank_avg": 0.146072655916214, "step": 2685, "valid_targets_mean": 3518.3, "valid_targets_min": 538 }, { "epoch": 4.352750809061488, "grad_norm": 0.6557240448616157, "learning_rate": 1.5056535664838894e-05, "loss": 0.1495, "loss_nan_ranks": 0, "loss_rank_avg": 0.14116227626800537, "step": 2690, "valid_targets_mean": 4056.6, "valid_targets_min": 2699 }, { "epoch": 4.36084142394822, "grad_norm": 0.6417394256829899, "learning_rate": 1.4978381585768676e-05, "loss": 0.1487, "loss_nan_ranks": 0, "loss_rank_avg": 0.16907694935798645, "step": 2695, "valid_targets_mean": 4150.7, "valid_targets_min": 1647 }, { "epoch": 4.368932038834951, "grad_norm": 0.6447473771244111, "learning_rate": 1.490030926165002e-05, "loss": 0.1425, "loss_nan_ranks": 0, "loss_rank_avg": 0.12808853387832642, "step": 2700, "valid_targets_mean": 3274.6, "valid_targets_min": 650 }, { "epoch": 4.377022653721683, "grad_norm": 0.6135227436036308, "learning_rate": 1.4822319963547083e-05, "loss": 0.151, "loss_nan_ranks": 0, "loss_rank_avg": 0.15349863469600677, "step": 2705, "valid_targets_mean": 3956.3, "valid_targets_min": 2449 }, { "epoch": 4.385113268608414, "grad_norm": 0.6632921549893784, "learning_rate": 1.4744414961172267e-05, "loss": 0.1478, "loss_nan_ranks": 0, "loss_rank_avg": 0.152324840426445, "step": 2710, "valid_targets_mean": 3791.8, "valid_targets_min": 1014 }, { "epoch": 4.393203883495145, "grad_norm": 0.6832544029610803, "learning_rate": 1.4666595522865628e-05, "loss": 0.1456, "loss_nan_ranks": 0, "loss_rank_avg": 0.16460612416267395, "step": 2715, "valid_targets_mean": 3845.2, "valid_targets_min": 910 }, { "epoch": 4.401294498381877, "grad_norm": 0.6833501669663028, "learning_rate": 1.4588862915574158e-05, "loss": 0.1592, "loss_nan_ranks": 0, "loss_rank_avg": 0.16949523985385895, "step": 2720, "valid_targets_mean": 4021.8, "valid_targets_min": 1366 }, { "epoch": 4.409385113268608, "grad_norm": 0.6096949346655066, "learning_rate": 1.4511218404831208e-05, "loss": 0.145, "loss_nan_ranks": 0, "loss_rank_avg": 0.12424943596124649, "step": 2725, "valid_targets_mean": 3627.6, "valid_targets_min": 559 }, { "epoch": 4.41747572815534, "grad_norm": 0.6522445618690355, "learning_rate": 1.4433663254735868e-05, "loss": 0.1396, "loss_nan_ranks": 0, "loss_rank_avg": 0.1399524211883545, "step": 2730, "valid_targets_mean": 3913.4, "valid_targets_min": 2373 }, { "epoch": 4.425566343042071, "grad_norm": 0.6078107797038349, "learning_rate": 1.4356198727932357e-05, "loss": 0.152, "loss_nan_ranks": 0, "loss_rank_avg": 0.14214907586574554, "step": 2735, "valid_targets_mean": 4400.7, "valid_targets_min": 3234 }, { "epoch": 4.433656957928803, "grad_norm": 0.6322546695687536, "learning_rate": 1.427882608558951e-05, "loss": 0.1403, "loss_nan_ranks": 0, "loss_rank_avg": 0.1225961297750473, "step": 2740, "valid_targets_mean": 3752.8, "valid_targets_min": 1584 }, { "epoch": 4.441747572815534, "grad_norm": 0.6617047906893644, "learning_rate": 1.420154658738023e-05, "loss": 0.1489, "loss_nan_ranks": 0, "loss_rank_avg": 0.15037743747234344, "step": 2745, "valid_targets_mean": 3884.7, "valid_targets_min": 650 }, { "epoch": 4.449838187702265, "grad_norm": 0.6450489483141357, "learning_rate": 1.4124361491460979e-05, "loss": 0.1316, "loss_nan_ranks": 0, "loss_rank_avg": 0.14448890089988708, "step": 2750, "valid_targets_mean": 4195.3, "valid_targets_min": 2233 }, { "epoch": 4.457928802588997, "grad_norm": 0.7196615177429064, "learning_rate": 1.4047272054451288e-05, "loss": 0.1549, "loss_nan_ranks": 0, "loss_rank_avg": 0.15937447547912598, "step": 2755, "valid_targets_mean": 3453.7, "valid_targets_min": 442 }, { "epoch": 4.466019417475728, "grad_norm": 0.7185337546342929, "learning_rate": 1.397027953141329e-05, "loss": 0.1416, "loss_nan_ranks": 0, "loss_rank_avg": 0.11660395562648773, "step": 2760, "valid_targets_mean": 3775.2, "valid_targets_min": 1588 }, { "epoch": 4.47411003236246, "grad_norm": 0.689052637867341, "learning_rate": 1.3893385175831326e-05, "loss": 0.1412, "loss_nan_ranks": 0, "loss_rank_avg": 0.15225495398044586, "step": 2765, "valid_targets_mean": 3532.5, "valid_targets_min": 433 }, { "epoch": 4.482200647249191, "grad_norm": 0.6084241558336754, "learning_rate": 1.3816590239591502e-05, "loss": 0.1391, "loss_nan_ranks": 0, "loss_rank_avg": 0.12444262951612473, "step": 2770, "valid_targets_mean": 3905.1, "valid_targets_min": 997 }, { "epoch": 4.490291262135923, "grad_norm": 0.7634877881621217, "learning_rate": 1.3739895972961312e-05, "loss": 0.1459, "loss_nan_ranks": 0, "loss_rank_avg": 0.16124451160430908, "step": 2775, "valid_targets_mean": 3246.4, "valid_targets_min": 431 }, { "epoch": 4.498381877022654, "grad_norm": 0.7282789159692459, "learning_rate": 1.3663303624569303e-05, "loss": 0.1442, "loss_nan_ranks": 0, "loss_rank_avg": 0.1560203731060028, "step": 2780, "valid_targets_mean": 3731.1, "valid_targets_min": 605 }, { "epoch": 4.506472491909385, "grad_norm": 0.6105558503523129, "learning_rate": 1.3586814441384707e-05, "loss": 0.1469, "loss_nan_ranks": 0, "loss_rank_avg": 0.12341571599245071, "step": 2785, "valid_targets_mean": 4048.4, "valid_targets_min": 2250 }, { "epoch": 4.514563106796117, "grad_norm": 0.6571177564002022, "learning_rate": 1.3510429668697188e-05, "loss": 0.1319, "loss_nan_ranks": 0, "loss_rank_avg": 0.1218075305223465, "step": 2790, "valid_targets_mean": 3747.4, "valid_targets_min": 1315 }, { "epoch": 4.522653721682848, "grad_norm": 0.6801848412658954, "learning_rate": 1.3434150550096534e-05, "loss": 0.1493, "loss_nan_ranks": 0, "loss_rank_avg": 0.16177475452423096, "step": 2795, "valid_targets_mean": 4049.3, "valid_targets_min": 1667 }, { "epoch": 4.53074433656958, "grad_norm": 0.6207342193834591, "learning_rate": 1.3357978327452425e-05, "loss": 0.1434, "loss_nan_ranks": 0, "loss_rank_avg": 0.13945342600345612, "step": 2800, "valid_targets_mean": 4553.1, "valid_targets_min": 2577 }, { "epoch": 4.538834951456311, "grad_norm": 0.6573784092270141, "learning_rate": 1.3281914240894218e-05, "loss": 0.1494, "loss_nan_ranks": 0, "loss_rank_avg": 0.1442652940750122, "step": 2805, "valid_targets_mean": 4044.2, "valid_targets_min": 1903 }, { "epoch": 4.546925566343042, "grad_norm": 0.7805486249949233, "learning_rate": 1.320595952879073e-05, "loss": 0.1471, "loss_nan_ranks": 0, "loss_rank_avg": 0.15102678537368774, "step": 2810, "valid_targets_mean": 3677.2, "valid_targets_min": 330 }, { "epoch": 4.555016181229774, "grad_norm": 0.67466501003837, "learning_rate": 1.3130115427730106e-05, "loss": 0.1483, "loss_nan_ranks": 0, "loss_rank_avg": 0.14177349209785461, "step": 2815, "valid_targets_mean": 3778.1, "valid_targets_min": 2097 }, { "epoch": 4.563106796116505, "grad_norm": 0.6530112142615018, "learning_rate": 1.3054383172499688e-05, "loss": 0.142, "loss_nan_ranks": 0, "loss_rank_avg": 0.1437305212020874, "step": 2820, "valid_targets_mean": 4198.1, "valid_targets_min": 2700 }, { "epoch": 4.5711974110032365, "grad_norm": 0.677754173384933, "learning_rate": 1.2978763996065888e-05, "loss": 0.1488, "loss_nan_ranks": 0, "loss_rank_avg": 0.1430257260799408, "step": 2825, "valid_targets_mean": 3589.8, "valid_targets_min": 1004 }, { "epoch": 4.5792880258899675, "grad_norm": 0.748140170284871, "learning_rate": 1.2903259129554138e-05, "loss": 0.1381, "loss_nan_ranks": 0, "loss_rank_avg": 0.16187545657157898, "step": 2830, "valid_targets_mean": 4454.9, "valid_targets_min": 1996 }, { "epoch": 4.5873786407766985, "grad_norm": 0.725070674975314, "learning_rate": 1.2827869802228816e-05, "loss": 0.1433, "loss_nan_ranks": 0, "loss_rank_avg": 0.16014769673347473, "step": 2835, "valid_targets_mean": 3145.8, "valid_targets_min": 473 }, { "epoch": 4.5954692556634305, "grad_norm": 0.6695155511796875, "learning_rate": 1.2752597241473273e-05, "loss": 0.1451, "loss_nan_ranks": 0, "loss_rank_avg": 0.13507728278636932, "step": 2840, "valid_targets_mean": 3233.1, "valid_targets_min": 522 }, { "epoch": 4.6035598705501615, "grad_norm": 0.6874745243656388, "learning_rate": 1.2677442672769832e-05, "loss": 0.1525, "loss_nan_ranks": 0, "loss_rank_avg": 0.1317557394504547, "step": 2845, "valid_targets_mean": 4060.1, "valid_targets_min": 1601 }, { "epoch": 4.611650485436893, "grad_norm": 0.6614289983469602, "learning_rate": 1.2602407319679822e-05, "loss": 0.1451, "loss_nan_ranks": 0, "loss_rank_avg": 0.1529705822467804, "step": 2850, "valid_targets_mean": 3698.4, "valid_targets_min": 1094 }, { "epoch": 4.619741100323624, "grad_norm": 0.6751540658943308, "learning_rate": 1.2527492403823664e-05, "loss": 0.1388, "loss_nan_ranks": 0, "loss_rank_avg": 0.1433483511209488, "step": 2855, "valid_targets_mean": 3522.2, "valid_targets_min": 249 }, { "epoch": 4.627831715210356, "grad_norm": 0.7103834955161041, "learning_rate": 1.2452699144861012e-05, "loss": 0.1468, "loss_nan_ranks": 0, "loss_rank_avg": 0.1555805206298828, "step": 2860, "valid_targets_mean": 4060.1, "valid_targets_min": 470 }, { "epoch": 4.635922330097087, "grad_norm": 0.7622609109059741, "learning_rate": 1.237802876047086e-05, "loss": 0.1371, "loss_nan_ranks": 0, "loss_rank_avg": 0.1385229527950287, "step": 2865, "valid_targets_mean": 3845.6, "valid_targets_min": 1340 }, { "epoch": 4.644012944983819, "grad_norm": 0.7214538094938855, "learning_rate": 1.2303482466331727e-05, "loss": 0.1513, "loss_nan_ranks": 0, "loss_rank_avg": 0.15360170602798462, "step": 2870, "valid_targets_mean": 3656.2, "valid_targets_min": 738 }, { "epoch": 4.65210355987055, "grad_norm": 0.6916396910551235, "learning_rate": 1.2229061476101883e-05, "loss": 0.1376, "loss_nan_ranks": 0, "loss_rank_avg": 0.1525598168373108, "step": 2875, "valid_targets_mean": 3600.1, "valid_targets_min": 1357 }, { "epoch": 4.660194174757281, "grad_norm": 0.6729985151314064, "learning_rate": 1.2154767001399551e-05, "loss": 0.1451, "loss_nan_ranks": 0, "loss_rank_avg": 0.14135336875915527, "step": 2880, "valid_targets_mean": 3632.1, "valid_targets_min": 575 }, { "epoch": 4.668284789644013, "grad_norm": 0.6962655582465614, "learning_rate": 1.2080600251783233e-05, "loss": 0.1393, "loss_nan_ranks": 0, "loss_rank_avg": 0.1368042379617691, "step": 2885, "valid_targets_mean": 3786.1, "valid_targets_min": 388 }, { "epoch": 4.676375404530744, "grad_norm": 0.7090725837062865, "learning_rate": 1.2006562434731968e-05, "loss": 0.1405, "loss_nan_ranks": 0, "loss_rank_avg": 0.14932994544506073, "step": 2890, "valid_targets_mean": 3464.5, "valid_targets_min": 2115 }, { "epoch": 4.684466019417476, "grad_norm": 0.6985018150678612, "learning_rate": 1.193265475562571e-05, "loss": 0.1413, "loss_nan_ranks": 0, "loss_rank_avg": 0.1416228860616684, "step": 2895, "valid_targets_mean": 3852.8, "valid_targets_min": 1231 }, { "epoch": 4.692556634304207, "grad_norm": 0.6608970430018517, "learning_rate": 1.1858878417725683e-05, "loss": 0.1393, "loss_nan_ranks": 0, "loss_rank_avg": 0.13789209723472595, "step": 2900, "valid_targets_mean": 3671.8, "valid_targets_min": 685 }, { "epoch": 4.700647249190938, "grad_norm": 0.6626344499235478, "learning_rate": 1.1785234622154797e-05, "loss": 0.1482, "loss_nan_ranks": 0, "loss_rank_avg": 0.16734716296195984, "step": 2905, "valid_targets_mean": 3912.6, "valid_targets_min": 444 }, { "epoch": 4.70873786407767, "grad_norm": 0.729467490979312, "learning_rate": 1.1711724567878095e-05, "loss": 0.1383, "loss_nan_ranks": 0, "loss_rank_avg": 0.141088604927063, "step": 2910, "valid_targets_mean": 3118.9, "valid_targets_min": 1241 }, { "epoch": 4.716828478964401, "grad_norm": 0.6271378285039474, "learning_rate": 1.1638349451683237e-05, "loss": 0.1368, "loss_nan_ranks": 0, "loss_rank_avg": 0.12910325825214386, "step": 2915, "valid_targets_mean": 3909.6, "valid_targets_min": 481 }, { "epoch": 4.724919093851133, "grad_norm": 0.7315823978800721, "learning_rate": 1.1565110468160996e-05, "loss": 0.1403, "loss_nan_ranks": 0, "loss_rank_avg": 0.16693362593650818, "step": 2920, "valid_targets_mean": 3973.8, "valid_targets_min": 1861 }, { "epoch": 4.733009708737864, "grad_norm": 0.6961422251454465, "learning_rate": 1.1492008809685856e-05, "loss": 0.1599, "loss_nan_ranks": 0, "loss_rank_avg": 0.15453936159610748, "step": 2925, "valid_targets_mean": 3943.8, "valid_targets_min": 422 }, { "epoch": 4.741100323624595, "grad_norm": 0.7947679996073709, "learning_rate": 1.141904566639652e-05, "loss": 0.1398, "loss_nan_ranks": 0, "loss_rank_avg": 0.159670889377594, "step": 2930, "valid_targets_mean": 3625.1, "valid_targets_min": 1755 }, { "epoch": 4.749190938511327, "grad_norm": 0.6820283456884491, "learning_rate": 1.1346222226176606e-05, "loss": 0.1447, "loss_nan_ranks": 0, "loss_rank_avg": 0.13358992338180542, "step": 2935, "valid_targets_mean": 3843.3, "valid_targets_min": 462 }, { "epoch": 4.757281553398058, "grad_norm": 0.688613911291754, "learning_rate": 1.1273539674635296e-05, "loss": 0.1319, "loss_nan_ranks": 0, "loss_rank_avg": 0.14009517431259155, "step": 2940, "valid_targets_mean": 3796.8, "valid_targets_min": 468 }, { "epoch": 4.76537216828479, "grad_norm": 0.741239831951198, "learning_rate": 1.1200999195088e-05, "loss": 0.1376, "loss_nan_ranks": 0, "loss_rank_avg": 0.13354428112506866, "step": 2945, "valid_targets_mean": 3529.9, "valid_targets_min": 985 }, { "epoch": 4.773462783171521, "grad_norm": 0.6855567557895231, "learning_rate": 1.1128601968537111e-05, "loss": 0.1426, "loss_nan_ranks": 0, "loss_rank_avg": 0.14763250946998596, "step": 2950, "valid_targets_mean": 4232.2, "valid_targets_min": 862 }, { "epoch": 4.781553398058253, "grad_norm": 0.6953856815463785, "learning_rate": 1.1056349173652791e-05, "loss": 0.1474, "loss_nan_ranks": 0, "loss_rank_avg": 0.14699126780033112, "step": 2955, "valid_targets_mean": 3721.8, "valid_targets_min": 463 }, { "epoch": 4.789644012944984, "grad_norm": 0.6429481817754351, "learning_rate": 1.098424198675375e-05, "loss": 0.1396, "loss_nan_ranks": 0, "loss_rank_avg": 0.12160778045654297, "step": 2960, "valid_targets_mean": 3576.0, "valid_targets_min": 1326 }, { "epoch": 4.797734627831716, "grad_norm": 0.6696602169332752, "learning_rate": 1.0912281581788138e-05, "loss": 0.1414, "loss_nan_ranks": 0, "loss_rank_avg": 0.1489216685295105, "step": 2965, "valid_targets_mean": 4214.5, "valid_targets_min": 515 }, { "epoch": 4.805825242718447, "grad_norm": 0.6628125000555849, "learning_rate": 1.0840469130314382e-05, "loss": 0.1449, "loss_nan_ranks": 0, "loss_rank_avg": 0.1368810534477234, "step": 2970, "valid_targets_mean": 4117.8, "valid_targets_min": 364 }, { "epoch": 4.813915857605178, "grad_norm": 0.6993787147902919, "learning_rate": 1.0768805801482151e-05, "loss": 0.1391, "loss_nan_ranks": 0, "loss_rank_avg": 0.13343513011932373, "step": 2975, "valid_targets_mean": 3098.6, "valid_targets_min": 427 }, { "epoch": 4.82200647249191, "grad_norm": 0.7330396364465878, "learning_rate": 1.0697292762013304e-05, "loss": 0.1253, "loss_nan_ranks": 0, "loss_rank_avg": 0.1259125918149948, "step": 2980, "valid_targets_mean": 3147.1, "valid_targets_min": 470 }, { "epoch": 4.830097087378641, "grad_norm": 0.722436884104266, "learning_rate": 1.0625931176182905e-05, "loss": 0.1365, "loss_nan_ranks": 0, "loss_rank_avg": 0.10967875272035599, "step": 2985, "valid_targets_mean": 3203.4, "valid_targets_min": 686 }, { "epoch": 4.8381877022653725, "grad_norm": 0.7138949308865148, "learning_rate": 1.0554722205800245e-05, "loss": 0.1371, "loss_nan_ranks": 0, "loss_rank_avg": 0.1445237249135971, "step": 2990, "valid_targets_mean": 3971.1, "valid_targets_min": 1266 }, { "epoch": 4.8462783171521036, "grad_norm": 0.6823622727229742, "learning_rate": 1.0483667010189973e-05, "loss": 0.1497, "loss_nan_ranks": 0, "loss_rank_avg": 0.1553669422864914, "step": 2995, "valid_targets_mean": 3809.2, "valid_targets_min": 422 }, { "epoch": 4.854368932038835, "grad_norm": 0.7813029712176784, "learning_rate": 1.0412766746173168e-05, "loss": 0.1455, "loss_nan_ranks": 0, "loss_rank_avg": 0.17688441276550293, "step": 3000, "valid_targets_mean": 4146.6, "valid_targets_min": 2345 }, { "epoch": 4.8624595469255665, "grad_norm": 0.7018435375236487, "learning_rate": 1.0342022568048543e-05, "loss": 0.1399, "loss_nan_ranks": 0, "loss_rank_avg": 0.13416077196598053, "step": 3005, "valid_targets_mean": 3526.8, "valid_targets_min": 731 }, { "epoch": 4.8705501618122975, "grad_norm": 0.7073555559675111, "learning_rate": 1.0271435627573631e-05, "loss": 0.1357, "loss_nan_ranks": 0, "loss_rank_avg": 0.13437259197235107, "step": 3010, "valid_targets_mean": 3547.7, "valid_targets_min": 1613 }, { "epoch": 4.878640776699029, "grad_norm": 0.7970239445560131, "learning_rate": 1.0201007073946041e-05, "loss": 0.1294, "loss_nan_ranks": 0, "loss_rank_avg": 0.11350645124912262, "step": 3015, "valid_targets_mean": 3346.7, "valid_targets_min": 478 }, { "epoch": 4.88673139158576, "grad_norm": 0.6785346013570012, "learning_rate": 1.0130738053784768e-05, "loss": 0.1505, "loss_nan_ranks": 0, "loss_rank_avg": 0.144822895526886, "step": 3020, "valid_targets_mean": 4021.6, "valid_targets_min": 1996 }, { "epoch": 4.894822006472491, "grad_norm": 0.7767919403819858, "learning_rate": 1.0060629711111494e-05, "loss": 0.1459, "loss_nan_ranks": 0, "loss_rank_avg": 0.14588266611099243, "step": 3025, "valid_targets_mean": 3322.8, "valid_targets_min": 1553 }, { "epoch": 4.902912621359223, "grad_norm": 0.6946416256584877, "learning_rate": 9.99068318733195e-06, "loss": 0.1431, "loss_nan_ranks": 0, "loss_rank_avg": 0.14380928874015808, "step": 3030, "valid_targets_mean": 3390.6, "valid_targets_min": 446 }, { "epoch": 4.911003236245954, "grad_norm": 0.6506329244470211, "learning_rate": 9.92089962121741e-06, "loss": 0.1473, "loss_nan_ranks": 0, "loss_rank_avg": 0.11819320917129517, "step": 3035, "valid_targets_mean": 4117.6, "valid_targets_min": 423 }, { "epoch": 4.919093851132686, "grad_norm": 0.6476148960343205, "learning_rate": 9.851280148886061e-06, "loss": 0.1444, "loss_nan_ranks": 0, "loss_rank_avg": 0.12191256880760193, "step": 3040, "valid_targets_mean": 3871.6, "valid_targets_min": 1215 }, { "epoch": 4.927184466019417, "grad_norm": 0.6425251067861399, "learning_rate": 9.78182590378455e-06, "loss": 0.1353, "loss_nan_ranks": 0, "loss_rank_avg": 0.12856820225715637, "step": 3045, "valid_targets_mean": 3881.7, "valid_targets_min": 590 }, { "epoch": 4.935275080906149, "grad_norm": 0.6608994309697848, "learning_rate": 9.712538016669557e-06, "loss": 0.1431, "loss_nan_ranks": 0, "loss_rank_avg": 0.16227906942367554, "step": 3050, "valid_targets_mean": 4399.9, "valid_targets_min": 1498 }, { "epoch": 4.94336569579288, "grad_norm": 0.6863530052280413, "learning_rate": 9.643417615589299e-06, "loss": 0.1443, "loss_nan_ranks": 0, "loss_rank_avg": 0.1477239429950714, "step": 3055, "valid_targets_mean": 4083.6, "valid_targets_min": 1446 }, { "epoch": 4.951456310679612, "grad_norm": 0.6955301304136801, "learning_rate": 9.574465825865276e-06, "loss": 0.1368, "loss_nan_ranks": 0, "loss_rank_avg": 0.14413318037986755, "step": 3060, "valid_targets_mean": 3786.9, "valid_targets_min": 909 }, { "epoch": 4.959546925566343, "grad_norm": 0.7140674650867661, "learning_rate": 9.50568377007386e-06, "loss": 0.1474, "loss_nan_ranks": 0, "loss_rank_avg": 0.1486683040857315, "step": 3065, "valid_targets_mean": 3171.9, "valid_targets_min": 405 }, { "epoch": 4.967637540453074, "grad_norm": 0.6709510332322777, "learning_rate": 9.43707256802806e-06, "loss": 0.1363, "loss_nan_ranks": 0, "loss_rank_avg": 0.13565918803215027, "step": 3070, "valid_targets_mean": 4014.1, "valid_targets_min": 450 }, { "epoch": 4.975728155339806, "grad_norm": 0.7251112737304829, "learning_rate": 9.368633336759292e-06, "loss": 0.1442, "loss_nan_ranks": 0, "loss_rank_avg": 0.14906924962997437, "step": 3075, "valid_targets_mean": 3706.9, "valid_targets_min": 1849 }, { "epoch": 4.983818770226537, "grad_norm": 0.6722351700077497, "learning_rate": 9.300367190499178e-06, "loss": 0.1391, "loss_nan_ranks": 0, "loss_rank_avg": 0.1070292741060257, "step": 3080, "valid_targets_mean": 3536.6, "valid_targets_min": 774 }, { "epoch": 4.991909385113269, "grad_norm": 0.7375188285335043, "learning_rate": 9.232275240661403e-06, "loss": 0.1398, "loss_nan_ranks": 0, "loss_rank_avg": 0.14554689824581146, "step": 3085, "valid_targets_mean": 3175.9, "valid_targets_min": 405 }, { "epoch": 5.0, "grad_norm": 0.7498091683809376, "learning_rate": 9.164358595823661e-06, "loss": 0.1518, "loss_nan_ranks": 0, "loss_rank_avg": 0.13450586795806885, "step": 3090, "valid_targets_mean": 3267.0, "valid_targets_min": 390 }, { "epoch": 5.008090614886731, "grad_norm": 0.7255837834802069, "learning_rate": 9.096618361709545e-06, "loss": 0.1294, "loss_nan_ranks": 0, "loss_rank_avg": 0.13300150632858276, "step": 3095, "valid_targets_mean": 3423.9, "valid_targets_min": 522 }, { "epoch": 5.016181229773463, "grad_norm": 0.705829673432509, "learning_rate": 9.029055641170588e-06, "loss": 0.1221, "loss_nan_ranks": 0, "loss_rank_avg": 0.11673476547002792, "step": 3100, "valid_targets_mean": 4109.0, "valid_targets_min": 2786 }, { "epoch": 5.024271844660194, "grad_norm": 0.6817632348570839, "learning_rate": 8.961671534168292e-06, "loss": 0.1263, "loss_nan_ranks": 0, "loss_rank_avg": 0.12463103979825974, "step": 3105, "valid_targets_mean": 3897.5, "valid_targets_min": 1063 }, { "epoch": 5.032362459546926, "grad_norm": 0.7346020556413199, "learning_rate": 8.894467137756228e-06, "loss": 0.1212, "loss_nan_ranks": 0, "loss_rank_avg": 0.13819938898086548, "step": 3110, "valid_targets_mean": 3778.1, "valid_targets_min": 1357 }, { "epoch": 5.040453074433657, "grad_norm": 0.6649553794586656, "learning_rate": 8.827443546062165e-06, "loss": 0.1219, "loss_nan_ranks": 0, "loss_rank_avg": 0.11913490295410156, "step": 3115, "valid_targets_mean": 3797.8, "valid_targets_min": 1538 }, { "epoch": 5.048543689320389, "grad_norm": 0.7359575993819188, "learning_rate": 8.760601850270277e-06, "loss": 0.1215, "loss_nan_ranks": 0, "loss_rank_avg": 0.1277879774570465, "step": 3120, "valid_targets_mean": 3530.2, "valid_targets_min": 507 }, { "epoch": 5.05663430420712, "grad_norm": 0.7258097409461821, "learning_rate": 8.69394313860335e-06, "loss": 0.1286, "loss_nan_ranks": 0, "loss_rank_avg": 0.1081918478012085, "step": 3125, "valid_targets_mean": 3826.4, "valid_targets_min": 1124 }, { "epoch": 5.064724919093851, "grad_norm": 0.7402612846004758, "learning_rate": 8.62746849630508e-06, "loss": 0.125, "loss_nan_ranks": 0, "loss_rank_avg": 0.12437973916530609, "step": 3130, "valid_targets_mean": 3779.6, "valid_targets_min": 1287 }, { "epoch": 5.072815533980583, "grad_norm": 0.7365753473236456, "learning_rate": 8.561179005622411e-06, "loss": 0.1255, "loss_nan_ranks": 0, "loss_rank_avg": 0.13570137321949005, "step": 3135, "valid_targets_mean": 3778.3, "valid_targets_min": 374 }, { "epoch": 5.080906148867314, "grad_norm": 0.647195839952784, "learning_rate": 8.495075745787895e-06, "loss": 0.131, "loss_nan_ranks": 0, "loss_rank_avg": 0.1312873214483261, "step": 3140, "valid_targets_mean": 4459.8, "valid_targets_min": 1050 }, { "epoch": 5.088996763754046, "grad_norm": 0.6554961316240389, "learning_rate": 8.429159793002164e-06, "loss": 0.1289, "loss_nan_ranks": 0, "loss_rank_avg": 0.11646975576877594, "step": 3145, "valid_targets_mean": 4235.4, "valid_targets_min": 2303 }, { "epoch": 5.097087378640777, "grad_norm": 0.7274467943356496, "learning_rate": 8.363432220416336e-06, "loss": 0.1374, "loss_nan_ranks": 0, "loss_rank_avg": 0.1406169980764389, "step": 3150, "valid_targets_mean": 3789.8, "valid_targets_min": 377 }, { "epoch": 5.105177993527508, "grad_norm": 0.7281449684268655, "learning_rate": 8.297894098114612e-06, "loss": 0.1364, "loss_nan_ranks": 0, "loss_rank_avg": 0.1407594084739685, "step": 3155, "valid_targets_mean": 3965.4, "valid_targets_min": 1744 }, { "epoch": 5.11326860841424, "grad_norm": 0.645898547032898, "learning_rate": 8.232546493096836e-06, "loss": 0.1215, "loss_nan_ranks": 0, "loss_rank_avg": 0.1111171543598175, "step": 3160, "valid_targets_mean": 4013.9, "valid_targets_min": 1588 }, { "epoch": 5.121359223300971, "grad_norm": 0.838705244056076, "learning_rate": 8.167390469261105e-06, "loss": 0.1304, "loss_nan_ranks": 0, "loss_rank_avg": 0.1620527058839798, "step": 3165, "valid_targets_mean": 3344.5, "valid_targets_min": 733 }, { "epoch": 5.1294498381877025, "grad_norm": 0.7039566787306656, "learning_rate": 8.102427087386457e-06, "loss": 0.1274, "loss_nan_ranks": 0, "loss_rank_avg": 0.12740206718444824, "step": 3170, "valid_targets_mean": 3907.6, "valid_targets_min": 706 }, { "epoch": 5.1375404530744335, "grad_norm": 0.6536128106483406, "learning_rate": 8.037657405115611e-06, "loss": 0.1202, "loss_nan_ranks": 0, "loss_rank_avg": 0.111982561647892, "step": 3175, "valid_targets_mean": 4094.3, "valid_targets_min": 2918 }, { "epoch": 5.145631067961165, "grad_norm": 0.7820516641963816, "learning_rate": 7.973082476937728e-06, "loss": 0.1179, "loss_nan_ranks": 0, "loss_rank_avg": 0.10970476269721985, "step": 3180, "valid_targets_mean": 3919.2, "valid_targets_min": 786 }, { "epoch": 5.1537216828478964, "grad_norm": 0.6291251865125252, "learning_rate": 7.908703354171283e-06, "loss": 0.1143, "loss_nan_ranks": 0, "loss_rank_avg": 0.09216032922267914, "step": 3185, "valid_targets_mean": 3711.6, "valid_targets_min": 460 }, { "epoch": 5.1618122977346275, "grad_norm": 0.7393911233590429, "learning_rate": 7.844521084946895e-06, "loss": 0.1306, "loss_nan_ranks": 0, "loss_rank_avg": 0.1511136293411255, "step": 3190, "valid_targets_mean": 4163.1, "valid_targets_min": 473 }, { "epoch": 5.169902912621359, "grad_norm": 0.7767299244512159, "learning_rate": 7.780536714190298e-06, "loss": 0.1273, "loss_nan_ranks": 0, "loss_rank_avg": 0.1440705955028534, "step": 3195, "valid_targets_mean": 4079.9, "valid_targets_min": 1240 }, { "epoch": 5.17799352750809, "grad_norm": 0.7478484576498746, "learning_rate": 7.716751283605324e-06, "loss": 0.1301, "loss_nan_ranks": 0, "loss_rank_avg": 0.15292268991470337, "step": 3200, "valid_targets_mean": 3749.6, "valid_targets_min": 428 }, { "epoch": 5.186084142394822, "grad_norm": 0.7339598062609202, "learning_rate": 7.653165831656937e-06, "loss": 0.1413, "loss_nan_ranks": 0, "loss_rank_avg": 0.1475408971309662, "step": 3205, "valid_targets_mean": 3905.8, "valid_targets_min": 494 }, { "epoch": 5.194174757281553, "grad_norm": 0.8093145246529954, "learning_rate": 7.589781393554321e-06, "loss": 0.1232, "loss_nan_ranks": 0, "loss_rank_avg": 0.13094545900821686, "step": 3210, "valid_targets_mean": 3094.6, "valid_targets_min": 402 }, { "epoch": 5.202265372168285, "grad_norm": 0.6854868228623259, "learning_rate": 7.526599001234058e-06, "loss": 0.1183, "loss_nan_ranks": 0, "loss_rank_avg": 0.10869428515434265, "step": 3215, "valid_targets_mean": 3835.5, "valid_targets_min": 502 }, { "epoch": 5.210355987055016, "grad_norm": 0.7125430732031628, "learning_rate": 7.463619683343284e-06, "loss": 0.1196, "loss_nan_ranks": 0, "loss_rank_avg": 0.1297406703233719, "step": 3220, "valid_targets_mean": 3900.7, "valid_targets_min": 1782 }, { "epoch": 5.218446601941747, "grad_norm": 0.7181396945472707, "learning_rate": 7.400844465222963e-06, "loss": 0.1241, "loss_nan_ranks": 0, "loss_rank_avg": 0.11025745421648026, "step": 3225, "valid_targets_mean": 3510.6, "valid_targets_min": 725 }, { "epoch": 5.226537216828479, "grad_norm": 0.7152506418537288, "learning_rate": 7.338274368891198e-06, "loss": 0.1314, "loss_nan_ranks": 0, "loss_rank_avg": 0.1154252365231514, "step": 3230, "valid_targets_mean": 3738.3, "valid_targets_min": 1605 }, { "epoch": 5.23462783171521, "grad_norm": 0.6911405200556111, "learning_rate": 7.275910413026579e-06, "loss": 0.1248, "loss_nan_ranks": 0, "loss_rank_avg": 0.12859441339969635, "step": 3235, "valid_targets_mean": 4039.9, "valid_targets_min": 1402 }, { "epoch": 5.242718446601942, "grad_norm": 0.7006616335265696, "learning_rate": 7.213753612951624e-06, "loss": 0.1312, "loss_nan_ranks": 0, "loss_rank_avg": 0.14889748394489288, "step": 3240, "valid_targets_mean": 4240.6, "valid_targets_min": 2902 }, { "epoch": 5.250809061488673, "grad_norm": 0.7881678572983208, "learning_rate": 7.1518049806162196e-06, "loss": 0.1193, "loss_nan_ranks": 0, "loss_rank_avg": 0.11947671324014664, "step": 3245, "valid_targets_mean": 3953.6, "valid_targets_min": 513 }, { "epoch": 5.258899676375404, "grad_norm": 0.721046849366806, "learning_rate": 7.090065524581136e-06, "loss": 0.1296, "loss_nan_ranks": 0, "loss_rank_avg": 0.14251643419265747, "step": 3250, "valid_targets_mean": 3847.2, "valid_targets_min": 496 }, { "epoch": 5.266990291262136, "grad_norm": 0.754366038514852, "learning_rate": 7.0285362500016675e-06, "loss": 0.1273, "loss_nan_ranks": 0, "loss_rank_avg": 0.1330687701702118, "step": 3255, "valid_targets_mean": 3853.8, "valid_targets_min": 518 }, { "epoch": 5.275080906148867, "grad_norm": 0.7508046199447793, "learning_rate": 6.967218158611202e-06, "loss": 0.1197, "loss_nan_ranks": 0, "loss_rank_avg": 0.13121311366558075, "step": 3260, "valid_targets_mean": 3239.1, "valid_targets_min": 454 }, { "epoch": 5.283171521035599, "grad_norm": 0.7209699847161913, "learning_rate": 6.906112248704939e-06, "loss": 0.1257, "loss_nan_ranks": 0, "loss_rank_avg": 0.14587056636810303, "step": 3265, "valid_targets_mean": 3749.4, "valid_targets_min": 1751 }, { "epoch": 5.29126213592233, "grad_norm": 0.6904937107421983, "learning_rate": 6.845219515123667e-06, "loss": 0.1159, "loss_nan_ranks": 0, "loss_rank_avg": 0.12392056733369827, "step": 3270, "valid_targets_mean": 3961.6, "valid_targets_min": 1610 }, { "epoch": 5.299352750809062, "grad_norm": 0.8350113985180451, "learning_rate": 6.784540949237484e-06, "loss": 0.13, "loss_nan_ranks": 0, "loss_rank_avg": 0.13344715535640717, "step": 3275, "valid_targets_mean": 3784.6, "valid_targets_min": 749 }, { "epoch": 5.307443365695793, "grad_norm": 0.7364469113973013, "learning_rate": 6.724077538929759e-06, "loss": 0.1377, "loss_nan_ranks": 0, "loss_rank_avg": 0.1438203901052475, "step": 3280, "valid_targets_mean": 3925.2, "valid_targets_min": 2514 }, { "epoch": 5.315533980582524, "grad_norm": 0.7279618289406372, "learning_rate": 6.663830268580971e-06, "loss": 0.1308, "loss_nan_ranks": 0, "loss_rank_avg": 0.13427822291851044, "step": 3285, "valid_targets_mean": 3814.9, "valid_targets_min": 1737 }, { "epoch": 5.323624595469256, "grad_norm": 0.6239991635895354, "learning_rate": 6.6038001190527146e-06, "loss": 0.1207, "loss_nan_ranks": 0, "loss_rank_avg": 0.09467694163322449, "step": 3290, "valid_targets_mean": 4052.6, "valid_targets_min": 1040 }, { "epoch": 5.331715210355987, "grad_norm": 0.7630179063607263, "learning_rate": 6.543988067671752e-06, "loss": 0.1369, "loss_nan_ranks": 0, "loss_rank_avg": 0.13112042844295502, "step": 3295, "valid_targets_mean": 3648.1, "valid_targets_min": 433 }, { "epoch": 5.339805825242719, "grad_norm": 0.6959899769773115, "learning_rate": 6.484395088214037e-06, "loss": 0.1161, "loss_nan_ranks": 0, "loss_rank_avg": 0.1262616068124771, "step": 3300, "valid_targets_mean": 3619.4, "valid_targets_min": 1452 }, { "epoch": 5.34789644012945, "grad_norm": 0.6733214313566337, "learning_rate": 6.425022150888924e-06, "loss": 0.1235, "loss_nan_ranks": 0, "loss_rank_avg": 0.10100290179252625, "step": 3305, "valid_targets_mean": 3921.1, "valid_targets_min": 1636 }, { "epoch": 5.355987055016181, "grad_norm": 0.7645979406542432, "learning_rate": 6.36587022232336e-06, "loss": 0.1186, "loss_nan_ranks": 0, "loss_rank_avg": 0.10890600085258484, "step": 3310, "valid_targets_mean": 3571.8, "valid_targets_min": 1506 }, { "epoch": 5.364077669902913, "grad_norm": 0.7144191140895096, "learning_rate": 6.306940265546117e-06, "loss": 0.1205, "loss_nan_ranks": 0, "loss_rank_avg": 0.11766283959150314, "step": 3315, "valid_targets_mean": 3672.7, "valid_targets_min": 463 }, { "epoch": 5.372168284789644, "grad_norm": 0.686173617625609, "learning_rate": 6.248233239972144e-06, "loss": 0.1148, "loss_nan_ranks": 0, "loss_rank_avg": 0.11546348035335541, "step": 3320, "valid_targets_mean": 3776.6, "valid_targets_min": 702 }, { "epoch": 5.380258899676376, "grad_norm": 0.7404569018613136, "learning_rate": 6.189750101386931e-06, "loss": 0.1266, "loss_nan_ranks": 0, "loss_rank_avg": 0.14495286345481873, "step": 3325, "valid_targets_mean": 3686.4, "valid_targets_min": 464 }, { "epoch": 5.388349514563107, "grad_norm": 0.6976672794771177, "learning_rate": 6.1314918019309535e-06, "loss": 0.1194, "loss_nan_ranks": 0, "loss_rank_avg": 0.10965608060359955, "step": 3330, "valid_targets_mean": 4057.9, "valid_targets_min": 1991 }, { "epoch": 5.3964401294498385, "grad_norm": 0.7464635834173435, "learning_rate": 6.073459290084185e-06, "loss": 0.125, "loss_nan_ranks": 0, "loss_rank_avg": 0.14042946696281433, "step": 3335, "valid_targets_mean": 3666.9, "valid_targets_min": 1900 }, { "epoch": 5.4045307443365695, "grad_norm": 0.758392528587745, "learning_rate": 6.01565351065063e-06, "loss": 0.1219, "loss_nan_ranks": 0, "loss_rank_avg": 0.1299818456172943, "step": 3340, "valid_targets_mean": 3642.3, "valid_targets_min": 439 }, { "epoch": 5.412621359223301, "grad_norm": 0.7761136854296529, "learning_rate": 5.958075404742951e-06, "loss": 0.1241, "loss_nan_ranks": 0, "loss_rank_avg": 0.13393014669418335, "step": 3345, "valid_targets_mean": 3275.5, "valid_targets_min": 269 }, { "epoch": 5.4207119741100325, "grad_norm": 0.7053876074430606, "learning_rate": 5.900725909767155e-06, "loss": 0.1159, "loss_nan_ranks": 0, "loss_rank_avg": 0.10762079060077667, "step": 3350, "valid_targets_mean": 4022.1, "valid_targets_min": 1340 }, { "epoch": 5.4288025889967635, "grad_norm": 0.7642056847412017, "learning_rate": 5.843605959407326e-06, "loss": 0.1281, "loss_nan_ranks": 0, "loss_rank_avg": 0.14689894020557404, "step": 3355, "valid_targets_mean": 3795.8, "valid_targets_min": 2510 }, { "epoch": 5.436893203883495, "grad_norm": 0.7355013386223096, "learning_rate": 5.7867164836104174e-06, "loss": 0.1247, "loss_nan_ranks": 0, "loss_rank_avg": 0.13858428597450256, "step": 3360, "valid_targets_mean": 4008.9, "valid_targets_min": 968 }, { "epoch": 5.444983818770226, "grad_norm": 0.7315669914910475, "learning_rate": 5.730058408571135e-06, "loss": 0.1315, "loss_nan_ranks": 0, "loss_rank_avg": 0.10367206484079361, "step": 3365, "valid_targets_mean": 3741.8, "valid_targets_min": 469 }, { "epoch": 5.453074433656958, "grad_norm": 0.7225588349944803, "learning_rate": 5.673632656716825e-06, "loss": 0.12, "loss_nan_ranks": 0, "loss_rank_avg": 0.10480669885873795, "step": 3370, "valid_targets_mean": 3860.3, "valid_targets_min": 2206 }, { "epoch": 5.461165048543689, "grad_norm": 0.7237332483919786, "learning_rate": 5.617440146692485e-06, "loss": 0.1242, "loss_nan_ranks": 0, "loss_rank_avg": 0.12040352076292038, "step": 3375, "valid_targets_mean": 3892.9, "valid_targets_min": 1076 }, { "epoch": 5.46925566343042, "grad_norm": 0.7602472039558393, "learning_rate": 5.561481793345786e-06, "loss": 0.1155, "loss_nan_ranks": 0, "loss_rank_avg": 0.12410160899162292, "step": 3380, "valid_targets_mean": 3685.4, "valid_targets_min": 738 }, { "epoch": 5.477346278317152, "grad_norm": 0.7380439821179074, "learning_rate": 5.505758507712196e-06, "loss": 0.1214, "loss_nan_ranks": 0, "loss_rank_avg": 0.12352344393730164, "step": 3385, "valid_targets_mean": 4037.8, "valid_targets_min": 562 }, { "epoch": 5.485436893203883, "grad_norm": 0.7890588781049627, "learning_rate": 5.450271197000128e-06, "loss": 0.1315, "loss_nan_ranks": 0, "loss_rank_avg": 0.1398930549621582, "step": 3390, "valid_targets_mean": 3493.1, "valid_targets_min": 662 }, { "epoch": 5.493527508090615, "grad_norm": 0.8416557602820898, "learning_rate": 5.395020764576211e-06, "loss": 0.1284, "loss_nan_ranks": 0, "loss_rank_avg": 0.1332603096961975, "step": 3395, "valid_targets_mean": 3456.3, "valid_targets_min": 433 }, { "epoch": 5.501618122977346, "grad_norm": 0.6903723606199367, "learning_rate": 5.340008109950512e-06, "loss": 0.1294, "loss_nan_ranks": 0, "loss_rank_avg": 0.1297823190689087, "step": 3400, "valid_targets_mean": 3866.8, "valid_targets_min": 1020 }, { "epoch": 5.509708737864077, "grad_norm": 0.6579088713294159, "learning_rate": 5.285234128761969e-06, "loss": 0.1257, "loss_nan_ranks": 0, "loss_rank_avg": 0.10706949234008789, "step": 3405, "valid_targets_mean": 3828.5, "valid_targets_min": 1661 }, { "epoch": 5.517799352750809, "grad_norm": 0.7010522478745738, "learning_rate": 5.230699712763758e-06, "loss": 0.1237, "loss_nan_ranks": 0, "loss_rank_avg": 0.12073405086994171, "step": 3410, "valid_targets_mean": 3811.7, "valid_targets_min": 753 }, { "epoch": 5.52588996763754, "grad_norm": 0.7773182598525699, "learning_rate": 5.176405749808786e-06, "loss": 0.1304, "loss_nan_ranks": 0, "loss_rank_avg": 0.15182915329933167, "step": 3415, "valid_targets_mean": 4130.1, "valid_targets_min": 259 }, { "epoch": 5.533980582524272, "grad_norm": 0.8638464314660135, "learning_rate": 5.122353123835262e-06, "loss": 0.1384, "loss_nan_ranks": 0, "loss_rank_avg": 0.1541995108127594, "step": 3420, "valid_targets_mean": 3474.5, "valid_targets_min": 1122 }, { "epoch": 5.542071197411003, "grad_norm": 0.6892371890482751, "learning_rate": 5.068542714852254e-06, "loss": 0.1298, "loss_nan_ranks": 0, "loss_rank_avg": 0.1293623000383377, "step": 3425, "valid_targets_mean": 3804.9, "valid_targets_min": 1364 }, { "epoch": 5.550161812297735, "grad_norm": 0.7405131577003049, "learning_rate": 5.014975398925408e-06, "loss": 0.1174, "loss_nan_ranks": 0, "loss_rank_avg": 0.12245788425207138, "step": 3430, "valid_targets_mean": 3846.7, "valid_targets_min": 2016 }, { "epoch": 5.558252427184466, "grad_norm": 0.7063009742960525, "learning_rate": 4.9616520481626794e-06, "loss": 0.1193, "loss_nan_ranks": 0, "loss_rank_avg": 0.11486178636550903, "step": 3435, "valid_targets_mean": 3717.2, "valid_targets_min": 480 }, { "epoch": 5.566343042071198, "grad_norm": 0.7074391715770296, "learning_rate": 4.908573530700111e-06, "loss": 0.1276, "loss_nan_ranks": 0, "loss_rank_avg": 0.13461247086524963, "step": 3440, "valid_targets_mean": 4163.8, "valid_targets_min": 675 }, { "epoch": 5.574433656957929, "grad_norm": 0.8056262006079112, "learning_rate": 4.8557407106877175e-06, "loss": 0.1248, "loss_nan_ranks": 0, "loss_rank_avg": 0.11532510817050934, "step": 3445, "valid_targets_mean": 3564.0, "valid_targets_min": 1009 }, { "epoch": 5.58252427184466, "grad_norm": 0.6689071640066644, "learning_rate": 4.8031544482754136e-06, "loss": 0.1312, "loss_nan_ranks": 0, "loss_rank_avg": 0.12339470535516739, "step": 3450, "valid_targets_mean": 3999.7, "valid_targets_min": 1739 }, { "epoch": 5.590614886731392, "grad_norm": 0.7727457741265664, "learning_rate": 4.7508155995989944e-06, "loss": 0.1307, "loss_nan_ranks": 0, "loss_rank_avg": 0.12754319608211517, "step": 3455, "valid_targets_mean": 3478.6, "valid_targets_min": 433 }, { "epoch": 5.598705501618123, "grad_norm": 0.7051623852726349, "learning_rate": 4.6987250167662435e-06, "loss": 0.1147, "loss_nan_ranks": 0, "loss_rank_avg": 0.13093580305576324, "step": 3460, "valid_targets_mean": 4168.9, "valid_targets_min": 897 }, { "epoch": 5.606796116504855, "grad_norm": 0.7539130701198374, "learning_rate": 4.6468835478430045e-06, "loss": 0.12, "loss_nan_ranks": 0, "loss_rank_avg": 0.12748193740844727, "step": 3465, "valid_targets_mean": 3325.4, "valid_targets_min": 444 }, { "epoch": 5.614886731391586, "grad_norm": 0.7286866436675753, "learning_rate": 4.595292036839383e-06, "loss": 0.1225, "loss_nan_ranks": 0, "loss_rank_avg": 0.11541740596294403, "step": 3470, "valid_targets_mean": 3640.0, "valid_targets_min": 420 }, { "epoch": 5.622977346278317, "grad_norm": 0.7234246657508987, "learning_rate": 4.543951323696058e-06, "loss": 0.1204, "loss_nan_ranks": 0, "loss_rank_avg": 0.11532118916511536, "step": 3475, "valid_targets_mean": 3745.8, "valid_targets_min": 1187 }, { "epoch": 5.631067961165049, "grad_norm": 0.7620959965037666, "learning_rate": 4.492862244270544e-06, "loss": 0.1228, "loss_nan_ranks": 0, "loss_rank_avg": 0.13576315343379974, "step": 3480, "valid_targets_mean": 3854.0, "valid_targets_min": 862 }, { "epoch": 5.63915857605178, "grad_norm": 0.7060173631264054, "learning_rate": 4.442025630323607e-06, "loss": 0.1214, "loss_nan_ranks": 0, "loss_rank_avg": 0.12959304451942444, "step": 3485, "valid_targets_mean": 4153.1, "valid_targets_min": 515 }, { "epoch": 5.647249190938512, "grad_norm": 0.830192046283675, "learning_rate": 4.3914423095057516e-06, "loss": 0.1221, "loss_nan_ranks": 0, "loss_rank_avg": 0.11251272261142731, "step": 3490, "valid_targets_mean": 3465.1, "valid_targets_min": 612 }, { "epoch": 5.655339805825243, "grad_norm": 0.678502014152424, "learning_rate": 4.341113105343673e-06, "loss": 0.1222, "loss_nan_ranks": 0, "loss_rank_avg": 0.11163593083620071, "step": 3495, "valid_targets_mean": 3950.2, "valid_targets_min": 505 }, { "epoch": 5.663430420711974, "grad_norm": 0.7849757937871225, "learning_rate": 4.291038837226935e-06, "loss": 0.1209, "loss_nan_ranks": 0, "loss_rank_avg": 0.13538207113742828, "step": 3500, "valid_targets_mean": 3912.1, "valid_targets_min": 1647 }, { "epoch": 5.671521035598706, "grad_norm": 0.7234102654591658, "learning_rate": 4.241220320394574e-06, "loss": 0.128, "loss_nan_ranks": 0, "loss_rank_avg": 0.1282060295343399, "step": 3505, "valid_targets_mean": 3848.4, "valid_targets_min": 479 }, { "epoch": 5.679611650485437, "grad_norm": 0.7422885539309136, "learning_rate": 4.191658365921838e-06, "loss": 0.1247, "loss_nan_ranks": 0, "loss_rank_avg": 0.12916360795497894, "step": 3510, "valid_targets_mean": 3610.4, "valid_targets_min": 1850 }, { "epoch": 5.6877022653721685, "grad_norm": 0.7125773638661527, "learning_rate": 4.1423537807070065e-06, "loss": 0.1246, "loss_nan_ranks": 0, "loss_rank_avg": 0.11903668940067291, "step": 3515, "valid_targets_mean": 3842.6, "valid_targets_min": 1601 }, { "epoch": 5.6957928802588995, "grad_norm": 0.752523330730224, "learning_rate": 4.0933073674582054e-06, "loss": 0.1241, "loss_nan_ranks": 0, "loss_rank_avg": 0.1267009973526001, "step": 3520, "valid_targets_mean": 3492.9, "valid_targets_min": 1014 }, { "epoch": 5.703883495145631, "grad_norm": 0.7270519639308166, "learning_rate": 4.044519924680379e-06, "loss": 0.125, "loss_nan_ranks": 0, "loss_rank_avg": 0.12510140240192413, "step": 3525, "valid_targets_mean": 3632.8, "valid_targets_min": 460 }, { "epoch": 5.711974110032362, "grad_norm": 0.7187809324224477, "learning_rate": 3.99599224666229e-06, "loss": 0.1254, "loss_nan_ranks": 0, "loss_rank_avg": 0.12706691026687622, "step": 3530, "valid_targets_mean": 3854.6, "valid_targets_min": 2008 }, { "epoch": 5.720064724919094, "grad_norm": 0.6986751025778004, "learning_rate": 3.947725123463559e-06, "loss": 0.135, "loss_nan_ranks": 0, "loss_rank_avg": 0.14450600743293762, "step": 3535, "valid_targets_mean": 4264.0, "valid_targets_min": 449 }, { "epoch": 5.728155339805825, "grad_norm": 0.7752207817322075, "learning_rate": 3.8997193409018245e-06, "loss": 0.1177, "loss_nan_ranks": 0, "loss_rank_avg": 0.11388484388589859, "step": 3540, "valid_targets_mean": 3403.1, "valid_targets_min": 453 }, { "epoch": 5.736245954692556, "grad_norm": 0.8051040328349554, "learning_rate": 3.851975680539941e-06, "loss": 0.1228, "loss_nan_ranks": 0, "loss_rank_avg": 0.13021591305732727, "step": 3545, "valid_targets_mean": 3859.8, "valid_targets_min": 1954 }, { "epoch": 5.744336569579288, "grad_norm": 0.8416631487491211, "learning_rate": 3.804494919673254e-06, "loss": 0.1316, "loss_nan_ranks": 0, "loss_rank_avg": 0.1455630362033844, "step": 3550, "valid_targets_mean": 3486.1, "valid_targets_min": 731 }, { "epoch": 5.752427184466019, "grad_norm": 0.7539706877774351, "learning_rate": 3.757277831316961e-06, "loss": 0.1301, "loss_nan_ranks": 0, "loss_rank_avg": 0.13057079911231995, "step": 3555, "valid_targets_mean": 3653.4, "valid_targets_min": 460 }, { "epoch": 5.760517799352751, "grad_norm": 0.7345729665958677, "learning_rate": 3.7103251841934993e-06, "loss": 0.1243, "loss_nan_ranks": 0, "loss_rank_avg": 0.121879443526268, "step": 3560, "valid_targets_mean": 3892.4, "valid_targets_min": 2001 }, { "epoch": 5.768608414239482, "grad_norm": 0.7300947831568095, "learning_rate": 3.663637742720052e-06, "loss": 0.1208, "loss_nan_ranks": 0, "loss_rank_avg": 0.12066502124071121, "step": 3565, "valid_targets_mean": 3785.7, "valid_targets_min": 1726 }, { "epoch": 5.776699029126213, "grad_norm": 0.7854108618258545, "learning_rate": 3.617216266996093e-06, "loss": 0.129, "loss_nan_ranks": 0, "loss_rank_avg": 0.09828585386276245, "step": 3570, "valid_targets_mean": 3547.1, "valid_targets_min": 448 }, { "epoch": 5.784789644012945, "grad_norm": 0.6950199968709713, "learning_rate": 3.571061512791012e-06, "loss": 0.1238, "loss_nan_ranks": 0, "loss_rank_avg": 0.12642902135849, "step": 3575, "valid_targets_mean": 4099.1, "valid_targets_min": 2514 }, { "epoch": 5.792880258899676, "grad_norm": 0.6788504116739233, "learning_rate": 3.525174231531814e-06, "loss": 0.1309, "loss_nan_ranks": 0, "loss_rank_avg": 0.12123347818851471, "step": 3580, "valid_targets_mean": 3896.4, "valid_targets_min": 642 }, { "epoch": 5.800970873786408, "grad_norm": 0.8682257553577993, "learning_rate": 3.4795551702908935e-06, "loss": 0.1357, "loss_nan_ranks": 0, "loss_rank_avg": 0.16144192218780518, "step": 3585, "valid_targets_mean": 3735.9, "valid_targets_min": 1174 }, { "epoch": 5.809061488673139, "grad_norm": 0.6913961014302824, "learning_rate": 3.434205071773855e-06, "loss": 0.1256, "loss_nan_ranks": 0, "loss_rank_avg": 0.12861505150794983, "step": 3590, "valid_targets_mean": 4488.1, "valid_targets_min": 2276 }, { "epoch": 5.81715210355987, "grad_norm": 0.7809800057454481, "learning_rate": 3.3891246743074245e-06, "loss": 0.1215, "loss_nan_ranks": 0, "loss_rank_avg": 0.11062463372945786, "step": 3595, "valid_targets_mean": 4145.9, "valid_targets_min": 2503 }, { "epoch": 5.825242718446602, "grad_norm": 0.6702913762142105, "learning_rate": 3.344314711827441e-06, "loss": 0.1309, "loss_nan_ranks": 0, "loss_rank_avg": 0.11128797382116318, "step": 3600, "valid_targets_mean": 3917.0, "valid_targets_min": 834 }, { "epoch": 5.833333333333333, "grad_norm": 0.7697182542474907, "learning_rate": 3.299775913866894e-06, "loss": 0.118, "loss_nan_ranks": 0, "loss_rank_avg": 0.1268385350704193, "step": 3605, "valid_targets_mean": 3472.0, "valid_targets_min": 459 }, { "epoch": 5.841423948220065, "grad_norm": 0.7155200788961812, "learning_rate": 3.255509005544062e-06, "loss": 0.1214, "loss_nan_ranks": 0, "loss_rank_avg": 0.11924313008785248, "step": 3610, "valid_targets_mean": 4219.1, "valid_targets_min": 3201 }, { "epoch": 5.849514563106796, "grad_norm": 0.6954308628669343, "learning_rate": 3.2115147075506957e-06, "loss": 0.1263, "loss_nan_ranks": 0, "loss_rank_avg": 0.12587472796440125, "step": 3615, "valid_targets_mean": 3964.8, "valid_targets_min": 2650 }, { "epoch": 5.857605177993528, "grad_norm": 0.7923704942527922, "learning_rate": 3.1677937361402654e-06, "loss": 0.1299, "loss_nan_ranks": 0, "loss_rank_avg": 0.13604333996772766, "step": 3620, "valid_targets_mean": 3791.6, "valid_targets_min": 1586 }, { "epoch": 5.865695792880259, "grad_norm": 0.7963806010437653, "learning_rate": 3.124346803116354e-06, "loss": 0.1196, "loss_nan_ranks": 0, "loss_rank_avg": 0.12812381982803345, "step": 3625, "valid_targets_mean": 3818.2, "valid_targets_min": 434 }, { "epoch": 5.87378640776699, "grad_norm": 0.8065922087851086, "learning_rate": 3.0811746158210165e-06, "loss": 0.1275, "loss_nan_ranks": 0, "loss_rank_avg": 0.12494488060474396, "step": 3630, "valid_targets_mean": 3470.3, "valid_targets_min": 801 }, { "epoch": 5.881877022653722, "grad_norm": 0.6934755628970144, "learning_rate": 3.0382778771232766e-06, "loss": 0.117, "loss_nan_ranks": 0, "loss_rank_avg": 0.11633384227752686, "step": 3635, "valid_targets_mean": 3957.1, "valid_targets_min": 1752 }, { "epoch": 5.889967637540453, "grad_norm": 0.6957018475982958, "learning_rate": 2.9956572854077205e-06, "loss": 0.1153, "loss_nan_ranks": 0, "loss_rank_avg": 0.11870764195919037, "step": 3640, "valid_targets_mean": 4018.0, "valid_targets_min": 1690 }, { "epoch": 5.898058252427185, "grad_norm": 0.7920517590567935, "learning_rate": 2.9533135345630536e-06, "loss": 0.1176, "loss_nan_ranks": 0, "loss_rank_avg": 0.14628848433494568, "step": 3645, "valid_targets_mean": 3822.6, "valid_targets_min": 950 }, { "epoch": 5.906148867313916, "grad_norm": 0.7682562383139114, "learning_rate": 2.911247313970882e-06, "loss": 0.1187, "loss_nan_ranks": 0, "loss_rank_avg": 0.1245870590209961, "step": 3650, "valid_targets_mean": 3558.5, "valid_targets_min": 643 }, { "epoch": 5.914239482200648, "grad_norm": 0.7764934542624735, "learning_rate": 2.8694593084944356e-06, "loss": 0.1329, "loss_nan_ranks": 0, "loss_rank_avg": 0.11907865107059479, "step": 3655, "valid_targets_mean": 4022.9, "valid_targets_min": 1227 }, { "epoch": 5.922330097087379, "grad_norm": 0.7915955290706294, "learning_rate": 2.8279501984674396e-06, "loss": 0.1121, "loss_nan_ranks": 0, "loss_rank_avg": 0.12054628133773804, "step": 3660, "valid_targets_mean": 3649.9, "valid_targets_min": 475 }, { "epoch": 5.93042071197411, "grad_norm": 0.686045896267701, "learning_rate": 2.7867206596830355e-06, "loss": 0.1223, "loss_nan_ranks": 0, "loss_rank_avg": 0.10917463898658752, "step": 3665, "valid_targets_mean": 4130.0, "valid_targets_min": 2201 }, { "epoch": 5.938511326860842, "grad_norm": 0.7249342585567816, "learning_rate": 2.7457713633827763e-06, "loss": 0.1233, "loss_nan_ranks": 0, "loss_rank_avg": 0.12481742352247238, "step": 3670, "valid_targets_mean": 3999.8, "valid_targets_min": 2119 }, { "epoch": 5.946601941747573, "grad_norm": 0.7335052345451426, "learning_rate": 2.705102976245697e-06, "loss": 0.1257, "loss_nan_ranks": 0, "loss_rank_avg": 0.1226348727941513, "step": 3675, "valid_targets_mean": 3779.4, "valid_targets_min": 1258 }, { "epoch": 5.9546925566343045, "grad_norm": 0.7240696636506034, "learning_rate": 2.6647161603774763e-06, "loss": 0.1225, "loss_nan_ranks": 0, "loss_rank_avg": 0.12565986812114716, "step": 3680, "valid_targets_mean": 3699.1, "valid_targets_min": 1361 }, { "epoch": 5.9627831715210355, "grad_norm": 0.9844611721489968, "learning_rate": 2.624611573299629e-06, "loss": 0.1214, "loss_nan_ranks": 0, "loss_rank_avg": 0.12091508507728577, "step": 3685, "valid_targets_mean": 3558.1, "valid_targets_min": 313 }, { "epoch": 5.970873786407767, "grad_norm": 0.7889095453729414, "learning_rate": 2.5847898679388217e-06, "loss": 0.1304, "loss_nan_ranks": 0, "loss_rank_avg": 0.12522706389427185, "step": 3690, "valid_targets_mean": 3903.6, "valid_targets_min": 1472 }, { "epoch": 5.9789644012944985, "grad_norm": 0.7583140618259258, "learning_rate": 2.5452516926162394e-06, "loss": 0.1195, "loss_nan_ranks": 0, "loss_rank_avg": 0.1313149333000183, "step": 3695, "valid_targets_mean": 3939.1, "valid_targets_min": 503 }, { "epoch": 5.9870550161812295, "grad_norm": 0.7620324187487387, "learning_rate": 2.5059976910370255e-06, "loss": 0.1188, "loss_nan_ranks": 0, "loss_rank_avg": 0.1112971380352974, "step": 3700, "valid_targets_mean": 3635.0, "valid_targets_min": 703 }, { "epoch": 5.995145631067961, "grad_norm": 0.7140358860481412, "learning_rate": 2.467028502279802e-06, "loss": 0.1171, "loss_nan_ranks": 0, "loss_rank_avg": 0.11595533788204193, "step": 3705, "valid_targets_mean": 3788.3, "valid_targets_min": 1853 }, { "epoch": 6.003236245954692, "grad_norm": 0.6509891193331984, "learning_rate": 2.428344760786283e-06, "loss": 0.115, "loss_nan_ranks": 0, "loss_rank_avg": 0.09506258368492126, "step": 3710, "valid_targets_mean": 3532.4, "valid_targets_min": 650 }, { "epoch": 6.011326860841424, "grad_norm": 0.7139744229116504, "learning_rate": 2.389947096350913e-06, "loss": 0.111, "loss_nan_ranks": 0, "loss_rank_avg": 0.10088154673576355, "step": 3715, "valid_targets_mean": 3833.9, "valid_targets_min": 1259 }, { "epoch": 6.019417475728155, "grad_norm": 0.6897387337767092, "learning_rate": 2.3518361341106366e-06, "loss": 0.1136, "loss_nan_ranks": 0, "loss_rank_avg": 0.10516591370105743, "step": 3720, "valid_targets_mean": 3907.6, "valid_targets_min": 1849 }, { "epoch": 6.027508090614886, "grad_norm": 0.7425321933146951, "learning_rate": 2.3140124945347188e-06, "loss": 0.1244, "loss_nan_ranks": 0, "loss_rank_avg": 0.12143640220165253, "step": 3725, "valid_targets_mean": 3391.8, "valid_targets_min": 397 }, { "epoch": 6.035598705501618, "grad_norm": 0.694108149750431, "learning_rate": 2.2764767934146304e-06, "loss": 0.1151, "loss_nan_ranks": 0, "loss_rank_avg": 0.120110422372818, "step": 3730, "valid_targets_mean": 3814.7, "valid_targets_min": 1117 }, { "epoch": 6.043689320388349, "grad_norm": 0.7002918869971856, "learning_rate": 2.2392296418540527e-06, "loss": 0.1075, "loss_nan_ranks": 0, "loss_rank_avg": 0.09147246181964874, "step": 3735, "valid_targets_mean": 3512.8, "valid_targets_min": 1510 }, { "epoch": 6.051779935275081, "grad_norm": 0.7931772871720706, "learning_rate": 2.20227164625888e-06, "loss": 0.1246, "loss_nan_ranks": 0, "loss_rank_avg": 0.13165760040283203, "step": 3740, "valid_targets_mean": 3220.9, "valid_targets_min": 430 }, { "epoch": 6.059870550161812, "grad_norm": 0.7318335669267926, "learning_rate": 2.165603408327386e-06, "loss": 0.109, "loss_nan_ranks": 0, "loss_rank_avg": 0.09360679239034653, "step": 3745, "valid_targets_mean": 3538.3, "valid_targets_min": 1886 }, { "epoch": 6.067961165048544, "grad_norm": 0.6564949740471046, "learning_rate": 2.129225525040428e-06, "loss": 0.1182, "loss_nan_ranks": 0, "loss_rank_avg": 0.11405914276838303, "step": 3750, "valid_targets_mean": 4078.1, "valid_targets_min": 1100 }, { "epoch": 6.076051779935275, "grad_norm": 0.7352580575605189, "learning_rate": 2.0931385886517043e-06, "loss": 0.1231, "loss_nan_ranks": 0, "loss_rank_avg": 0.11465087532997131, "step": 3755, "valid_targets_mean": 3844.5, "valid_targets_min": 1201 }, { "epoch": 6.084142394822006, "grad_norm": 0.74020729169368, "learning_rate": 2.05734318667812e-06, "loss": 0.1111, "loss_nan_ranks": 0, "loss_rank_avg": 0.10614818334579468, "step": 3760, "valid_targets_mean": 3700.8, "valid_targets_min": 1405 }, { "epoch": 6.092233009708738, "grad_norm": 0.7715214057611403, "learning_rate": 2.0218399018902368e-06, "loss": 0.1152, "loss_nan_ranks": 0, "loss_rank_avg": 0.122889444231987, "step": 3765, "valid_targets_mean": 3979.6, "valid_targets_min": 606 }, { "epoch": 6.100323624595469, "grad_norm": 0.7281761064430898, "learning_rate": 1.986629312302759e-06, "loss": 0.1123, "loss_nan_ranks": 0, "loss_rank_avg": 0.1031067818403244, "step": 3770, "valid_targets_mean": 3470.1, "valid_targets_min": 471 }, { "epoch": 6.108414239482201, "grad_norm": 0.7454398419847319, "learning_rate": 1.9517119911651594e-06, "loss": 0.1216, "loss_nan_ranks": 0, "loss_rank_avg": 0.11875297129154205, "step": 3775, "valid_targets_mean": 3795.9, "valid_targets_min": 1507 }, { "epoch": 6.116504854368932, "grad_norm": 0.661496166671743, "learning_rate": 1.917088506952307e-06, "loss": 0.1105, "loss_nan_ranks": 0, "loss_rank_avg": 0.09311284124851227, "step": 3780, "valid_targets_mean": 3664.3, "valid_targets_min": 1643 }, { "epoch": 6.124595469255663, "grad_norm": 0.835262575264935, "learning_rate": 1.8827594233552338e-06, "loss": 0.1078, "loss_nan_ranks": 0, "loss_rank_avg": 0.1381199210882187, "step": 3785, "valid_targets_mean": 3730.8, "valid_targets_min": 413 }, { "epoch": 6.132686084142395, "grad_norm": 0.7026566817099582, "learning_rate": 1.8487252992719562e-06, "loss": 0.116, "loss_nan_ranks": 0, "loss_rank_avg": 0.1321025788784027, "step": 3790, "valid_targets_mean": 4019.1, "valid_targets_min": 1063 }, { "epoch": 6.140776699029126, "grad_norm": 0.8163113871171781, "learning_rate": 1.8149866887983747e-06, "loss": 0.1145, "loss_nan_ranks": 0, "loss_rank_avg": 0.11378465592861176, "step": 3795, "valid_targets_mean": 3231.6, "valid_targets_min": 349 }, { "epoch": 6.148867313915858, "grad_norm": 0.7477376471533267, "learning_rate": 1.7815441412192447e-06, "loss": 0.1176, "loss_nan_ranks": 0, "loss_rank_avg": 0.10754677653312683, "step": 3800, "valid_targets_mean": 3431.2, "valid_targets_min": 1641 }, { "epoch": 6.156957928802589, "grad_norm": 0.728794180353719, "learning_rate": 1.7483982009992506e-06, "loss": 0.1166, "loss_nan_ranks": 0, "loss_rank_avg": 0.08733691275119781, "step": 3805, "valid_targets_mean": 3602.6, "valid_targets_min": 1726 }, { "epoch": 6.165048543689321, "grad_norm": 0.7562254178879685, "learning_rate": 1.715549407774124e-06, "loss": 0.1133, "loss_nan_ranks": 0, "loss_rank_avg": 0.12288179993629456, "step": 3810, "valid_targets_mean": 4288.5, "valid_targets_min": 1982 }, { "epoch": 6.173139158576052, "grad_norm": 0.8169277563659051, "learning_rate": 1.6829982963418667e-06, "loss": 0.1229, "loss_nan_ranks": 0, "loss_rank_avg": 0.13156858086585999, "step": 3815, "valid_targets_mean": 3638.5, "valid_targets_min": 450 }, { "epoch": 6.181229773462783, "grad_norm": 0.791581886463547, "learning_rate": 1.6507453966540454e-06, "loss": 0.1087, "loss_nan_ranks": 0, "loss_rank_avg": 0.11052010953426361, "step": 3820, "valid_targets_mean": 3243.2, "valid_targets_min": 872 }, { "epoch": 6.189320388349515, "grad_norm": 0.8071179807020908, "learning_rate": 1.6187912338071577e-06, "loss": 0.1142, "loss_nan_ranks": 0, "loss_rank_avg": 0.09611040353775024, "step": 3825, "valid_targets_mean": 3300.4, "valid_targets_min": 405 }, { "epoch": 6.197411003236246, "grad_norm": 0.7341034704709207, "learning_rate": 1.5871363280340913e-06, "loss": 0.1183, "loss_nan_ranks": 0, "loss_rank_avg": 0.1326591819524765, "step": 3830, "valid_targets_mean": 4006.7, "valid_targets_min": 2289 }, { "epoch": 6.205501618122978, "grad_norm": 0.6722924657092954, "learning_rate": 1.555781194695649e-06, "loss": 0.1102, "loss_nan_ranks": 0, "loss_rank_avg": 0.09945492446422577, "step": 3835, "valid_targets_mean": 3795.8, "valid_targets_min": 490 }, { "epoch": 6.213592233009709, "grad_norm": 0.7674389171998626, "learning_rate": 1.5247263442721494e-06, "loss": 0.1169, "loss_nan_ranks": 0, "loss_rank_avg": 0.12633197009563446, "step": 3840, "valid_targets_mean": 3439.7, "valid_targets_min": 462 }, { "epoch": 6.2216828478964405, "grad_norm": 0.7534393253923913, "learning_rate": 1.4939722823551428e-06, "loss": 0.1193, "loss_nan_ranks": 0, "loss_rank_avg": 0.1213739737868309, "step": 3845, "valid_targets_mean": 3602.9, "valid_targets_min": 397 }, { "epoch": 6.229773462783172, "grad_norm": 0.705373170660076, "learning_rate": 1.4635195096391463e-06, "loss": 0.1184, "loss_nan_ranks": 0, "loss_rank_avg": 0.11145274341106415, "step": 3850, "valid_targets_mean": 3498.0, "valid_targets_min": 1047 }, { "epoch": 6.237864077669903, "grad_norm": 0.7336287787765475, "learning_rate": 1.4333685219135163e-06, "loss": 0.1109, "loss_nan_ranks": 0, "loss_rank_avg": 0.134007066488266, "step": 3855, "valid_targets_mean": 4273.0, "valid_targets_min": 1809 }, { "epoch": 6.2459546925566345, "grad_norm": 0.6955768107461284, "learning_rate": 1.403519810054379e-06, "loss": 0.1128, "loss_nan_ranks": 0, "loss_rank_avg": 0.11127742379903793, "step": 3860, "valid_targets_mean": 4114.2, "valid_targets_min": 1593 }, { "epoch": 6.2540453074433655, "grad_norm": 0.6957722780972634, "learning_rate": 1.373973860016602e-06, "loss": 0.1156, "loss_nan_ranks": 0, "loss_rank_avg": 0.1035354882478714, "step": 3865, "valid_targets_mean": 3479.8, "valid_targets_min": 706 }, { "epoch": 6.262135922330097, "grad_norm": 0.7271832148458794, "learning_rate": 1.3447311528259354e-06, "loss": 0.1151, "loss_nan_ranks": 0, "loss_rank_avg": 0.12107687443494797, "step": 3870, "valid_targets_mean": 3875.2, "valid_targets_min": 1717 }, { "epoch": 6.270226537216828, "grad_norm": 0.7225262524495937, "learning_rate": 1.3157921645711436e-06, "loss": 0.1151, "loss_nan_ranks": 0, "loss_rank_avg": 0.12497846782207489, "step": 3875, "valid_targets_mean": 3914.5, "valid_targets_min": 507 }, { "epoch": 6.2783171521035595, "grad_norm": 0.8559665525671778, "learning_rate": 1.2871573663962611e-06, "loss": 0.112, "loss_nan_ranks": 0, "loss_rank_avg": 0.14065983891487122, "step": 3880, "valid_targets_mean": 3619.2, "valid_targets_min": 514 }, { "epoch": 6.286407766990291, "grad_norm": 0.7858491084715699, "learning_rate": 1.2588272244929401e-06, "loss": 0.1103, "loss_nan_ranks": 0, "loss_rank_avg": 0.10485831648111343, "step": 3885, "valid_targets_mean": 3352.1, "valid_targets_min": 338 }, { "epoch": 6.294498381877022, "grad_norm": 0.8093000501376625, "learning_rate": 1.2308022000928287e-06, "loss": 0.1216, "loss_nan_ranks": 0, "loss_rank_avg": 0.13177737593650818, "step": 3890, "valid_targets_mean": 3496.9, "valid_targets_min": 1605 }, { "epoch": 6.302588996763754, "grad_norm": 0.7852769738079134, "learning_rate": 1.203082749460085e-06, "loss": 0.1158, "loss_nan_ranks": 0, "loss_rank_avg": 0.12200696766376495, "step": 3895, "valid_targets_mean": 3838.5, "valid_targets_min": 910 }, { "epoch": 6.310679611650485, "grad_norm": 0.7287577190496319, "learning_rate": 1.1756693238839566e-06, "loss": 0.1165, "loss_nan_ranks": 0, "loss_rank_avg": 0.09417057782411575, "step": 3900, "valid_targets_mean": 3651.3, "valid_targets_min": 815 }, { "epoch": 6.318770226537217, "grad_norm": 0.8302132261220526, "learning_rate": 1.1485623696714043e-06, "loss": 0.1174, "loss_nan_ranks": 0, "loss_rank_avg": 0.11933784186840057, "step": 3905, "valid_targets_mean": 2984.4, "valid_targets_min": 419 }, { "epoch": 6.326860841423948, "grad_norm": 0.7327391037417946, "learning_rate": 1.1217623281398571e-06, "loss": 0.109, "loss_nan_ranks": 0, "loss_rank_avg": 0.10303106904029846, "step": 3910, "valid_targets_mean": 3733.2, "valid_targets_min": 2249 }, { "epoch": 6.334951456310679, "grad_norm": 0.8208833041383687, "learning_rate": 1.0952696356100234e-06, "loss": 0.1164, "loss_nan_ranks": 0, "loss_rank_avg": 0.14065951108932495, "step": 3915, "valid_targets_mean": 3564.1, "valid_targets_min": 442 }, { "epoch": 6.343042071197411, "grad_norm": 0.8332779535360231, "learning_rate": 1.069084723398781e-06, "loss": 0.1235, "loss_nan_ranks": 0, "loss_rank_avg": 0.12287405133247375, "step": 3920, "valid_targets_mean": 3350.1, "valid_targets_min": 428 }, { "epoch": 6.351132686084142, "grad_norm": 0.7407469695551226, "learning_rate": 1.0432080178121695e-06, "loss": 0.1074, "loss_nan_ranks": 0, "loss_rank_avg": 0.09893627464771271, "step": 3925, "valid_targets_mean": 3427.6, "valid_targets_min": 411 }, { "epoch": 6.359223300970874, "grad_norm": 0.6991975233530747, "learning_rate": 1.0176399401384306e-06, "loss": 0.1132, "loss_nan_ranks": 0, "loss_rank_avg": 0.11751756072044373, "step": 3930, "valid_targets_mean": 4126.1, "valid_targets_min": 1631 }, { "epoch": 6.367313915857605, "grad_norm": 0.8407713857506784, "learning_rate": 9.92380906641166e-07, "loss": 0.116, "loss_nan_ranks": 0, "loss_rank_avg": 0.12533585727214813, "step": 3935, "valid_targets_mean": 3362.1, "valid_targets_min": 483 }, { "epoch": 6.375404530744337, "grad_norm": 0.7586330784594048, "learning_rate": 9.674313285525484e-07, "loss": 0.1123, "loss_nan_ranks": 0, "loss_rank_avg": 0.09893623739480972, "step": 3940, "valid_targets_mean": 3274.6, "valid_targets_min": 439 }, { "epoch": 6.383495145631068, "grad_norm": 0.7214335052263516, "learning_rate": 9.427916120666314e-07, "loss": 0.1176, "loss_nan_ranks": 0, "loss_rank_avg": 0.1176610141992569, "step": 3945, "valid_targets_mean": 3927.4, "valid_targets_min": 953 }, { "epoch": 6.391585760517799, "grad_norm": 0.7486444334046114, "learning_rate": 9.18462158332738e-07, "loss": 0.1155, "loss_nan_ranks": 0, "loss_rank_avg": 0.11216044425964355, "step": 3950, "valid_targets_mean": 3802.6, "valid_targets_min": 1736 }, { "epoch": 6.399676375404531, "grad_norm": 0.8208321060913947, "learning_rate": 8.944433634489335e-07, "loss": 0.1234, "loss_nan_ranks": 0, "loss_rank_avg": 0.14981669187545776, "step": 3955, "valid_targets_mean": 4065.8, "valid_targets_min": 1853 }, { "epoch": 6.407766990291262, "grad_norm": 0.7055682571578344, "learning_rate": 8.707356184555626e-07, "loss": 0.1195, "loss_nan_ranks": 0, "loss_rank_avg": 0.1000659316778183, "step": 3960, "valid_targets_mean": 3765.9, "valid_targets_min": 1240 }, { "epoch": 6.415857605177994, "grad_norm": 0.7801809393232032, "learning_rate": 8.473393093288962e-07, "loss": 0.1191, "loss_nan_ranks": 0, "loss_rank_avg": 0.14615213871002197, "step": 3965, "valid_targets_mean": 3748.4, "valid_targets_min": 2320 }, { "epoch": 6.423948220064725, "grad_norm": 0.7478694444542925, "learning_rate": 8.242548169748388e-07, "loss": 0.113, "loss_nan_ranks": 0, "loss_rank_avg": 0.11330067366361618, "step": 3970, "valid_targets_mean": 3463.9, "valid_targets_min": 877 }, { "epoch": 6.432038834951456, "grad_norm": 0.8291515604455668, "learning_rate": 8.014825172227359e-07, "loss": 0.1124, "loss_nan_ranks": 0, "loss_rank_avg": 0.1242062896490097, "step": 3975, "valid_targets_mean": 2997.5, "valid_targets_min": 786 }, { "epoch": 6.440129449838188, "grad_norm": 0.7779823610215374, "learning_rate": 7.790227808192497e-07, "loss": 0.1139, "loss_nan_ranks": 0, "loss_rank_avg": 0.13047200441360474, "step": 3980, "valid_targets_mean": 3859.4, "valid_targets_min": 791 }, { "epoch": 6.448220064724919, "grad_norm": 0.7255560841829936, "learning_rate": 7.568759734223263e-07, "loss": 0.1244, "loss_nan_ranks": 0, "loss_rank_avg": 0.12434525042772293, "step": 3985, "valid_targets_mean": 4043.9, "valid_targets_min": 2429 }, { "epoch": 6.456310679611651, "grad_norm": 0.7324000370218157, "learning_rate": 7.350424555952318e-07, "loss": 0.1054, "loss_nan_ranks": 0, "loss_rank_avg": 0.08710053563117981, "step": 3990, "valid_targets_mean": 3343.6, "valid_targets_min": 451 }, { "epoch": 6.464401294498382, "grad_norm": 0.7057838956585973, "learning_rate": 7.135225828007009e-07, "loss": 0.1056, "loss_nan_ranks": 0, "loss_rank_avg": 0.12603047490119934, "step": 3995, "valid_targets_mean": 4327.1, "valid_targets_min": 2402 }, { "epoch": 6.472491909385114, "grad_norm": 0.7370428093673492, "learning_rate": 6.92316705395133e-07, "loss": 0.1066, "loss_nan_ranks": 0, "loss_rank_avg": 0.10717878490686417, "step": 4000, "valid_targets_mean": 3758.0, "valid_targets_min": 416 }, { "epoch": 6.480582524271845, "grad_norm": 0.7267237980545936, "learning_rate": 6.714251686228968e-07, "loss": 0.116, "loss_nan_ranks": 0, "loss_rank_avg": 0.11581575125455856, "step": 4005, "valid_targets_mean": 3525.8, "valid_targets_min": 473 }, { "epoch": 6.488673139158576, "grad_norm": 0.7017774925879499, "learning_rate": 6.508483126107146e-07, "loss": 0.1107, "loss_nan_ranks": 0, "loss_rank_avg": 0.09369301050901413, "step": 4010, "valid_targets_mean": 3786.3, "valid_targets_min": 1142 }, { "epoch": 6.496763754045308, "grad_norm": 0.7376578583187179, "learning_rate": 6.305864723621025e-07, "loss": 0.1202, "loss_nan_ranks": 0, "loss_rank_avg": 0.12038631737232208, "step": 4015, "valid_targets_mean": 3682.2, "valid_targets_min": 505 }, { "epoch": 6.504854368932039, "grad_norm": 0.7144299289177106, "learning_rate": 6.10639977751939e-07, "loss": 0.1222, "loss_nan_ranks": 0, "loss_rank_avg": 0.10524886101484299, "step": 4020, "valid_targets_mean": 3945.4, "valid_targets_min": 2737 }, { "epoch": 6.5129449838187705, "grad_norm": 0.7662258033033662, "learning_rate": 5.91009153521096e-07, "loss": 0.121, "loss_nan_ranks": 0, "loss_rank_avg": 0.11165094375610352, "step": 4025, "valid_targets_mean": 3897.4, "valid_targets_min": 413 }, { "epoch": 6.5210355987055015, "grad_norm": 0.785191390319755, "learning_rate": 5.716943192711277e-07, "loss": 0.1306, "loss_nan_ranks": 0, "loss_rank_avg": 0.13537812232971191, "step": 4030, "valid_targets_mean": 3815.9, "valid_targets_min": 729 }, { "epoch": 6.529126213592233, "grad_norm": 0.7320628094314221, "learning_rate": 5.526957894590923e-07, "loss": 0.1147, "loss_nan_ranks": 0, "loss_rank_avg": 0.12145470082759857, "step": 4035, "valid_targets_mean": 3545.4, "valid_targets_min": 1248 }, { "epoch": 6.5372168284789645, "grad_norm": 0.7311528372301167, "learning_rate": 5.340138733924161e-07, "loss": 0.1129, "loss_nan_ranks": 0, "loss_rank_avg": 0.10949958860874176, "step": 4040, "valid_targets_mean": 3639.9, "valid_targets_min": 624 }, { "epoch": 6.5453074433656955, "grad_norm": 0.7597891188614194, "learning_rate": 5.156488752238708e-07, "loss": 0.1165, "loss_nan_ranks": 0, "loss_rank_avg": 0.11516404151916504, "step": 4045, "valid_targets_mean": 3899.2, "valid_targets_min": 1357 }, { "epoch": 6.553398058252427, "grad_norm": 0.7310469987564887, "learning_rate": 4.976010939466136e-07, "loss": 0.1116, "loss_nan_ranks": 0, "loss_rank_avg": 0.11317206919193268, "step": 4050, "valid_targets_mean": 3734.9, "valid_targets_min": 502 }, { "epoch": 6.561488673139158, "grad_norm": 0.8474280332116642, "learning_rate": 4.798708233893168e-07, "loss": 0.1282, "loss_nan_ranks": 0, "loss_rank_avg": 0.1260000318288803, "step": 4055, "valid_targets_mean": 2874.1, "valid_targets_min": 410 }, { "epoch": 6.56957928802589, "grad_norm": 0.7565848227122396, "learning_rate": 4.624583522113879e-07, "loss": 0.1138, "loss_nan_ranks": 0, "loss_rank_avg": 0.11290078610181808, "step": 4060, "valid_targets_mean": 3216.5, "valid_targets_min": 460 }, { "epoch": 6.577669902912621, "grad_norm": 0.7190620351644219, "learning_rate": 4.4536396389827986e-07, "loss": 0.1113, "loss_nan_ranks": 0, "loss_rank_avg": 0.12443754076957703, "step": 4065, "valid_targets_mean": 3827.2, "valid_targets_min": 445 }, { "epoch": 6.585760517799352, "grad_norm": 0.7681106155104229, "learning_rate": 4.285879367568546e-07, "loss": 0.1051, "loss_nan_ranks": 0, "loss_rank_avg": 0.09754884243011475, "step": 4070, "valid_targets_mean": 3443.1, "valid_targets_min": 468 }, { "epoch": 6.593851132686084, "grad_norm": 0.7045013465157438, "learning_rate": 4.1213054391086914e-07, "loss": 0.1198, "loss_nan_ranks": 0, "loss_rank_avg": 0.11584879457950592, "step": 4075, "valid_targets_mean": 4158.1, "valid_targets_min": 1562 }, { "epoch": 6.601941747572815, "grad_norm": 0.711241502567802, "learning_rate": 3.959920532965278e-07, "loss": 0.1092, "loss_nan_ranks": 0, "loss_rank_avg": 0.09637920558452606, "step": 4080, "valid_targets_mean": 3688.4, "valid_targets_min": 390 }, { "epoch": 6.610032362459547, "grad_norm": 0.7548140115130028, "learning_rate": 3.8017272765810795e-07, "loss": 0.1053, "loss_nan_ranks": 0, "loss_rank_avg": 0.10875862836837769, "step": 4085, "valid_targets_mean": 3557.0, "valid_targets_min": 1169 }, { "epoch": 6.618122977346278, "grad_norm": 0.7476845196613187, "learning_rate": 3.646728245436926e-07, "loss": 0.1052, "loss_nan_ranks": 0, "loss_rank_avg": 0.09515687823295593, "step": 4090, "valid_targets_mean": 3448.2, "valid_targets_min": 459 }, { "epoch": 6.62621359223301, "grad_norm": 0.6760149991841168, "learning_rate": 3.4949259630097985e-07, "loss": 0.11, "loss_nan_ranks": 0, "loss_rank_avg": 0.09844258427619934, "step": 4095, "valid_targets_mean": 4119.4, "valid_targets_min": 1825 }, { "epoch": 6.634304207119741, "grad_norm": 0.7450570767921598, "learning_rate": 3.346322900731602e-07, "loss": 0.122, "loss_nan_ranks": 0, "loss_rank_avg": 0.112000972032547, "step": 4100, "valid_targets_mean": 3919.7, "valid_targets_min": 599 }, { "epoch": 6.642394822006472, "grad_norm": 0.7870969672189868, "learning_rate": 3.2009214779491703e-07, "loss": 0.123, "loss_nan_ranks": 0, "loss_rank_avg": 0.12304633855819702, "step": 4105, "valid_targets_mean": 3315.8, "valid_targets_min": 672 }, { "epoch": 6.650485436893204, "grad_norm": 0.7864861620237504, "learning_rate": 3.0587240618845437e-07, "loss": 0.1185, "loss_nan_ranks": 0, "loss_rank_avg": 0.12119387090206146, "step": 4110, "valid_targets_mean": 3842.4, "valid_targets_min": 1747 }, { "epoch": 6.658576051779935, "grad_norm": 0.7593935726615797, "learning_rate": 2.9197329675967556e-07, "loss": 0.1099, "loss_nan_ranks": 0, "loss_rank_avg": 0.11751753836870193, "step": 4115, "valid_targets_mean": 3600.8, "valid_targets_min": 443 }, { "epoch": 6.666666666666667, "grad_norm": 0.7668039686269429, "learning_rate": 2.7839504579439734e-07, "loss": 0.1147, "loss_nan_ranks": 0, "loss_rank_avg": 0.11438554525375366, "step": 4120, "valid_targets_mean": 3635.9, "valid_targets_min": 1920 }, { "epoch": 6.674757281553398, "grad_norm": 0.7321055225681964, "learning_rate": 2.651378743546662e-07, "loss": 0.1184, "loss_nan_ranks": 0, "loss_rank_avg": 0.09255105257034302, "step": 4125, "valid_targets_mean": 3288.8, "valid_targets_min": 459 }, { "epoch": 6.68284789644013, "grad_norm": 0.769844001201492, "learning_rate": 2.5220199827516335e-07, "loss": 0.1177, "loss_nan_ranks": 0, "loss_rank_avg": 0.11600494384765625, "step": 4130, "valid_targets_mean": 3590.6, "valid_targets_min": 828 }, { "epoch": 6.690938511326861, "grad_norm": 0.7654676282072668, "learning_rate": 2.395876281596898e-07, "loss": 0.1128, "loss_nan_ranks": 0, "loss_rank_avg": 0.11756563186645508, "step": 4135, "valid_targets_mean": 3544.8, "valid_targets_min": 433 }, { "epoch": 6.699029126213592, "grad_norm": 0.7222893887701092, "learning_rate": 2.2729496937773375e-07, "loss": 0.1036, "loss_nan_ranks": 0, "loss_rank_avg": 0.10802868008613586, "step": 4140, "valid_targets_mean": 4240.8, "valid_targets_min": 1119 }, { "epoch": 6.707119741100324, "grad_norm": 0.6656401401793538, "learning_rate": 2.1532422206113957e-07, "loss": 0.1119, "loss_nan_ranks": 0, "loss_rank_avg": 0.10636568814516068, "step": 4145, "valid_targets_mean": 4059.1, "valid_targets_min": 1253 }, { "epoch": 6.715210355987055, "grad_norm": 0.7023584062905446, "learning_rate": 2.036755811008284e-07, "loss": 0.1132, "loss_nan_ranks": 0, "loss_rank_avg": 0.10692491382360458, "step": 4150, "valid_targets_mean": 4141.0, "valid_targets_min": 1538 }, { "epoch": 6.723300970873787, "grad_norm": 0.7815100848686617, "learning_rate": 1.9234923614364298e-07, "loss": 0.1167, "loss_nan_ranks": 0, "loss_rank_avg": 0.12436103820800781, "step": 4155, "valid_targets_mean": 3200.8, "valid_targets_min": 443 }, { "epoch": 6.731391585760518, "grad_norm": 0.7383871231544672, "learning_rate": 1.813453715892588e-07, "loss": 0.1091, "loss_nan_ranks": 0, "loss_rank_avg": 0.1116761788725853, "step": 4160, "valid_targets_mean": 3907.4, "valid_targets_min": 1241 }, { "epoch": 6.739482200647249, "grad_norm": 0.8179783335491289, "learning_rate": 1.706641665871689e-07, "loss": 0.1257, "loss_nan_ranks": 0, "loss_rank_avg": 0.14059647917747498, "step": 4165, "valid_targets_mean": 4028.5, "valid_targets_min": 950 }, { "epoch": 6.747572815533981, "grad_norm": 0.778583312094626, "learning_rate": 1.603057950337794e-07, "loss": 0.125, "loss_nan_ranks": 0, "loss_rank_avg": 0.11424525082111359, "step": 4170, "valid_targets_mean": 3257.9, "valid_targets_min": 435 }, { "epoch": 6.755663430420712, "grad_norm": 0.7483501823341687, "learning_rate": 1.5027042556958083e-07, "loss": 0.113, "loss_nan_ranks": 0, "loss_rank_avg": 0.11524796485900879, "step": 4175, "valid_targets_mean": 3492.9, "valid_targets_min": 1974 }, { "epoch": 6.763754045307444, "grad_norm": 0.7262116629208208, "learning_rate": 1.4055822157638566e-07, "loss": 0.1057, "loss_nan_ranks": 0, "loss_rank_avg": 0.1036527007818222, "step": 4180, "valid_targets_mean": 3663.7, "valid_targets_min": 1761 }, { "epoch": 6.771844660194175, "grad_norm": 0.8294870662688552, "learning_rate": 1.3116934117468617e-07, "loss": 0.1134, "loss_nan_ranks": 0, "loss_rank_avg": 0.13269130885601044, "step": 4185, "valid_targets_mean": 3551.8, "valid_targets_min": 515 }, { "epoch": 6.779935275080906, "grad_norm": 0.7952419125548885, "learning_rate": 1.2210393722106973e-07, "loss": 0.1163, "loss_nan_ranks": 0, "loss_rank_avg": 0.1315314769744873, "step": 4190, "valid_targets_mean": 3879.2, "valid_targets_min": 418 }, { "epoch": 6.788025889967638, "grad_norm": 0.7813021917376338, "learning_rate": 1.1336215730573863e-07, "loss": 0.1227, "loss_nan_ranks": 0, "loss_rank_avg": 0.12635990977287292, "step": 4195, "valid_targets_mean": 3937.9, "valid_targets_min": 719 }, { "epoch": 6.796116504854369, "grad_norm": 0.7753053311834444, "learning_rate": 1.0494414375009642e-07, "loss": 0.1155, "loss_nan_ranks": 0, "loss_rank_avg": 0.11267022788524628, "step": 4200, "valid_targets_mean": 3228.6, "valid_targets_min": 505 }, { "epoch": 6.8042071197411005, "grad_norm": 0.7121555430743358, "learning_rate": 9.68500336044409e-08, "loss": 0.1121, "loss_nan_ranks": 0, "loss_rank_avg": 0.0996587723493576, "step": 4205, "valid_targets_mean": 3622.3, "valid_targets_min": 1215 }, { "epoch": 6.8122977346278315, "grad_norm": 0.7164530066965938, "learning_rate": 8.907995864572583e-08, "loss": 0.1141, "loss_nan_ranks": 0, "loss_rank_avg": 0.11022158712148666, "step": 4210, "valid_targets_mean": 3876.0, "valid_targets_min": 423 }, { "epoch": 6.820388349514563, "grad_norm": 0.6698497069366108, "learning_rate": 8.16340453754183e-08, "loss": 0.1245, "loss_nan_ranks": 0, "loss_rank_avg": 0.11347459256649017, "step": 4215, "valid_targets_mean": 4525.3, "valid_targets_min": 1506 }, { "epoch": 6.828478964401294, "grad_norm": 0.6864775791788594, "learning_rate": 7.451241501744255e-08, "loss": 0.1046, "loss_nan_ranks": 0, "loss_rank_avg": 0.09482621401548386, "step": 4220, "valid_targets_mean": 3799.6, "valid_targets_min": 463 }, { "epoch": 6.836569579288026, "grad_norm": 0.752535267660768, "learning_rate": 6.771518351619932e-08, "loss": 0.1182, "loss_nan_ranks": 0, "loss_rank_avg": 0.11658801138401031, "step": 4225, "valid_targets_mean": 4117.6, "valid_targets_min": 442 }, { "epoch": 6.844660194174757, "grad_norm": 0.7713882605978399, "learning_rate": 6.124246153468516e-08, "loss": 0.1156, "loss_nan_ranks": 0, "loss_rank_avg": 0.12442426383495331, "step": 4230, "valid_targets_mean": 3770.4, "valid_targets_min": 650 }, { "epoch": 6.852750809061488, "grad_norm": 0.7068637325141903, "learning_rate": 5.5094354452684964e-08, "loss": 0.1158, "loss_nan_ranks": 0, "loss_rank_avg": 0.11987002193927765, "step": 4235, "valid_targets_mean": 3828.8, "valid_targets_min": 1076 }, { "epoch": 6.86084142394822, "grad_norm": 0.8714684323249712, "learning_rate": 4.927096236505779e-08, "loss": 0.1145, "loss_nan_ranks": 0, "loss_rank_avg": 0.1273711919784546, "step": 4240, "valid_targets_mean": 3429.4, "valid_targets_min": 721 }, { "epoch": 6.868932038834951, "grad_norm": 0.7973774333149717, "learning_rate": 4.3772380080111534e-08, "loss": 0.1187, "loss_nan_ranks": 0, "loss_rank_avg": 0.120909184217453, "step": 4245, "valid_targets_mean": 3205.2, "valid_targets_min": 524 }, { "epoch": 6.877022653721683, "grad_norm": 0.7932995409173373, "learning_rate": 3.85986971180552e-08, "loss": 0.1141, "loss_nan_ranks": 0, "loss_rank_avg": 0.11187095940113068, "step": 4250, "valid_targets_mean": 3380.6, "valid_targets_min": 910 }, { "epoch": 6.885113268608414, "grad_norm": 0.8134749447064917, "learning_rate": 3.374999770954013e-08, "loss": 0.1171, "loss_nan_ranks": 0, "loss_rank_avg": 0.132695734500885, "step": 4255, "valid_targets_mean": 3588.1, "valid_targets_min": 497 }, { "epoch": 6.893203883495145, "grad_norm": 0.7963874900596022, "learning_rate": 2.9226360794296638e-08, "loss": 0.1208, "loss_nan_ranks": 0, "loss_rank_avg": 0.14102879166603088, "step": 4260, "valid_targets_mean": 3959.9, "valid_targets_min": 909 }, { "epoch": 6.901294498381877, "grad_norm": 0.7062095481538098, "learning_rate": 2.502786001983726e-08, "loss": 0.1134, "loss_nan_ranks": 0, "loss_rank_avg": 0.106046661734581, "step": 4265, "valid_targets_mean": 3602.3, "valid_targets_min": 1241 }, { "epoch": 6.909385113268608, "grad_norm": 0.7013180525553683, "learning_rate": 2.1154563740266588e-08, "loss": 0.1251, "loss_nan_ranks": 0, "loss_rank_avg": 0.11417189240455627, "step": 4270, "valid_targets_mean": 3765.8, "valid_targets_min": 1292 }, { "epoch": 6.91747572815534, "grad_norm": 0.7261543939015853, "learning_rate": 1.7606535015164405e-08, "loss": 0.1156, "loss_nan_ranks": 0, "loss_rank_avg": 0.0980582907795906, "step": 4275, "valid_targets_mean": 3846.7, "valid_targets_min": 801 }, { "epoch": 6.925566343042071, "grad_norm": 0.7465722632159841, "learning_rate": 1.4383831608562048e-08, "loss": 0.1081, "loss_nan_ranks": 0, "loss_rank_avg": 0.12335227429866791, "step": 4280, "valid_targets_mean": 3942.1, "valid_targets_min": 701 }, { "epoch": 6.933656957928802, "grad_norm": 0.6729429573207937, "learning_rate": 1.14865059879965e-08, "loss": 0.1065, "loss_nan_ranks": 0, "loss_rank_avg": 0.10008923709392548, "step": 4285, "valid_targets_mean": 4052.6, "valid_targets_min": 1449 }, { "epoch": 6.941747572815534, "grad_norm": 0.7904605212036413, "learning_rate": 8.914605323664394e-09, "loss": 0.1101, "loss_nan_ranks": 0, "loss_rank_avg": 0.11163502931594849, "step": 4290, "valid_targets_mean": 3616.7, "valid_targets_min": 1563 }, { "epoch": 6.949838187702265, "grad_norm": 0.7795168919241651, "learning_rate": 6.66817148764487e-09, "loss": 0.1202, "loss_nan_ranks": 0, "loss_rank_avg": 0.13894109427928925, "step": 4295, "valid_targets_mean": 3961.6, "valid_targets_min": 595 }, { "epoch": 6.957928802588997, "grad_norm": 0.6999769879445384, "learning_rate": 4.7472410532245495e-09, "loss": 0.115, "loss_nan_ranks": 0, "loss_rank_avg": 0.10274814814329147, "step": 4300, "valid_targets_mean": 3830.3, "valid_targets_min": 1634 }, { "epoch": 6.966019417475728, "grad_norm": 1.0280666868305712, "learning_rate": 3.151845294302458e-09, "loss": 0.1202, "loss_nan_ranks": 0, "loss_rank_avg": 0.09658776223659515, "step": 4305, "valid_targets_mean": 3119.4, "valid_targets_min": 443 }, { "epoch": 6.97411003236246, "grad_norm": 0.6709657407395602, "learning_rate": 1.882010184874883e-09, "loss": 0.1099, "loss_nan_ranks": 0, "loss_rank_avg": 0.08560613542795181, "step": 4310, "valid_targets_mean": 3504.5, "valid_targets_min": 433 }, { "epoch": 6.982200647249191, "grad_norm": 0.7173680419597602, "learning_rate": 9.377563986157078e-10, "loss": 0.1075, "loss_nan_ranks": 0, "loss_rank_avg": 0.11601495742797852, "step": 4315, "valid_targets_mean": 3960.2, "valid_targets_min": 2203 }, { "epoch": 6.990291262135923, "grad_norm": 0.7570102861156914, "learning_rate": 3.1909930854112646e-10, "loss": 0.1084, "loss_nan_ranks": 0, "loss_rank_avg": 0.10227625072002411, "step": 4320, "valid_targets_mean": 3076.0, "valid_targets_min": 1004 }, { "epoch": 6.998381877022654, "grad_norm": 0.7093115701651048, "learning_rate": 2.6048986760951466e-11, "loss": 0.1137, "loss_nan_ranks": 0, "loss_rank_avg": 0.11005377024412155, "step": 4325, "valid_targets_mean": 3910.6, "valid_targets_min": 1792 }, { "epoch": 7.0, "loss_nan_ranks": 0, "loss_rank_avg": 0.11569061130285263, "step": 4326, "total_flos": 1582790264291328.0, "train_loss": 0.19078887684569554, "train_runtime": 21380.015, "train_samples_per_second": 3.236, "train_steps_per_second": 0.202, "valid_targets_mean": 2886.1, "valid_targets_min": 416 } ], "logging_steps": 5, "max_steps": 4326, "num_input_tokens_seen": 0, "num_train_epochs": 7, "save_steps": 1500, "stateful_callbacks": { "TrainerControl": { "args": { "should_epoch_stop": false, "should_evaluate": false, "should_log": false, "should_save": true, "should_training_stop": true }, "attributes": {} } }, "total_flos": 1582790264291328.0, "train_batch_size": 1, "trial_name": null, "trial_params": null }