{ "best_global_step": null, "best_metric": null, "best_model_checkpoint": null, "epoch": 5.0, "eval_steps": 500, "global_step": 5210, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.0048, "grad_norm": 9.841835067235065, "learning_rate": 3.071017274472169e-07, "loss": 0.4918, "loss_nan_ranks": 0, "loss_rank_avg": 0.17842981219291687, "step": 5, "valid_targets_mean": 9620.0, "valid_targets_min": 4054 }, { "epoch": 0.0096, "grad_norm": 9.037327151868297, "learning_rate": 6.909788867562381e-07, "loss": 0.4922, "loss_nan_ranks": 0, "loss_rank_avg": 0.15718884766101837, "step": 10, "valid_targets_mean": 8666.8, "valid_targets_min": 2206 }, { "epoch": 0.0144, "grad_norm": 6.033909463391279, "learning_rate": 1.074856046065259e-06, "loss": 0.4709, "loss_nan_ranks": 0, "loss_rank_avg": 0.15585705637931824, "step": 15, "valid_targets_mean": 8733.8, "valid_targets_min": 4350 }, { "epoch": 0.0192, "grad_norm": 3.2861111342090337, "learning_rate": 1.4587332053742803e-06, "loss": 0.4312, "loss_nan_ranks": 0, "loss_rank_avg": 0.14734426140785217, "step": 20, "valid_targets_mean": 7922.4, "valid_targets_min": 1729 }, { "epoch": 0.024, "grad_norm": 1.6258530010888506, "learning_rate": 1.8426103646833015e-06, "loss": 0.3988, "loss_nan_ranks": 0, "loss_rank_avg": 0.13337181508541107, "step": 25, "valid_targets_mean": 9515.2, "valid_targets_min": 1791 }, { "epoch": 0.0288, "grad_norm": 1.1794986084798527, "learning_rate": 2.2264875239923228e-06, "loss": 0.378, "loss_nan_ranks": 0, "loss_rank_avg": 0.11573775112628937, "step": 30, "valid_targets_mean": 8802.9, "valid_targets_min": 2606 }, { "epoch": 0.0336, "grad_norm": 0.7048103409679258, "learning_rate": 2.6103646833013433e-06, "loss": 0.3459, "loss_nan_ranks": 0, "loss_rank_avg": 0.10993142426013947, "step": 35, "valid_targets_mean": 8278.6, "valid_targets_min": 740 }, { "epoch": 0.0384, "grad_norm": 0.5264062159110527, "learning_rate": 2.9942418426103648e-06, "loss": 0.3263, "loss_nan_ranks": 0, "loss_rank_avg": 0.10869134962558746, "step": 40, "valid_targets_mean": 8495.2, "valid_targets_min": 2561 }, { "epoch": 0.0432, "grad_norm": 0.4514711080116693, "learning_rate": 3.378119001919386e-06, "loss": 0.3041, "loss_nan_ranks": 0, "loss_rank_avg": 0.09915158152580261, "step": 45, "valid_targets_mean": 9248.5, "valid_targets_min": 2873 }, { "epoch": 0.048, "grad_norm": 0.3420802729257966, "learning_rate": 3.761996161228407e-06, "loss": 0.2802, "loss_nan_ranks": 0, "loss_rank_avg": 0.09442837536334991, "step": 50, "valid_targets_mean": 9355.0, "valid_targets_min": 1269 }, { "epoch": 0.0528, "grad_norm": 0.28683988209383904, "learning_rate": 4.145873320537428e-06, "loss": 0.2672, "loss_nan_ranks": 0, "loss_rank_avg": 0.08352220058441162, "step": 55, "valid_targets_mean": 8734.5, "valid_targets_min": 3777 }, { "epoch": 0.0576, "grad_norm": 0.23737129343553093, "learning_rate": 4.52975047984645e-06, "loss": 0.2437, "loss_nan_ranks": 0, "loss_rank_avg": 0.08115425705909729, "step": 60, "valid_targets_mean": 9034.8, "valid_targets_min": 3693 }, { "epoch": 0.0624, "grad_norm": 0.19876401961795503, "learning_rate": 4.91362763915547e-06, "loss": 0.2241, "loss_nan_ranks": 0, "loss_rank_avg": 0.07270577549934387, "step": 65, "valid_targets_mean": 8782.1, "valid_targets_min": 4980 }, { "epoch": 0.0672, "grad_norm": 0.18075045396174094, "learning_rate": 5.297504798464492e-06, "loss": 0.2153, "loss_nan_ranks": 0, "loss_rank_avg": 0.06922709941864014, "step": 70, "valid_targets_mean": 9367.7, "valid_targets_min": 3471 }, { "epoch": 0.072, "grad_norm": 0.16424216569165836, "learning_rate": 5.681381957773513e-06, "loss": 0.2064, "loss_nan_ranks": 0, "loss_rank_avg": 0.07363235950469971, "step": 75, "valid_targets_mean": 9389.4, "valid_targets_min": 4957 }, { "epoch": 0.0768, "grad_norm": 0.17072015557944906, "learning_rate": 6.065259117082534e-06, "loss": 0.2044, "loss_nan_ranks": 0, "loss_rank_avg": 0.06568406522274017, "step": 80, "valid_targets_mean": 8954.7, "valid_targets_min": 2729 }, { "epoch": 0.0816, "grad_norm": 0.16204494202483938, "learning_rate": 6.449136276391556e-06, "loss": 0.1978, "loss_nan_ranks": 0, "loss_rank_avg": 0.06659156829118729, "step": 85, "valid_targets_mean": 8714.0, "valid_targets_min": 3139 }, { "epoch": 0.0864, "grad_norm": 0.16165159991381337, "learning_rate": 6.833013435700576e-06, "loss": 0.1898, "loss_nan_ranks": 0, "loss_rank_avg": 0.05660694092512131, "step": 90, "valid_targets_mean": 8498.3, "valid_targets_min": 2404 }, { "epoch": 0.0912, "grad_norm": 0.1560247037025123, "learning_rate": 7.216890595009598e-06, "loss": 0.1888, "loss_nan_ranks": 0, "loss_rank_avg": 0.06358037143945694, "step": 95, "valid_targets_mean": 8950.7, "valid_targets_min": 3809 }, { "epoch": 0.096, "grad_norm": 0.1616062884997598, "learning_rate": 7.600767754318619e-06, "loss": 0.1875, "loss_nan_ranks": 0, "loss_rank_avg": 0.06089777871966362, "step": 100, "valid_targets_mean": 9242.6, "valid_targets_min": 5629 }, { "epoch": 0.1008, "grad_norm": 0.19586837078411862, "learning_rate": 7.98464491362764e-06, "loss": 0.1846, "loss_nan_ranks": 0, "loss_rank_avg": 0.06420055031776428, "step": 105, "valid_targets_mean": 8664.1, "valid_targets_min": 4408 }, { "epoch": 0.1056, "grad_norm": 0.16113724556095765, "learning_rate": 8.368522072936662e-06, "loss": 0.177, "loss_nan_ranks": 0, "loss_rank_avg": 0.06036144495010376, "step": 110, "valid_targets_mean": 8733.9, "valid_targets_min": 1577 }, { "epoch": 0.1104, "grad_norm": 0.16110423128629503, "learning_rate": 8.752399232245682e-06, "loss": 0.1779, "loss_nan_ranks": 0, "loss_rank_avg": 0.06447982788085938, "step": 115, "valid_targets_mean": 9054.4, "valid_targets_min": 3944 }, { "epoch": 0.1152, "grad_norm": 0.176566106291253, "learning_rate": 9.136276391554704e-06, "loss": 0.1761, "loss_nan_ranks": 0, "loss_rank_avg": 0.062302470207214355, "step": 120, "valid_targets_mean": 9205.4, "valid_targets_min": 1719 }, { "epoch": 0.12, "grad_norm": 0.17059615182231894, "learning_rate": 9.520153550863724e-06, "loss": 0.1729, "loss_nan_ranks": 0, "loss_rank_avg": 0.058050885796546936, "step": 125, "valid_targets_mean": 8502.4, "valid_targets_min": 3732 }, { "epoch": 0.1248, "grad_norm": 0.17066809947335904, "learning_rate": 9.904030710172746e-06, "loss": 0.1705, "loss_nan_ranks": 0, "loss_rank_avg": 0.05489126592874527, "step": 130, "valid_targets_mean": 7924.6, "valid_targets_min": 2935 }, { "epoch": 0.1296, "grad_norm": 0.17976768953493777, "learning_rate": 1.0287907869481766e-05, "loss": 0.1666, "loss_nan_ranks": 0, "loss_rank_avg": 0.06662755459547043, "step": 135, "valid_targets_mean": 9386.0, "valid_targets_min": 6181 }, { "epoch": 0.1344, "grad_norm": 0.16878851071563028, "learning_rate": 1.067178502879079e-05, "loss": 0.164, "loss_nan_ranks": 0, "loss_rank_avg": 0.05300961434841156, "step": 140, "valid_targets_mean": 8530.2, "valid_targets_min": 4057 }, { "epoch": 0.1392, "grad_norm": 0.18017955223205775, "learning_rate": 1.105566218809981e-05, "loss": 0.1644, "loss_nan_ranks": 0, "loss_rank_avg": 0.052747681736946106, "step": 145, "valid_targets_mean": 8150.8, "valid_targets_min": 1979 }, { "epoch": 0.144, "grad_norm": 0.17011201848682178, "learning_rate": 1.143953934740883e-05, "loss": 0.1666, "loss_nan_ranks": 0, "loss_rank_avg": 0.053786564618349075, "step": 150, "valid_targets_mean": 9036.5, "valid_targets_min": 1344 }, { "epoch": 0.1488, "grad_norm": 0.14948621014727742, "learning_rate": 1.182341650671785e-05, "loss": 0.1655, "loss_nan_ranks": 0, "loss_rank_avg": 0.04889284819364548, "step": 155, "valid_targets_mean": 9374.1, "valid_targets_min": 5222 }, { "epoch": 0.1536, "grad_norm": 0.17837038997047153, "learning_rate": 1.2207293666026872e-05, "loss": 0.1592, "loss_nan_ranks": 0, "loss_rank_avg": 0.05337853729724884, "step": 160, "valid_targets_mean": 9026.4, "valid_targets_min": 941 }, { "epoch": 0.1584, "grad_norm": 0.16794019625060191, "learning_rate": 1.2591170825335894e-05, "loss": 0.1615, "loss_nan_ranks": 0, "loss_rank_avg": 0.0580047108232975, "step": 165, "valid_targets_mean": 8909.0, "valid_targets_min": 4147 }, { "epoch": 0.1632, "grad_norm": 0.16451121852700687, "learning_rate": 1.2975047984644915e-05, "loss": 0.1615, "loss_nan_ranks": 0, "loss_rank_avg": 0.05628425255417824, "step": 170, "valid_targets_mean": 9237.3, "valid_targets_min": 2879 }, { "epoch": 0.168, "grad_norm": 0.1620845277038851, "learning_rate": 1.3358925143953936e-05, "loss": 0.1599, "loss_nan_ranks": 0, "loss_rank_avg": 0.05485953390598297, "step": 175, "valid_targets_mean": 8967.8, "valid_targets_min": 1950 }, { "epoch": 0.1728, "grad_norm": 0.18552111008573974, "learning_rate": 1.3742802303262956e-05, "loss": 0.1567, "loss_nan_ranks": 0, "loss_rank_avg": 0.05156928300857544, "step": 180, "valid_targets_mean": 8037.1, "valid_targets_min": 3591 }, { "epoch": 0.1776, "grad_norm": 0.1834362128640418, "learning_rate": 1.4126679462571978e-05, "loss": 0.1558, "loss_nan_ranks": 0, "loss_rank_avg": 0.05930773541331291, "step": 185, "valid_targets_mean": 8785.6, "valid_targets_min": 2286 }, { "epoch": 0.1824, "grad_norm": 0.7040750475552785, "learning_rate": 1.4510556621881e-05, "loss": 0.155, "loss_nan_ranks": 0, "loss_rank_avg": 0.05356145650148392, "step": 190, "valid_targets_mean": 8743.2, "valid_targets_min": 3331 }, { "epoch": 0.1872, "grad_norm": 0.17845848988906052, "learning_rate": 1.4894433781190021e-05, "loss": 0.1566, "loss_nan_ranks": 0, "loss_rank_avg": 0.050542086362838745, "step": 195, "valid_targets_mean": 8117.4, "valid_targets_min": 2982 }, { "epoch": 0.192, "grad_norm": 0.1646793822772226, "learning_rate": 1.527831094049904e-05, "loss": 0.1529, "loss_nan_ranks": 0, "loss_rank_avg": 0.05630158260464668, "step": 200, "valid_targets_mean": 9397.2, "valid_targets_min": 3908 }, { "epoch": 0.1968, "grad_norm": 0.1653369285434222, "learning_rate": 1.566218809980806e-05, "loss": 0.1555, "loss_nan_ranks": 0, "loss_rank_avg": 0.05802737921476364, "step": 205, "valid_targets_mean": 9779.3, "valid_targets_min": 2867 }, { "epoch": 0.2016, "grad_norm": 0.17699392141610665, "learning_rate": 1.6046065259117082e-05, "loss": 0.1578, "loss_nan_ranks": 0, "loss_rank_avg": 0.05261120945215225, "step": 210, "valid_targets_mean": 8929.7, "valid_targets_min": 3230 }, { "epoch": 0.2064, "grad_norm": 0.15546901424567497, "learning_rate": 1.6429942418426105e-05, "loss": 0.1519, "loss_nan_ranks": 0, "loss_rank_avg": 0.0501735582947731, "step": 215, "valid_targets_mean": 9803.3, "valid_targets_min": 4354 }, { "epoch": 0.2112, "grad_norm": 0.1647739852350217, "learning_rate": 1.6813819577735126e-05, "loss": 0.1518, "loss_nan_ranks": 0, "loss_rank_avg": 0.05220291018486023, "step": 220, "valid_targets_mean": 8609.9, "valid_targets_min": 1686 }, { "epoch": 0.216, "grad_norm": 0.18923635383897736, "learning_rate": 1.7197696737044146e-05, "loss": 0.1524, "loss_nan_ranks": 0, "loss_rank_avg": 0.05251702666282654, "step": 225, "valid_targets_mean": 9155.3, "valid_targets_min": 2869 }, { "epoch": 0.2208, "grad_norm": 0.17077125348550806, "learning_rate": 1.758157389635317e-05, "loss": 0.1497, "loss_nan_ranks": 0, "loss_rank_avg": 0.04130622744560242, "step": 230, "valid_targets_mean": 8067.4, "valid_targets_min": 1355 }, { "epoch": 0.2256, "grad_norm": 0.16749430547993427, "learning_rate": 1.796545105566219e-05, "loss": 0.1531, "loss_nan_ranks": 0, "loss_rank_avg": 0.046884313225746155, "step": 235, "valid_targets_mean": 8949.4, "valid_targets_min": 5015 }, { "epoch": 0.2304, "grad_norm": 0.1686236778589441, "learning_rate": 1.8349328214971213e-05, "loss": 0.1519, "loss_nan_ranks": 0, "loss_rank_avg": 0.04728979989886284, "step": 240, "valid_targets_mean": 8402.7, "valid_targets_min": 2024 }, { "epoch": 0.2352, "grad_norm": 0.17340081794047488, "learning_rate": 1.8733205374280233e-05, "loss": 0.1483, "loss_nan_ranks": 0, "loss_rank_avg": 0.04933461174368858, "step": 245, "valid_targets_mean": 9134.0, "valid_targets_min": 2863 }, { "epoch": 0.24, "grad_norm": 0.18643553683889033, "learning_rate": 1.9117082533589253e-05, "loss": 0.1517, "loss_nan_ranks": 0, "loss_rank_avg": 0.05289412662386894, "step": 250, "valid_targets_mean": 9414.7, "valid_targets_min": 2948 }, { "epoch": 0.2448, "grad_norm": 0.16686892259142147, "learning_rate": 1.9500959692898273e-05, "loss": 0.1508, "loss_nan_ranks": 0, "loss_rank_avg": 0.0571310892701149, "step": 255, "valid_targets_mean": 9362.2, "valid_targets_min": 1413 }, { "epoch": 0.2496, "grad_norm": 0.16428543489008277, "learning_rate": 1.9884836852207294e-05, "loss": 0.1503, "loss_nan_ranks": 0, "loss_rank_avg": 0.04735701531171799, "step": 260, "valid_targets_mean": 8750.2, "valid_targets_min": 4447 }, { "epoch": 0.2544, "grad_norm": 0.1713855287966125, "learning_rate": 2.0268714011516314e-05, "loss": 0.1467, "loss_nan_ranks": 0, "loss_rank_avg": 0.04655732959508896, "step": 265, "valid_targets_mean": 8087.2, "valid_targets_min": 2311 }, { "epoch": 0.2592, "grad_norm": 0.16600507062294687, "learning_rate": 2.0652591170825337e-05, "loss": 0.1465, "loss_nan_ranks": 0, "loss_rank_avg": 0.04228595644235611, "step": 270, "valid_targets_mean": 8538.3, "valid_targets_min": 3618 }, { "epoch": 0.264, "grad_norm": 0.16203412094758496, "learning_rate": 2.103646833013436e-05, "loss": 0.1431, "loss_nan_ranks": 0, "loss_rank_avg": 0.04873499274253845, "step": 275, "valid_targets_mean": 8714.5, "valid_targets_min": 2308 }, { "epoch": 0.2688, "grad_norm": 0.16232368985693238, "learning_rate": 2.142034548944338e-05, "loss": 0.1448, "loss_nan_ranks": 0, "loss_rank_avg": 0.04977979511022568, "step": 280, "valid_targets_mean": 7793.4, "valid_targets_min": 2243 }, { "epoch": 0.2736, "grad_norm": 0.16963787072822398, "learning_rate": 2.18042226487524e-05, "loss": 0.1444, "loss_nan_ranks": 0, "loss_rank_avg": 0.04747937619686127, "step": 285, "valid_targets_mean": 8890.7, "valid_targets_min": 3910 }, { "epoch": 0.2784, "grad_norm": 0.15596812207408062, "learning_rate": 2.218809980806142e-05, "loss": 0.1428, "loss_nan_ranks": 0, "loss_rank_avg": 0.04897751659154892, "step": 290, "valid_targets_mean": 8705.1, "valid_targets_min": 2007 }, { "epoch": 0.2832, "grad_norm": 0.17698628792600066, "learning_rate": 2.2571976967370445e-05, "loss": 0.1456, "loss_nan_ranks": 0, "loss_rank_avg": 0.04906153678894043, "step": 295, "valid_targets_mean": 8524.2, "valid_targets_min": 2711 }, { "epoch": 0.288, "grad_norm": 0.15226044506219266, "learning_rate": 2.2955854126679465e-05, "loss": 0.1443, "loss_nan_ranks": 0, "loss_rank_avg": 0.04470205307006836, "step": 300, "valid_targets_mean": 9084.5, "valid_targets_min": 4514 }, { "epoch": 0.2928, "grad_norm": 0.1631758341391722, "learning_rate": 2.3339731285988485e-05, "loss": 0.1426, "loss_nan_ranks": 0, "loss_rank_avg": 0.0455140583217144, "step": 305, "valid_targets_mean": 8223.5, "valid_targets_min": 2624 }, { "epoch": 0.2976, "grad_norm": 0.16266001506773634, "learning_rate": 2.372360844529751e-05, "loss": 0.1407, "loss_nan_ranks": 0, "loss_rank_avg": 0.04833702743053436, "step": 310, "valid_targets_mean": 9030.3, "valid_targets_min": 2595 }, { "epoch": 0.3024, "grad_norm": 0.1552003389279275, "learning_rate": 2.4107485604606525e-05, "loss": 0.1418, "loss_nan_ranks": 0, "loss_rank_avg": 0.04400190711021423, "step": 315, "valid_targets_mean": 8977.0, "valid_targets_min": 3447 }, { "epoch": 0.3072, "grad_norm": 0.16366961875606295, "learning_rate": 2.449136276391555e-05, "loss": 0.1434, "loss_nan_ranks": 0, "loss_rank_avg": 0.052342720329761505, "step": 320, "valid_targets_mean": 8492.8, "valid_targets_min": 1643 }, { "epoch": 0.312, "grad_norm": 0.21633571289591977, "learning_rate": 2.4875239923224573e-05, "loss": 0.1441, "loss_nan_ranks": 0, "loss_rank_avg": 0.06043235957622528, "step": 325, "valid_targets_mean": 9089.8, "valid_targets_min": 3622 }, { "epoch": 0.3168, "grad_norm": 0.16778566765447833, "learning_rate": 2.525911708253359e-05, "loss": 0.1406, "loss_nan_ranks": 0, "loss_rank_avg": 0.04372868314385414, "step": 330, "valid_targets_mean": 8514.7, "valid_targets_min": 1581 }, { "epoch": 0.3216, "grad_norm": 0.1525783264460117, "learning_rate": 2.5642994241842613e-05, "loss": 0.1366, "loss_nan_ranks": 0, "loss_rank_avg": 0.04171153903007507, "step": 335, "valid_targets_mean": 8744.2, "valid_targets_min": 2937 }, { "epoch": 0.3264, "grad_norm": 0.17090017951805586, "learning_rate": 2.6026871401151633e-05, "loss": 0.1428, "loss_nan_ranks": 0, "loss_rank_avg": 0.046074796468019485, "step": 340, "valid_targets_mean": 8279.8, "valid_targets_min": 2561 }, { "epoch": 0.3312, "grad_norm": 0.16550150425181892, "learning_rate": 2.6410748560460657e-05, "loss": 0.1406, "loss_nan_ranks": 0, "loss_rank_avg": 0.04613085091114044, "step": 345, "valid_targets_mean": 8464.2, "valid_targets_min": 2617 }, { "epoch": 0.336, "grad_norm": 0.15473637741869978, "learning_rate": 2.6794625719769677e-05, "loss": 0.1406, "loss_nan_ranks": 0, "loss_rank_avg": 0.049118585884571075, "step": 350, "valid_targets_mean": 9190.0, "valid_targets_min": 4909 }, { "epoch": 0.3408, "grad_norm": 0.1530756738736752, "learning_rate": 2.7178502879078697e-05, "loss": 0.1418, "loss_nan_ranks": 0, "loss_rank_avg": 0.04675169289112091, "step": 355, "valid_targets_mean": 8826.0, "valid_targets_min": 2023 }, { "epoch": 0.3456, "grad_norm": 0.16704144085394457, "learning_rate": 2.756238003838772e-05, "loss": 0.1376, "loss_nan_ranks": 0, "loss_rank_avg": 0.05301285907626152, "step": 360, "valid_targets_mean": 9298.4, "valid_targets_min": 2038 }, { "epoch": 0.3504, "grad_norm": 0.1705539915112971, "learning_rate": 2.7946257197696737e-05, "loss": 0.14, "loss_nan_ranks": 0, "loss_rank_avg": 0.047162771224975586, "step": 365, "valid_targets_mean": 8848.1, "valid_targets_min": 2694 }, { "epoch": 0.3552, "grad_norm": 0.17172115669532714, "learning_rate": 2.833013435700576e-05, "loss": 0.1358, "loss_nan_ranks": 0, "loss_rank_avg": 0.04858285188674927, "step": 370, "valid_targets_mean": 8245.0, "valid_targets_min": 3959 }, { "epoch": 0.36, "grad_norm": 0.1635738602794979, "learning_rate": 2.8714011516314784e-05, "loss": 0.1394, "loss_nan_ranks": 0, "loss_rank_avg": 0.05017467588186264, "step": 375, "valid_targets_mean": 8803.3, "valid_targets_min": 4631 }, { "epoch": 0.3648, "grad_norm": 0.14689162023635646, "learning_rate": 2.90978886756238e-05, "loss": 0.1415, "loss_nan_ranks": 0, "loss_rank_avg": 0.04908227548003197, "step": 380, "valid_targets_mean": 9190.8, "valid_targets_min": 2141 }, { "epoch": 0.3696, "grad_norm": 0.1735748309731461, "learning_rate": 2.9481765834932825e-05, "loss": 0.1425, "loss_nan_ranks": 0, "loss_rank_avg": 0.05058016628026962, "step": 385, "valid_targets_mean": 8794.3, "valid_targets_min": 2139 }, { "epoch": 0.3744, "grad_norm": 0.16453333610787235, "learning_rate": 2.9865642994241845e-05, "loss": 0.141, "loss_nan_ranks": 0, "loss_rank_avg": 0.044411011040210724, "step": 390, "valid_targets_mean": 9082.6, "valid_targets_min": 3334 }, { "epoch": 0.3792, "grad_norm": 0.16928223848401386, "learning_rate": 3.0249520153550865e-05, "loss": 0.1381, "loss_nan_ranks": 0, "loss_rank_avg": 0.04547496512532234, "step": 395, "valid_targets_mean": 8381.7, "valid_targets_min": 1637 }, { "epoch": 0.384, "grad_norm": 0.16575962515587384, "learning_rate": 3.063339731285989e-05, "loss": 0.1345, "loss_nan_ranks": 0, "loss_rank_avg": 0.052196696400642395, "step": 400, "valid_targets_mean": 9116.9, "valid_targets_min": 3837 }, { "epoch": 0.3888, "grad_norm": 0.1465834004473263, "learning_rate": 3.101727447216891e-05, "loss": 0.1386, "loss_nan_ranks": 0, "loss_rank_avg": 0.042442236095666885, "step": 405, "valid_targets_mean": 8501.0, "valid_targets_min": 2762 }, { "epoch": 0.3936, "grad_norm": 0.168887624117521, "learning_rate": 3.140115163147793e-05, "loss": 0.1351, "loss_nan_ranks": 0, "loss_rank_avg": 0.04733353853225708, "step": 410, "valid_targets_mean": 9785.0, "valid_targets_min": 4165 }, { "epoch": 0.3984, "grad_norm": 0.1674817302783263, "learning_rate": 3.178502879078695e-05, "loss": 0.1389, "loss_nan_ranks": 0, "loss_rank_avg": 0.04236965253949165, "step": 415, "valid_targets_mean": 7495.3, "valid_targets_min": 2040 }, { "epoch": 0.4032, "grad_norm": 0.1633791795734902, "learning_rate": 3.216890595009597e-05, "loss": 0.1375, "loss_nan_ranks": 0, "loss_rank_avg": 0.04652637243270874, "step": 420, "valid_targets_mean": 9678.3, "valid_targets_min": 3511 }, { "epoch": 0.408, "grad_norm": 0.15017097856344935, "learning_rate": 3.2552783109404996e-05, "loss": 0.1361, "loss_nan_ranks": 0, "loss_rank_avg": 0.04723096638917923, "step": 425, "valid_targets_mean": 8518.3, "valid_targets_min": 5212 }, { "epoch": 0.4128, "grad_norm": 0.16403792996616412, "learning_rate": 3.2936660268714016e-05, "loss": 0.1363, "loss_nan_ranks": 0, "loss_rank_avg": 0.045905664563179016, "step": 430, "valid_targets_mean": 8233.1, "valid_targets_min": 1554 }, { "epoch": 0.4176, "grad_norm": 0.15363370389018594, "learning_rate": 3.3320537428023036e-05, "loss": 0.1345, "loss_nan_ranks": 0, "loss_rank_avg": 0.047167956829071045, "step": 435, "valid_targets_mean": 9401.3, "valid_targets_min": 2729 }, { "epoch": 0.4224, "grad_norm": 0.14941194784466624, "learning_rate": 3.3704414587332056e-05, "loss": 0.1394, "loss_nan_ranks": 0, "loss_rank_avg": 0.04570108652114868, "step": 440, "valid_targets_mean": 8790.9, "valid_targets_min": 1588 }, { "epoch": 0.4272, "grad_norm": 0.1366092155715405, "learning_rate": 3.4088291746641077e-05, "loss": 0.135, "loss_nan_ranks": 0, "loss_rank_avg": 0.04900815337896347, "step": 445, "valid_targets_mean": 9022.6, "valid_targets_min": 3456 }, { "epoch": 0.432, "grad_norm": 0.15770732910450744, "learning_rate": 3.4472168905950104e-05, "loss": 0.136, "loss_nan_ranks": 0, "loss_rank_avg": 0.04628250002861023, "step": 450, "valid_targets_mean": 8808.2, "valid_targets_min": 5148 }, { "epoch": 0.4368, "grad_norm": 0.1629314200910405, "learning_rate": 3.485604606525912e-05, "loss": 0.1368, "loss_nan_ranks": 0, "loss_rank_avg": 0.0451054573059082, "step": 455, "valid_targets_mean": 8471.3, "valid_targets_min": 2409 }, { "epoch": 0.4416, "grad_norm": 0.160272458945177, "learning_rate": 3.5239923224568144e-05, "loss": 0.1365, "loss_nan_ranks": 0, "loss_rank_avg": 0.048758409917354584, "step": 460, "valid_targets_mean": 8512.3, "valid_targets_min": 3525 }, { "epoch": 0.4464, "grad_norm": 0.16561926988288322, "learning_rate": 3.5623800383877164e-05, "loss": 0.1351, "loss_nan_ranks": 0, "loss_rank_avg": 0.05006253719329834, "step": 465, "valid_targets_mean": 8585.6, "valid_targets_min": 2285 }, { "epoch": 0.4512, "grad_norm": 0.16050505436260384, "learning_rate": 3.6007677543186184e-05, "loss": 0.136, "loss_nan_ranks": 0, "loss_rank_avg": 0.05636896938085556, "step": 470, "valid_targets_mean": 9733.6, "valid_targets_min": 2143 }, { "epoch": 0.456, "grad_norm": 0.14490817773722517, "learning_rate": 3.6391554702495204e-05, "loss": 0.1331, "loss_nan_ranks": 0, "loss_rank_avg": 0.047622889280319214, "step": 475, "valid_targets_mean": 9244.6, "valid_targets_min": 3390 }, { "epoch": 0.4608, "grad_norm": 0.15192210465120123, "learning_rate": 3.6775431861804224e-05, "loss": 0.133, "loss_nan_ranks": 0, "loss_rank_avg": 0.044686153531074524, "step": 480, "valid_targets_mean": 8674.3, "valid_targets_min": 2361 }, { "epoch": 0.4656, "grad_norm": 0.15068638781498972, "learning_rate": 3.7159309021113245e-05, "loss": 0.1369, "loss_nan_ranks": 0, "loss_rank_avg": 0.04900766536593437, "step": 485, "valid_targets_mean": 9105.2, "valid_targets_min": 2433 }, { "epoch": 0.4704, "grad_norm": 0.16096900900073532, "learning_rate": 3.7543186180422265e-05, "loss": 0.135, "loss_nan_ranks": 0, "loss_rank_avg": 0.04619026556611061, "step": 490, "valid_targets_mean": 8567.6, "valid_targets_min": 4220 }, { "epoch": 0.4752, "grad_norm": 0.15476058661894235, "learning_rate": 3.792706333973129e-05, "loss": 0.1339, "loss_nan_ranks": 0, "loss_rank_avg": 0.04463457316160202, "step": 495, "valid_targets_mean": 8529.2, "valid_targets_min": 2511 }, { "epoch": 0.48, "grad_norm": 0.15092582689941947, "learning_rate": 3.831094049904031e-05, "loss": 0.1321, "loss_nan_ranks": 0, "loss_rank_avg": 0.03905282914638519, "step": 500, "valid_targets_mean": 8270.3, "valid_targets_min": 2377 }, { "epoch": 0.4848, "grad_norm": 0.1537525325660721, "learning_rate": 3.869481765834933e-05, "loss": 0.1298, "loss_nan_ranks": 0, "loss_rank_avg": 0.041663214564323425, "step": 505, "valid_targets_mean": 7962.0, "valid_targets_min": 3432 }, { "epoch": 0.4896, "grad_norm": 0.15466191978224791, "learning_rate": 3.907869481765835e-05, "loss": 0.1342, "loss_nan_ranks": 0, "loss_rank_avg": 0.04699457436800003, "step": 510, "valid_targets_mean": 8543.5, "valid_targets_min": 1866 }, { "epoch": 0.4944, "grad_norm": 0.14871033158460176, "learning_rate": 3.946257197696737e-05, "loss": 0.1345, "loss_nan_ranks": 0, "loss_rank_avg": 0.04727835953235626, "step": 515, "valid_targets_mean": 8456.3, "valid_targets_min": 4250 }, { "epoch": 0.4992, "grad_norm": 0.14338051178538652, "learning_rate": 3.984644913627639e-05, "loss": 0.1317, "loss_nan_ranks": 0, "loss_rank_avg": 0.040438905358314514, "step": 520, "valid_targets_mean": 8662.9, "valid_targets_min": 2256 }, { "epoch": 0.504, "grad_norm": 0.15742380971099282, "learning_rate": 3.999995959997414e-05, "loss": 0.1324, "loss_nan_ranks": 0, "loss_rank_avg": 0.04269728064537048, "step": 525, "valid_targets_mean": 8493.9, "valid_targets_min": 2420 }, { "epoch": 0.5088, "grad_norm": 0.15670069467354014, "learning_rate": 3.999971271151827e-05, "loss": 0.1342, "loss_nan_ranks": 0, "loss_rank_avg": 0.04551412910223007, "step": 530, "valid_targets_mean": 9344.8, "valid_targets_min": 5656 }, { "epoch": 0.5136, "grad_norm": 0.15374405667621877, "learning_rate": 3.9999241381832614e-05, "loss": 0.1351, "loss_nan_ranks": 0, "loss_rank_avg": 0.0490286722779274, "step": 535, "valid_targets_mean": 8047.5, "valid_targets_min": 3717 }, { "epoch": 0.5184, "grad_norm": 0.1519411027027414, "learning_rate": 3.999854561620655e-05, "loss": 0.1306, "loss_nan_ranks": 0, "loss_rank_avg": 0.045247673988342285, "step": 540, "valid_targets_mean": 9440.2, "valid_targets_min": 2358 }, { "epoch": 0.5232, "grad_norm": 0.14569122526754544, "learning_rate": 3.9997625422448114e-05, "loss": 0.1313, "loss_nan_ranks": 0, "loss_rank_avg": 0.04392744228243828, "step": 545, "valid_targets_mean": 9050.4, "valid_targets_min": 5323 }, { "epoch": 0.528, "grad_norm": 0.13609907027733714, "learning_rate": 3.999648081088391e-05, "loss": 0.1325, "loss_nan_ranks": 0, "loss_rank_avg": 0.04291406646370888, "step": 550, "valid_targets_mean": 9465.5, "valid_targets_min": 2912 }, { "epoch": 0.5328, "grad_norm": 0.1377783947779239, "learning_rate": 3.999511179435905e-05, "loss": 0.1293, "loss_nan_ranks": 0, "loss_rank_avg": 0.040753189474344254, "step": 555, "valid_targets_mean": 9555.9, "valid_targets_min": 2568 }, { "epoch": 0.5376, "grad_norm": 0.1379593120954164, "learning_rate": 3.999351838823691e-05, "loss": 0.1301, "loss_nan_ranks": 0, "loss_rank_avg": 0.04435383528470993, "step": 560, "valid_targets_mean": 9169.4, "valid_targets_min": 3276 }, { "epoch": 0.5424, "grad_norm": 0.1418424270920895, "learning_rate": 3.999170061039908e-05, "loss": 0.1324, "loss_nan_ranks": 0, "loss_rank_avg": 0.046147946268320084, "step": 565, "valid_targets_mean": 9111.7, "valid_targets_min": 1397 }, { "epoch": 0.5472, "grad_norm": 0.14040633557580692, "learning_rate": 3.998965848124505e-05, "loss": 0.1342, "loss_nan_ranks": 0, "loss_rank_avg": 0.048749588429927826, "step": 570, "valid_targets_mean": 9351.5, "valid_targets_min": 5556 }, { "epoch": 0.552, "grad_norm": 0.13449375343867295, "learning_rate": 3.998739202369205e-05, "loss": 0.1289, "loss_nan_ranks": 0, "loss_rank_avg": 0.041300173848867416, "step": 575, "valid_targets_mean": 8922.3, "valid_targets_min": 2736 }, { "epoch": 0.5568, "grad_norm": 0.14743580069920623, "learning_rate": 3.998490126317477e-05, "loss": 0.1298, "loss_nan_ranks": 0, "loss_rank_avg": 0.04395359009504318, "step": 580, "valid_targets_mean": 8960.4, "valid_targets_min": 2701 }, { "epoch": 0.5616, "grad_norm": 0.14157038751939097, "learning_rate": 3.9982186227645085e-05, "loss": 0.1299, "loss_nan_ranks": 0, "loss_rank_avg": 0.04324673116207123, "step": 585, "valid_targets_mean": 8823.2, "valid_targets_min": 418 }, { "epoch": 0.5664, "grad_norm": 0.1582091638266866, "learning_rate": 3.9979246947571724e-05, "loss": 0.1306, "loss_nan_ranks": 0, "loss_rank_avg": 0.04149835929274559, "step": 590, "valid_targets_mean": 7495.4, "valid_targets_min": 2352 }, { "epoch": 0.5712, "grad_norm": 0.14899721581452358, "learning_rate": 3.9976083455939945e-05, "loss": 0.1287, "loss_nan_ranks": 0, "loss_rank_avg": 0.04160813242197037, "step": 595, "valid_targets_mean": 8655.7, "valid_targets_min": 2572 }, { "epoch": 0.576, "grad_norm": 0.1539653528766409, "learning_rate": 3.9972695788251155e-05, "loss": 0.1301, "loss_nan_ranks": 0, "loss_rank_avg": 0.04525775834918022, "step": 600, "valid_targets_mean": 8892.5, "valid_targets_min": 5296 }, { "epoch": 0.5808, "grad_norm": 0.14943883780637449, "learning_rate": 3.996908398252251e-05, "loss": 0.1351, "loss_nan_ranks": 0, "loss_rank_avg": 0.043959811329841614, "step": 605, "valid_targets_mean": 8608.5, "valid_targets_min": 3362 }, { "epoch": 0.5856, "grad_norm": 0.13367238747822863, "learning_rate": 3.9965248079286505e-05, "loss": 0.1279, "loss_nan_ranks": 0, "loss_rank_avg": 0.04346688464283943, "step": 610, "valid_targets_mean": 9197.5, "valid_targets_min": 1977 }, { "epoch": 0.5904, "grad_norm": 0.13643029241656873, "learning_rate": 3.99611881215905e-05, "loss": 0.1272, "loss_nan_ranks": 0, "loss_rank_avg": 0.041380517184734344, "step": 615, "valid_targets_mean": 8393.2, "valid_targets_min": 2051 }, { "epoch": 0.5952, "grad_norm": 0.1377113571496518, "learning_rate": 3.995690415499624e-05, "loss": 0.1312, "loss_nan_ranks": 0, "loss_rank_avg": 0.04686662554740906, "step": 620, "valid_targets_mean": 9150.6, "valid_targets_min": 3686 }, { "epoch": 0.6, "grad_norm": 0.1403099261926008, "learning_rate": 3.995239622757936e-05, "loss": 0.1299, "loss_nan_ranks": 0, "loss_rank_avg": 0.0410618893802166, "step": 625, "valid_targets_mean": 8159.0, "valid_targets_min": 3947 }, { "epoch": 0.6048, "grad_norm": 0.14096536721898614, "learning_rate": 3.994766438992882e-05, "loss": 0.1282, "loss_nan_ranks": 0, "loss_rank_avg": 0.03911704570055008, "step": 630, "valid_targets_mean": 7991.7, "valid_targets_min": 1670 }, { "epoch": 0.6096, "grad_norm": 0.13195736313161857, "learning_rate": 3.994270869514635e-05, "loss": 0.1304, "loss_nan_ranks": 0, "loss_rank_avg": 0.0424465574324131, "step": 635, "valid_targets_mean": 8870.5, "valid_targets_min": 2210 }, { "epoch": 0.6144, "grad_norm": 0.13332668179988635, "learning_rate": 3.9937529198845864e-05, "loss": 0.1283, "loss_nan_ranks": 0, "loss_rank_avg": 0.04478909820318222, "step": 640, "valid_targets_mean": 8382.8, "valid_targets_min": 2213 }, { "epoch": 0.6192, "grad_norm": 0.13716325538151122, "learning_rate": 3.9932125959152833e-05, "loss": 0.1269, "loss_nan_ranks": 0, "loss_rank_avg": 0.04378994181752205, "step": 645, "valid_targets_mean": 8748.3, "valid_targets_min": 2320 }, { "epoch": 0.624, "grad_norm": 0.1308079107487341, "learning_rate": 3.9926499036703607e-05, "loss": 0.1295, "loss_nan_ranks": 0, "loss_rank_avg": 0.038693659007549286, "step": 650, "valid_targets_mean": 8223.2, "valid_targets_min": 3239 }, { "epoch": 0.6288, "grad_norm": 0.14424264976490078, "learning_rate": 3.992064849464476e-05, "loss": 0.1318, "loss_nan_ranks": 0, "loss_rank_avg": 0.043246474117040634, "step": 655, "valid_targets_mean": 7944.7, "valid_targets_min": 1974 }, { "epoch": 0.6336, "grad_norm": 0.14454916157149716, "learning_rate": 3.991457439863238e-05, "loss": 0.1318, "loss_nan_ranks": 0, "loss_rank_avg": 0.052069369703531265, "step": 660, "valid_targets_mean": 9785.6, "valid_targets_min": 2127 }, { "epoch": 0.6384, "grad_norm": 0.13727057460729494, "learning_rate": 3.990827681683133e-05, "loss": 0.1304, "loss_nan_ranks": 0, "loss_rank_avg": 0.04632120579481125, "step": 665, "valid_targets_mean": 8698.8, "valid_targets_min": 1935 }, { "epoch": 0.6432, "grad_norm": 0.1398377748234492, "learning_rate": 3.990175581991448e-05, "loss": 0.1274, "loss_nan_ranks": 0, "loss_rank_avg": 0.04159468784928322, "step": 670, "valid_targets_mean": 8791.3, "valid_targets_min": 3886 }, { "epoch": 0.648, "grad_norm": 0.1345378725929749, "learning_rate": 3.989501148106189e-05, "loss": 0.1272, "loss_nan_ranks": 0, "loss_rank_avg": 0.04403248429298401, "step": 675, "valid_targets_mean": 8627.5, "valid_targets_min": 1892 }, { "epoch": 0.6528, "grad_norm": 0.12953037003518647, "learning_rate": 3.988804387596005e-05, "loss": 0.1272, "loss_nan_ranks": 0, "loss_rank_avg": 0.042582374066114426, "step": 680, "valid_targets_mean": 9106.1, "valid_targets_min": 3962 }, { "epoch": 0.6576, "grad_norm": 0.1350393492828008, "learning_rate": 3.9880853082800965e-05, "loss": 0.1259, "loss_nan_ranks": 0, "loss_rank_avg": 0.041537463665008545, "step": 685, "valid_targets_mean": 8600.3, "valid_targets_min": 3511 }, { "epoch": 0.6624, "grad_norm": 0.13206633754473568, "learning_rate": 3.987343918228133e-05, "loss": 0.1261, "loss_nan_ranks": 0, "loss_rank_avg": 0.044280827045440674, "step": 690, "valid_targets_mean": 8396.4, "valid_targets_min": 3428 }, { "epoch": 0.6672, "grad_norm": 0.13729845663078688, "learning_rate": 3.9865802257601584e-05, "loss": 0.1237, "loss_nan_ranks": 0, "loss_rank_avg": 0.04000245779752731, "step": 695, "valid_targets_mean": 8540.1, "valid_targets_min": 1813 }, { "epoch": 0.672, "grad_norm": 0.13635663924478578, "learning_rate": 3.9857942394464976e-05, "loss": 0.1258, "loss_nan_ranks": 0, "loss_rank_avg": 0.03872641175985336, "step": 700, "valid_targets_mean": 8601.8, "valid_targets_min": 4288 }, { "epoch": 0.6768, "grad_norm": 0.15057437392276532, "learning_rate": 3.984985968107667e-05, "loss": 0.1262, "loss_nan_ranks": 0, "loss_rank_avg": 0.04191380739212036, "step": 705, "valid_targets_mean": 8113.8, "valid_targets_min": 1824 }, { "epoch": 0.6816, "grad_norm": 0.15262968979836647, "learning_rate": 3.984155420814266e-05, "loss": 0.1279, "loss_nan_ranks": 0, "loss_rank_avg": 0.045424915850162506, "step": 710, "valid_targets_mean": 9187.2, "valid_targets_min": 3023 }, { "epoch": 0.6864, "grad_norm": 0.14131561005827004, "learning_rate": 3.9833026068868814e-05, "loss": 0.129, "loss_nan_ranks": 0, "loss_rank_avg": 0.04640107974410057, "step": 715, "valid_targets_mean": 9442.9, "valid_targets_min": 2870 }, { "epoch": 0.6912, "grad_norm": 0.1536532150005904, "learning_rate": 3.982427535895982e-05, "loss": 0.1255, "loss_nan_ranks": 0, "loss_rank_avg": 0.04061667248606682, "step": 720, "valid_targets_mean": 7744.2, "valid_targets_min": 1807 }, { "epoch": 0.696, "grad_norm": 0.14566890333011928, "learning_rate": 3.9815302176618076e-05, "loss": 0.1271, "loss_nan_ranks": 0, "loss_rank_avg": 0.037999723106622696, "step": 725, "valid_targets_mean": 8014.6, "valid_targets_min": 2692 }, { "epoch": 0.7008, "grad_norm": 0.1329319602860735, "learning_rate": 3.980610662254264e-05, "loss": 0.1258, "loss_nan_ranks": 0, "loss_rank_avg": 0.043485239148139954, "step": 730, "valid_targets_mean": 8674.2, "valid_targets_min": 1914 }, { "epoch": 0.7056, "grad_norm": 0.13214607087955763, "learning_rate": 3.9796688799928075e-05, "loss": 0.1258, "loss_nan_ranks": 0, "loss_rank_avg": 0.03650156408548355, "step": 735, "valid_targets_mean": 8052.5, "valid_targets_min": 1535 }, { "epoch": 0.7104, "grad_norm": 0.14666052223087997, "learning_rate": 3.978704881446327e-05, "loss": 0.1291, "loss_nan_ranks": 0, "loss_rank_avg": 0.040827296674251556, "step": 740, "valid_targets_mean": 8658.8, "valid_targets_min": 3364 }, { "epoch": 0.7152, "grad_norm": 0.13199011134390393, "learning_rate": 3.9777186774330304e-05, "loss": 0.1261, "loss_nan_ranks": 0, "loss_rank_avg": 0.03985761106014252, "step": 745, "valid_targets_mean": 8315.3, "valid_targets_min": 2041 }, { "epoch": 0.72, "grad_norm": 0.13006510073207833, "learning_rate": 3.976710279020318e-05, "loss": 0.1244, "loss_nan_ranks": 0, "loss_rank_avg": 0.050185881555080414, "step": 750, "valid_targets_mean": 8819.3, "valid_targets_min": 3518 }, { "epoch": 0.7248, "grad_norm": 0.12635946950837632, "learning_rate": 3.975679697524661e-05, "loss": 0.1242, "loss_nan_ranks": 0, "loss_rank_avg": 0.0413113571703434, "step": 755, "valid_targets_mean": 9287.8, "valid_targets_min": 2520 }, { "epoch": 0.7296, "grad_norm": 0.16619628024740615, "learning_rate": 3.974626944511475e-05, "loss": 0.1243, "loss_nan_ranks": 0, "loss_rank_avg": 0.040970057249069214, "step": 760, "valid_targets_mean": 8394.7, "valid_targets_min": 3787 }, { "epoch": 0.7344, "grad_norm": 0.13983220811078784, "learning_rate": 3.973552031794988e-05, "loss": 0.1251, "loss_nan_ranks": 0, "loss_rank_avg": 0.04032052308320999, "step": 765, "valid_targets_mean": 8312.5, "valid_targets_min": 1690 }, { "epoch": 0.7392, "grad_norm": 0.13276909522770805, "learning_rate": 3.9724549714381106e-05, "loss": 0.126, "loss_nan_ranks": 0, "loss_rank_avg": 0.0410274863243103, "step": 770, "valid_targets_mean": 9437.8, "valid_targets_min": 4807 }, { "epoch": 0.744, "grad_norm": 0.14074663236062346, "learning_rate": 3.971335775752298e-05, "loss": 0.1279, "loss_nan_ranks": 0, "loss_rank_avg": 0.04447145760059357, "step": 775, "valid_targets_mean": 8283.8, "valid_targets_min": 2255 }, { "epoch": 0.7488, "grad_norm": 0.13345475156150907, "learning_rate": 3.970194457297414e-05, "loss": 0.1257, "loss_nan_ranks": 0, "loss_rank_avg": 0.0476519837975502, "step": 780, "valid_targets_mean": 8958.5, "valid_targets_min": 2037 }, { "epoch": 0.7536, "grad_norm": 0.13590512683057793, "learning_rate": 3.9690310288815876e-05, "loss": 0.1221, "loss_nan_ranks": 0, "loss_rank_avg": 0.038623590022325516, "step": 785, "valid_targets_mean": 8875.8, "valid_targets_min": 1547 }, { "epoch": 0.7584, "grad_norm": 0.12392055016932459, "learning_rate": 3.967845503561073e-05, "loss": 0.1223, "loss_nan_ranks": 0, "loss_rank_avg": 0.03856155276298523, "step": 790, "valid_targets_mean": 8824.8, "valid_targets_min": 3008 }, { "epoch": 0.7632, "grad_norm": 0.12808803769496246, "learning_rate": 3.9666378946400974e-05, "loss": 0.1223, "loss_nan_ranks": 0, "loss_rank_avg": 0.04124930500984192, "step": 795, "valid_targets_mean": 8398.5, "valid_targets_min": 4402 }, { "epoch": 0.768, "grad_norm": 0.12400753315300732, "learning_rate": 3.965408215670719e-05, "loss": 0.125, "loss_nan_ranks": 0, "loss_rank_avg": 0.04107067734003067, "step": 800, "valid_targets_mean": 9418.2, "valid_targets_min": 5645 }, { "epoch": 0.7728, "grad_norm": 0.1321463233062571, "learning_rate": 3.964156480452667e-05, "loss": 0.1256, "loss_nan_ranks": 0, "loss_rank_avg": 0.040333010256290436, "step": 805, "valid_targets_mean": 9123.3, "valid_targets_min": 2232 }, { "epoch": 0.7776, "grad_norm": 0.15850818767395258, "learning_rate": 3.962882703033195e-05, "loss": 0.1246, "loss_nan_ranks": 0, "loss_rank_avg": 0.04237630218267441, "step": 810, "valid_targets_mean": 9014.5, "valid_targets_min": 1757 }, { "epoch": 0.7824, "grad_norm": 0.13022752887109454, "learning_rate": 3.961586897706915e-05, "loss": 0.1226, "loss_nan_ranks": 0, "loss_rank_avg": 0.03962777554988861, "step": 815, "valid_targets_mean": 8785.4, "valid_targets_min": 3393 }, { "epoch": 0.7872, "grad_norm": 0.1411987989970659, "learning_rate": 3.960269079015643e-05, "loss": 0.1233, "loss_nan_ranks": 0, "loss_rank_avg": 0.04631964862346649, "step": 820, "valid_targets_mean": 9530.4, "valid_targets_min": 5058 }, { "epoch": 0.792, "grad_norm": 0.13216475655191032, "learning_rate": 3.958929261748236e-05, "loss": 0.1231, "loss_nan_ranks": 0, "loss_rank_avg": 0.04475382715463638, "step": 825, "valid_targets_mean": 8892.8, "valid_targets_min": 2083 }, { "epoch": 0.7968, "grad_norm": 0.12772498172212535, "learning_rate": 3.957567460940419e-05, "loss": 0.1237, "loss_nan_ranks": 0, "loss_rank_avg": 0.04453466087579727, "step": 830, "valid_targets_mean": 8443.8, "valid_targets_min": 806 }, { "epoch": 0.8016, "grad_norm": 0.1288360457272141, "learning_rate": 3.9561836918746256e-05, "loss": 0.1238, "loss_nan_ranks": 0, "loss_rank_avg": 0.04772651568055153, "step": 835, "valid_targets_mean": 9130.0, "valid_targets_min": 3135 }, { "epoch": 0.8064, "grad_norm": 0.12904971741193666, "learning_rate": 3.95477797007982e-05, "loss": 0.1246, "loss_nan_ranks": 0, "loss_rank_avg": 0.041636817157268524, "step": 840, "valid_targets_mean": 9023.4, "valid_targets_min": 4250 }, { "epoch": 0.8112, "grad_norm": 0.1326001544343892, "learning_rate": 3.953350311331325e-05, "loss": 0.1233, "loss_nan_ranks": 0, "loss_rank_avg": 0.04039324074983597, "step": 845, "valid_targets_mean": 9260.4, "valid_targets_min": 3688 }, { "epoch": 0.816, "grad_norm": 0.12642447244379482, "learning_rate": 3.951900731650645e-05, "loss": 0.1207, "loss_nan_ranks": 0, "loss_rank_avg": 0.039405159652233124, "step": 850, "valid_targets_mean": 8837.0, "valid_targets_min": 2405 }, { "epoch": 0.8208, "grad_norm": 0.13173156761588117, "learning_rate": 3.950429247305286e-05, "loss": 0.121, "loss_nan_ranks": 0, "loss_rank_avg": 0.03566863760352135, "step": 855, "valid_targets_mean": 7964.2, "valid_targets_min": 1228 }, { "epoch": 0.8256, "grad_norm": 0.20449125184239303, "learning_rate": 3.9489358748085737e-05, "loss": 0.1214, "loss_nan_ranks": 0, "loss_rank_avg": 0.044600710272789, "step": 860, "valid_targets_mean": 8969.1, "valid_targets_min": 2519 }, { "epoch": 0.8304, "grad_norm": 0.1267782883516138, "learning_rate": 3.947420630919466e-05, "loss": 0.1239, "loss_nan_ranks": 0, "loss_rank_avg": 0.040724076330661774, "step": 865, "valid_targets_mean": 8701.4, "valid_targets_min": 2522 }, { "epoch": 0.8352, "grad_norm": 0.13947426674783286, "learning_rate": 3.9458835326423674e-05, "loss": 0.1226, "loss_nan_ranks": 0, "loss_rank_avg": 0.03723190724849701, "step": 870, "valid_targets_mean": 8694.7, "valid_targets_min": 3628 }, { "epoch": 0.84, "grad_norm": 0.1429427588322893, "learning_rate": 3.9443245972269376e-05, "loss": 0.1208, "loss_nan_ranks": 0, "loss_rank_avg": 0.044337622821331024, "step": 875, "valid_targets_mean": 9151.8, "valid_targets_min": 4207 }, { "epoch": 0.8448, "grad_norm": 0.12601811128568607, "learning_rate": 3.942743842167896e-05, "loss": 0.1233, "loss_nan_ranks": 0, "loss_rank_avg": 0.03860004246234894, "step": 880, "valid_targets_mean": 8116.6, "valid_targets_min": 3504 }, { "epoch": 0.8496, "grad_norm": 0.1231651306256786, "learning_rate": 3.941141285204829e-05, "loss": 0.1242, "loss_nan_ranks": 0, "loss_rank_avg": 0.03568350523710251, "step": 885, "valid_targets_mean": 8602.6, "valid_targets_min": 3333 }, { "epoch": 0.8544, "grad_norm": 0.1327633357414085, "learning_rate": 3.939516944321986e-05, "loss": 0.12, "loss_nan_ranks": 0, "loss_rank_avg": 0.03741621971130371, "step": 890, "valid_targets_mean": 7680.4, "valid_targets_min": 2034 }, { "epoch": 0.8592, "grad_norm": 0.12782058862734189, "learning_rate": 3.937870837748085e-05, "loss": 0.1196, "loss_nan_ranks": 0, "loss_rank_avg": 0.04108661413192749, "step": 895, "valid_targets_mean": 9461.2, "valid_targets_min": 4191 }, { "epoch": 0.864, "grad_norm": 0.13095812423706943, "learning_rate": 3.936202983956098e-05, "loss": 0.1214, "loss_nan_ranks": 0, "loss_rank_avg": 0.04491672292351723, "step": 900, "valid_targets_mean": 9060.0, "valid_targets_min": 4238 }, { "epoch": 0.8688, "grad_norm": 0.14435955628562666, "learning_rate": 3.934513401663052e-05, "loss": 0.1217, "loss_nan_ranks": 0, "loss_rank_avg": 0.04353254288434982, "step": 905, "valid_targets_mean": 8174.2, "valid_targets_min": 2049 }, { "epoch": 0.8736, "grad_norm": 0.13777422571076636, "learning_rate": 3.9328021098298164e-05, "loss": 0.1244, "loss_nan_ranks": 0, "loss_rank_avg": 0.04200918227434158, "step": 910, "valid_targets_mean": 7853.6, "valid_targets_min": 2161 }, { "epoch": 0.8784, "grad_norm": 0.12925096382507895, "learning_rate": 3.9310691276608894e-05, "loss": 0.1227, "loss_nan_ranks": 0, "loss_rank_avg": 0.03885449841618538, "step": 915, "valid_targets_mean": 8998.7, "valid_targets_min": 4216 }, { "epoch": 0.8832, "grad_norm": 0.1299999207480068, "learning_rate": 3.9293144746041824e-05, "loss": 0.12, "loss_nan_ranks": 0, "loss_rank_avg": 0.0414196252822876, "step": 920, "valid_targets_mean": 9441.6, "valid_targets_min": 3116 }, { "epoch": 0.888, "grad_norm": 0.14119631019377754, "learning_rate": 3.9275381703508034e-05, "loss": 0.1202, "loss_nan_ranks": 0, "loss_rank_avg": 0.04161785542964935, "step": 925, "valid_targets_mean": 9032.9, "valid_targets_min": 3320 }, { "epoch": 0.8928, "grad_norm": 0.1335427102135748, "learning_rate": 3.925740234834833e-05, "loss": 0.122, "loss_nan_ranks": 0, "loss_rank_avg": 0.039411455392837524, "step": 930, "valid_targets_mean": 8125.8, "valid_targets_min": 2362 }, { "epoch": 0.8976, "grad_norm": 1.299524668859639, "learning_rate": 3.9239206882331045e-05, "loss": 0.122, "loss_nan_ranks": 0, "loss_rank_avg": 0.04274000972509384, "step": 935, "valid_targets_mean": 9362.2, "valid_targets_min": 2499 }, { "epoch": 0.9024, "grad_norm": 0.14595064075165548, "learning_rate": 3.922079550964976e-05, "loss": 0.1203, "loss_nan_ranks": 0, "loss_rank_avg": 0.041862644255161285, "step": 940, "valid_targets_mean": 8516.2, "valid_targets_min": 2866 }, { "epoch": 0.9072, "grad_norm": 0.1406716428331579, "learning_rate": 3.920216843692099e-05, "loss": 0.1198, "loss_nan_ranks": 0, "loss_rank_avg": 0.039388202130794525, "step": 945, "valid_targets_mean": 8288.1, "valid_targets_min": 1520 }, { "epoch": 0.912, "grad_norm": 0.12120059012749052, "learning_rate": 3.918332587318189e-05, "loss": 0.122, "loss_nan_ranks": 0, "loss_rank_avg": 0.03998667746782303, "step": 950, "valid_targets_mean": 9838.4, "valid_targets_min": 3065 }, { "epoch": 0.9168, "grad_norm": 0.12432674716745307, "learning_rate": 3.916426802988791e-05, "loss": 0.1191, "loss_nan_ranks": 0, "loss_rank_avg": 0.034975167363882065, "step": 955, "valid_targets_mean": 8630.9, "valid_targets_min": 3664 }, { "epoch": 0.9216, "grad_norm": 0.12453368828142465, "learning_rate": 3.9144995120910414e-05, "loss": 0.1212, "loss_nan_ranks": 0, "loss_rank_avg": 0.040313076227903366, "step": 960, "valid_targets_mean": 8565.8, "valid_targets_min": 1313 }, { "epoch": 0.9264, "grad_norm": 0.12414549421169692, "learning_rate": 3.912550736253428e-05, "loss": 0.1165, "loss_nan_ranks": 0, "loss_rank_avg": 0.03618764504790306, "step": 965, "valid_targets_mean": 9026.8, "valid_targets_min": 2861 }, { "epoch": 0.9312, "grad_norm": 0.12295142873666405, "learning_rate": 3.9105804973455466e-05, "loss": 0.1217, "loss_nan_ranks": 0, "loss_rank_avg": 0.037326935678720474, "step": 970, "valid_targets_mean": 8990.8, "valid_targets_min": 5060 }, { "epoch": 0.936, "grad_norm": 0.1199361629404387, "learning_rate": 3.908588817477858e-05, "loss": 0.1204, "loss_nan_ranks": 0, "loss_rank_avg": 0.03776358813047409, "step": 975, "valid_targets_mean": 9242.8, "valid_targets_min": 2535 }, { "epoch": 0.9408, "grad_norm": 0.11968391724432256, "learning_rate": 3.9065757190014356e-05, "loss": 0.1194, "loss_nan_ranks": 0, "loss_rank_avg": 0.04064861685037613, "step": 980, "valid_targets_mean": 8815.6, "valid_targets_min": 2016 }, { "epoch": 0.9456, "grad_norm": 0.13010903116296166, "learning_rate": 3.90454122450772e-05, "loss": 0.1185, "loss_nan_ranks": 0, "loss_rank_avg": 0.03588135540485382, "step": 985, "valid_targets_mean": 8170.3, "valid_targets_min": 3799 }, { "epoch": 0.9504, "grad_norm": 0.12285238315467241, "learning_rate": 3.9024853568282615e-05, "loss": 0.1192, "loss_nan_ranks": 0, "loss_rank_avg": 0.03708403930068016, "step": 990, "valid_targets_mean": 9025.9, "valid_targets_min": 5318 }, { "epoch": 0.9552, "grad_norm": 0.13047767902641233, "learning_rate": 3.900408139034464e-05, "loss": 0.1182, "loss_nan_ranks": 0, "loss_rank_avg": 0.04085266962647438, "step": 995, "valid_targets_mean": 8927.5, "valid_targets_min": 2808 }, { "epoch": 0.96, "grad_norm": 0.12509338732915287, "learning_rate": 3.89830959443733e-05, "loss": 0.1213, "loss_nan_ranks": 0, "loss_rank_avg": 0.042269591242074966, "step": 1000, "valid_targets_mean": 9112.8, "valid_targets_min": 3104 }, { "epoch": 0.9648, "grad_norm": 0.12707976296407147, "learning_rate": 3.896189746587192e-05, "loss": 0.1187, "loss_nan_ranks": 0, "loss_rank_avg": 0.04251757264137268, "step": 1005, "valid_targets_mean": 9197.0, "valid_targets_min": 4955 }, { "epoch": 0.9696, "grad_norm": 0.13513570063473687, "learning_rate": 3.894048619273457e-05, "loss": 0.1195, "loss_nan_ranks": 0, "loss_rank_avg": 0.0449819378554821, "step": 1010, "valid_targets_mean": 8805.6, "valid_targets_min": 2816 }, { "epoch": 0.9744, "grad_norm": 0.11628596725040473, "learning_rate": 3.89188623652433e-05, "loss": 0.1164, "loss_nan_ranks": 0, "loss_rank_avg": 0.03957689553499222, "step": 1015, "valid_targets_mean": 9101.4, "valid_targets_min": 5845 }, { "epoch": 0.9792, "grad_norm": 0.1395600161258974, "learning_rate": 3.889702622606553e-05, "loss": 0.1207, "loss_nan_ranks": 0, "loss_rank_avg": 0.04011973738670349, "step": 1020, "valid_targets_mean": 8340.6, "valid_targets_min": 2670 }, { "epoch": 0.984, "grad_norm": 0.12278646466936824, "learning_rate": 3.887497802025129e-05, "loss": 0.1149, "loss_nan_ranks": 0, "loss_rank_avg": 0.03440343588590622, "step": 1025, "valid_targets_mean": 8029.5, "valid_targets_min": 2752 }, { "epoch": 0.9888, "grad_norm": 0.12604219136442135, "learning_rate": 3.885271799523043e-05, "loss": 0.12, "loss_nan_ranks": 0, "loss_rank_avg": 0.04180954396724701, "step": 1030, "valid_targets_mean": 8562.8, "valid_targets_min": 2962 }, { "epoch": 0.9936, "grad_norm": 0.12564503884119702, "learning_rate": 3.8830246400809925e-05, "loss": 0.1207, "loss_nan_ranks": 0, "loss_rank_avg": 0.03574180603027344, "step": 1035, "valid_targets_mean": 8152.6, "valid_targets_min": 4152 }, { "epoch": 0.9984, "grad_norm": 0.12286222401223959, "learning_rate": 3.880756348917101e-05, "loss": 0.1201, "loss_nan_ranks": 0, "loss_rank_avg": 0.04260804131627083, "step": 1040, "valid_targets_mean": 9008.5, "valid_targets_min": 4527 }, { "epoch": 1.00288, "grad_norm": 0.13532126940346526, "learning_rate": 3.8784669514866365e-05, "loss": 0.1132, "loss_nan_ranks": 0, "loss_rank_avg": 0.03753751516342163, "step": 1045, "valid_targets_mean": 10100.1, "valid_targets_min": 5514 }, { "epoch": 1.00768, "grad_norm": 0.12973697576755405, "learning_rate": 3.876156473481727e-05, "loss": 0.1065, "loss_nan_ranks": 0, "loss_rank_avg": 0.03712521493434906, "step": 1050, "valid_targets_mean": 9113.7, "valid_targets_min": 3701 }, { "epoch": 1.01248, "grad_norm": 0.12040784575878684, "learning_rate": 3.8738249408310716e-05, "loss": 0.1109, "loss_nan_ranks": 0, "loss_rank_avg": 0.04298216104507446, "step": 1055, "valid_targets_mean": 9181.2, "valid_targets_min": 3126 }, { "epoch": 1.01728, "grad_norm": 0.1290882287304988, "learning_rate": 3.871472379699648e-05, "loss": 0.111, "loss_nan_ranks": 0, "loss_rank_avg": 0.03602221980690956, "step": 1060, "valid_targets_mean": 8772.9, "valid_targets_min": 2607 }, { "epoch": 1.02208, "grad_norm": 0.12406914379482467, "learning_rate": 3.869098816488422e-05, "loss": 0.108, "loss_nan_ranks": 0, "loss_rank_avg": 0.03653515875339508, "step": 1065, "valid_targets_mean": 9124.3, "valid_targets_min": 5033 }, { "epoch": 1.02688, "grad_norm": 0.13729165019846906, "learning_rate": 3.866704277834049e-05, "loss": 0.1118, "loss_nan_ranks": 0, "loss_rank_avg": 0.035046130418777466, "step": 1070, "valid_targets_mean": 8623.2, "valid_targets_min": 3230 }, { "epoch": 1.03168, "grad_norm": 0.12036440804151036, "learning_rate": 3.864288790608573e-05, "loss": 0.1125, "loss_nan_ranks": 0, "loss_rank_avg": 0.034265272319316864, "step": 1075, "valid_targets_mean": 9006.2, "valid_targets_min": 2326 }, { "epoch": 1.03648, "grad_norm": 0.12363412561657591, "learning_rate": 3.861852381919132e-05, "loss": 0.1086, "loss_nan_ranks": 0, "loss_rank_avg": 0.038711585104465485, "step": 1080, "valid_targets_mean": 8283.0, "valid_targets_min": 2443 }, { "epoch": 1.04128, "grad_norm": 0.12022387745735609, "learning_rate": 3.8593950791076446e-05, "loss": 0.1104, "loss_nan_ranks": 0, "loss_rank_avg": 0.03348660469055176, "step": 1085, "valid_targets_mean": 8197.9, "valid_targets_min": 1325 }, { "epoch": 1.04608, "grad_norm": 0.12541307411660785, "learning_rate": 3.856916909750512e-05, "loss": 0.1097, "loss_nan_ranks": 0, "loss_rank_avg": 0.03612164780497551, "step": 1090, "valid_targets_mean": 8937.5, "valid_targets_min": 4843 }, { "epoch": 1.05088, "grad_norm": 0.12767600777176324, "learning_rate": 3.854417901658301e-05, "loss": 0.1098, "loss_nan_ranks": 0, "loss_rank_avg": 0.036185123026371, "step": 1095, "valid_targets_mean": 8712.5, "valid_targets_min": 4257 }, { "epoch": 1.05568, "grad_norm": 0.12527917305408634, "learning_rate": 3.851898082875438e-05, "loss": 0.1095, "loss_nan_ranks": 0, "loss_rank_avg": 0.037031348794698715, "step": 1100, "valid_targets_mean": 9053.6, "valid_targets_min": 3371 }, { "epoch": 1.06048, "grad_norm": 0.13136956141466558, "learning_rate": 3.849357481679891e-05, "loss": 0.1096, "loss_nan_ranks": 0, "loss_rank_avg": 0.041252005845308304, "step": 1105, "valid_targets_mean": 8509.0, "valid_targets_min": 3914 }, { "epoch": 1.06528, "grad_norm": 0.12922975818642823, "learning_rate": 3.846796126582851e-05, "loss": 0.1094, "loss_nan_ranks": 0, "loss_rank_avg": 0.03326720371842384, "step": 1110, "valid_targets_mean": 8771.5, "valid_targets_min": 3884 }, { "epoch": 1.07008, "grad_norm": 0.12106396045806493, "learning_rate": 3.844214046328416e-05, "loss": 0.1097, "loss_nan_ranks": 0, "loss_rank_avg": 0.043117620050907135, "step": 1115, "valid_targets_mean": 8209.8, "valid_targets_min": 3243 }, { "epoch": 1.07488, "grad_norm": 0.13002226111527115, "learning_rate": 3.841611269893266e-05, "loss": 0.109, "loss_nan_ranks": 0, "loss_rank_avg": 0.03778604418039322, "step": 1120, "valid_targets_mean": 8510.7, "valid_targets_min": 2567 }, { "epoch": 1.07968, "grad_norm": 0.12456407780457754, "learning_rate": 3.8389878264863364e-05, "loss": 0.1096, "loss_nan_ranks": 0, "loss_rank_avg": 0.03702523559331894, "step": 1125, "valid_targets_mean": 9058.4, "valid_targets_min": 5648 }, { "epoch": 1.08448, "grad_norm": 0.12625041807761278, "learning_rate": 3.836343745548495e-05, "loss": 0.1087, "loss_nan_ranks": 0, "loss_rank_avg": 0.03746821731328964, "step": 1130, "valid_targets_mean": 9379.8, "valid_targets_min": 2461 }, { "epoch": 1.08928, "grad_norm": 0.12729402444355445, "learning_rate": 3.833679056752205e-05, "loss": 0.1086, "loss_nan_ranks": 0, "loss_rank_avg": 0.03369244933128357, "step": 1135, "valid_targets_mean": 8650.1, "valid_targets_min": 2519 }, { "epoch": 1.09408, "grad_norm": 0.12251279578419882, "learning_rate": 3.8309937900012e-05, "loss": 0.1098, "loss_nan_ranks": 0, "loss_rank_avg": 0.035309284925460815, "step": 1140, "valid_targets_mean": 8545.1, "valid_targets_min": 2214 }, { "epoch": 1.09888, "grad_norm": 0.12475486299736205, "learning_rate": 3.8282879754301395e-05, "loss": 0.1099, "loss_nan_ranks": 0, "loss_rank_avg": 0.036522600799798965, "step": 1145, "valid_targets_mean": 9047.7, "valid_targets_min": 2994 }, { "epoch": 1.10368, "grad_norm": 0.12100576465873229, "learning_rate": 3.825561643404277e-05, "loss": 0.1114, "loss_nan_ranks": 0, "loss_rank_avg": 0.04240952804684639, "step": 1150, "valid_targets_mean": 9005.7, "valid_targets_min": 4329 }, { "epoch": 1.10848, "grad_norm": 0.12172067784502344, "learning_rate": 3.8228148245191195e-05, "loss": 0.1076, "loss_nan_ranks": 0, "loss_rank_avg": 0.03200407326221466, "step": 1155, "valid_targets_mean": 8406.1, "valid_targets_min": 4143 }, { "epoch": 1.11328, "grad_norm": 0.13157757940674708, "learning_rate": 3.820047549600078e-05, "loss": 0.1064, "loss_nan_ranks": 0, "loss_rank_avg": 0.0324568971991539, "step": 1160, "valid_targets_mean": 8611.8, "valid_targets_min": 4615 }, { "epoch": 1.11808, "grad_norm": 0.13712186902776327, "learning_rate": 3.8172598497021304e-05, "loss": 0.1098, "loss_nan_ranks": 0, "loss_rank_avg": 0.032350365072488785, "step": 1165, "valid_targets_mean": 8286.6, "valid_targets_min": 3998 }, { "epoch": 1.12288, "grad_norm": 0.12296139282257143, "learning_rate": 3.8144517561094635e-05, "loss": 0.1087, "loss_nan_ranks": 0, "loss_rank_avg": 0.03495969623327255, "step": 1170, "valid_targets_mean": 8338.6, "valid_targets_min": 2001 }, { "epoch": 1.12768, "grad_norm": 0.12885506741767813, "learning_rate": 3.811623300335129e-05, "loss": 0.106, "loss_nan_ranks": 0, "loss_rank_avg": 0.03439897298812866, "step": 1175, "valid_targets_mean": 8294.6, "valid_targets_min": 3388 }, { "epoch": 1.13248, "grad_norm": 0.13353947355498724, "learning_rate": 3.808774514120689e-05, "loss": 0.1068, "loss_nan_ranks": 0, "loss_rank_avg": 0.03528585284948349, "step": 1180, "valid_targets_mean": 8710.7, "valid_targets_min": 2226 }, { "epoch": 1.13728, "grad_norm": 0.11554578661926901, "learning_rate": 3.805905429435856e-05, "loss": 0.1069, "loss_nan_ranks": 0, "loss_rank_avg": 0.0375838503241539, "step": 1185, "valid_targets_mean": 9312.7, "valid_targets_min": 4938 }, { "epoch": 1.14208, "grad_norm": 0.13553731807499625, "learning_rate": 3.803016078478137e-05, "loss": 0.1118, "loss_nan_ranks": 0, "loss_rank_avg": 0.03697044402360916, "step": 1190, "valid_targets_mean": 8790.3, "valid_targets_min": 3411 }, { "epoch": 1.14688, "grad_norm": 0.19558858259974732, "learning_rate": 3.800106493672472e-05, "loss": 0.1044, "loss_nan_ranks": 0, "loss_rank_avg": 0.0370432510972023, "step": 1195, "valid_targets_mean": 8896.2, "valid_targets_min": 2351 }, { "epoch": 1.15168, "grad_norm": 0.12694965655544607, "learning_rate": 3.7971767076708704e-05, "loss": 0.1096, "loss_nan_ranks": 0, "loss_rank_avg": 0.03679373487830162, "step": 1200, "valid_targets_mean": 8190.5, "valid_targets_min": 1331 }, { "epoch": 1.15648, "grad_norm": 0.1294349062636514, "learning_rate": 3.794226753352042e-05, "loss": 0.1104, "loss_nan_ranks": 0, "loss_rank_avg": 0.03450850769877434, "step": 1205, "valid_targets_mean": 7733.4, "valid_targets_min": 2324 }, { "epoch": 1.16128, "grad_norm": 0.13350423195151842, "learning_rate": 3.791256663821032e-05, "loss": 0.1128, "loss_nan_ranks": 0, "loss_rank_avg": 0.03809414058923721, "step": 1210, "valid_targets_mean": 8429.0, "valid_targets_min": 1850 }, { "epoch": 1.16608, "grad_norm": 0.11693967487810589, "learning_rate": 3.788266472408846e-05, "loss": 0.1125, "loss_nan_ranks": 0, "loss_rank_avg": 0.04129686951637268, "step": 1215, "valid_targets_mean": 9791.9, "valid_targets_min": 3448 }, { "epoch": 1.17088, "grad_norm": 0.1171411660888164, "learning_rate": 3.785256212672077e-05, "loss": 0.1114, "loss_nan_ranks": 0, "loss_rank_avg": 0.032727207988500595, "step": 1220, "valid_targets_mean": 8760.9, "valid_targets_min": 3157 }, { "epoch": 1.17568, "grad_norm": 0.12246093881306887, "learning_rate": 3.7822259183925324e-05, "loss": 0.1088, "loss_nan_ranks": 0, "loss_rank_avg": 0.03792506083846092, "step": 1225, "valid_targets_mean": 8479.7, "valid_targets_min": 2780 }, { "epoch": 1.18048, "grad_norm": 0.11630087988559276, "learning_rate": 3.7791756235768476e-05, "loss": 0.1126, "loss_nan_ranks": 0, "loss_rank_avg": 0.030140887945890427, "step": 1230, "valid_targets_mean": 8280.7, "valid_targets_min": 1912 }, { "epoch": 1.1852800000000001, "grad_norm": 0.12034312206493047, "learning_rate": 3.7761053624561104e-05, "loss": 0.1118, "loss_nan_ranks": 0, "loss_rank_avg": 0.041859276592731476, "step": 1235, "valid_targets_mean": 9125.2, "valid_targets_min": 4384 }, { "epoch": 1.19008, "grad_norm": 0.12495575991658803, "learning_rate": 3.7730151694854757e-05, "loss": 0.1107, "loss_nan_ranks": 0, "loss_rank_avg": 0.03812647983431816, "step": 1240, "valid_targets_mean": 8895.1, "valid_targets_min": 3239 }, { "epoch": 1.19488, "grad_norm": 0.1279797576014592, "learning_rate": 3.769905079343777e-05, "loss": 0.1094, "loss_nan_ranks": 0, "loss_rank_avg": 0.03480718284845352, "step": 1245, "valid_targets_mean": 9148.8, "valid_targets_min": 3375 }, { "epoch": 1.19968, "grad_norm": 0.1429209094833432, "learning_rate": 3.766775126933138e-05, "loss": 0.1146, "loss_nan_ranks": 0, "loss_rank_avg": 0.03262244164943695, "step": 1250, "valid_targets_mean": 7446.3, "valid_targets_min": 1642 }, { "epoch": 1.20448, "grad_norm": 0.11651049817133567, "learning_rate": 3.7636253473785815e-05, "loss": 0.1107, "loss_nan_ranks": 0, "loss_rank_avg": 0.04041413217782974, "step": 1255, "valid_targets_mean": 9296.9, "valid_targets_min": 1921 }, { "epoch": 1.20928, "grad_norm": 0.12715956000371428, "learning_rate": 3.760455776027636e-05, "loss": 0.1102, "loss_nan_ranks": 0, "loss_rank_avg": 0.036815039813518524, "step": 1260, "valid_targets_mean": 8492.6, "valid_targets_min": 2198 }, { "epoch": 1.21408, "grad_norm": 0.13088428982143835, "learning_rate": 3.7572664484499365e-05, "loss": 0.1116, "loss_nan_ranks": 0, "loss_rank_avg": 0.04161841422319412, "step": 1265, "valid_targets_mean": 9645.4, "valid_targets_min": 5888 }, { "epoch": 1.21888, "grad_norm": 0.11844945935335202, "learning_rate": 3.7540574004368264e-05, "loss": 0.1105, "loss_nan_ranks": 0, "loss_rank_avg": 0.035760242491960526, "step": 1270, "valid_targets_mean": 8232.6, "valid_targets_min": 972 }, { "epoch": 1.2236799999999999, "grad_norm": 0.1217454331633701, "learning_rate": 3.750828668000959e-05, "loss": 0.1111, "loss_nan_ranks": 0, "loss_rank_avg": 0.044121257960796356, "step": 1275, "valid_targets_mean": 9731.1, "valid_targets_min": 4826 }, { "epoch": 1.22848, "grad_norm": 0.11438951119465016, "learning_rate": 3.747580287375887e-05, "loss": 0.1094, "loss_nan_ranks": 0, "loss_rank_avg": 0.03459799289703369, "step": 1280, "valid_targets_mean": 8311.7, "valid_targets_min": 3380 }, { "epoch": 1.23328, "grad_norm": 0.12344370046566683, "learning_rate": 3.744312295015662e-05, "loss": 0.1098, "loss_nan_ranks": 0, "loss_rank_avg": 0.03901112824678421, "step": 1285, "valid_targets_mean": 9534.2, "valid_targets_min": 4213 }, { "epoch": 1.23808, "grad_norm": 0.1282738291200301, "learning_rate": 3.7410247275944223e-05, "loss": 0.1118, "loss_nan_ranks": 0, "loss_rank_avg": 0.0330953374505043, "step": 1290, "valid_targets_mean": 7552.4, "valid_targets_min": 1647 }, { "epoch": 1.24288, "grad_norm": 0.11797698703131318, "learning_rate": 3.737717622005981e-05, "loss": 0.1128, "loss_nan_ranks": 0, "loss_rank_avg": 0.04117663949728012, "step": 1295, "valid_targets_mean": 8844.8, "valid_targets_min": 4651 }, { "epoch": 1.24768, "grad_norm": 0.12402104881406364, "learning_rate": 3.734391015363413e-05, "loss": 0.1138, "loss_nan_ranks": 0, "loss_rank_avg": 0.03869440779089928, "step": 1300, "valid_targets_mean": 9305.2, "valid_targets_min": 3205 }, { "epoch": 1.25248, "grad_norm": 0.11958484310256949, "learning_rate": 3.7310449449986404e-05, "loss": 0.1073, "loss_nan_ranks": 0, "loss_rank_avg": 0.035795748233795166, "step": 1305, "valid_targets_mean": 9048.6, "valid_targets_min": 4788 }, { "epoch": 1.25728, "grad_norm": 0.13049242536465502, "learning_rate": 3.727679448462009e-05, "loss": 0.1098, "loss_nan_ranks": 0, "loss_rank_avg": 0.03678382933139801, "step": 1310, "valid_targets_mean": 8353.3, "valid_targets_min": 2833 }, { "epoch": 1.26208, "grad_norm": 0.1181583760477813, "learning_rate": 3.7242945635218696e-05, "loss": 0.1067, "loss_nan_ranks": 0, "loss_rank_avg": 0.03211447596549988, "step": 1315, "valid_targets_mean": 8366.3, "valid_targets_min": 1833 }, { "epoch": 1.26688, "grad_norm": 0.11742791216030482, "learning_rate": 3.720890328164156e-05, "loss": 0.1084, "loss_nan_ranks": 0, "loss_rank_avg": 0.042314011603593826, "step": 1320, "valid_targets_mean": 9944.7, "valid_targets_min": 3926 }, { "epoch": 1.27168, "grad_norm": 0.11792444140621308, "learning_rate": 3.717466780591956e-05, "loss": 0.1076, "loss_nan_ranks": 0, "loss_rank_avg": 0.037658244371414185, "step": 1325, "valid_targets_mean": 8533.1, "valid_targets_min": 2539 }, { "epoch": 1.27648, "grad_norm": 0.12225024480557042, "learning_rate": 3.7140239592250804e-05, "loss": 0.1062, "loss_nan_ranks": 0, "loss_rank_avg": 0.037245847284793854, "step": 1330, "valid_targets_mean": 9268.9, "valid_targets_min": 5670 }, { "epoch": 1.28128, "grad_norm": 0.12318589546339119, "learning_rate": 3.71056190269964e-05, "loss": 0.1077, "loss_nan_ranks": 0, "loss_rank_avg": 0.034685347229242325, "step": 1335, "valid_targets_mean": 8202.7, "valid_targets_min": 1834 }, { "epoch": 1.2860800000000001, "grad_norm": 0.12403966425319882, "learning_rate": 3.7070806498676025e-05, "loss": 0.1111, "loss_nan_ranks": 0, "loss_rank_avg": 0.042274922132492065, "step": 1340, "valid_targets_mean": 9153.2, "valid_targets_min": 4013 }, { "epoch": 1.29088, "grad_norm": 0.11766905420453012, "learning_rate": 3.7035802397963625e-05, "loss": 0.1071, "loss_nan_ranks": 0, "loss_rank_avg": 0.0366162545979023, "step": 1345, "valid_targets_mean": 8794.9, "valid_targets_min": 1738 }, { "epoch": 1.29568, "grad_norm": 0.12007586908411454, "learning_rate": 3.700060711768302e-05, "loss": 0.1061, "loss_nan_ranks": 0, "loss_rank_avg": 0.033832572400569916, "step": 1350, "valid_targets_mean": 9080.9, "valid_targets_min": 3899 }, { "epoch": 1.30048, "grad_norm": 0.11667979309051224, "learning_rate": 3.696522105280348e-05, "loss": 0.1073, "loss_nan_ranks": 0, "loss_rank_avg": 0.036710452288389206, "step": 1355, "valid_targets_mean": 9003.8, "valid_targets_min": 2184 }, { "epoch": 1.30528, "grad_norm": 0.1263624995125729, "learning_rate": 3.6929644600435303e-05, "loss": 0.1084, "loss_nan_ranks": 0, "loss_rank_avg": 0.03441833704710007, "step": 1360, "valid_targets_mean": 8348.5, "valid_targets_min": 2806 }, { "epoch": 1.3100800000000001, "grad_norm": 0.11740982313324688, "learning_rate": 3.689387815982536e-05, "loss": 0.1063, "loss_nan_ranks": 0, "loss_rank_avg": 0.038560301065444946, "step": 1365, "valid_targets_mean": 9448.6, "valid_targets_min": 1822 }, { "epoch": 1.31488, "grad_norm": 0.1252151515739968, "learning_rate": 3.6857922132352617e-05, "loss": 0.1116, "loss_nan_ranks": 0, "loss_rank_avg": 0.03624051809310913, "step": 1370, "valid_targets_mean": 8632.9, "valid_targets_min": 2701 }, { "epoch": 1.31968, "grad_norm": 0.13381310745789513, "learning_rate": 3.6821776921523615e-05, "loss": 0.103, "loss_nan_ranks": 0, "loss_rank_avg": 0.0364258736371994, "step": 1375, "valid_targets_mean": 8644.5, "valid_targets_min": 4506 }, { "epoch": 1.3244799999999999, "grad_norm": 0.1264214384761902, "learning_rate": 3.678544293296797e-05, "loss": 0.1052, "loss_nan_ranks": 0, "loss_rank_avg": 0.034762680530548096, "step": 1380, "valid_targets_mean": 8907.5, "valid_targets_min": 3498 }, { "epoch": 1.32928, "grad_norm": 0.11949522852717019, "learning_rate": 3.674892057443378e-05, "loss": 0.1066, "loss_nan_ranks": 0, "loss_rank_avg": 0.03189823776483536, "step": 1385, "valid_targets_mean": 8336.2, "valid_targets_min": 2895 }, { "epoch": 1.33408, "grad_norm": 0.12933718554974194, "learning_rate": 3.671221025578309e-05, "loss": 0.1069, "loss_nan_ranks": 0, "loss_rank_avg": 0.03692135214805603, "step": 1390, "valid_targets_mean": 8362.5, "valid_targets_min": 2327 }, { "epoch": 1.33888, "grad_norm": 0.1370376515161672, "learning_rate": 3.6675312388987274e-05, "loss": 0.1085, "loss_nan_ranks": 0, "loss_rank_avg": 0.03446727246046066, "step": 1395, "valid_targets_mean": 8036.2, "valid_targets_min": 3531 }, { "epoch": 1.34368, "grad_norm": 0.11519564170999727, "learning_rate": 3.663822738812241e-05, "loss": 0.1033, "loss_nan_ranks": 0, "loss_rank_avg": 0.03143679350614548, "step": 1400, "valid_targets_mean": 8900.0, "valid_targets_min": 4505 }, { "epoch": 1.34848, "grad_norm": 0.13667160069855397, "learning_rate": 3.660095566936462e-05, "loss": 0.107, "loss_nan_ranks": 0, "loss_rank_avg": 0.04038439691066742, "step": 1405, "valid_targets_mean": 8623.7, "valid_targets_min": 2516 }, { "epoch": 1.35328, "grad_norm": 0.11628807563727038, "learning_rate": 3.656349765098546e-05, "loss": 0.103, "loss_nan_ranks": 0, "loss_rank_avg": 0.03632277250289917, "step": 1410, "valid_targets_mean": 9662.0, "valid_targets_min": 5223 }, { "epoch": 1.35808, "grad_norm": 0.12165285738799775, "learning_rate": 3.652585375334714e-05, "loss": 0.1052, "loss_nan_ranks": 0, "loss_rank_avg": 0.03766203299164772, "step": 1415, "valid_targets_mean": 9023.7, "valid_targets_min": 2526 }, { "epoch": 1.36288, "grad_norm": 0.1210936758517175, "learning_rate": 3.648802439889785e-05, "loss": 0.107, "loss_nan_ranks": 0, "loss_rank_avg": 0.03593523055315018, "step": 1420, "valid_targets_mean": 8797.6, "valid_targets_min": 1723 }, { "epoch": 1.36768, "grad_norm": 0.12212797482243638, "learning_rate": 3.645001001216705e-05, "loss": 0.1087, "loss_nan_ranks": 0, "loss_rank_avg": 0.03319096192717552, "step": 1425, "valid_targets_mean": 8514.3, "valid_targets_min": 1460 }, { "epoch": 1.37248, "grad_norm": 0.12043836652635324, "learning_rate": 3.641181101976065e-05, "loss": 0.1074, "loss_nan_ranks": 0, "loss_rank_avg": 0.039879005402326584, "step": 1430, "valid_targets_mean": 9830.4, "valid_targets_min": 6223 }, { "epoch": 1.37728, "grad_norm": 0.12419659997953224, "learning_rate": 3.637342785035624e-05, "loss": 0.1069, "loss_nan_ranks": 0, "loss_rank_avg": 0.03451387211680412, "step": 1435, "valid_targets_mean": 7784.2, "valid_targets_min": 3446 }, { "epoch": 1.38208, "grad_norm": 0.12369177870382055, "learning_rate": 3.633486093469829e-05, "loss": 0.1023, "loss_nan_ranks": 0, "loss_rank_avg": 0.03320624306797981, "step": 1440, "valid_targets_mean": 8363.7, "valid_targets_min": 2814 }, { "epoch": 1.3868800000000001, "grad_norm": 0.11909211402446875, "learning_rate": 3.629611070559333e-05, "loss": 0.1054, "loss_nan_ranks": 0, "loss_rank_avg": 0.03433164581656456, "step": 1445, "valid_targets_mean": 8183.8, "valid_targets_min": 3490 }, { "epoch": 1.39168, "grad_norm": 0.11691264105478555, "learning_rate": 3.625717759790506e-05, "loss": 0.1038, "loss_nan_ranks": 0, "loss_rank_avg": 0.0365409217774868, "step": 1450, "valid_targets_mean": 9171.9, "valid_targets_min": 4784 }, { "epoch": 1.39648, "grad_norm": 0.125375436081025, "learning_rate": 3.621806204854947e-05, "loss": 0.1049, "loss_nan_ranks": 0, "loss_rank_avg": 0.03655450791120529, "step": 1455, "valid_targets_mean": 8703.1, "valid_targets_min": 4353 }, { "epoch": 1.40128, "grad_norm": 0.1286467880870536, "learning_rate": 3.617876449648998e-05, "loss": 0.1055, "loss_nan_ranks": 0, "loss_rank_avg": 0.039029087871313095, "step": 1460, "valid_targets_mean": 9403.0, "valid_targets_min": 3483 }, { "epoch": 1.40608, "grad_norm": 0.11716905685866259, "learning_rate": 3.613928538273247e-05, "loss": 0.1045, "loss_nan_ranks": 0, "loss_rank_avg": 0.035078015178442, "step": 1465, "valid_targets_mean": 9139.4, "valid_targets_min": 3472 }, { "epoch": 1.4108800000000001, "grad_norm": 0.11672670553448981, "learning_rate": 3.609962515032034e-05, "loss": 0.1038, "loss_nan_ranks": 0, "loss_rank_avg": 0.03533966466784477, "step": 1470, "valid_targets_mean": 9032.0, "valid_targets_min": 1767 }, { "epoch": 1.41568, "grad_norm": 0.1243509687324732, "learning_rate": 3.605978424432954e-05, "loss": 0.1027, "loss_nan_ranks": 0, "loss_rank_avg": 0.03651345893740654, "step": 1475, "valid_targets_mean": 8722.7, "valid_targets_min": 2884 }, { "epoch": 1.42048, "grad_norm": 0.12648765813571894, "learning_rate": 3.601976311186361e-05, "loss": 0.1071, "loss_nan_ranks": 0, "loss_rank_avg": 0.03581051528453827, "step": 1480, "valid_targets_mean": 8290.9, "valid_targets_min": 2516 }, { "epoch": 1.4252799999999999, "grad_norm": 0.11343351700255543, "learning_rate": 3.597956220204861e-05, "loss": 0.1029, "loss_nan_ranks": 0, "loss_rank_avg": 0.036967843770980835, "step": 1485, "valid_targets_mean": 9481.8, "valid_targets_min": 2996 }, { "epoch": 1.43008, "grad_norm": 0.1177270154654175, "learning_rate": 3.5939181966028084e-05, "loss": 0.1058, "loss_nan_ranks": 0, "loss_rank_avg": 0.036307480186223984, "step": 1490, "valid_targets_mean": 9119.7, "valid_targets_min": 2089 }, { "epoch": 1.43488, "grad_norm": 0.11948223416122511, "learning_rate": 3.589862285695804e-05, "loss": 0.1055, "loss_nan_ranks": 0, "loss_rank_avg": 0.03213457390666008, "step": 1495, "valid_targets_mean": 8838.8, "valid_targets_min": 3712 }, { "epoch": 1.43968, "grad_norm": 0.1211211334641555, "learning_rate": 3.585788533000184e-05, "loss": 0.1025, "loss_nan_ranks": 0, "loss_rank_avg": 0.03254202753305435, "step": 1500, "valid_targets_mean": 8756.7, "valid_targets_min": 3942 }, { "epoch": 1.44448, "grad_norm": 0.11573696505962047, "learning_rate": 3.581696984232508e-05, "loss": 0.1042, "loss_nan_ranks": 0, "loss_rank_avg": 0.027192670851945877, "step": 1505, "valid_targets_mean": 7469.8, "valid_targets_min": 3106 }, { "epoch": 1.44928, "grad_norm": 0.12070460723365516, "learning_rate": 3.5775876853090465e-05, "loss": 0.1049, "loss_nan_ranks": 0, "loss_rank_avg": 0.03165585547685623, "step": 1510, "valid_targets_mean": 8158.2, "valid_targets_min": 2105 }, { "epoch": 1.45408, "grad_norm": 0.11620223694923805, "learning_rate": 3.5734606823452686e-05, "loss": 0.1047, "loss_nan_ranks": 0, "loss_rank_avg": 0.037208959460258484, "step": 1515, "valid_targets_mean": 9556.5, "valid_targets_min": 4435 }, { "epoch": 1.45888, "grad_norm": 0.11920297505293288, "learning_rate": 3.569316021655319e-05, "loss": 0.1012, "loss_nan_ranks": 0, "loss_rank_avg": 0.02987070195376873, "step": 1520, "valid_targets_mean": 8496.3, "valid_targets_min": 1915 }, { "epoch": 1.46368, "grad_norm": 0.1268442978445187, "learning_rate": 3.565153749751505e-05, "loss": 0.1041, "loss_nan_ranks": 0, "loss_rank_avg": 0.03451787680387497, "step": 1525, "valid_targets_mean": 9130.9, "valid_targets_min": 2246 }, { "epoch": 1.46848, "grad_norm": 0.11701707630340304, "learning_rate": 3.5609739133437666e-05, "loss": 0.1038, "loss_nan_ranks": 0, "loss_rank_avg": 0.038270652294158936, "step": 1530, "valid_targets_mean": 9155.3, "valid_targets_min": 2324 }, { "epoch": 1.47328, "grad_norm": 0.1282421956144873, "learning_rate": 3.55677655933916e-05, "loss": 0.1025, "loss_nan_ranks": 0, "loss_rank_avg": 0.03175165131688118, "step": 1535, "valid_targets_mean": 8443.1, "valid_targets_min": 2640 }, { "epoch": 1.47808, "grad_norm": 0.11886359147221487, "learning_rate": 3.5525617348413265e-05, "loss": 0.1008, "loss_nan_ranks": 0, "loss_rank_avg": 0.035145074129104614, "step": 1540, "valid_targets_mean": 9429.3, "valid_targets_min": 4368 }, { "epoch": 1.48288, "grad_norm": 0.11951433549636696, "learning_rate": 3.5483294871499646e-05, "loss": 0.1009, "loss_nan_ranks": 0, "loss_rank_avg": 0.032362401485443115, "step": 1545, "valid_targets_mean": 8555.6, "valid_targets_min": 1834 }, { "epoch": 1.4876800000000001, "grad_norm": 0.1342430527003154, "learning_rate": 3.544079863760302e-05, "loss": 0.1009, "loss_nan_ranks": 0, "loss_rank_avg": 0.03826196864247322, "step": 1550, "valid_targets_mean": 8434.8, "valid_targets_min": 2927 }, { "epoch": 1.49248, "grad_norm": 0.1212927589438056, "learning_rate": 3.5398129123625565e-05, "loss": 0.1042, "loss_nan_ranks": 0, "loss_rank_avg": 0.03314611315727234, "step": 1555, "valid_targets_mean": 8709.2, "valid_targets_min": 3627 }, { "epoch": 1.49728, "grad_norm": 0.1259979005913219, "learning_rate": 3.535528680841408e-05, "loss": 0.1005, "loss_nan_ranks": 0, "loss_rank_avg": 0.03330939635634422, "step": 1560, "valid_targets_mean": 9163.6, "valid_targets_min": 3883 }, { "epoch": 1.5020799999999999, "grad_norm": 0.12508394927198732, "learning_rate": 3.5312272172754566e-05, "loss": 0.1007, "loss_nan_ranks": 0, "loss_rank_avg": 0.03124111518263817, "step": 1565, "valid_targets_mean": 7667.9, "valid_targets_min": 1721 }, { "epoch": 1.50688, "grad_norm": 0.11330418088972559, "learning_rate": 3.5269085699366844e-05, "loss": 0.1025, "loss_nan_ranks": 0, "loss_rank_avg": 0.03747326508164406, "step": 1570, "valid_targets_mean": 9535.7, "valid_targets_min": 3502 }, { "epoch": 1.5116800000000001, "grad_norm": 0.1238192398134257, "learning_rate": 3.5225727872899136e-05, "loss": 0.1052, "loss_nan_ranks": 0, "loss_rank_avg": 0.03966061398386955, "step": 1575, "valid_targets_mean": 9409.5, "valid_targets_min": 2901 }, { "epoch": 1.51648, "grad_norm": 0.12732035071816244, "learning_rate": 3.518219917992262e-05, "loss": 0.1007, "loss_nan_ranks": 0, "loss_rank_avg": 0.04096482694149017, "step": 1580, "valid_targets_mean": 9869.8, "valid_targets_min": 4770 }, { "epoch": 1.52128, "grad_norm": 0.1342131928296109, "learning_rate": 3.5138500108926e-05, "loss": 0.1022, "loss_nan_ranks": 0, "loss_rank_avg": 0.03232832998037338, "step": 1585, "valid_targets_mean": 7960.3, "valid_targets_min": 1879 }, { "epoch": 1.5260799999999999, "grad_norm": 0.1279082191084901, "learning_rate": 3.509463115030995e-05, "loss": 0.1003, "loss_nan_ranks": 0, "loss_rank_avg": 0.033002547919750214, "step": 1590, "valid_targets_mean": 8454.8, "valid_targets_min": 1940 }, { "epoch": 1.53088, "grad_norm": 0.2811577290255808, "learning_rate": 3.505059279638172e-05, "loss": 0.1005, "loss_nan_ranks": 0, "loss_rank_avg": 0.02976314350962639, "step": 1595, "valid_targets_mean": 8734.9, "valid_targets_min": 3366 }, { "epoch": 1.5356800000000002, "grad_norm": 0.11869308529617718, "learning_rate": 3.500638554134952e-05, "loss": 0.0996, "loss_nan_ranks": 0, "loss_rank_avg": 0.03650416061282158, "step": 1600, "valid_targets_mean": 9252.2, "valid_targets_min": 4673 }, { "epoch": 1.54048, "grad_norm": 0.12182529682260378, "learning_rate": 3.4962009881317005e-05, "loss": 0.1, "loss_nan_ranks": 0, "loss_rank_avg": 0.03326595202088356, "step": 1605, "valid_targets_mean": 8089.7, "valid_targets_min": 2269 }, { "epoch": 1.54528, "grad_norm": 0.11767713809063114, "learning_rate": 3.491746631427772e-05, "loss": 0.102, "loss_nan_ranks": 0, "loss_rank_avg": 0.04178375005722046, "step": 1610, "valid_targets_mean": 9172.2, "valid_targets_min": 2496 }, { "epoch": 1.55008, "grad_norm": 0.13558879371333668, "learning_rate": 3.487275534010948e-05, "loss": 0.1007, "loss_nan_ranks": 0, "loss_rank_avg": 0.034719523042440414, "step": 1615, "valid_targets_mean": 8640.8, "valid_targets_min": 2299 }, { "epoch": 1.55488, "grad_norm": 0.11731890716900249, "learning_rate": 3.482787746056881e-05, "loss": 0.099, "loss_nan_ranks": 0, "loss_rank_avg": 0.03394527733325958, "step": 1620, "valid_targets_mean": 9216.6, "valid_targets_min": 3766 }, { "epoch": 1.55968, "grad_norm": 0.11494354049312823, "learning_rate": 3.4782833179285256e-05, "loss": 0.0997, "loss_nan_ranks": 0, "loss_rank_avg": 0.03388223424553871, "step": 1625, "valid_targets_mean": 8900.3, "valid_targets_min": 3332 }, { "epoch": 1.56448, "grad_norm": 0.10943738571395106, "learning_rate": 3.473762300175578e-05, "loss": 0.0999, "loss_nan_ranks": 0, "loss_rank_avg": 0.030476726591587067, "step": 1630, "valid_targets_mean": 8088.4, "valid_targets_min": 3008 }, { "epoch": 1.56928, "grad_norm": 0.11506597550483152, "learning_rate": 3.469224743533906e-05, "loss": 0.098, "loss_nan_ranks": 0, "loss_rank_avg": 0.031209899112582207, "step": 1635, "valid_targets_mean": 9256.1, "valid_targets_min": 4635 }, { "epoch": 1.57408, "grad_norm": 0.13082551295998132, "learning_rate": 3.464670698924981e-05, "loss": 0.1008, "loss_nan_ranks": 0, "loss_rank_avg": 0.03382524102926254, "step": 1640, "valid_targets_mean": 8714.7, "valid_targets_min": 3433 }, { "epoch": 1.5788799999999998, "grad_norm": 0.12427360078336991, "learning_rate": 3.4601002174553055e-05, "loss": 0.1038, "loss_nan_ranks": 0, "loss_rank_avg": 0.03731769323348999, "step": 1645, "valid_targets_mean": 8702.7, "valid_targets_min": 2481 }, { "epoch": 1.58368, "grad_norm": 0.11446263987092861, "learning_rate": 3.45551335041584e-05, "loss": 0.1004, "loss_nan_ranks": 0, "loss_rank_avg": 0.034496426582336426, "step": 1650, "valid_targets_mean": 9184.0, "valid_targets_min": 3710 }, { "epoch": 1.5884800000000001, "grad_norm": 0.12739756370428226, "learning_rate": 3.4509101492814286e-05, "loss": 0.0994, "loss_nan_ranks": 0, "loss_rank_avg": 0.034381356090307236, "step": 1655, "valid_targets_mean": 8748.2, "valid_targets_min": 1423 }, { "epoch": 1.59328, "grad_norm": 0.11751460240058818, "learning_rate": 3.446290665710219e-05, "loss": 0.1019, "loss_nan_ranks": 0, "loss_rank_avg": 0.029714802280068398, "step": 1660, "valid_targets_mean": 7678.1, "valid_targets_min": 2099 }, { "epoch": 1.59808, "grad_norm": 0.11814198326450993, "learning_rate": 3.441654951543085e-05, "loss": 0.0992, "loss_nan_ranks": 0, "loss_rank_avg": 0.036534734070301056, "step": 1665, "valid_targets_mean": 9461.3, "valid_targets_min": 4091 }, { "epoch": 1.6028799999999999, "grad_norm": 0.11295334978255936, "learning_rate": 3.4370030588030425e-05, "loss": 0.0997, "loss_nan_ranks": 0, "loss_rank_avg": 0.032168176025152206, "step": 1670, "valid_targets_mean": 8824.2, "valid_targets_min": 5342 }, { "epoch": 1.60768, "grad_norm": 0.11944262820417971, "learning_rate": 3.432335039694669e-05, "loss": 0.1009, "loss_nan_ranks": 0, "loss_rank_avg": 0.03803761303424835, "step": 1675, "valid_targets_mean": 8744.9, "valid_targets_min": 1956 }, { "epoch": 1.6124800000000001, "grad_norm": 0.1188365242887442, "learning_rate": 3.427650946603513e-05, "loss": 0.0996, "loss_nan_ranks": 0, "loss_rank_avg": 0.031139787286520004, "step": 1680, "valid_targets_mean": 8154.3, "valid_targets_min": 1736 }, { "epoch": 1.61728, "grad_norm": 0.12123730509386084, "learning_rate": 3.422950832095511e-05, "loss": 0.0994, "loss_nan_ranks": 0, "loss_rank_avg": 0.03488922864198685, "step": 1685, "valid_targets_mean": 8890.8, "valid_targets_min": 2762 }, { "epoch": 1.62208, "grad_norm": 0.12417921438454016, "learning_rate": 3.418234748916395e-05, "loss": 0.1001, "loss_nan_ranks": 0, "loss_rank_avg": 0.03286389634013176, "step": 1690, "valid_targets_mean": 8685.7, "valid_targets_min": 4649 }, { "epoch": 1.6268799999999999, "grad_norm": 0.12427965821978078, "learning_rate": 3.4135027499911003e-05, "loss": 0.1015, "loss_nan_ranks": 0, "loss_rank_avg": 0.03643377870321274, "step": 1695, "valid_targets_mean": 9603.3, "valid_targets_min": 4519 }, { "epoch": 1.63168, "grad_norm": 0.12379457220006589, "learning_rate": 3.408754888423173e-05, "loss": 0.1035, "loss_nan_ranks": 0, "loss_rank_avg": 0.03129050135612488, "step": 1700, "valid_targets_mean": 8723.2, "valid_targets_min": 3745 }, { "epoch": 1.6364800000000002, "grad_norm": 0.12275475278899578, "learning_rate": 3.403991217494172e-05, "loss": 0.1036, "loss_nan_ranks": 0, "loss_rank_avg": 0.031930018216371536, "step": 1705, "valid_targets_mean": 8601.5, "valid_targets_min": 3257 }, { "epoch": 1.64128, "grad_norm": 0.1201804881346642, "learning_rate": 3.3992117906630744e-05, "loss": 0.1, "loss_nan_ranks": 0, "loss_rank_avg": 0.03500905632972717, "step": 1710, "valid_targets_mean": 9292.2, "valid_targets_min": 2432 }, { "epoch": 1.64608, "grad_norm": 0.12998259303408505, "learning_rate": 3.394416661565671e-05, "loss": 0.0993, "loss_nan_ranks": 0, "loss_rank_avg": 0.03601759672164917, "step": 1715, "valid_targets_mean": 9329.5, "valid_targets_min": 3473 }, { "epoch": 1.65088, "grad_norm": 0.15209411679668441, "learning_rate": 3.389605884013969e-05, "loss": 0.0997, "loss_nan_ranks": 0, "loss_rank_avg": 0.03493211418390274, "step": 1720, "valid_targets_mean": 8974.5, "valid_targets_min": 3096 }, { "epoch": 1.65568, "grad_norm": 0.11967594276263603, "learning_rate": 3.384779511995587e-05, "loss": 0.1004, "loss_nan_ranks": 0, "loss_rank_avg": 0.028926797211170197, "step": 1725, "valid_targets_mean": 8098.5, "valid_targets_min": 3942 }, { "epoch": 1.66048, "grad_norm": 0.1263183650621345, "learning_rate": 3.379937599673144e-05, "loss": 0.0968, "loss_nan_ranks": 0, "loss_rank_avg": 0.029895996674895287, "step": 1730, "valid_targets_mean": 9455.5, "valid_targets_min": 4168 }, { "epoch": 1.66528, "grad_norm": 0.1116628577909989, "learning_rate": 3.3750802013836596e-05, "loss": 0.0961, "loss_nan_ranks": 0, "loss_rank_avg": 0.029331346973776817, "step": 1735, "valid_targets_mean": 8593.4, "valid_targets_min": 2814 }, { "epoch": 1.67008, "grad_norm": 0.11669743828129955, "learning_rate": 3.370207371637939e-05, "loss": 0.0981, "loss_nan_ranks": 0, "loss_rank_avg": 0.03486446291208267, "step": 1740, "valid_targets_mean": 8908.1, "valid_targets_min": 3582 }, { "epoch": 1.67488, "grad_norm": 0.11206048763400174, "learning_rate": 3.3653191651199635e-05, "loss": 0.0973, "loss_nan_ranks": 0, "loss_rank_avg": 0.029872918501496315, "step": 1745, "valid_targets_mean": 8751.2, "valid_targets_min": 3097 }, { "epoch": 1.6796799999999998, "grad_norm": 0.12149392067550448, "learning_rate": 3.360415636686274e-05, "loss": 0.0992, "loss_nan_ranks": 0, "loss_rank_avg": 0.03125841170549393, "step": 1750, "valid_targets_mean": 9348.4, "valid_targets_min": 1952 }, { "epoch": 1.68448, "grad_norm": 0.11409949572763738, "learning_rate": 3.355496841365359e-05, "loss": 0.0998, "loss_nan_ranks": 0, "loss_rank_avg": 0.034153811633586884, "step": 1755, "valid_targets_mean": 9130.1, "valid_targets_min": 3227 }, { "epoch": 1.6892800000000001, "grad_norm": 0.12180781545084879, "learning_rate": 3.350562834357034e-05, "loss": 0.0995, "loss_nan_ranks": 0, "loss_rank_avg": 0.03245352953672409, "step": 1760, "valid_targets_mean": 8648.5, "valid_targets_min": 4313 }, { "epoch": 1.69408, "grad_norm": 0.13247571796223342, "learning_rate": 3.345613671031827e-05, "loss": 0.1011, "loss_nan_ranks": 0, "loss_rank_avg": 0.03612162172794342, "step": 1765, "valid_targets_mean": 8704.3, "valid_targets_min": 4184 }, { "epoch": 1.69888, "grad_norm": 0.21647507224098106, "learning_rate": 3.340649406930349e-05, "loss": 0.0977, "loss_nan_ranks": 0, "loss_rank_avg": 0.029728224501013756, "step": 1770, "valid_targets_mean": 8391.2, "valid_targets_min": 1727 }, { "epoch": 1.7036799999999999, "grad_norm": 0.12422077040157983, "learning_rate": 3.335670097762677e-05, "loss": 0.0997, "loss_nan_ranks": 0, "loss_rank_avg": 0.029321834444999695, "step": 1775, "valid_targets_mean": 8637.8, "valid_targets_min": 1912 }, { "epoch": 1.70848, "grad_norm": 0.11698536286578931, "learning_rate": 3.330675799407728e-05, "loss": 0.1, "loss_nan_ranks": 0, "loss_rank_avg": 0.032984182238578796, "step": 1780, "valid_targets_mean": 8554.4, "valid_targets_min": 3850 }, { "epoch": 1.7132800000000001, "grad_norm": 0.12071451043408635, "learning_rate": 3.32566656791263e-05, "loss": 0.0989, "loss_nan_ranks": 0, "loss_rank_avg": 0.030606457963585854, "step": 1785, "valid_targets_mean": 8076.9, "valid_targets_min": 1413 }, { "epoch": 1.71808, "grad_norm": 0.12127568160825884, "learning_rate": 3.320642459492095e-05, "loss": 0.0953, "loss_nan_ranks": 0, "loss_rank_avg": 0.03138080984354019, "step": 1790, "valid_targets_mean": 8827.6, "valid_targets_min": 3318 }, { "epoch": 1.72288, "grad_norm": 0.12309891269800873, "learning_rate": 3.315603530527785e-05, "loss": 0.0989, "loss_nan_ranks": 0, "loss_rank_avg": 0.034938737750053406, "step": 1795, "valid_targets_mean": 8190.7, "valid_targets_min": 1990 }, { "epoch": 1.7276799999999999, "grad_norm": 0.13448328329653705, "learning_rate": 3.310549837567685e-05, "loss": 0.094, "loss_nan_ranks": 0, "loss_rank_avg": 0.03196977078914642, "step": 1800, "valid_targets_mean": 8209.2, "valid_targets_min": 4291 }, { "epoch": 1.73248, "grad_norm": 0.1270134755763155, "learning_rate": 3.3054814373254615e-05, "loss": 0.0989, "loss_nan_ranks": 0, "loss_rank_avg": 0.03308798000216484, "step": 1805, "valid_targets_mean": 9097.6, "valid_targets_min": 3023 }, { "epoch": 1.7372800000000002, "grad_norm": 0.1215462716174612, "learning_rate": 3.300398386679831e-05, "loss": 0.097, "loss_nan_ranks": 0, "loss_rank_avg": 0.03231578692793846, "step": 1810, "valid_targets_mean": 8737.8, "valid_targets_min": 2789 }, { "epoch": 1.74208, "grad_norm": 0.12659381214839838, "learning_rate": 3.2953007426739204e-05, "loss": 0.0994, "loss_nan_ranks": 0, "loss_rank_avg": 0.030647259205579758, "step": 1815, "valid_targets_mean": 9287.0, "valid_targets_min": 3191 }, { "epoch": 1.74688, "grad_norm": 0.12152296869764756, "learning_rate": 3.290188562514624e-05, "loss": 0.0973, "loss_nan_ranks": 0, "loss_rank_avg": 0.02994205430150032, "step": 1820, "valid_targets_mean": 8389.3, "valid_targets_min": 4479 }, { "epoch": 1.75168, "grad_norm": 0.11579730176913727, "learning_rate": 3.285061903571968e-05, "loss": 0.0976, "loss_nan_ranks": 0, "loss_rank_avg": 0.03409838303923607, "step": 1825, "valid_targets_mean": 8725.6, "valid_targets_min": 3671 }, { "epoch": 1.75648, "grad_norm": 0.12042202731658365, "learning_rate": 3.27992082337846e-05, "loss": 0.0944, "loss_nan_ranks": 0, "loss_rank_avg": 0.03129231929779053, "step": 1830, "valid_targets_mean": 8376.2, "valid_targets_min": 2786 }, { "epoch": 1.76128, "grad_norm": 0.1150574556332984, "learning_rate": 3.274765379628447e-05, "loss": 0.0935, "loss_nan_ranks": 0, "loss_rank_avg": 0.03116718865931034, "step": 1835, "valid_targets_mean": 9754.7, "valid_targets_min": 2668 }, { "epoch": 1.76608, "grad_norm": 0.12221087122396483, "learning_rate": 3.2695956301774664e-05, "loss": 0.0993, "loss_nan_ranks": 0, "loss_rank_avg": 0.03059461899101734, "step": 1840, "valid_targets_mean": 8807.2, "valid_targets_min": 1560 }, { "epoch": 1.77088, "grad_norm": 0.12550586828813198, "learning_rate": 3.264411633041598e-05, "loss": 0.0996, "loss_nan_ranks": 0, "loss_rank_avg": 0.03288565203547478, "step": 1845, "valid_targets_mean": 8430.9, "valid_targets_min": 4166 }, { "epoch": 1.77568, "grad_norm": 0.11800390703235397, "learning_rate": 3.259213446396812e-05, "loss": 0.0971, "loss_nan_ranks": 0, "loss_rank_avg": 0.03617793321609497, "step": 1850, "valid_targets_mean": 8808.0, "valid_targets_min": 2379 }, { "epoch": 1.7804799999999998, "grad_norm": 0.12065501117992328, "learning_rate": 3.254001128578317e-05, "loss": 0.0971, "loss_nan_ranks": 0, "loss_rank_avg": 0.03944634646177292, "step": 1855, "valid_targets_mean": 9181.4, "valid_targets_min": 3240 }, { "epoch": 1.78528, "grad_norm": 0.12815781801241774, "learning_rate": 3.2487747380799036e-05, "loss": 0.0973, "loss_nan_ranks": 0, "loss_rank_avg": 0.03340938687324524, "step": 1860, "valid_targets_mean": 9103.5, "valid_targets_min": 5535 }, { "epoch": 1.7900800000000001, "grad_norm": 0.12256539621255265, "learning_rate": 3.243534333553291e-05, "loss": 0.096, "loss_nan_ranks": 0, "loss_rank_avg": 0.03244269639253616, "step": 1865, "valid_targets_mean": 9035.9, "valid_targets_min": 3874 }, { "epoch": 1.79488, "grad_norm": 0.11939887366602382, "learning_rate": 3.2382799738074635e-05, "loss": 0.0963, "loss_nan_ranks": 0, "loss_rank_avg": 0.036362893879413605, "step": 1870, "valid_targets_mean": 9146.4, "valid_targets_min": 3073 }, { "epoch": 1.79968, "grad_norm": 0.11295140221263837, "learning_rate": 3.2330117178080184e-05, "loss": 0.0957, "loss_nan_ranks": 0, "loss_rank_avg": 0.03275471180677414, "step": 1875, "valid_targets_mean": 9356.5, "valid_targets_min": 3597 }, { "epoch": 1.8044799999999999, "grad_norm": 0.11596482995260982, "learning_rate": 3.227729624676497e-05, "loss": 0.0991, "loss_nan_ranks": 0, "loss_rank_avg": 0.033212386071681976, "step": 1880, "valid_targets_mean": 8404.9, "valid_targets_min": 1753 }, { "epoch": 1.80928, "grad_norm": 0.12299614142264025, "learning_rate": 3.222433753689724e-05, "loss": 0.0954, "loss_nan_ranks": 0, "loss_rank_avg": 0.030806001275777817, "step": 1885, "valid_targets_mean": 9172.8, "valid_targets_min": 2605 }, { "epoch": 1.8140800000000001, "grad_norm": 0.12294732258255374, "learning_rate": 3.2171241642791443e-05, "loss": 0.0963, "loss_nan_ranks": 0, "loss_rank_avg": 0.03270886838436127, "step": 1890, "valid_targets_mean": 8817.4, "valid_targets_min": 3170 }, { "epoch": 1.81888, "grad_norm": 0.12454651137241947, "learning_rate": 3.211800916030152e-05, "loss": 0.0964, "loss_nan_ranks": 0, "loss_rank_avg": 0.03188232332468033, "step": 1895, "valid_targets_mean": 8884.1, "valid_targets_min": 3236 }, { "epoch": 1.82368, "grad_norm": 0.11875714790732037, "learning_rate": 3.206464068681424e-05, "loss": 0.0962, "loss_nan_ranks": 0, "loss_rank_avg": 0.03125854209065437, "step": 1900, "valid_targets_mean": 8837.4, "valid_targets_min": 3141 }, { "epoch": 1.8284799999999999, "grad_norm": 0.25615170544022126, "learning_rate": 3.20111368212425e-05, "loss": 0.0972, "loss_nan_ranks": 0, "loss_rank_avg": 0.031216248869895935, "step": 1905, "valid_targets_mean": 8927.4, "valid_targets_min": 2351 }, { "epoch": 1.83328, "grad_norm": 0.11553048251166381, "learning_rate": 3.19574981640186e-05, "loss": 0.097, "loss_nan_ranks": 0, "loss_rank_avg": 0.032985836267471313, "step": 1910, "valid_targets_mean": 9137.7, "valid_targets_min": 2457 }, { "epoch": 1.8380800000000002, "grad_norm": 0.12332033201339215, "learning_rate": 3.1903725317087495e-05, "loss": 0.0962, "loss_nan_ranks": 0, "loss_rank_avg": 0.02826140820980072, "step": 1915, "valid_targets_mean": 7582.6, "valid_targets_min": 1979 }, { "epoch": 1.84288, "grad_norm": 0.12373198100671594, "learning_rate": 3.184981888390003e-05, "loss": 0.0943, "loss_nan_ranks": 0, "loss_rank_avg": 0.03438425809144974, "step": 1920, "valid_targets_mean": 8750.5, "valid_targets_min": 3715 }, { "epoch": 1.84768, "grad_norm": 0.11898830073691476, "learning_rate": 3.1795779469406226e-05, "loss": 0.0996, "loss_nan_ranks": 0, "loss_rank_avg": 0.027855921536684036, "step": 1925, "valid_targets_mean": 8388.7, "valid_targets_min": 3606 }, { "epoch": 1.85248, "grad_norm": 0.13049198537601311, "learning_rate": 3.174160768004842e-05, "loss": 0.0938, "loss_nan_ranks": 0, "loss_rank_avg": 0.03077923133969307, "step": 1930, "valid_targets_mean": 9521.2, "valid_targets_min": 3478 }, { "epoch": 1.85728, "grad_norm": 0.12890383965255006, "learning_rate": 3.168730412375449e-05, "loss": 0.0954, "loss_nan_ranks": 0, "loss_rank_avg": 0.033480048179626465, "step": 1935, "valid_targets_mean": 8513.8, "valid_targets_min": 2941 }, { "epoch": 1.86208, "grad_norm": 0.1259489564584358, "learning_rate": 3.1632869409931036e-05, "loss": 0.096, "loss_nan_ranks": 0, "loss_rank_avg": 0.03304038196802139, "step": 1940, "valid_targets_mean": 8453.8, "valid_targets_min": 3095 }, { "epoch": 1.86688, "grad_norm": 0.12379490782070443, "learning_rate": 3.1578304149456544e-05, "loss": 0.0935, "loss_nan_ranks": 0, "loss_rank_avg": 0.02992902509868145, "step": 1945, "valid_targets_mean": 8997.7, "valid_targets_min": 2944 }, { "epoch": 1.87168, "grad_norm": 0.1908649386565199, "learning_rate": 3.1523608954674524e-05, "loss": 0.0985, "loss_nan_ranks": 0, "loss_rank_avg": 0.030526556074619293, "step": 1950, "valid_targets_mean": 8728.9, "valid_targets_min": 3733 }, { "epoch": 1.87648, "grad_norm": 0.12058817025819538, "learning_rate": 3.1468784439386614e-05, "loss": 0.0978, "loss_nan_ranks": 0, "loss_rank_avg": 0.029100410640239716, "step": 1955, "valid_targets_mean": 7976.5, "valid_targets_min": 1588 }, { "epoch": 1.8812799999999998, "grad_norm": 0.12374514028101315, "learning_rate": 3.141383121884576e-05, "loss": 0.0956, "loss_nan_ranks": 0, "loss_rank_avg": 0.030075032263994217, "step": 1960, "valid_targets_mean": 9350.9, "valid_targets_min": 2993 }, { "epoch": 1.88608, "grad_norm": 0.12949723183843131, "learning_rate": 3.1358749909749214e-05, "loss": 0.0957, "loss_nan_ranks": 0, "loss_rank_avg": 0.02782047912478447, "step": 1965, "valid_targets_mean": 8918.0, "valid_targets_min": 4011 }, { "epoch": 1.8908800000000001, "grad_norm": 0.12321752636472717, "learning_rate": 3.1303541130231703e-05, "loss": 0.0956, "loss_nan_ranks": 0, "loss_rank_avg": 0.03179875388741493, "step": 1970, "valid_targets_mean": 8427.1, "valid_targets_min": 2242 }, { "epoch": 1.89568, "grad_norm": 0.1250357323229381, "learning_rate": 3.1248205499858446e-05, "loss": 0.0974, "loss_nan_ranks": 0, "loss_rank_avg": 0.031728826463222504, "step": 1975, "valid_targets_mean": 8332.0, "valid_targets_min": 1698 }, { "epoch": 1.90048, "grad_norm": 0.1269808845116901, "learning_rate": 3.119274363961821e-05, "loss": 0.0976, "loss_nan_ranks": 0, "loss_rank_avg": 0.030242368578910828, "step": 1980, "valid_targets_mean": 8013.0, "valid_targets_min": 2329 }, { "epoch": 1.9052799999999999, "grad_norm": 0.12594906129488526, "learning_rate": 3.113715617191634e-05, "loss": 0.0956, "loss_nan_ranks": 0, "loss_rank_avg": 0.033120714128017426, "step": 1985, "valid_targets_mean": 9525.1, "valid_targets_min": 5176 }, { "epoch": 1.91008, "grad_norm": 0.1128437524239124, "learning_rate": 3.1081443720567785e-05, "loss": 0.0976, "loss_nan_ranks": 0, "loss_rank_avg": 0.03407108783721924, "step": 1990, "valid_targets_mean": 8913.7, "valid_targets_min": 2222 }, { "epoch": 1.9148800000000001, "grad_norm": 0.12271441054409966, "learning_rate": 3.102560691079007e-05, "loss": 0.0944, "loss_nan_ranks": 0, "loss_rank_avg": 0.03202490508556366, "step": 1995, "valid_targets_mean": 8219.6, "valid_targets_min": 4856 }, { "epoch": 1.91968, "grad_norm": 0.11928104900985406, "learning_rate": 3.0969646369196307e-05, "loss": 0.0935, "loss_nan_ranks": 0, "loss_rank_avg": 0.03154480457305908, "step": 2000, "valid_targets_mean": 7679.9, "valid_targets_min": 2327 }, { "epoch": 1.92448, "grad_norm": 0.11764578388415199, "learning_rate": 3.0913562723788174e-05, "loss": 0.0937, "loss_nan_ranks": 0, "loss_rank_avg": 0.028950994834303856, "step": 2005, "valid_targets_mean": 8590.5, "valid_targets_min": 2687 }, { "epoch": 1.9292799999999999, "grad_norm": 0.11959529477268145, "learning_rate": 3.085735660394881e-05, "loss": 0.096, "loss_nan_ranks": 0, "loss_rank_avg": 0.03188043832778931, "step": 2010, "valid_targets_mean": 8712.7, "valid_targets_min": 2239 }, { "epoch": 1.93408, "grad_norm": 0.12288064731447748, "learning_rate": 3.080102864043581e-05, "loss": 0.0953, "loss_nan_ranks": 0, "loss_rank_avg": 0.03270117938518524, "step": 2015, "valid_targets_mean": 8825.5, "valid_targets_min": 2184 }, { "epoch": 1.9388800000000002, "grad_norm": 0.12062672309603491, "learning_rate": 3.074457946537413e-05, "loss": 0.0947, "loss_nan_ranks": 0, "loss_rank_avg": 0.03260117769241333, "step": 2020, "valid_targets_mean": 8145.7, "valid_targets_min": 3013 }, { "epoch": 1.94368, "grad_norm": 0.11717401223355793, "learning_rate": 3.068800971224898e-05, "loss": 0.0938, "loss_nan_ranks": 0, "loss_rank_avg": 0.030992349609732628, "step": 2025, "valid_targets_mean": 8825.3, "valid_targets_min": 1526 }, { "epoch": 1.94848, "grad_norm": 0.11964450711810551, "learning_rate": 3.0631320015898735e-05, "loss": 0.0949, "loss_nan_ranks": 0, "loss_rank_avg": 0.03208611160516739, "step": 2030, "valid_targets_mean": 9341.5, "valid_targets_min": 4514 }, { "epoch": 1.95328, "grad_norm": 0.1300777102273075, "learning_rate": 3.057451101250778e-05, "loss": 0.0926, "loss_nan_ranks": 0, "loss_rank_avg": 0.027757877483963966, "step": 2035, "valid_targets_mean": 8905.0, "valid_targets_min": 4482 }, { "epoch": 1.95808, "grad_norm": 0.13016926678324173, "learning_rate": 3.051758333959941e-05, "loss": 0.0938, "loss_nan_ranks": 0, "loss_rank_avg": 0.034215047955513, "step": 2040, "valid_targets_mean": 9087.2, "valid_targets_min": 4268 }, { "epoch": 1.96288, "grad_norm": 0.13459529117746524, "learning_rate": 3.046053763602865e-05, "loss": 0.097, "loss_nan_ranks": 0, "loss_rank_avg": 0.03139539062976837, "step": 2045, "valid_targets_mean": 7871.2, "valid_targets_min": 2346 }, { "epoch": 1.96768, "grad_norm": 0.11324489273915117, "learning_rate": 3.0403374541975078e-05, "loss": 0.0928, "loss_nan_ranks": 0, "loss_rank_avg": 0.029846232384443283, "step": 2050, "valid_targets_mean": 8258.1, "valid_targets_min": 2241 }, { "epoch": 1.97248, "grad_norm": 0.11489197140280931, "learning_rate": 3.034609469893567e-05, "loss": 0.0929, "loss_nan_ranks": 0, "loss_rank_avg": 0.032914385199546814, "step": 2055, "valid_targets_mean": 9554.0, "valid_targets_min": 4598 }, { "epoch": 1.97728, "grad_norm": 0.11581208074394174, "learning_rate": 3.028869874971758e-05, "loss": 0.0959, "loss_nan_ranks": 0, "loss_rank_avg": 0.03447406738996506, "step": 2060, "valid_targets_mean": 8354.8, "valid_targets_min": 2758 }, { "epoch": 1.9820799999999998, "grad_norm": 0.11852330994590476, "learning_rate": 3.0231187338430944e-05, "loss": 0.0931, "loss_nan_ranks": 0, "loss_rank_avg": 0.03049747459590435, "step": 2065, "valid_targets_mean": 8763.3, "valid_targets_min": 3186 }, { "epoch": 1.98688, "grad_norm": 0.12012402161638631, "learning_rate": 3.0173561110481606e-05, "loss": 0.0943, "loss_nan_ranks": 0, "loss_rank_avg": 0.030883774161338806, "step": 2070, "valid_targets_mean": 9102.0, "valid_targets_min": 3763 }, { "epoch": 1.9916800000000001, "grad_norm": 0.12029947880726818, "learning_rate": 3.011582071256394e-05, "loss": 0.0938, "loss_nan_ranks": 0, "loss_rank_avg": 0.03472603112459183, "step": 2075, "valid_targets_mean": 9187.4, "valid_targets_min": 4685 }, { "epoch": 1.99648, "grad_norm": 0.12080815720093505, "learning_rate": 3.0057966792653547e-05, "loss": 0.0956, "loss_nan_ranks": 0, "loss_rank_avg": 0.03140140324831009, "step": 2080, "valid_targets_mean": 7961.4, "valid_targets_min": 2523 }, { "epoch": 2.00096, "grad_norm": 0.127348881807781, "learning_rate": 3.0000000000000004e-05, "loss": 0.0898, "loss_nan_ranks": 0, "loss_rank_avg": 0.029651004821062088, "step": 2085, "valid_targets_mean": 9488.9, "valid_targets_min": 2667 }, { "epoch": 2.00576, "grad_norm": 0.12239161231781547, "learning_rate": 2.9941920985119562e-05, "loss": 0.0878, "loss_nan_ranks": 0, "loss_rank_avg": 0.02701239474117756, "step": 2090, "valid_targets_mean": 8532.2, "valid_targets_min": 2701 }, { "epoch": 2.01056, "grad_norm": 0.11882885393990238, "learning_rate": 2.988373039978786e-05, "loss": 0.0868, "loss_nan_ranks": 0, "loss_rank_avg": 0.03091384470462799, "step": 2095, "valid_targets_mean": 9679.6, "valid_targets_min": 2730 }, { "epoch": 2.01536, "grad_norm": 0.11563223856575051, "learning_rate": 2.98254288970326e-05, "loss": 0.0863, "loss_nan_ranks": 0, "loss_rank_avg": 0.0300716795027256, "step": 2100, "valid_targets_mean": 8815.1, "valid_targets_min": 2632 }, { "epoch": 2.02016, "grad_norm": 0.12238216828812892, "learning_rate": 2.9767017131126245e-05, "loss": 0.0851, "loss_nan_ranks": 0, "loss_rank_avg": 0.031115412712097168, "step": 2105, "valid_targets_mean": 9428.0, "valid_targets_min": 4481 }, { "epoch": 2.02496, "grad_norm": 0.11820045344397803, "learning_rate": 2.9708495757578633e-05, "loss": 0.0855, "loss_nan_ranks": 0, "loss_rank_avg": 0.0273810513317585, "step": 2110, "valid_targets_mean": 8535.9, "valid_targets_min": 3766 }, { "epoch": 2.02976, "grad_norm": 0.110408263933541, "learning_rate": 2.964986543312964e-05, "loss": 0.0866, "loss_nan_ranks": 0, "loss_rank_avg": 0.02771226316690445, "step": 2115, "valid_targets_mean": 8563.7, "valid_targets_min": 2594 }, { "epoch": 2.03456, "grad_norm": 0.12029390455853219, "learning_rate": 2.9591126815741832e-05, "loss": 0.0869, "loss_nan_ranks": 0, "loss_rank_avg": 0.03002401813864708, "step": 2120, "valid_targets_mean": 8298.8, "valid_targets_min": 2022 }, { "epoch": 2.03936, "grad_norm": 0.11511228961091312, "learning_rate": 2.953228056459305e-05, "loss": 0.0849, "loss_nan_ranks": 0, "loss_rank_avg": 0.026876386255025864, "step": 2125, "valid_targets_mean": 9043.5, "valid_targets_min": 3188 }, { "epoch": 2.04416, "grad_norm": 0.1226523942167117, "learning_rate": 2.947332734006903e-05, "loss": 0.0866, "loss_nan_ranks": 0, "loss_rank_avg": 0.026805460453033447, "step": 2130, "valid_targets_mean": 8803.2, "valid_targets_min": 3904 }, { "epoch": 2.04896, "grad_norm": 0.11684267393301566, "learning_rate": 2.9414267803755988e-05, "loss": 0.0896, "loss_nan_ranks": 0, "loss_rank_avg": 0.03486183285713196, "step": 2135, "valid_targets_mean": 9706.5, "valid_targets_min": 3528 }, { "epoch": 2.05376, "grad_norm": 0.11633157562826041, "learning_rate": 2.9355102618433197e-05, "loss": 0.0867, "loss_nan_ranks": 0, "loss_rank_avg": 0.02780848927795887, "step": 2140, "valid_targets_mean": 8743.6, "valid_targets_min": 2084 }, { "epoch": 2.05856, "grad_norm": 0.1176794789427386, "learning_rate": 2.929583244806553e-05, "loss": 0.0864, "loss_nan_ranks": 0, "loss_rank_avg": 0.030458780005574226, "step": 2145, "valid_targets_mean": 7875.6, "valid_targets_min": 1516 }, { "epoch": 2.06336, "grad_norm": 0.11576596805179132, "learning_rate": 2.9236457957796047e-05, "loss": 0.0881, "loss_nan_ranks": 0, "loss_rank_avg": 0.025129785761237144, "step": 2150, "valid_targets_mean": 8653.1, "valid_targets_min": 1776 }, { "epoch": 2.0681599999999998, "grad_norm": 0.1125861546534315, "learning_rate": 2.9176979813938494e-05, "loss": 0.0847, "loss_nan_ranks": 0, "loss_rank_avg": 0.030581803992390633, "step": 2155, "valid_targets_mean": 7886.0, "valid_targets_min": 3848 }, { "epoch": 2.07296, "grad_norm": 0.11990337393515425, "learning_rate": 2.9117398683969857e-05, "loss": 0.0897, "loss_nan_ranks": 0, "loss_rank_avg": 0.02741706185042858, "step": 2160, "valid_targets_mean": 8171.0, "valid_targets_min": 1914 }, { "epoch": 2.07776, "grad_norm": 0.12242894662914258, "learning_rate": 2.9057715236522833e-05, "loss": 0.0877, "loss_nan_ranks": 0, "loss_rank_avg": 0.029523633420467377, "step": 2165, "valid_targets_mean": 8559.4, "valid_targets_min": 3236 }, { "epoch": 2.08256, "grad_norm": 0.1241427713541584, "learning_rate": 2.899793014137836e-05, "loss": 0.0863, "loss_nan_ranks": 0, "loss_rank_avg": 0.030984241515398026, "step": 2170, "valid_targets_mean": 9196.1, "valid_targets_min": 3004 }, { "epoch": 2.08736, "grad_norm": 0.12063838069741276, "learning_rate": 2.8938044069458094e-05, "loss": 0.0855, "loss_nan_ranks": 0, "loss_rank_avg": 0.028892911970615387, "step": 2175, "valid_targets_mean": 8572.5, "valid_targets_min": 3225 }, { "epoch": 2.09216, "grad_norm": 0.11160240696578047, "learning_rate": 2.8878057692816877e-05, "loss": 0.0863, "loss_nan_ranks": 0, "loss_rank_avg": 0.026819078251719475, "step": 2180, "valid_targets_mean": 8104.5, "valid_targets_min": 2774 }, { "epoch": 2.09696, "grad_norm": 0.15191956279033425, "learning_rate": 2.8817971684635178e-05, "loss": 0.0888, "loss_nan_ranks": 0, "loss_rank_avg": 0.02786080725491047, "step": 2185, "valid_targets_mean": 8554.4, "valid_targets_min": 1925 }, { "epoch": 2.10176, "grad_norm": 0.12240055182601953, "learning_rate": 2.8757786719211555e-05, "loss": 0.0856, "loss_nan_ranks": 0, "loss_rank_avg": 0.02772444486618042, "step": 2190, "valid_targets_mean": 8159.0, "valid_targets_min": 2615 }, { "epoch": 2.10656, "grad_norm": 0.11643689287045982, "learning_rate": 2.8697503471955106e-05, "loss": 0.0847, "loss_nan_ranks": 0, "loss_rank_avg": 0.02837887965142727, "step": 2195, "valid_targets_mean": 8464.4, "valid_targets_min": 1413 }, { "epoch": 2.11136, "grad_norm": 0.11654047788382643, "learning_rate": 2.8637122619377848e-05, "loss": 0.0866, "loss_nan_ranks": 0, "loss_rank_avg": 0.03045256994664669, "step": 2200, "valid_targets_mean": 8479.0, "valid_targets_min": 3845 }, { "epoch": 2.11616, "grad_norm": 0.12522178378425464, "learning_rate": 2.8576644839087152e-05, "loss": 0.0885, "loss_nan_ranks": 0, "loss_rank_avg": 0.03251127153635025, "step": 2205, "valid_targets_mean": 9498.2, "valid_targets_min": 3661 }, { "epoch": 2.12096, "grad_norm": 0.1828803070115879, "learning_rate": 2.8516070809778145e-05, "loss": 0.086, "loss_nan_ranks": 0, "loss_rank_avg": 0.02694122865796089, "step": 2210, "valid_targets_mean": 8186.5, "valid_targets_min": 2913 }, { "epoch": 2.12576, "grad_norm": 0.11379440969301187, "learning_rate": 2.845540121122607e-05, "loss": 0.0835, "loss_nan_ranks": 0, "loss_rank_avg": 0.02929331548511982, "step": 2215, "valid_targets_mean": 8543.1, "valid_targets_min": 2580 }, { "epoch": 2.13056, "grad_norm": 0.13579664419486132, "learning_rate": 2.839463672427867e-05, "loss": 0.086, "loss_nan_ranks": 0, "loss_rank_avg": 0.029128937050700188, "step": 2220, "valid_targets_mean": 8281.3, "valid_targets_min": 2203 }, { "epoch": 2.13536, "grad_norm": 0.15179636273038324, "learning_rate": 2.833377803084855e-05, "loss": 0.0848, "loss_nan_ranks": 0, "loss_rank_avg": 0.03110337257385254, "step": 2225, "valid_targets_mean": 9488.6, "valid_targets_min": 3850 }, { "epoch": 2.14016, "grad_norm": 0.12272951835579388, "learning_rate": 2.8272825813905522e-05, "loss": 0.0866, "loss_nan_ranks": 0, "loss_rank_avg": 0.03079194948077202, "step": 2230, "valid_targets_mean": 8683.3, "valid_targets_min": 1928 }, { "epoch": 2.14496, "grad_norm": 0.12474318671383416, "learning_rate": 2.8211780757468942e-05, "loss": 0.089, "loss_nan_ranks": 0, "loss_rank_avg": 0.030205946415662766, "step": 2235, "valid_targets_mean": 8289.2, "valid_targets_min": 2163 }, { "epoch": 2.14976, "grad_norm": 0.11310821373925851, "learning_rate": 2.8150643546600012e-05, "loss": 0.0861, "loss_nan_ranks": 0, "loss_rank_avg": 0.025783589109778404, "step": 2240, "valid_targets_mean": 8930.8, "valid_targets_min": 2381 }, { "epoch": 2.15456, "grad_norm": 0.12359622662935445, "learning_rate": 2.808941486739414e-05, "loss": 0.0894, "loss_nan_ranks": 0, "loss_rank_avg": 0.02596352994441986, "step": 2245, "valid_targets_mean": 8079.3, "valid_targets_min": 2770 }, { "epoch": 2.15936, "grad_norm": 0.11807904032902185, "learning_rate": 2.80280954069732e-05, "loss": 0.0863, "loss_nan_ranks": 0, "loss_rank_avg": 0.027037806808948517, "step": 2250, "valid_targets_mean": 8114.3, "valid_targets_min": 2376 }, { "epoch": 2.16416, "grad_norm": 0.12242403638033678, "learning_rate": 2.7966685853477828e-05, "loss": 0.0879, "loss_nan_ranks": 0, "loss_rank_avg": 0.030830947682261467, "step": 2255, "valid_targets_mean": 9222.7, "valid_targets_min": 3138 }, { "epoch": 2.16896, "grad_norm": 0.11760527959631821, "learning_rate": 2.790518689605971e-05, "loss": 0.0839, "loss_nan_ranks": 0, "loss_rank_avg": 0.03028050996363163, "step": 2260, "valid_targets_mean": 8239.4, "valid_targets_min": 3664 }, { "epoch": 2.17376, "grad_norm": 0.12713317820214887, "learning_rate": 2.7843599224873833e-05, "loss": 0.0854, "loss_nan_ranks": 0, "loss_rank_avg": 0.029034830629825592, "step": 2265, "valid_targets_mean": 8398.4, "valid_targets_min": 2683 }, { "epoch": 2.17856, "grad_norm": 0.11448227095558705, "learning_rate": 2.7781923531070775e-05, "loss": 0.0831, "loss_nan_ranks": 0, "loss_rank_avg": 0.02563052624464035, "step": 2270, "valid_targets_mean": 9533.0, "valid_targets_min": 1521 }, { "epoch": 2.18336, "grad_norm": 0.12163245887119671, "learning_rate": 2.7720160506788896e-05, "loss": 0.0847, "loss_nan_ranks": 0, "loss_rank_avg": 0.026498647406697273, "step": 2275, "valid_targets_mean": 9146.3, "valid_targets_min": 3145 }, { "epoch": 2.18816, "grad_norm": 0.1227312763442586, "learning_rate": 2.7658310845146598e-05, "loss": 0.0858, "loss_nan_ranks": 0, "loss_rank_avg": 0.03034115955233574, "step": 2280, "valid_targets_mean": 9096.8, "valid_targets_min": 2617 }, { "epoch": 2.19296, "grad_norm": 0.13297660140986542, "learning_rate": 2.7596375240234574e-05, "loss": 0.0853, "loss_nan_ranks": 0, "loss_rank_avg": 0.026283323764801025, "step": 2285, "valid_targets_mean": 8396.1, "valid_targets_min": 1588 }, { "epoch": 2.19776, "grad_norm": 0.12220411513735026, "learning_rate": 2.7534354387107975e-05, "loss": 0.0885, "loss_nan_ranks": 0, "loss_rank_avg": 0.030644144862890244, "step": 2290, "valid_targets_mean": 8958.4, "valid_targets_min": 4317 }, { "epoch": 2.20256, "grad_norm": 0.11764379302404512, "learning_rate": 2.747224898177862e-05, "loss": 0.0836, "loss_nan_ranks": 0, "loss_rank_avg": 0.025263972580432892, "step": 2295, "valid_targets_mean": 9061.1, "valid_targets_min": 3336 }, { "epoch": 2.20736, "grad_norm": 0.12966871279969255, "learning_rate": 2.7410059721207187e-05, "loss": 0.0859, "loss_nan_ranks": 0, "loss_rank_avg": 0.028944432735443115, "step": 2300, "valid_targets_mean": 9488.6, "valid_targets_min": 3839 }, { "epoch": 2.21216, "grad_norm": 0.11142932566793738, "learning_rate": 2.734778730329543e-05, "loss": 0.0847, "loss_nan_ranks": 0, "loss_rank_avg": 0.03101763129234314, "step": 2305, "valid_targets_mean": 9028.5, "valid_targets_min": 1917 }, { "epoch": 2.21696, "grad_norm": 0.1143112294079201, "learning_rate": 2.7285432426878275e-05, "loss": 0.0891, "loss_nan_ranks": 0, "loss_rank_avg": 0.02940632961690426, "step": 2310, "valid_targets_mean": 9081.0, "valid_targets_min": 2201 }, { "epoch": 2.22176, "grad_norm": 0.14446948206235952, "learning_rate": 2.7222995791716034e-05, "loss": 0.0866, "loss_nan_ranks": 0, "loss_rank_avg": 0.029054325073957443, "step": 2315, "valid_targets_mean": 8472.1, "valid_targets_min": 2854 }, { "epoch": 2.22656, "grad_norm": 0.1298305463827391, "learning_rate": 2.716047809848653e-05, "loss": 0.0868, "loss_nan_ranks": 0, "loss_rank_avg": 0.027578776702284813, "step": 2320, "valid_targets_mean": 8983.7, "valid_targets_min": 2322 }, { "epoch": 2.23136, "grad_norm": 0.11734106721527403, "learning_rate": 2.7097880048777238e-05, "loss": 0.0883, "loss_nan_ranks": 0, "loss_rank_avg": 0.026591507717967033, "step": 2325, "valid_targets_mean": 8910.7, "valid_targets_min": 2719 }, { "epoch": 2.23616, "grad_norm": 0.1185128622335491, "learning_rate": 2.703520234507742e-05, "loss": 0.087, "loss_nan_ranks": 0, "loss_rank_avg": 0.028162341564893723, "step": 2330, "valid_targets_mean": 9224.5, "valid_targets_min": 2254 }, { "epoch": 2.24096, "grad_norm": 0.12387215840197503, "learning_rate": 2.697244569077021e-05, "loss": 0.0855, "loss_nan_ranks": 0, "loss_rank_avg": 0.02742118015885353, "step": 2335, "valid_targets_mean": 8428.2, "valid_targets_min": 2526 }, { "epoch": 2.24576, "grad_norm": 0.12075017881250852, "learning_rate": 2.6909610790124772e-05, "loss": 0.0871, "loss_nan_ranks": 0, "loss_rank_avg": 0.03025822341442108, "step": 2340, "valid_targets_mean": 9657.5, "valid_targets_min": 4578 }, { "epoch": 2.25056, "grad_norm": 0.11206154418590676, "learning_rate": 2.684669834828835e-05, "loss": 0.0855, "loss_nan_ranks": 0, "loss_rank_avg": 0.030417874455451965, "step": 2345, "valid_targets_mean": 9800.4, "valid_targets_min": 4694 }, { "epoch": 2.25536, "grad_norm": 0.12123597031997373, "learning_rate": 2.6783709071278372e-05, "loss": 0.0858, "loss_nan_ranks": 0, "loss_rank_avg": 0.02864830195903778, "step": 2350, "valid_targets_mean": 9171.4, "valid_targets_min": 3791 }, { "epoch": 2.26016, "grad_norm": 0.1124147307567478, "learning_rate": 2.6720643665974522e-05, "loss": 0.0855, "loss_nan_ranks": 0, "loss_rank_avg": 0.028500908985733986, "step": 2355, "valid_targets_mean": 8550.7, "valid_targets_min": 1956 }, { "epoch": 2.26496, "grad_norm": 0.12143490811782527, "learning_rate": 2.665750284011085e-05, "loss": 0.0856, "loss_nan_ranks": 0, "loss_rank_avg": 0.02900022640824318, "step": 2360, "valid_targets_mean": 8569.2, "valid_targets_min": 2633 }, { "epoch": 2.2697599999999998, "grad_norm": 0.14818249191876692, "learning_rate": 2.6594287302267744e-05, "loss": 0.0863, "loss_nan_ranks": 0, "loss_rank_avg": 0.030275695025920868, "step": 2365, "valid_targets_mean": 8356.2, "valid_targets_min": 3503 }, { "epoch": 2.27456, "grad_norm": 0.12193784051429168, "learning_rate": 2.653099776186405e-05, "loss": 0.0855, "loss_nan_ranks": 0, "loss_rank_avg": 0.030562900006771088, "step": 2370, "valid_targets_mean": 8735.8, "valid_targets_min": 3683 }, { "epoch": 2.27936, "grad_norm": 0.12820083550312378, "learning_rate": 2.646763492914908e-05, "loss": 0.089, "loss_nan_ranks": 0, "loss_rank_avg": 0.02770865336060524, "step": 2375, "valid_targets_mean": 8340.5, "valid_targets_min": 3782 }, { "epoch": 2.28416, "grad_norm": 0.12584158181503047, "learning_rate": 2.640419951519467e-05, "loss": 0.0846, "loss_nan_ranks": 0, "loss_rank_avg": 0.027583956718444824, "step": 2380, "valid_targets_mean": 8902.2, "valid_targets_min": 2519 }, { "epoch": 2.28896, "grad_norm": 0.11669888252699596, "learning_rate": 2.634069223188715e-05, "loss": 0.084, "loss_nan_ranks": 0, "loss_rank_avg": 0.02490045502781868, "step": 2385, "valid_targets_mean": 8558.5, "valid_targets_min": 1749 }, { "epoch": 2.29376, "grad_norm": 0.13839389337555474, "learning_rate": 2.627711379191939e-05, "loss": 0.0846, "loss_nan_ranks": 0, "loss_rank_avg": 0.03266286849975586, "step": 2390, "valid_targets_mean": 8944.8, "valid_targets_min": 1162 }, { "epoch": 2.29856, "grad_norm": 0.11514986701905704, "learning_rate": 2.621346490878281e-05, "loss": 0.0885, "loss_nan_ranks": 0, "loss_rank_avg": 0.02784108743071556, "step": 2395, "valid_targets_mean": 8955.2, "valid_targets_min": 3938 }, { "epoch": 2.30336, "grad_norm": 0.11881869791073651, "learning_rate": 2.614974629675935e-05, "loss": 0.092, "loss_nan_ranks": 0, "loss_rank_avg": 0.023495035246014595, "step": 2400, "valid_targets_mean": 7342.0, "valid_targets_min": 169 }, { "epoch": 2.30816, "grad_norm": 0.12360572532300317, "learning_rate": 2.608595867091346e-05, "loss": 0.0815, "loss_nan_ranks": 0, "loss_rank_avg": 0.027920987457036972, "step": 2405, "valid_targets_mean": 8327.4, "valid_targets_min": 2364 }, { "epoch": 2.31296, "grad_norm": 0.11715967892279636, "learning_rate": 2.6022102747084084e-05, "loss": 0.0842, "loss_nan_ranks": 0, "loss_rank_avg": 0.027643052861094475, "step": 2410, "valid_targets_mean": 7846.9, "valid_targets_min": 2577 }, { "epoch": 2.31776, "grad_norm": 0.12758321508927314, "learning_rate": 2.595817924187663e-05, "loss": 0.081, "loss_nan_ranks": 0, "loss_rank_avg": 0.02899922803044319, "step": 2415, "valid_targets_mean": 9130.7, "valid_targets_min": 3316 }, { "epoch": 2.32256, "grad_norm": 0.13414710490899953, "learning_rate": 2.589418887265489e-05, "loss": 0.0774, "loss_nan_ranks": 0, "loss_rank_avg": 0.026726992800831795, "step": 2420, "valid_targets_mean": 8485.5, "valid_targets_min": 3077 }, { "epoch": 2.32736, "grad_norm": 0.13587055559492064, "learning_rate": 2.5830132357533044e-05, "loss": 0.0845, "loss_nan_ranks": 0, "loss_rank_avg": 0.029106823727488518, "step": 2425, "valid_targets_mean": 8432.3, "valid_targets_min": 4446 }, { "epoch": 2.33216, "grad_norm": 0.15493957733521915, "learning_rate": 2.5766010415367567e-05, "loss": 0.0813, "loss_nan_ranks": 0, "loss_rank_avg": 0.022029448300600052, "step": 2430, "valid_targets_mean": 8394.6, "valid_targets_min": 3922 }, { "epoch": 2.33696, "grad_norm": 0.13728604655180596, "learning_rate": 2.5701823765749187e-05, "loss": 0.0807, "loss_nan_ranks": 0, "loss_rank_avg": 0.027791917324066162, "step": 2435, "valid_targets_mean": 8548.2, "valid_targets_min": 4766 }, { "epoch": 2.34176, "grad_norm": 0.1543128408800076, "learning_rate": 2.563757312899477e-05, "loss": 0.0821, "loss_nan_ranks": 0, "loss_rank_avg": 0.026925476267933846, "step": 2440, "valid_targets_mean": 8387.8, "valid_targets_min": 2338 }, { "epoch": 2.34656, "grad_norm": 0.13024914354519151, "learning_rate": 2.557325922613926e-05, "loss": 0.0791, "loss_nan_ranks": 0, "loss_rank_avg": 0.02424551174044609, "step": 2445, "valid_targets_mean": 7773.3, "valid_targets_min": 2357 }, { "epoch": 2.35136, "grad_norm": 0.11383491062887292, "learning_rate": 2.5508882778927615e-05, "loss": 0.0792, "loss_nan_ranks": 0, "loss_rank_avg": 0.02507830783724785, "step": 2450, "valid_targets_mean": 9141.1, "valid_targets_min": 2616 }, { "epoch": 2.35616, "grad_norm": 0.1354783740772417, "learning_rate": 2.5444444509806654e-05, "loss": 0.0778, "loss_nan_ranks": 0, "loss_rank_avg": 0.02786952257156372, "step": 2455, "valid_targets_mean": 9109.7, "valid_targets_min": 1796 }, { "epoch": 2.36096, "grad_norm": 0.12620305822721312, "learning_rate": 2.5379945141916976e-05, "loss": 0.0797, "loss_nan_ranks": 0, "loss_rank_avg": 0.026485783979296684, "step": 2460, "valid_targets_mean": 8629.1, "valid_targets_min": 1912 }, { "epoch": 2.36576, "grad_norm": 0.1257587782311723, "learning_rate": 2.531538539908486e-05, "loss": 0.0836, "loss_nan_ranks": 0, "loss_rank_avg": 0.03141780570149422, "step": 2465, "valid_targets_mean": 8329.3, "valid_targets_min": 2077 }, { "epoch": 2.3705600000000002, "grad_norm": 0.12781978557050486, "learning_rate": 2.5250766005814108e-05, "loss": 0.083, "loss_nan_ranks": 0, "loss_rank_avg": 0.026302650570869446, "step": 2470, "valid_targets_mean": 8031.9, "valid_targets_min": 2063 }, { "epoch": 2.37536, "grad_norm": 0.12209146990464828, "learning_rate": 2.5186087687277956e-05, "loss": 0.0812, "loss_nan_ranks": 0, "loss_rank_avg": 0.025557709857821465, "step": 2475, "valid_targets_mean": 8948.2, "valid_targets_min": 5096 }, { "epoch": 2.38016, "grad_norm": 0.1382679318537906, "learning_rate": 2.5121351169310887e-05, "loss": 0.078, "loss_nan_ranks": 0, "loss_rank_avg": 0.024665851145982742, "step": 2480, "valid_targets_mean": 8454.4, "valid_targets_min": 2141 }, { "epoch": 2.38496, "grad_norm": 0.13902487378784473, "learning_rate": 2.505655717840052e-05, "loss": 0.0778, "loss_nan_ranks": 0, "loss_rank_avg": 0.031393177807331085, "step": 2485, "valid_targets_mean": 8371.2, "valid_targets_min": 1984 }, { "epoch": 2.38976, "grad_norm": 0.13282389888635227, "learning_rate": 2.499170644167946e-05, "loss": 0.078, "loss_nan_ranks": 0, "loss_rank_avg": 0.024904152378439903, "step": 2490, "valid_targets_mean": 8406.3, "valid_targets_min": 1938 }, { "epoch": 2.3945600000000002, "grad_norm": 0.1299330392423453, "learning_rate": 2.49267996869171e-05, "loss": 0.079, "loss_nan_ranks": 0, "loss_rank_avg": 0.03227228298783302, "step": 2495, "valid_targets_mean": 9098.1, "valid_targets_min": 4981 }, { "epoch": 2.39936, "grad_norm": 0.1252546953275161, "learning_rate": 2.486183764251151e-05, "loss": 0.0804, "loss_nan_ranks": 0, "loss_rank_avg": 0.02573280595242977, "step": 2500, "valid_targets_mean": 8719.9, "valid_targets_min": 2288 }, { "epoch": 2.40416, "grad_norm": 0.12721435122351463, "learning_rate": 2.4796821037481215e-05, "loss": 0.0789, "loss_nan_ranks": 0, "loss_rank_avg": 0.027574259787797928, "step": 2505, "valid_targets_mean": 8806.6, "valid_targets_min": 1830 }, { "epoch": 2.40896, "grad_norm": 0.13390795751399273, "learning_rate": 2.473175060145703e-05, "loss": 0.0797, "loss_nan_ranks": 0, "loss_rank_avg": 0.026054752990603447, "step": 2510, "valid_targets_mean": 8937.4, "valid_targets_min": 2541 }, { "epoch": 2.41376, "grad_norm": 0.1184645193517672, "learning_rate": 2.4666627064673892e-05, "loss": 0.0793, "loss_nan_ranks": 0, "loss_rank_avg": 0.024346385151147842, "step": 2515, "valid_targets_mean": 7785.2, "valid_targets_min": 2980 }, { "epoch": 2.41856, "grad_norm": 0.1364358933879091, "learning_rate": 2.4601451157962616e-05, "loss": 0.0808, "loss_nan_ranks": 0, "loss_rank_avg": 0.029486022889614105, "step": 2520, "valid_targets_mean": 9084.0, "valid_targets_min": 4241 }, { "epoch": 2.42336, "grad_norm": 0.14177621555064562, "learning_rate": 2.4536223612741754e-05, "loss": 0.0792, "loss_nan_ranks": 0, "loss_rank_avg": 0.025790728628635406, "step": 2525, "valid_targets_mean": 9287.2, "valid_targets_min": 2587 }, { "epoch": 2.42816, "grad_norm": 0.12254560093831562, "learning_rate": 2.447094516100934e-05, "loss": 0.0801, "loss_nan_ranks": 0, "loss_rank_avg": 0.025828056037425995, "step": 2530, "valid_targets_mean": 8999.5, "valid_targets_min": 3557 }, { "epoch": 2.43296, "grad_norm": 0.12839180536574532, "learning_rate": 2.4405616535334695e-05, "loss": 0.079, "loss_nan_ranks": 0, "loss_rank_avg": 0.030729684978723526, "step": 2535, "valid_targets_mean": 9717.8, "valid_targets_min": 5031 }, { "epoch": 2.43776, "grad_norm": 0.11585615309614611, "learning_rate": 2.43402384688502e-05, "loss": 0.0769, "loss_nan_ranks": 0, "loss_rank_avg": 0.023497575893998146, "step": 2540, "valid_targets_mean": 9059.8, "valid_targets_min": 1635 }, { "epoch": 2.44256, "grad_norm": 0.12134766967020498, "learning_rate": 2.4274811695243085e-05, "loss": 0.0801, "loss_nan_ranks": 0, "loss_rank_avg": 0.02694030851125717, "step": 2545, "valid_targets_mean": 8850.2, "valid_targets_min": 3299 }, { "epoch": 2.4473599999999998, "grad_norm": 0.1316863971028815, "learning_rate": 2.4209336948747168e-05, "loss": 0.0803, "loss_nan_ranks": 0, "loss_rank_avg": 0.02972356602549553, "step": 2550, "valid_targets_mean": 9398.3, "valid_targets_min": 4232 }, { "epoch": 2.45216, "grad_norm": 0.12287062451907484, "learning_rate": 2.414381496413464e-05, "loss": 0.0782, "loss_nan_ranks": 0, "loss_rank_avg": 0.0246087945997715, "step": 2555, "valid_targets_mean": 8041.0, "valid_targets_min": 2944 }, { "epoch": 2.45696, "grad_norm": 0.12535471909521592, "learning_rate": 2.4078246476707793e-05, "loss": 0.0772, "loss_nan_ranks": 0, "loss_rank_avg": 0.024066515266895294, "step": 2560, "valid_targets_mean": 8603.2, "valid_targets_min": 2279 }, { "epoch": 2.46176, "grad_norm": 0.1264236899638182, "learning_rate": 2.4012632222290802e-05, "loss": 0.0774, "loss_nan_ranks": 0, "loss_rank_avg": 0.02529139630496502, "step": 2565, "valid_targets_mean": 8860.7, "valid_targets_min": 3159 }, { "epoch": 2.46656, "grad_norm": 0.12748116305719281, "learning_rate": 2.3946972937221444e-05, "loss": 0.0805, "loss_nan_ranks": 0, "loss_rank_avg": 0.03009450063109398, "step": 2570, "valid_targets_mean": 9358.7, "valid_targets_min": 1975 }, { "epoch": 2.47136, "grad_norm": 0.13952086450619908, "learning_rate": 2.3881269358342828e-05, "loss": 0.0785, "loss_nan_ranks": 0, "loss_rank_avg": 0.028878334909677505, "step": 2575, "valid_targets_mean": 8155.2, "valid_targets_min": 2432 }, { "epoch": 2.47616, "grad_norm": 0.12234682090534985, "learning_rate": 2.3815522222995158e-05, "loss": 0.0777, "loss_nan_ranks": 0, "loss_rank_avg": 0.023882580921053886, "step": 2580, "valid_targets_mean": 7829.0, "valid_targets_min": 2730 }, { "epoch": 2.48096, "grad_norm": 0.1212451765174174, "learning_rate": 2.3749732269007427e-05, "loss": 0.0781, "loss_nan_ranks": 0, "loss_rank_avg": 0.02354244887828827, "step": 2585, "valid_targets_mean": 8768.0, "valid_targets_min": 1602 }, { "epoch": 2.48576, "grad_norm": 0.12337580575976319, "learning_rate": 2.3683900234689142e-05, "loss": 0.075, "loss_nan_ranks": 0, "loss_rank_avg": 0.021861132234334946, "step": 2590, "valid_targets_mean": 8479.1, "valid_targets_min": 1756 }, { "epoch": 2.49056, "grad_norm": 0.1264164703524998, "learning_rate": 2.3618026858822054e-05, "loss": 0.0797, "loss_nan_ranks": 0, "loss_rank_avg": 0.030043430626392365, "step": 2595, "valid_targets_mean": 8425.5, "valid_targets_min": 2912 }, { "epoch": 2.49536, "grad_norm": 0.13322500466357357, "learning_rate": 2.355211288065187e-05, "loss": 0.0773, "loss_nan_ranks": 0, "loss_rank_avg": 0.02616289258003235, "step": 2600, "valid_targets_mean": 8737.0, "valid_targets_min": 2762 }, { "epoch": 2.50016, "grad_norm": 0.14281821332399597, "learning_rate": 2.348615903987991e-05, "loss": 0.0755, "loss_nan_ranks": 0, "loss_rank_avg": 0.027944108471274376, "step": 2605, "valid_targets_mean": 8119.4, "valid_targets_min": 1852 }, { "epoch": 2.50496, "grad_norm": 0.12278110816702006, "learning_rate": 2.3420166076654873e-05, "loss": 0.0767, "loss_nan_ranks": 0, "loss_rank_avg": 0.02698206529021263, "step": 2610, "valid_targets_mean": 9372.3, "valid_targets_min": 1970 }, { "epoch": 2.50976, "grad_norm": 0.12717072751197384, "learning_rate": 2.335413473156449e-05, "loss": 0.0796, "loss_nan_ranks": 0, "loss_rank_avg": 0.02557991072535515, "step": 2615, "valid_targets_mean": 8949.4, "valid_targets_min": 3090 }, { "epoch": 2.51456, "grad_norm": 0.1215114979896222, "learning_rate": 2.328806574562722e-05, "loss": 0.0774, "loss_nan_ranks": 0, "loss_rank_avg": 0.021433714777231216, "step": 2620, "valid_targets_mean": 8481.4, "valid_targets_min": 3181 }, { "epoch": 2.51936, "grad_norm": 0.13269527558167965, "learning_rate": 2.322195986028393e-05, "loss": 0.0778, "loss_nan_ranks": 0, "loss_rank_avg": 0.023230556398630142, "step": 2625, "valid_targets_mean": 8499.2, "valid_targets_min": 3799 }, { "epoch": 2.52416, "grad_norm": 0.12500369623855434, "learning_rate": 2.315581781738959e-05, "loss": 0.0771, "loss_nan_ranks": 0, "loss_rank_avg": 0.02225703001022339, "step": 2630, "valid_targets_mean": 8066.4, "valid_targets_min": 2881 }, { "epoch": 2.52896, "grad_norm": 0.12839309833611812, "learning_rate": 2.3089640359204937e-05, "loss": 0.0775, "loss_nan_ranks": 0, "loss_rank_avg": 0.02520071715116501, "step": 2635, "valid_targets_mean": 8992.2, "valid_targets_min": 1565 }, { "epoch": 2.53376, "grad_norm": 0.1309485140869025, "learning_rate": 2.3023428228388144e-05, "loss": 0.0765, "loss_nan_ranks": 0, "loss_rank_avg": 0.02432047203183174, "step": 2640, "valid_targets_mean": 8642.0, "valid_targets_min": 1852 }, { "epoch": 2.53856, "grad_norm": 0.13195500479172162, "learning_rate": 2.2957182167986486e-05, "loss": 0.0774, "loss_nan_ranks": 0, "loss_rank_avg": 0.02704329788684845, "step": 2645, "valid_targets_mean": 8725.4, "valid_targets_min": 2588 }, { "epoch": 2.54336, "grad_norm": 0.14879671880870712, "learning_rate": 2.2890902921428004e-05, "loss": 0.0757, "loss_nan_ranks": 0, "loss_rank_avg": 0.023556988686323166, "step": 2650, "valid_targets_mean": 8299.9, "valid_targets_min": 1915 }, { "epoch": 2.54816, "grad_norm": 0.13418012766582119, "learning_rate": 2.2824591232513153e-05, "loss": 0.0768, "loss_nan_ranks": 0, "loss_rank_avg": 0.024494722485542297, "step": 2655, "valid_targets_mean": 7699.7, "valid_targets_min": 1729 }, { "epoch": 2.55296, "grad_norm": 0.11860664564020829, "learning_rate": 2.2758247845406495e-05, "loss": 0.0759, "loss_nan_ranks": 0, "loss_rank_avg": 0.025114569813013077, "step": 2660, "valid_targets_mean": 8217.2, "valid_targets_min": 2032 }, { "epoch": 2.55776, "grad_norm": 0.13999752211175603, "learning_rate": 2.2691873504628282e-05, "loss": 0.0743, "loss_nan_ranks": 0, "loss_rank_avg": 0.02651476487517357, "step": 2665, "valid_targets_mean": 8598.3, "valid_targets_min": 3847 }, { "epoch": 2.56256, "grad_norm": 0.12447169923083799, "learning_rate": 2.2625468955046143e-05, "loss": 0.0771, "loss_nan_ranks": 0, "loss_rank_avg": 0.02548210322856903, "step": 2670, "valid_targets_mean": 8152.9, "valid_targets_min": 1921 }, { "epoch": 2.56736, "grad_norm": 0.1225074570696376, "learning_rate": 2.2559034941866727e-05, "loss": 0.0734, "loss_nan_ranks": 0, "loss_rank_avg": 0.025047052651643753, "step": 2675, "valid_targets_mean": 8584.6, "valid_targets_min": 2518 }, { "epoch": 2.5721600000000002, "grad_norm": 0.1257466044762218, "learning_rate": 2.2492572210627325e-05, "loss": 0.0754, "loss_nan_ranks": 0, "loss_rank_avg": 0.02429202012717724, "step": 2680, "valid_targets_mean": 8235.4, "valid_targets_min": 2038 }, { "epoch": 2.57696, "grad_norm": 0.13557857735015535, "learning_rate": 2.24260815071875e-05, "loss": 0.0743, "loss_nan_ranks": 0, "loss_rank_avg": 0.023734377697110176, "step": 2685, "valid_targets_mean": 8223.3, "valid_targets_min": 1543 }, { "epoch": 2.58176, "grad_norm": 0.12431085511827711, "learning_rate": 2.2359563577720743e-05, "loss": 0.0796, "loss_nan_ranks": 0, "loss_rank_avg": 0.026736926287412643, "step": 2690, "valid_targets_mean": 9182.7, "valid_targets_min": 3127 }, { "epoch": 2.58656, "grad_norm": 0.11900321217430507, "learning_rate": 2.229301916870606e-05, "loss": 0.0731, "loss_nan_ranks": 0, "loss_rank_avg": 0.027746083214879036, "step": 2695, "valid_targets_mean": 9351.5, "valid_targets_min": 4599 }, { "epoch": 2.59136, "grad_norm": 0.1383700323259459, "learning_rate": 2.2226449026919637e-05, "loss": 0.076, "loss_nan_ranks": 0, "loss_rank_avg": 0.029470983892679214, "step": 2700, "valid_targets_mean": 9054.1, "valid_targets_min": 5678 }, { "epoch": 2.5961600000000002, "grad_norm": 0.13012742542583644, "learning_rate": 2.2159853899426427e-05, "loss": 0.0768, "loss_nan_ranks": 0, "loss_rank_avg": 0.025567417964339256, "step": 2705, "valid_targets_mean": 9233.9, "valid_targets_min": 2233 }, { "epoch": 2.60096, "grad_norm": 0.12657750747445207, "learning_rate": 2.209323453357178e-05, "loss": 0.0774, "loss_nan_ranks": 0, "loss_rank_avg": 0.02532579004764557, "step": 2710, "valid_targets_mean": 8470.7, "valid_targets_min": 3447 }, { "epoch": 2.60576, "grad_norm": 0.13279951041017773, "learning_rate": 2.202659167697306e-05, "loss": 0.0764, "loss_nan_ranks": 0, "loss_rank_avg": 0.02570538967847824, "step": 2715, "valid_targets_mean": 9163.9, "valid_targets_min": 3626 }, { "epoch": 2.61056, "grad_norm": 0.12127499458765617, "learning_rate": 2.1959926077511234e-05, "loss": 0.0744, "loss_nan_ranks": 0, "loss_rank_avg": 0.020813290029764175, "step": 2720, "valid_targets_mean": 9457.5, "valid_targets_min": 2096 }, { "epoch": 2.61536, "grad_norm": 0.1253460206942048, "learning_rate": 2.1893238483322512e-05, "loss": 0.076, "loss_nan_ranks": 0, "loss_rank_avg": 0.023362675681710243, "step": 2725, "valid_targets_mean": 8545.1, "valid_targets_min": 2994 }, { "epoch": 2.6201600000000003, "grad_norm": 0.13220273622382875, "learning_rate": 2.1826529642789923e-05, "loss": 0.0744, "loss_nan_ranks": 0, "loss_rank_avg": 0.02266569808125496, "step": 2730, "valid_targets_mean": 8827.2, "valid_targets_min": 3646 }, { "epoch": 2.6249599999999997, "grad_norm": 0.1320216526163596, "learning_rate": 2.1759800304534936e-05, "loss": 0.0772, "loss_nan_ranks": 0, "loss_rank_avg": 0.027949821203947067, "step": 2735, "valid_targets_mean": 8625.2, "valid_targets_min": 2142 }, { "epoch": 2.62976, "grad_norm": 0.11911754506105855, "learning_rate": 2.1693051217409048e-05, "loss": 0.0778, "loss_nan_ranks": 0, "loss_rank_avg": 0.02508479729294777, "step": 2740, "valid_targets_mean": 8534.6, "valid_targets_min": 1960 }, { "epoch": 2.63456, "grad_norm": 0.12386094956552933, "learning_rate": 2.1626283130485365e-05, "loss": 0.0792, "loss_nan_ranks": 0, "loss_rank_avg": 0.02538812719285488, "step": 2745, "valid_targets_mean": 8241.4, "valid_targets_min": 2379 }, { "epoch": 2.63936, "grad_norm": 0.1730315798377173, "learning_rate": 2.1559496793050235e-05, "loss": 0.0769, "loss_nan_ranks": 0, "loss_rank_avg": 0.027699865400791168, "step": 2750, "valid_targets_mean": 9055.9, "valid_targets_min": 3489 }, { "epoch": 2.64416, "grad_norm": 0.12946922012219694, "learning_rate": 2.1492692954594815e-05, "loss": 0.0773, "loss_nan_ranks": 0, "loss_rank_avg": 0.02325347810983658, "step": 2755, "valid_targets_mean": 8042.9, "valid_targets_min": 2633 }, { "epoch": 2.6489599999999998, "grad_norm": 0.1366619849837903, "learning_rate": 2.1425872364806642e-05, "loss": 0.0775, "loss_nan_ranks": 0, "loss_rank_avg": 0.02587948739528656, "step": 2760, "valid_targets_mean": 8853.9, "valid_targets_min": 3540 }, { "epoch": 2.65376, "grad_norm": 0.12647286473054808, "learning_rate": 2.1359035773561275e-05, "loss": 0.0787, "loss_nan_ranks": 0, "loss_rank_avg": 0.029227159917354584, "step": 2765, "valid_targets_mean": 9773.8, "valid_targets_min": 3960 }, { "epoch": 2.65856, "grad_norm": 0.14185801754999453, "learning_rate": 2.1292183930913803e-05, "loss": 0.0749, "loss_nan_ranks": 0, "loss_rank_avg": 0.02531890943646431, "step": 2770, "valid_targets_mean": 8255.2, "valid_targets_min": 1987 }, { "epoch": 2.66336, "grad_norm": 0.12863813890549577, "learning_rate": 2.1225317587090507e-05, "loss": 0.0722, "loss_nan_ranks": 0, "loss_rank_avg": 0.027946345508098602, "step": 2775, "valid_targets_mean": 8502.0, "valid_targets_min": 1123 }, { "epoch": 2.66816, "grad_norm": 0.12736788349292172, "learning_rate": 2.1158437492480384e-05, "loss": 0.0716, "loss_nan_ranks": 0, "loss_rank_avg": 0.01997240260243416, "step": 2780, "valid_targets_mean": 7395.3, "valid_targets_min": 2185 }, { "epoch": 2.67296, "grad_norm": 0.12976383848578613, "learning_rate": 2.1091544397626752e-05, "loss": 0.0738, "loss_nan_ranks": 0, "loss_rank_avg": 0.025439299643039703, "step": 2785, "valid_targets_mean": 8741.4, "valid_targets_min": 3209 }, { "epoch": 2.67776, "grad_norm": 0.12360076149823336, "learning_rate": 2.102463905321881e-05, "loss": 0.0747, "loss_nan_ranks": 0, "loss_rank_avg": 0.023299697786569595, "step": 2790, "valid_targets_mean": 8274.7, "valid_targets_min": 3255 }, { "epoch": 2.68256, "grad_norm": 0.12579718860137898, "learning_rate": 2.095772221008323e-05, "loss": 0.0748, "loss_nan_ranks": 0, "loss_rank_avg": 0.024257106706500053, "step": 2795, "valid_targets_mean": 8911.9, "valid_targets_min": 5452 }, { "epoch": 2.68736, "grad_norm": 0.1309826914466945, "learning_rate": 2.0890794619175745e-05, "loss": 0.0768, "loss_nan_ranks": 0, "loss_rank_avg": 0.026484040543437004, "step": 2800, "valid_targets_mean": 8579.1, "valid_targets_min": 1887 }, { "epoch": 2.69216, "grad_norm": 0.1314840553029046, "learning_rate": 2.0823857031572663e-05, "loss": 0.076, "loss_nan_ranks": 0, "loss_rank_avg": 0.026499971747398376, "step": 2805, "valid_targets_mean": 8582.2, "valid_targets_min": 3171 }, { "epoch": 2.69696, "grad_norm": 0.13542623007736973, "learning_rate": 2.0756910198462515e-05, "loss": 0.0746, "loss_nan_ranks": 0, "loss_rank_avg": 0.024281367659568787, "step": 2810, "valid_targets_mean": 8698.7, "valid_targets_min": 2419 }, { "epoch": 2.70176, "grad_norm": 0.12828824896006688, "learning_rate": 2.0689954871137558e-05, "loss": 0.0747, "loss_nan_ranks": 0, "loss_rank_avg": 0.02330276370048523, "step": 2815, "valid_targets_mean": 9369.3, "valid_targets_min": 2792 }, { "epoch": 2.70656, "grad_norm": 0.1274100600671183, "learning_rate": 2.0622991800985398e-05, "loss": 0.0763, "loss_nan_ranks": 0, "loss_rank_avg": 0.02662099152803421, "step": 2820, "valid_targets_mean": 8691.3, "valid_targets_min": 2503 }, { "epoch": 2.71136, "grad_norm": 0.13208316669833364, "learning_rate": 2.055602173948051e-05, "loss": 0.0757, "loss_nan_ranks": 0, "loss_rank_avg": 0.023739665746688843, "step": 2825, "valid_targets_mean": 8986.6, "valid_targets_min": 4021 }, { "epoch": 2.71616, "grad_norm": 0.1347761848229569, "learning_rate": 2.0489045438175842e-05, "loss": 0.0721, "loss_nan_ranks": 0, "loss_rank_avg": 0.022743025794625282, "step": 2830, "valid_targets_mean": 7970.3, "valid_targets_min": 2753 }, { "epoch": 2.72096, "grad_norm": 0.13563435389041437, "learning_rate": 2.042206364869436e-05, "loss": 0.0718, "loss_nan_ranks": 0, "loss_rank_avg": 0.020514879375696182, "step": 2835, "valid_targets_mean": 8056.1, "valid_targets_min": 1768 }, { "epoch": 2.72576, "grad_norm": 0.12106789458820655, "learning_rate": 2.0355077122720625e-05, "loss": 0.0714, "loss_nan_ranks": 0, "loss_rank_avg": 0.01979285106062889, "step": 2840, "valid_targets_mean": 8668.8, "valid_targets_min": 1889 }, { "epoch": 2.73056, "grad_norm": 0.13331211562297765, "learning_rate": 2.0288086611992344e-05, "loss": 0.0741, "loss_nan_ranks": 0, "loss_rank_avg": 0.02285662479698658, "step": 2845, "valid_targets_mean": 8784.2, "valid_targets_min": 2507 }, { "epoch": 2.73536, "grad_norm": 0.12283461413697871, "learning_rate": 2.0221092868291953e-05, "loss": 0.0719, "loss_nan_ranks": 0, "loss_rank_avg": 0.024631857872009277, "step": 2850, "valid_targets_mean": 9224.7, "valid_targets_min": 3740 }, { "epoch": 2.74016, "grad_norm": 0.13462190750677952, "learning_rate": 2.0154096643438153e-05, "loss": 0.0739, "loss_nan_ranks": 0, "loss_rank_avg": 0.02646755427122116, "step": 2855, "valid_targets_mean": 9081.2, "valid_targets_min": 3634 }, { "epoch": 2.74496, "grad_norm": 0.15212100488432875, "learning_rate": 2.008709868927751e-05, "loss": 0.0742, "loss_nan_ranks": 0, "loss_rank_avg": 0.02177482843399048, "step": 2860, "valid_targets_mean": 9343.9, "valid_targets_min": 1558 }, { "epoch": 2.74976, "grad_norm": 0.13891228481080325, "learning_rate": 2.0020099757675978e-05, "loss": 0.0744, "loss_nan_ranks": 0, "loss_rank_avg": 0.023706315085291862, "step": 2865, "valid_targets_mean": 8286.4, "valid_targets_min": 4347 }, { "epoch": 2.75456, "grad_norm": 0.12578790912092921, "learning_rate": 1.9953100600510487e-05, "loss": 0.0705, "loss_nan_ranks": 0, "loss_rank_avg": 0.0233942698687315, "step": 2870, "valid_targets_mean": 8919.5, "valid_targets_min": 4034 }, { "epoch": 2.75936, "grad_norm": 0.12433449798647353, "learning_rate": 1.9886101969660504e-05, "loss": 0.0708, "loss_nan_ranks": 0, "loss_rank_avg": 0.02069215103983879, "step": 2875, "valid_targets_mean": 8321.7, "valid_targets_min": 2865 }, { "epoch": 2.76416, "grad_norm": 0.12331619896381704, "learning_rate": 1.9819104616999584e-05, "loss": 0.0748, "loss_nan_ranks": 0, "loss_rank_avg": 0.02588079310953617, "step": 2880, "valid_targets_mean": 8835.1, "valid_targets_min": 3375 }, { "epoch": 2.76896, "grad_norm": 0.12198016602770331, "learning_rate": 1.975210929438693e-05, "loss": 0.0755, "loss_nan_ranks": 0, "loss_rank_avg": 0.023465629667043686, "step": 2885, "valid_targets_mean": 8514.5, "valid_targets_min": 1894 }, { "epoch": 2.7737600000000002, "grad_norm": 0.1285591492170375, "learning_rate": 1.9685116753658982e-05, "loss": 0.076, "loss_nan_ranks": 0, "loss_rank_avg": 0.023442579433321953, "step": 2890, "valid_targets_mean": 9131.8, "valid_targets_min": 2375 }, { "epoch": 2.77856, "grad_norm": 0.14027229866879554, "learning_rate": 1.9618127746620944e-05, "loss": 0.0729, "loss_nan_ranks": 0, "loss_rank_avg": 0.027585767209529877, "step": 2895, "valid_targets_mean": 9061.1, "valid_targets_min": 3636 }, { "epoch": 2.78336, "grad_norm": 0.12175580215805587, "learning_rate": 1.9551143025038363e-05, "loss": 0.0733, "loss_nan_ranks": 0, "loss_rank_avg": 0.025040633976459503, "step": 2900, "valid_targets_mean": 8019.9, "valid_targets_min": 4226 }, { "epoch": 2.78816, "grad_norm": 0.12631373857068798, "learning_rate": 1.9484163340628724e-05, "loss": 0.074, "loss_nan_ranks": 0, "loss_rank_avg": 0.022008750587701797, "step": 2905, "valid_targets_mean": 8278.6, "valid_targets_min": 3655 }, { "epoch": 2.79296, "grad_norm": 0.12353277202856984, "learning_rate": 1.941718944505294e-05, "loss": 0.0703, "loss_nan_ranks": 0, "loss_rank_avg": 0.0223405584692955, "step": 2910, "valid_targets_mean": 8777.7, "valid_targets_min": 2390 }, { "epoch": 2.7977600000000002, "grad_norm": 0.12477152321684222, "learning_rate": 1.9350222089906994e-05, "loss": 0.0731, "loss_nan_ranks": 0, "loss_rank_avg": 0.022324811667203903, "step": 2915, "valid_targets_mean": 8715.5, "valid_targets_min": 2780 }, { "epoch": 2.80256, "grad_norm": 0.1274810275629356, "learning_rate": 1.9283262026713456e-05, "loss": 0.0743, "loss_nan_ranks": 0, "loss_rank_avg": 0.024463120847940445, "step": 2920, "valid_targets_mean": 8644.3, "valid_targets_min": 2357 }, { "epoch": 2.80736, "grad_norm": 0.15489737871525144, "learning_rate": 1.9216310006913058e-05, "loss": 0.0724, "loss_nan_ranks": 0, "loss_rank_avg": 0.0199250690639019, "step": 2925, "valid_targets_mean": 8119.0, "valid_targets_min": 2239 }, { "epoch": 2.81216, "grad_norm": 0.13087489077175116, "learning_rate": 1.914936678185629e-05, "loss": 0.0722, "loss_nan_ranks": 0, "loss_rank_avg": 0.02115030400454998, "step": 2930, "valid_targets_mean": 8713.2, "valid_targets_min": 2695 }, { "epoch": 2.81696, "grad_norm": 0.12942414716942643, "learning_rate": 1.9082433102794918e-05, "loss": 0.0736, "loss_nan_ranks": 0, "loss_rank_avg": 0.025940679013729095, "step": 2935, "valid_targets_mean": 9562.3, "valid_targets_min": 4015 }, { "epoch": 2.8217600000000003, "grad_norm": 0.11899703583290817, "learning_rate": 1.9015509720873603e-05, "loss": 0.0726, "loss_nan_ranks": 0, "loss_rank_avg": 0.028031064197421074, "step": 2940, "valid_targets_mean": 9664.9, "valid_targets_min": 2235 }, { "epoch": 2.8265599999999997, "grad_norm": 0.12835916290377014, "learning_rate": 1.894859738712143e-05, "loss": 0.0745, "loss_nan_ranks": 0, "loss_rank_avg": 0.023106276988983154, "step": 2945, "valid_targets_mean": 8617.7, "valid_targets_min": 2343 }, { "epoch": 2.83136, "grad_norm": 0.12234620395991247, "learning_rate": 1.888169685244352e-05, "loss": 0.0741, "loss_nan_ranks": 0, "loss_rank_avg": 0.021706473082304, "step": 2950, "valid_targets_mean": 7974.6, "valid_targets_min": 1989 }, { "epoch": 2.83616, "grad_norm": 0.12135472934515772, "learning_rate": 1.8814808867612568e-05, "loss": 0.0739, "loss_nan_ranks": 0, "loss_rank_avg": 0.0252741239964962, "step": 2955, "valid_targets_mean": 9213.8, "valid_targets_min": 3497 }, { "epoch": 2.84096, "grad_norm": 0.12341097629186015, "learning_rate": 1.8747934183260427e-05, "loss": 0.0711, "loss_nan_ranks": 0, "loss_rank_avg": 0.022089535370469093, "step": 2960, "valid_targets_mean": 8485.8, "valid_targets_min": 2813 }, { "epoch": 2.84576, "grad_norm": 0.12185458825230623, "learning_rate": 1.868107354986971e-05, "loss": 0.0745, "loss_nan_ranks": 0, "loss_rank_avg": 0.023958466947078705, "step": 2965, "valid_targets_mean": 8559.1, "valid_targets_min": 2934 }, { "epoch": 2.8505599999999998, "grad_norm": 0.2019700331379936, "learning_rate": 1.8614227717765327e-05, "loss": 0.0727, "loss_nan_ranks": 0, "loss_rank_avg": 0.023400334641337395, "step": 2970, "valid_targets_mean": 8567.7, "valid_targets_min": 3655 }, { "epoch": 2.85536, "grad_norm": 0.12307094056404946, "learning_rate": 1.8547397437106084e-05, "loss": 0.0711, "loss_nan_ranks": 0, "loss_rank_avg": 0.02216029167175293, "step": 2975, "valid_targets_mean": 8859.0, "valid_targets_min": 3690 }, { "epoch": 2.86016, "grad_norm": 0.1363174764510877, "learning_rate": 1.848058345787629e-05, "loss": 0.074, "loss_nan_ranks": 0, "loss_rank_avg": 0.024962490424513817, "step": 2980, "valid_targets_mean": 8806.0, "valid_targets_min": 3210 }, { "epoch": 2.86496, "grad_norm": 0.12263761790836711, "learning_rate": 1.8413786529877288e-05, "loss": 0.0706, "loss_nan_ranks": 0, "loss_rank_avg": 0.0196840763092041, "step": 2985, "valid_targets_mean": 8160.8, "valid_targets_min": 2827 }, { "epoch": 2.86976, "grad_norm": 0.12703370316175627, "learning_rate": 1.8347007402719082e-05, "loss": 0.0722, "loss_nan_ranks": 0, "loss_rank_avg": 0.025346554815769196, "step": 2990, "valid_targets_mean": 9061.6, "valid_targets_min": 4220 }, { "epoch": 2.87456, "grad_norm": 0.12244916720977835, "learning_rate": 1.828024682581191e-05, "loss": 0.0762, "loss_nan_ranks": 0, "loss_rank_avg": 0.026083365082740784, "step": 2995, "valid_targets_mean": 9098.1, "valid_targets_min": 1492 }, { "epoch": 2.87936, "grad_norm": 0.13150902110865764, "learning_rate": 1.8213505548357822e-05, "loss": 0.0729, "loss_nan_ranks": 0, "loss_rank_avg": 0.023833446204662323, "step": 3000, "valid_targets_mean": 8153.8, "valid_targets_min": 2983 }, { "epoch": 2.88416, "grad_norm": 0.12212915178092341, "learning_rate": 1.814678431934231e-05, "loss": 0.0743, "loss_nan_ranks": 0, "loss_rank_avg": 0.02612268179655075, "step": 3005, "valid_targets_mean": 9175.3, "valid_targets_min": 4008 }, { "epoch": 2.88896, "grad_norm": 0.1346347379421597, "learning_rate": 1.8080083887525862e-05, "loss": 0.0713, "loss_nan_ranks": 0, "loss_rank_avg": 0.023977095261216164, "step": 3010, "valid_targets_mean": 8365.3, "valid_targets_min": 2239 }, { "epoch": 2.89376, "grad_norm": 0.12570526531776613, "learning_rate": 1.801340500143557e-05, "loss": 0.0724, "loss_nan_ranks": 0, "loss_rank_avg": 0.02590319886803627, "step": 3015, "valid_targets_mean": 8906.6, "valid_targets_min": 4035 }, { "epoch": 2.89856, "grad_norm": 0.12095421806855092, "learning_rate": 1.7946748409356746e-05, "loss": 0.0758, "loss_nan_ranks": 0, "loss_rank_avg": 0.024391578510403633, "step": 3020, "valid_targets_mean": 8243.3, "valid_targets_min": 1280 }, { "epoch": 2.90336, "grad_norm": 0.13265519572762954, "learning_rate": 1.788011485932451e-05, "loss": 0.0733, "loss_nan_ranks": 0, "loss_rank_avg": 0.02277197316288948, "step": 3025, "valid_targets_mean": 8158.2, "valid_targets_min": 1629 }, { "epoch": 2.90816, "grad_norm": 0.13107630504480672, "learning_rate": 1.78135050991154e-05, "loss": 0.0744, "loss_nan_ranks": 0, "loss_rank_avg": 0.02625724859535694, "step": 3030, "valid_targets_mean": 8981.2, "valid_targets_min": 3186 }, { "epoch": 2.91296, "grad_norm": 0.41703413499653275, "learning_rate": 1.774691987623898e-05, "loss": 0.0734, "loss_nan_ranks": 0, "loss_rank_avg": 0.026596393436193466, "step": 3035, "valid_targets_mean": 9226.0, "valid_targets_min": 3192 }, { "epoch": 2.91776, "grad_norm": 0.15139444386768838, "learning_rate": 1.768035993792944e-05, "loss": 0.0704, "loss_nan_ranks": 0, "loss_rank_avg": 0.027542371302843094, "step": 3040, "valid_targets_mean": 10083.0, "valid_targets_min": 6144 }, { "epoch": 2.92256, "grad_norm": 0.12675751853167433, "learning_rate": 1.7613826031137245e-05, "loss": 0.073, "loss_nan_ranks": 0, "loss_rank_avg": 0.02687855437397957, "step": 3045, "valid_targets_mean": 8895.7, "valid_targets_min": 4809 }, { "epoch": 2.92736, "grad_norm": 0.12662474766507864, "learning_rate": 1.7547318902520693e-05, "loss": 0.068, "loss_nan_ranks": 0, "loss_rank_avg": 0.024971062317490578, "step": 3050, "valid_targets_mean": 8946.8, "valid_targets_min": 4309 }, { "epoch": 2.93216, "grad_norm": 0.1286424743817585, "learning_rate": 1.7480839298437612e-05, "loss": 0.072, "loss_nan_ranks": 0, "loss_rank_avg": 0.025227583944797516, "step": 3055, "valid_targets_mean": 9259.2, "valid_targets_min": 2514 }, { "epoch": 2.93696, "grad_norm": 0.12893517435268495, "learning_rate": 1.7414387964936913e-05, "loss": 0.0719, "loss_nan_ranks": 0, "loss_rank_avg": 0.026150595396757126, "step": 3060, "valid_targets_mean": 9149.1, "valid_targets_min": 3181 }, { "epoch": 2.94176, "grad_norm": 0.12655174215859458, "learning_rate": 1.7347965647750264e-05, "loss": 0.0707, "loss_nan_ranks": 0, "loss_rank_avg": 0.024759739637374878, "step": 3065, "valid_targets_mean": 9399.6, "valid_targets_min": 3759 }, { "epoch": 2.94656, "grad_norm": 0.13072454712552234, "learning_rate": 1.7281573092283698e-05, "loss": 0.07, "loss_nan_ranks": 0, "loss_rank_avg": 0.021730834618210793, "step": 3070, "valid_targets_mean": 8040.0, "valid_targets_min": 3188 }, { "epoch": 2.95136, "grad_norm": 0.12321743168297426, "learning_rate": 1.721521104360925e-05, "loss": 0.072, "loss_nan_ranks": 0, "loss_rank_avg": 0.023660646751523018, "step": 3075, "valid_targets_mean": 8968.6, "valid_targets_min": 3813 }, { "epoch": 2.95616, "grad_norm": 0.12969336877295307, "learning_rate": 1.714888024645662e-05, "loss": 0.0697, "loss_nan_ranks": 0, "loss_rank_avg": 0.027581918984651566, "step": 3080, "valid_targets_mean": 8911.6, "valid_targets_min": 1185 }, { "epoch": 2.96096, "grad_norm": 0.12602670418990503, "learning_rate": 1.708258144520478e-05, "loss": 0.0735, "loss_nan_ranks": 0, "loss_rank_avg": 0.027505237609148026, "step": 3085, "valid_targets_mean": 8821.6, "valid_targets_min": 3186 }, { "epoch": 2.96576, "grad_norm": 0.1297030798288961, "learning_rate": 1.7016315383873637e-05, "loss": 0.0725, "loss_nan_ranks": 0, "loss_rank_avg": 0.02171483263373375, "step": 3090, "valid_targets_mean": 8498.5, "valid_targets_min": 1844 }, { "epoch": 2.97056, "grad_norm": 0.14699243538398662, "learning_rate": 1.6950082806115692e-05, "loss": 0.07, "loss_nan_ranks": 0, "loss_rank_avg": 0.02368342876434326, "step": 3095, "valid_targets_mean": 9345.1, "valid_targets_min": 5842 }, { "epoch": 2.9753600000000002, "grad_norm": 0.1232468312629796, "learning_rate": 1.6883884455207685e-05, "loss": 0.0697, "loss_nan_ranks": 0, "loss_rank_avg": 0.021345708519220352, "step": 3100, "valid_targets_mean": 7081.2, "valid_targets_min": 2668 }, { "epoch": 2.98016, "grad_norm": 0.12761627571559783, "learning_rate": 1.6817721074042254e-05, "loss": 0.0736, "loss_nan_ranks": 0, "loss_rank_avg": 0.021635062992572784, "step": 3105, "valid_targets_mean": 8916.5, "valid_targets_min": 3337 }, { "epoch": 2.98496, "grad_norm": 0.127886107487912, "learning_rate": 1.675159340511958e-05, "loss": 0.0721, "loss_nan_ranks": 0, "loss_rank_avg": 0.024836886674165726, "step": 3110, "valid_targets_mean": 8576.9, "valid_targets_min": 3946 }, { "epoch": 2.98976, "grad_norm": 0.12291271639984096, "learning_rate": 1.6685502190539106e-05, "loss": 0.0703, "loss_nan_ranks": 0, "loss_rank_avg": 0.02228378877043724, "step": 3115, "valid_targets_mean": 8604.4, "valid_targets_min": 3261 }, { "epoch": 2.99456, "grad_norm": 0.12950070508669648, "learning_rate": 1.6619448171991155e-05, "loss": 0.0715, "loss_nan_ranks": 0, "loss_rank_avg": 0.02772909589111805, "step": 3120, "valid_targets_mean": 9047.2, "valid_targets_min": 4860 }, { "epoch": 2.9993600000000002, "grad_norm": 0.12916728839087535, "learning_rate": 1.6553432090748624e-05, "loss": 0.0711, "loss_nan_ranks": 0, "loss_rank_avg": 0.022339988499879837, "step": 3125, "valid_targets_mean": 8654.5, "valid_targets_min": 2501 }, { "epoch": 3.00384, "grad_norm": 0.13436467200946856, "learning_rate": 1.648745468765869e-05, "loss": 0.0695, "loss_nan_ranks": 0, "loss_rank_avg": 0.02428019419312477, "step": 3130, "valid_targets_mean": 8521.2, "valid_targets_min": 2029 }, { "epoch": 3.00864, "grad_norm": 0.1213964690982203, "learning_rate": 1.6421516703134463e-05, "loss": 0.0693, "loss_nan_ranks": 0, "loss_rank_avg": 0.02279294840991497, "step": 3135, "valid_targets_mean": 9165.6, "valid_targets_min": 3462 }, { "epoch": 3.01344, "grad_norm": 0.12809915325981858, "learning_rate": 1.6355618877146685e-05, "loss": 0.0708, "loss_nan_ranks": 0, "loss_rank_avg": 0.02425113320350647, "step": 3140, "valid_targets_mean": 8720.2, "valid_targets_min": 2045 }, { "epoch": 3.01824, "grad_norm": 0.12474776089090203, "learning_rate": 1.6289761949215435e-05, "loss": 0.0686, "loss_nan_ranks": 0, "loss_rank_avg": 0.024004336446523666, "step": 3145, "valid_targets_mean": 8093.4, "valid_targets_min": 1630 }, { "epoch": 3.02304, "grad_norm": 0.121771797960631, "learning_rate": 1.6223946658401818e-05, "loss": 0.0719, "loss_nan_ranks": 0, "loss_rank_avg": 0.023814337328076363, "step": 3150, "valid_targets_mean": 8823.8, "valid_targets_min": 4465 }, { "epoch": 3.02784, "grad_norm": 0.11750594629421643, "learning_rate": 1.6158173743299692e-05, "loss": 0.0697, "loss_nan_ranks": 0, "loss_rank_avg": 0.021509505808353424, "step": 3155, "valid_targets_mean": 8647.9, "valid_targets_min": 4037 }, { "epoch": 3.03264, "grad_norm": 0.12614285302682426, "learning_rate": 1.6092443942027356e-05, "loss": 0.0721, "loss_nan_ranks": 0, "loss_rank_avg": 0.0257541723549366, "step": 3160, "valid_targets_mean": 8363.3, "valid_targets_min": 4240 }, { "epoch": 3.03744, "grad_norm": 0.11499077249412011, "learning_rate": 1.602675799221927e-05, "loss": 0.0703, "loss_nan_ranks": 0, "loss_rank_avg": 0.021260704845190048, "step": 3165, "valid_targets_mean": 8695.0, "valid_targets_min": 4039 }, { "epoch": 3.04224, "grad_norm": 0.12297680388920865, "learning_rate": 1.59611166310178e-05, "loss": 0.0699, "loss_nan_ranks": 0, "loss_rank_avg": 0.021927397698163986, "step": 3170, "valid_targets_mean": 8749.3, "valid_targets_min": 2927 }, { "epoch": 3.04704, "grad_norm": 0.12361795520196853, "learning_rate": 1.5895520595064913e-05, "loss": 0.0673, "loss_nan_ranks": 0, "loss_rank_avg": 0.0205059964209795, "step": 3175, "valid_targets_mean": 7927.1, "valid_targets_min": 2442 }, { "epoch": 3.05184, "grad_norm": 0.12814989984155925, "learning_rate": 1.5829970620493932e-05, "loss": 0.0721, "loss_nan_ranks": 0, "loss_rank_avg": 0.027933187782764435, "step": 3180, "valid_targets_mean": 8855.2, "valid_targets_min": 2084 }, { "epoch": 3.05664, "grad_norm": 0.11677970502216538, "learning_rate": 1.5764467442921274e-05, "loss": 0.0717, "loss_nan_ranks": 0, "loss_rank_avg": 0.024320311844348907, "step": 3185, "valid_targets_mean": 8660.4, "valid_targets_min": 2754 }, { "epoch": 3.06144, "grad_norm": 0.1239216085007504, "learning_rate": 1.569901179743818e-05, "loss": 0.0725, "loss_nan_ranks": 0, "loss_rank_avg": 0.025944417342543602, "step": 3190, "valid_targets_mean": 9009.9, "valid_targets_min": 4500 }, { "epoch": 3.06624, "grad_norm": 0.12945831869172478, "learning_rate": 1.5633604418602483e-05, "loss": 0.0688, "loss_nan_ranks": 0, "loss_rank_avg": 0.023855559527873993, "step": 3195, "valid_targets_mean": 8333.2, "valid_targets_min": 2803 }, { "epoch": 3.07104, "grad_norm": 0.13013260461232284, "learning_rate": 1.5568246040430343e-05, "loss": 0.0718, "loss_nan_ranks": 0, "loss_rank_avg": 0.023685764521360397, "step": 3200, "valid_targets_mean": 7983.8, "valid_targets_min": 4751 }, { "epoch": 3.07584, "grad_norm": 0.1273699840697591, "learning_rate": 1.5502937396388046e-05, "loss": 0.0683, "loss_nan_ranks": 0, "loss_rank_avg": 0.023623168468475342, "step": 3205, "valid_targets_mean": 8991.2, "valid_targets_min": 2308 }, { "epoch": 3.08064, "grad_norm": 0.11916279939675328, "learning_rate": 1.543767921938374e-05, "loss": 0.0689, "loss_nan_ranks": 0, "loss_rank_avg": 0.022730082273483276, "step": 3210, "valid_targets_mean": 8499.2, "valid_targets_min": 3355 }, { "epoch": 3.08544, "grad_norm": 0.12119443723949427, "learning_rate": 1.537247224175922e-05, "loss": 0.0672, "loss_nan_ranks": 0, "loss_rank_avg": 0.021023793146014214, "step": 3215, "valid_targets_mean": 8985.7, "valid_targets_min": 2404 }, { "epoch": 3.09024, "grad_norm": 0.13319695318574473, "learning_rate": 1.53073171952817e-05, "loss": 0.0692, "loss_nan_ranks": 0, "loss_rank_avg": 0.02610372006893158, "step": 3220, "valid_targets_mean": 8657.2, "valid_targets_min": 3664 }, { "epoch": 3.09504, "grad_norm": 0.11480415485378342, "learning_rate": 1.5242214811135631e-05, "loss": 0.0698, "loss_nan_ranks": 0, "loss_rank_avg": 0.01964818686246872, "step": 3225, "valid_targets_mean": 7869.1, "valid_targets_min": 1796 }, { "epoch": 3.09984, "grad_norm": 0.1509063264703375, "learning_rate": 1.5177165819914461e-05, "loss": 0.0708, "loss_nan_ranks": 0, "loss_rank_avg": 0.023284582421183586, "step": 3230, "valid_targets_mean": 8114.5, "valid_targets_min": 2202 }, { "epoch": 3.10464, "grad_norm": 0.12290331374199842, "learning_rate": 1.5112170951612455e-05, "loss": 0.0728, "loss_nan_ranks": 0, "loss_rank_avg": 0.02735215239226818, "step": 3235, "valid_targets_mean": 9238.8, "valid_targets_min": 2446 }, { "epoch": 3.10944, "grad_norm": 0.11627326471177059, "learning_rate": 1.5047230935616497e-05, "loss": 0.0697, "loss_nan_ranks": 0, "loss_rank_avg": 0.021479297429323196, "step": 3240, "valid_targets_mean": 8806.2, "valid_targets_min": 3618 }, { "epoch": 3.11424, "grad_norm": 0.11908066536540551, "learning_rate": 1.4982346500697916e-05, "loss": 0.07, "loss_nan_ranks": 0, "loss_rank_avg": 0.02094453200697899, "step": 3245, "valid_targets_mean": 8300.2, "valid_targets_min": 4744 }, { "epoch": 3.11904, "grad_norm": 0.12430053568242028, "learning_rate": 1.4917518375004281e-05, "loss": 0.0673, "loss_nan_ranks": 0, "loss_rank_avg": 0.020661715418100357, "step": 3250, "valid_targets_mean": 8002.1, "valid_targets_min": 2486 }, { "epoch": 3.12384, "grad_norm": 0.11897850439214286, "learning_rate": 1.4852747286051254e-05, "loss": 0.0691, "loss_nan_ranks": 0, "loss_rank_avg": 0.022244051098823547, "step": 3255, "valid_targets_mean": 9271.3, "valid_targets_min": 3148 }, { "epoch": 3.12864, "grad_norm": 0.12101646152970325, "learning_rate": 1.478803396071443e-05, "loss": 0.069, "loss_nan_ranks": 0, "loss_rank_avg": 0.021861432120203972, "step": 3260, "valid_targets_mean": 8306.7, "valid_targets_min": 2471 }, { "epoch": 3.1334400000000002, "grad_norm": 0.12377621716047282, "learning_rate": 1.472337912522115e-05, "loss": 0.0704, "loss_nan_ranks": 0, "loss_rank_avg": 0.026585116982460022, "step": 3265, "valid_targets_mean": 8930.8, "valid_targets_min": 3933 }, { "epoch": 3.13824, "grad_norm": 0.12365934012769708, "learning_rate": 1.4658783505142368e-05, "loss": 0.0672, "loss_nan_ranks": 0, "loss_rank_avg": 0.023925743997097015, "step": 3270, "valid_targets_mean": 9297.8, "valid_targets_min": 3247 }, { "epoch": 3.14304, "grad_norm": 0.12034112660714659, "learning_rate": 1.4594247825384529e-05, "loss": 0.0736, "loss_nan_ranks": 0, "loss_rank_avg": 0.027109742164611816, "step": 3275, "valid_targets_mean": 8862.9, "valid_targets_min": 2457 }, { "epoch": 3.14784, "grad_norm": 0.12419182575224802, "learning_rate": 1.4529772810181398e-05, "loss": 0.0711, "loss_nan_ranks": 0, "loss_rank_avg": 0.022144844755530357, "step": 3280, "valid_targets_mean": 8546.1, "valid_targets_min": 4936 }, { "epoch": 3.15264, "grad_norm": 0.12581501967835582, "learning_rate": 1.4465359183085958e-05, "loss": 0.07, "loss_nan_ranks": 0, "loss_rank_avg": 0.02213982678949833, "step": 3285, "valid_targets_mean": 8170.9, "valid_targets_min": 1037 }, { "epoch": 3.15744, "grad_norm": 0.13756118658624505, "learning_rate": 1.4401007666962276e-05, "loss": 0.0705, "loss_nan_ranks": 0, "loss_rank_avg": 0.021517571061849594, "step": 3290, "valid_targets_mean": 8457.0, "valid_targets_min": 2482 }, { "epoch": 3.16224, "grad_norm": 0.12193998039781807, "learning_rate": 1.4336718983977389e-05, "loss": 0.0726, "loss_nan_ranks": 0, "loss_rank_avg": 0.024007262662053108, "step": 3295, "valid_targets_mean": 8692.9, "valid_targets_min": 1922 }, { "epoch": 3.16704, "grad_norm": 0.1265404462653089, "learning_rate": 1.4272493855593222e-05, "loss": 0.0697, "loss_nan_ranks": 0, "loss_rank_avg": 0.023130342364311218, "step": 3300, "valid_targets_mean": 9112.4, "valid_targets_min": 2050 }, { "epoch": 3.17184, "grad_norm": 0.1226326357869858, "learning_rate": 1.4208333002558462e-05, "loss": 0.0714, "loss_nan_ranks": 0, "loss_rank_avg": 0.020230181515216827, "step": 3305, "valid_targets_mean": 8190.9, "valid_targets_min": 1771 }, { "epoch": 3.17664, "grad_norm": 0.11414582360833214, "learning_rate": 1.4144237144900497e-05, "loss": 0.072, "loss_nan_ranks": 0, "loss_rank_avg": 0.024489928036928177, "step": 3310, "valid_targets_mean": 8684.1, "valid_targets_min": 4674 }, { "epoch": 3.18144, "grad_norm": 0.12744621953971752, "learning_rate": 1.4080207001917302e-05, "loss": 0.0703, "loss_nan_ranks": 0, "loss_rank_avg": 0.025685835629701614, "step": 3315, "valid_targets_mean": 8462.4, "valid_targets_min": 1313 }, { "epoch": 3.18624, "grad_norm": 0.12631083930426035, "learning_rate": 1.4016243292169413e-05, "loss": 0.0713, "loss_nan_ranks": 0, "loss_rank_avg": 0.020424753427505493, "step": 3320, "valid_targets_mean": 8725.7, "valid_targets_min": 2161 }, { "epoch": 3.19104, "grad_norm": 0.11679712809878957, "learning_rate": 1.3952346733471822e-05, "loss": 0.0676, "loss_nan_ranks": 0, "loss_rank_avg": 0.023827986791729927, "step": 3325, "valid_targets_mean": 8154.0, "valid_targets_min": 3181 }, { "epoch": 3.19584, "grad_norm": 0.125231699118407, "learning_rate": 1.3888518042885934e-05, "loss": 0.07, "loss_nan_ranks": 0, "loss_rank_avg": 0.02799840085208416, "step": 3330, "valid_targets_mean": 8681.6, "valid_targets_min": 3326 }, { "epoch": 3.20064, "grad_norm": 0.11959339338389416, "learning_rate": 1.3824757936711537e-05, "loss": 0.0702, "loss_nan_ranks": 0, "loss_rank_avg": 0.02259810082614422, "step": 3335, "valid_targets_mean": 9545.6, "valid_targets_min": 2357 }, { "epoch": 3.20544, "grad_norm": 0.12174988786208792, "learning_rate": 1.3761067130478738e-05, "loss": 0.0703, "loss_nan_ranks": 0, "loss_rank_avg": 0.02313234657049179, "step": 3340, "valid_targets_mean": 8121.8, "valid_targets_min": 1979 }, { "epoch": 3.21024, "grad_norm": 0.11323346166579101, "learning_rate": 1.3697446338939942e-05, "loss": 0.0677, "loss_nan_ranks": 0, "loss_rank_avg": 0.022821880877017975, "step": 3345, "valid_targets_mean": 8020.8, "valid_targets_min": 3447 }, { "epoch": 3.21504, "grad_norm": 0.11671762619810887, "learning_rate": 1.3633896276061847e-05, "loss": 0.0668, "loss_nan_ranks": 0, "loss_rank_avg": 0.02655469998717308, "step": 3350, "valid_targets_mean": 10324.1, "valid_targets_min": 3177 }, { "epoch": 3.21984, "grad_norm": 0.11750097777157643, "learning_rate": 1.3570417655017405e-05, "loss": 0.0715, "loss_nan_ranks": 0, "loss_rank_avg": 0.0216502882540226, "step": 3355, "valid_targets_mean": 8658.6, "valid_targets_min": 3458 }, { "epoch": 3.22464, "grad_norm": 0.11820178487678269, "learning_rate": 1.3507011188177846e-05, "loss": 0.069, "loss_nan_ranks": 0, "loss_rank_avg": 0.022721372544765472, "step": 3360, "valid_targets_mean": 9518.7, "valid_targets_min": 4699 }, { "epoch": 3.22944, "grad_norm": 0.11417679512946696, "learning_rate": 1.3443677587104655e-05, "loss": 0.0694, "loss_nan_ranks": 0, "loss_rank_avg": 0.020779889076948166, "step": 3365, "valid_targets_mean": 8670.8, "valid_targets_min": 3094 }, { "epoch": 3.23424, "grad_norm": 0.12624839454578163, "learning_rate": 1.3380417562541604e-05, "loss": 0.067, "loss_nan_ranks": 0, "loss_rank_avg": 0.020790942013263702, "step": 3370, "valid_targets_mean": 8187.2, "valid_targets_min": 1278 }, { "epoch": 3.23904, "grad_norm": 0.14609588360307785, "learning_rate": 1.3317231824406783e-05, "loss": 0.0719, "loss_nan_ranks": 0, "loss_rank_avg": 0.024372944608330727, "step": 3375, "valid_targets_mean": 8531.4, "valid_targets_min": 2185 }, { "epoch": 3.24384, "grad_norm": 0.117776839936567, "learning_rate": 1.325412108178461e-05, "loss": 0.0719, "loss_nan_ranks": 0, "loss_rank_avg": 0.022288871929049492, "step": 3380, "valid_targets_mean": 8573.8, "valid_targets_min": 3315 }, { "epoch": 3.24864, "grad_norm": 0.11646493488526218, "learning_rate": 1.3191086042917895e-05, "loss": 0.0704, "loss_nan_ranks": 0, "loss_rank_avg": 0.02496308647096157, "step": 3385, "valid_targets_mean": 9230.8, "valid_targets_min": 3590 }, { "epoch": 3.25344, "grad_norm": 0.12779066870734346, "learning_rate": 1.3128127415199883e-05, "loss": 0.0732, "loss_nan_ranks": 0, "loss_rank_avg": 0.023436348885297775, "step": 3390, "valid_targets_mean": 8449.2, "valid_targets_min": 2540 }, { "epoch": 3.25824, "grad_norm": 0.11925664271364658, "learning_rate": 1.3065245905166316e-05, "loss": 0.0655, "loss_nan_ranks": 0, "loss_rank_avg": 0.021665815263986588, "step": 3395, "valid_targets_mean": 8535.0, "valid_targets_min": 1755 }, { "epoch": 3.26304, "grad_norm": 0.11609499082097684, "learning_rate": 1.30024422184875e-05, "loss": 0.0702, "loss_nan_ranks": 0, "loss_rank_avg": 0.020767629146575928, "step": 3400, "valid_targets_mean": 9026.3, "valid_targets_min": 3114 }, { "epoch": 3.26784, "grad_norm": 0.12322940130660784, "learning_rate": 1.2939717059960384e-05, "loss": 0.0716, "loss_nan_ranks": 0, "loss_rank_avg": 0.026769880205392838, "step": 3405, "valid_targets_mean": 9266.4, "valid_targets_min": 2437 }, { "epoch": 3.27264, "grad_norm": 0.12268486970388134, "learning_rate": 1.287707113350068e-05, "loss": 0.0717, "loss_nan_ranks": 0, "loss_rank_avg": 0.021298786625266075, "step": 3410, "valid_targets_mean": 8315.7, "valid_targets_min": 1885 }, { "epoch": 3.27744, "grad_norm": 0.12293752242798077, "learning_rate": 1.2814505142134921e-05, "loss": 0.0682, "loss_nan_ranks": 0, "loss_rank_avg": 0.0239997711032629, "step": 3415, "valid_targets_mean": 8773.1, "valid_targets_min": 3471 }, { "epoch": 3.28224, "grad_norm": 0.11888564915744372, "learning_rate": 1.2752019787992587e-05, "loss": 0.0719, "loss_nan_ranks": 0, "loss_rank_avg": 0.023440586403012276, "step": 3420, "valid_targets_mean": 9244.7, "valid_targets_min": 2556 }, { "epoch": 3.28704, "grad_norm": 0.12035054922676984, "learning_rate": 1.268961577229824e-05, "loss": 0.0681, "loss_nan_ranks": 0, "loss_rank_avg": 0.024956464767456055, "step": 3425, "valid_targets_mean": 9113.6, "valid_targets_min": 6681 }, { "epoch": 3.29184, "grad_norm": 0.11609541056449521, "learning_rate": 1.262729379536365e-05, "loss": 0.0689, "loss_nan_ranks": 0, "loss_rank_avg": 0.018632816150784492, "step": 3430, "valid_targets_mean": 8057.3, "valid_targets_min": 2719 }, { "epoch": 3.29664, "grad_norm": 0.1156523388586678, "learning_rate": 1.2565054556579917e-05, "loss": 0.0695, "loss_nan_ranks": 0, "loss_rank_avg": 0.03179524093866348, "step": 3435, "valid_targets_mean": 9017.0, "valid_targets_min": 4248 }, { "epoch": 3.30144, "grad_norm": 0.12003104066174144, "learning_rate": 1.2502898754409637e-05, "loss": 0.0734, "loss_nan_ranks": 0, "loss_rank_avg": 0.027027547359466553, "step": 3440, "valid_targets_mean": 8732.1, "valid_targets_min": 2923 }, { "epoch": 3.30624, "grad_norm": 0.11525424183716788, "learning_rate": 1.2440827086379055e-05, "loss": 0.0689, "loss_nan_ranks": 0, "loss_rank_avg": 0.023295942693948746, "step": 3445, "valid_targets_mean": 8759.2, "valid_targets_min": 4664 }, { "epoch": 3.31104, "grad_norm": 0.12531104004344787, "learning_rate": 1.2378840249070265e-05, "loss": 0.0679, "loss_nan_ranks": 0, "loss_rank_avg": 0.022183142602443695, "step": 3450, "valid_targets_mean": 8153.5, "valid_targets_min": 2609 }, { "epoch": 3.31584, "grad_norm": 0.12343198360816166, "learning_rate": 1.2316938938113356e-05, "loss": 0.0696, "loss_nan_ranks": 0, "loss_rank_avg": 0.023251008242368698, "step": 3455, "valid_targets_mean": 8565.3, "valid_targets_min": 3428 }, { "epoch": 3.32064, "grad_norm": 0.1292388288269661, "learning_rate": 1.2255123848178619e-05, "loss": 0.0686, "loss_nan_ranks": 0, "loss_rank_avg": 0.023235727101564407, "step": 3460, "valid_targets_mean": 9135.2, "valid_targets_min": 2746 }, { "epoch": 3.32544, "grad_norm": 0.1215681936479102, "learning_rate": 1.2193395672968765e-05, "loss": 0.0717, "loss_nan_ranks": 0, "loss_rank_avg": 0.02227572724223137, "step": 3465, "valid_targets_mean": 8278.0, "valid_targets_min": 3403 }, { "epoch": 3.33024, "grad_norm": 0.11710136257925326, "learning_rate": 1.2131755105211118e-05, "loss": 0.0663, "loss_nan_ranks": 0, "loss_rank_avg": 0.019895605742931366, "step": 3470, "valid_targets_mean": 8391.2, "valid_targets_min": 2984 }, { "epoch": 3.3350400000000002, "grad_norm": 0.12542638777454168, "learning_rate": 1.2070202836649855e-05, "loss": 0.0676, "loss_nan_ranks": 0, "loss_rank_avg": 0.021651022136211395, "step": 3475, "valid_targets_mean": 9145.8, "valid_targets_min": 2439 }, { "epoch": 3.33984, "grad_norm": 0.12565404407998096, "learning_rate": 1.2008739558038247e-05, "loss": 0.069, "loss_nan_ranks": 0, "loss_rank_avg": 0.023290030658245087, "step": 3480, "valid_targets_mean": 7567.0, "valid_targets_min": 2494 }, { "epoch": 3.34464, "grad_norm": 0.11631140589000345, "learning_rate": 1.1947365959130895e-05, "loss": 0.0667, "loss_nan_ranks": 0, "loss_rank_avg": 0.018959272652864456, "step": 3485, "valid_targets_mean": 8354.6, "valid_targets_min": 2992 }, { "epoch": 3.34944, "grad_norm": 0.1188568050783418, "learning_rate": 1.1886082728675984e-05, "loss": 0.0722, "loss_nan_ranks": 0, "loss_rank_avg": 0.024846302345395088, "step": 3490, "valid_targets_mean": 8987.2, "valid_targets_min": 4280 }, { "epoch": 3.35424, "grad_norm": 0.12019159263147859, "learning_rate": 1.1824890554407574e-05, "loss": 0.0691, "loss_nan_ranks": 0, "loss_rank_avg": 0.018579427152872086, "step": 3495, "valid_targets_mean": 8977.7, "valid_targets_min": 4890 }, { "epoch": 3.3590400000000002, "grad_norm": 0.1139585905859666, "learning_rate": 1.1763790123037873e-05, "loss": 0.0722, "loss_nan_ranks": 0, "loss_rank_avg": 0.02406950294971466, "step": 3500, "valid_targets_mean": 9003.8, "valid_targets_min": 1951 }, { "epoch": 3.36384, "grad_norm": 0.14319366739189193, "learning_rate": 1.1702782120249539e-05, "loss": 0.068, "loss_nan_ranks": 0, "loss_rank_avg": 0.024110540747642517, "step": 3505, "valid_targets_mean": 9082.9, "valid_targets_min": 1492 }, { "epoch": 3.36864, "grad_norm": 0.11863992872229728, "learning_rate": 1.164186723068795e-05, "loss": 0.07, "loss_nan_ranks": 0, "loss_rank_avg": 0.02288087084889412, "step": 3510, "valid_targets_mean": 8180.7, "valid_targets_min": 2277 }, { "epoch": 3.37344, "grad_norm": 0.11512399838967773, "learning_rate": 1.1581046137953575e-05, "loss": 0.0687, "loss_nan_ranks": 0, "loss_rank_avg": 0.022692613303661346, "step": 3515, "valid_targets_mean": 8648.9, "valid_targets_min": 4250 }, { "epoch": 3.37824, "grad_norm": 0.13242448957401462, "learning_rate": 1.1520319524594256e-05, "loss": 0.0716, "loss_nan_ranks": 0, "loss_rank_avg": 0.025992343202233315, "step": 3520, "valid_targets_mean": 8879.0, "valid_targets_min": 1942 }, { "epoch": 3.38304, "grad_norm": 0.12807878449294854, "learning_rate": 1.1459688072097568e-05, "loss": 0.0685, "loss_nan_ranks": 0, "loss_rank_avg": 0.022017603740096092, "step": 3525, "valid_targets_mean": 8338.1, "valid_targets_min": 3877 }, { "epoch": 3.38784, "grad_norm": 0.11648212904241022, "learning_rate": 1.1399152460883176e-05, "loss": 0.0702, "loss_nan_ranks": 0, "loss_rank_avg": 0.020594323053956032, "step": 3530, "valid_targets_mean": 9214.3, "valid_targets_min": 2528 }, { "epoch": 3.39264, "grad_norm": 0.11821877317071199, "learning_rate": 1.1338713370295189e-05, "loss": 0.0718, "loss_nan_ranks": 0, "loss_rank_avg": 0.026048175990581512, "step": 3535, "valid_targets_mean": 9281.7, "valid_targets_min": 2639 }, { "epoch": 3.39744, "grad_norm": 0.11736629336592669, "learning_rate": 1.1278371478594538e-05, "loss": 0.0682, "loss_nan_ranks": 0, "loss_rank_avg": 0.021891873329877853, "step": 3540, "valid_targets_mean": 8865.2, "valid_targets_min": 2688 }, { "epoch": 3.40224, "grad_norm": 0.11972853626552638, "learning_rate": 1.1218127462951367e-05, "loss": 0.073, "loss_nan_ranks": 0, "loss_rank_avg": 0.02370895817875862, "step": 3545, "valid_targets_mean": 8682.7, "valid_targets_min": 1583 }, { "epoch": 3.40704, "grad_norm": 0.12360516334847126, "learning_rate": 1.1157981999437444e-05, "loss": 0.0708, "loss_nan_ranks": 0, "loss_rank_avg": 0.027519740164279938, "step": 3550, "valid_targets_mean": 8607.8, "valid_targets_min": 3517 }, { "epoch": 3.4118399999999998, "grad_norm": 0.12508266248465932, "learning_rate": 1.109793576301855e-05, "loss": 0.0683, "loss_nan_ranks": 0, "loss_rank_avg": 0.019669760018587112, "step": 3555, "valid_targets_mean": 9355.0, "valid_targets_min": 1912 }, { "epoch": 3.41664, "grad_norm": 0.12060718453496497, "learning_rate": 1.1037989427546924e-05, "loss": 0.0684, "loss_nan_ranks": 0, "loss_rank_avg": 0.023211004212498665, "step": 3560, "valid_targets_mean": 8907.0, "valid_targets_min": 3938 }, { "epoch": 3.42144, "grad_norm": 0.11856868790700098, "learning_rate": 1.0978143665753692e-05, "loss": 0.0708, "loss_nan_ranks": 0, "loss_rank_avg": 0.025470038875937462, "step": 3565, "valid_targets_mean": 8779.1, "valid_targets_min": 1956 }, { "epoch": 3.42624, "grad_norm": 0.1202644007888738, "learning_rate": 1.0918399149241314e-05, "loss": 0.0671, "loss_nan_ranks": 0, "loss_rank_avg": 0.025088073685765266, "step": 3570, "valid_targets_mean": 9472.4, "valid_targets_min": 5452 }, { "epoch": 3.43104, "grad_norm": 0.11890989905758134, "learning_rate": 1.0858756548476058e-05, "loss": 0.0669, "loss_nan_ranks": 0, "loss_rank_avg": 0.019012611359357834, "step": 3575, "valid_targets_mean": 8079.2, "valid_targets_min": 2365 }, { "epoch": 3.43584, "grad_norm": 0.11535717573780561, "learning_rate": 1.0799216532780478e-05, "loss": 0.0656, "loss_nan_ranks": 0, "loss_rank_avg": 0.020330175757408142, "step": 3580, "valid_targets_mean": 8638.0, "valid_targets_min": 2657 }, { "epoch": 3.44064, "grad_norm": 0.11982122538634377, "learning_rate": 1.0739779770325885e-05, "loss": 0.0688, "loss_nan_ranks": 0, "loss_rank_avg": 0.02101993001997471, "step": 3585, "valid_targets_mean": 8114.7, "valid_targets_min": 3253 }, { "epoch": 3.44544, "grad_norm": 0.11568924363050549, "learning_rate": 1.0680446928124872e-05, "loss": 0.0699, "loss_nan_ranks": 0, "loss_rank_avg": 0.024274956434965134, "step": 3590, "valid_targets_mean": 8969.8, "valid_targets_min": 5479 }, { "epoch": 3.45024, "grad_norm": 0.12311519721414897, "learning_rate": 1.06212186720238e-05, "loss": 0.069, "loss_nan_ranks": 0, "loss_rank_avg": 0.02398882806301117, "step": 3595, "valid_targets_mean": 9083.4, "valid_targets_min": 2236 }, { "epoch": 3.45504, "grad_norm": 0.1176232528105872, "learning_rate": 1.0562095666695352e-05, "loss": 0.0689, "loss_nan_ranks": 0, "loss_rank_avg": 0.022245021536946297, "step": 3600, "valid_targets_mean": 8506.0, "valid_targets_min": 530 }, { "epoch": 3.45984, "grad_norm": 0.12814024690841339, "learning_rate": 1.0503078575631052e-05, "loss": 0.0565, "loss_nan_ranks": 0, "loss_rank_avg": 0.019158998504281044, "step": 3605, "valid_targets_mean": 9547.4, "valid_targets_min": 4525 }, { "epoch": 3.46464, "grad_norm": 0.1352022401477249, "learning_rate": 1.0444168061133846e-05, "loss": 0.0587, "loss_nan_ranks": 0, "loss_rank_avg": 0.019761083647608757, "step": 3610, "valid_targets_mean": 8394.5, "valid_targets_min": 4757 }, { "epoch": 3.46944, "grad_norm": 0.12312753724496196, "learning_rate": 1.0385364784310636e-05, "loss": 0.0558, "loss_nan_ranks": 0, "loss_rank_avg": 0.017157310619950294, "step": 3615, "valid_targets_mean": 8024.5, "valid_targets_min": 2974 }, { "epoch": 3.47424, "grad_norm": 0.13533009632046408, "learning_rate": 1.0326669405064904e-05, "loss": 0.056, "loss_nan_ranks": 0, "loss_rank_avg": 0.015769323334097862, "step": 3620, "valid_targets_mean": 9096.3, "valid_targets_min": 3278 }, { "epoch": 3.47904, "grad_norm": 0.14320717457173768, "learning_rate": 1.0268082582089263e-05, "loss": 0.0575, "loss_nan_ranks": 0, "loss_rank_avg": 0.01656205952167511, "step": 3625, "valid_targets_mean": 7964.6, "valid_targets_min": 2824 }, { "epoch": 3.48384, "grad_norm": 0.1436771220110468, "learning_rate": 1.0209604972858081e-05, "loss": 0.0553, "loss_nan_ranks": 0, "loss_rank_avg": 0.01845899596810341, "step": 3630, "valid_targets_mean": 8401.7, "valid_targets_min": 2868 }, { "epoch": 3.48864, "grad_norm": 0.1331002867624431, "learning_rate": 1.0151237233620115e-05, "loss": 0.0546, "loss_nan_ranks": 0, "loss_rank_avg": 0.015434859320521355, "step": 3635, "valid_targets_mean": 8922.3, "valid_targets_min": 3232 }, { "epoch": 3.49344, "grad_norm": 0.15962729586395075, "learning_rate": 1.0092980019391132e-05, "loss": 0.0592, "loss_nan_ranks": 0, "loss_rank_avg": 0.018679436296224594, "step": 3640, "valid_targets_mean": 9329.9, "valid_targets_min": 3781 }, { "epoch": 3.49824, "grad_norm": 0.15818938989627598, "learning_rate": 1.0034833983946561e-05, "loss": 0.0553, "loss_nan_ranks": 0, "loss_rank_avg": 0.016482515260577202, "step": 3645, "valid_targets_mean": 8887.6, "valid_targets_min": 1640 }, { "epoch": 3.50304, "grad_norm": 0.12431356399603527, "learning_rate": 9.976799779814157e-06, "loss": 0.0555, "loss_nan_ranks": 0, "loss_rank_avg": 0.017481375485658646, "step": 3650, "valid_targets_mean": 8482.5, "valid_targets_min": 4381 }, { "epoch": 3.50784, "grad_norm": 0.1322854401566673, "learning_rate": 9.918878058266687e-06, "loss": 0.0576, "loss_nan_ranks": 0, "loss_rank_avg": 0.017938459292054176, "step": 3655, "valid_targets_mean": 8828.8, "valid_targets_min": 3313 }, { "epoch": 3.51264, "grad_norm": 0.1253467544366567, "learning_rate": 9.86106946931462e-06, "loss": 0.0596, "loss_nan_ranks": 0, "loss_rank_avg": 0.019131455570459366, "step": 3660, "valid_targets_mean": 9941.3, "valid_targets_min": 4437 }, { "epoch": 3.51744, "grad_norm": 0.13652918694567162, "learning_rate": 9.803374661698802e-06, "loss": 0.0559, "loss_nan_ranks": 0, "loss_rank_avg": 0.019458845257759094, "step": 3665, "valid_targets_mean": 7816.9, "valid_targets_min": 1823 }, { "epoch": 3.52224, "grad_norm": 0.14742469694336255, "learning_rate": 9.745794282883215e-06, "loss": 0.057, "loss_nan_ranks": 0, "loss_rank_avg": 0.01716812141239643, "step": 3670, "valid_targets_mean": 8304.0, "valid_targets_min": 2191 }, { "epoch": 3.52704, "grad_norm": 0.13348912229457513, "learning_rate": 9.688328979047689e-06, "loss": 0.0557, "loss_nan_ranks": 0, "loss_rank_avg": 0.018630236387252808, "step": 3675, "valid_targets_mean": 8479.3, "valid_targets_min": 3012 }, { "epoch": 3.53184, "grad_norm": 0.13047629376112002, "learning_rate": 9.630979395080667e-06, "loss": 0.0594, "loss_nan_ranks": 0, "loss_rank_avg": 0.01872425712645054, "step": 3680, "valid_targets_mean": 7992.5, "valid_targets_min": 2228 }, { "epoch": 3.5366400000000002, "grad_norm": 0.13156923893488706, "learning_rate": 9.573746174571947e-06, "loss": 0.0555, "loss_nan_ranks": 0, "loss_rank_avg": 0.016432328149676323, "step": 3685, "valid_targets_mean": 9221.1, "valid_targets_min": 2341 }, { "epoch": 3.54144, "grad_norm": 0.13209300474839575, "learning_rate": 9.516629959805468e-06, "loss": 0.0557, "loss_nan_ranks": 0, "loss_rank_avg": 0.02003823220729828, "step": 3690, "valid_targets_mean": 8710.9, "valid_targets_min": 1444 }, { "epoch": 3.54624, "grad_norm": 0.13116046245364235, "learning_rate": 9.459631391752126e-06, "loss": 0.0568, "loss_nan_ranks": 0, "loss_rank_avg": 0.01843874529004097, "step": 3695, "valid_targets_mean": 8378.2, "valid_targets_min": 3062 }, { "epoch": 3.55104, "grad_norm": 0.1285017503304282, "learning_rate": 9.40275111006254e-06, "loss": 0.0548, "loss_nan_ranks": 0, "loss_rank_avg": 0.016842100769281387, "step": 3700, "valid_targets_mean": 8139.7, "valid_targets_min": 2295 }, { "epoch": 3.55584, "grad_norm": 0.1472596562975354, "learning_rate": 9.345989753059895e-06, "loss": 0.0543, "loss_nan_ranks": 0, "loss_rank_avg": 0.016040191054344177, "step": 3705, "valid_targets_mean": 7992.1, "valid_targets_min": 2724 }, { "epoch": 3.5606400000000002, "grad_norm": 0.15633419217487327, "learning_rate": 9.289347957732779e-06, "loss": 0.0557, "loss_nan_ranks": 0, "loss_rank_avg": 0.017493966966867447, "step": 3710, "valid_targets_mean": 8839.2, "valid_targets_min": 1647 }, { "epoch": 3.56544, "grad_norm": 0.1357694551726591, "learning_rate": 9.232826359728034e-06, "loss": 0.0538, "loss_nan_ranks": 0, "loss_rank_avg": 0.015739034861326218, "step": 3715, "valid_targets_mean": 8887.0, "valid_targets_min": 2183 }, { "epoch": 3.57024, "grad_norm": 0.12207172176713575, "learning_rate": 9.17642559334362e-06, "loss": 0.054, "loss_nan_ranks": 0, "loss_rank_avg": 0.017870184034109116, "step": 3720, "valid_targets_mean": 8897.0, "valid_targets_min": 2011 }, { "epoch": 3.57504, "grad_norm": 0.14244558932230125, "learning_rate": 9.120146291521488e-06, "loss": 0.0561, "loss_nan_ranks": 0, "loss_rank_avg": 0.018513241782784462, "step": 3725, "valid_targets_mean": 8319.8, "valid_targets_min": 2365 }, { "epoch": 3.57984, "grad_norm": 0.13508176921493603, "learning_rate": 9.063989085840506e-06, "loss": 0.0566, "loss_nan_ranks": 0, "loss_rank_avg": 0.020369049161672592, "step": 3730, "valid_targets_mean": 8704.0, "valid_targets_min": 2203 }, { "epoch": 3.5846400000000003, "grad_norm": 0.12623222486610447, "learning_rate": 9.007954606509346e-06, "loss": 0.0534, "loss_nan_ranks": 0, "loss_rank_avg": 0.01837966777384281, "step": 3735, "valid_targets_mean": 8965.4, "valid_targets_min": 1896 }, { "epoch": 3.5894399999999997, "grad_norm": 0.13304702719999412, "learning_rate": 8.952043482359408e-06, "loss": 0.0534, "loss_nan_ranks": 0, "loss_rank_avg": 0.016147565096616745, "step": 3740, "valid_targets_mean": 8392.1, "valid_targets_min": 2734 }, { "epoch": 3.59424, "grad_norm": 0.1364610341024647, "learning_rate": 8.896256340837779e-06, "loss": 0.0579, "loss_nan_ranks": 0, "loss_rank_avg": 0.01738559827208519, "step": 3745, "valid_targets_mean": 8307.7, "valid_targets_min": 1612 }, { "epoch": 3.59904, "grad_norm": 0.12080918237441046, "learning_rate": 8.840593808000182e-06, "loss": 0.0557, "loss_nan_ranks": 0, "loss_rank_avg": 0.017990585416555405, "step": 3750, "valid_targets_mean": 8898.8, "valid_targets_min": 3751 }, { "epoch": 3.60384, "grad_norm": 0.135206313127372, "learning_rate": 8.785056508503956e-06, "loss": 0.0572, "loss_nan_ranks": 0, "loss_rank_avg": 0.01876853033900261, "step": 3755, "valid_targets_mean": 8321.2, "valid_targets_min": 1956 }, { "epoch": 3.60864, "grad_norm": 0.14146043288365848, "learning_rate": 8.729645065601045e-06, "loss": 0.058, "loss_nan_ranks": 0, "loss_rank_avg": 0.0189354345202446, "step": 3760, "valid_targets_mean": 8984.0, "valid_targets_min": 1806 }, { "epoch": 3.6134399999999998, "grad_norm": 0.1357690858168711, "learning_rate": 8.674360101130994e-06, "loss": 0.0545, "loss_nan_ranks": 0, "loss_rank_avg": 0.02032206952571869, "step": 3765, "valid_targets_mean": 8590.7, "valid_targets_min": 2433 }, { "epoch": 3.61824, "grad_norm": 0.13373124703486686, "learning_rate": 8.619202235514e-06, "loss": 0.0537, "loss_nan_ranks": 0, "loss_rank_avg": 0.016812438145279884, "step": 3770, "valid_targets_mean": 8781.7, "valid_targets_min": 4288 }, { "epoch": 3.62304, "grad_norm": 0.13777338990715324, "learning_rate": 8.564172087743903e-06, "loss": 0.057, "loss_nan_ranks": 0, "loss_rank_avg": 0.01906885765492916, "step": 3775, "valid_targets_mean": 8735.4, "valid_targets_min": 3098 }, { "epoch": 3.62784, "grad_norm": 0.13709427310817707, "learning_rate": 8.50927027538128e-06, "loss": 0.0558, "loss_nan_ranks": 0, "loss_rank_avg": 0.021031895652413368, "step": 3780, "valid_targets_mean": 8737.2, "valid_targets_min": 4732 }, { "epoch": 3.63264, "grad_norm": 0.1329046208350066, "learning_rate": 8.454497414546497e-06, "loss": 0.0583, "loss_nan_ranks": 0, "loss_rank_avg": 0.019182361662387848, "step": 3785, "valid_targets_mean": 9016.9, "valid_targets_min": 3997 }, { "epoch": 3.63744, "grad_norm": 0.12784288201977764, "learning_rate": 8.39985411991279e-06, "loss": 0.0587, "loss_nan_ranks": 0, "loss_rank_avg": 0.022063791751861572, "step": 3790, "valid_targets_mean": 9467.2, "valid_targets_min": 2158 }, { "epoch": 3.64224, "grad_norm": 0.13698351144349497, "learning_rate": 8.345341004699386e-06, "loss": 0.0574, "loss_nan_ranks": 0, "loss_rank_avg": 0.01915154419839382, "step": 3795, "valid_targets_mean": 9378.7, "valid_targets_min": 3433 }, { "epoch": 3.64704, "grad_norm": 0.13732974847111012, "learning_rate": 8.290958680664591e-06, "loss": 0.0585, "loss_nan_ranks": 0, "loss_rank_avg": 0.020820364356040955, "step": 3800, "valid_targets_mean": 8005.5, "valid_targets_min": 1450 }, { "epoch": 3.65184, "grad_norm": 0.13505357343036875, "learning_rate": 8.236707758098965e-06, "loss": 0.0579, "loss_nan_ranks": 0, "loss_rank_avg": 0.022526472806930542, "step": 3805, "valid_targets_mean": 8850.6, "valid_targets_min": 2488 }, { "epoch": 3.65664, "grad_norm": 0.1259729066577338, "learning_rate": 8.182588845818452e-06, "loss": 0.0552, "loss_nan_ranks": 0, "loss_rank_avg": 0.017887916415929794, "step": 3810, "valid_targets_mean": 8914.6, "valid_targets_min": 3411 }, { "epoch": 3.66144, "grad_norm": 0.13771971908346792, "learning_rate": 8.128602551157523e-06, "loss": 0.0546, "loss_nan_ranks": 0, "loss_rank_avg": 0.018062973394989967, "step": 3815, "valid_targets_mean": 8964.6, "valid_targets_min": 5691 }, { "epoch": 3.66624, "grad_norm": 0.1386182298823841, "learning_rate": 8.074749479962407e-06, "loss": 0.052, "loss_nan_ranks": 0, "loss_rank_avg": 0.016328800469636917, "step": 3820, "valid_targets_mean": 8711.1, "valid_targets_min": 2956 }, { "epoch": 3.67104, "grad_norm": 0.13208007285920464, "learning_rate": 8.021030236584254e-06, "loss": 0.0544, "loss_nan_ranks": 0, "loss_rank_avg": 0.01910882256925106, "step": 3825, "valid_targets_mean": 9311.3, "valid_targets_min": 2524 }, { "epoch": 3.67584, "grad_norm": 0.1526032805811713, "learning_rate": 7.967445423872384e-06, "loss": 0.0534, "loss_nan_ranks": 0, "loss_rank_avg": 0.015861565247178078, "step": 3830, "valid_targets_mean": 8945.5, "valid_targets_min": 2509 }, { "epoch": 3.68064, "grad_norm": 0.13026368761507842, "learning_rate": 7.913995643167494e-06, "loss": 0.0534, "loss_nan_ranks": 0, "loss_rank_avg": 0.017038773745298386, "step": 3835, "valid_targets_mean": 8394.8, "valid_targets_min": 2738 }, { "epoch": 3.68544, "grad_norm": 0.13774012408734024, "learning_rate": 7.860681494294917e-06, "loss": 0.056, "loss_nan_ranks": 0, "loss_rank_avg": 0.02027728408575058, "step": 3840, "valid_targets_mean": 8938.6, "valid_targets_min": 2062 }, { "epoch": 3.69024, "grad_norm": 0.14717144639640956, "learning_rate": 7.80750357555792e-06, "loss": 0.0582, "loss_nan_ranks": 0, "loss_rank_avg": 0.023341909050941467, "step": 3845, "valid_targets_mean": 8292.6, "valid_targets_min": 1771 }, { "epoch": 3.69504, "grad_norm": 0.1300340768573447, "learning_rate": 7.75446248373094e-06, "loss": 0.0552, "loss_nan_ranks": 0, "loss_rank_avg": 0.01564173400402069, "step": 3850, "valid_targets_mean": 8664.2, "valid_targets_min": 1719 }, { "epoch": 3.69984, "grad_norm": 0.13796606966954172, "learning_rate": 7.701558814052928e-06, "loss": 0.0564, "loss_nan_ranks": 0, "loss_rank_avg": 0.01939544826745987, "step": 3855, "valid_targets_mean": 8037.8, "valid_targets_min": 3725 }, { "epoch": 3.70464, "grad_norm": 0.12327605601391764, "learning_rate": 7.648793160220637e-06, "loss": 0.055, "loss_nan_ranks": 0, "loss_rank_avg": 0.019700098782777786, "step": 3860, "valid_targets_mean": 9027.4, "valid_targets_min": 3266 }, { "epoch": 3.70944, "grad_norm": 0.12894451099718549, "learning_rate": 7.596166114381991e-06, "loss": 0.0561, "loss_nan_ranks": 0, "loss_rank_avg": 0.01795964688062668, "step": 3865, "valid_targets_mean": 9631.7, "valid_targets_min": 4464 }, { "epoch": 3.71424, "grad_norm": 0.1462188211290315, "learning_rate": 7.543678267129408e-06, "loss": 0.0548, "loss_nan_ranks": 0, "loss_rank_avg": 0.021304085850715637, "step": 3870, "valid_targets_mean": 9413.1, "valid_targets_min": 3409 }, { "epoch": 3.71904, "grad_norm": 0.13526202499913728, "learning_rate": 7.491330207493215e-06, "loss": 0.0521, "loss_nan_ranks": 0, "loss_rank_avg": 0.018997564911842346, "step": 3875, "valid_targets_mean": 8982.6, "valid_targets_min": 1331 }, { "epoch": 3.72384, "grad_norm": 0.12959402426419273, "learning_rate": 7.4391225229349785e-06, "loss": 0.0537, "loss_nan_ranks": 0, "loss_rank_avg": 0.0176476389169693, "step": 3880, "valid_targets_mean": 8661.0, "valid_targets_min": 4132 }, { "epoch": 3.72864, "grad_norm": 0.1380153099186334, "learning_rate": 7.387055799340977e-06, "loss": 0.0513, "loss_nan_ranks": 0, "loss_rank_avg": 0.018710440024733543, "step": 3885, "valid_targets_mean": 8980.4, "valid_targets_min": 2790 }, { "epoch": 3.73344, "grad_norm": 0.1381226259425154, "learning_rate": 7.3351306210155645e-06, "loss": 0.0541, "loss_nan_ranks": 0, "loss_rank_avg": 0.017781345173716545, "step": 3890, "valid_targets_mean": 9528.7, "valid_targets_min": 5213 }, { "epoch": 3.7382400000000002, "grad_norm": 0.14650329599062215, "learning_rate": 7.283347570674664e-06, "loss": 0.0536, "loss_nan_ranks": 0, "loss_rank_avg": 0.019584622234106064, "step": 3895, "valid_targets_mean": 9252.9, "valid_targets_min": 1925 }, { "epoch": 3.74304, "grad_norm": 0.13350511389861328, "learning_rate": 7.231707229439191e-06, "loss": 0.0557, "loss_nan_ranks": 0, "loss_rank_avg": 0.018930701538920403, "step": 3900, "valid_targets_mean": 8362.8, "valid_targets_min": 3106 }, { "epoch": 3.74784, "grad_norm": 0.1301142031540442, "learning_rate": 7.180210176828557e-06, "loss": 0.0539, "loss_nan_ranks": 0, "loss_rank_avg": 0.01843518391251564, "step": 3905, "valid_targets_mean": 8952.4, "valid_targets_min": 1932 }, { "epoch": 3.75264, "grad_norm": 0.14804851725083004, "learning_rate": 7.1288569907541495e-06, "loss": 0.0542, "loss_nan_ranks": 0, "loss_rank_avg": 0.016517702490091324, "step": 3910, "valid_targets_mean": 8982.4, "valid_targets_min": 3753 }, { "epoch": 3.75744, "grad_norm": 0.1472353370607068, "learning_rate": 7.0776482475128674e-06, "loss": 0.0527, "loss_nan_ranks": 0, "loss_rank_avg": 0.01933884434401989, "step": 3915, "valid_targets_mean": 7994.6, "valid_targets_min": 1413 }, { "epoch": 3.7622400000000003, "grad_norm": 0.12792785699272863, "learning_rate": 7.026584521780628e-06, "loss": 0.052, "loss_nan_ranks": 0, "loss_rank_avg": 0.021142924204468727, "step": 3920, "valid_targets_mean": 9141.5, "valid_targets_min": 2962 }, { "epoch": 3.76704, "grad_norm": 0.1365740601360126, "learning_rate": 6.9756663866059324e-06, "loss": 0.0568, "loss_nan_ranks": 0, "loss_rank_avg": 0.017975568771362305, "step": 3925, "valid_targets_mean": 8611.1, "valid_targets_min": 3075 }, { "epoch": 3.77184, "grad_norm": 0.1280897139250657, "learning_rate": 6.924894413403434e-06, "loss": 0.0562, "loss_nan_ranks": 0, "loss_rank_avg": 0.015527415089309216, "step": 3930, "valid_targets_mean": 7602.2, "valid_targets_min": 3152 }, { "epoch": 3.77664, "grad_norm": 0.133581093629811, "learning_rate": 6.874269171947516e-06, "loss": 0.0545, "loss_nan_ranks": 0, "loss_rank_avg": 0.01571614481508732, "step": 3935, "valid_targets_mean": 8710.9, "valid_targets_min": 3037 }, { "epoch": 3.78144, "grad_norm": 0.13173898278248164, "learning_rate": 6.8237912303659195e-06, "loss": 0.0549, "loss_nan_ranks": 0, "loss_rank_avg": 0.01879742182791233, "step": 3940, "valid_targets_mean": 8989.7, "valid_targets_min": 3746 }, { "epoch": 3.7862400000000003, "grad_norm": 0.12954058129422952, "learning_rate": 6.773461155133334e-06, "loss": 0.0538, "loss_nan_ranks": 0, "loss_rank_avg": 0.016739197075366974, "step": 3945, "valid_targets_mean": 8927.5, "valid_targets_min": 5341 }, { "epoch": 3.7910399999999997, "grad_norm": 0.12613131464245048, "learning_rate": 6.723279511065088e-06, "loss": 0.0523, "loss_nan_ranks": 0, "loss_rank_avg": 0.016926273703575134, "step": 3950, "valid_targets_mean": 9623.4, "valid_targets_min": 2541 }, { "epoch": 3.79584, "grad_norm": 0.1292964362058766, "learning_rate": 6.673246861310751e-06, "loss": 0.0532, "loss_nan_ranks": 0, "loss_rank_avg": 0.017725899815559387, "step": 3955, "valid_targets_mean": 7859.5, "valid_targets_min": 3588 }, { "epoch": 3.80064, "grad_norm": 0.130316879874074, "learning_rate": 6.623363767347874e-06, "loss": 0.0535, "loss_nan_ranks": 0, "loss_rank_avg": 0.02152263931930065, "step": 3960, "valid_targets_mean": 9065.3, "valid_targets_min": 1925 }, { "epoch": 3.80544, "grad_norm": 0.12971369743191016, "learning_rate": 6.5736307889756425e-06, "loss": 0.0545, "loss_nan_ranks": 0, "loss_rank_avg": 0.016394753009080887, "step": 3965, "valid_targets_mean": 8884.4, "valid_targets_min": 2482 }, { "epoch": 3.81024, "grad_norm": 0.1568859332985799, "learning_rate": 6.5240484843086095e-06, "loss": 0.0538, "loss_nan_ranks": 0, "loss_rank_avg": 0.021794119849801064, "step": 3970, "valid_targets_mean": 9304.8, "valid_targets_min": 1462 }, { "epoch": 3.8150399999999998, "grad_norm": 0.13421165461310694, "learning_rate": 6.474617409770441e-06, "loss": 0.0542, "loss_nan_ranks": 0, "loss_rank_avg": 0.01763138733804226, "step": 3975, "valid_targets_mean": 8132.8, "valid_targets_min": 922 }, { "epoch": 3.81984, "grad_norm": 0.12677902333212412, "learning_rate": 6.425338120087665e-06, "loss": 0.0542, "loss_nan_ranks": 0, "loss_rank_avg": 0.017714576795697212, "step": 3980, "valid_targets_mean": 8993.7, "valid_targets_min": 2647 }, { "epoch": 3.82464, "grad_norm": 0.13212966268794687, "learning_rate": 6.3762111682834374e-06, "loss": 0.0545, "loss_nan_ranks": 0, "loss_rank_avg": 0.01865052804350853, "step": 3985, "valid_targets_mean": 8879.0, "valid_targets_min": 2453 }, { "epoch": 3.82944, "grad_norm": 0.1407986051119374, "learning_rate": 6.327237105671362e-06, "loss": 0.0558, "loss_nan_ranks": 0, "loss_rank_avg": 0.017468944191932678, "step": 3990, "valid_targets_mean": 9018.7, "valid_targets_min": 2962 }, { "epoch": 3.83424, "grad_norm": 0.1320979084915881, "learning_rate": 6.278416481849274e-06, "loss": 0.0548, "loss_nan_ranks": 0, "loss_rank_avg": 0.016698092222213745, "step": 3995, "valid_targets_mean": 8318.9, "valid_targets_min": 3301 }, { "epoch": 3.83904, "grad_norm": 0.12990710853432647, "learning_rate": 6.22974984469308e-06, "loss": 0.0537, "loss_nan_ranks": 0, "loss_rank_avg": 0.01842219941318035, "step": 4000, "valid_targets_mean": 8659.0, "valid_targets_min": 1468 }, { "epoch": 3.84384, "grad_norm": 0.13236712617272228, "learning_rate": 6.181237740350625e-06, "loss": 0.0533, "loss_nan_ranks": 0, "loss_rank_avg": 0.020259007811546326, "step": 4005, "valid_targets_mean": 8054.6, "valid_targets_min": 2687 }, { "epoch": 3.84864, "grad_norm": 0.13041784618423918, "learning_rate": 6.132880713235543e-06, "loss": 0.0554, "loss_nan_ranks": 0, "loss_rank_avg": 0.018737755715847015, "step": 4010, "valid_targets_mean": 9364.6, "valid_targets_min": 3819 }, { "epoch": 3.85344, "grad_norm": 0.13524360240078845, "learning_rate": 6.084679306021162e-06, "loss": 0.053, "loss_nan_ranks": 0, "loss_rank_avg": 0.015698693692684174, "step": 4015, "valid_targets_mean": 7918.4, "valid_targets_min": 2787 }, { "epoch": 3.85824, "grad_norm": 0.12236282756023174, "learning_rate": 6.036634059634403e-06, "loss": 0.0533, "loss_nan_ranks": 0, "loss_rank_avg": 0.016556216403841972, "step": 4020, "valid_targets_mean": 8993.7, "valid_targets_min": 3277 }, { "epoch": 3.86304, "grad_norm": 0.13236991040385118, "learning_rate": 5.988745513249723e-06, "loss": 0.0548, "loss_nan_ranks": 0, "loss_rank_avg": 0.015798557549715042, "step": 4025, "valid_targets_mean": 7554.2, "valid_targets_min": 2150 }, { "epoch": 3.86784, "grad_norm": 0.1290662796744428, "learning_rate": 5.941014204283065e-06, "loss": 0.0524, "loss_nan_ranks": 0, "loss_rank_avg": 0.017221640795469284, "step": 4030, "valid_targets_mean": 8782.2, "valid_targets_min": 3375 }, { "epoch": 3.87264, "grad_norm": 0.14205933896083572, "learning_rate": 5.893440668385797e-06, "loss": 0.056, "loss_nan_ranks": 0, "loss_rank_avg": 0.018951009958982468, "step": 4035, "valid_targets_mean": 8017.5, "valid_targets_min": 3253 }, { "epoch": 3.87744, "grad_norm": 0.1368306093679873, "learning_rate": 5.8460254394387335e-06, "loss": 0.0562, "loss_nan_ranks": 0, "loss_rank_avg": 0.018680622801184654, "step": 4040, "valid_targets_mean": 8573.9, "valid_targets_min": 3166 }, { "epoch": 3.88224, "grad_norm": 0.14792994727994602, "learning_rate": 5.798769049546136e-06, "loss": 0.0536, "loss_nan_ranks": 0, "loss_rank_avg": 0.01788490265607834, "step": 4045, "valid_targets_mean": 8650.3, "valid_targets_min": 3015 }, { "epoch": 3.88704, "grad_norm": 0.12797744609338996, "learning_rate": 5.751672029029734e-06, "loss": 0.0541, "loss_nan_ranks": 0, "loss_rank_avg": 0.017983146011829376, "step": 4050, "valid_targets_mean": 9032.2, "valid_targets_min": 3561 }, { "epoch": 3.89184, "grad_norm": 0.1368383859346621, "learning_rate": 5.704734906422775e-06, "loss": 0.0542, "loss_nan_ranks": 0, "loss_rank_avg": 0.01866726018488407, "step": 4055, "valid_targets_mean": 8509.7, "valid_targets_min": 1352 }, { "epoch": 3.89664, "grad_norm": 0.1274931135133911, "learning_rate": 5.657958208464103e-06, "loss": 0.0543, "loss_nan_ranks": 0, "loss_rank_avg": 0.017809130251407623, "step": 4060, "valid_targets_mean": 9095.2, "valid_targets_min": 3414 }, { "epoch": 3.90144, "grad_norm": 0.12446892196214056, "learning_rate": 5.611342460092244e-06, "loss": 0.0569, "loss_nan_ranks": 0, "loss_rank_avg": 0.018567975610494614, "step": 4065, "valid_targets_mean": 8345.9, "valid_targets_min": 1662 }, { "epoch": 3.90624, "grad_norm": 0.13830759122979366, "learning_rate": 5.564888184439505e-06, "loss": 0.0567, "loss_nan_ranks": 0, "loss_rank_avg": 0.017078258097171783, "step": 4070, "valid_targets_mean": 8059.1, "valid_targets_min": 1554 }, { "epoch": 3.91104, "grad_norm": 0.36165706553152754, "learning_rate": 5.5185959028261135e-06, "loss": 0.0553, "loss_nan_ranks": 0, "loss_rank_avg": 0.02065645530819893, "step": 4075, "valid_targets_mean": 9743.2, "valid_targets_min": 5526 }, { "epoch": 3.91584, "grad_norm": 0.1316808841029414, "learning_rate": 5.47246613475436e-06, "loss": 0.0547, "loss_nan_ranks": 0, "loss_rank_avg": 0.01675555296242237, "step": 4080, "valid_targets_mean": 9094.8, "valid_targets_min": 4363 }, { "epoch": 3.92064, "grad_norm": 0.14798968834118362, "learning_rate": 5.4264993979027735e-06, "loss": 0.055, "loss_nan_ranks": 0, "loss_rank_avg": 0.019093751907348633, "step": 4085, "valid_targets_mean": 9276.1, "valid_targets_min": 2780 }, { "epoch": 3.92544, "grad_norm": 0.13158694237133187, "learning_rate": 5.380696208120315e-06, "loss": 0.052, "loss_nan_ranks": 0, "loss_rank_avg": 0.020652972161769867, "step": 4090, "valid_targets_mean": 9859.9, "valid_targets_min": 4035 }, { "epoch": 3.93024, "grad_norm": 0.14195945121470888, "learning_rate": 5.335057079420571e-06, "loss": 0.0532, "loss_nan_ranks": 0, "loss_rank_avg": 0.017747461795806885, "step": 4095, "valid_targets_mean": 8872.0, "valid_targets_min": 2232 }, { "epoch": 3.93504, "grad_norm": 0.1374303761783451, "learning_rate": 5.289582523976015e-06, "loss": 0.0536, "loss_nan_ranks": 0, "loss_rank_avg": 0.017126193270087242, "step": 4100, "valid_targets_mean": 8146.2, "valid_targets_min": 2982 }, { "epoch": 3.9398400000000002, "grad_norm": 0.14182449340419634, "learning_rate": 5.244273052112241e-06, "loss": 0.0536, "loss_nan_ranks": 0, "loss_rank_avg": 0.018104974180459976, "step": 4105, "valid_targets_mean": 8459.2, "valid_targets_min": 4292 }, { "epoch": 3.94464, "grad_norm": 0.12798985706630067, "learning_rate": 5.199129172302224e-06, "loss": 0.0516, "loss_nan_ranks": 0, "loss_rank_avg": 0.018952365964651108, "step": 4110, "valid_targets_mean": 9065.8, "valid_targets_min": 2898 }, { "epoch": 3.94944, "grad_norm": 0.13189531058235807, "learning_rate": 5.154151391160638e-06, "loss": 0.0521, "loss_nan_ranks": 0, "loss_rank_avg": 0.018595896661281586, "step": 4115, "valid_targets_mean": 9053.8, "valid_targets_min": 2092 }, { "epoch": 3.95424, "grad_norm": 0.1247555985934334, "learning_rate": 5.109340213438156e-06, "loss": 0.0503, "loss_nan_ranks": 0, "loss_rank_avg": 0.015505434945225716, "step": 4120, "valid_targets_mean": 8914.9, "valid_targets_min": 2859 }, { "epoch": 3.95904, "grad_norm": 0.13611501132172, "learning_rate": 5.0646961420157995e-06, "loss": 0.0538, "loss_nan_ranks": 0, "loss_rank_avg": 0.018326323479413986, "step": 4125, "valid_targets_mean": 8805.6, "valid_targets_min": 4681 }, { "epoch": 3.9638400000000003, "grad_norm": 0.14009893602915602, "learning_rate": 5.020219677899276e-06, "loss": 0.0567, "loss_nan_ranks": 0, "loss_rank_avg": 0.016717668622732162, "step": 4130, "valid_targets_mean": 8772.8, "valid_targets_min": 2911 }, { "epoch": 3.9686399999999997, "grad_norm": 0.12119906324919044, "learning_rate": 4.975911320213365e-06, "loss": 0.0509, "loss_nan_ranks": 0, "loss_rank_avg": 0.01370596420019865, "step": 4135, "valid_targets_mean": 8794.0, "valid_targets_min": 1818 }, { "epoch": 3.97344, "grad_norm": 0.14093350602423113, "learning_rate": 4.931771566196332e-06, "loss": 0.0538, "loss_nan_ranks": 0, "loss_rank_avg": 0.016862042248249054, "step": 4140, "valid_targets_mean": 8397.8, "valid_targets_min": 3079 }, { "epoch": 3.97824, "grad_norm": 0.1349495489817161, "learning_rate": 4.887800911194327e-06, "loss": 0.0558, "loss_nan_ranks": 0, "loss_rank_avg": 0.02118859626352787, "step": 4145, "valid_targets_mean": 9048.3, "valid_targets_min": 5051 }, { "epoch": 3.98304, "grad_norm": 0.13142737943814867, "learning_rate": 4.8439998486558246e-06, "loss": 0.0528, "loss_nan_ranks": 0, "loss_rank_avg": 0.01611470803618431, "step": 4150, "valid_targets_mean": 8308.8, "valid_targets_min": 2652 }, { "epoch": 3.9878400000000003, "grad_norm": 0.13509533467515525, "learning_rate": 4.800368870126111e-06, "loss": 0.0528, "loss_nan_ranks": 0, "loss_rank_avg": 0.0191353652626276, "step": 4155, "valid_targets_mean": 8963.3, "valid_targets_min": 3633 }, { "epoch": 3.9926399999999997, "grad_norm": 0.14336406928605755, "learning_rate": 4.756908465241736e-06, "loss": 0.0538, "loss_nan_ranks": 0, "loss_rank_avg": 0.01861722022294998, "step": 4160, "valid_targets_mean": 8617.6, "valid_targets_min": 1813 }, { "epoch": 3.99744, "grad_norm": 0.13786327261197132, "learning_rate": 4.713619121725039e-06, "loss": 0.052, "loss_nan_ranks": 0, "loss_rank_avg": 0.016211070120334625, "step": 4165, "valid_targets_mean": 8242.3, "valid_targets_min": 1738 }, { "epoch": 4.00192, "grad_norm": 0.13937769816078396, "learning_rate": 4.670501325378682e-06, "loss": 0.0557, "loss_nan_ranks": 0, "loss_rank_avg": 0.024742331355810165, "step": 4170, "valid_targets_mean": 9415.3, "valid_targets_min": 1752 }, { "epoch": 4.00672, "grad_norm": 0.13260992045284067, "learning_rate": 4.627555560080173e-06, "loss": 0.0611, "loss_nan_ranks": 0, "loss_rank_avg": 0.020355109125375748, "step": 4175, "valid_targets_mean": 8578.2, "valid_targets_min": 2279 }, { "epoch": 4.01152, "grad_norm": 0.12136644577113068, "learning_rate": 4.5847823077764565e-06, "loss": 0.059, "loss_nan_ranks": 0, "loss_rank_avg": 0.01977297104895115, "step": 4180, "valid_targets_mean": 9292.6, "valid_targets_min": 2064 }, { "epoch": 4.01632, "grad_norm": 0.12215655268804888, "learning_rate": 4.5421820484784936e-06, "loss": 0.0593, "loss_nan_ranks": 0, "loss_rank_avg": 0.01999478042125702, "step": 4185, "valid_targets_mean": 7845.3, "valid_targets_min": 2443 }, { "epoch": 4.02112, "grad_norm": 0.11025685198030728, "learning_rate": 4.499755260255881e-06, "loss": 0.0608, "loss_nan_ranks": 0, "loss_rank_avg": 0.018016569316387177, "step": 4190, "valid_targets_mean": 9317.6, "valid_targets_min": 4456 }, { "epoch": 4.02592, "grad_norm": 0.12199348277560307, "learning_rate": 4.457502419231483e-06, "loss": 0.0585, "loss_nan_ranks": 0, "loss_rank_avg": 0.018790187314152718, "step": 4195, "valid_targets_mean": 8750.2, "valid_targets_min": 2849 }, { "epoch": 4.03072, "grad_norm": 0.11851887247821241, "learning_rate": 4.415423999576091e-06, "loss": 0.0595, "loss_nan_ranks": 0, "loss_rank_avg": 0.018436409533023834, "step": 4200, "valid_targets_mean": 8257.3, "valid_targets_min": 2090 }, { "epoch": 4.03552, "grad_norm": 0.12943593708733644, "learning_rate": 4.373520473503097e-06, "loss": 0.0601, "loss_nan_ranks": 0, "loss_rank_avg": 0.022049235180020332, "step": 4205, "valid_targets_mean": 8969.0, "valid_targets_min": 1560 }, { "epoch": 4.04032, "grad_norm": 0.12087582197109357, "learning_rate": 4.33179231126321e-06, "loss": 0.0566, "loss_nan_ranks": 0, "loss_rank_avg": 0.017242740839719772, "step": 4210, "valid_targets_mean": 8371.2, "valid_targets_min": 3676 }, { "epoch": 4.04512, "grad_norm": 0.12253314755510665, "learning_rate": 4.2902399811391575e-06, "loss": 0.06, "loss_nan_ranks": 0, "loss_rank_avg": 0.019466323778033257, "step": 4215, "valid_targets_mean": 9305.2, "valid_targets_min": 4992 }, { "epoch": 4.04992, "grad_norm": 0.11319613242190042, "learning_rate": 4.248863949440436e-06, "loss": 0.0586, "loss_nan_ranks": 0, "loss_rank_avg": 0.018419280648231506, "step": 4220, "valid_targets_mean": 9305.4, "valid_targets_min": 3216 }, { "epoch": 4.05472, "grad_norm": 0.12553938847694884, "learning_rate": 4.207664680498094e-06, "loss": 0.0591, "loss_nan_ranks": 0, "loss_rank_avg": 0.01968151330947876, "step": 4225, "valid_targets_mean": 9126.7, "valid_targets_min": 2259 }, { "epoch": 4.05952, "grad_norm": 0.12183311961705774, "learning_rate": 4.166642636659495e-06, "loss": 0.0602, "loss_nan_ranks": 0, "loss_rank_avg": 0.01877449080348015, "step": 4230, "valid_targets_mean": 8311.8, "valid_targets_min": 3816 }, { "epoch": 4.06432, "grad_norm": 0.1174766482044172, "learning_rate": 4.125798278283155e-06, "loss": 0.0576, "loss_nan_ranks": 0, "loss_rank_avg": 0.017112433910369873, "step": 4235, "valid_targets_mean": 8814.9, "valid_targets_min": 2509 }, { "epoch": 4.06912, "grad_norm": 0.11859507691645307, "learning_rate": 4.085132063733554e-06, "loss": 0.0599, "loss_nan_ranks": 0, "loss_rank_avg": 0.02330220490694046, "step": 4240, "valid_targets_mean": 8392.0, "valid_targets_min": 2719 }, { "epoch": 4.07392, "grad_norm": 0.12638051636040903, "learning_rate": 4.0446444493760165e-06, "loss": 0.0614, "loss_nan_ranks": 0, "loss_rank_avg": 0.01938215270638466, "step": 4245, "valid_targets_mean": 8159.9, "valid_targets_min": 3346 }, { "epoch": 4.07872, "grad_norm": 0.1228089615134463, "learning_rate": 4.004335889571556e-06, "loss": 0.0585, "loss_nan_ranks": 0, "loss_rank_avg": 0.0213320329785347, "step": 4250, "valid_targets_mean": 8913.4, "valid_targets_min": 2661 }, { "epoch": 4.08352, "grad_norm": 0.11774846166929161, "learning_rate": 3.96420683667182e-06, "loss": 0.059, "loss_nan_ranks": 0, "loss_rank_avg": 0.017504338175058365, "step": 4255, "valid_targets_mean": 8633.9, "valid_targets_min": 3543 }, { "epoch": 4.08832, "grad_norm": 0.11486128306446362, "learning_rate": 3.924257741013968e-06, "loss": 0.0593, "loss_nan_ranks": 0, "loss_rank_avg": 0.01892087049782276, "step": 4260, "valid_targets_mean": 9490.9, "valid_targets_min": 5870 }, { "epoch": 4.09312, "grad_norm": 0.12123842804798597, "learning_rate": 3.884489050915652e-06, "loss": 0.0577, "loss_nan_ranks": 0, "loss_rank_avg": 0.017838746309280396, "step": 4265, "valid_targets_mean": 9250.5, "valid_targets_min": 2459 }, { "epoch": 4.09792, "grad_norm": 0.12190469160340199, "learning_rate": 3.844901212669962e-06, "loss": 0.0583, "loss_nan_ranks": 0, "loss_rank_avg": 0.019511397927999496, "step": 4270, "valid_targets_mean": 8654.8, "valid_targets_min": 4446 }, { "epoch": 4.10272, "grad_norm": 0.12941809477086033, "learning_rate": 3.8054946705404415e-06, "loss": 0.0607, "loss_nan_ranks": 0, "loss_rank_avg": 0.021360494196414948, "step": 4275, "valid_targets_mean": 7698.9, "valid_targets_min": 2140 }, { "epoch": 4.10752, "grad_norm": 0.11911570039785059, "learning_rate": 3.7662698667560714e-06, "loss": 0.058, "loss_nan_ranks": 0, "loss_rank_avg": 0.022066941484808922, "step": 4280, "valid_targets_mean": 8562.8, "valid_targets_min": 2101 }, { "epoch": 4.11232, "grad_norm": 0.1237060154496202, "learning_rate": 3.7272272415063484e-06, "loss": 0.0596, "loss_nan_ranks": 0, "loss_rank_avg": 0.020797599107027054, "step": 4285, "valid_targets_mean": 9182.3, "valid_targets_min": 2194 }, { "epoch": 4.11712, "grad_norm": 0.12222076744088618, "learning_rate": 3.6883672329363007e-06, "loss": 0.0615, "loss_nan_ranks": 0, "loss_rank_avg": 0.020003672689199448, "step": 4290, "valid_targets_mean": 8025.3, "valid_targets_min": 2380 }, { "epoch": 4.12192, "grad_norm": 0.1268561459483808, "learning_rate": 3.649690277141598e-06, "loss": 0.0592, "loss_nan_ranks": 0, "loss_rank_avg": 0.020146148279309273, "step": 4295, "valid_targets_mean": 8866.0, "valid_targets_min": 1757 }, { "epoch": 4.12672, "grad_norm": 0.1203324885785926, "learning_rate": 3.6111968081636507e-06, "loss": 0.0616, "loss_nan_ranks": 0, "loss_rank_avg": 0.021221231669187546, "step": 4300, "valid_targets_mean": 8719.1, "valid_targets_min": 3671 }, { "epoch": 4.13152, "grad_norm": 0.12018186551080842, "learning_rate": 3.572887257984743e-06, "loss": 0.0603, "loss_nan_ranks": 0, "loss_rank_avg": 0.01852181926369667, "step": 4305, "valid_targets_mean": 8375.8, "valid_targets_min": 2431 }, { "epoch": 4.1363199999999996, "grad_norm": 0.11684594358500293, "learning_rate": 3.5347620565231733e-06, "loss": 0.0563, "loss_nan_ranks": 0, "loss_rank_avg": 0.016558483242988586, "step": 4310, "valid_targets_mean": 8316.6, "valid_targets_min": 3148 }, { "epoch": 4.14112, "grad_norm": 0.1145696786032025, "learning_rate": 3.496821631628442e-06, "loss": 0.0556, "loss_nan_ranks": 0, "loss_rank_avg": 0.016824206337332726, "step": 4315, "valid_targets_mean": 9543.6, "valid_targets_min": 5120 }, { "epoch": 4.14592, "grad_norm": 0.1329769792894044, "learning_rate": 3.459066409076448e-06, "loss": 0.0577, "loss_nan_ranks": 0, "loss_rank_avg": 0.020469941198825836, "step": 4320, "valid_targets_mean": 9157.2, "valid_targets_min": 4740 }, { "epoch": 4.15072, "grad_norm": 0.12076030631519495, "learning_rate": 3.421496812564713e-06, "loss": 0.058, "loss_nan_ranks": 0, "loss_rank_avg": 0.019596287980675697, "step": 4325, "valid_targets_mean": 9119.2, "valid_targets_min": 2239 }, { "epoch": 4.15552, "grad_norm": 0.12445424995710275, "learning_rate": 3.384113263707609e-06, "loss": 0.0579, "loss_nan_ranks": 0, "loss_rank_avg": 0.018446721136569977, "step": 4330, "valid_targets_mean": 7905.8, "valid_targets_min": 2773 }, { "epoch": 4.16032, "grad_norm": 0.11984162900794601, "learning_rate": 3.34691618203165e-06, "loss": 0.0606, "loss_nan_ranks": 0, "loss_rank_avg": 0.018406976014375687, "step": 4335, "valid_targets_mean": 9256.8, "valid_targets_min": 2197 }, { "epoch": 4.16512, "grad_norm": 0.12179081674701153, "learning_rate": 3.309905984970765e-06, "loss": 0.0585, "loss_nan_ranks": 0, "loss_rank_avg": 0.017512843012809753, "step": 4340, "valid_targets_mean": 8542.8, "valid_targets_min": 2767 }, { "epoch": 4.16992, "grad_norm": 0.11759843922722205, "learning_rate": 3.2730830878616305e-06, "loss": 0.0608, "loss_nan_ranks": 0, "loss_rank_avg": 0.02117135003209114, "step": 4345, "valid_targets_mean": 9212.2, "valid_targets_min": 2958 }, { "epoch": 4.17472, "grad_norm": 0.11807834168622429, "learning_rate": 3.2364479039389973e-06, "loss": 0.0606, "loss_nan_ranks": 0, "loss_rank_avg": 0.018724609166383743, "step": 4350, "valid_targets_mean": 8196.4, "valid_targets_min": 1964 }, { "epoch": 4.17952, "grad_norm": 0.1243844477116557, "learning_rate": 3.2000008443310505e-06, "loss": 0.0598, "loss_nan_ranks": 0, "loss_rank_avg": 0.02250153385102749, "step": 4355, "valid_targets_mean": 9202.8, "valid_targets_min": 1686 }, { "epoch": 4.18432, "grad_norm": 0.11956480020734431, "learning_rate": 3.1637423180548232e-06, "loss": 0.0579, "loss_nan_ranks": 0, "loss_rank_avg": 0.022235415875911713, "step": 4360, "valid_targets_mean": 9636.3, "valid_targets_min": 1629 }, { "epoch": 4.18912, "grad_norm": 0.1185081417491982, "learning_rate": 3.127672732011564e-06, "loss": 0.0619, "loss_nan_ranks": 0, "loss_rank_avg": 0.022327009588479996, "step": 4365, "valid_targets_mean": 9096.0, "valid_targets_min": 4447 }, { "epoch": 4.19392, "grad_norm": 0.12464353748951823, "learning_rate": 3.0917924909821993e-06, "loss": 0.0586, "loss_nan_ranks": 0, "loss_rank_avg": 0.022116748616099358, "step": 4370, "valid_targets_mean": 8855.2, "valid_targets_min": 2971 }, { "epoch": 4.19872, "grad_norm": 0.11711235388240054, "learning_rate": 3.0561019976227867e-06, "loss": 0.0579, "loss_nan_ranks": 0, "loss_rank_avg": 0.01701711304485798, "step": 4375, "valid_targets_mean": 8770.3, "valid_targets_min": 3883 }, { "epoch": 4.20352, "grad_norm": 0.12209386881284948, "learning_rate": 3.020601652459989e-06, "loss": 0.0607, "loss_nan_ranks": 0, "loss_rank_avg": 0.018716298043727875, "step": 4380, "valid_targets_mean": 8453.9, "valid_targets_min": 2471 }, { "epoch": 4.20832, "grad_norm": 0.1179732819427151, "learning_rate": 2.9852918538865847e-06, "loss": 0.0586, "loss_nan_ranks": 0, "loss_rank_avg": 0.01898093894124031, "step": 4385, "valid_targets_mean": 8763.5, "valid_targets_min": 1581 }, { "epoch": 4.21312, "grad_norm": 0.12433317521576756, "learning_rate": 2.950172998156995e-06, "loss": 0.0624, "loss_nan_ranks": 0, "loss_rank_avg": 0.023141473531723022, "step": 4390, "valid_targets_mean": 9088.0, "valid_targets_min": 3503 }, { "epoch": 4.21792, "grad_norm": 0.12187721181458719, "learning_rate": 2.91524547938284e-06, "loss": 0.057, "loss_nan_ranks": 0, "loss_rank_avg": 0.019292142242193222, "step": 4395, "valid_targets_mean": 9112.7, "valid_targets_min": 3780 }, { "epoch": 4.22272, "grad_norm": 0.1249249599539274, "learning_rate": 2.880509689528519e-06, "loss": 0.0589, "loss_nan_ranks": 0, "loss_rank_avg": 0.020155327394604683, "step": 4400, "valid_targets_mean": 8781.4, "valid_targets_min": 4800 }, { "epoch": 4.22752, "grad_norm": 0.12130990173874953, "learning_rate": 2.845966018406796e-06, "loss": 0.0602, "loss_nan_ranks": 0, "loss_rank_avg": 0.01886666938662529, "step": 4405, "valid_targets_mean": 8720.8, "valid_targets_min": 3689 }, { "epoch": 4.23232, "grad_norm": 0.12261482199844286, "learning_rate": 2.8116148536744448e-06, "loss": 0.0601, "loss_nan_ranks": 0, "loss_rank_avg": 0.02107727900147438, "step": 4410, "valid_targets_mean": 8796.9, "valid_targets_min": 4312 }, { "epoch": 4.23712, "grad_norm": 0.12041082622457164, "learning_rate": 2.777456580827882e-06, "loss": 0.0591, "loss_nan_ranks": 0, "loss_rank_avg": 0.02132035419344902, "step": 4415, "valid_targets_mean": 8781.2, "valid_targets_min": 2402 }, { "epoch": 4.24192, "grad_norm": 0.12018775604857752, "learning_rate": 2.7434915831988517e-06, "loss": 0.0603, "loss_nan_ranks": 0, "loss_rank_avg": 0.022251714020967484, "step": 4420, "valid_targets_mean": 9274.4, "valid_targets_min": 2195 }, { "epoch": 4.24672, "grad_norm": 0.12398684759078817, "learning_rate": 2.7097202419501246e-06, "loss": 0.0596, "loss_nan_ranks": 0, "loss_rank_avg": 0.018055105581879616, "step": 4425, "valid_targets_mean": 7853.2, "valid_targets_min": 2163 }, { "epoch": 4.25152, "grad_norm": 0.12381260153578, "learning_rate": 2.6761429360712045e-06, "loss": 0.0624, "loss_nan_ranks": 0, "loss_rank_avg": 0.022460700944066048, "step": 4430, "valid_targets_mean": 7861.3, "valid_targets_min": 2928 }, { "epoch": 4.25632, "grad_norm": 0.12825189987605026, "learning_rate": 2.642760042374106e-06, "loss": 0.0597, "loss_nan_ranks": 0, "loss_rank_avg": 0.020237209275364876, "step": 4435, "valid_targets_mean": 8969.5, "valid_targets_min": 3671 }, { "epoch": 4.26112, "grad_norm": 0.11707780055325222, "learning_rate": 2.6095719354890903e-06, "loss": 0.061, "loss_nan_ranks": 0, "loss_rank_avg": 0.02044464461505413, "step": 4440, "valid_targets_mean": 9385.6, "valid_targets_min": 5255 }, { "epoch": 4.26592, "grad_norm": 0.12130109167017335, "learning_rate": 2.5765789878604852e-06, "loss": 0.06, "loss_nan_ranks": 0, "loss_rank_avg": 0.021732307970523834, "step": 4445, "valid_targets_mean": 8074.7, "valid_targets_min": 1889 }, { "epoch": 4.27072, "grad_norm": 0.12861534811780176, "learning_rate": 2.543781569742496e-06, "loss": 0.0607, "loss_nan_ranks": 0, "loss_rank_avg": 0.021149098873138428, "step": 4450, "valid_targets_mean": 8897.9, "valid_targets_min": 4566 }, { "epoch": 4.27552, "grad_norm": 0.12345473230408648, "learning_rate": 2.5111800491950523e-06, "loss": 0.0616, "loss_nan_ranks": 0, "loss_rank_avg": 0.017032301053404808, "step": 4455, "valid_targets_mean": 8499.6, "valid_targets_min": 4038 }, { "epoch": 4.28032, "grad_norm": 0.11892032327078929, "learning_rate": 2.4787747920796723e-06, "loss": 0.0583, "loss_nan_ranks": 0, "loss_rank_avg": 0.021471751853823662, "step": 4460, "valid_targets_mean": 8411.4, "valid_targets_min": 2210 }, { "epoch": 4.28512, "grad_norm": 0.12166979430091211, "learning_rate": 2.446566162055377e-06, "loss": 0.0563, "loss_nan_ranks": 0, "loss_rank_avg": 0.017029765993356705, "step": 4465, "valid_targets_mean": 8300.8, "valid_targets_min": 1868 }, { "epoch": 4.28992, "grad_norm": 0.11722138076862068, "learning_rate": 2.414554520574579e-06, "loss": 0.0603, "loss_nan_ranks": 0, "loss_rank_avg": 0.01955687813460827, "step": 4470, "valid_targets_mean": 9353.0, "valid_targets_min": 3294 }, { "epoch": 4.29472, "grad_norm": 0.124316488723136, "learning_rate": 2.382740226879052e-06, "loss": 0.0604, "loss_nan_ranks": 0, "loss_rank_avg": 0.022426098585128784, "step": 4475, "valid_targets_mean": 9120.7, "valid_targets_min": 1679 }, { "epoch": 4.29952, "grad_norm": 0.11579019842855867, "learning_rate": 2.3511236379958824e-06, "loss": 0.0602, "loss_nan_ranks": 0, "loss_rank_avg": 0.018894197419285774, "step": 4480, "valid_targets_mean": 8811.9, "valid_targets_min": 3885 }, { "epoch": 4.30432, "grad_norm": 0.1259214272811187, "learning_rate": 2.31970510873347e-06, "loss": 0.0584, "loss_nan_ranks": 0, "loss_rank_avg": 0.024906959384679794, "step": 4485, "valid_targets_mean": 9129.3, "valid_targets_min": 3544 }, { "epoch": 4.30912, "grad_norm": 0.12084376607932995, "learning_rate": 2.2884849916775485e-06, "loss": 0.0616, "loss_nan_ranks": 0, "loss_rank_avg": 0.014221737161278725, "step": 4490, "valid_targets_mean": 8125.8, "valid_targets_min": 2826 }, { "epoch": 4.3139199999999995, "grad_norm": 0.11679620075564591, "learning_rate": 2.257463637187225e-06, "loss": 0.0574, "loss_nan_ranks": 0, "loss_rank_avg": 0.021385526284575462, "step": 4495, "valid_targets_mean": 8571.7, "valid_targets_min": 4541 }, { "epoch": 4.31872, "grad_norm": 0.12458729359845118, "learning_rate": 2.2266413933910426e-06, "loss": 0.058, "loss_nan_ranks": 0, "loss_rank_avg": 0.02144310250878334, "step": 4500, "valid_targets_mean": 8770.7, "valid_targets_min": 2390 }, { "epoch": 4.32352, "grad_norm": 0.1234814545306667, "learning_rate": 2.196018606183088e-06, "loss": 0.056, "loss_nan_ranks": 0, "loss_rank_avg": 0.01575743779540062, "step": 4505, "valid_targets_mean": 8572.1, "valid_targets_min": 2046 }, { "epoch": 4.32832, "grad_norm": 0.1203553321128352, "learning_rate": 2.1655956192191007e-06, "loss": 0.0588, "loss_nan_ranks": 0, "loss_rank_avg": 0.02352827787399292, "step": 4510, "valid_targets_mean": 9005.1, "valid_targets_min": 3201 }, { "epoch": 4.33312, "grad_norm": 0.12717131209745855, "learning_rate": 2.135372773912614e-06, "loss": 0.0583, "loss_nan_ranks": 0, "loss_rank_avg": 0.018232187256217003, "step": 4515, "valid_targets_mean": 8639.8, "valid_targets_min": 4028 }, { "epoch": 4.33792, "grad_norm": 0.12297416080936355, "learning_rate": 2.1053504094311285e-06, "loss": 0.0611, "loss_nan_ranks": 0, "loss_rank_avg": 0.02066735178232193, "step": 4520, "valid_targets_mean": 8406.8, "valid_targets_min": 2310 }, { "epoch": 4.34272, "grad_norm": 0.11408264364981706, "learning_rate": 2.0755288626923022e-06, "loss": 0.0609, "loss_nan_ranks": 0, "loss_rank_avg": 0.016809195280075073, "step": 4525, "valid_targets_mean": 8664.7, "valid_targets_min": 2680 }, { "epoch": 4.34752, "grad_norm": 0.11366877193389748, "learning_rate": 2.0459084683601736e-06, "loss": 0.0587, "loss_nan_ranks": 0, "loss_rank_avg": 0.018915891647338867, "step": 4530, "valid_targets_mean": 9101.0, "valid_targets_min": 4064 }, { "epoch": 4.35232, "grad_norm": 0.11780725593526946, "learning_rate": 2.0164895588414037e-06, "loss": 0.0573, "loss_nan_ranks": 0, "loss_rank_avg": 0.02268713340163231, "step": 4535, "valid_targets_mean": 9264.6, "valid_targets_min": 2587 }, { "epoch": 4.35712, "grad_norm": 0.11864430396627579, "learning_rate": 1.987272464281551e-06, "loss": 0.0595, "loss_nan_ranks": 0, "loss_rank_avg": 0.01781759038567543, "step": 4540, "valid_targets_mean": 8280.8, "valid_targets_min": 2616 }, { "epoch": 4.36192, "grad_norm": 0.12342667279516402, "learning_rate": 1.95825751256135e-06, "loss": 0.0603, "loss_nan_ranks": 0, "loss_rank_avg": 0.021349921822547913, "step": 4545, "valid_targets_mean": 7914.7, "valid_targets_min": 4779 }, { "epoch": 4.36672, "grad_norm": 0.12657913615634134, "learning_rate": 1.9294450292930576e-06, "loss": 0.0614, "loss_nan_ranks": 0, "loss_rank_avg": 0.02445283532142639, "step": 4550, "valid_targets_mean": 8156.9, "valid_targets_min": 3044 }, { "epoch": 4.37152, "grad_norm": 0.11859983603277927, "learning_rate": 1.9008353378167755e-06, "loss": 0.0589, "loss_nan_ranks": 0, "loss_rank_avg": 0.022507328540086746, "step": 4555, "valid_targets_mean": 9130.3, "valid_targets_min": 4855 }, { "epoch": 4.37632, "grad_norm": 0.11788766940094339, "learning_rate": 1.8724287591968294e-06, "loss": 0.0601, "loss_nan_ranks": 0, "loss_rank_avg": 0.022499315440654755, "step": 4560, "valid_targets_mean": 8801.2, "valid_targets_min": 4940 }, { "epoch": 4.38112, "grad_norm": 0.11786646314018358, "learning_rate": 1.8442256122181735e-06, "loss": 0.0597, "loss_nan_ranks": 0, "loss_rank_avg": 0.027995608747005463, "step": 4565, "valid_targets_mean": 8043.8, "valid_targets_min": 3907 }, { "epoch": 4.38592, "grad_norm": 0.11870348032090175, "learning_rate": 1.8162262133828013e-06, "loss": 0.0605, "loss_nan_ranks": 0, "loss_rank_avg": 0.01562669314444065, "step": 4570, "valid_targets_mean": 8143.3, "valid_targets_min": 2952 }, { "epoch": 4.39072, "grad_norm": 0.11550723988467981, "learning_rate": 1.7884308769061974e-06, "loss": 0.06, "loss_nan_ranks": 0, "loss_rank_avg": 0.017535259947180748, "step": 4575, "valid_targets_mean": 8207.1, "valid_targets_min": 1407 }, { "epoch": 4.39552, "grad_norm": 0.12858179033167436, "learning_rate": 1.7608399147138278e-06, "loss": 0.0606, "loss_nan_ranks": 0, "loss_rank_avg": 0.021043431013822556, "step": 4580, "valid_targets_mean": 9255.1, "valid_targets_min": 5243 }, { "epoch": 4.40032, "grad_norm": 0.12484115877372373, "learning_rate": 1.7334536364376075e-06, "loss": 0.0609, "loss_nan_ranks": 0, "loss_rank_avg": 0.01975128799676895, "step": 4585, "valid_targets_mean": 8706.5, "valid_targets_min": 3138 }, { "epoch": 4.40512, "grad_norm": 0.11517365050643107, "learning_rate": 1.7062723494124545e-06, "loss": 0.0573, "loss_nan_ranks": 0, "loss_rank_avg": 0.0198981910943985, "step": 4590, "valid_targets_mean": 8627.3, "valid_targets_min": 2762 }, { "epoch": 4.40992, "grad_norm": 0.12275506403955044, "learning_rate": 1.6792963586728195e-06, "loss": 0.0585, "loss_nan_ranks": 0, "loss_rank_avg": 0.02215822972357273, "step": 4595, "valid_targets_mean": 8069.7, "valid_targets_min": 2209 }, { "epoch": 4.41472, "grad_norm": 0.12581924286742757, "learning_rate": 1.6525259669492832e-06, "loss": 0.0615, "loss_nan_ranks": 0, "loss_rank_avg": 0.014441033825278282, "step": 4600, "valid_targets_mean": 8204.5, "valid_targets_min": 2901 }, { "epoch": 4.41952, "grad_norm": 0.11581290951072448, "learning_rate": 1.6259614746651364e-06, "loss": 0.059, "loss_nan_ranks": 0, "loss_rank_avg": 0.02150608040392399, "step": 4605, "valid_targets_mean": 9324.2, "valid_targets_min": 2902 }, { "epoch": 4.42432, "grad_norm": 0.1170339216117605, "learning_rate": 1.5996031799330315e-06, "loss": 0.0594, "loss_nan_ranks": 0, "loss_rank_avg": 0.020407576113939285, "step": 4610, "valid_targets_mean": 9710.2, "valid_targets_min": 6487 }, { "epoch": 4.42912, "grad_norm": 0.12174555375272791, "learning_rate": 1.5734513785516227e-06, "loss": 0.0601, "loss_nan_ranks": 0, "loss_rank_avg": 0.023040469735860825, "step": 4615, "valid_targets_mean": 8550.7, "valid_targets_min": 3146 }, { "epoch": 4.43392, "grad_norm": 0.11719954446471759, "learning_rate": 1.5475063640022425e-06, "loss": 0.0565, "loss_nan_ranks": 0, "loss_rank_avg": 0.021581973880529404, "step": 4620, "valid_targets_mean": 8845.3, "valid_targets_min": 3193 }, { "epoch": 4.43872, "grad_norm": 0.12444180899873919, "learning_rate": 1.5217684274456314e-06, "loss": 0.0607, "loss_nan_ranks": 0, "loss_rank_avg": 0.02068684622645378, "step": 4625, "valid_targets_mean": 8613.9, "valid_targets_min": 2223 }, { "epoch": 4.44352, "grad_norm": 0.11633434401162951, "learning_rate": 1.496237857718641e-06, "loss": 0.0557, "loss_nan_ranks": 0, "loss_rank_avg": 0.020495615899562836, "step": 4630, "valid_targets_mean": 9103.2, "valid_targets_min": 3690 }, { "epoch": 4.44832, "grad_norm": 0.11590364344133595, "learning_rate": 1.4709149413310076e-06, "loss": 0.0582, "loss_nan_ranks": 0, "loss_rank_avg": 0.020342785865068436, "step": 4635, "valid_targets_mean": 8995.2, "valid_targets_min": 3398 }, { "epoch": 4.45312, "grad_norm": 0.12329134950235973, "learning_rate": 1.445799962462142e-06, "loss": 0.0599, "loss_nan_ranks": 0, "loss_rank_avg": 0.023403488099575043, "step": 4640, "valid_targets_mean": 9009.5, "valid_targets_min": 2608 }, { "epoch": 4.45792, "grad_norm": 0.11404195513457407, "learning_rate": 1.420893202957927e-06, "loss": 0.0611, "loss_nan_ranks": 0, "loss_rank_avg": 0.0181783065199852, "step": 4645, "valid_targets_mean": 8686.3, "valid_targets_min": 5259 }, { "epoch": 4.46272, "grad_norm": 0.11754587410173165, "learning_rate": 1.3961949423275622e-06, "loss": 0.0595, "loss_nan_ranks": 0, "loss_rank_avg": 0.016123849898576736, "step": 4650, "valid_targets_mean": 9019.9, "valid_targets_min": 4229 }, { "epoch": 4.46752, "grad_norm": 0.11564141223039769, "learning_rate": 1.3717054577404331e-06, "loss": 0.06, "loss_nan_ranks": 0, "loss_rank_avg": 0.01637781225144863, "step": 4655, "valid_targets_mean": 8115.4, "valid_targets_min": 2226 }, { "epoch": 4.47232, "grad_norm": 0.1198827197232521, "learning_rate": 1.347425024022988e-06, "loss": 0.0608, "loss_nan_ranks": 0, "loss_rank_avg": 0.0225857961922884, "step": 4660, "valid_targets_mean": 9256.1, "valid_targets_min": 2916 }, { "epoch": 4.47712, "grad_norm": 0.12018530901808909, "learning_rate": 1.3233539136556606e-06, "loss": 0.0573, "loss_nan_ranks": 0, "loss_rank_avg": 0.021104391664266586, "step": 4665, "valid_targets_mean": 8460.7, "valid_targets_min": 4730 }, { "epoch": 4.48192, "grad_norm": 0.11519884136211274, "learning_rate": 1.2994923967698125e-06, "loss": 0.0586, "loss_nan_ranks": 0, "loss_rank_avg": 0.018374186009168625, "step": 4670, "valid_targets_mean": 8961.7, "valid_targets_min": 1893 }, { "epoch": 4.48672, "grad_norm": 0.11839023097383723, "learning_rate": 1.2758407411446982e-06, "loss": 0.0571, "loss_nan_ranks": 0, "loss_rank_avg": 0.01913219690322876, "step": 4675, "valid_targets_mean": 8664.0, "valid_targets_min": 3331 }, { "epoch": 4.49152, "grad_norm": 0.11419982429935628, "learning_rate": 1.252399212204467e-06, "loss": 0.0584, "loss_nan_ranks": 0, "loss_rank_avg": 0.0173068605363369, "step": 4680, "valid_targets_mean": 9348.1, "valid_targets_min": 4816 }, { "epoch": 4.49632, "grad_norm": 0.11701309750429871, "learning_rate": 1.22916807301517e-06, "loss": 0.0579, "loss_nan_ranks": 0, "loss_rank_avg": 0.01966226100921631, "step": 4685, "valid_targets_mean": 8759.7, "valid_targets_min": 2106 }, { "epoch": 4.50112, "grad_norm": 0.12539881289660457, "learning_rate": 1.2061475842818337e-06, "loss": 0.0599, "loss_nan_ranks": 0, "loss_rank_avg": 0.023415343835949898, "step": 4690, "valid_targets_mean": 8409.9, "valid_targets_min": 3145 }, { "epoch": 4.50592, "grad_norm": 0.12883054072840242, "learning_rate": 1.1833380043455e-06, "loss": 0.0573, "loss_nan_ranks": 0, "loss_rank_avg": 0.022276621311903, "step": 4695, "valid_targets_mean": 8735.2, "valid_targets_min": 2713 }, { "epoch": 4.51072, "grad_norm": 0.11870029933701683, "learning_rate": 1.1607395891803641e-06, "loss": 0.0585, "loss_nan_ranks": 0, "loss_rank_avg": 0.018026743084192276, "step": 4700, "valid_targets_mean": 8477.8, "valid_targets_min": 2119 }, { "epoch": 4.51552, "grad_norm": 0.12926973339646206, "learning_rate": 1.1383525923908678e-06, "loss": 0.0588, "loss_nan_ranks": 0, "loss_rank_avg": 0.021603520959615707, "step": 4705, "valid_targets_mean": 8258.6, "valid_targets_min": 1976 }, { "epoch": 4.52032, "grad_norm": 0.1252253936787309, "learning_rate": 1.1161772652088775e-06, "loss": 0.0608, "loss_nan_ranks": 0, "loss_rank_avg": 0.022924084216356277, "step": 4710, "valid_targets_mean": 9499.5, "valid_targets_min": 5268 }, { "epoch": 4.52512, "grad_norm": 0.11418574330977625, "learning_rate": 1.094213856490849e-06, "loss": 0.0595, "loss_nan_ranks": 0, "loss_rank_avg": 0.01998257264494896, "step": 4715, "valid_targets_mean": 8799.8, "valid_targets_min": 2185 }, { "epoch": 4.52992, "grad_norm": 0.11970402415901457, "learning_rate": 1.0724626127150462e-06, "loss": 0.0592, "loss_nan_ranks": 0, "loss_rank_avg": 0.021041162312030792, "step": 4720, "valid_targets_mean": 9400.4, "valid_targets_min": 3753 }, { "epoch": 4.53472, "grad_norm": 0.12487355432604856, "learning_rate": 1.0509237779787717e-06, "loss": 0.0551, "loss_nan_ranks": 0, "loss_rank_avg": 0.020584046840667725, "step": 4725, "valid_targets_mean": 8329.1, "valid_targets_min": 2687 }, { "epoch": 4.5395199999999996, "grad_norm": 0.1162808601114574, "learning_rate": 1.029597593995626e-06, "loss": 0.0613, "loss_nan_ranks": 0, "loss_rank_avg": 0.017470069229602814, "step": 4730, "valid_targets_mean": 8599.2, "valid_targets_min": 2352 }, { "epoch": 4.54432, "grad_norm": 0.11243973717046013, "learning_rate": 1.008484300092798e-06, "loss": 0.0576, "loss_nan_ranks": 0, "loss_rank_avg": 0.01999412477016449, "step": 4735, "valid_targets_mean": 10049.0, "valid_targets_min": 3022 }, { "epoch": 4.54912, "grad_norm": 0.12376778314874719, "learning_rate": 9.87584133208368e-07, "loss": 0.0615, "loss_nan_ranks": 0, "loss_rank_avg": 0.02172812819480896, "step": 4740, "valid_targets_mean": 8882.0, "valid_targets_min": 3163 }, { "epoch": 4.55392, "grad_norm": 0.11754286609015283, "learning_rate": 9.66897327888665e-07, "loss": 0.0582, "loss_nan_ranks": 0, "loss_rank_avg": 0.01753995195031166, "step": 4745, "valid_targets_mean": 8957.7, "valid_targets_min": 2101 }, { "epoch": 4.55872, "grad_norm": 0.12288692811727639, "learning_rate": 9.464241162856269e-07, "loss": 0.0598, "loss_nan_ranks": 0, "loss_rank_avg": 0.022371970117092133, "step": 4750, "valid_targets_mean": 9342.5, "valid_targets_min": 3010 }, { "epoch": 4.5635200000000005, "grad_norm": 0.12193809956698538, "learning_rate": 9.261647281541908e-07, "loss": 0.0605, "loss_nan_ranks": 0, "loss_rank_avg": 0.019677281379699707, "step": 4755, "valid_targets_mean": 8768.8, "valid_targets_min": 2073 }, { "epoch": 4.56832, "grad_norm": 0.1179844087692095, "learning_rate": 9.061193908497201e-07, "loss": 0.0588, "loss_nan_ranks": 0, "loss_rank_avg": 0.02046424336731434, "step": 4760, "valid_targets_mean": 8664.7, "valid_targets_min": 2635 }, { "epoch": 4.57312, "grad_norm": 0.128157116339437, "learning_rate": 8.862883293254598e-07, "loss": 0.0578, "loss_nan_ranks": 0, "loss_rank_avg": 0.022372746840119362, "step": 4765, "valid_targets_mean": 9003.5, "valid_targets_min": 2891 }, { "epoch": 4.57792, "grad_norm": 0.11544338584988456, "learning_rate": 8.666717661299917e-07, "loss": 0.059, "loss_nan_ranks": 0, "loss_rank_avg": 0.015689603984355927, "step": 4770, "valid_targets_mean": 7997.3, "valid_targets_min": 1727 }, { "epoch": 4.58272, "grad_norm": 0.12217872408661101, "learning_rate": 8.472699214047652e-07, "loss": 0.0614, "loss_nan_ranks": 0, "loss_rank_avg": 0.022685006260871887, "step": 4775, "valid_targets_mean": 8804.0, "valid_targets_min": 4118 }, { "epoch": 4.58752, "grad_norm": 0.12274599705948007, "learning_rate": 8.280830128815953e-07, "loss": 0.0616, "loss_nan_ranks": 0, "loss_rank_avg": 0.01906590908765793, "step": 4780, "valid_targets_mean": 9177.7, "valid_targets_min": 3296 }, { "epoch": 4.59232, "grad_norm": 0.13080453191813954, "learning_rate": 8.09111255880246e-07, "loss": 0.0607, "loss_nan_ranks": 0, "loss_rank_avg": 0.018022168427705765, "step": 4785, "valid_targets_mean": 8568.4, "valid_targets_min": 3204 }, { "epoch": 4.59712, "grad_norm": 0.11609891660815055, "learning_rate": 7.903548633059955e-07, "loss": 0.0594, "loss_nan_ranks": 0, "loss_rank_avg": 0.015199240297079086, "step": 4790, "valid_targets_mean": 9195.6, "valid_targets_min": 4123 }, { "epoch": 4.60192, "grad_norm": 0.11296055178630578, "learning_rate": 7.718140456472612e-07, "loss": 0.0579, "loss_nan_ranks": 0, "loss_rank_avg": 0.019392728805541992, "step": 4795, "valid_targets_mean": 10019.9, "valid_targets_min": 2701 }, { "epoch": 4.60672, "grad_norm": 0.11439403685364499, "learning_rate": 7.534890109732229e-07, "loss": 0.0591, "loss_nan_ranks": 0, "loss_rank_avg": 0.020609967410564423, "step": 4800, "valid_targets_mean": 9014.2, "valid_targets_min": 1364 }, { "epoch": 4.61152, "grad_norm": 0.1327213756348675, "learning_rate": 7.353799649315085e-07, "loss": 0.0458, "loss_nan_ranks": 0, "loss_rank_avg": 0.019029157236218452, "step": 4805, "valid_targets_mean": 9159.7, "valid_targets_min": 3538 }, { "epoch": 4.61632, "grad_norm": 0.1306512860306434, "learning_rate": 7.174871107458603e-07, "loss": 0.0445, "loss_nan_ranks": 0, "loss_rank_avg": 0.013268783688545227, "step": 4810, "valid_targets_mean": 8492.3, "valid_targets_min": 2660 }, { "epoch": 4.62112, "grad_norm": 0.12316003257913177, "learning_rate": 6.998106492138724e-07, "loss": 0.0445, "loss_nan_ranks": 0, "loss_rank_avg": 0.016152355819940567, "step": 4815, "valid_targets_mean": 9058.9, "valid_targets_min": 4044 }, { "epoch": 4.62592, "grad_norm": 0.13208488394402484, "learning_rate": 6.823507787047346e-07, "loss": 0.0472, "loss_nan_ranks": 0, "loss_rank_avg": 0.01765730045735836, "step": 4820, "valid_targets_mean": 9080.8, "valid_targets_min": 1329 }, { "epoch": 4.63072, "grad_norm": 0.12845900831200494, "learning_rate": 6.65107695156999e-07, "loss": 0.0478, "loss_nan_ranks": 0, "loss_rank_avg": 0.019706537947058678, "step": 4825, "valid_targets_mean": 8834.9, "valid_targets_min": 2746 }, { "epoch": 4.63552, "grad_norm": 0.12699103671556508, "learning_rate": 6.480815920763905e-07, "loss": 0.0469, "loss_nan_ranks": 0, "loss_rank_avg": 0.015223637223243713, "step": 4830, "valid_targets_mean": 8278.7, "valid_targets_min": 2883 }, { "epoch": 4.64032, "grad_norm": 0.13082167598049418, "learning_rate": 6.312726605336306e-07, "loss": 0.0483, "loss_nan_ranks": 0, "loss_rank_avg": 0.01759178563952446, "step": 4835, "valid_targets_mean": 8804.4, "valid_targets_min": 1917 }, { "epoch": 4.64512, "grad_norm": 0.11954497001490652, "learning_rate": 6.146810891622923e-07, "loss": 0.0468, "loss_nan_ranks": 0, "loss_rank_avg": 0.016691675409674644, "step": 4840, "valid_targets_mean": 9112.6, "valid_targets_min": 2572 }, { "epoch": 4.64992, "grad_norm": 0.12299775936346398, "learning_rate": 5.983070641566802e-07, "loss": 0.0479, "loss_nan_ranks": 0, "loss_rank_avg": 0.01542404480278492, "step": 4845, "valid_targets_mean": 9376.9, "valid_targets_min": 4022 }, { "epoch": 4.65472, "grad_norm": 0.12357084213291525, "learning_rate": 5.821507692697537e-07, "loss": 0.0481, "loss_nan_ranks": 0, "loss_rank_avg": 0.016300935298204422, "step": 4850, "valid_targets_mean": 8835.5, "valid_targets_min": 2927 }, { "epoch": 4.65952, "grad_norm": 0.11639361498636804, "learning_rate": 5.662123858110513e-07, "loss": 0.0453, "loss_nan_ranks": 0, "loss_rank_avg": 0.012974596582353115, "step": 4855, "valid_targets_mean": 9376.3, "valid_targets_min": 4422 }, { "epoch": 4.66432, "grad_norm": 0.1973531314250708, "learning_rate": 5.504920926446611e-07, "loss": 0.0429, "loss_nan_ranks": 0, "loss_rank_avg": 0.014859823510050774, "step": 4860, "valid_targets_mean": 9044.0, "valid_targets_min": 2028 }, { "epoch": 4.66912, "grad_norm": 0.12053965390150939, "learning_rate": 5.349900661872132e-07, "loss": 0.0435, "loss_nan_ranks": 0, "loss_rank_avg": 0.013551025651395321, "step": 4865, "valid_targets_mean": 8233.1, "valid_targets_min": 2519 }, { "epoch": 4.67392, "grad_norm": 0.13237236041105185, "learning_rate": 5.197064804058971e-07, "loss": 0.0455, "loss_nan_ranks": 0, "loss_rank_avg": 0.015264524146914482, "step": 4870, "valid_targets_mean": 8967.7, "valid_targets_min": 4346 }, { "epoch": 4.67872, "grad_norm": 0.12851803325820077, "learning_rate": 5.046415068165234e-07, "loss": 0.0435, "loss_nan_ranks": 0, "loss_rank_avg": 0.01638580672442913, "step": 4875, "valid_targets_mean": 8687.0, "valid_targets_min": 1807 }, { "epoch": 4.68352, "grad_norm": 0.12984651854096851, "learning_rate": 4.897953144815759e-07, "loss": 0.0443, "loss_nan_ranks": 0, "loss_rank_avg": 0.013979455456137657, "step": 4880, "valid_targets_mean": 8094.6, "valid_targets_min": 3964 }, { "epoch": 4.68832, "grad_norm": 0.12218670654596375, "learning_rate": 4.7516807000833165e-07, "loss": 0.0473, "loss_nan_ranks": 0, "loss_rank_avg": 0.014194248244166374, "step": 4885, "valid_targets_mean": 8910.1, "valid_targets_min": 4014 }, { "epoch": 4.69312, "grad_norm": 0.13244930235944974, "learning_rate": 4.6075993754698623e-07, "loss": 0.0474, "loss_nan_ranks": 0, "loss_rank_avg": 0.017760399729013443, "step": 4890, "valid_targets_mean": 8803.0, "valid_targets_min": 2878 }, { "epoch": 4.69792, "grad_norm": 0.12159738107311469, "learning_rate": 4.4657107878881113e-07, "loss": 0.0457, "loss_nan_ranks": 0, "loss_rank_avg": 0.01536801178008318, "step": 4895, "valid_targets_mean": 8669.1, "valid_targets_min": 2293 }, { "epoch": 4.70272, "grad_norm": 0.13108853234312876, "learning_rate": 4.326016529643351e-07, "loss": 0.0448, "loss_nan_ranks": 0, "loss_rank_avg": 0.015306061133742332, "step": 4900, "valid_targets_mean": 8503.5, "valid_targets_min": 1683 }, { "epoch": 4.70752, "grad_norm": 0.128634595478892, "learning_rate": 4.1885181684157005e-07, "loss": 0.0475, "loss_nan_ranks": 0, "loss_rank_avg": 0.018076792359352112, "step": 4905, "valid_targets_mean": 8681.2, "valid_targets_min": 3721 }, { "epoch": 4.71232, "grad_norm": 0.12249409189586784, "learning_rate": 4.053217247242369e-07, "loss": 0.0446, "loss_nan_ranks": 0, "loss_rank_avg": 0.015645861625671387, "step": 4910, "valid_targets_mean": 9035.6, "valid_targets_min": 2773 }, { "epoch": 4.7171199999999995, "grad_norm": 0.13008375294057498, "learning_rate": 3.9201152845004476e-07, "loss": 0.0444, "loss_nan_ranks": 0, "loss_rank_avg": 0.014394369907677174, "step": 4915, "valid_targets_mean": 8486.8, "valid_targets_min": 2407 }, { "epoch": 4.72192, "grad_norm": 0.12484127400367312, "learning_rate": 3.789213773889744e-07, "loss": 0.0435, "loss_nan_ranks": 0, "loss_rank_avg": 0.016258973628282547, "step": 4920, "valid_targets_mean": 9018.9, "valid_targets_min": 1964 }, { "epoch": 4.72672, "grad_norm": 0.12298816364049474, "learning_rate": 3.6605141844162417e-07, "loss": 0.0416, "loss_nan_ranks": 0, "loss_rank_avg": 0.01498118694871664, "step": 4925, "valid_targets_mean": 8734.2, "valid_targets_min": 2137 }, { "epoch": 4.73152, "grad_norm": 0.12495538982194321, "learning_rate": 3.5340179603753354e-07, "loss": 0.0456, "loss_nan_ranks": 0, "loss_rank_avg": 0.01642123982310295, "step": 4930, "valid_targets_mean": 8728.7, "valid_targets_min": 1857 }, { "epoch": 4.73632, "grad_norm": 0.12397318336703354, "learning_rate": 3.4097265213358435e-07, "loss": 0.043, "loss_nan_ranks": 0, "loss_rank_avg": 0.013172818347811699, "step": 4935, "valid_targets_mean": 8926.8, "valid_targets_min": 3677 }, { "epoch": 4.7411200000000004, "grad_norm": 0.13443930370760981, "learning_rate": 3.287641262123975e-07, "loss": 0.0459, "loss_nan_ranks": 0, "loss_rank_avg": 0.016371993348002434, "step": 4940, "valid_targets_mean": 8540.3, "valid_targets_min": 1162 }, { "epoch": 4.74592, "grad_norm": 0.12803940564558636, "learning_rate": 3.1677635528076566e-07, "loss": 0.0445, "loss_nan_ranks": 0, "loss_rank_avg": 0.011617720127105713, "step": 4945, "valid_targets_mean": 9372.5, "valid_targets_min": 1983 }, { "epoch": 4.75072, "grad_norm": 0.1306802799160656, "learning_rate": 3.0500947386812973e-07, "loss": 0.0465, "loss_nan_ranks": 0, "loss_rank_avg": 0.014903305098414421, "step": 4950, "valid_targets_mean": 8770.1, "valid_targets_min": 2285 }, { "epoch": 4.75552, "grad_norm": 0.12387300110011946, "learning_rate": 2.934636140250513e-07, "loss": 0.0436, "loss_nan_ranks": 0, "loss_rank_avg": 0.012026086449623108, "step": 4955, "valid_targets_mean": 8344.1, "valid_targets_min": 2375 }, { "epoch": 4.76032, "grad_norm": 0.20661769231404678, "learning_rate": 2.821389053217383e-07, "loss": 0.0432, "loss_nan_ranks": 0, "loss_rank_avg": 0.014603785239160061, "step": 4960, "valid_targets_mean": 8906.2, "valid_targets_min": 2707 }, { "epoch": 4.76512, "grad_norm": 0.12591591545112674, "learning_rate": 2.710354748465949e-07, "loss": 0.0467, "loss_nan_ranks": 0, "loss_rank_avg": 0.014467072673141956, "step": 4965, "valid_targets_mean": 8309.1, "valid_targets_min": 1618 }, { "epoch": 4.76992, "grad_norm": 0.12713363799656874, "learning_rate": 2.6015344720479395e-07, "loss": 0.0455, "loss_nan_ranks": 0, "loss_rank_avg": 0.01415165513753891, "step": 4970, "valid_targets_mean": 8002.9, "valid_targets_min": 2313 }, { "epoch": 4.77472, "grad_norm": 0.12508628958334017, "learning_rate": 2.49492944516867e-07, "loss": 0.0476, "loss_nan_ranks": 0, "loss_rank_avg": 0.013956809416413307, "step": 4975, "valid_targets_mean": 7795.5, "valid_targets_min": 2816 }, { "epoch": 4.77952, "grad_norm": 0.1226101397357892, "learning_rate": 2.3905408641735183e-07, "loss": 0.0444, "loss_nan_ranks": 0, "loss_rank_avg": 0.0149923637509346, "step": 4980, "valid_targets_mean": 8852.8, "valid_targets_min": 3019 }, { "epoch": 4.78432, "grad_norm": 0.12517540140245537, "learning_rate": 2.288369900534404e-07, "loss": 0.0452, "loss_nan_ranks": 0, "loss_rank_avg": 0.011800020933151245, "step": 4985, "valid_targets_mean": 7697.3, "valid_targets_min": 3225 }, { "epoch": 4.7891200000000005, "grad_norm": 0.12617181013082826, "learning_rate": 2.1884177008366203e-07, "loss": 0.0448, "loss_nan_ranks": 0, "loss_rank_avg": 0.01531097013503313, "step": 4990, "valid_targets_mean": 9043.1, "valid_targets_min": 2615 }, { "epoch": 4.79392, "grad_norm": 0.13162859126890672, "learning_rate": 2.0906853867660004e-07, "loss": 0.0423, "loss_nan_ranks": 0, "loss_rank_avg": 0.015335047617554665, "step": 4995, "valid_targets_mean": 8755.2, "valid_targets_min": 2833 }, { "epoch": 4.79872, "grad_norm": 0.12921873760362335, "learning_rate": 1.9951740550963493e-07, "loss": 0.0443, "loss_nan_ranks": 0, "loss_rank_avg": 0.013373359106481075, "step": 5000, "valid_targets_mean": 8286.6, "valid_targets_min": 3311 }, { "epoch": 4.80352, "grad_norm": 0.1332690682878744, "learning_rate": 1.9018847776770987e-07, "loss": 0.0453, "loss_nan_ranks": 0, "loss_rank_avg": 0.015984494239091873, "step": 5005, "valid_targets_mean": 8718.6, "valid_targets_min": 2313 }, { "epoch": 4.80832, "grad_norm": 0.119227169078396, "learning_rate": 1.8108186014212935e-07, "loss": 0.0439, "loss_nan_ranks": 0, "loss_rank_avg": 0.01700938306748867, "step": 5010, "valid_targets_mean": 10023.7, "valid_targets_min": 5935 }, { "epoch": 4.81312, "grad_norm": 0.12005952635161173, "learning_rate": 1.7219765482938465e-07, "loss": 0.044, "loss_nan_ranks": 0, "loss_rank_avg": 0.011994611471891403, "step": 5015, "valid_targets_mean": 8354.2, "valid_targets_min": 1889 }, { "epoch": 4.81792, "grad_norm": 0.1257252009191287, "learning_rate": 1.635359615300036e-07, "loss": 0.0476, "loss_nan_ranks": 0, "loss_rank_avg": 0.013933985494077206, "step": 5020, "valid_targets_mean": 9395.4, "valid_targets_min": 2543 }, { "epoch": 4.82272, "grad_norm": 0.13135638987722986, "learning_rate": 1.5509687744744262e-07, "loss": 0.0456, "loss_nan_ranks": 0, "loss_rank_avg": 0.018428293988108635, "step": 5025, "valid_targets_mean": 9299.7, "valid_targets_min": 3480 }, { "epoch": 4.82752, "grad_norm": 0.11986507904934081, "learning_rate": 1.468804972869786e-07, "loss": 0.0464, "loss_nan_ranks": 0, "loss_rank_avg": 0.013786360621452332, "step": 5030, "valid_targets_mean": 8602.0, "valid_targets_min": 4552 }, { "epoch": 4.83232, "grad_norm": 0.12665116588140998, "learning_rate": 1.3888691325465886e-07, "loss": 0.0463, "loss_nan_ranks": 0, "loss_rank_avg": 0.017422419041395187, "step": 5035, "valid_targets_mean": 8720.6, "valid_targets_min": 3791 }, { "epoch": 4.83712, "grad_norm": 0.13342700487132997, "learning_rate": 1.3111621505626616e-07, "loss": 0.0466, "loss_nan_ranks": 0, "loss_rank_avg": 0.016414277255535126, "step": 5040, "valid_targets_mean": 9144.7, "valid_targets_min": 1516 }, { "epoch": 4.84192, "grad_norm": 0.12412199123426582, "learning_rate": 1.235684898963041e-07, "loss": 0.0428, "loss_nan_ranks": 0, "loss_rank_avg": 0.015540607273578644, "step": 5045, "valid_targets_mean": 8555.7, "valid_targets_min": 2332 }, { "epoch": 4.84672, "grad_norm": 0.12302925116599557, "learning_rate": 1.1624382247702681e-07, "loss": 0.0467, "loss_nan_ranks": 0, "loss_rank_avg": 0.014546379446983337, "step": 5050, "valid_targets_mean": 9193.9, "valid_targets_min": 2994 }, { "epoch": 4.85152, "grad_norm": 0.12049454142383617, "learning_rate": 1.0914229499748186e-07, "loss": 0.0461, "loss_nan_ranks": 0, "loss_rank_avg": 0.01593470387160778, "step": 5055, "valid_targets_mean": 7931.0, "valid_targets_min": 2226 }, { "epoch": 4.85632, "grad_norm": 0.12255879374376923, "learning_rate": 1.0226398715259322e-07, "loss": 0.0431, "loss_nan_ranks": 0, "loss_rank_avg": 0.014736687764525414, "step": 5060, "valid_targets_mean": 9324.5, "valid_targets_min": 2369 }, { "epoch": 4.86112, "grad_norm": 0.11765425870521874, "learning_rate": 9.560897613226205e-08, "loss": 0.0467, "loss_nan_ranks": 0, "loss_rank_avg": 0.013002576306462288, "step": 5065, "valid_targets_mean": 8633.2, "valid_targets_min": 3927 }, { "epoch": 4.86592, "grad_norm": 0.1274053457419819, "learning_rate": 8.917733662050287e-08, "loss": 0.0451, "loss_nan_ranks": 0, "loss_rank_avg": 0.016446460038423538, "step": 5070, "valid_targets_mean": 9135.6, "valid_targets_min": 4543 }, { "epoch": 4.87072, "grad_norm": 0.1278704051137457, "learning_rate": 8.296914079461094e-08, "loss": 0.0453, "loss_nan_ranks": 0, "loss_rank_avg": 0.018057048320770264, "step": 5075, "valid_targets_mean": 8849.5, "valid_targets_min": 2853 }, { "epoch": 4.87552, "grad_norm": 0.129798463098386, "learning_rate": 7.698445832433843e-08, "loss": 0.0475, "loss_nan_ranks": 0, "loss_rank_avg": 0.01605452410876751, "step": 5080, "valid_targets_mean": 9165.0, "valid_targets_min": 4097 }, { "epoch": 4.88032, "grad_norm": 0.12709516254412107, "learning_rate": 7.122335637112621e-08, "loss": 0.0465, "loss_nan_ranks": 0, "loss_rank_avg": 0.017007878050208092, "step": 5085, "valid_targets_mean": 8871.7, "valid_targets_min": 4935 }, { "epoch": 4.88512, "grad_norm": 0.12614752472781804, "learning_rate": 6.568589958734218e-08, "loss": 0.0467, "loss_nan_ranks": 0, "loss_rank_avg": 0.015092524699866772, "step": 5090, "valid_targets_mean": 8470.4, "valid_targets_min": 3363 }, { "epoch": 4.88992, "grad_norm": 0.1923253876332768, "learning_rate": 6.037215011556185e-08, "loss": 0.0454, "loss_nan_ranks": 0, "loss_rank_avg": 0.017001967877149582, "step": 5095, "valid_targets_mean": 8674.8, "valid_targets_min": 2585 }, { "epoch": 4.8947199999999995, "grad_norm": 0.11983896174408, "learning_rate": 5.5282167587862314e-08, "loss": 0.0454, "loss_nan_ranks": 0, "loss_rank_avg": 0.01640951633453369, "step": 5100, "valid_targets_mean": 8320.3, "valid_targets_min": 802 }, { "epoch": 4.89952, "grad_norm": 0.1245498830155723, "learning_rate": 5.041600912516264e-08, "loss": 0.0499, "loss_nan_ranks": 0, "loss_rank_avg": 0.016499202698469162, "step": 5105, "valid_targets_mean": 8774.8, "valid_targets_min": 1804 }, { "epoch": 4.90432, "grad_norm": 0.12071257658116219, "learning_rate": 4.5773729336577865e-08, "loss": 0.0464, "loss_nan_ranks": 0, "loss_rank_avg": 0.01530368346720934, "step": 5110, "valid_targets_mean": 8999.9, "valid_targets_min": 3408 }, { "epoch": 4.90912, "grad_norm": 0.12289113526900305, "learning_rate": 4.1355380318803816e-08, "loss": 0.0473, "loss_nan_ranks": 0, "loss_rank_avg": 0.014382155612111092, "step": 5115, "valid_targets_mean": 7970.6, "valid_targets_min": 1619 }, { "epoch": 4.91392, "grad_norm": 0.12271587443432708, "learning_rate": 3.7161011655535425e-08, "loss": 0.0489, "loss_nan_ranks": 0, "loss_rank_avg": 0.01587647944688797, "step": 5120, "valid_targets_mean": 8968.0, "valid_targets_min": 1910 }, { "epoch": 4.91872, "grad_norm": 0.11789556004029846, "learning_rate": 3.319067041691604e-08, "loss": 0.0458, "loss_nan_ranks": 0, "loss_rank_avg": 0.014570049941539764, "step": 5125, "valid_targets_mean": 8545.9, "valid_targets_min": 1723 }, { "epoch": 4.92352, "grad_norm": 0.11863148816376579, "learning_rate": 2.9444401158995606e-08, "loss": 0.046, "loss_nan_ranks": 0, "loss_rank_avg": 0.014068776741623878, "step": 5130, "valid_targets_mean": 9208.9, "valid_targets_min": 2341 }, { "epoch": 4.92832, "grad_norm": 0.1393289097006946, "learning_rate": 2.5922245923244436e-08, "loss": 0.0451, "loss_nan_ranks": 0, "loss_rank_avg": 0.01812027022242546, "step": 5135, "valid_targets_mean": 8554.4, "valid_targets_min": 2437 }, { "epoch": 4.93312, "grad_norm": 0.12652127402167426, "learning_rate": 2.2624244236071348e-08, "loss": 0.045, "loss_nan_ranks": 0, "loss_rank_avg": 0.01672193594276905, "step": 5140, "valid_targets_mean": 8582.4, "valid_targets_min": 2277 }, { "epoch": 4.93792, "grad_norm": 0.12288190891498557, "learning_rate": 1.9550433108384005e-08, "loss": 0.0462, "loss_nan_ranks": 0, "loss_rank_avg": 0.014536580070853233, "step": 5145, "valid_targets_mean": 8607.1, "valid_targets_min": 2724 }, { "epoch": 4.94272, "grad_norm": 0.12214205725983128, "learning_rate": 1.6700847035180378e-08, "loss": 0.0455, "loss_nan_ranks": 0, "loss_rank_avg": 0.014544010162353516, "step": 5150, "valid_targets_mean": 8026.7, "valid_targets_min": 3201 }, { "epoch": 4.94752, "grad_norm": 0.12608336933895256, "learning_rate": 1.4075517995146837e-08, "loss": 0.0441, "loss_nan_ranks": 0, "loss_rank_avg": 0.015675101429224014, "step": 5155, "valid_targets_mean": 8635.8, "valid_targets_min": 3217 }, { "epoch": 4.95232, "grad_norm": 0.1225680672115912, "learning_rate": 1.167447545031175e-08, "loss": 0.0451, "loss_nan_ranks": 0, "loss_rank_avg": 0.016280420124530792, "step": 5160, "valid_targets_mean": 8837.4, "valid_targets_min": 3252 }, { "epoch": 4.95712, "grad_norm": 0.12286400688787606, "learning_rate": 9.497746345705772e-09, "loss": 0.044, "loss_nan_ranks": 0, "loss_rank_avg": 0.015019871294498444, "step": 5165, "valid_targets_mean": 9391.8, "valid_targets_min": 4096 }, { "epoch": 4.96192, "grad_norm": 0.12859491123299127, "learning_rate": 7.545355109073172e-09, "loss": 0.0494, "loss_nan_ranks": 0, "loss_rank_avg": 0.019673161208629608, "step": 5170, "valid_targets_mean": 9072.6, "valid_targets_min": 3816 }, { "epoch": 4.9667200000000005, "grad_norm": 0.1244229546631015, "learning_rate": 5.817323650578743e-09, "loss": 0.0463, "loss_nan_ranks": 0, "loss_rank_avg": 0.014512769877910614, "step": 5175, "valid_targets_mean": 8819.8, "valid_targets_min": 2984 }, { "epoch": 4.97152, "grad_norm": 0.1281022316707428, "learning_rate": 4.313671362576877e-09, "loss": 0.0445, "loss_nan_ranks": 0, "loss_rank_avg": 0.014761531725525856, "step": 5180, "valid_targets_mean": 7589.6, "valid_targets_min": 2654 }, { "epoch": 4.97632, "grad_norm": 0.12672023643063166, "learning_rate": 3.0344151193917316e-09, "loss": 0.0466, "loss_nan_ranks": 0, "loss_rank_avg": 0.017525404691696167, "step": 5185, "valid_targets_mean": 9014.8, "valid_targets_min": 3080 }, { "epoch": 4.98112, "grad_norm": 0.12136843073730945, "learning_rate": 1.979569277117399e-09, "loss": 0.0457, "loss_nan_ranks": 0, "loss_rank_avg": 0.014057071879506111, "step": 5190, "valid_targets_mean": 8457.4, "valid_targets_min": 3076 }, { "epoch": 4.98592, "grad_norm": 0.12994809873959323, "learning_rate": 1.1491456734713524e-09, "loss": 0.0477, "loss_nan_ranks": 0, "loss_rank_avg": 0.015671029686927795, "step": 5195, "valid_targets_mean": 7887.4, "valid_targets_min": 3187 }, { "epoch": 4.99072, "grad_norm": 0.1298460048267671, "learning_rate": 5.431536276523375e-10, "loss": 0.0449, "loss_nan_ranks": 0, "loss_rank_avg": 0.015169478952884674, "step": 5200, "valid_targets_mean": 8369.0, "valid_targets_min": 2163 }, { "epoch": 4.99552, "grad_norm": 0.12910354490109707, "learning_rate": 1.6159994023601245e-10, "loss": 0.0467, "loss_nan_ranks": 0, "loss_rank_avg": 0.016222694888710976, "step": 5205, "valid_targets_mean": 8800.3, "valid_targets_min": 3409 }, { "epoch": 5.0, "grad_norm": 0.147008087077442, "learning_rate": 4.488893106113779e-12, "loss": 0.0436, "loss_nan_ranks": 0, "loss_rank_avg": 0.018921401351690292, "step": 5210, "valid_targets_mean": 8871.3, "valid_targets_min": 2185 }, { "epoch": 5.0, "loss_nan_ranks": 0, "loss_rank_avg": 0.018921401351690292, "step": 5210, "total_flos": 3.8872733453226344e+19, "train_loss": 0.0035894543761941615, "train_runtime": 12426.1828, "train_samples_per_second": 40.238, "train_steps_per_second": 0.419, "valid_targets_mean": 8871.3, "valid_targets_min": 2185 } ], "logging_steps": 5, "max_steps": 5210, "num_input_tokens_seen": 0, "num_train_epochs": 5, "save_steps": 300, "stateful_callbacks": { "TrainerControl": { "args": { "should_epoch_stop": false, "should_evaluate": false, "should_log": false, "should_save": true, "should_training_stop": true }, "attributes": {} } }, "total_flos": 3.8872733453226344e+19, "train_batch_size": 1, "trial_name": null, "trial_params": null }