Files
coderforge-100000-opt100k__…/trainer_state.json
ModelHub XC 791318bdc1 初始化项目,由ModelHub XC社区提供模型
Model: laion/coderforge-100000-opt100k__Qwen3-8B
Source: Original Platform
2026-05-27 22:32:22 +08:00

11510 lines
311 KiB
JSON

{
"best_global_step": null,
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 5.0,
"eval_steps": 500,
"global_step": 5210,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.0048,
"grad_norm": 9.841835067235065,
"learning_rate": 3.071017274472169e-07,
"loss": 0.4918,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17842981219291687,
"step": 5,
"valid_targets_mean": 9620.0,
"valid_targets_min": 4054
},
{
"epoch": 0.0096,
"grad_norm": 9.037327151868297,
"learning_rate": 6.909788867562381e-07,
"loss": 0.4922,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15718884766101837,
"step": 10,
"valid_targets_mean": 8666.8,
"valid_targets_min": 2206
},
{
"epoch": 0.0144,
"grad_norm": 6.033909463391279,
"learning_rate": 1.074856046065259e-06,
"loss": 0.4709,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15585705637931824,
"step": 15,
"valid_targets_mean": 8733.8,
"valid_targets_min": 4350
},
{
"epoch": 0.0192,
"grad_norm": 3.2861111342090337,
"learning_rate": 1.4587332053742803e-06,
"loss": 0.4312,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14734426140785217,
"step": 20,
"valid_targets_mean": 7922.4,
"valid_targets_min": 1729
},
{
"epoch": 0.024,
"grad_norm": 1.6258530010888506,
"learning_rate": 1.8426103646833015e-06,
"loss": 0.3988,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13337181508541107,
"step": 25,
"valid_targets_mean": 9515.2,
"valid_targets_min": 1791
},
{
"epoch": 0.0288,
"grad_norm": 1.1794986084798527,
"learning_rate": 2.2264875239923228e-06,
"loss": 0.378,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11573775112628937,
"step": 30,
"valid_targets_mean": 8802.9,
"valid_targets_min": 2606
},
{
"epoch": 0.0336,
"grad_norm": 0.7048103409679258,
"learning_rate": 2.6103646833013433e-06,
"loss": 0.3459,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10993142426013947,
"step": 35,
"valid_targets_mean": 8278.6,
"valid_targets_min": 740
},
{
"epoch": 0.0384,
"grad_norm": 0.5264062159110527,
"learning_rate": 2.9942418426103648e-06,
"loss": 0.3263,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10869134962558746,
"step": 40,
"valid_targets_mean": 8495.2,
"valid_targets_min": 2561
},
{
"epoch": 0.0432,
"grad_norm": 0.4514711080116693,
"learning_rate": 3.378119001919386e-06,
"loss": 0.3041,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09915158152580261,
"step": 45,
"valid_targets_mean": 9248.5,
"valid_targets_min": 2873
},
{
"epoch": 0.048,
"grad_norm": 0.3420802729257966,
"learning_rate": 3.761996161228407e-06,
"loss": 0.2802,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09442837536334991,
"step": 50,
"valid_targets_mean": 9355.0,
"valid_targets_min": 1269
},
{
"epoch": 0.0528,
"grad_norm": 0.28683988209383904,
"learning_rate": 4.145873320537428e-06,
"loss": 0.2672,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08352220058441162,
"step": 55,
"valid_targets_mean": 8734.5,
"valid_targets_min": 3777
},
{
"epoch": 0.0576,
"grad_norm": 0.23737129343553093,
"learning_rate": 4.52975047984645e-06,
"loss": 0.2437,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08115425705909729,
"step": 60,
"valid_targets_mean": 9034.8,
"valid_targets_min": 3693
},
{
"epoch": 0.0624,
"grad_norm": 0.19876401961795503,
"learning_rate": 4.91362763915547e-06,
"loss": 0.2241,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07270577549934387,
"step": 65,
"valid_targets_mean": 8782.1,
"valid_targets_min": 4980
},
{
"epoch": 0.0672,
"grad_norm": 0.18075045396174094,
"learning_rate": 5.297504798464492e-06,
"loss": 0.2153,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06922709941864014,
"step": 70,
"valid_targets_mean": 9367.7,
"valid_targets_min": 3471
},
{
"epoch": 0.072,
"grad_norm": 0.16424216569165836,
"learning_rate": 5.681381957773513e-06,
"loss": 0.2064,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07363235950469971,
"step": 75,
"valid_targets_mean": 9389.4,
"valid_targets_min": 4957
},
{
"epoch": 0.0768,
"grad_norm": 0.17072015557944906,
"learning_rate": 6.065259117082534e-06,
"loss": 0.2044,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06568406522274017,
"step": 80,
"valid_targets_mean": 8954.7,
"valid_targets_min": 2729
},
{
"epoch": 0.0816,
"grad_norm": 0.16204494202483938,
"learning_rate": 6.449136276391556e-06,
"loss": 0.1978,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06659156829118729,
"step": 85,
"valid_targets_mean": 8714.0,
"valid_targets_min": 3139
},
{
"epoch": 0.0864,
"grad_norm": 0.16165159991381337,
"learning_rate": 6.833013435700576e-06,
"loss": 0.1898,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05660694092512131,
"step": 90,
"valid_targets_mean": 8498.3,
"valid_targets_min": 2404
},
{
"epoch": 0.0912,
"grad_norm": 0.1560247037025123,
"learning_rate": 7.216890595009598e-06,
"loss": 0.1888,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06358037143945694,
"step": 95,
"valid_targets_mean": 8950.7,
"valid_targets_min": 3809
},
{
"epoch": 0.096,
"grad_norm": 0.1616062884997598,
"learning_rate": 7.600767754318619e-06,
"loss": 0.1875,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06089777871966362,
"step": 100,
"valid_targets_mean": 9242.6,
"valid_targets_min": 5629
},
{
"epoch": 0.1008,
"grad_norm": 0.19586837078411862,
"learning_rate": 7.98464491362764e-06,
"loss": 0.1846,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06420055031776428,
"step": 105,
"valid_targets_mean": 8664.1,
"valid_targets_min": 4408
},
{
"epoch": 0.1056,
"grad_norm": 0.16113724556095765,
"learning_rate": 8.368522072936662e-06,
"loss": 0.177,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06036144495010376,
"step": 110,
"valid_targets_mean": 8733.9,
"valid_targets_min": 1577
},
{
"epoch": 0.1104,
"grad_norm": 0.16110423128629503,
"learning_rate": 8.752399232245682e-06,
"loss": 0.1779,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06447982788085938,
"step": 115,
"valid_targets_mean": 9054.4,
"valid_targets_min": 3944
},
{
"epoch": 0.1152,
"grad_norm": 0.176566106291253,
"learning_rate": 9.136276391554704e-06,
"loss": 0.1761,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.062302470207214355,
"step": 120,
"valid_targets_mean": 9205.4,
"valid_targets_min": 1719
},
{
"epoch": 0.12,
"grad_norm": 0.17059615182231894,
"learning_rate": 9.520153550863724e-06,
"loss": 0.1729,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.058050885796546936,
"step": 125,
"valid_targets_mean": 8502.4,
"valid_targets_min": 3732
},
{
"epoch": 0.1248,
"grad_norm": 0.17066809947335904,
"learning_rate": 9.904030710172746e-06,
"loss": 0.1705,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05489126592874527,
"step": 130,
"valid_targets_mean": 7924.6,
"valid_targets_min": 2935
},
{
"epoch": 0.1296,
"grad_norm": 0.17976768953493777,
"learning_rate": 1.0287907869481766e-05,
"loss": 0.1666,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06662755459547043,
"step": 135,
"valid_targets_mean": 9386.0,
"valid_targets_min": 6181
},
{
"epoch": 0.1344,
"grad_norm": 0.16878851071563028,
"learning_rate": 1.067178502879079e-05,
"loss": 0.164,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05300961434841156,
"step": 140,
"valid_targets_mean": 8530.2,
"valid_targets_min": 4057
},
{
"epoch": 0.1392,
"grad_norm": 0.18017955223205775,
"learning_rate": 1.105566218809981e-05,
"loss": 0.1644,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.052747681736946106,
"step": 145,
"valid_targets_mean": 8150.8,
"valid_targets_min": 1979
},
{
"epoch": 0.144,
"grad_norm": 0.17011201848682178,
"learning_rate": 1.143953934740883e-05,
"loss": 0.1666,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.053786564618349075,
"step": 150,
"valid_targets_mean": 9036.5,
"valid_targets_min": 1344
},
{
"epoch": 0.1488,
"grad_norm": 0.14948621014727742,
"learning_rate": 1.182341650671785e-05,
"loss": 0.1655,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04889284819364548,
"step": 155,
"valid_targets_mean": 9374.1,
"valid_targets_min": 5222
},
{
"epoch": 0.1536,
"grad_norm": 0.17837038997047153,
"learning_rate": 1.2207293666026872e-05,
"loss": 0.1592,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05337853729724884,
"step": 160,
"valid_targets_mean": 9026.4,
"valid_targets_min": 941
},
{
"epoch": 0.1584,
"grad_norm": 0.16794019625060191,
"learning_rate": 1.2591170825335894e-05,
"loss": 0.1615,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0580047108232975,
"step": 165,
"valid_targets_mean": 8909.0,
"valid_targets_min": 4147
},
{
"epoch": 0.1632,
"grad_norm": 0.16451121852700687,
"learning_rate": 1.2975047984644915e-05,
"loss": 0.1615,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05628425255417824,
"step": 170,
"valid_targets_mean": 9237.3,
"valid_targets_min": 2879
},
{
"epoch": 0.168,
"grad_norm": 0.1620845277038851,
"learning_rate": 1.3358925143953936e-05,
"loss": 0.1599,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05485953390598297,
"step": 175,
"valid_targets_mean": 8967.8,
"valid_targets_min": 1950
},
{
"epoch": 0.1728,
"grad_norm": 0.18552111008573974,
"learning_rate": 1.3742802303262956e-05,
"loss": 0.1567,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05156928300857544,
"step": 180,
"valid_targets_mean": 8037.1,
"valid_targets_min": 3591
},
{
"epoch": 0.1776,
"grad_norm": 0.1834362128640418,
"learning_rate": 1.4126679462571978e-05,
"loss": 0.1558,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05930773541331291,
"step": 185,
"valid_targets_mean": 8785.6,
"valid_targets_min": 2286
},
{
"epoch": 0.1824,
"grad_norm": 0.7040750475552785,
"learning_rate": 1.4510556621881e-05,
"loss": 0.155,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05356145650148392,
"step": 190,
"valid_targets_mean": 8743.2,
"valid_targets_min": 3331
},
{
"epoch": 0.1872,
"grad_norm": 0.17845848988906052,
"learning_rate": 1.4894433781190021e-05,
"loss": 0.1566,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.050542086362838745,
"step": 195,
"valid_targets_mean": 8117.4,
"valid_targets_min": 2982
},
{
"epoch": 0.192,
"grad_norm": 0.1646793822772226,
"learning_rate": 1.527831094049904e-05,
"loss": 0.1529,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05630158260464668,
"step": 200,
"valid_targets_mean": 9397.2,
"valid_targets_min": 3908
},
{
"epoch": 0.1968,
"grad_norm": 0.1653369285434222,
"learning_rate": 1.566218809980806e-05,
"loss": 0.1555,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05802737921476364,
"step": 205,
"valid_targets_mean": 9779.3,
"valid_targets_min": 2867
},
{
"epoch": 0.2016,
"grad_norm": 0.17699392141610665,
"learning_rate": 1.6046065259117082e-05,
"loss": 0.1578,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05261120945215225,
"step": 210,
"valid_targets_mean": 8929.7,
"valid_targets_min": 3230
},
{
"epoch": 0.2064,
"grad_norm": 0.15546901424567497,
"learning_rate": 1.6429942418426105e-05,
"loss": 0.1519,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0501735582947731,
"step": 215,
"valid_targets_mean": 9803.3,
"valid_targets_min": 4354
},
{
"epoch": 0.2112,
"grad_norm": 0.1647739852350217,
"learning_rate": 1.6813819577735126e-05,
"loss": 0.1518,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05220291018486023,
"step": 220,
"valid_targets_mean": 8609.9,
"valid_targets_min": 1686
},
{
"epoch": 0.216,
"grad_norm": 0.18923635383897736,
"learning_rate": 1.7197696737044146e-05,
"loss": 0.1524,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05251702666282654,
"step": 225,
"valid_targets_mean": 9155.3,
"valid_targets_min": 2869
},
{
"epoch": 0.2208,
"grad_norm": 0.17077125348550806,
"learning_rate": 1.758157389635317e-05,
"loss": 0.1497,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04130622744560242,
"step": 230,
"valid_targets_mean": 8067.4,
"valid_targets_min": 1355
},
{
"epoch": 0.2256,
"grad_norm": 0.16749430547993427,
"learning_rate": 1.796545105566219e-05,
"loss": 0.1531,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.046884313225746155,
"step": 235,
"valid_targets_mean": 8949.4,
"valid_targets_min": 5015
},
{
"epoch": 0.2304,
"grad_norm": 0.1686236778589441,
"learning_rate": 1.8349328214971213e-05,
"loss": 0.1519,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04728979989886284,
"step": 240,
"valid_targets_mean": 8402.7,
"valid_targets_min": 2024
},
{
"epoch": 0.2352,
"grad_norm": 0.17340081794047488,
"learning_rate": 1.8733205374280233e-05,
"loss": 0.1483,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04933461174368858,
"step": 245,
"valid_targets_mean": 9134.0,
"valid_targets_min": 2863
},
{
"epoch": 0.24,
"grad_norm": 0.18643553683889033,
"learning_rate": 1.9117082533589253e-05,
"loss": 0.1517,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05289412662386894,
"step": 250,
"valid_targets_mean": 9414.7,
"valid_targets_min": 2948
},
{
"epoch": 0.2448,
"grad_norm": 0.16686892259142147,
"learning_rate": 1.9500959692898273e-05,
"loss": 0.1508,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0571310892701149,
"step": 255,
"valid_targets_mean": 9362.2,
"valid_targets_min": 1413
},
{
"epoch": 0.2496,
"grad_norm": 0.16428543489008277,
"learning_rate": 1.9884836852207294e-05,
"loss": 0.1503,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04735701531171799,
"step": 260,
"valid_targets_mean": 8750.2,
"valid_targets_min": 4447
},
{
"epoch": 0.2544,
"grad_norm": 0.1713855287966125,
"learning_rate": 2.0268714011516314e-05,
"loss": 0.1467,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04655732959508896,
"step": 265,
"valid_targets_mean": 8087.2,
"valid_targets_min": 2311
},
{
"epoch": 0.2592,
"grad_norm": 0.16600507062294687,
"learning_rate": 2.0652591170825337e-05,
"loss": 0.1465,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04228595644235611,
"step": 270,
"valid_targets_mean": 8538.3,
"valid_targets_min": 3618
},
{
"epoch": 0.264,
"grad_norm": 0.16203412094758496,
"learning_rate": 2.103646833013436e-05,
"loss": 0.1431,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04873499274253845,
"step": 275,
"valid_targets_mean": 8714.5,
"valid_targets_min": 2308
},
{
"epoch": 0.2688,
"grad_norm": 0.16232368985693238,
"learning_rate": 2.142034548944338e-05,
"loss": 0.1448,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04977979511022568,
"step": 280,
"valid_targets_mean": 7793.4,
"valid_targets_min": 2243
},
{
"epoch": 0.2736,
"grad_norm": 0.16963787072822398,
"learning_rate": 2.18042226487524e-05,
"loss": 0.1444,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04747937619686127,
"step": 285,
"valid_targets_mean": 8890.7,
"valid_targets_min": 3910
},
{
"epoch": 0.2784,
"grad_norm": 0.15596812207408062,
"learning_rate": 2.218809980806142e-05,
"loss": 0.1428,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04897751659154892,
"step": 290,
"valid_targets_mean": 8705.1,
"valid_targets_min": 2007
},
{
"epoch": 0.2832,
"grad_norm": 0.17698628792600066,
"learning_rate": 2.2571976967370445e-05,
"loss": 0.1456,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04906153678894043,
"step": 295,
"valid_targets_mean": 8524.2,
"valid_targets_min": 2711
},
{
"epoch": 0.288,
"grad_norm": 0.15226044506219266,
"learning_rate": 2.2955854126679465e-05,
"loss": 0.1443,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04470205307006836,
"step": 300,
"valid_targets_mean": 9084.5,
"valid_targets_min": 4514
},
{
"epoch": 0.2928,
"grad_norm": 0.1631758341391722,
"learning_rate": 2.3339731285988485e-05,
"loss": 0.1426,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0455140583217144,
"step": 305,
"valid_targets_mean": 8223.5,
"valid_targets_min": 2624
},
{
"epoch": 0.2976,
"grad_norm": 0.16266001506773634,
"learning_rate": 2.372360844529751e-05,
"loss": 0.1407,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04833702743053436,
"step": 310,
"valid_targets_mean": 9030.3,
"valid_targets_min": 2595
},
{
"epoch": 0.3024,
"grad_norm": 0.1552003389279275,
"learning_rate": 2.4107485604606525e-05,
"loss": 0.1418,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04400190711021423,
"step": 315,
"valid_targets_mean": 8977.0,
"valid_targets_min": 3447
},
{
"epoch": 0.3072,
"grad_norm": 0.16366961875606295,
"learning_rate": 2.449136276391555e-05,
"loss": 0.1434,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.052342720329761505,
"step": 320,
"valid_targets_mean": 8492.8,
"valid_targets_min": 1643
},
{
"epoch": 0.312,
"grad_norm": 0.21633571289591977,
"learning_rate": 2.4875239923224573e-05,
"loss": 0.1441,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06043235957622528,
"step": 325,
"valid_targets_mean": 9089.8,
"valid_targets_min": 3622
},
{
"epoch": 0.3168,
"grad_norm": 0.16778566765447833,
"learning_rate": 2.525911708253359e-05,
"loss": 0.1406,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04372868314385414,
"step": 330,
"valid_targets_mean": 8514.7,
"valid_targets_min": 1581
},
{
"epoch": 0.3216,
"grad_norm": 0.1525783264460117,
"learning_rate": 2.5642994241842613e-05,
"loss": 0.1366,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04171153903007507,
"step": 335,
"valid_targets_mean": 8744.2,
"valid_targets_min": 2937
},
{
"epoch": 0.3264,
"grad_norm": 0.17090017951805586,
"learning_rate": 2.6026871401151633e-05,
"loss": 0.1428,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.046074796468019485,
"step": 340,
"valid_targets_mean": 8279.8,
"valid_targets_min": 2561
},
{
"epoch": 0.3312,
"grad_norm": 0.16550150425181892,
"learning_rate": 2.6410748560460657e-05,
"loss": 0.1406,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04613085091114044,
"step": 345,
"valid_targets_mean": 8464.2,
"valid_targets_min": 2617
},
{
"epoch": 0.336,
"grad_norm": 0.15473637741869978,
"learning_rate": 2.6794625719769677e-05,
"loss": 0.1406,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.049118585884571075,
"step": 350,
"valid_targets_mean": 9190.0,
"valid_targets_min": 4909
},
{
"epoch": 0.3408,
"grad_norm": 0.1530756738736752,
"learning_rate": 2.7178502879078697e-05,
"loss": 0.1418,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04675169289112091,
"step": 355,
"valid_targets_mean": 8826.0,
"valid_targets_min": 2023
},
{
"epoch": 0.3456,
"grad_norm": 0.16704144085394457,
"learning_rate": 2.756238003838772e-05,
"loss": 0.1376,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05301285907626152,
"step": 360,
"valid_targets_mean": 9298.4,
"valid_targets_min": 2038
},
{
"epoch": 0.3504,
"grad_norm": 0.1705539915112971,
"learning_rate": 2.7946257197696737e-05,
"loss": 0.14,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.047162771224975586,
"step": 365,
"valid_targets_mean": 8848.1,
"valid_targets_min": 2694
},
{
"epoch": 0.3552,
"grad_norm": 0.17172115669532714,
"learning_rate": 2.833013435700576e-05,
"loss": 0.1358,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04858285188674927,
"step": 370,
"valid_targets_mean": 8245.0,
"valid_targets_min": 3959
},
{
"epoch": 0.36,
"grad_norm": 0.1635738602794979,
"learning_rate": 2.8714011516314784e-05,
"loss": 0.1394,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05017467588186264,
"step": 375,
"valid_targets_mean": 8803.3,
"valid_targets_min": 4631
},
{
"epoch": 0.3648,
"grad_norm": 0.14689162023635646,
"learning_rate": 2.90978886756238e-05,
"loss": 0.1415,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04908227548003197,
"step": 380,
"valid_targets_mean": 9190.8,
"valid_targets_min": 2141
},
{
"epoch": 0.3696,
"grad_norm": 0.1735748309731461,
"learning_rate": 2.9481765834932825e-05,
"loss": 0.1425,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05058016628026962,
"step": 385,
"valid_targets_mean": 8794.3,
"valid_targets_min": 2139
},
{
"epoch": 0.3744,
"grad_norm": 0.16453333610787235,
"learning_rate": 2.9865642994241845e-05,
"loss": 0.141,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.044411011040210724,
"step": 390,
"valid_targets_mean": 9082.6,
"valid_targets_min": 3334
},
{
"epoch": 0.3792,
"grad_norm": 0.16928223848401386,
"learning_rate": 3.0249520153550865e-05,
"loss": 0.1381,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04547496512532234,
"step": 395,
"valid_targets_mean": 8381.7,
"valid_targets_min": 1637
},
{
"epoch": 0.384,
"grad_norm": 0.16575962515587384,
"learning_rate": 3.063339731285989e-05,
"loss": 0.1345,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.052196696400642395,
"step": 400,
"valid_targets_mean": 9116.9,
"valid_targets_min": 3837
},
{
"epoch": 0.3888,
"grad_norm": 0.1465834004473263,
"learning_rate": 3.101727447216891e-05,
"loss": 0.1386,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.042442236095666885,
"step": 405,
"valid_targets_mean": 8501.0,
"valid_targets_min": 2762
},
{
"epoch": 0.3936,
"grad_norm": 0.168887624117521,
"learning_rate": 3.140115163147793e-05,
"loss": 0.1351,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04733353853225708,
"step": 410,
"valid_targets_mean": 9785.0,
"valid_targets_min": 4165
},
{
"epoch": 0.3984,
"grad_norm": 0.1674817302783263,
"learning_rate": 3.178502879078695e-05,
"loss": 0.1389,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04236965253949165,
"step": 415,
"valid_targets_mean": 7495.3,
"valid_targets_min": 2040
},
{
"epoch": 0.4032,
"grad_norm": 0.1633791795734902,
"learning_rate": 3.216890595009597e-05,
"loss": 0.1375,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04652637243270874,
"step": 420,
"valid_targets_mean": 9678.3,
"valid_targets_min": 3511
},
{
"epoch": 0.408,
"grad_norm": 0.15017097856344935,
"learning_rate": 3.2552783109404996e-05,
"loss": 0.1361,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04723096638917923,
"step": 425,
"valid_targets_mean": 8518.3,
"valid_targets_min": 5212
},
{
"epoch": 0.4128,
"grad_norm": 0.16403792996616412,
"learning_rate": 3.2936660268714016e-05,
"loss": 0.1363,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.045905664563179016,
"step": 430,
"valid_targets_mean": 8233.1,
"valid_targets_min": 1554
},
{
"epoch": 0.4176,
"grad_norm": 0.15363370389018594,
"learning_rate": 3.3320537428023036e-05,
"loss": 0.1345,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.047167956829071045,
"step": 435,
"valid_targets_mean": 9401.3,
"valid_targets_min": 2729
},
{
"epoch": 0.4224,
"grad_norm": 0.14941194784466624,
"learning_rate": 3.3704414587332056e-05,
"loss": 0.1394,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04570108652114868,
"step": 440,
"valid_targets_mean": 8790.9,
"valid_targets_min": 1588
},
{
"epoch": 0.4272,
"grad_norm": 0.1366092155715405,
"learning_rate": 3.4088291746641077e-05,
"loss": 0.135,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04900815337896347,
"step": 445,
"valid_targets_mean": 9022.6,
"valid_targets_min": 3456
},
{
"epoch": 0.432,
"grad_norm": 0.15770732910450744,
"learning_rate": 3.4472168905950104e-05,
"loss": 0.136,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04628250002861023,
"step": 450,
"valid_targets_mean": 8808.2,
"valid_targets_min": 5148
},
{
"epoch": 0.4368,
"grad_norm": 0.1629314200910405,
"learning_rate": 3.485604606525912e-05,
"loss": 0.1368,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0451054573059082,
"step": 455,
"valid_targets_mean": 8471.3,
"valid_targets_min": 2409
},
{
"epoch": 0.4416,
"grad_norm": 0.160272458945177,
"learning_rate": 3.5239923224568144e-05,
"loss": 0.1365,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.048758409917354584,
"step": 460,
"valid_targets_mean": 8512.3,
"valid_targets_min": 3525
},
{
"epoch": 0.4464,
"grad_norm": 0.16561926988288322,
"learning_rate": 3.5623800383877164e-05,
"loss": 0.1351,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05006253719329834,
"step": 465,
"valid_targets_mean": 8585.6,
"valid_targets_min": 2285
},
{
"epoch": 0.4512,
"grad_norm": 0.16050505436260384,
"learning_rate": 3.6007677543186184e-05,
"loss": 0.136,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05636896938085556,
"step": 470,
"valid_targets_mean": 9733.6,
"valid_targets_min": 2143
},
{
"epoch": 0.456,
"grad_norm": 0.14490817773722517,
"learning_rate": 3.6391554702495204e-05,
"loss": 0.1331,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.047622889280319214,
"step": 475,
"valid_targets_mean": 9244.6,
"valid_targets_min": 3390
},
{
"epoch": 0.4608,
"grad_norm": 0.15192210465120123,
"learning_rate": 3.6775431861804224e-05,
"loss": 0.133,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.044686153531074524,
"step": 480,
"valid_targets_mean": 8674.3,
"valid_targets_min": 2361
},
{
"epoch": 0.4656,
"grad_norm": 0.15068638781498972,
"learning_rate": 3.7159309021113245e-05,
"loss": 0.1369,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04900766536593437,
"step": 485,
"valid_targets_mean": 9105.2,
"valid_targets_min": 2433
},
{
"epoch": 0.4704,
"grad_norm": 0.16096900900073532,
"learning_rate": 3.7543186180422265e-05,
"loss": 0.135,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04619026556611061,
"step": 490,
"valid_targets_mean": 8567.6,
"valid_targets_min": 4220
},
{
"epoch": 0.4752,
"grad_norm": 0.15476058661894235,
"learning_rate": 3.792706333973129e-05,
"loss": 0.1339,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04463457316160202,
"step": 495,
"valid_targets_mean": 8529.2,
"valid_targets_min": 2511
},
{
"epoch": 0.48,
"grad_norm": 0.15092582689941947,
"learning_rate": 3.831094049904031e-05,
"loss": 0.1321,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03905282914638519,
"step": 500,
"valid_targets_mean": 8270.3,
"valid_targets_min": 2377
},
{
"epoch": 0.4848,
"grad_norm": 0.1537525325660721,
"learning_rate": 3.869481765834933e-05,
"loss": 0.1298,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.041663214564323425,
"step": 505,
"valid_targets_mean": 7962.0,
"valid_targets_min": 3432
},
{
"epoch": 0.4896,
"grad_norm": 0.15466191978224791,
"learning_rate": 3.907869481765835e-05,
"loss": 0.1342,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04699457436800003,
"step": 510,
"valid_targets_mean": 8543.5,
"valid_targets_min": 1866
},
{
"epoch": 0.4944,
"grad_norm": 0.14871033158460176,
"learning_rate": 3.946257197696737e-05,
"loss": 0.1345,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04727835953235626,
"step": 515,
"valid_targets_mean": 8456.3,
"valid_targets_min": 4250
},
{
"epoch": 0.4992,
"grad_norm": 0.14338051178538652,
"learning_rate": 3.984644913627639e-05,
"loss": 0.1317,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.040438905358314514,
"step": 520,
"valid_targets_mean": 8662.9,
"valid_targets_min": 2256
},
{
"epoch": 0.504,
"grad_norm": 0.15742380971099282,
"learning_rate": 3.999995959997414e-05,
"loss": 0.1324,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04269728064537048,
"step": 525,
"valid_targets_mean": 8493.9,
"valid_targets_min": 2420
},
{
"epoch": 0.5088,
"grad_norm": 0.15670069467354014,
"learning_rate": 3.999971271151827e-05,
"loss": 0.1342,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04551412910223007,
"step": 530,
"valid_targets_mean": 9344.8,
"valid_targets_min": 5656
},
{
"epoch": 0.5136,
"grad_norm": 0.15374405667621877,
"learning_rate": 3.9999241381832614e-05,
"loss": 0.1351,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0490286722779274,
"step": 535,
"valid_targets_mean": 8047.5,
"valid_targets_min": 3717
},
{
"epoch": 0.5184,
"grad_norm": 0.1519411027027414,
"learning_rate": 3.999854561620655e-05,
"loss": 0.1306,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.045247673988342285,
"step": 540,
"valid_targets_mean": 9440.2,
"valid_targets_min": 2358
},
{
"epoch": 0.5232,
"grad_norm": 0.14569122526754544,
"learning_rate": 3.9997625422448114e-05,
"loss": 0.1313,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04392744228243828,
"step": 545,
"valid_targets_mean": 9050.4,
"valid_targets_min": 5323
},
{
"epoch": 0.528,
"grad_norm": 0.13609907027733714,
"learning_rate": 3.999648081088391e-05,
"loss": 0.1325,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04291406646370888,
"step": 550,
"valid_targets_mean": 9465.5,
"valid_targets_min": 2912
},
{
"epoch": 0.5328,
"grad_norm": 0.1377783947779239,
"learning_rate": 3.999511179435905e-05,
"loss": 0.1293,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.040753189474344254,
"step": 555,
"valid_targets_mean": 9555.9,
"valid_targets_min": 2568
},
{
"epoch": 0.5376,
"grad_norm": 0.1379593120954164,
"learning_rate": 3.999351838823691e-05,
"loss": 0.1301,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04435383528470993,
"step": 560,
"valid_targets_mean": 9169.4,
"valid_targets_min": 3276
},
{
"epoch": 0.5424,
"grad_norm": 0.1418424270920895,
"learning_rate": 3.999170061039908e-05,
"loss": 0.1324,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.046147946268320084,
"step": 565,
"valid_targets_mean": 9111.7,
"valid_targets_min": 1397
},
{
"epoch": 0.5472,
"grad_norm": 0.14040633557580692,
"learning_rate": 3.998965848124505e-05,
"loss": 0.1342,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.048749588429927826,
"step": 570,
"valid_targets_mean": 9351.5,
"valid_targets_min": 5556
},
{
"epoch": 0.552,
"grad_norm": 0.13449375343867295,
"learning_rate": 3.998739202369205e-05,
"loss": 0.1289,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.041300173848867416,
"step": 575,
"valid_targets_mean": 8922.3,
"valid_targets_min": 2736
},
{
"epoch": 0.5568,
"grad_norm": 0.14743580069920623,
"learning_rate": 3.998490126317477e-05,
"loss": 0.1298,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04395359009504318,
"step": 580,
"valid_targets_mean": 8960.4,
"valid_targets_min": 2701
},
{
"epoch": 0.5616,
"grad_norm": 0.14157038751939097,
"learning_rate": 3.9982186227645085e-05,
"loss": 0.1299,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04324673116207123,
"step": 585,
"valid_targets_mean": 8823.2,
"valid_targets_min": 418
},
{
"epoch": 0.5664,
"grad_norm": 0.1582091638266866,
"learning_rate": 3.9979246947571724e-05,
"loss": 0.1306,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04149835929274559,
"step": 590,
"valid_targets_mean": 7495.4,
"valid_targets_min": 2352
},
{
"epoch": 0.5712,
"grad_norm": 0.14899721581452358,
"learning_rate": 3.9976083455939945e-05,
"loss": 0.1287,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04160813242197037,
"step": 595,
"valid_targets_mean": 8655.7,
"valid_targets_min": 2572
},
{
"epoch": 0.576,
"grad_norm": 0.1539653528766409,
"learning_rate": 3.9972695788251155e-05,
"loss": 0.1301,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04525775834918022,
"step": 600,
"valid_targets_mean": 8892.5,
"valid_targets_min": 5296
},
{
"epoch": 0.5808,
"grad_norm": 0.14943883780637449,
"learning_rate": 3.996908398252251e-05,
"loss": 0.1351,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.043959811329841614,
"step": 605,
"valid_targets_mean": 8608.5,
"valid_targets_min": 3362
},
{
"epoch": 0.5856,
"grad_norm": 0.13367238747822863,
"learning_rate": 3.9965248079286505e-05,
"loss": 0.1279,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04346688464283943,
"step": 610,
"valid_targets_mean": 9197.5,
"valid_targets_min": 1977
},
{
"epoch": 0.5904,
"grad_norm": 0.13643029241656873,
"learning_rate": 3.99611881215905e-05,
"loss": 0.1272,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.041380517184734344,
"step": 615,
"valid_targets_mean": 8393.2,
"valid_targets_min": 2051
},
{
"epoch": 0.5952,
"grad_norm": 0.1377113571496518,
"learning_rate": 3.995690415499624e-05,
"loss": 0.1312,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04686662554740906,
"step": 620,
"valid_targets_mean": 9150.6,
"valid_targets_min": 3686
},
{
"epoch": 0.6,
"grad_norm": 0.1403099261926008,
"learning_rate": 3.995239622757936e-05,
"loss": 0.1299,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0410618893802166,
"step": 625,
"valid_targets_mean": 8159.0,
"valid_targets_min": 3947
},
{
"epoch": 0.6048,
"grad_norm": 0.14096536721898614,
"learning_rate": 3.994766438992882e-05,
"loss": 0.1282,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03911704570055008,
"step": 630,
"valid_targets_mean": 7991.7,
"valid_targets_min": 1670
},
{
"epoch": 0.6096,
"grad_norm": 0.13195736313161857,
"learning_rate": 3.994270869514635e-05,
"loss": 0.1304,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0424465574324131,
"step": 635,
"valid_targets_mean": 8870.5,
"valid_targets_min": 2210
},
{
"epoch": 0.6144,
"grad_norm": 0.13332668179988635,
"learning_rate": 3.9937529198845864e-05,
"loss": 0.1283,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04478909820318222,
"step": 640,
"valid_targets_mean": 8382.8,
"valid_targets_min": 2213
},
{
"epoch": 0.6192,
"grad_norm": 0.13716325538151122,
"learning_rate": 3.9932125959152833e-05,
"loss": 0.1269,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04378994181752205,
"step": 645,
"valid_targets_mean": 8748.3,
"valid_targets_min": 2320
},
{
"epoch": 0.624,
"grad_norm": 0.1308079107487341,
"learning_rate": 3.9926499036703607e-05,
"loss": 0.1295,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.038693659007549286,
"step": 650,
"valid_targets_mean": 8223.2,
"valid_targets_min": 3239
},
{
"epoch": 0.6288,
"grad_norm": 0.14424264976490078,
"learning_rate": 3.992064849464476e-05,
"loss": 0.1318,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.043246474117040634,
"step": 655,
"valid_targets_mean": 7944.7,
"valid_targets_min": 1974
},
{
"epoch": 0.6336,
"grad_norm": 0.14454916157149716,
"learning_rate": 3.991457439863238e-05,
"loss": 0.1318,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.052069369703531265,
"step": 660,
"valid_targets_mean": 9785.6,
"valid_targets_min": 2127
},
{
"epoch": 0.6384,
"grad_norm": 0.13727057460729494,
"learning_rate": 3.990827681683133e-05,
"loss": 0.1304,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04632120579481125,
"step": 665,
"valid_targets_mean": 8698.8,
"valid_targets_min": 1935
},
{
"epoch": 0.6432,
"grad_norm": 0.1398377748234492,
"learning_rate": 3.990175581991448e-05,
"loss": 0.1274,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04159468784928322,
"step": 670,
"valid_targets_mean": 8791.3,
"valid_targets_min": 3886
},
{
"epoch": 0.648,
"grad_norm": 0.1345378725929749,
"learning_rate": 3.989501148106189e-05,
"loss": 0.1272,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04403248429298401,
"step": 675,
"valid_targets_mean": 8627.5,
"valid_targets_min": 1892
},
{
"epoch": 0.6528,
"grad_norm": 0.12953037003518647,
"learning_rate": 3.988804387596005e-05,
"loss": 0.1272,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.042582374066114426,
"step": 680,
"valid_targets_mean": 9106.1,
"valid_targets_min": 3962
},
{
"epoch": 0.6576,
"grad_norm": 0.1350393492828008,
"learning_rate": 3.9880853082800965e-05,
"loss": 0.1259,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.041537463665008545,
"step": 685,
"valid_targets_mean": 8600.3,
"valid_targets_min": 3511
},
{
"epoch": 0.6624,
"grad_norm": 0.13206633754473568,
"learning_rate": 3.987343918228133e-05,
"loss": 0.1261,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.044280827045440674,
"step": 690,
"valid_targets_mean": 8396.4,
"valid_targets_min": 3428
},
{
"epoch": 0.6672,
"grad_norm": 0.13729845663078688,
"learning_rate": 3.9865802257601584e-05,
"loss": 0.1237,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04000245779752731,
"step": 695,
"valid_targets_mean": 8540.1,
"valid_targets_min": 1813
},
{
"epoch": 0.672,
"grad_norm": 0.13635663924478578,
"learning_rate": 3.9857942394464976e-05,
"loss": 0.1258,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03872641175985336,
"step": 700,
"valid_targets_mean": 8601.8,
"valid_targets_min": 4288
},
{
"epoch": 0.6768,
"grad_norm": 0.15057437392276532,
"learning_rate": 3.984985968107667e-05,
"loss": 0.1262,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04191380739212036,
"step": 705,
"valid_targets_mean": 8113.8,
"valid_targets_min": 1824
},
{
"epoch": 0.6816,
"grad_norm": 0.15262968979836647,
"learning_rate": 3.984155420814266e-05,
"loss": 0.1279,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.045424915850162506,
"step": 710,
"valid_targets_mean": 9187.2,
"valid_targets_min": 3023
},
{
"epoch": 0.6864,
"grad_norm": 0.14131561005827004,
"learning_rate": 3.9833026068868814e-05,
"loss": 0.129,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04640107974410057,
"step": 715,
"valid_targets_mean": 9442.9,
"valid_targets_min": 2870
},
{
"epoch": 0.6912,
"grad_norm": 0.1536532150005904,
"learning_rate": 3.982427535895982e-05,
"loss": 0.1255,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04061667248606682,
"step": 720,
"valid_targets_mean": 7744.2,
"valid_targets_min": 1807
},
{
"epoch": 0.696,
"grad_norm": 0.14566890333011928,
"learning_rate": 3.9815302176618076e-05,
"loss": 0.1271,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.037999723106622696,
"step": 725,
"valid_targets_mean": 8014.6,
"valid_targets_min": 2692
},
{
"epoch": 0.7008,
"grad_norm": 0.1329319602860735,
"learning_rate": 3.980610662254264e-05,
"loss": 0.1258,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.043485239148139954,
"step": 730,
"valid_targets_mean": 8674.2,
"valid_targets_min": 1914
},
{
"epoch": 0.7056,
"grad_norm": 0.13214607087955763,
"learning_rate": 3.9796688799928075e-05,
"loss": 0.1258,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03650156408548355,
"step": 735,
"valid_targets_mean": 8052.5,
"valid_targets_min": 1535
},
{
"epoch": 0.7104,
"grad_norm": 0.14666052223087997,
"learning_rate": 3.978704881446327e-05,
"loss": 0.1291,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.040827296674251556,
"step": 740,
"valid_targets_mean": 8658.8,
"valid_targets_min": 3364
},
{
"epoch": 0.7152,
"grad_norm": 0.13199011134390393,
"learning_rate": 3.9777186774330304e-05,
"loss": 0.1261,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03985761106014252,
"step": 745,
"valid_targets_mean": 8315.3,
"valid_targets_min": 2041
},
{
"epoch": 0.72,
"grad_norm": 0.13006510073207833,
"learning_rate": 3.976710279020318e-05,
"loss": 0.1244,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.050185881555080414,
"step": 750,
"valid_targets_mean": 8819.3,
"valid_targets_min": 3518
},
{
"epoch": 0.7248,
"grad_norm": 0.12635946950837632,
"learning_rate": 3.975679697524661e-05,
"loss": 0.1242,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0413113571703434,
"step": 755,
"valid_targets_mean": 9287.8,
"valid_targets_min": 2520
},
{
"epoch": 0.7296,
"grad_norm": 0.16619628024740615,
"learning_rate": 3.974626944511475e-05,
"loss": 0.1243,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.040970057249069214,
"step": 760,
"valid_targets_mean": 8394.7,
"valid_targets_min": 3787
},
{
"epoch": 0.7344,
"grad_norm": 0.13983220811078784,
"learning_rate": 3.973552031794988e-05,
"loss": 0.1251,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04032052308320999,
"step": 765,
"valid_targets_mean": 8312.5,
"valid_targets_min": 1690
},
{
"epoch": 0.7392,
"grad_norm": 0.13276909522770805,
"learning_rate": 3.9724549714381106e-05,
"loss": 0.126,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0410274863243103,
"step": 770,
"valid_targets_mean": 9437.8,
"valid_targets_min": 4807
},
{
"epoch": 0.744,
"grad_norm": 0.14074663236062346,
"learning_rate": 3.971335775752298e-05,
"loss": 0.1279,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04447145760059357,
"step": 775,
"valid_targets_mean": 8283.8,
"valid_targets_min": 2255
},
{
"epoch": 0.7488,
"grad_norm": 0.13345475156150907,
"learning_rate": 3.970194457297414e-05,
"loss": 0.1257,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0476519837975502,
"step": 780,
"valid_targets_mean": 8958.5,
"valid_targets_min": 2037
},
{
"epoch": 0.7536,
"grad_norm": 0.13590512683057793,
"learning_rate": 3.9690310288815876e-05,
"loss": 0.1221,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.038623590022325516,
"step": 785,
"valid_targets_mean": 8875.8,
"valid_targets_min": 1547
},
{
"epoch": 0.7584,
"grad_norm": 0.12392055016932459,
"learning_rate": 3.967845503561073e-05,
"loss": 0.1223,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03856155276298523,
"step": 790,
"valid_targets_mean": 8824.8,
"valid_targets_min": 3008
},
{
"epoch": 0.7632,
"grad_norm": 0.12808803769496246,
"learning_rate": 3.9666378946400974e-05,
"loss": 0.1223,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04124930500984192,
"step": 795,
"valid_targets_mean": 8398.5,
"valid_targets_min": 4402
},
{
"epoch": 0.768,
"grad_norm": 0.12400753315300732,
"learning_rate": 3.965408215670719e-05,
"loss": 0.125,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04107067734003067,
"step": 800,
"valid_targets_mean": 9418.2,
"valid_targets_min": 5645
},
{
"epoch": 0.7728,
"grad_norm": 0.1321463233062571,
"learning_rate": 3.964156480452667e-05,
"loss": 0.1256,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.040333010256290436,
"step": 805,
"valid_targets_mean": 9123.3,
"valid_targets_min": 2232
},
{
"epoch": 0.7776,
"grad_norm": 0.15850818767395258,
"learning_rate": 3.962882703033195e-05,
"loss": 0.1246,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04237630218267441,
"step": 810,
"valid_targets_mean": 9014.5,
"valid_targets_min": 1757
},
{
"epoch": 0.7824,
"grad_norm": 0.13022752887109454,
"learning_rate": 3.961586897706915e-05,
"loss": 0.1226,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03962777554988861,
"step": 815,
"valid_targets_mean": 8785.4,
"valid_targets_min": 3393
},
{
"epoch": 0.7872,
"grad_norm": 0.1411987989970659,
"learning_rate": 3.960269079015643e-05,
"loss": 0.1233,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04631964862346649,
"step": 820,
"valid_targets_mean": 9530.4,
"valid_targets_min": 5058
},
{
"epoch": 0.792,
"grad_norm": 0.13216475655191032,
"learning_rate": 3.958929261748236e-05,
"loss": 0.1231,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04475382715463638,
"step": 825,
"valid_targets_mean": 8892.8,
"valid_targets_min": 2083
},
{
"epoch": 0.7968,
"grad_norm": 0.12772498172212535,
"learning_rate": 3.957567460940419e-05,
"loss": 0.1237,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04453466087579727,
"step": 830,
"valid_targets_mean": 8443.8,
"valid_targets_min": 806
},
{
"epoch": 0.8016,
"grad_norm": 0.1288360457272141,
"learning_rate": 3.9561836918746256e-05,
"loss": 0.1238,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04772651568055153,
"step": 835,
"valid_targets_mean": 9130.0,
"valid_targets_min": 3135
},
{
"epoch": 0.8064,
"grad_norm": 0.12904971741193666,
"learning_rate": 3.95477797007982e-05,
"loss": 0.1246,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.041636817157268524,
"step": 840,
"valid_targets_mean": 9023.4,
"valid_targets_min": 4250
},
{
"epoch": 0.8112,
"grad_norm": 0.1326001544343892,
"learning_rate": 3.953350311331325e-05,
"loss": 0.1233,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04039324074983597,
"step": 845,
"valid_targets_mean": 9260.4,
"valid_targets_min": 3688
},
{
"epoch": 0.816,
"grad_norm": 0.12642447244379482,
"learning_rate": 3.951900731650645e-05,
"loss": 0.1207,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.039405159652233124,
"step": 850,
"valid_targets_mean": 8837.0,
"valid_targets_min": 2405
},
{
"epoch": 0.8208,
"grad_norm": 0.13173156761588117,
"learning_rate": 3.950429247305286e-05,
"loss": 0.121,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03566863760352135,
"step": 855,
"valid_targets_mean": 7964.2,
"valid_targets_min": 1228
},
{
"epoch": 0.8256,
"grad_norm": 0.20449125184239303,
"learning_rate": 3.9489358748085737e-05,
"loss": 0.1214,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.044600710272789,
"step": 860,
"valid_targets_mean": 8969.1,
"valid_targets_min": 2519
},
{
"epoch": 0.8304,
"grad_norm": 0.1267782883516138,
"learning_rate": 3.947420630919466e-05,
"loss": 0.1239,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.040724076330661774,
"step": 865,
"valid_targets_mean": 8701.4,
"valid_targets_min": 2522
},
{
"epoch": 0.8352,
"grad_norm": 0.13947426674783286,
"learning_rate": 3.9458835326423674e-05,
"loss": 0.1226,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03723190724849701,
"step": 870,
"valid_targets_mean": 8694.7,
"valid_targets_min": 3628
},
{
"epoch": 0.84,
"grad_norm": 0.1429427588322893,
"learning_rate": 3.9443245972269376e-05,
"loss": 0.1208,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.044337622821331024,
"step": 875,
"valid_targets_mean": 9151.8,
"valid_targets_min": 4207
},
{
"epoch": 0.8448,
"grad_norm": 0.12601811128568607,
"learning_rate": 3.942743842167896e-05,
"loss": 0.1233,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03860004246234894,
"step": 880,
"valid_targets_mean": 8116.6,
"valid_targets_min": 3504
},
{
"epoch": 0.8496,
"grad_norm": 0.1231651306256786,
"learning_rate": 3.941141285204829e-05,
"loss": 0.1242,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03568350523710251,
"step": 885,
"valid_targets_mean": 8602.6,
"valid_targets_min": 3333
},
{
"epoch": 0.8544,
"grad_norm": 0.1327633357414085,
"learning_rate": 3.939516944321986e-05,
"loss": 0.12,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03741621971130371,
"step": 890,
"valid_targets_mean": 7680.4,
"valid_targets_min": 2034
},
{
"epoch": 0.8592,
"grad_norm": 0.12782058862734189,
"learning_rate": 3.937870837748085e-05,
"loss": 0.1196,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04108661413192749,
"step": 895,
"valid_targets_mean": 9461.2,
"valid_targets_min": 4191
},
{
"epoch": 0.864,
"grad_norm": 0.13095812423706943,
"learning_rate": 3.936202983956098e-05,
"loss": 0.1214,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04491672292351723,
"step": 900,
"valid_targets_mean": 9060.0,
"valid_targets_min": 4238
},
{
"epoch": 0.8688,
"grad_norm": 0.14435955628562666,
"learning_rate": 3.934513401663052e-05,
"loss": 0.1217,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04353254288434982,
"step": 905,
"valid_targets_mean": 8174.2,
"valid_targets_min": 2049
},
{
"epoch": 0.8736,
"grad_norm": 0.13777422571076636,
"learning_rate": 3.9328021098298164e-05,
"loss": 0.1244,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04200918227434158,
"step": 910,
"valid_targets_mean": 7853.6,
"valid_targets_min": 2161
},
{
"epoch": 0.8784,
"grad_norm": 0.12925096382507895,
"learning_rate": 3.9310691276608894e-05,
"loss": 0.1227,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03885449841618538,
"step": 915,
"valid_targets_mean": 8998.7,
"valid_targets_min": 4216
},
{
"epoch": 0.8832,
"grad_norm": 0.1299999207480068,
"learning_rate": 3.9293144746041824e-05,
"loss": 0.12,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0414196252822876,
"step": 920,
"valid_targets_mean": 9441.6,
"valid_targets_min": 3116
},
{
"epoch": 0.888,
"grad_norm": 0.14119631019377754,
"learning_rate": 3.9275381703508034e-05,
"loss": 0.1202,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04161785542964935,
"step": 925,
"valid_targets_mean": 9032.9,
"valid_targets_min": 3320
},
{
"epoch": 0.8928,
"grad_norm": 0.1335427102135748,
"learning_rate": 3.925740234834833e-05,
"loss": 0.122,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.039411455392837524,
"step": 930,
"valid_targets_mean": 8125.8,
"valid_targets_min": 2362
},
{
"epoch": 0.8976,
"grad_norm": 1.299524668859639,
"learning_rate": 3.9239206882331045e-05,
"loss": 0.122,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04274000972509384,
"step": 935,
"valid_targets_mean": 9362.2,
"valid_targets_min": 2499
},
{
"epoch": 0.9024,
"grad_norm": 0.14595064075165548,
"learning_rate": 3.922079550964976e-05,
"loss": 0.1203,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.041862644255161285,
"step": 940,
"valid_targets_mean": 8516.2,
"valid_targets_min": 2866
},
{
"epoch": 0.9072,
"grad_norm": 0.1406716428331579,
"learning_rate": 3.920216843692099e-05,
"loss": 0.1198,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.039388202130794525,
"step": 945,
"valid_targets_mean": 8288.1,
"valid_targets_min": 1520
},
{
"epoch": 0.912,
"grad_norm": 0.12120059012749052,
"learning_rate": 3.918332587318189e-05,
"loss": 0.122,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03998667746782303,
"step": 950,
"valid_targets_mean": 9838.4,
"valid_targets_min": 3065
},
{
"epoch": 0.9168,
"grad_norm": 0.12432674716745307,
"learning_rate": 3.916426802988791e-05,
"loss": 0.1191,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.034975167363882065,
"step": 955,
"valid_targets_mean": 8630.9,
"valid_targets_min": 3664
},
{
"epoch": 0.9216,
"grad_norm": 0.12453368828142465,
"learning_rate": 3.9144995120910414e-05,
"loss": 0.1212,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.040313076227903366,
"step": 960,
"valid_targets_mean": 8565.8,
"valid_targets_min": 1313
},
{
"epoch": 0.9264,
"grad_norm": 0.12414549421169692,
"learning_rate": 3.912550736253428e-05,
"loss": 0.1165,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03618764504790306,
"step": 965,
"valid_targets_mean": 9026.8,
"valid_targets_min": 2861
},
{
"epoch": 0.9312,
"grad_norm": 0.12295142873666405,
"learning_rate": 3.9105804973455466e-05,
"loss": 0.1217,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.037326935678720474,
"step": 970,
"valid_targets_mean": 8990.8,
"valid_targets_min": 5060
},
{
"epoch": 0.936,
"grad_norm": 0.1199361629404387,
"learning_rate": 3.908588817477858e-05,
"loss": 0.1204,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03776358813047409,
"step": 975,
"valid_targets_mean": 9242.8,
"valid_targets_min": 2535
},
{
"epoch": 0.9408,
"grad_norm": 0.11968391724432256,
"learning_rate": 3.9065757190014356e-05,
"loss": 0.1194,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04064861685037613,
"step": 980,
"valid_targets_mean": 8815.6,
"valid_targets_min": 2016
},
{
"epoch": 0.9456,
"grad_norm": 0.13010903116296166,
"learning_rate": 3.90454122450772e-05,
"loss": 0.1185,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03588135540485382,
"step": 985,
"valid_targets_mean": 8170.3,
"valid_targets_min": 3799
},
{
"epoch": 0.9504,
"grad_norm": 0.12285238315467241,
"learning_rate": 3.9024853568282615e-05,
"loss": 0.1192,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03708403930068016,
"step": 990,
"valid_targets_mean": 9025.9,
"valid_targets_min": 5318
},
{
"epoch": 0.9552,
"grad_norm": 0.13047767902641233,
"learning_rate": 3.900408139034464e-05,
"loss": 0.1182,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04085266962647438,
"step": 995,
"valid_targets_mean": 8927.5,
"valid_targets_min": 2808
},
{
"epoch": 0.96,
"grad_norm": 0.12509338732915287,
"learning_rate": 3.89830959443733e-05,
"loss": 0.1213,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.042269591242074966,
"step": 1000,
"valid_targets_mean": 9112.8,
"valid_targets_min": 3104
},
{
"epoch": 0.9648,
"grad_norm": 0.12707976296407147,
"learning_rate": 3.896189746587192e-05,
"loss": 0.1187,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04251757264137268,
"step": 1005,
"valid_targets_mean": 9197.0,
"valid_targets_min": 4955
},
{
"epoch": 0.9696,
"grad_norm": 0.13513570063473687,
"learning_rate": 3.894048619273457e-05,
"loss": 0.1195,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0449819378554821,
"step": 1010,
"valid_targets_mean": 8805.6,
"valid_targets_min": 2816
},
{
"epoch": 0.9744,
"grad_norm": 0.11628596725040473,
"learning_rate": 3.89188623652433e-05,
"loss": 0.1164,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03957689553499222,
"step": 1015,
"valid_targets_mean": 9101.4,
"valid_targets_min": 5845
},
{
"epoch": 0.9792,
"grad_norm": 0.1395600161258974,
"learning_rate": 3.889702622606553e-05,
"loss": 0.1207,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04011973738670349,
"step": 1020,
"valid_targets_mean": 8340.6,
"valid_targets_min": 2670
},
{
"epoch": 0.984,
"grad_norm": 0.12278646466936824,
"learning_rate": 3.887497802025129e-05,
"loss": 0.1149,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03440343588590622,
"step": 1025,
"valid_targets_mean": 8029.5,
"valid_targets_min": 2752
},
{
"epoch": 0.9888,
"grad_norm": 0.12604219136442135,
"learning_rate": 3.885271799523043e-05,
"loss": 0.12,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04180954396724701,
"step": 1030,
"valid_targets_mean": 8562.8,
"valid_targets_min": 2962
},
{
"epoch": 0.9936,
"grad_norm": 0.12564503884119702,
"learning_rate": 3.8830246400809925e-05,
"loss": 0.1207,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03574180603027344,
"step": 1035,
"valid_targets_mean": 8152.6,
"valid_targets_min": 4152
},
{
"epoch": 0.9984,
"grad_norm": 0.12286222401223959,
"learning_rate": 3.880756348917101e-05,
"loss": 0.1201,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04260804131627083,
"step": 1040,
"valid_targets_mean": 9008.5,
"valid_targets_min": 4527
},
{
"epoch": 1.00288,
"grad_norm": 0.13532126940346526,
"learning_rate": 3.8784669514866365e-05,
"loss": 0.1132,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03753751516342163,
"step": 1045,
"valid_targets_mean": 10100.1,
"valid_targets_min": 5514
},
{
"epoch": 1.00768,
"grad_norm": 0.12973697576755405,
"learning_rate": 3.876156473481727e-05,
"loss": 0.1065,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03712521493434906,
"step": 1050,
"valid_targets_mean": 9113.7,
"valid_targets_min": 3701
},
{
"epoch": 1.01248,
"grad_norm": 0.12040784575878684,
"learning_rate": 3.8738249408310716e-05,
"loss": 0.1109,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04298216104507446,
"step": 1055,
"valid_targets_mean": 9181.2,
"valid_targets_min": 3126
},
{
"epoch": 1.01728,
"grad_norm": 0.1290882287304988,
"learning_rate": 3.871472379699648e-05,
"loss": 0.111,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03602221980690956,
"step": 1060,
"valid_targets_mean": 8772.9,
"valid_targets_min": 2607
},
{
"epoch": 1.02208,
"grad_norm": 0.12406914379482467,
"learning_rate": 3.869098816488422e-05,
"loss": 0.108,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03653515875339508,
"step": 1065,
"valid_targets_mean": 9124.3,
"valid_targets_min": 5033
},
{
"epoch": 1.02688,
"grad_norm": 0.13729165019846906,
"learning_rate": 3.866704277834049e-05,
"loss": 0.1118,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.035046130418777466,
"step": 1070,
"valid_targets_mean": 8623.2,
"valid_targets_min": 3230
},
{
"epoch": 1.03168,
"grad_norm": 0.12036440804151036,
"learning_rate": 3.864288790608573e-05,
"loss": 0.1125,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.034265272319316864,
"step": 1075,
"valid_targets_mean": 9006.2,
"valid_targets_min": 2326
},
{
"epoch": 1.03648,
"grad_norm": 0.12363412561657591,
"learning_rate": 3.861852381919132e-05,
"loss": 0.1086,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.038711585104465485,
"step": 1080,
"valid_targets_mean": 8283.0,
"valid_targets_min": 2443
},
{
"epoch": 1.04128,
"grad_norm": 0.12022387745735609,
"learning_rate": 3.8593950791076446e-05,
"loss": 0.1104,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03348660469055176,
"step": 1085,
"valid_targets_mean": 8197.9,
"valid_targets_min": 1325
},
{
"epoch": 1.04608,
"grad_norm": 0.12541307411660785,
"learning_rate": 3.856916909750512e-05,
"loss": 0.1097,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03612164780497551,
"step": 1090,
"valid_targets_mean": 8937.5,
"valid_targets_min": 4843
},
{
"epoch": 1.05088,
"grad_norm": 0.12767600777176324,
"learning_rate": 3.854417901658301e-05,
"loss": 0.1098,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.036185123026371,
"step": 1095,
"valid_targets_mean": 8712.5,
"valid_targets_min": 4257
},
{
"epoch": 1.05568,
"grad_norm": 0.12527917305408634,
"learning_rate": 3.851898082875438e-05,
"loss": 0.1095,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.037031348794698715,
"step": 1100,
"valid_targets_mean": 9053.6,
"valid_targets_min": 3371
},
{
"epoch": 1.06048,
"grad_norm": 0.13136956141466558,
"learning_rate": 3.849357481679891e-05,
"loss": 0.1096,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.041252005845308304,
"step": 1105,
"valid_targets_mean": 8509.0,
"valid_targets_min": 3914
},
{
"epoch": 1.06528,
"grad_norm": 0.12922975818642823,
"learning_rate": 3.846796126582851e-05,
"loss": 0.1094,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03326720371842384,
"step": 1110,
"valid_targets_mean": 8771.5,
"valid_targets_min": 3884
},
{
"epoch": 1.07008,
"grad_norm": 0.12106396045806493,
"learning_rate": 3.844214046328416e-05,
"loss": 0.1097,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.043117620050907135,
"step": 1115,
"valid_targets_mean": 8209.8,
"valid_targets_min": 3243
},
{
"epoch": 1.07488,
"grad_norm": 0.13002226111527115,
"learning_rate": 3.841611269893266e-05,
"loss": 0.109,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03778604418039322,
"step": 1120,
"valid_targets_mean": 8510.7,
"valid_targets_min": 2567
},
{
"epoch": 1.07968,
"grad_norm": 0.12456407780457754,
"learning_rate": 3.8389878264863364e-05,
"loss": 0.1096,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03702523559331894,
"step": 1125,
"valid_targets_mean": 9058.4,
"valid_targets_min": 5648
},
{
"epoch": 1.08448,
"grad_norm": 0.12625041807761278,
"learning_rate": 3.836343745548495e-05,
"loss": 0.1087,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03746821731328964,
"step": 1130,
"valid_targets_mean": 9379.8,
"valid_targets_min": 2461
},
{
"epoch": 1.08928,
"grad_norm": 0.12729402444355445,
"learning_rate": 3.833679056752205e-05,
"loss": 0.1086,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03369244933128357,
"step": 1135,
"valid_targets_mean": 8650.1,
"valid_targets_min": 2519
},
{
"epoch": 1.09408,
"grad_norm": 0.12251279578419882,
"learning_rate": 3.8309937900012e-05,
"loss": 0.1098,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.035309284925460815,
"step": 1140,
"valid_targets_mean": 8545.1,
"valid_targets_min": 2214
},
{
"epoch": 1.09888,
"grad_norm": 0.12475486299736205,
"learning_rate": 3.8282879754301395e-05,
"loss": 0.1099,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.036522600799798965,
"step": 1145,
"valid_targets_mean": 9047.7,
"valid_targets_min": 2994
},
{
"epoch": 1.10368,
"grad_norm": 0.12100576465873229,
"learning_rate": 3.825561643404277e-05,
"loss": 0.1114,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04240952804684639,
"step": 1150,
"valid_targets_mean": 9005.7,
"valid_targets_min": 4329
},
{
"epoch": 1.10848,
"grad_norm": 0.12172067784502344,
"learning_rate": 3.8228148245191195e-05,
"loss": 0.1076,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03200407326221466,
"step": 1155,
"valid_targets_mean": 8406.1,
"valid_targets_min": 4143
},
{
"epoch": 1.11328,
"grad_norm": 0.13157757940674708,
"learning_rate": 3.820047549600078e-05,
"loss": 0.1064,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0324568971991539,
"step": 1160,
"valid_targets_mean": 8611.8,
"valid_targets_min": 4615
},
{
"epoch": 1.11808,
"grad_norm": 0.13712186902776327,
"learning_rate": 3.8172598497021304e-05,
"loss": 0.1098,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.032350365072488785,
"step": 1165,
"valid_targets_mean": 8286.6,
"valid_targets_min": 3998
},
{
"epoch": 1.12288,
"grad_norm": 0.12296139282257143,
"learning_rate": 3.8144517561094635e-05,
"loss": 0.1087,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03495969623327255,
"step": 1170,
"valid_targets_mean": 8338.6,
"valid_targets_min": 2001
},
{
"epoch": 1.12768,
"grad_norm": 0.12885506741767813,
"learning_rate": 3.811623300335129e-05,
"loss": 0.106,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03439897298812866,
"step": 1175,
"valid_targets_mean": 8294.6,
"valid_targets_min": 3388
},
{
"epoch": 1.13248,
"grad_norm": 0.13353947355498724,
"learning_rate": 3.808774514120689e-05,
"loss": 0.1068,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03528585284948349,
"step": 1180,
"valid_targets_mean": 8710.7,
"valid_targets_min": 2226
},
{
"epoch": 1.13728,
"grad_norm": 0.11554578661926901,
"learning_rate": 3.805905429435856e-05,
"loss": 0.1069,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0375838503241539,
"step": 1185,
"valid_targets_mean": 9312.7,
"valid_targets_min": 4938
},
{
"epoch": 1.14208,
"grad_norm": 0.13553731807499625,
"learning_rate": 3.803016078478137e-05,
"loss": 0.1118,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03697044402360916,
"step": 1190,
"valid_targets_mean": 8790.3,
"valid_targets_min": 3411
},
{
"epoch": 1.14688,
"grad_norm": 0.19558858259974732,
"learning_rate": 3.800106493672472e-05,
"loss": 0.1044,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0370432510972023,
"step": 1195,
"valid_targets_mean": 8896.2,
"valid_targets_min": 2351
},
{
"epoch": 1.15168,
"grad_norm": 0.12694965655544607,
"learning_rate": 3.7971767076708704e-05,
"loss": 0.1096,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03679373487830162,
"step": 1200,
"valid_targets_mean": 8190.5,
"valid_targets_min": 1331
},
{
"epoch": 1.15648,
"grad_norm": 0.1294349062636514,
"learning_rate": 3.794226753352042e-05,
"loss": 0.1104,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03450850769877434,
"step": 1205,
"valid_targets_mean": 7733.4,
"valid_targets_min": 2324
},
{
"epoch": 1.16128,
"grad_norm": 0.13350423195151842,
"learning_rate": 3.791256663821032e-05,
"loss": 0.1128,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03809414058923721,
"step": 1210,
"valid_targets_mean": 8429.0,
"valid_targets_min": 1850
},
{
"epoch": 1.16608,
"grad_norm": 0.11693967487810589,
"learning_rate": 3.788266472408846e-05,
"loss": 0.1125,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04129686951637268,
"step": 1215,
"valid_targets_mean": 9791.9,
"valid_targets_min": 3448
},
{
"epoch": 1.17088,
"grad_norm": 0.1171411660888164,
"learning_rate": 3.785256212672077e-05,
"loss": 0.1114,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.032727207988500595,
"step": 1220,
"valid_targets_mean": 8760.9,
"valid_targets_min": 3157
},
{
"epoch": 1.17568,
"grad_norm": 0.12246093881306887,
"learning_rate": 3.7822259183925324e-05,
"loss": 0.1088,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03792506083846092,
"step": 1225,
"valid_targets_mean": 8479.7,
"valid_targets_min": 2780
},
{
"epoch": 1.18048,
"grad_norm": 0.11630087988559276,
"learning_rate": 3.7791756235768476e-05,
"loss": 0.1126,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.030140887945890427,
"step": 1230,
"valid_targets_mean": 8280.7,
"valid_targets_min": 1912
},
{
"epoch": 1.1852800000000001,
"grad_norm": 0.12034312206493047,
"learning_rate": 3.7761053624561104e-05,
"loss": 0.1118,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.041859276592731476,
"step": 1235,
"valid_targets_mean": 9125.2,
"valid_targets_min": 4384
},
{
"epoch": 1.19008,
"grad_norm": 0.12495575991658803,
"learning_rate": 3.7730151694854757e-05,
"loss": 0.1107,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03812647983431816,
"step": 1240,
"valid_targets_mean": 8895.1,
"valid_targets_min": 3239
},
{
"epoch": 1.19488,
"grad_norm": 0.1279797576014592,
"learning_rate": 3.769905079343777e-05,
"loss": 0.1094,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03480718284845352,
"step": 1245,
"valid_targets_mean": 9148.8,
"valid_targets_min": 3375
},
{
"epoch": 1.19968,
"grad_norm": 0.1429209094833432,
"learning_rate": 3.766775126933138e-05,
"loss": 0.1146,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03262244164943695,
"step": 1250,
"valid_targets_mean": 7446.3,
"valid_targets_min": 1642
},
{
"epoch": 1.20448,
"grad_norm": 0.11651049817133567,
"learning_rate": 3.7636253473785815e-05,
"loss": 0.1107,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04041413217782974,
"step": 1255,
"valid_targets_mean": 9296.9,
"valid_targets_min": 1921
},
{
"epoch": 1.20928,
"grad_norm": 0.12715956000371428,
"learning_rate": 3.760455776027636e-05,
"loss": 0.1102,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.036815039813518524,
"step": 1260,
"valid_targets_mean": 8492.6,
"valid_targets_min": 2198
},
{
"epoch": 1.21408,
"grad_norm": 0.13088428982143835,
"learning_rate": 3.7572664484499365e-05,
"loss": 0.1116,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04161841422319412,
"step": 1265,
"valid_targets_mean": 9645.4,
"valid_targets_min": 5888
},
{
"epoch": 1.21888,
"grad_norm": 0.11844945935335202,
"learning_rate": 3.7540574004368264e-05,
"loss": 0.1105,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.035760242491960526,
"step": 1270,
"valid_targets_mean": 8232.6,
"valid_targets_min": 972
},
{
"epoch": 1.2236799999999999,
"grad_norm": 0.1217454331633701,
"learning_rate": 3.750828668000959e-05,
"loss": 0.1111,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.044121257960796356,
"step": 1275,
"valid_targets_mean": 9731.1,
"valid_targets_min": 4826
},
{
"epoch": 1.22848,
"grad_norm": 0.11438951119465016,
"learning_rate": 3.747580287375887e-05,
"loss": 0.1094,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03459799289703369,
"step": 1280,
"valid_targets_mean": 8311.7,
"valid_targets_min": 3380
},
{
"epoch": 1.23328,
"grad_norm": 0.12344370046566683,
"learning_rate": 3.744312295015662e-05,
"loss": 0.1098,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03901112824678421,
"step": 1285,
"valid_targets_mean": 9534.2,
"valid_targets_min": 4213
},
{
"epoch": 1.23808,
"grad_norm": 0.1282738291200301,
"learning_rate": 3.7410247275944223e-05,
"loss": 0.1118,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0330953374505043,
"step": 1290,
"valid_targets_mean": 7552.4,
"valid_targets_min": 1647
},
{
"epoch": 1.24288,
"grad_norm": 0.11797698703131318,
"learning_rate": 3.737717622005981e-05,
"loss": 0.1128,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04117663949728012,
"step": 1295,
"valid_targets_mean": 8844.8,
"valid_targets_min": 4651
},
{
"epoch": 1.24768,
"grad_norm": 0.12402104881406364,
"learning_rate": 3.734391015363413e-05,
"loss": 0.1138,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03869440779089928,
"step": 1300,
"valid_targets_mean": 9305.2,
"valid_targets_min": 3205
},
{
"epoch": 1.25248,
"grad_norm": 0.11958484310256949,
"learning_rate": 3.7310449449986404e-05,
"loss": 0.1073,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.035795748233795166,
"step": 1305,
"valid_targets_mean": 9048.6,
"valid_targets_min": 4788
},
{
"epoch": 1.25728,
"grad_norm": 0.13049242536465502,
"learning_rate": 3.727679448462009e-05,
"loss": 0.1098,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03678382933139801,
"step": 1310,
"valid_targets_mean": 8353.3,
"valid_targets_min": 2833
},
{
"epoch": 1.26208,
"grad_norm": 0.1181583760477813,
"learning_rate": 3.7242945635218696e-05,
"loss": 0.1067,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03211447596549988,
"step": 1315,
"valid_targets_mean": 8366.3,
"valid_targets_min": 1833
},
{
"epoch": 1.26688,
"grad_norm": 0.11742791216030482,
"learning_rate": 3.720890328164156e-05,
"loss": 0.1084,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.042314011603593826,
"step": 1320,
"valid_targets_mean": 9944.7,
"valid_targets_min": 3926
},
{
"epoch": 1.27168,
"grad_norm": 0.11792444140621308,
"learning_rate": 3.717466780591956e-05,
"loss": 0.1076,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.037658244371414185,
"step": 1325,
"valid_targets_mean": 8533.1,
"valid_targets_min": 2539
},
{
"epoch": 1.27648,
"grad_norm": 0.12225024480557042,
"learning_rate": 3.7140239592250804e-05,
"loss": 0.1062,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.037245847284793854,
"step": 1330,
"valid_targets_mean": 9268.9,
"valid_targets_min": 5670
},
{
"epoch": 1.28128,
"grad_norm": 0.12318589546339119,
"learning_rate": 3.71056190269964e-05,
"loss": 0.1077,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.034685347229242325,
"step": 1335,
"valid_targets_mean": 8202.7,
"valid_targets_min": 1834
},
{
"epoch": 1.2860800000000001,
"grad_norm": 0.12403966425319882,
"learning_rate": 3.7070806498676025e-05,
"loss": 0.1111,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.042274922132492065,
"step": 1340,
"valid_targets_mean": 9153.2,
"valid_targets_min": 4013
},
{
"epoch": 1.29088,
"grad_norm": 0.11766905420453012,
"learning_rate": 3.7035802397963625e-05,
"loss": 0.1071,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0366162545979023,
"step": 1345,
"valid_targets_mean": 8794.9,
"valid_targets_min": 1738
},
{
"epoch": 1.29568,
"grad_norm": 0.12007586908411454,
"learning_rate": 3.700060711768302e-05,
"loss": 0.1061,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.033832572400569916,
"step": 1350,
"valid_targets_mean": 9080.9,
"valid_targets_min": 3899
},
{
"epoch": 1.30048,
"grad_norm": 0.11667979309051224,
"learning_rate": 3.696522105280348e-05,
"loss": 0.1073,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.036710452288389206,
"step": 1355,
"valid_targets_mean": 9003.8,
"valid_targets_min": 2184
},
{
"epoch": 1.30528,
"grad_norm": 0.1263624995125729,
"learning_rate": 3.6929644600435303e-05,
"loss": 0.1084,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03441833704710007,
"step": 1360,
"valid_targets_mean": 8348.5,
"valid_targets_min": 2806
},
{
"epoch": 1.3100800000000001,
"grad_norm": 0.11740982313324688,
"learning_rate": 3.689387815982536e-05,
"loss": 0.1063,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.038560301065444946,
"step": 1365,
"valid_targets_mean": 9448.6,
"valid_targets_min": 1822
},
{
"epoch": 1.31488,
"grad_norm": 0.1252151515739968,
"learning_rate": 3.6857922132352617e-05,
"loss": 0.1116,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03624051809310913,
"step": 1370,
"valid_targets_mean": 8632.9,
"valid_targets_min": 2701
},
{
"epoch": 1.31968,
"grad_norm": 0.13381310745789513,
"learning_rate": 3.6821776921523615e-05,
"loss": 0.103,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0364258736371994,
"step": 1375,
"valid_targets_mean": 8644.5,
"valid_targets_min": 4506
},
{
"epoch": 1.3244799999999999,
"grad_norm": 0.1264214384761902,
"learning_rate": 3.678544293296797e-05,
"loss": 0.1052,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.034762680530548096,
"step": 1380,
"valid_targets_mean": 8907.5,
"valid_targets_min": 3498
},
{
"epoch": 1.32928,
"grad_norm": 0.11949522852717019,
"learning_rate": 3.674892057443378e-05,
"loss": 0.1066,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03189823776483536,
"step": 1385,
"valid_targets_mean": 8336.2,
"valid_targets_min": 2895
},
{
"epoch": 1.33408,
"grad_norm": 0.12933718554974194,
"learning_rate": 3.671221025578309e-05,
"loss": 0.1069,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03692135214805603,
"step": 1390,
"valid_targets_mean": 8362.5,
"valid_targets_min": 2327
},
{
"epoch": 1.33888,
"grad_norm": 0.1370376515161672,
"learning_rate": 3.6675312388987274e-05,
"loss": 0.1085,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03446727246046066,
"step": 1395,
"valid_targets_mean": 8036.2,
"valid_targets_min": 3531
},
{
"epoch": 1.34368,
"grad_norm": 0.11519564170999727,
"learning_rate": 3.663822738812241e-05,
"loss": 0.1033,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03143679350614548,
"step": 1400,
"valid_targets_mean": 8900.0,
"valid_targets_min": 4505
},
{
"epoch": 1.34848,
"grad_norm": 0.13667160069855397,
"learning_rate": 3.660095566936462e-05,
"loss": 0.107,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04038439691066742,
"step": 1405,
"valid_targets_mean": 8623.7,
"valid_targets_min": 2516
},
{
"epoch": 1.35328,
"grad_norm": 0.11628807563727038,
"learning_rate": 3.656349765098546e-05,
"loss": 0.103,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03632277250289917,
"step": 1410,
"valid_targets_mean": 9662.0,
"valid_targets_min": 5223
},
{
"epoch": 1.35808,
"grad_norm": 0.12165285738799775,
"learning_rate": 3.652585375334714e-05,
"loss": 0.1052,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03766203299164772,
"step": 1415,
"valid_targets_mean": 9023.7,
"valid_targets_min": 2526
},
{
"epoch": 1.36288,
"grad_norm": 0.1210936758517175,
"learning_rate": 3.648802439889785e-05,
"loss": 0.107,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03593523055315018,
"step": 1420,
"valid_targets_mean": 8797.6,
"valid_targets_min": 1723
},
{
"epoch": 1.36768,
"grad_norm": 0.12212797482243638,
"learning_rate": 3.645001001216705e-05,
"loss": 0.1087,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03319096192717552,
"step": 1425,
"valid_targets_mean": 8514.3,
"valid_targets_min": 1460
},
{
"epoch": 1.37248,
"grad_norm": 0.12043836652635324,
"learning_rate": 3.641181101976065e-05,
"loss": 0.1074,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.039879005402326584,
"step": 1430,
"valid_targets_mean": 9830.4,
"valid_targets_min": 6223
},
{
"epoch": 1.37728,
"grad_norm": 0.12419659997953224,
"learning_rate": 3.637342785035624e-05,
"loss": 0.1069,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03451387211680412,
"step": 1435,
"valid_targets_mean": 7784.2,
"valid_targets_min": 3446
},
{
"epoch": 1.38208,
"grad_norm": 0.12369177870382055,
"learning_rate": 3.633486093469829e-05,
"loss": 0.1023,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03320624306797981,
"step": 1440,
"valid_targets_mean": 8363.7,
"valid_targets_min": 2814
},
{
"epoch": 1.3868800000000001,
"grad_norm": 0.11909211402446875,
"learning_rate": 3.629611070559333e-05,
"loss": 0.1054,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03433164581656456,
"step": 1445,
"valid_targets_mean": 8183.8,
"valid_targets_min": 3490
},
{
"epoch": 1.39168,
"grad_norm": 0.11691264105478555,
"learning_rate": 3.625717759790506e-05,
"loss": 0.1038,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0365409217774868,
"step": 1450,
"valid_targets_mean": 9171.9,
"valid_targets_min": 4784
},
{
"epoch": 1.39648,
"grad_norm": 0.125375436081025,
"learning_rate": 3.621806204854947e-05,
"loss": 0.1049,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03655450791120529,
"step": 1455,
"valid_targets_mean": 8703.1,
"valid_targets_min": 4353
},
{
"epoch": 1.40128,
"grad_norm": 0.1286467880870536,
"learning_rate": 3.617876449648998e-05,
"loss": 0.1055,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.039029087871313095,
"step": 1460,
"valid_targets_mean": 9403.0,
"valid_targets_min": 3483
},
{
"epoch": 1.40608,
"grad_norm": 0.11716905685866259,
"learning_rate": 3.613928538273247e-05,
"loss": 0.1045,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.035078015178442,
"step": 1465,
"valid_targets_mean": 9139.4,
"valid_targets_min": 3472
},
{
"epoch": 1.4108800000000001,
"grad_norm": 0.11672670553448981,
"learning_rate": 3.609962515032034e-05,
"loss": 0.1038,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03533966466784477,
"step": 1470,
"valid_targets_mean": 9032.0,
"valid_targets_min": 1767
},
{
"epoch": 1.41568,
"grad_norm": 0.1243509687324732,
"learning_rate": 3.605978424432954e-05,
"loss": 0.1027,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03651345893740654,
"step": 1475,
"valid_targets_mean": 8722.7,
"valid_targets_min": 2884
},
{
"epoch": 1.42048,
"grad_norm": 0.12648765813571894,
"learning_rate": 3.601976311186361e-05,
"loss": 0.1071,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03581051528453827,
"step": 1480,
"valid_targets_mean": 8290.9,
"valid_targets_min": 2516
},
{
"epoch": 1.4252799999999999,
"grad_norm": 0.11343351700255543,
"learning_rate": 3.597956220204861e-05,
"loss": 0.1029,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.036967843770980835,
"step": 1485,
"valid_targets_mean": 9481.8,
"valid_targets_min": 2996
},
{
"epoch": 1.43008,
"grad_norm": 0.1177270154654175,
"learning_rate": 3.5939181966028084e-05,
"loss": 0.1058,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.036307480186223984,
"step": 1490,
"valid_targets_mean": 9119.7,
"valid_targets_min": 2089
},
{
"epoch": 1.43488,
"grad_norm": 0.11948223416122511,
"learning_rate": 3.589862285695804e-05,
"loss": 0.1055,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03213457390666008,
"step": 1495,
"valid_targets_mean": 8838.8,
"valid_targets_min": 3712
},
{
"epoch": 1.43968,
"grad_norm": 0.1211211334641555,
"learning_rate": 3.585788533000184e-05,
"loss": 0.1025,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03254202753305435,
"step": 1500,
"valid_targets_mean": 8756.7,
"valid_targets_min": 3942
},
{
"epoch": 1.44448,
"grad_norm": 0.11573696505962047,
"learning_rate": 3.581696984232508e-05,
"loss": 0.1042,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.027192670851945877,
"step": 1505,
"valid_targets_mean": 7469.8,
"valid_targets_min": 3106
},
{
"epoch": 1.44928,
"grad_norm": 0.12070460723365516,
"learning_rate": 3.5775876853090465e-05,
"loss": 0.1049,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03165585547685623,
"step": 1510,
"valid_targets_mean": 8158.2,
"valid_targets_min": 2105
},
{
"epoch": 1.45408,
"grad_norm": 0.11620223694923805,
"learning_rate": 3.5734606823452686e-05,
"loss": 0.1047,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.037208959460258484,
"step": 1515,
"valid_targets_mean": 9556.5,
"valid_targets_min": 4435
},
{
"epoch": 1.45888,
"grad_norm": 0.11920297505293288,
"learning_rate": 3.569316021655319e-05,
"loss": 0.1012,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02987070195376873,
"step": 1520,
"valid_targets_mean": 8496.3,
"valid_targets_min": 1915
},
{
"epoch": 1.46368,
"grad_norm": 0.1268442978445187,
"learning_rate": 3.565153749751505e-05,
"loss": 0.1041,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03451787680387497,
"step": 1525,
"valid_targets_mean": 9130.9,
"valid_targets_min": 2246
},
{
"epoch": 1.46848,
"grad_norm": 0.11701707630340304,
"learning_rate": 3.5609739133437666e-05,
"loss": 0.1038,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.038270652294158936,
"step": 1530,
"valid_targets_mean": 9155.3,
"valid_targets_min": 2324
},
{
"epoch": 1.47328,
"grad_norm": 0.1282421956144873,
"learning_rate": 3.55677655933916e-05,
"loss": 0.1025,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03175165131688118,
"step": 1535,
"valid_targets_mean": 8443.1,
"valid_targets_min": 2640
},
{
"epoch": 1.47808,
"grad_norm": 0.11886359147221487,
"learning_rate": 3.5525617348413265e-05,
"loss": 0.1008,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.035145074129104614,
"step": 1540,
"valid_targets_mean": 9429.3,
"valid_targets_min": 4368
},
{
"epoch": 1.48288,
"grad_norm": 0.11951433549636696,
"learning_rate": 3.5483294871499646e-05,
"loss": 0.1009,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.032362401485443115,
"step": 1545,
"valid_targets_mean": 8555.6,
"valid_targets_min": 1834
},
{
"epoch": 1.4876800000000001,
"grad_norm": 0.1342430527003154,
"learning_rate": 3.544079863760302e-05,
"loss": 0.1009,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03826196864247322,
"step": 1550,
"valid_targets_mean": 8434.8,
"valid_targets_min": 2927
},
{
"epoch": 1.49248,
"grad_norm": 0.1212927589438056,
"learning_rate": 3.5398129123625565e-05,
"loss": 0.1042,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03314611315727234,
"step": 1555,
"valid_targets_mean": 8709.2,
"valid_targets_min": 3627
},
{
"epoch": 1.49728,
"grad_norm": 0.1259979005913219,
"learning_rate": 3.535528680841408e-05,
"loss": 0.1005,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03330939635634422,
"step": 1560,
"valid_targets_mean": 9163.6,
"valid_targets_min": 3883
},
{
"epoch": 1.5020799999999999,
"grad_norm": 0.12508394927198732,
"learning_rate": 3.5312272172754566e-05,
"loss": 0.1007,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03124111518263817,
"step": 1565,
"valid_targets_mean": 7667.9,
"valid_targets_min": 1721
},
{
"epoch": 1.50688,
"grad_norm": 0.11330418088972559,
"learning_rate": 3.5269085699366844e-05,
"loss": 0.1025,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03747326508164406,
"step": 1570,
"valid_targets_mean": 9535.7,
"valid_targets_min": 3502
},
{
"epoch": 1.5116800000000001,
"grad_norm": 0.1238192398134257,
"learning_rate": 3.5225727872899136e-05,
"loss": 0.1052,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03966061398386955,
"step": 1575,
"valid_targets_mean": 9409.5,
"valid_targets_min": 2901
},
{
"epoch": 1.51648,
"grad_norm": 0.12732035071816244,
"learning_rate": 3.518219917992262e-05,
"loss": 0.1007,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04096482694149017,
"step": 1580,
"valid_targets_mean": 9869.8,
"valid_targets_min": 4770
},
{
"epoch": 1.52128,
"grad_norm": 0.1342131928296109,
"learning_rate": 3.5138500108926e-05,
"loss": 0.1022,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03232832998037338,
"step": 1585,
"valid_targets_mean": 7960.3,
"valid_targets_min": 1879
},
{
"epoch": 1.5260799999999999,
"grad_norm": 0.1279082191084901,
"learning_rate": 3.509463115030995e-05,
"loss": 0.1003,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.033002547919750214,
"step": 1590,
"valid_targets_mean": 8454.8,
"valid_targets_min": 1940
},
{
"epoch": 1.53088,
"grad_norm": 0.2811577290255808,
"learning_rate": 3.505059279638172e-05,
"loss": 0.1005,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02976314350962639,
"step": 1595,
"valid_targets_mean": 8734.9,
"valid_targets_min": 3366
},
{
"epoch": 1.5356800000000002,
"grad_norm": 0.11869308529617718,
"learning_rate": 3.500638554134952e-05,
"loss": 0.0996,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03650416061282158,
"step": 1600,
"valid_targets_mean": 9252.2,
"valid_targets_min": 4673
},
{
"epoch": 1.54048,
"grad_norm": 0.12182529682260378,
"learning_rate": 3.4962009881317005e-05,
"loss": 0.1,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03326595202088356,
"step": 1605,
"valid_targets_mean": 8089.7,
"valid_targets_min": 2269
},
{
"epoch": 1.54528,
"grad_norm": 0.11767713809063114,
"learning_rate": 3.491746631427772e-05,
"loss": 0.102,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04178375005722046,
"step": 1610,
"valid_targets_mean": 9172.2,
"valid_targets_min": 2496
},
{
"epoch": 1.55008,
"grad_norm": 0.13558879371333668,
"learning_rate": 3.487275534010948e-05,
"loss": 0.1007,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.034719523042440414,
"step": 1615,
"valid_targets_mean": 8640.8,
"valid_targets_min": 2299
},
{
"epoch": 1.55488,
"grad_norm": 0.11731890716900249,
"learning_rate": 3.482787746056881e-05,
"loss": 0.099,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03394527733325958,
"step": 1620,
"valid_targets_mean": 9216.6,
"valid_targets_min": 3766
},
{
"epoch": 1.55968,
"grad_norm": 0.11494354049312823,
"learning_rate": 3.4782833179285256e-05,
"loss": 0.0997,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03388223424553871,
"step": 1625,
"valid_targets_mean": 8900.3,
"valid_targets_min": 3332
},
{
"epoch": 1.56448,
"grad_norm": 0.10943738571395106,
"learning_rate": 3.473762300175578e-05,
"loss": 0.0999,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.030476726591587067,
"step": 1630,
"valid_targets_mean": 8088.4,
"valid_targets_min": 3008
},
{
"epoch": 1.56928,
"grad_norm": 0.11506597550483152,
"learning_rate": 3.469224743533906e-05,
"loss": 0.098,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.031209899112582207,
"step": 1635,
"valid_targets_mean": 9256.1,
"valid_targets_min": 4635
},
{
"epoch": 1.57408,
"grad_norm": 0.13082551295998132,
"learning_rate": 3.464670698924981e-05,
"loss": 0.1008,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03382524102926254,
"step": 1640,
"valid_targets_mean": 8714.7,
"valid_targets_min": 3433
},
{
"epoch": 1.5788799999999998,
"grad_norm": 0.12427360078336991,
"learning_rate": 3.4601002174553055e-05,
"loss": 0.1038,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03731769323348999,
"step": 1645,
"valid_targets_mean": 8702.7,
"valid_targets_min": 2481
},
{
"epoch": 1.58368,
"grad_norm": 0.11446263987092861,
"learning_rate": 3.45551335041584e-05,
"loss": 0.1004,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.034496426582336426,
"step": 1650,
"valid_targets_mean": 9184.0,
"valid_targets_min": 3710
},
{
"epoch": 1.5884800000000001,
"grad_norm": 0.12739756370428226,
"learning_rate": 3.4509101492814286e-05,
"loss": 0.0994,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.034381356090307236,
"step": 1655,
"valid_targets_mean": 8748.2,
"valid_targets_min": 1423
},
{
"epoch": 1.59328,
"grad_norm": 0.11751460240058818,
"learning_rate": 3.446290665710219e-05,
"loss": 0.1019,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.029714802280068398,
"step": 1660,
"valid_targets_mean": 7678.1,
"valid_targets_min": 2099
},
{
"epoch": 1.59808,
"grad_norm": 0.11814198326450993,
"learning_rate": 3.441654951543085e-05,
"loss": 0.0992,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.036534734070301056,
"step": 1665,
"valid_targets_mean": 9461.3,
"valid_targets_min": 4091
},
{
"epoch": 1.6028799999999999,
"grad_norm": 0.11295334978255936,
"learning_rate": 3.4370030588030425e-05,
"loss": 0.0997,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.032168176025152206,
"step": 1670,
"valid_targets_mean": 8824.2,
"valid_targets_min": 5342
},
{
"epoch": 1.60768,
"grad_norm": 0.11944262820417971,
"learning_rate": 3.432335039694669e-05,
"loss": 0.1009,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03803761303424835,
"step": 1675,
"valid_targets_mean": 8744.9,
"valid_targets_min": 1956
},
{
"epoch": 1.6124800000000001,
"grad_norm": 0.1188365242887442,
"learning_rate": 3.427650946603513e-05,
"loss": 0.0996,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.031139787286520004,
"step": 1680,
"valid_targets_mean": 8154.3,
"valid_targets_min": 1736
},
{
"epoch": 1.61728,
"grad_norm": 0.12123730509386084,
"learning_rate": 3.422950832095511e-05,
"loss": 0.0994,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03488922864198685,
"step": 1685,
"valid_targets_mean": 8890.8,
"valid_targets_min": 2762
},
{
"epoch": 1.62208,
"grad_norm": 0.12417921438454016,
"learning_rate": 3.418234748916395e-05,
"loss": 0.1001,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03286389634013176,
"step": 1690,
"valid_targets_mean": 8685.7,
"valid_targets_min": 4649
},
{
"epoch": 1.6268799999999999,
"grad_norm": 0.12427965821978078,
"learning_rate": 3.4135027499911003e-05,
"loss": 0.1015,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03643377870321274,
"step": 1695,
"valid_targets_mean": 9603.3,
"valid_targets_min": 4519
},
{
"epoch": 1.63168,
"grad_norm": 0.12379457220006589,
"learning_rate": 3.408754888423173e-05,
"loss": 0.1035,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03129050135612488,
"step": 1700,
"valid_targets_mean": 8723.2,
"valid_targets_min": 3745
},
{
"epoch": 1.6364800000000002,
"grad_norm": 0.12275475278899578,
"learning_rate": 3.403991217494172e-05,
"loss": 0.1036,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.031930018216371536,
"step": 1705,
"valid_targets_mean": 8601.5,
"valid_targets_min": 3257
},
{
"epoch": 1.64128,
"grad_norm": 0.1201804881346642,
"learning_rate": 3.3992117906630744e-05,
"loss": 0.1,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03500905632972717,
"step": 1710,
"valid_targets_mean": 9292.2,
"valid_targets_min": 2432
},
{
"epoch": 1.64608,
"grad_norm": 0.12998259303408505,
"learning_rate": 3.394416661565671e-05,
"loss": 0.0993,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03601759672164917,
"step": 1715,
"valid_targets_mean": 9329.5,
"valid_targets_min": 3473
},
{
"epoch": 1.65088,
"grad_norm": 0.15209411679668441,
"learning_rate": 3.389605884013969e-05,
"loss": 0.0997,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03493211418390274,
"step": 1720,
"valid_targets_mean": 8974.5,
"valid_targets_min": 3096
},
{
"epoch": 1.65568,
"grad_norm": 0.11967594276263603,
"learning_rate": 3.384779511995587e-05,
"loss": 0.1004,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.028926797211170197,
"step": 1725,
"valid_targets_mean": 8098.5,
"valid_targets_min": 3942
},
{
"epoch": 1.66048,
"grad_norm": 0.1263183650621345,
"learning_rate": 3.379937599673144e-05,
"loss": 0.0968,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.029895996674895287,
"step": 1730,
"valid_targets_mean": 9455.5,
"valid_targets_min": 4168
},
{
"epoch": 1.66528,
"grad_norm": 0.1116628577909989,
"learning_rate": 3.3750802013836596e-05,
"loss": 0.0961,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.029331346973776817,
"step": 1735,
"valid_targets_mean": 8593.4,
"valid_targets_min": 2814
},
{
"epoch": 1.67008,
"grad_norm": 0.11669743828129955,
"learning_rate": 3.370207371637939e-05,
"loss": 0.0981,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03486446291208267,
"step": 1740,
"valid_targets_mean": 8908.1,
"valid_targets_min": 3582
},
{
"epoch": 1.67488,
"grad_norm": 0.11206048763400174,
"learning_rate": 3.3653191651199635e-05,
"loss": 0.0973,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.029872918501496315,
"step": 1745,
"valid_targets_mean": 8751.2,
"valid_targets_min": 3097
},
{
"epoch": 1.6796799999999998,
"grad_norm": 0.12149392067550448,
"learning_rate": 3.360415636686274e-05,
"loss": 0.0992,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03125841170549393,
"step": 1750,
"valid_targets_mean": 9348.4,
"valid_targets_min": 1952
},
{
"epoch": 1.68448,
"grad_norm": 0.11409949572763738,
"learning_rate": 3.355496841365359e-05,
"loss": 0.0998,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.034153811633586884,
"step": 1755,
"valid_targets_mean": 9130.1,
"valid_targets_min": 3227
},
{
"epoch": 1.6892800000000001,
"grad_norm": 0.12180781545084879,
"learning_rate": 3.350562834357034e-05,
"loss": 0.0995,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03245352953672409,
"step": 1760,
"valid_targets_mean": 8648.5,
"valid_targets_min": 4313
},
{
"epoch": 1.69408,
"grad_norm": 0.13247571796223342,
"learning_rate": 3.345613671031827e-05,
"loss": 0.1011,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03612162172794342,
"step": 1765,
"valid_targets_mean": 8704.3,
"valid_targets_min": 4184
},
{
"epoch": 1.69888,
"grad_norm": 0.21647507224098106,
"learning_rate": 3.340649406930349e-05,
"loss": 0.0977,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.029728224501013756,
"step": 1770,
"valid_targets_mean": 8391.2,
"valid_targets_min": 1727
},
{
"epoch": 1.7036799999999999,
"grad_norm": 0.12422077040157983,
"learning_rate": 3.335670097762677e-05,
"loss": 0.0997,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.029321834444999695,
"step": 1775,
"valid_targets_mean": 8637.8,
"valid_targets_min": 1912
},
{
"epoch": 1.70848,
"grad_norm": 0.11698536286578931,
"learning_rate": 3.330675799407728e-05,
"loss": 0.1,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.032984182238578796,
"step": 1780,
"valid_targets_mean": 8554.4,
"valid_targets_min": 3850
},
{
"epoch": 1.7132800000000001,
"grad_norm": 0.12071451043408635,
"learning_rate": 3.32566656791263e-05,
"loss": 0.0989,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.030606457963585854,
"step": 1785,
"valid_targets_mean": 8076.9,
"valid_targets_min": 1413
},
{
"epoch": 1.71808,
"grad_norm": 0.12127568160825884,
"learning_rate": 3.320642459492095e-05,
"loss": 0.0953,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03138080984354019,
"step": 1790,
"valid_targets_mean": 8827.6,
"valid_targets_min": 3318
},
{
"epoch": 1.72288,
"grad_norm": 0.12309891269800873,
"learning_rate": 3.315603530527785e-05,
"loss": 0.0989,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.034938737750053406,
"step": 1795,
"valid_targets_mean": 8190.7,
"valid_targets_min": 1990
},
{
"epoch": 1.7276799999999999,
"grad_norm": 0.13448328329653705,
"learning_rate": 3.310549837567685e-05,
"loss": 0.094,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03196977078914642,
"step": 1800,
"valid_targets_mean": 8209.2,
"valid_targets_min": 4291
},
{
"epoch": 1.73248,
"grad_norm": 0.1270134755763155,
"learning_rate": 3.3054814373254615e-05,
"loss": 0.0989,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03308798000216484,
"step": 1805,
"valid_targets_mean": 9097.6,
"valid_targets_min": 3023
},
{
"epoch": 1.7372800000000002,
"grad_norm": 0.1215462716174612,
"learning_rate": 3.300398386679831e-05,
"loss": 0.097,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03231578692793846,
"step": 1810,
"valid_targets_mean": 8737.8,
"valid_targets_min": 2789
},
{
"epoch": 1.74208,
"grad_norm": 0.12659381214839838,
"learning_rate": 3.2953007426739204e-05,
"loss": 0.0994,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.030647259205579758,
"step": 1815,
"valid_targets_mean": 9287.0,
"valid_targets_min": 3191
},
{
"epoch": 1.74688,
"grad_norm": 0.12152296869764756,
"learning_rate": 3.290188562514624e-05,
"loss": 0.0973,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02994205430150032,
"step": 1820,
"valid_targets_mean": 8389.3,
"valid_targets_min": 4479
},
{
"epoch": 1.75168,
"grad_norm": 0.11579730176913727,
"learning_rate": 3.285061903571968e-05,
"loss": 0.0976,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03409838303923607,
"step": 1825,
"valid_targets_mean": 8725.6,
"valid_targets_min": 3671
},
{
"epoch": 1.75648,
"grad_norm": 0.12042202731658365,
"learning_rate": 3.27992082337846e-05,
"loss": 0.0944,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03129231929779053,
"step": 1830,
"valid_targets_mean": 8376.2,
"valid_targets_min": 2786
},
{
"epoch": 1.76128,
"grad_norm": 0.1150574556332984,
"learning_rate": 3.274765379628447e-05,
"loss": 0.0935,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03116718865931034,
"step": 1835,
"valid_targets_mean": 9754.7,
"valid_targets_min": 2668
},
{
"epoch": 1.76608,
"grad_norm": 0.12221087122396483,
"learning_rate": 3.2695956301774664e-05,
"loss": 0.0993,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03059461899101734,
"step": 1840,
"valid_targets_mean": 8807.2,
"valid_targets_min": 1560
},
{
"epoch": 1.77088,
"grad_norm": 0.12550586828813198,
"learning_rate": 3.264411633041598e-05,
"loss": 0.0996,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03288565203547478,
"step": 1845,
"valid_targets_mean": 8430.9,
"valid_targets_min": 4166
},
{
"epoch": 1.77568,
"grad_norm": 0.11800390703235397,
"learning_rate": 3.259213446396812e-05,
"loss": 0.0971,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03617793321609497,
"step": 1850,
"valid_targets_mean": 8808.0,
"valid_targets_min": 2379
},
{
"epoch": 1.7804799999999998,
"grad_norm": 0.12065501117992328,
"learning_rate": 3.254001128578317e-05,
"loss": 0.0971,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03944634646177292,
"step": 1855,
"valid_targets_mean": 9181.4,
"valid_targets_min": 3240
},
{
"epoch": 1.78528,
"grad_norm": 0.12815781801241774,
"learning_rate": 3.2487747380799036e-05,
"loss": 0.0973,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03340938687324524,
"step": 1860,
"valid_targets_mean": 9103.5,
"valid_targets_min": 5535
},
{
"epoch": 1.7900800000000001,
"grad_norm": 0.12256539621255265,
"learning_rate": 3.243534333553291e-05,
"loss": 0.096,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03244269639253616,
"step": 1865,
"valid_targets_mean": 9035.9,
"valid_targets_min": 3874
},
{
"epoch": 1.79488,
"grad_norm": 0.11939887366602382,
"learning_rate": 3.2382799738074635e-05,
"loss": 0.0963,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.036362893879413605,
"step": 1870,
"valid_targets_mean": 9146.4,
"valid_targets_min": 3073
},
{
"epoch": 1.79968,
"grad_norm": 0.11295140221263837,
"learning_rate": 3.2330117178080184e-05,
"loss": 0.0957,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03275471180677414,
"step": 1875,
"valid_targets_mean": 9356.5,
"valid_targets_min": 3597
},
{
"epoch": 1.8044799999999999,
"grad_norm": 0.11596482995260982,
"learning_rate": 3.227729624676497e-05,
"loss": 0.0991,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.033212386071681976,
"step": 1880,
"valid_targets_mean": 8404.9,
"valid_targets_min": 1753
},
{
"epoch": 1.80928,
"grad_norm": 0.12299614142264025,
"learning_rate": 3.222433753689724e-05,
"loss": 0.0954,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.030806001275777817,
"step": 1885,
"valid_targets_mean": 9172.8,
"valid_targets_min": 2605
},
{
"epoch": 1.8140800000000001,
"grad_norm": 0.12294732258255374,
"learning_rate": 3.2171241642791443e-05,
"loss": 0.0963,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03270886838436127,
"step": 1890,
"valid_targets_mean": 8817.4,
"valid_targets_min": 3170
},
{
"epoch": 1.81888,
"grad_norm": 0.12454651137241947,
"learning_rate": 3.211800916030152e-05,
"loss": 0.0964,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03188232332468033,
"step": 1895,
"valid_targets_mean": 8884.1,
"valid_targets_min": 3236
},
{
"epoch": 1.82368,
"grad_norm": 0.11875714790732037,
"learning_rate": 3.206464068681424e-05,
"loss": 0.0962,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03125854209065437,
"step": 1900,
"valid_targets_mean": 8837.4,
"valid_targets_min": 3141
},
{
"epoch": 1.8284799999999999,
"grad_norm": 0.25615170544022126,
"learning_rate": 3.20111368212425e-05,
"loss": 0.0972,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.031216248869895935,
"step": 1905,
"valid_targets_mean": 8927.4,
"valid_targets_min": 2351
},
{
"epoch": 1.83328,
"grad_norm": 0.11553048251166381,
"learning_rate": 3.19574981640186e-05,
"loss": 0.097,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.032985836267471313,
"step": 1910,
"valid_targets_mean": 9137.7,
"valid_targets_min": 2457
},
{
"epoch": 1.8380800000000002,
"grad_norm": 0.12332033201339215,
"learning_rate": 3.1903725317087495e-05,
"loss": 0.0962,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02826140820980072,
"step": 1915,
"valid_targets_mean": 7582.6,
"valid_targets_min": 1979
},
{
"epoch": 1.84288,
"grad_norm": 0.12373198100671594,
"learning_rate": 3.184981888390003e-05,
"loss": 0.0943,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03438425809144974,
"step": 1920,
"valid_targets_mean": 8750.5,
"valid_targets_min": 3715
},
{
"epoch": 1.84768,
"grad_norm": 0.11898830073691476,
"learning_rate": 3.1795779469406226e-05,
"loss": 0.0996,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.027855921536684036,
"step": 1925,
"valid_targets_mean": 8388.7,
"valid_targets_min": 3606
},
{
"epoch": 1.85248,
"grad_norm": 0.13049198537601311,
"learning_rate": 3.174160768004842e-05,
"loss": 0.0938,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03077923133969307,
"step": 1930,
"valid_targets_mean": 9521.2,
"valid_targets_min": 3478
},
{
"epoch": 1.85728,
"grad_norm": 0.12890383965255006,
"learning_rate": 3.168730412375449e-05,
"loss": 0.0954,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.033480048179626465,
"step": 1935,
"valid_targets_mean": 8513.8,
"valid_targets_min": 2941
},
{
"epoch": 1.86208,
"grad_norm": 0.1259489564584358,
"learning_rate": 3.1632869409931036e-05,
"loss": 0.096,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03304038196802139,
"step": 1940,
"valid_targets_mean": 8453.8,
"valid_targets_min": 3095
},
{
"epoch": 1.86688,
"grad_norm": 0.12379490782070443,
"learning_rate": 3.1578304149456544e-05,
"loss": 0.0935,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02992902509868145,
"step": 1945,
"valid_targets_mean": 8997.7,
"valid_targets_min": 2944
},
{
"epoch": 1.87168,
"grad_norm": 0.1908649386565199,
"learning_rate": 3.1523608954674524e-05,
"loss": 0.0985,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.030526556074619293,
"step": 1950,
"valid_targets_mean": 8728.9,
"valid_targets_min": 3733
},
{
"epoch": 1.87648,
"grad_norm": 0.12058817025819538,
"learning_rate": 3.1468784439386614e-05,
"loss": 0.0978,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.029100410640239716,
"step": 1955,
"valid_targets_mean": 7976.5,
"valid_targets_min": 1588
},
{
"epoch": 1.8812799999999998,
"grad_norm": 0.12374514028101315,
"learning_rate": 3.141383121884576e-05,
"loss": 0.0956,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.030075032263994217,
"step": 1960,
"valid_targets_mean": 9350.9,
"valid_targets_min": 2993
},
{
"epoch": 1.88608,
"grad_norm": 0.12949723183843131,
"learning_rate": 3.1358749909749214e-05,
"loss": 0.0957,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02782047912478447,
"step": 1965,
"valid_targets_mean": 8918.0,
"valid_targets_min": 4011
},
{
"epoch": 1.8908800000000001,
"grad_norm": 0.12321752636472717,
"learning_rate": 3.1303541130231703e-05,
"loss": 0.0956,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03179875388741493,
"step": 1970,
"valid_targets_mean": 8427.1,
"valid_targets_min": 2242
},
{
"epoch": 1.89568,
"grad_norm": 0.1250357323229381,
"learning_rate": 3.1248205499858446e-05,
"loss": 0.0974,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.031728826463222504,
"step": 1975,
"valid_targets_mean": 8332.0,
"valid_targets_min": 1698
},
{
"epoch": 1.90048,
"grad_norm": 0.1269808845116901,
"learning_rate": 3.119274363961821e-05,
"loss": 0.0976,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.030242368578910828,
"step": 1980,
"valid_targets_mean": 8013.0,
"valid_targets_min": 2329
},
{
"epoch": 1.9052799999999999,
"grad_norm": 0.12594906129488526,
"learning_rate": 3.113715617191634e-05,
"loss": 0.0956,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.033120714128017426,
"step": 1985,
"valid_targets_mean": 9525.1,
"valid_targets_min": 5176
},
{
"epoch": 1.91008,
"grad_norm": 0.1128437524239124,
"learning_rate": 3.1081443720567785e-05,
"loss": 0.0976,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03407108783721924,
"step": 1990,
"valid_targets_mean": 8913.7,
"valid_targets_min": 2222
},
{
"epoch": 1.9148800000000001,
"grad_norm": 0.12271441054409966,
"learning_rate": 3.102560691079007e-05,
"loss": 0.0944,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03202490508556366,
"step": 1995,
"valid_targets_mean": 8219.6,
"valid_targets_min": 4856
},
{
"epoch": 1.91968,
"grad_norm": 0.11928104900985406,
"learning_rate": 3.0969646369196307e-05,
"loss": 0.0935,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03154480457305908,
"step": 2000,
"valid_targets_mean": 7679.9,
"valid_targets_min": 2327
},
{
"epoch": 1.92448,
"grad_norm": 0.11764578388415199,
"learning_rate": 3.0913562723788174e-05,
"loss": 0.0937,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.028950994834303856,
"step": 2005,
"valid_targets_mean": 8590.5,
"valid_targets_min": 2687
},
{
"epoch": 1.9292799999999999,
"grad_norm": 0.11959529477268145,
"learning_rate": 3.085735660394881e-05,
"loss": 0.096,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03188043832778931,
"step": 2010,
"valid_targets_mean": 8712.7,
"valid_targets_min": 2239
},
{
"epoch": 1.93408,
"grad_norm": 0.12288064731447748,
"learning_rate": 3.080102864043581e-05,
"loss": 0.0953,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03270117938518524,
"step": 2015,
"valid_targets_mean": 8825.5,
"valid_targets_min": 2184
},
{
"epoch": 1.9388800000000002,
"grad_norm": 0.12062672309603491,
"learning_rate": 3.074457946537413e-05,
"loss": 0.0947,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03260117769241333,
"step": 2020,
"valid_targets_mean": 8145.7,
"valid_targets_min": 3013
},
{
"epoch": 1.94368,
"grad_norm": 0.11717401223355793,
"learning_rate": 3.068800971224898e-05,
"loss": 0.0938,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.030992349609732628,
"step": 2025,
"valid_targets_mean": 8825.3,
"valid_targets_min": 1526
},
{
"epoch": 1.94848,
"grad_norm": 0.11964450711810551,
"learning_rate": 3.0631320015898735e-05,
"loss": 0.0949,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03208611160516739,
"step": 2030,
"valid_targets_mean": 9341.5,
"valid_targets_min": 4514
},
{
"epoch": 1.95328,
"grad_norm": 0.1300777102273075,
"learning_rate": 3.057451101250778e-05,
"loss": 0.0926,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.027757877483963966,
"step": 2035,
"valid_targets_mean": 8905.0,
"valid_targets_min": 4482
},
{
"epoch": 1.95808,
"grad_norm": 0.13016926678324173,
"learning_rate": 3.051758333959941e-05,
"loss": 0.0938,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.034215047955513,
"step": 2040,
"valid_targets_mean": 9087.2,
"valid_targets_min": 4268
},
{
"epoch": 1.96288,
"grad_norm": 0.13459529117746524,
"learning_rate": 3.046053763602865e-05,
"loss": 0.097,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03139539062976837,
"step": 2045,
"valid_targets_mean": 7871.2,
"valid_targets_min": 2346
},
{
"epoch": 1.96768,
"grad_norm": 0.11324489273915117,
"learning_rate": 3.0403374541975078e-05,
"loss": 0.0928,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.029846232384443283,
"step": 2050,
"valid_targets_mean": 8258.1,
"valid_targets_min": 2241
},
{
"epoch": 1.97248,
"grad_norm": 0.11489197140280931,
"learning_rate": 3.034609469893567e-05,
"loss": 0.0929,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.032914385199546814,
"step": 2055,
"valid_targets_mean": 9554.0,
"valid_targets_min": 4598
},
{
"epoch": 1.97728,
"grad_norm": 0.11581208074394174,
"learning_rate": 3.028869874971758e-05,
"loss": 0.0959,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03447406738996506,
"step": 2060,
"valid_targets_mean": 8354.8,
"valid_targets_min": 2758
},
{
"epoch": 1.9820799999999998,
"grad_norm": 0.11852330994590476,
"learning_rate": 3.0231187338430944e-05,
"loss": 0.0931,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03049747459590435,
"step": 2065,
"valid_targets_mean": 8763.3,
"valid_targets_min": 3186
},
{
"epoch": 1.98688,
"grad_norm": 0.12012402161638631,
"learning_rate": 3.0173561110481606e-05,
"loss": 0.0943,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.030883774161338806,
"step": 2070,
"valid_targets_mean": 9102.0,
"valid_targets_min": 3763
},
{
"epoch": 1.9916800000000001,
"grad_norm": 0.12029947880726818,
"learning_rate": 3.011582071256394e-05,
"loss": 0.0938,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03472603112459183,
"step": 2075,
"valid_targets_mean": 9187.4,
"valid_targets_min": 4685
},
{
"epoch": 1.99648,
"grad_norm": 0.12080815720093505,
"learning_rate": 3.0057966792653547e-05,
"loss": 0.0956,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03140140324831009,
"step": 2080,
"valid_targets_mean": 7961.4,
"valid_targets_min": 2523
},
{
"epoch": 2.00096,
"grad_norm": 0.127348881807781,
"learning_rate": 3.0000000000000004e-05,
"loss": 0.0898,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.029651004821062088,
"step": 2085,
"valid_targets_mean": 9488.9,
"valid_targets_min": 2667
},
{
"epoch": 2.00576,
"grad_norm": 0.12239161231781547,
"learning_rate": 2.9941920985119562e-05,
"loss": 0.0878,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02701239474117756,
"step": 2090,
"valid_targets_mean": 8532.2,
"valid_targets_min": 2701
},
{
"epoch": 2.01056,
"grad_norm": 0.11882885393990238,
"learning_rate": 2.988373039978786e-05,
"loss": 0.0868,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03091384470462799,
"step": 2095,
"valid_targets_mean": 9679.6,
"valid_targets_min": 2730
},
{
"epoch": 2.01536,
"grad_norm": 0.11563223856575051,
"learning_rate": 2.98254288970326e-05,
"loss": 0.0863,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0300716795027256,
"step": 2100,
"valid_targets_mean": 8815.1,
"valid_targets_min": 2632
},
{
"epoch": 2.02016,
"grad_norm": 0.12238216828812892,
"learning_rate": 2.9767017131126245e-05,
"loss": 0.0851,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.031115412712097168,
"step": 2105,
"valid_targets_mean": 9428.0,
"valid_targets_min": 4481
},
{
"epoch": 2.02496,
"grad_norm": 0.11820045344397803,
"learning_rate": 2.9708495757578633e-05,
"loss": 0.0855,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0273810513317585,
"step": 2110,
"valid_targets_mean": 8535.9,
"valid_targets_min": 3766
},
{
"epoch": 2.02976,
"grad_norm": 0.110408263933541,
"learning_rate": 2.964986543312964e-05,
"loss": 0.0866,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02771226316690445,
"step": 2115,
"valid_targets_mean": 8563.7,
"valid_targets_min": 2594
},
{
"epoch": 2.03456,
"grad_norm": 0.12029390455853219,
"learning_rate": 2.9591126815741832e-05,
"loss": 0.0869,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03002401813864708,
"step": 2120,
"valid_targets_mean": 8298.8,
"valid_targets_min": 2022
},
{
"epoch": 2.03936,
"grad_norm": 0.11511228961091312,
"learning_rate": 2.953228056459305e-05,
"loss": 0.0849,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.026876386255025864,
"step": 2125,
"valid_targets_mean": 9043.5,
"valid_targets_min": 3188
},
{
"epoch": 2.04416,
"grad_norm": 0.1226523942167117,
"learning_rate": 2.947332734006903e-05,
"loss": 0.0866,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.026805460453033447,
"step": 2130,
"valid_targets_mean": 8803.2,
"valid_targets_min": 3904
},
{
"epoch": 2.04896,
"grad_norm": 0.11684267393301566,
"learning_rate": 2.9414267803755988e-05,
"loss": 0.0896,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03486183285713196,
"step": 2135,
"valid_targets_mean": 9706.5,
"valid_targets_min": 3528
},
{
"epoch": 2.05376,
"grad_norm": 0.11633157562826041,
"learning_rate": 2.9355102618433197e-05,
"loss": 0.0867,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02780848927795887,
"step": 2140,
"valid_targets_mean": 8743.6,
"valid_targets_min": 2084
},
{
"epoch": 2.05856,
"grad_norm": 0.1176794789427386,
"learning_rate": 2.929583244806553e-05,
"loss": 0.0864,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.030458780005574226,
"step": 2145,
"valid_targets_mean": 7875.6,
"valid_targets_min": 1516
},
{
"epoch": 2.06336,
"grad_norm": 0.11576596805179132,
"learning_rate": 2.9236457957796047e-05,
"loss": 0.0881,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.025129785761237144,
"step": 2150,
"valid_targets_mean": 8653.1,
"valid_targets_min": 1776
},
{
"epoch": 2.0681599999999998,
"grad_norm": 0.1125861546534315,
"learning_rate": 2.9176979813938494e-05,
"loss": 0.0847,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.030581803992390633,
"step": 2155,
"valid_targets_mean": 7886.0,
"valid_targets_min": 3848
},
{
"epoch": 2.07296,
"grad_norm": 0.11990337393515425,
"learning_rate": 2.9117398683969857e-05,
"loss": 0.0897,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02741706185042858,
"step": 2160,
"valid_targets_mean": 8171.0,
"valid_targets_min": 1914
},
{
"epoch": 2.07776,
"grad_norm": 0.12242894662914258,
"learning_rate": 2.9057715236522833e-05,
"loss": 0.0877,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.029523633420467377,
"step": 2165,
"valid_targets_mean": 8559.4,
"valid_targets_min": 3236
},
{
"epoch": 2.08256,
"grad_norm": 0.1241427713541584,
"learning_rate": 2.899793014137836e-05,
"loss": 0.0863,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.030984241515398026,
"step": 2170,
"valid_targets_mean": 9196.1,
"valid_targets_min": 3004
},
{
"epoch": 2.08736,
"grad_norm": 0.12063838069741276,
"learning_rate": 2.8938044069458094e-05,
"loss": 0.0855,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.028892911970615387,
"step": 2175,
"valid_targets_mean": 8572.5,
"valid_targets_min": 3225
},
{
"epoch": 2.09216,
"grad_norm": 0.11160240696578047,
"learning_rate": 2.8878057692816877e-05,
"loss": 0.0863,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.026819078251719475,
"step": 2180,
"valid_targets_mean": 8104.5,
"valid_targets_min": 2774
},
{
"epoch": 2.09696,
"grad_norm": 0.15191956279033425,
"learning_rate": 2.8817971684635178e-05,
"loss": 0.0888,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02786080725491047,
"step": 2185,
"valid_targets_mean": 8554.4,
"valid_targets_min": 1925
},
{
"epoch": 2.10176,
"grad_norm": 0.12240055182601953,
"learning_rate": 2.8757786719211555e-05,
"loss": 0.0856,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02772444486618042,
"step": 2190,
"valid_targets_mean": 8159.0,
"valid_targets_min": 2615
},
{
"epoch": 2.10656,
"grad_norm": 0.11643689287045982,
"learning_rate": 2.8697503471955106e-05,
"loss": 0.0847,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02837887965142727,
"step": 2195,
"valid_targets_mean": 8464.4,
"valid_targets_min": 1413
},
{
"epoch": 2.11136,
"grad_norm": 0.11654047788382643,
"learning_rate": 2.8637122619377848e-05,
"loss": 0.0866,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03045256994664669,
"step": 2200,
"valid_targets_mean": 8479.0,
"valid_targets_min": 3845
},
{
"epoch": 2.11616,
"grad_norm": 0.12522178378425464,
"learning_rate": 2.8576644839087152e-05,
"loss": 0.0885,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03251127153635025,
"step": 2205,
"valid_targets_mean": 9498.2,
"valid_targets_min": 3661
},
{
"epoch": 2.12096,
"grad_norm": 0.1828803070115879,
"learning_rate": 2.8516070809778145e-05,
"loss": 0.086,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02694122865796089,
"step": 2210,
"valid_targets_mean": 8186.5,
"valid_targets_min": 2913
},
{
"epoch": 2.12576,
"grad_norm": 0.11379440969301187,
"learning_rate": 2.845540121122607e-05,
"loss": 0.0835,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02929331548511982,
"step": 2215,
"valid_targets_mean": 8543.1,
"valid_targets_min": 2580
},
{
"epoch": 2.13056,
"grad_norm": 0.13579664419486132,
"learning_rate": 2.839463672427867e-05,
"loss": 0.086,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.029128937050700188,
"step": 2220,
"valid_targets_mean": 8281.3,
"valid_targets_min": 2203
},
{
"epoch": 2.13536,
"grad_norm": 0.15179636273038324,
"learning_rate": 2.833377803084855e-05,
"loss": 0.0848,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03110337257385254,
"step": 2225,
"valid_targets_mean": 9488.6,
"valid_targets_min": 3850
},
{
"epoch": 2.14016,
"grad_norm": 0.12272951835579388,
"learning_rate": 2.8272825813905522e-05,
"loss": 0.0866,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03079194948077202,
"step": 2230,
"valid_targets_mean": 8683.3,
"valid_targets_min": 1928
},
{
"epoch": 2.14496,
"grad_norm": 0.12474318671383416,
"learning_rate": 2.8211780757468942e-05,
"loss": 0.089,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.030205946415662766,
"step": 2235,
"valid_targets_mean": 8289.2,
"valid_targets_min": 2163
},
{
"epoch": 2.14976,
"grad_norm": 0.11310821373925851,
"learning_rate": 2.8150643546600012e-05,
"loss": 0.0861,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.025783589109778404,
"step": 2240,
"valid_targets_mean": 8930.8,
"valid_targets_min": 2381
},
{
"epoch": 2.15456,
"grad_norm": 0.12359622662935445,
"learning_rate": 2.808941486739414e-05,
"loss": 0.0894,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02596352994441986,
"step": 2245,
"valid_targets_mean": 8079.3,
"valid_targets_min": 2770
},
{
"epoch": 2.15936,
"grad_norm": 0.11807904032902185,
"learning_rate": 2.80280954069732e-05,
"loss": 0.0863,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.027037806808948517,
"step": 2250,
"valid_targets_mean": 8114.3,
"valid_targets_min": 2376
},
{
"epoch": 2.16416,
"grad_norm": 0.12242403638033678,
"learning_rate": 2.7966685853477828e-05,
"loss": 0.0879,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.030830947682261467,
"step": 2255,
"valid_targets_mean": 9222.7,
"valid_targets_min": 3138
},
{
"epoch": 2.16896,
"grad_norm": 0.11760527959631821,
"learning_rate": 2.790518689605971e-05,
"loss": 0.0839,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03028050996363163,
"step": 2260,
"valid_targets_mean": 8239.4,
"valid_targets_min": 3664
},
{
"epoch": 2.17376,
"grad_norm": 0.12713317820214887,
"learning_rate": 2.7843599224873833e-05,
"loss": 0.0854,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.029034830629825592,
"step": 2265,
"valid_targets_mean": 8398.4,
"valid_targets_min": 2683
},
{
"epoch": 2.17856,
"grad_norm": 0.11448227095558705,
"learning_rate": 2.7781923531070775e-05,
"loss": 0.0831,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02563052624464035,
"step": 2270,
"valid_targets_mean": 9533.0,
"valid_targets_min": 1521
},
{
"epoch": 2.18336,
"grad_norm": 0.12163245887119671,
"learning_rate": 2.7720160506788896e-05,
"loss": 0.0847,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.026498647406697273,
"step": 2275,
"valid_targets_mean": 9146.3,
"valid_targets_min": 3145
},
{
"epoch": 2.18816,
"grad_norm": 0.1227312763442586,
"learning_rate": 2.7658310845146598e-05,
"loss": 0.0858,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03034115955233574,
"step": 2280,
"valid_targets_mean": 9096.8,
"valid_targets_min": 2617
},
{
"epoch": 2.19296,
"grad_norm": 0.13297660140986542,
"learning_rate": 2.7596375240234574e-05,
"loss": 0.0853,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.026283323764801025,
"step": 2285,
"valid_targets_mean": 8396.1,
"valid_targets_min": 1588
},
{
"epoch": 2.19776,
"grad_norm": 0.12220411513735026,
"learning_rate": 2.7534354387107975e-05,
"loss": 0.0885,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.030644144862890244,
"step": 2290,
"valid_targets_mean": 8958.4,
"valid_targets_min": 4317
},
{
"epoch": 2.20256,
"grad_norm": 0.11764379302404512,
"learning_rate": 2.747224898177862e-05,
"loss": 0.0836,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.025263972580432892,
"step": 2295,
"valid_targets_mean": 9061.1,
"valid_targets_min": 3336
},
{
"epoch": 2.20736,
"grad_norm": 0.12966871279969255,
"learning_rate": 2.7410059721207187e-05,
"loss": 0.0859,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.028944432735443115,
"step": 2300,
"valid_targets_mean": 9488.6,
"valid_targets_min": 3839
},
{
"epoch": 2.21216,
"grad_norm": 0.11142932566793738,
"learning_rate": 2.734778730329543e-05,
"loss": 0.0847,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03101763129234314,
"step": 2305,
"valid_targets_mean": 9028.5,
"valid_targets_min": 1917
},
{
"epoch": 2.21696,
"grad_norm": 0.1143112294079201,
"learning_rate": 2.7285432426878275e-05,
"loss": 0.0891,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02940632961690426,
"step": 2310,
"valid_targets_mean": 9081.0,
"valid_targets_min": 2201
},
{
"epoch": 2.22176,
"grad_norm": 0.14446948206235952,
"learning_rate": 2.7222995791716034e-05,
"loss": 0.0866,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.029054325073957443,
"step": 2315,
"valid_targets_mean": 8472.1,
"valid_targets_min": 2854
},
{
"epoch": 2.22656,
"grad_norm": 0.1298305463827391,
"learning_rate": 2.716047809848653e-05,
"loss": 0.0868,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.027578776702284813,
"step": 2320,
"valid_targets_mean": 8983.7,
"valid_targets_min": 2322
},
{
"epoch": 2.23136,
"grad_norm": 0.11734106721527403,
"learning_rate": 2.7097880048777238e-05,
"loss": 0.0883,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.026591507717967033,
"step": 2325,
"valid_targets_mean": 8910.7,
"valid_targets_min": 2719
},
{
"epoch": 2.23616,
"grad_norm": 0.1185128622335491,
"learning_rate": 2.703520234507742e-05,
"loss": 0.087,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.028162341564893723,
"step": 2330,
"valid_targets_mean": 9224.5,
"valid_targets_min": 2254
},
{
"epoch": 2.24096,
"grad_norm": 0.12387215840197503,
"learning_rate": 2.697244569077021e-05,
"loss": 0.0855,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02742118015885353,
"step": 2335,
"valid_targets_mean": 8428.2,
"valid_targets_min": 2526
},
{
"epoch": 2.24576,
"grad_norm": 0.12075017881250852,
"learning_rate": 2.6909610790124772e-05,
"loss": 0.0871,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03025822341442108,
"step": 2340,
"valid_targets_mean": 9657.5,
"valid_targets_min": 4578
},
{
"epoch": 2.25056,
"grad_norm": 0.11206154418590676,
"learning_rate": 2.684669834828835e-05,
"loss": 0.0855,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.030417874455451965,
"step": 2345,
"valid_targets_mean": 9800.4,
"valid_targets_min": 4694
},
{
"epoch": 2.25536,
"grad_norm": 0.12123597031997373,
"learning_rate": 2.6783709071278372e-05,
"loss": 0.0858,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02864830195903778,
"step": 2350,
"valid_targets_mean": 9171.4,
"valid_targets_min": 3791
},
{
"epoch": 2.26016,
"grad_norm": 0.1124147307567478,
"learning_rate": 2.6720643665974522e-05,
"loss": 0.0855,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.028500908985733986,
"step": 2355,
"valid_targets_mean": 8550.7,
"valid_targets_min": 1956
},
{
"epoch": 2.26496,
"grad_norm": 0.12143490811782527,
"learning_rate": 2.665750284011085e-05,
"loss": 0.0856,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02900022640824318,
"step": 2360,
"valid_targets_mean": 8569.2,
"valid_targets_min": 2633
},
{
"epoch": 2.2697599999999998,
"grad_norm": 0.14818249191876692,
"learning_rate": 2.6594287302267744e-05,
"loss": 0.0863,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.030275695025920868,
"step": 2365,
"valid_targets_mean": 8356.2,
"valid_targets_min": 3503
},
{
"epoch": 2.27456,
"grad_norm": 0.12193784051429168,
"learning_rate": 2.653099776186405e-05,
"loss": 0.0855,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.030562900006771088,
"step": 2370,
"valid_targets_mean": 8735.8,
"valid_targets_min": 3683
},
{
"epoch": 2.27936,
"grad_norm": 0.12820083550312378,
"learning_rate": 2.646763492914908e-05,
"loss": 0.089,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02770865336060524,
"step": 2375,
"valid_targets_mean": 8340.5,
"valid_targets_min": 3782
},
{
"epoch": 2.28416,
"grad_norm": 0.12584158181503047,
"learning_rate": 2.640419951519467e-05,
"loss": 0.0846,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.027583956718444824,
"step": 2380,
"valid_targets_mean": 8902.2,
"valid_targets_min": 2519
},
{
"epoch": 2.28896,
"grad_norm": 0.11669888252699596,
"learning_rate": 2.634069223188715e-05,
"loss": 0.084,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02490045502781868,
"step": 2385,
"valid_targets_mean": 8558.5,
"valid_targets_min": 1749
},
{
"epoch": 2.29376,
"grad_norm": 0.13839389337555474,
"learning_rate": 2.627711379191939e-05,
"loss": 0.0846,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03266286849975586,
"step": 2390,
"valid_targets_mean": 8944.8,
"valid_targets_min": 1162
},
{
"epoch": 2.29856,
"grad_norm": 0.11514986701905704,
"learning_rate": 2.621346490878281e-05,
"loss": 0.0885,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02784108743071556,
"step": 2395,
"valid_targets_mean": 8955.2,
"valid_targets_min": 3938
},
{
"epoch": 2.30336,
"grad_norm": 0.11881869791073651,
"learning_rate": 2.614974629675935e-05,
"loss": 0.092,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.023495035246014595,
"step": 2400,
"valid_targets_mean": 7342.0,
"valid_targets_min": 169
},
{
"epoch": 2.30816,
"grad_norm": 0.12360572532300317,
"learning_rate": 2.608595867091346e-05,
"loss": 0.0815,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.027920987457036972,
"step": 2405,
"valid_targets_mean": 8327.4,
"valid_targets_min": 2364
},
{
"epoch": 2.31296,
"grad_norm": 0.11715967892279636,
"learning_rate": 2.6022102747084084e-05,
"loss": 0.0842,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.027643052861094475,
"step": 2410,
"valid_targets_mean": 7846.9,
"valid_targets_min": 2577
},
{
"epoch": 2.31776,
"grad_norm": 0.12758321508927314,
"learning_rate": 2.595817924187663e-05,
"loss": 0.081,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02899922803044319,
"step": 2415,
"valid_targets_mean": 9130.7,
"valid_targets_min": 3316
},
{
"epoch": 2.32256,
"grad_norm": 0.13414710490899953,
"learning_rate": 2.589418887265489e-05,
"loss": 0.0774,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.026726992800831795,
"step": 2420,
"valid_targets_mean": 8485.5,
"valid_targets_min": 3077
},
{
"epoch": 2.32736,
"grad_norm": 0.13587055559492064,
"learning_rate": 2.5830132357533044e-05,
"loss": 0.0845,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.029106823727488518,
"step": 2425,
"valid_targets_mean": 8432.3,
"valid_targets_min": 4446
},
{
"epoch": 2.33216,
"grad_norm": 0.15493957733521915,
"learning_rate": 2.5766010415367567e-05,
"loss": 0.0813,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.022029448300600052,
"step": 2430,
"valid_targets_mean": 8394.6,
"valid_targets_min": 3922
},
{
"epoch": 2.33696,
"grad_norm": 0.13728604655180596,
"learning_rate": 2.5701823765749187e-05,
"loss": 0.0807,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.027791917324066162,
"step": 2435,
"valid_targets_mean": 8548.2,
"valid_targets_min": 4766
},
{
"epoch": 2.34176,
"grad_norm": 0.1543128408800076,
"learning_rate": 2.563757312899477e-05,
"loss": 0.0821,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.026925476267933846,
"step": 2440,
"valid_targets_mean": 8387.8,
"valid_targets_min": 2338
},
{
"epoch": 2.34656,
"grad_norm": 0.13024914354519151,
"learning_rate": 2.557325922613926e-05,
"loss": 0.0791,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02424551174044609,
"step": 2445,
"valid_targets_mean": 7773.3,
"valid_targets_min": 2357
},
{
"epoch": 2.35136,
"grad_norm": 0.11383491062887292,
"learning_rate": 2.5508882778927615e-05,
"loss": 0.0792,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02507830783724785,
"step": 2450,
"valid_targets_mean": 9141.1,
"valid_targets_min": 2616
},
{
"epoch": 2.35616,
"grad_norm": 0.1354783740772417,
"learning_rate": 2.5444444509806654e-05,
"loss": 0.0778,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02786952257156372,
"step": 2455,
"valid_targets_mean": 9109.7,
"valid_targets_min": 1796
},
{
"epoch": 2.36096,
"grad_norm": 0.12620305822721312,
"learning_rate": 2.5379945141916976e-05,
"loss": 0.0797,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.026485783979296684,
"step": 2460,
"valid_targets_mean": 8629.1,
"valid_targets_min": 1912
},
{
"epoch": 2.36576,
"grad_norm": 0.1257587782311723,
"learning_rate": 2.531538539908486e-05,
"loss": 0.0836,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03141780570149422,
"step": 2465,
"valid_targets_mean": 8329.3,
"valid_targets_min": 2077
},
{
"epoch": 2.3705600000000002,
"grad_norm": 0.12781978557050486,
"learning_rate": 2.5250766005814108e-05,
"loss": 0.083,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.026302650570869446,
"step": 2470,
"valid_targets_mean": 8031.9,
"valid_targets_min": 2063
},
{
"epoch": 2.37536,
"grad_norm": 0.12209146990464828,
"learning_rate": 2.5186087687277956e-05,
"loss": 0.0812,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.025557709857821465,
"step": 2475,
"valid_targets_mean": 8948.2,
"valid_targets_min": 5096
},
{
"epoch": 2.38016,
"grad_norm": 0.1382679318537906,
"learning_rate": 2.5121351169310887e-05,
"loss": 0.078,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.024665851145982742,
"step": 2480,
"valid_targets_mean": 8454.4,
"valid_targets_min": 2141
},
{
"epoch": 2.38496,
"grad_norm": 0.13902487378784473,
"learning_rate": 2.505655717840052e-05,
"loss": 0.0778,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.031393177807331085,
"step": 2485,
"valid_targets_mean": 8371.2,
"valid_targets_min": 1984
},
{
"epoch": 2.38976,
"grad_norm": 0.13282389888635227,
"learning_rate": 2.499170644167946e-05,
"loss": 0.078,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.024904152378439903,
"step": 2490,
"valid_targets_mean": 8406.3,
"valid_targets_min": 1938
},
{
"epoch": 2.3945600000000002,
"grad_norm": 0.1299330392423453,
"learning_rate": 2.49267996869171e-05,
"loss": 0.079,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03227228298783302,
"step": 2495,
"valid_targets_mean": 9098.1,
"valid_targets_min": 4981
},
{
"epoch": 2.39936,
"grad_norm": 0.1252546953275161,
"learning_rate": 2.486183764251151e-05,
"loss": 0.0804,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02573280595242977,
"step": 2500,
"valid_targets_mean": 8719.9,
"valid_targets_min": 2288
},
{
"epoch": 2.40416,
"grad_norm": 0.12721435122351463,
"learning_rate": 2.4796821037481215e-05,
"loss": 0.0789,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.027574259787797928,
"step": 2505,
"valid_targets_mean": 8806.6,
"valid_targets_min": 1830
},
{
"epoch": 2.40896,
"grad_norm": 0.13390795751399273,
"learning_rate": 2.473175060145703e-05,
"loss": 0.0797,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.026054752990603447,
"step": 2510,
"valid_targets_mean": 8937.4,
"valid_targets_min": 2541
},
{
"epoch": 2.41376,
"grad_norm": 0.1184645193517672,
"learning_rate": 2.4666627064673892e-05,
"loss": 0.0793,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.024346385151147842,
"step": 2515,
"valid_targets_mean": 7785.2,
"valid_targets_min": 2980
},
{
"epoch": 2.41856,
"grad_norm": 0.1364358933879091,
"learning_rate": 2.4601451157962616e-05,
"loss": 0.0808,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.029486022889614105,
"step": 2520,
"valid_targets_mean": 9084.0,
"valid_targets_min": 4241
},
{
"epoch": 2.42336,
"grad_norm": 0.14177621555064562,
"learning_rate": 2.4536223612741754e-05,
"loss": 0.0792,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.025790728628635406,
"step": 2525,
"valid_targets_mean": 9287.2,
"valid_targets_min": 2587
},
{
"epoch": 2.42816,
"grad_norm": 0.12254560093831562,
"learning_rate": 2.447094516100934e-05,
"loss": 0.0801,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.025828056037425995,
"step": 2530,
"valid_targets_mean": 8999.5,
"valid_targets_min": 3557
},
{
"epoch": 2.43296,
"grad_norm": 0.12839180536574532,
"learning_rate": 2.4405616535334695e-05,
"loss": 0.079,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.030729684978723526,
"step": 2535,
"valid_targets_mean": 9717.8,
"valid_targets_min": 5031
},
{
"epoch": 2.43776,
"grad_norm": 0.11585615309614611,
"learning_rate": 2.43402384688502e-05,
"loss": 0.0769,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.023497575893998146,
"step": 2540,
"valid_targets_mean": 9059.8,
"valid_targets_min": 1635
},
{
"epoch": 2.44256,
"grad_norm": 0.12134766967020498,
"learning_rate": 2.4274811695243085e-05,
"loss": 0.0801,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02694030851125717,
"step": 2545,
"valid_targets_mean": 8850.2,
"valid_targets_min": 3299
},
{
"epoch": 2.4473599999999998,
"grad_norm": 0.1316863971028815,
"learning_rate": 2.4209336948747168e-05,
"loss": 0.0803,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02972356602549553,
"step": 2550,
"valid_targets_mean": 9398.3,
"valid_targets_min": 4232
},
{
"epoch": 2.45216,
"grad_norm": 0.12287062451907484,
"learning_rate": 2.414381496413464e-05,
"loss": 0.0782,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0246087945997715,
"step": 2555,
"valid_targets_mean": 8041.0,
"valid_targets_min": 2944
},
{
"epoch": 2.45696,
"grad_norm": 0.12535471909521592,
"learning_rate": 2.4078246476707793e-05,
"loss": 0.0772,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.024066515266895294,
"step": 2560,
"valid_targets_mean": 8603.2,
"valid_targets_min": 2279
},
{
"epoch": 2.46176,
"grad_norm": 0.1264236899638182,
"learning_rate": 2.4012632222290802e-05,
"loss": 0.0774,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02529139630496502,
"step": 2565,
"valid_targets_mean": 8860.7,
"valid_targets_min": 3159
},
{
"epoch": 2.46656,
"grad_norm": 0.12748116305719281,
"learning_rate": 2.3946972937221444e-05,
"loss": 0.0805,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03009450063109398,
"step": 2570,
"valid_targets_mean": 9358.7,
"valid_targets_min": 1975
},
{
"epoch": 2.47136,
"grad_norm": 0.13952086450619908,
"learning_rate": 2.3881269358342828e-05,
"loss": 0.0785,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.028878334909677505,
"step": 2575,
"valid_targets_mean": 8155.2,
"valid_targets_min": 2432
},
{
"epoch": 2.47616,
"grad_norm": 0.12234682090534985,
"learning_rate": 2.3815522222995158e-05,
"loss": 0.0777,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.023882580921053886,
"step": 2580,
"valid_targets_mean": 7829.0,
"valid_targets_min": 2730
},
{
"epoch": 2.48096,
"grad_norm": 0.1212451765174174,
"learning_rate": 2.3749732269007427e-05,
"loss": 0.0781,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02354244887828827,
"step": 2585,
"valid_targets_mean": 8768.0,
"valid_targets_min": 1602
},
{
"epoch": 2.48576,
"grad_norm": 0.12337580575976319,
"learning_rate": 2.3683900234689142e-05,
"loss": 0.075,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.021861132234334946,
"step": 2590,
"valid_targets_mean": 8479.1,
"valid_targets_min": 1756
},
{
"epoch": 2.49056,
"grad_norm": 0.1264164703524998,
"learning_rate": 2.3618026858822054e-05,
"loss": 0.0797,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.030043430626392365,
"step": 2595,
"valid_targets_mean": 8425.5,
"valid_targets_min": 2912
},
{
"epoch": 2.49536,
"grad_norm": 0.13322500466357357,
"learning_rate": 2.355211288065187e-05,
"loss": 0.0773,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02616289258003235,
"step": 2600,
"valid_targets_mean": 8737.0,
"valid_targets_min": 2762
},
{
"epoch": 2.50016,
"grad_norm": 0.14281821332399597,
"learning_rate": 2.348615903987991e-05,
"loss": 0.0755,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.027944108471274376,
"step": 2605,
"valid_targets_mean": 8119.4,
"valid_targets_min": 1852
},
{
"epoch": 2.50496,
"grad_norm": 0.12278110816702006,
"learning_rate": 2.3420166076654873e-05,
"loss": 0.0767,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02698206529021263,
"step": 2610,
"valid_targets_mean": 9372.3,
"valid_targets_min": 1970
},
{
"epoch": 2.50976,
"grad_norm": 0.12717072751197384,
"learning_rate": 2.335413473156449e-05,
"loss": 0.0796,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02557991072535515,
"step": 2615,
"valid_targets_mean": 8949.4,
"valid_targets_min": 3090
},
{
"epoch": 2.51456,
"grad_norm": 0.1215114979896222,
"learning_rate": 2.328806574562722e-05,
"loss": 0.0774,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.021433714777231216,
"step": 2620,
"valid_targets_mean": 8481.4,
"valid_targets_min": 3181
},
{
"epoch": 2.51936,
"grad_norm": 0.13269527558167965,
"learning_rate": 2.322195986028393e-05,
"loss": 0.0778,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.023230556398630142,
"step": 2625,
"valid_targets_mean": 8499.2,
"valid_targets_min": 3799
},
{
"epoch": 2.52416,
"grad_norm": 0.12500369623855434,
"learning_rate": 2.315581781738959e-05,
"loss": 0.0771,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02225703001022339,
"step": 2630,
"valid_targets_mean": 8066.4,
"valid_targets_min": 2881
},
{
"epoch": 2.52896,
"grad_norm": 0.12839309833611812,
"learning_rate": 2.3089640359204937e-05,
"loss": 0.0775,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02520071715116501,
"step": 2635,
"valid_targets_mean": 8992.2,
"valid_targets_min": 1565
},
{
"epoch": 2.53376,
"grad_norm": 0.1309485140869025,
"learning_rate": 2.3023428228388144e-05,
"loss": 0.0765,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02432047203183174,
"step": 2640,
"valid_targets_mean": 8642.0,
"valid_targets_min": 1852
},
{
"epoch": 2.53856,
"grad_norm": 0.13195500479172162,
"learning_rate": 2.2957182167986486e-05,
"loss": 0.0774,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02704329788684845,
"step": 2645,
"valid_targets_mean": 8725.4,
"valid_targets_min": 2588
},
{
"epoch": 2.54336,
"grad_norm": 0.14879671880870712,
"learning_rate": 2.2890902921428004e-05,
"loss": 0.0757,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.023556988686323166,
"step": 2650,
"valid_targets_mean": 8299.9,
"valid_targets_min": 1915
},
{
"epoch": 2.54816,
"grad_norm": 0.13418012766582119,
"learning_rate": 2.2824591232513153e-05,
"loss": 0.0768,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.024494722485542297,
"step": 2655,
"valid_targets_mean": 7699.7,
"valid_targets_min": 1729
},
{
"epoch": 2.55296,
"grad_norm": 0.11860664564020829,
"learning_rate": 2.2758247845406495e-05,
"loss": 0.0759,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.025114569813013077,
"step": 2660,
"valid_targets_mean": 8217.2,
"valid_targets_min": 2032
},
{
"epoch": 2.55776,
"grad_norm": 0.13999752211175603,
"learning_rate": 2.2691873504628282e-05,
"loss": 0.0743,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02651476487517357,
"step": 2665,
"valid_targets_mean": 8598.3,
"valid_targets_min": 3847
},
{
"epoch": 2.56256,
"grad_norm": 0.12447169923083799,
"learning_rate": 2.2625468955046143e-05,
"loss": 0.0771,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02548210322856903,
"step": 2670,
"valid_targets_mean": 8152.9,
"valid_targets_min": 1921
},
{
"epoch": 2.56736,
"grad_norm": 0.1225074570696376,
"learning_rate": 2.2559034941866727e-05,
"loss": 0.0734,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.025047052651643753,
"step": 2675,
"valid_targets_mean": 8584.6,
"valid_targets_min": 2518
},
{
"epoch": 2.5721600000000002,
"grad_norm": 0.1257466044762218,
"learning_rate": 2.2492572210627325e-05,
"loss": 0.0754,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02429202012717724,
"step": 2680,
"valid_targets_mean": 8235.4,
"valid_targets_min": 2038
},
{
"epoch": 2.57696,
"grad_norm": 0.13557857735015535,
"learning_rate": 2.24260815071875e-05,
"loss": 0.0743,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.023734377697110176,
"step": 2685,
"valid_targets_mean": 8223.3,
"valid_targets_min": 1543
},
{
"epoch": 2.58176,
"grad_norm": 0.12431085511827711,
"learning_rate": 2.2359563577720743e-05,
"loss": 0.0796,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.026736926287412643,
"step": 2690,
"valid_targets_mean": 9182.7,
"valid_targets_min": 3127
},
{
"epoch": 2.58656,
"grad_norm": 0.11900321217430507,
"learning_rate": 2.229301916870606e-05,
"loss": 0.0731,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.027746083214879036,
"step": 2695,
"valid_targets_mean": 9351.5,
"valid_targets_min": 4599
},
{
"epoch": 2.59136,
"grad_norm": 0.1383700323259459,
"learning_rate": 2.2226449026919637e-05,
"loss": 0.076,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.029470983892679214,
"step": 2700,
"valid_targets_mean": 9054.1,
"valid_targets_min": 5678
},
{
"epoch": 2.5961600000000002,
"grad_norm": 0.13012742542583644,
"learning_rate": 2.2159853899426427e-05,
"loss": 0.0768,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.025567417964339256,
"step": 2705,
"valid_targets_mean": 9233.9,
"valid_targets_min": 2233
},
{
"epoch": 2.60096,
"grad_norm": 0.12657750747445207,
"learning_rate": 2.209323453357178e-05,
"loss": 0.0774,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02532579004764557,
"step": 2710,
"valid_targets_mean": 8470.7,
"valid_targets_min": 3447
},
{
"epoch": 2.60576,
"grad_norm": 0.13279951041017773,
"learning_rate": 2.202659167697306e-05,
"loss": 0.0764,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02570538967847824,
"step": 2715,
"valid_targets_mean": 9163.9,
"valid_targets_min": 3626
},
{
"epoch": 2.61056,
"grad_norm": 0.12127499458765617,
"learning_rate": 2.1959926077511234e-05,
"loss": 0.0744,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.020813290029764175,
"step": 2720,
"valid_targets_mean": 9457.5,
"valid_targets_min": 2096
},
{
"epoch": 2.61536,
"grad_norm": 0.1253460206942048,
"learning_rate": 2.1893238483322512e-05,
"loss": 0.076,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.023362675681710243,
"step": 2725,
"valid_targets_mean": 8545.1,
"valid_targets_min": 2994
},
{
"epoch": 2.6201600000000003,
"grad_norm": 0.13220273622382875,
"learning_rate": 2.1826529642789923e-05,
"loss": 0.0744,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02266569808125496,
"step": 2730,
"valid_targets_mean": 8827.2,
"valid_targets_min": 3646
},
{
"epoch": 2.6249599999999997,
"grad_norm": 0.1320216526163596,
"learning_rate": 2.1759800304534936e-05,
"loss": 0.0772,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.027949821203947067,
"step": 2735,
"valid_targets_mean": 8625.2,
"valid_targets_min": 2142
},
{
"epoch": 2.62976,
"grad_norm": 0.11911754506105855,
"learning_rate": 2.1693051217409048e-05,
"loss": 0.0778,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02508479729294777,
"step": 2740,
"valid_targets_mean": 8534.6,
"valid_targets_min": 1960
},
{
"epoch": 2.63456,
"grad_norm": 0.12386094956552933,
"learning_rate": 2.1626283130485365e-05,
"loss": 0.0792,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02538812719285488,
"step": 2745,
"valid_targets_mean": 8241.4,
"valid_targets_min": 2379
},
{
"epoch": 2.63936,
"grad_norm": 0.1730315798377173,
"learning_rate": 2.1559496793050235e-05,
"loss": 0.0769,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.027699865400791168,
"step": 2750,
"valid_targets_mean": 9055.9,
"valid_targets_min": 3489
},
{
"epoch": 2.64416,
"grad_norm": 0.12946922012219694,
"learning_rate": 2.1492692954594815e-05,
"loss": 0.0773,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02325347810983658,
"step": 2755,
"valid_targets_mean": 8042.9,
"valid_targets_min": 2633
},
{
"epoch": 2.6489599999999998,
"grad_norm": 0.1366619849837903,
"learning_rate": 2.1425872364806642e-05,
"loss": 0.0775,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02587948739528656,
"step": 2760,
"valid_targets_mean": 8853.9,
"valid_targets_min": 3540
},
{
"epoch": 2.65376,
"grad_norm": 0.12647286473054808,
"learning_rate": 2.1359035773561275e-05,
"loss": 0.0787,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.029227159917354584,
"step": 2765,
"valid_targets_mean": 9773.8,
"valid_targets_min": 3960
},
{
"epoch": 2.65856,
"grad_norm": 0.14185801754999453,
"learning_rate": 2.1292183930913803e-05,
"loss": 0.0749,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02531890943646431,
"step": 2770,
"valid_targets_mean": 8255.2,
"valid_targets_min": 1987
},
{
"epoch": 2.66336,
"grad_norm": 0.12863813890549577,
"learning_rate": 2.1225317587090507e-05,
"loss": 0.0722,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.027946345508098602,
"step": 2775,
"valid_targets_mean": 8502.0,
"valid_targets_min": 1123
},
{
"epoch": 2.66816,
"grad_norm": 0.12736788349292172,
"learning_rate": 2.1158437492480384e-05,
"loss": 0.0716,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.01997240260243416,
"step": 2780,
"valid_targets_mean": 7395.3,
"valid_targets_min": 2185
},
{
"epoch": 2.67296,
"grad_norm": 0.12976383848578613,
"learning_rate": 2.1091544397626752e-05,
"loss": 0.0738,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.025439299643039703,
"step": 2785,
"valid_targets_mean": 8741.4,
"valid_targets_min": 3209
},
{
"epoch": 2.67776,
"grad_norm": 0.12360076149823336,
"learning_rate": 2.102463905321881e-05,
"loss": 0.0747,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.023299697786569595,
"step": 2790,
"valid_targets_mean": 8274.7,
"valid_targets_min": 3255
},
{
"epoch": 2.68256,
"grad_norm": 0.12579718860137898,
"learning_rate": 2.095772221008323e-05,
"loss": 0.0748,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.024257106706500053,
"step": 2795,
"valid_targets_mean": 8911.9,
"valid_targets_min": 5452
},
{
"epoch": 2.68736,
"grad_norm": 0.1309826914466945,
"learning_rate": 2.0890794619175745e-05,
"loss": 0.0768,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.026484040543437004,
"step": 2800,
"valid_targets_mean": 8579.1,
"valid_targets_min": 1887
},
{
"epoch": 2.69216,
"grad_norm": 0.1314840553029046,
"learning_rate": 2.0823857031572663e-05,
"loss": 0.076,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.026499971747398376,
"step": 2805,
"valid_targets_mean": 8582.2,
"valid_targets_min": 3171
},
{
"epoch": 2.69696,
"grad_norm": 0.13542623007736973,
"learning_rate": 2.0756910198462515e-05,
"loss": 0.0746,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.024281367659568787,
"step": 2810,
"valid_targets_mean": 8698.7,
"valid_targets_min": 2419
},
{
"epoch": 2.70176,
"grad_norm": 0.12828824896006688,
"learning_rate": 2.0689954871137558e-05,
"loss": 0.0747,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02330276370048523,
"step": 2815,
"valid_targets_mean": 9369.3,
"valid_targets_min": 2792
},
{
"epoch": 2.70656,
"grad_norm": 0.1274100600671183,
"learning_rate": 2.0622991800985398e-05,
"loss": 0.0763,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02662099152803421,
"step": 2820,
"valid_targets_mean": 8691.3,
"valid_targets_min": 2503
},
{
"epoch": 2.71136,
"grad_norm": 0.13208316669833364,
"learning_rate": 2.055602173948051e-05,
"loss": 0.0757,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.023739665746688843,
"step": 2825,
"valid_targets_mean": 8986.6,
"valid_targets_min": 4021
},
{
"epoch": 2.71616,
"grad_norm": 0.1347761848229569,
"learning_rate": 2.0489045438175842e-05,
"loss": 0.0721,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.022743025794625282,
"step": 2830,
"valid_targets_mean": 7970.3,
"valid_targets_min": 2753
},
{
"epoch": 2.72096,
"grad_norm": 0.13563435389041437,
"learning_rate": 2.042206364869436e-05,
"loss": 0.0718,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.020514879375696182,
"step": 2835,
"valid_targets_mean": 8056.1,
"valid_targets_min": 1768
},
{
"epoch": 2.72576,
"grad_norm": 0.12106789458820655,
"learning_rate": 2.0355077122720625e-05,
"loss": 0.0714,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.01979285106062889,
"step": 2840,
"valid_targets_mean": 8668.8,
"valid_targets_min": 1889
},
{
"epoch": 2.73056,
"grad_norm": 0.13331211562297765,
"learning_rate": 2.0288086611992344e-05,
"loss": 0.0741,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02285662479698658,
"step": 2845,
"valid_targets_mean": 8784.2,
"valid_targets_min": 2507
},
{
"epoch": 2.73536,
"grad_norm": 0.12283461413697871,
"learning_rate": 2.0221092868291953e-05,
"loss": 0.0719,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.024631857872009277,
"step": 2850,
"valid_targets_mean": 9224.7,
"valid_targets_min": 3740
},
{
"epoch": 2.74016,
"grad_norm": 0.13462190750677952,
"learning_rate": 2.0154096643438153e-05,
"loss": 0.0739,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02646755427122116,
"step": 2855,
"valid_targets_mean": 9081.2,
"valid_targets_min": 3634
},
{
"epoch": 2.74496,
"grad_norm": 0.15212100488432875,
"learning_rate": 2.008709868927751e-05,
"loss": 0.0742,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02177482843399048,
"step": 2860,
"valid_targets_mean": 9343.9,
"valid_targets_min": 1558
},
{
"epoch": 2.74976,
"grad_norm": 0.13891228481080325,
"learning_rate": 2.0020099757675978e-05,
"loss": 0.0744,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.023706315085291862,
"step": 2865,
"valid_targets_mean": 8286.4,
"valid_targets_min": 4347
},
{
"epoch": 2.75456,
"grad_norm": 0.12578790912092921,
"learning_rate": 1.9953100600510487e-05,
"loss": 0.0705,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0233942698687315,
"step": 2870,
"valid_targets_mean": 8919.5,
"valid_targets_min": 4034
},
{
"epoch": 2.75936,
"grad_norm": 0.12433449798647353,
"learning_rate": 1.9886101969660504e-05,
"loss": 0.0708,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02069215103983879,
"step": 2875,
"valid_targets_mean": 8321.7,
"valid_targets_min": 2865
},
{
"epoch": 2.76416,
"grad_norm": 0.12331619896381704,
"learning_rate": 1.9819104616999584e-05,
"loss": 0.0748,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02588079310953617,
"step": 2880,
"valid_targets_mean": 8835.1,
"valid_targets_min": 3375
},
{
"epoch": 2.76896,
"grad_norm": 0.12198016602770331,
"learning_rate": 1.975210929438693e-05,
"loss": 0.0755,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.023465629667043686,
"step": 2885,
"valid_targets_mean": 8514.5,
"valid_targets_min": 1894
},
{
"epoch": 2.7737600000000002,
"grad_norm": 0.1285591492170375,
"learning_rate": 1.9685116753658982e-05,
"loss": 0.076,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.023442579433321953,
"step": 2890,
"valid_targets_mean": 9131.8,
"valid_targets_min": 2375
},
{
"epoch": 2.77856,
"grad_norm": 0.14027229866879554,
"learning_rate": 1.9618127746620944e-05,
"loss": 0.0729,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.027585767209529877,
"step": 2895,
"valid_targets_mean": 9061.1,
"valid_targets_min": 3636
},
{
"epoch": 2.78336,
"grad_norm": 0.12175580215805587,
"learning_rate": 1.9551143025038363e-05,
"loss": 0.0733,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.025040633976459503,
"step": 2900,
"valid_targets_mean": 8019.9,
"valid_targets_min": 4226
},
{
"epoch": 2.78816,
"grad_norm": 0.12631373857068798,
"learning_rate": 1.9484163340628724e-05,
"loss": 0.074,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.022008750587701797,
"step": 2905,
"valid_targets_mean": 8278.6,
"valid_targets_min": 3655
},
{
"epoch": 2.79296,
"grad_norm": 0.12353277202856984,
"learning_rate": 1.941718944505294e-05,
"loss": 0.0703,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0223405584692955,
"step": 2910,
"valid_targets_mean": 8777.7,
"valid_targets_min": 2390
},
{
"epoch": 2.7977600000000002,
"grad_norm": 0.12477152321684222,
"learning_rate": 1.9350222089906994e-05,
"loss": 0.0731,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.022324811667203903,
"step": 2915,
"valid_targets_mean": 8715.5,
"valid_targets_min": 2780
},
{
"epoch": 2.80256,
"grad_norm": 0.1274810275629356,
"learning_rate": 1.9283262026713456e-05,
"loss": 0.0743,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.024463120847940445,
"step": 2920,
"valid_targets_mean": 8644.3,
"valid_targets_min": 2357
},
{
"epoch": 2.80736,
"grad_norm": 0.15489737871525144,
"learning_rate": 1.9216310006913058e-05,
"loss": 0.0724,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0199250690639019,
"step": 2925,
"valid_targets_mean": 8119.0,
"valid_targets_min": 2239
},
{
"epoch": 2.81216,
"grad_norm": 0.13087489077175116,
"learning_rate": 1.914936678185629e-05,
"loss": 0.0722,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02115030400454998,
"step": 2930,
"valid_targets_mean": 8713.2,
"valid_targets_min": 2695
},
{
"epoch": 2.81696,
"grad_norm": 0.12942414716942643,
"learning_rate": 1.9082433102794918e-05,
"loss": 0.0736,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.025940679013729095,
"step": 2935,
"valid_targets_mean": 9562.3,
"valid_targets_min": 4015
},
{
"epoch": 2.8217600000000003,
"grad_norm": 0.11899703583290817,
"learning_rate": 1.9015509720873603e-05,
"loss": 0.0726,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.028031064197421074,
"step": 2940,
"valid_targets_mean": 9664.9,
"valid_targets_min": 2235
},
{
"epoch": 2.8265599999999997,
"grad_norm": 0.12835916290377014,
"learning_rate": 1.894859738712143e-05,
"loss": 0.0745,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.023106276988983154,
"step": 2945,
"valid_targets_mean": 8617.7,
"valid_targets_min": 2343
},
{
"epoch": 2.83136,
"grad_norm": 0.12234620395991247,
"learning_rate": 1.888169685244352e-05,
"loss": 0.0741,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.021706473082304,
"step": 2950,
"valid_targets_mean": 7974.6,
"valid_targets_min": 1989
},
{
"epoch": 2.83616,
"grad_norm": 0.12135472934515772,
"learning_rate": 1.8814808867612568e-05,
"loss": 0.0739,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0252741239964962,
"step": 2955,
"valid_targets_mean": 9213.8,
"valid_targets_min": 3497
},
{
"epoch": 2.84096,
"grad_norm": 0.12341097629186015,
"learning_rate": 1.8747934183260427e-05,
"loss": 0.0711,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.022089535370469093,
"step": 2960,
"valid_targets_mean": 8485.8,
"valid_targets_min": 2813
},
{
"epoch": 2.84576,
"grad_norm": 0.12185458825230623,
"learning_rate": 1.868107354986971e-05,
"loss": 0.0745,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.023958466947078705,
"step": 2965,
"valid_targets_mean": 8559.1,
"valid_targets_min": 2934
},
{
"epoch": 2.8505599999999998,
"grad_norm": 0.2019700331379936,
"learning_rate": 1.8614227717765327e-05,
"loss": 0.0727,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.023400334641337395,
"step": 2970,
"valid_targets_mean": 8567.7,
"valid_targets_min": 3655
},
{
"epoch": 2.85536,
"grad_norm": 0.12307094056404946,
"learning_rate": 1.8547397437106084e-05,
"loss": 0.0711,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02216029167175293,
"step": 2975,
"valid_targets_mean": 8859.0,
"valid_targets_min": 3690
},
{
"epoch": 2.86016,
"grad_norm": 0.1363174764510877,
"learning_rate": 1.848058345787629e-05,
"loss": 0.074,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.024962490424513817,
"step": 2980,
"valid_targets_mean": 8806.0,
"valid_targets_min": 3210
},
{
"epoch": 2.86496,
"grad_norm": 0.12263761790836711,
"learning_rate": 1.8413786529877288e-05,
"loss": 0.0706,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0196840763092041,
"step": 2985,
"valid_targets_mean": 8160.8,
"valid_targets_min": 2827
},
{
"epoch": 2.86976,
"grad_norm": 0.12703370316175627,
"learning_rate": 1.8347007402719082e-05,
"loss": 0.0722,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.025346554815769196,
"step": 2990,
"valid_targets_mean": 9061.6,
"valid_targets_min": 4220
},
{
"epoch": 2.87456,
"grad_norm": 0.12244916720977835,
"learning_rate": 1.828024682581191e-05,
"loss": 0.0762,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.026083365082740784,
"step": 2995,
"valid_targets_mean": 9098.1,
"valid_targets_min": 1492
},
{
"epoch": 2.87936,
"grad_norm": 0.13150902110865764,
"learning_rate": 1.8213505548357822e-05,
"loss": 0.0729,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.023833446204662323,
"step": 3000,
"valid_targets_mean": 8153.8,
"valid_targets_min": 2983
},
{
"epoch": 2.88416,
"grad_norm": 0.12212915178092341,
"learning_rate": 1.814678431934231e-05,
"loss": 0.0743,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02612268179655075,
"step": 3005,
"valid_targets_mean": 9175.3,
"valid_targets_min": 4008
},
{
"epoch": 2.88896,
"grad_norm": 0.1346347379421597,
"learning_rate": 1.8080083887525862e-05,
"loss": 0.0713,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.023977095261216164,
"step": 3010,
"valid_targets_mean": 8365.3,
"valid_targets_min": 2239
},
{
"epoch": 2.89376,
"grad_norm": 0.12570526531776613,
"learning_rate": 1.801340500143557e-05,
"loss": 0.0724,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02590319886803627,
"step": 3015,
"valid_targets_mean": 8906.6,
"valid_targets_min": 4035
},
{
"epoch": 2.89856,
"grad_norm": 0.12095421806855092,
"learning_rate": 1.7946748409356746e-05,
"loss": 0.0758,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.024391578510403633,
"step": 3020,
"valid_targets_mean": 8243.3,
"valid_targets_min": 1280
},
{
"epoch": 2.90336,
"grad_norm": 0.13265519572762954,
"learning_rate": 1.788011485932451e-05,
"loss": 0.0733,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02277197316288948,
"step": 3025,
"valid_targets_mean": 8158.2,
"valid_targets_min": 1629
},
{
"epoch": 2.90816,
"grad_norm": 0.13107630504480672,
"learning_rate": 1.78135050991154e-05,
"loss": 0.0744,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02625724859535694,
"step": 3030,
"valid_targets_mean": 8981.2,
"valid_targets_min": 3186
},
{
"epoch": 2.91296,
"grad_norm": 0.41703413499653275,
"learning_rate": 1.774691987623898e-05,
"loss": 0.0734,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.026596393436193466,
"step": 3035,
"valid_targets_mean": 9226.0,
"valid_targets_min": 3192
},
{
"epoch": 2.91776,
"grad_norm": 0.15139444386768838,
"learning_rate": 1.768035993792944e-05,
"loss": 0.0704,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.027542371302843094,
"step": 3040,
"valid_targets_mean": 10083.0,
"valid_targets_min": 6144
},
{
"epoch": 2.92256,
"grad_norm": 0.12675751853167433,
"learning_rate": 1.7613826031137245e-05,
"loss": 0.073,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02687855437397957,
"step": 3045,
"valid_targets_mean": 8895.7,
"valid_targets_min": 4809
},
{
"epoch": 2.92736,
"grad_norm": 0.12662474766507864,
"learning_rate": 1.7547318902520693e-05,
"loss": 0.068,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.024971062317490578,
"step": 3050,
"valid_targets_mean": 8946.8,
"valid_targets_min": 4309
},
{
"epoch": 2.93216,
"grad_norm": 0.1286424743817585,
"learning_rate": 1.7480839298437612e-05,
"loss": 0.072,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.025227583944797516,
"step": 3055,
"valid_targets_mean": 9259.2,
"valid_targets_min": 2514
},
{
"epoch": 2.93696,
"grad_norm": 0.12893517435268495,
"learning_rate": 1.7414387964936913e-05,
"loss": 0.0719,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.026150595396757126,
"step": 3060,
"valid_targets_mean": 9149.1,
"valid_targets_min": 3181
},
{
"epoch": 2.94176,
"grad_norm": 0.12655174215859458,
"learning_rate": 1.7347965647750264e-05,
"loss": 0.0707,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.024759739637374878,
"step": 3065,
"valid_targets_mean": 9399.6,
"valid_targets_min": 3759
},
{
"epoch": 2.94656,
"grad_norm": 0.13072454712552234,
"learning_rate": 1.7281573092283698e-05,
"loss": 0.07,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.021730834618210793,
"step": 3070,
"valid_targets_mean": 8040.0,
"valid_targets_min": 3188
},
{
"epoch": 2.95136,
"grad_norm": 0.12321743168297426,
"learning_rate": 1.721521104360925e-05,
"loss": 0.072,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.023660646751523018,
"step": 3075,
"valid_targets_mean": 8968.6,
"valid_targets_min": 3813
},
{
"epoch": 2.95616,
"grad_norm": 0.12969336877295307,
"learning_rate": 1.714888024645662e-05,
"loss": 0.0697,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.027581918984651566,
"step": 3080,
"valid_targets_mean": 8911.6,
"valid_targets_min": 1185
},
{
"epoch": 2.96096,
"grad_norm": 0.12602670418990503,
"learning_rate": 1.708258144520478e-05,
"loss": 0.0735,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.027505237609148026,
"step": 3085,
"valid_targets_mean": 8821.6,
"valid_targets_min": 3186
},
{
"epoch": 2.96576,
"grad_norm": 0.1297030798288961,
"learning_rate": 1.7016315383873637e-05,
"loss": 0.0725,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02171483263373375,
"step": 3090,
"valid_targets_mean": 8498.5,
"valid_targets_min": 1844
},
{
"epoch": 2.97056,
"grad_norm": 0.14699243538398662,
"learning_rate": 1.6950082806115692e-05,
"loss": 0.07,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02368342876434326,
"step": 3095,
"valid_targets_mean": 9345.1,
"valid_targets_min": 5842
},
{
"epoch": 2.9753600000000002,
"grad_norm": 0.1232468312629796,
"learning_rate": 1.6883884455207685e-05,
"loss": 0.0697,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.021345708519220352,
"step": 3100,
"valid_targets_mean": 7081.2,
"valid_targets_min": 2668
},
{
"epoch": 2.98016,
"grad_norm": 0.12761627571559783,
"learning_rate": 1.6817721074042254e-05,
"loss": 0.0736,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.021635062992572784,
"step": 3105,
"valid_targets_mean": 8916.5,
"valid_targets_min": 3337
},
{
"epoch": 2.98496,
"grad_norm": 0.127886107487912,
"learning_rate": 1.675159340511958e-05,
"loss": 0.0721,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.024836886674165726,
"step": 3110,
"valid_targets_mean": 8576.9,
"valid_targets_min": 3946
},
{
"epoch": 2.98976,
"grad_norm": 0.12291271639984096,
"learning_rate": 1.6685502190539106e-05,
"loss": 0.0703,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02228378877043724,
"step": 3115,
"valid_targets_mean": 8604.4,
"valid_targets_min": 3261
},
{
"epoch": 2.99456,
"grad_norm": 0.12950070508669648,
"learning_rate": 1.6619448171991155e-05,
"loss": 0.0715,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02772909589111805,
"step": 3120,
"valid_targets_mean": 9047.2,
"valid_targets_min": 4860
},
{
"epoch": 2.9993600000000002,
"grad_norm": 0.12916728839087535,
"learning_rate": 1.6553432090748624e-05,
"loss": 0.0711,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.022339988499879837,
"step": 3125,
"valid_targets_mean": 8654.5,
"valid_targets_min": 2501
},
{
"epoch": 3.00384,
"grad_norm": 0.13436467200946856,
"learning_rate": 1.648745468765869e-05,
"loss": 0.0695,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02428019419312477,
"step": 3130,
"valid_targets_mean": 8521.2,
"valid_targets_min": 2029
},
{
"epoch": 3.00864,
"grad_norm": 0.1213964690982203,
"learning_rate": 1.6421516703134463e-05,
"loss": 0.0693,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02279294840991497,
"step": 3135,
"valid_targets_mean": 9165.6,
"valid_targets_min": 3462
},
{
"epoch": 3.01344,
"grad_norm": 0.12809915325981858,
"learning_rate": 1.6355618877146685e-05,
"loss": 0.0708,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02425113320350647,
"step": 3140,
"valid_targets_mean": 8720.2,
"valid_targets_min": 2045
},
{
"epoch": 3.01824,
"grad_norm": 0.12474776089090203,
"learning_rate": 1.6289761949215435e-05,
"loss": 0.0686,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.024004336446523666,
"step": 3145,
"valid_targets_mean": 8093.4,
"valid_targets_min": 1630
},
{
"epoch": 3.02304,
"grad_norm": 0.121771797960631,
"learning_rate": 1.6223946658401818e-05,
"loss": 0.0719,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.023814337328076363,
"step": 3150,
"valid_targets_mean": 8823.8,
"valid_targets_min": 4465
},
{
"epoch": 3.02784,
"grad_norm": 0.11750594629421643,
"learning_rate": 1.6158173743299692e-05,
"loss": 0.0697,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.021509505808353424,
"step": 3155,
"valid_targets_mean": 8647.9,
"valid_targets_min": 4037
},
{
"epoch": 3.03264,
"grad_norm": 0.12614285302682426,
"learning_rate": 1.6092443942027356e-05,
"loss": 0.0721,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0257541723549366,
"step": 3160,
"valid_targets_mean": 8363.3,
"valid_targets_min": 4240
},
{
"epoch": 3.03744,
"grad_norm": 0.11499077249412011,
"learning_rate": 1.602675799221927e-05,
"loss": 0.0703,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.021260704845190048,
"step": 3165,
"valid_targets_mean": 8695.0,
"valid_targets_min": 4039
},
{
"epoch": 3.04224,
"grad_norm": 0.12297680388920865,
"learning_rate": 1.59611166310178e-05,
"loss": 0.0699,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.021927397698163986,
"step": 3170,
"valid_targets_mean": 8749.3,
"valid_targets_min": 2927
},
{
"epoch": 3.04704,
"grad_norm": 0.12361795520196853,
"learning_rate": 1.5895520595064913e-05,
"loss": 0.0673,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0205059964209795,
"step": 3175,
"valid_targets_mean": 7927.1,
"valid_targets_min": 2442
},
{
"epoch": 3.05184,
"grad_norm": 0.12814989984155925,
"learning_rate": 1.5829970620493932e-05,
"loss": 0.0721,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.027933187782764435,
"step": 3180,
"valid_targets_mean": 8855.2,
"valid_targets_min": 2084
},
{
"epoch": 3.05664,
"grad_norm": 0.11677970502216538,
"learning_rate": 1.5764467442921274e-05,
"loss": 0.0717,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.024320311844348907,
"step": 3185,
"valid_targets_mean": 8660.4,
"valid_targets_min": 2754
},
{
"epoch": 3.06144,
"grad_norm": 0.1239216085007504,
"learning_rate": 1.569901179743818e-05,
"loss": 0.0725,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.025944417342543602,
"step": 3190,
"valid_targets_mean": 9009.9,
"valid_targets_min": 4500
},
{
"epoch": 3.06624,
"grad_norm": 0.12945831869172478,
"learning_rate": 1.5633604418602483e-05,
"loss": 0.0688,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.023855559527873993,
"step": 3195,
"valid_targets_mean": 8333.2,
"valid_targets_min": 2803
},
{
"epoch": 3.07104,
"grad_norm": 0.13013260461232284,
"learning_rate": 1.5568246040430343e-05,
"loss": 0.0718,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.023685764521360397,
"step": 3200,
"valid_targets_mean": 7983.8,
"valid_targets_min": 4751
},
{
"epoch": 3.07584,
"grad_norm": 0.1273699840697591,
"learning_rate": 1.5502937396388046e-05,
"loss": 0.0683,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.023623168468475342,
"step": 3205,
"valid_targets_mean": 8991.2,
"valid_targets_min": 2308
},
{
"epoch": 3.08064,
"grad_norm": 0.11916279939675328,
"learning_rate": 1.543767921938374e-05,
"loss": 0.0689,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.022730082273483276,
"step": 3210,
"valid_targets_mean": 8499.2,
"valid_targets_min": 3355
},
{
"epoch": 3.08544,
"grad_norm": 0.12119443723949427,
"learning_rate": 1.537247224175922e-05,
"loss": 0.0672,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.021023793146014214,
"step": 3215,
"valid_targets_mean": 8985.7,
"valid_targets_min": 2404
},
{
"epoch": 3.09024,
"grad_norm": 0.13319695318574473,
"learning_rate": 1.53073171952817e-05,
"loss": 0.0692,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02610372006893158,
"step": 3220,
"valid_targets_mean": 8657.2,
"valid_targets_min": 3664
},
{
"epoch": 3.09504,
"grad_norm": 0.11480415485378342,
"learning_rate": 1.5242214811135631e-05,
"loss": 0.0698,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.01964818686246872,
"step": 3225,
"valid_targets_mean": 7869.1,
"valid_targets_min": 1796
},
{
"epoch": 3.09984,
"grad_norm": 0.1509063264703375,
"learning_rate": 1.5177165819914461e-05,
"loss": 0.0708,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.023284582421183586,
"step": 3230,
"valid_targets_mean": 8114.5,
"valid_targets_min": 2202
},
{
"epoch": 3.10464,
"grad_norm": 0.12290331374199842,
"learning_rate": 1.5112170951612455e-05,
"loss": 0.0728,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02735215239226818,
"step": 3235,
"valid_targets_mean": 9238.8,
"valid_targets_min": 2446
},
{
"epoch": 3.10944,
"grad_norm": 0.11627326471177059,
"learning_rate": 1.5047230935616497e-05,
"loss": 0.0697,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.021479297429323196,
"step": 3240,
"valid_targets_mean": 8806.2,
"valid_targets_min": 3618
},
{
"epoch": 3.11424,
"grad_norm": 0.11908066536540551,
"learning_rate": 1.4982346500697916e-05,
"loss": 0.07,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02094453200697899,
"step": 3245,
"valid_targets_mean": 8300.2,
"valid_targets_min": 4744
},
{
"epoch": 3.11904,
"grad_norm": 0.12430053568242028,
"learning_rate": 1.4917518375004281e-05,
"loss": 0.0673,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.020661715418100357,
"step": 3250,
"valid_targets_mean": 8002.1,
"valid_targets_min": 2486
},
{
"epoch": 3.12384,
"grad_norm": 0.11897850439214286,
"learning_rate": 1.4852747286051254e-05,
"loss": 0.0691,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.022244051098823547,
"step": 3255,
"valid_targets_mean": 9271.3,
"valid_targets_min": 3148
},
{
"epoch": 3.12864,
"grad_norm": 0.12101646152970325,
"learning_rate": 1.478803396071443e-05,
"loss": 0.069,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.021861432120203972,
"step": 3260,
"valid_targets_mean": 8306.7,
"valid_targets_min": 2471
},
{
"epoch": 3.1334400000000002,
"grad_norm": 0.12377621716047282,
"learning_rate": 1.472337912522115e-05,
"loss": 0.0704,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.026585116982460022,
"step": 3265,
"valid_targets_mean": 8930.8,
"valid_targets_min": 3933
},
{
"epoch": 3.13824,
"grad_norm": 0.12365934012769708,
"learning_rate": 1.4658783505142368e-05,
"loss": 0.0672,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.023925743997097015,
"step": 3270,
"valid_targets_mean": 9297.8,
"valid_targets_min": 3247
},
{
"epoch": 3.14304,
"grad_norm": 0.12034112660714659,
"learning_rate": 1.4594247825384529e-05,
"loss": 0.0736,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.027109742164611816,
"step": 3275,
"valid_targets_mean": 8862.9,
"valid_targets_min": 2457
},
{
"epoch": 3.14784,
"grad_norm": 0.12419182575224802,
"learning_rate": 1.4529772810181398e-05,
"loss": 0.0711,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.022144844755530357,
"step": 3280,
"valid_targets_mean": 8546.1,
"valid_targets_min": 4936
},
{
"epoch": 3.15264,
"grad_norm": 0.12581501967835582,
"learning_rate": 1.4465359183085958e-05,
"loss": 0.07,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02213982678949833,
"step": 3285,
"valid_targets_mean": 8170.9,
"valid_targets_min": 1037
},
{
"epoch": 3.15744,
"grad_norm": 0.13756118658624505,
"learning_rate": 1.4401007666962276e-05,
"loss": 0.0705,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.021517571061849594,
"step": 3290,
"valid_targets_mean": 8457.0,
"valid_targets_min": 2482
},
{
"epoch": 3.16224,
"grad_norm": 0.12193998039781807,
"learning_rate": 1.4336718983977389e-05,
"loss": 0.0726,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.024007262662053108,
"step": 3295,
"valid_targets_mean": 8692.9,
"valid_targets_min": 1922
},
{
"epoch": 3.16704,
"grad_norm": 0.1265404462653089,
"learning_rate": 1.4272493855593222e-05,
"loss": 0.0697,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.023130342364311218,
"step": 3300,
"valid_targets_mean": 9112.4,
"valid_targets_min": 2050
},
{
"epoch": 3.17184,
"grad_norm": 0.1226326357869858,
"learning_rate": 1.4208333002558462e-05,
"loss": 0.0714,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.020230181515216827,
"step": 3305,
"valid_targets_mean": 8190.9,
"valid_targets_min": 1771
},
{
"epoch": 3.17664,
"grad_norm": 0.11414582360833214,
"learning_rate": 1.4144237144900497e-05,
"loss": 0.072,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.024489928036928177,
"step": 3310,
"valid_targets_mean": 8684.1,
"valid_targets_min": 4674
},
{
"epoch": 3.18144,
"grad_norm": 0.12744621953971752,
"learning_rate": 1.4080207001917302e-05,
"loss": 0.0703,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.025685835629701614,
"step": 3315,
"valid_targets_mean": 8462.4,
"valid_targets_min": 1313
},
{
"epoch": 3.18624,
"grad_norm": 0.12631083930426035,
"learning_rate": 1.4016243292169413e-05,
"loss": 0.0713,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.020424753427505493,
"step": 3320,
"valid_targets_mean": 8725.7,
"valid_targets_min": 2161
},
{
"epoch": 3.19104,
"grad_norm": 0.11679712809878957,
"learning_rate": 1.3952346733471822e-05,
"loss": 0.0676,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.023827986791729927,
"step": 3325,
"valid_targets_mean": 8154.0,
"valid_targets_min": 3181
},
{
"epoch": 3.19584,
"grad_norm": 0.125231699118407,
"learning_rate": 1.3888518042885934e-05,
"loss": 0.07,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02799840085208416,
"step": 3330,
"valid_targets_mean": 8681.6,
"valid_targets_min": 3326
},
{
"epoch": 3.20064,
"grad_norm": 0.11959339338389416,
"learning_rate": 1.3824757936711537e-05,
"loss": 0.0702,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02259810082614422,
"step": 3335,
"valid_targets_mean": 9545.6,
"valid_targets_min": 2357
},
{
"epoch": 3.20544,
"grad_norm": 0.12174988786208792,
"learning_rate": 1.3761067130478738e-05,
"loss": 0.0703,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02313234657049179,
"step": 3340,
"valid_targets_mean": 8121.8,
"valid_targets_min": 1979
},
{
"epoch": 3.21024,
"grad_norm": 0.11323346166579101,
"learning_rate": 1.3697446338939942e-05,
"loss": 0.0677,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.022821880877017975,
"step": 3345,
"valid_targets_mean": 8020.8,
"valid_targets_min": 3447
},
{
"epoch": 3.21504,
"grad_norm": 0.11671762619810887,
"learning_rate": 1.3633896276061847e-05,
"loss": 0.0668,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02655469998717308,
"step": 3350,
"valid_targets_mean": 10324.1,
"valid_targets_min": 3177
},
{
"epoch": 3.21984,
"grad_norm": 0.11750097777157643,
"learning_rate": 1.3570417655017405e-05,
"loss": 0.0715,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0216502882540226,
"step": 3355,
"valid_targets_mean": 8658.6,
"valid_targets_min": 3458
},
{
"epoch": 3.22464,
"grad_norm": 0.11820178487678269,
"learning_rate": 1.3507011188177846e-05,
"loss": 0.069,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.022721372544765472,
"step": 3360,
"valid_targets_mean": 9518.7,
"valid_targets_min": 4699
},
{
"epoch": 3.22944,
"grad_norm": 0.11417679512946696,
"learning_rate": 1.3443677587104655e-05,
"loss": 0.0694,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.020779889076948166,
"step": 3365,
"valid_targets_mean": 8670.8,
"valid_targets_min": 3094
},
{
"epoch": 3.23424,
"grad_norm": 0.12624839454578163,
"learning_rate": 1.3380417562541604e-05,
"loss": 0.067,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.020790942013263702,
"step": 3370,
"valid_targets_mean": 8187.2,
"valid_targets_min": 1278
},
{
"epoch": 3.23904,
"grad_norm": 0.14609588360307785,
"learning_rate": 1.3317231824406783e-05,
"loss": 0.0719,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.024372944608330727,
"step": 3375,
"valid_targets_mean": 8531.4,
"valid_targets_min": 2185
},
{
"epoch": 3.24384,
"grad_norm": 0.117776839936567,
"learning_rate": 1.325412108178461e-05,
"loss": 0.0719,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.022288871929049492,
"step": 3380,
"valid_targets_mean": 8573.8,
"valid_targets_min": 3315
},
{
"epoch": 3.24864,
"grad_norm": 0.11646493488526218,
"learning_rate": 1.3191086042917895e-05,
"loss": 0.0704,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02496308647096157,
"step": 3385,
"valid_targets_mean": 9230.8,
"valid_targets_min": 3590
},
{
"epoch": 3.25344,
"grad_norm": 0.12779066870734346,
"learning_rate": 1.3128127415199883e-05,
"loss": 0.0732,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.023436348885297775,
"step": 3390,
"valid_targets_mean": 8449.2,
"valid_targets_min": 2540
},
{
"epoch": 3.25824,
"grad_norm": 0.11925664271364658,
"learning_rate": 1.3065245905166316e-05,
"loss": 0.0655,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.021665815263986588,
"step": 3395,
"valid_targets_mean": 8535.0,
"valid_targets_min": 1755
},
{
"epoch": 3.26304,
"grad_norm": 0.11609499082097684,
"learning_rate": 1.30024422184875e-05,
"loss": 0.0702,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.020767629146575928,
"step": 3400,
"valid_targets_mean": 9026.3,
"valid_targets_min": 3114
},
{
"epoch": 3.26784,
"grad_norm": 0.12322940130660784,
"learning_rate": 1.2939717059960384e-05,
"loss": 0.0716,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.026769880205392838,
"step": 3405,
"valid_targets_mean": 9266.4,
"valid_targets_min": 2437
},
{
"epoch": 3.27264,
"grad_norm": 0.12268486970388134,
"learning_rate": 1.287707113350068e-05,
"loss": 0.0717,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.021298786625266075,
"step": 3410,
"valid_targets_mean": 8315.7,
"valid_targets_min": 1885
},
{
"epoch": 3.27744,
"grad_norm": 0.12293752242798077,
"learning_rate": 1.2814505142134921e-05,
"loss": 0.0682,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0239997711032629,
"step": 3415,
"valid_targets_mean": 8773.1,
"valid_targets_min": 3471
},
{
"epoch": 3.28224,
"grad_norm": 0.11888564915744372,
"learning_rate": 1.2752019787992587e-05,
"loss": 0.0719,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.023440586403012276,
"step": 3420,
"valid_targets_mean": 9244.7,
"valid_targets_min": 2556
},
{
"epoch": 3.28704,
"grad_norm": 0.12035054922676984,
"learning_rate": 1.268961577229824e-05,
"loss": 0.0681,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.024956464767456055,
"step": 3425,
"valid_targets_mean": 9113.6,
"valid_targets_min": 6681
},
{
"epoch": 3.29184,
"grad_norm": 0.11609541056449521,
"learning_rate": 1.262729379536365e-05,
"loss": 0.0689,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.018632816150784492,
"step": 3430,
"valid_targets_mean": 8057.3,
"valid_targets_min": 2719
},
{
"epoch": 3.29664,
"grad_norm": 0.1156523388586678,
"learning_rate": 1.2565054556579917e-05,
"loss": 0.0695,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03179524093866348,
"step": 3435,
"valid_targets_mean": 9017.0,
"valid_targets_min": 4248
},
{
"epoch": 3.30144,
"grad_norm": 0.12003104066174144,
"learning_rate": 1.2502898754409637e-05,
"loss": 0.0734,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.027027547359466553,
"step": 3440,
"valid_targets_mean": 8732.1,
"valid_targets_min": 2923
},
{
"epoch": 3.30624,
"grad_norm": 0.11525424183716788,
"learning_rate": 1.2440827086379055e-05,
"loss": 0.0689,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.023295942693948746,
"step": 3445,
"valid_targets_mean": 8759.2,
"valid_targets_min": 4664
},
{
"epoch": 3.31104,
"grad_norm": 0.12531104004344787,
"learning_rate": 1.2378840249070265e-05,
"loss": 0.0679,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.022183142602443695,
"step": 3450,
"valid_targets_mean": 8153.5,
"valid_targets_min": 2609
},
{
"epoch": 3.31584,
"grad_norm": 0.12343198360816166,
"learning_rate": 1.2316938938113356e-05,
"loss": 0.0696,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.023251008242368698,
"step": 3455,
"valid_targets_mean": 8565.3,
"valid_targets_min": 3428
},
{
"epoch": 3.32064,
"grad_norm": 0.1292388288269661,
"learning_rate": 1.2255123848178619e-05,
"loss": 0.0686,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.023235727101564407,
"step": 3460,
"valid_targets_mean": 9135.2,
"valid_targets_min": 2746
},
{
"epoch": 3.32544,
"grad_norm": 0.1215681936479102,
"learning_rate": 1.2193395672968765e-05,
"loss": 0.0717,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02227572724223137,
"step": 3465,
"valid_targets_mean": 8278.0,
"valid_targets_min": 3403
},
{
"epoch": 3.33024,
"grad_norm": 0.11710136257925326,
"learning_rate": 1.2131755105211118e-05,
"loss": 0.0663,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.019895605742931366,
"step": 3470,
"valid_targets_mean": 8391.2,
"valid_targets_min": 2984
},
{
"epoch": 3.3350400000000002,
"grad_norm": 0.12542638777454168,
"learning_rate": 1.2070202836649855e-05,
"loss": 0.0676,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.021651022136211395,
"step": 3475,
"valid_targets_mean": 9145.8,
"valid_targets_min": 2439
},
{
"epoch": 3.33984,
"grad_norm": 0.12565404407998096,
"learning_rate": 1.2008739558038247e-05,
"loss": 0.069,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.023290030658245087,
"step": 3480,
"valid_targets_mean": 7567.0,
"valid_targets_min": 2494
},
{
"epoch": 3.34464,
"grad_norm": 0.11631140589000345,
"learning_rate": 1.1947365959130895e-05,
"loss": 0.0667,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.018959272652864456,
"step": 3485,
"valid_targets_mean": 8354.6,
"valid_targets_min": 2992
},
{
"epoch": 3.34944,
"grad_norm": 0.1188568050783418,
"learning_rate": 1.1886082728675984e-05,
"loss": 0.0722,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.024846302345395088,
"step": 3490,
"valid_targets_mean": 8987.2,
"valid_targets_min": 4280
},
{
"epoch": 3.35424,
"grad_norm": 0.12019159263147859,
"learning_rate": 1.1824890554407574e-05,
"loss": 0.0691,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.018579427152872086,
"step": 3495,
"valid_targets_mean": 8977.7,
"valid_targets_min": 4890
},
{
"epoch": 3.3590400000000002,
"grad_norm": 0.1139585905859666,
"learning_rate": 1.1763790123037873e-05,
"loss": 0.0722,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02406950294971466,
"step": 3500,
"valid_targets_mean": 9003.8,
"valid_targets_min": 1951
},
{
"epoch": 3.36384,
"grad_norm": 0.14319366739189193,
"learning_rate": 1.1702782120249539e-05,
"loss": 0.068,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.024110540747642517,
"step": 3505,
"valid_targets_mean": 9082.9,
"valid_targets_min": 1492
},
{
"epoch": 3.36864,
"grad_norm": 0.11863992872229728,
"learning_rate": 1.164186723068795e-05,
"loss": 0.07,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02288087084889412,
"step": 3510,
"valid_targets_mean": 8180.7,
"valid_targets_min": 2277
},
{
"epoch": 3.37344,
"grad_norm": 0.11512399838967773,
"learning_rate": 1.1581046137953575e-05,
"loss": 0.0687,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.022692613303661346,
"step": 3515,
"valid_targets_mean": 8648.9,
"valid_targets_min": 4250
},
{
"epoch": 3.37824,
"grad_norm": 0.13242448957401462,
"learning_rate": 1.1520319524594256e-05,
"loss": 0.0716,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.025992343202233315,
"step": 3520,
"valid_targets_mean": 8879.0,
"valid_targets_min": 1942
},
{
"epoch": 3.38304,
"grad_norm": 0.12807878449294854,
"learning_rate": 1.1459688072097568e-05,
"loss": 0.0685,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.022017603740096092,
"step": 3525,
"valid_targets_mean": 8338.1,
"valid_targets_min": 3877
},
{
"epoch": 3.38784,
"grad_norm": 0.11648212904241022,
"learning_rate": 1.1399152460883176e-05,
"loss": 0.0702,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.020594323053956032,
"step": 3530,
"valid_targets_mean": 9214.3,
"valid_targets_min": 2528
},
{
"epoch": 3.39264,
"grad_norm": 0.11821877317071199,
"learning_rate": 1.1338713370295189e-05,
"loss": 0.0718,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.026048175990581512,
"step": 3535,
"valid_targets_mean": 9281.7,
"valid_targets_min": 2639
},
{
"epoch": 3.39744,
"grad_norm": 0.11736629336592669,
"learning_rate": 1.1278371478594538e-05,
"loss": 0.0682,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.021891873329877853,
"step": 3540,
"valid_targets_mean": 8865.2,
"valid_targets_min": 2688
},
{
"epoch": 3.40224,
"grad_norm": 0.11972853626552638,
"learning_rate": 1.1218127462951367e-05,
"loss": 0.073,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02370895817875862,
"step": 3545,
"valid_targets_mean": 8682.7,
"valid_targets_min": 1583
},
{
"epoch": 3.40704,
"grad_norm": 0.12360516334847126,
"learning_rate": 1.1157981999437444e-05,
"loss": 0.0708,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.027519740164279938,
"step": 3550,
"valid_targets_mean": 8607.8,
"valid_targets_min": 3517
},
{
"epoch": 3.4118399999999998,
"grad_norm": 0.12508266248465932,
"learning_rate": 1.109793576301855e-05,
"loss": 0.0683,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.019669760018587112,
"step": 3555,
"valid_targets_mean": 9355.0,
"valid_targets_min": 1912
},
{
"epoch": 3.41664,
"grad_norm": 0.12060718453496497,
"learning_rate": 1.1037989427546924e-05,
"loss": 0.0684,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.023211004212498665,
"step": 3560,
"valid_targets_mean": 8907.0,
"valid_targets_min": 3938
},
{
"epoch": 3.42144,
"grad_norm": 0.11856868790700098,
"learning_rate": 1.0978143665753692e-05,
"loss": 0.0708,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.025470038875937462,
"step": 3565,
"valid_targets_mean": 8779.1,
"valid_targets_min": 1956
},
{
"epoch": 3.42624,
"grad_norm": 0.1202644007888738,
"learning_rate": 1.0918399149241314e-05,
"loss": 0.0671,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.025088073685765266,
"step": 3570,
"valid_targets_mean": 9472.4,
"valid_targets_min": 5452
},
{
"epoch": 3.43104,
"grad_norm": 0.11890989905758134,
"learning_rate": 1.0858756548476058e-05,
"loss": 0.0669,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.019012611359357834,
"step": 3575,
"valid_targets_mean": 8079.2,
"valid_targets_min": 2365
},
{
"epoch": 3.43584,
"grad_norm": 0.11535717573780561,
"learning_rate": 1.0799216532780478e-05,
"loss": 0.0656,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.020330175757408142,
"step": 3580,
"valid_targets_mean": 8638.0,
"valid_targets_min": 2657
},
{
"epoch": 3.44064,
"grad_norm": 0.11982122538634377,
"learning_rate": 1.0739779770325885e-05,
"loss": 0.0688,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02101993001997471,
"step": 3585,
"valid_targets_mean": 8114.7,
"valid_targets_min": 3253
},
{
"epoch": 3.44544,
"grad_norm": 0.11568924363050549,
"learning_rate": 1.0680446928124872e-05,
"loss": 0.0699,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.024274956434965134,
"step": 3590,
"valid_targets_mean": 8969.8,
"valid_targets_min": 5479
},
{
"epoch": 3.45024,
"grad_norm": 0.12311519721414897,
"learning_rate": 1.06212186720238e-05,
"loss": 0.069,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02398882806301117,
"step": 3595,
"valid_targets_mean": 9083.4,
"valid_targets_min": 2236
},
{
"epoch": 3.45504,
"grad_norm": 0.1176232528105872,
"learning_rate": 1.0562095666695352e-05,
"loss": 0.0689,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.022245021536946297,
"step": 3600,
"valid_targets_mean": 8506.0,
"valid_targets_min": 530
},
{
"epoch": 3.45984,
"grad_norm": 0.12814024690841339,
"learning_rate": 1.0503078575631052e-05,
"loss": 0.0565,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.019158998504281044,
"step": 3605,
"valid_targets_mean": 9547.4,
"valid_targets_min": 4525
},
{
"epoch": 3.46464,
"grad_norm": 0.1352022401477249,
"learning_rate": 1.0444168061133846e-05,
"loss": 0.0587,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.019761083647608757,
"step": 3610,
"valid_targets_mean": 8394.5,
"valid_targets_min": 4757
},
{
"epoch": 3.46944,
"grad_norm": 0.12312753724496196,
"learning_rate": 1.0385364784310636e-05,
"loss": 0.0558,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.017157310619950294,
"step": 3615,
"valid_targets_mean": 8024.5,
"valid_targets_min": 2974
},
{
"epoch": 3.47424,
"grad_norm": 0.13533009632046408,
"learning_rate": 1.0326669405064904e-05,
"loss": 0.056,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.015769323334097862,
"step": 3620,
"valid_targets_mean": 9096.3,
"valid_targets_min": 3278
},
{
"epoch": 3.47904,
"grad_norm": 0.14320717457173768,
"learning_rate": 1.0268082582089263e-05,
"loss": 0.0575,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.01656205952167511,
"step": 3625,
"valid_targets_mean": 7964.6,
"valid_targets_min": 2824
},
{
"epoch": 3.48384,
"grad_norm": 0.1436771220110468,
"learning_rate": 1.0209604972858081e-05,
"loss": 0.0553,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.01845899596810341,
"step": 3630,
"valid_targets_mean": 8401.7,
"valid_targets_min": 2868
},
{
"epoch": 3.48864,
"grad_norm": 0.1331002867624431,
"learning_rate": 1.0151237233620115e-05,
"loss": 0.0546,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.015434859320521355,
"step": 3635,
"valid_targets_mean": 8922.3,
"valid_targets_min": 3232
},
{
"epoch": 3.49344,
"grad_norm": 0.15962729586395075,
"learning_rate": 1.0092980019391132e-05,
"loss": 0.0592,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.018679436296224594,
"step": 3640,
"valid_targets_mean": 9329.9,
"valid_targets_min": 3781
},
{
"epoch": 3.49824,
"grad_norm": 0.15818938989627598,
"learning_rate": 1.0034833983946561e-05,
"loss": 0.0553,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.016482515260577202,
"step": 3645,
"valid_targets_mean": 8887.6,
"valid_targets_min": 1640
},
{
"epoch": 3.50304,
"grad_norm": 0.12431356399603527,
"learning_rate": 9.976799779814157e-06,
"loss": 0.0555,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.017481375485658646,
"step": 3650,
"valid_targets_mean": 8482.5,
"valid_targets_min": 4381
},
{
"epoch": 3.50784,
"grad_norm": 0.1322854401566673,
"learning_rate": 9.918878058266687e-06,
"loss": 0.0576,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.017938459292054176,
"step": 3655,
"valid_targets_mean": 8828.8,
"valid_targets_min": 3313
},
{
"epoch": 3.51264,
"grad_norm": 0.1253467544366567,
"learning_rate": 9.86106946931462e-06,
"loss": 0.0596,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.019131455570459366,
"step": 3660,
"valid_targets_mean": 9941.3,
"valid_targets_min": 4437
},
{
"epoch": 3.51744,
"grad_norm": 0.13652918694567162,
"learning_rate": 9.803374661698802e-06,
"loss": 0.0559,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.019458845257759094,
"step": 3665,
"valid_targets_mean": 7816.9,
"valid_targets_min": 1823
},
{
"epoch": 3.52224,
"grad_norm": 0.14742469694336255,
"learning_rate": 9.745794282883215e-06,
"loss": 0.057,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.01716812141239643,
"step": 3670,
"valid_targets_mean": 8304.0,
"valid_targets_min": 2191
},
{
"epoch": 3.52704,
"grad_norm": 0.13348912229457513,
"learning_rate": 9.688328979047689e-06,
"loss": 0.0557,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.018630236387252808,
"step": 3675,
"valid_targets_mean": 8479.3,
"valid_targets_min": 3012
},
{
"epoch": 3.53184,
"grad_norm": 0.13047629376112002,
"learning_rate": 9.630979395080667e-06,
"loss": 0.0594,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.01872425712645054,
"step": 3680,
"valid_targets_mean": 7992.5,
"valid_targets_min": 2228
},
{
"epoch": 3.5366400000000002,
"grad_norm": 0.13156923893488706,
"learning_rate": 9.573746174571947e-06,
"loss": 0.0555,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.016432328149676323,
"step": 3685,
"valid_targets_mean": 9221.1,
"valid_targets_min": 2341
},
{
"epoch": 3.54144,
"grad_norm": 0.13209300474839575,
"learning_rate": 9.516629959805468e-06,
"loss": 0.0557,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02003823220729828,
"step": 3690,
"valid_targets_mean": 8710.9,
"valid_targets_min": 1444
},
{
"epoch": 3.54624,
"grad_norm": 0.13116046245364235,
"learning_rate": 9.459631391752126e-06,
"loss": 0.0568,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.01843874529004097,
"step": 3695,
"valid_targets_mean": 8378.2,
"valid_targets_min": 3062
},
{
"epoch": 3.55104,
"grad_norm": 0.1285017503304282,
"learning_rate": 9.40275111006254e-06,
"loss": 0.0548,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.016842100769281387,
"step": 3700,
"valid_targets_mean": 8139.7,
"valid_targets_min": 2295
},
{
"epoch": 3.55584,
"grad_norm": 0.1472596562975354,
"learning_rate": 9.345989753059895e-06,
"loss": 0.0543,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.016040191054344177,
"step": 3705,
"valid_targets_mean": 7992.1,
"valid_targets_min": 2724
},
{
"epoch": 3.5606400000000002,
"grad_norm": 0.15633419217487327,
"learning_rate": 9.289347957732779e-06,
"loss": 0.0557,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.017493966966867447,
"step": 3710,
"valid_targets_mean": 8839.2,
"valid_targets_min": 1647
},
{
"epoch": 3.56544,
"grad_norm": 0.1357694551726591,
"learning_rate": 9.232826359728034e-06,
"loss": 0.0538,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.015739034861326218,
"step": 3715,
"valid_targets_mean": 8887.0,
"valid_targets_min": 2183
},
{
"epoch": 3.57024,
"grad_norm": 0.12207172176713575,
"learning_rate": 9.17642559334362e-06,
"loss": 0.054,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.017870184034109116,
"step": 3720,
"valid_targets_mean": 8897.0,
"valid_targets_min": 2011
},
{
"epoch": 3.57504,
"grad_norm": 0.14244558932230125,
"learning_rate": 9.120146291521488e-06,
"loss": 0.0561,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.018513241782784462,
"step": 3725,
"valid_targets_mean": 8319.8,
"valid_targets_min": 2365
},
{
"epoch": 3.57984,
"grad_norm": 0.13508176921493603,
"learning_rate": 9.063989085840506e-06,
"loss": 0.0566,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.020369049161672592,
"step": 3730,
"valid_targets_mean": 8704.0,
"valid_targets_min": 2203
},
{
"epoch": 3.5846400000000003,
"grad_norm": 0.12623222486610447,
"learning_rate": 9.007954606509346e-06,
"loss": 0.0534,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.01837966777384281,
"step": 3735,
"valid_targets_mean": 8965.4,
"valid_targets_min": 1896
},
{
"epoch": 3.5894399999999997,
"grad_norm": 0.13304702719999412,
"learning_rate": 8.952043482359408e-06,
"loss": 0.0534,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.016147565096616745,
"step": 3740,
"valid_targets_mean": 8392.1,
"valid_targets_min": 2734
},
{
"epoch": 3.59424,
"grad_norm": 0.1364610341024647,
"learning_rate": 8.896256340837779e-06,
"loss": 0.0579,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.01738559827208519,
"step": 3745,
"valid_targets_mean": 8307.7,
"valid_targets_min": 1612
},
{
"epoch": 3.59904,
"grad_norm": 0.12080918237441046,
"learning_rate": 8.840593808000182e-06,
"loss": 0.0557,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.017990585416555405,
"step": 3750,
"valid_targets_mean": 8898.8,
"valid_targets_min": 3751
},
{
"epoch": 3.60384,
"grad_norm": 0.135206313127372,
"learning_rate": 8.785056508503956e-06,
"loss": 0.0572,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.01876853033900261,
"step": 3755,
"valid_targets_mean": 8321.2,
"valid_targets_min": 1956
},
{
"epoch": 3.60864,
"grad_norm": 0.14146043288365848,
"learning_rate": 8.729645065601045e-06,
"loss": 0.058,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0189354345202446,
"step": 3760,
"valid_targets_mean": 8984.0,
"valid_targets_min": 1806
},
{
"epoch": 3.6134399999999998,
"grad_norm": 0.1357690858168711,
"learning_rate": 8.674360101130994e-06,
"loss": 0.0545,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02032206952571869,
"step": 3765,
"valid_targets_mean": 8590.7,
"valid_targets_min": 2433
},
{
"epoch": 3.61824,
"grad_norm": 0.13373124703486686,
"learning_rate": 8.619202235514e-06,
"loss": 0.0537,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.016812438145279884,
"step": 3770,
"valid_targets_mean": 8781.7,
"valid_targets_min": 4288
},
{
"epoch": 3.62304,
"grad_norm": 0.13777338990715324,
"learning_rate": 8.564172087743903e-06,
"loss": 0.057,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.01906885765492916,
"step": 3775,
"valid_targets_mean": 8735.4,
"valid_targets_min": 3098
},
{
"epoch": 3.62784,
"grad_norm": 0.13709427310817707,
"learning_rate": 8.50927027538128e-06,
"loss": 0.0558,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.021031895652413368,
"step": 3780,
"valid_targets_mean": 8737.2,
"valid_targets_min": 4732
},
{
"epoch": 3.63264,
"grad_norm": 0.1329046208350066,
"learning_rate": 8.454497414546497e-06,
"loss": 0.0583,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.019182361662387848,
"step": 3785,
"valid_targets_mean": 9016.9,
"valid_targets_min": 3997
},
{
"epoch": 3.63744,
"grad_norm": 0.12784288201977764,
"learning_rate": 8.39985411991279e-06,
"loss": 0.0587,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.022063791751861572,
"step": 3790,
"valid_targets_mean": 9467.2,
"valid_targets_min": 2158
},
{
"epoch": 3.64224,
"grad_norm": 0.13698351144349497,
"learning_rate": 8.345341004699386e-06,
"loss": 0.0574,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.01915154419839382,
"step": 3795,
"valid_targets_mean": 9378.7,
"valid_targets_min": 3433
},
{
"epoch": 3.64704,
"grad_norm": 0.13732974847111012,
"learning_rate": 8.290958680664591e-06,
"loss": 0.0585,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.020820364356040955,
"step": 3800,
"valid_targets_mean": 8005.5,
"valid_targets_min": 1450
},
{
"epoch": 3.65184,
"grad_norm": 0.13505357343036875,
"learning_rate": 8.236707758098965e-06,
"loss": 0.0579,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.022526472806930542,
"step": 3805,
"valid_targets_mean": 8850.6,
"valid_targets_min": 2488
},
{
"epoch": 3.65664,
"grad_norm": 0.1259729066577338,
"learning_rate": 8.182588845818452e-06,
"loss": 0.0552,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.017887916415929794,
"step": 3810,
"valid_targets_mean": 8914.6,
"valid_targets_min": 3411
},
{
"epoch": 3.66144,
"grad_norm": 0.13771971908346792,
"learning_rate": 8.128602551157523e-06,
"loss": 0.0546,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.018062973394989967,
"step": 3815,
"valid_targets_mean": 8964.6,
"valid_targets_min": 5691
},
{
"epoch": 3.66624,
"grad_norm": 0.1386182298823841,
"learning_rate": 8.074749479962407e-06,
"loss": 0.052,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.016328800469636917,
"step": 3820,
"valid_targets_mean": 8711.1,
"valid_targets_min": 2956
},
{
"epoch": 3.67104,
"grad_norm": 0.13208007285920464,
"learning_rate": 8.021030236584254e-06,
"loss": 0.0544,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.01910882256925106,
"step": 3825,
"valid_targets_mean": 9311.3,
"valid_targets_min": 2524
},
{
"epoch": 3.67584,
"grad_norm": 0.1526032805811713,
"learning_rate": 7.967445423872384e-06,
"loss": 0.0534,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.015861565247178078,
"step": 3830,
"valid_targets_mean": 8945.5,
"valid_targets_min": 2509
},
{
"epoch": 3.68064,
"grad_norm": 0.13026368761507842,
"learning_rate": 7.913995643167494e-06,
"loss": 0.0534,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.017038773745298386,
"step": 3835,
"valid_targets_mean": 8394.8,
"valid_targets_min": 2738
},
{
"epoch": 3.68544,
"grad_norm": 0.13774012408734024,
"learning_rate": 7.860681494294917e-06,
"loss": 0.056,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02027728408575058,
"step": 3840,
"valid_targets_mean": 8938.6,
"valid_targets_min": 2062
},
{
"epoch": 3.69024,
"grad_norm": 0.14717144639640956,
"learning_rate": 7.80750357555792e-06,
"loss": 0.0582,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.023341909050941467,
"step": 3845,
"valid_targets_mean": 8292.6,
"valid_targets_min": 1771
},
{
"epoch": 3.69504,
"grad_norm": 0.1300340768573447,
"learning_rate": 7.75446248373094e-06,
"loss": 0.0552,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.01564173400402069,
"step": 3850,
"valid_targets_mean": 8664.2,
"valid_targets_min": 1719
},
{
"epoch": 3.69984,
"grad_norm": 0.13796606966954172,
"learning_rate": 7.701558814052928e-06,
"loss": 0.0564,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.01939544826745987,
"step": 3855,
"valid_targets_mean": 8037.8,
"valid_targets_min": 3725
},
{
"epoch": 3.70464,
"grad_norm": 0.12327605601391764,
"learning_rate": 7.648793160220637e-06,
"loss": 0.055,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.019700098782777786,
"step": 3860,
"valid_targets_mean": 9027.4,
"valid_targets_min": 3266
},
{
"epoch": 3.70944,
"grad_norm": 0.12894451099718549,
"learning_rate": 7.596166114381991e-06,
"loss": 0.0561,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.01795964688062668,
"step": 3865,
"valid_targets_mean": 9631.7,
"valid_targets_min": 4464
},
{
"epoch": 3.71424,
"grad_norm": 0.1462188211290315,
"learning_rate": 7.543678267129408e-06,
"loss": 0.0548,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.021304085850715637,
"step": 3870,
"valid_targets_mean": 9413.1,
"valid_targets_min": 3409
},
{
"epoch": 3.71904,
"grad_norm": 0.13526202499913728,
"learning_rate": 7.491330207493215e-06,
"loss": 0.0521,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.018997564911842346,
"step": 3875,
"valid_targets_mean": 8982.6,
"valid_targets_min": 1331
},
{
"epoch": 3.72384,
"grad_norm": 0.12959402426419273,
"learning_rate": 7.4391225229349785e-06,
"loss": 0.0537,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0176476389169693,
"step": 3880,
"valid_targets_mean": 8661.0,
"valid_targets_min": 4132
},
{
"epoch": 3.72864,
"grad_norm": 0.1380153099186334,
"learning_rate": 7.387055799340977e-06,
"loss": 0.0513,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.018710440024733543,
"step": 3885,
"valid_targets_mean": 8980.4,
"valid_targets_min": 2790
},
{
"epoch": 3.73344,
"grad_norm": 0.1381226259425154,
"learning_rate": 7.3351306210155645e-06,
"loss": 0.0541,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.017781345173716545,
"step": 3890,
"valid_targets_mean": 9528.7,
"valid_targets_min": 5213
},
{
"epoch": 3.7382400000000002,
"grad_norm": 0.14650329599062215,
"learning_rate": 7.283347570674664e-06,
"loss": 0.0536,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.019584622234106064,
"step": 3895,
"valid_targets_mean": 9252.9,
"valid_targets_min": 1925
},
{
"epoch": 3.74304,
"grad_norm": 0.13350511389861328,
"learning_rate": 7.231707229439191e-06,
"loss": 0.0557,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.018930701538920403,
"step": 3900,
"valid_targets_mean": 8362.8,
"valid_targets_min": 3106
},
{
"epoch": 3.74784,
"grad_norm": 0.1301142031540442,
"learning_rate": 7.180210176828557e-06,
"loss": 0.0539,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.01843518391251564,
"step": 3905,
"valid_targets_mean": 8952.4,
"valid_targets_min": 1932
},
{
"epoch": 3.75264,
"grad_norm": 0.14804851725083004,
"learning_rate": 7.1288569907541495e-06,
"loss": 0.0542,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.016517702490091324,
"step": 3910,
"valid_targets_mean": 8982.4,
"valid_targets_min": 3753
},
{
"epoch": 3.75744,
"grad_norm": 0.1472353370607068,
"learning_rate": 7.0776482475128674e-06,
"loss": 0.0527,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.01933884434401989,
"step": 3915,
"valid_targets_mean": 7994.6,
"valid_targets_min": 1413
},
{
"epoch": 3.7622400000000003,
"grad_norm": 0.12792785699272863,
"learning_rate": 7.026584521780628e-06,
"loss": 0.052,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.021142924204468727,
"step": 3920,
"valid_targets_mean": 9141.5,
"valid_targets_min": 2962
},
{
"epoch": 3.76704,
"grad_norm": 0.1365740601360126,
"learning_rate": 6.9756663866059324e-06,
"loss": 0.0568,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.017975568771362305,
"step": 3925,
"valid_targets_mean": 8611.1,
"valid_targets_min": 3075
},
{
"epoch": 3.77184,
"grad_norm": 0.1280897139250657,
"learning_rate": 6.924894413403434e-06,
"loss": 0.0562,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.015527415089309216,
"step": 3930,
"valid_targets_mean": 7602.2,
"valid_targets_min": 3152
},
{
"epoch": 3.77664,
"grad_norm": 0.133581093629811,
"learning_rate": 6.874269171947516e-06,
"loss": 0.0545,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.01571614481508732,
"step": 3935,
"valid_targets_mean": 8710.9,
"valid_targets_min": 3037
},
{
"epoch": 3.78144,
"grad_norm": 0.13173898278248164,
"learning_rate": 6.8237912303659195e-06,
"loss": 0.0549,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.01879742182791233,
"step": 3940,
"valid_targets_mean": 8989.7,
"valid_targets_min": 3746
},
{
"epoch": 3.7862400000000003,
"grad_norm": 0.12954058129422952,
"learning_rate": 6.773461155133334e-06,
"loss": 0.0538,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.016739197075366974,
"step": 3945,
"valid_targets_mean": 8927.5,
"valid_targets_min": 5341
},
{
"epoch": 3.7910399999999997,
"grad_norm": 0.12613131464245048,
"learning_rate": 6.723279511065088e-06,
"loss": 0.0523,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.016926273703575134,
"step": 3950,
"valid_targets_mean": 9623.4,
"valid_targets_min": 2541
},
{
"epoch": 3.79584,
"grad_norm": 0.1292964362058766,
"learning_rate": 6.673246861310751e-06,
"loss": 0.0532,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.017725899815559387,
"step": 3955,
"valid_targets_mean": 7859.5,
"valid_targets_min": 3588
},
{
"epoch": 3.80064,
"grad_norm": 0.130316879874074,
"learning_rate": 6.623363767347874e-06,
"loss": 0.0535,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02152263931930065,
"step": 3960,
"valid_targets_mean": 9065.3,
"valid_targets_min": 1925
},
{
"epoch": 3.80544,
"grad_norm": 0.12971369743191016,
"learning_rate": 6.5736307889756425e-06,
"loss": 0.0545,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.016394753009080887,
"step": 3965,
"valid_targets_mean": 8884.4,
"valid_targets_min": 2482
},
{
"epoch": 3.81024,
"grad_norm": 0.1568859332985799,
"learning_rate": 6.5240484843086095e-06,
"loss": 0.0538,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.021794119849801064,
"step": 3970,
"valid_targets_mean": 9304.8,
"valid_targets_min": 1462
},
{
"epoch": 3.8150399999999998,
"grad_norm": 0.13421165461310694,
"learning_rate": 6.474617409770441e-06,
"loss": 0.0542,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.01763138733804226,
"step": 3975,
"valid_targets_mean": 8132.8,
"valid_targets_min": 922
},
{
"epoch": 3.81984,
"grad_norm": 0.12677902333212412,
"learning_rate": 6.425338120087665e-06,
"loss": 0.0542,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.017714576795697212,
"step": 3980,
"valid_targets_mean": 8993.7,
"valid_targets_min": 2647
},
{
"epoch": 3.82464,
"grad_norm": 0.13212966268794687,
"learning_rate": 6.3762111682834374e-06,
"loss": 0.0545,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.01865052804350853,
"step": 3985,
"valid_targets_mean": 8879.0,
"valid_targets_min": 2453
},
{
"epoch": 3.82944,
"grad_norm": 0.1407986051119374,
"learning_rate": 6.327237105671362e-06,
"loss": 0.0558,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.017468944191932678,
"step": 3990,
"valid_targets_mean": 9018.7,
"valid_targets_min": 2962
},
{
"epoch": 3.83424,
"grad_norm": 0.1320979084915881,
"learning_rate": 6.278416481849274e-06,
"loss": 0.0548,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.016698092222213745,
"step": 3995,
"valid_targets_mean": 8318.9,
"valid_targets_min": 3301
},
{
"epoch": 3.83904,
"grad_norm": 0.12990710853432647,
"learning_rate": 6.22974984469308e-06,
"loss": 0.0537,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.01842219941318035,
"step": 4000,
"valid_targets_mean": 8659.0,
"valid_targets_min": 1468
},
{
"epoch": 3.84384,
"grad_norm": 0.13236712617272228,
"learning_rate": 6.181237740350625e-06,
"loss": 0.0533,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.020259007811546326,
"step": 4005,
"valid_targets_mean": 8054.6,
"valid_targets_min": 2687
},
{
"epoch": 3.84864,
"grad_norm": 0.13041784618423918,
"learning_rate": 6.132880713235543e-06,
"loss": 0.0554,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.018737755715847015,
"step": 4010,
"valid_targets_mean": 9364.6,
"valid_targets_min": 3819
},
{
"epoch": 3.85344,
"grad_norm": 0.13524360240078845,
"learning_rate": 6.084679306021162e-06,
"loss": 0.053,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.015698693692684174,
"step": 4015,
"valid_targets_mean": 7918.4,
"valid_targets_min": 2787
},
{
"epoch": 3.85824,
"grad_norm": 0.12236282756023174,
"learning_rate": 6.036634059634403e-06,
"loss": 0.0533,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.016556216403841972,
"step": 4020,
"valid_targets_mean": 8993.7,
"valid_targets_min": 3277
},
{
"epoch": 3.86304,
"grad_norm": 0.13236991040385118,
"learning_rate": 5.988745513249723e-06,
"loss": 0.0548,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.015798557549715042,
"step": 4025,
"valid_targets_mean": 7554.2,
"valid_targets_min": 2150
},
{
"epoch": 3.86784,
"grad_norm": 0.1290662796744428,
"learning_rate": 5.941014204283065e-06,
"loss": 0.0524,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.017221640795469284,
"step": 4030,
"valid_targets_mean": 8782.2,
"valid_targets_min": 3375
},
{
"epoch": 3.87264,
"grad_norm": 0.14205933896083572,
"learning_rate": 5.893440668385797e-06,
"loss": 0.056,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.018951009958982468,
"step": 4035,
"valid_targets_mean": 8017.5,
"valid_targets_min": 3253
},
{
"epoch": 3.87744,
"grad_norm": 0.1368306093679873,
"learning_rate": 5.8460254394387335e-06,
"loss": 0.0562,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.018680622801184654,
"step": 4040,
"valid_targets_mean": 8573.9,
"valid_targets_min": 3166
},
{
"epoch": 3.88224,
"grad_norm": 0.14792994727994602,
"learning_rate": 5.798769049546136e-06,
"loss": 0.0536,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.01788490265607834,
"step": 4045,
"valid_targets_mean": 8650.3,
"valid_targets_min": 3015
},
{
"epoch": 3.88704,
"grad_norm": 0.12797744609338996,
"learning_rate": 5.751672029029734e-06,
"loss": 0.0541,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.017983146011829376,
"step": 4050,
"valid_targets_mean": 9032.2,
"valid_targets_min": 3561
},
{
"epoch": 3.89184,
"grad_norm": 0.1368383859346621,
"learning_rate": 5.704734906422775e-06,
"loss": 0.0542,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.01866726018488407,
"step": 4055,
"valid_targets_mean": 8509.7,
"valid_targets_min": 1352
},
{
"epoch": 3.89664,
"grad_norm": 0.1274931135133911,
"learning_rate": 5.657958208464103e-06,
"loss": 0.0543,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.017809130251407623,
"step": 4060,
"valid_targets_mean": 9095.2,
"valid_targets_min": 3414
},
{
"epoch": 3.90144,
"grad_norm": 0.12446892196214056,
"learning_rate": 5.611342460092244e-06,
"loss": 0.0569,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.018567975610494614,
"step": 4065,
"valid_targets_mean": 8345.9,
"valid_targets_min": 1662
},
{
"epoch": 3.90624,
"grad_norm": 0.13830759122979366,
"learning_rate": 5.564888184439505e-06,
"loss": 0.0567,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.017078258097171783,
"step": 4070,
"valid_targets_mean": 8059.1,
"valid_targets_min": 1554
},
{
"epoch": 3.91104,
"grad_norm": 0.36165706553152754,
"learning_rate": 5.5185959028261135e-06,
"loss": 0.0553,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02065645530819893,
"step": 4075,
"valid_targets_mean": 9743.2,
"valid_targets_min": 5526
},
{
"epoch": 3.91584,
"grad_norm": 0.1316808841029414,
"learning_rate": 5.47246613475436e-06,
"loss": 0.0547,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.01675555296242237,
"step": 4080,
"valid_targets_mean": 9094.8,
"valid_targets_min": 4363
},
{
"epoch": 3.92064,
"grad_norm": 0.14798968834118362,
"learning_rate": 5.4264993979027735e-06,
"loss": 0.055,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.019093751907348633,
"step": 4085,
"valid_targets_mean": 9276.1,
"valid_targets_min": 2780
},
{
"epoch": 3.92544,
"grad_norm": 0.13158694237133187,
"learning_rate": 5.380696208120315e-06,
"loss": 0.052,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.020652972161769867,
"step": 4090,
"valid_targets_mean": 9859.9,
"valid_targets_min": 4035
},
{
"epoch": 3.93024,
"grad_norm": 0.14195945121470888,
"learning_rate": 5.335057079420571e-06,
"loss": 0.0532,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.017747461795806885,
"step": 4095,
"valid_targets_mean": 8872.0,
"valid_targets_min": 2232
},
{
"epoch": 3.93504,
"grad_norm": 0.1374303761783451,
"learning_rate": 5.289582523976015e-06,
"loss": 0.0536,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.017126193270087242,
"step": 4100,
"valid_targets_mean": 8146.2,
"valid_targets_min": 2982
},
{
"epoch": 3.9398400000000002,
"grad_norm": 0.14182449340419634,
"learning_rate": 5.244273052112241e-06,
"loss": 0.0536,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.018104974180459976,
"step": 4105,
"valid_targets_mean": 8459.2,
"valid_targets_min": 4292
},
{
"epoch": 3.94464,
"grad_norm": 0.12798985706630067,
"learning_rate": 5.199129172302224e-06,
"loss": 0.0516,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.018952365964651108,
"step": 4110,
"valid_targets_mean": 9065.8,
"valid_targets_min": 2898
},
{
"epoch": 3.94944,
"grad_norm": 0.13189531058235807,
"learning_rate": 5.154151391160638e-06,
"loss": 0.0521,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.018595896661281586,
"step": 4115,
"valid_targets_mean": 9053.8,
"valid_targets_min": 2092
},
{
"epoch": 3.95424,
"grad_norm": 0.1247555985934334,
"learning_rate": 5.109340213438156e-06,
"loss": 0.0503,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.015505434945225716,
"step": 4120,
"valid_targets_mean": 8914.9,
"valid_targets_min": 2859
},
{
"epoch": 3.95904,
"grad_norm": 0.13611501132172,
"learning_rate": 5.0646961420157995e-06,
"loss": 0.0538,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.018326323479413986,
"step": 4125,
"valid_targets_mean": 8805.6,
"valid_targets_min": 4681
},
{
"epoch": 3.9638400000000003,
"grad_norm": 0.14009893602915602,
"learning_rate": 5.020219677899276e-06,
"loss": 0.0567,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.016717668622732162,
"step": 4130,
"valid_targets_mean": 8772.8,
"valid_targets_min": 2911
},
{
"epoch": 3.9686399999999997,
"grad_norm": 0.12119906324919044,
"learning_rate": 4.975911320213365e-06,
"loss": 0.0509,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.01370596420019865,
"step": 4135,
"valid_targets_mean": 8794.0,
"valid_targets_min": 1818
},
{
"epoch": 3.97344,
"grad_norm": 0.14093350602423113,
"learning_rate": 4.931771566196332e-06,
"loss": 0.0538,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.016862042248249054,
"step": 4140,
"valid_targets_mean": 8397.8,
"valid_targets_min": 3079
},
{
"epoch": 3.97824,
"grad_norm": 0.1349495489817161,
"learning_rate": 4.887800911194327e-06,
"loss": 0.0558,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02118859626352787,
"step": 4145,
"valid_targets_mean": 9048.3,
"valid_targets_min": 5051
},
{
"epoch": 3.98304,
"grad_norm": 0.13142737943814867,
"learning_rate": 4.8439998486558246e-06,
"loss": 0.0528,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.01611470803618431,
"step": 4150,
"valid_targets_mean": 8308.8,
"valid_targets_min": 2652
},
{
"epoch": 3.9878400000000003,
"grad_norm": 0.13509533467515525,
"learning_rate": 4.800368870126111e-06,
"loss": 0.0528,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0191353652626276,
"step": 4155,
"valid_targets_mean": 8963.3,
"valid_targets_min": 3633
},
{
"epoch": 3.9926399999999997,
"grad_norm": 0.14336406928605755,
"learning_rate": 4.756908465241736e-06,
"loss": 0.0538,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.01861722022294998,
"step": 4160,
"valid_targets_mean": 8617.6,
"valid_targets_min": 1813
},
{
"epoch": 3.99744,
"grad_norm": 0.13786327261197132,
"learning_rate": 4.713619121725039e-06,
"loss": 0.052,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.016211070120334625,
"step": 4165,
"valid_targets_mean": 8242.3,
"valid_targets_min": 1738
},
{
"epoch": 4.00192,
"grad_norm": 0.13937769816078396,
"learning_rate": 4.670501325378682e-06,
"loss": 0.0557,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.024742331355810165,
"step": 4170,
"valid_targets_mean": 9415.3,
"valid_targets_min": 1752
},
{
"epoch": 4.00672,
"grad_norm": 0.13260992045284067,
"learning_rate": 4.627555560080173e-06,
"loss": 0.0611,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.020355109125375748,
"step": 4175,
"valid_targets_mean": 8578.2,
"valid_targets_min": 2279
},
{
"epoch": 4.01152,
"grad_norm": 0.12136644577113068,
"learning_rate": 4.5847823077764565e-06,
"loss": 0.059,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.01977297104895115,
"step": 4180,
"valid_targets_mean": 9292.6,
"valid_targets_min": 2064
},
{
"epoch": 4.01632,
"grad_norm": 0.12215655268804888,
"learning_rate": 4.5421820484784936e-06,
"loss": 0.0593,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.01999478042125702,
"step": 4185,
"valid_targets_mean": 7845.3,
"valid_targets_min": 2443
},
{
"epoch": 4.02112,
"grad_norm": 0.11025685198030728,
"learning_rate": 4.499755260255881e-06,
"loss": 0.0608,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.018016569316387177,
"step": 4190,
"valid_targets_mean": 9317.6,
"valid_targets_min": 4456
},
{
"epoch": 4.02592,
"grad_norm": 0.12199348277560307,
"learning_rate": 4.457502419231483e-06,
"loss": 0.0585,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.018790187314152718,
"step": 4195,
"valid_targets_mean": 8750.2,
"valid_targets_min": 2849
},
{
"epoch": 4.03072,
"grad_norm": 0.11851887247821241,
"learning_rate": 4.415423999576091e-06,
"loss": 0.0595,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.018436409533023834,
"step": 4200,
"valid_targets_mean": 8257.3,
"valid_targets_min": 2090
},
{
"epoch": 4.03552,
"grad_norm": 0.12943593708733644,
"learning_rate": 4.373520473503097e-06,
"loss": 0.0601,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.022049235180020332,
"step": 4205,
"valid_targets_mean": 8969.0,
"valid_targets_min": 1560
},
{
"epoch": 4.04032,
"grad_norm": 0.12087582197109357,
"learning_rate": 4.33179231126321e-06,
"loss": 0.0566,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.017242740839719772,
"step": 4210,
"valid_targets_mean": 8371.2,
"valid_targets_min": 3676
},
{
"epoch": 4.04512,
"grad_norm": 0.12253314755510665,
"learning_rate": 4.2902399811391575e-06,
"loss": 0.06,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.019466323778033257,
"step": 4215,
"valid_targets_mean": 9305.2,
"valid_targets_min": 4992
},
{
"epoch": 4.04992,
"grad_norm": 0.11319613242190042,
"learning_rate": 4.248863949440436e-06,
"loss": 0.0586,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.018419280648231506,
"step": 4220,
"valid_targets_mean": 9305.4,
"valid_targets_min": 3216
},
{
"epoch": 4.05472,
"grad_norm": 0.12553938847694884,
"learning_rate": 4.207664680498094e-06,
"loss": 0.0591,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.01968151330947876,
"step": 4225,
"valid_targets_mean": 9126.7,
"valid_targets_min": 2259
},
{
"epoch": 4.05952,
"grad_norm": 0.12183311961705774,
"learning_rate": 4.166642636659495e-06,
"loss": 0.0602,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.01877449080348015,
"step": 4230,
"valid_targets_mean": 8311.8,
"valid_targets_min": 3816
},
{
"epoch": 4.06432,
"grad_norm": 0.1174766482044172,
"learning_rate": 4.125798278283155e-06,
"loss": 0.0576,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.017112433910369873,
"step": 4235,
"valid_targets_mean": 8814.9,
"valid_targets_min": 2509
},
{
"epoch": 4.06912,
"grad_norm": 0.11859507691645307,
"learning_rate": 4.085132063733554e-06,
"loss": 0.0599,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02330220490694046,
"step": 4240,
"valid_targets_mean": 8392.0,
"valid_targets_min": 2719
},
{
"epoch": 4.07392,
"grad_norm": 0.12638051636040903,
"learning_rate": 4.0446444493760165e-06,
"loss": 0.0614,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.01938215270638466,
"step": 4245,
"valid_targets_mean": 8159.9,
"valid_targets_min": 3346
},
{
"epoch": 4.07872,
"grad_norm": 0.1228089615134463,
"learning_rate": 4.004335889571556e-06,
"loss": 0.0585,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0213320329785347,
"step": 4250,
"valid_targets_mean": 8913.4,
"valid_targets_min": 2661
},
{
"epoch": 4.08352,
"grad_norm": 0.11774846166929161,
"learning_rate": 3.96420683667182e-06,
"loss": 0.059,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.017504338175058365,
"step": 4255,
"valid_targets_mean": 8633.9,
"valid_targets_min": 3543
},
{
"epoch": 4.08832,
"grad_norm": 0.11486128306446362,
"learning_rate": 3.924257741013968e-06,
"loss": 0.0593,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.01892087049782276,
"step": 4260,
"valid_targets_mean": 9490.9,
"valid_targets_min": 5870
},
{
"epoch": 4.09312,
"grad_norm": 0.12123842804798597,
"learning_rate": 3.884489050915652e-06,
"loss": 0.0577,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.017838746309280396,
"step": 4265,
"valid_targets_mean": 9250.5,
"valid_targets_min": 2459
},
{
"epoch": 4.09792,
"grad_norm": 0.12190469160340199,
"learning_rate": 3.844901212669962e-06,
"loss": 0.0583,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.019511397927999496,
"step": 4270,
"valid_targets_mean": 8654.8,
"valid_targets_min": 4446
},
{
"epoch": 4.10272,
"grad_norm": 0.12941809477086033,
"learning_rate": 3.8054946705404415e-06,
"loss": 0.0607,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.021360494196414948,
"step": 4275,
"valid_targets_mean": 7698.9,
"valid_targets_min": 2140
},
{
"epoch": 4.10752,
"grad_norm": 0.11911570039785059,
"learning_rate": 3.7662698667560714e-06,
"loss": 0.058,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.022066941484808922,
"step": 4280,
"valid_targets_mean": 8562.8,
"valid_targets_min": 2101
},
{
"epoch": 4.11232,
"grad_norm": 0.1237060154496202,
"learning_rate": 3.7272272415063484e-06,
"loss": 0.0596,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.020797599107027054,
"step": 4285,
"valid_targets_mean": 9182.3,
"valid_targets_min": 2194
},
{
"epoch": 4.11712,
"grad_norm": 0.12222076744088618,
"learning_rate": 3.6883672329363007e-06,
"loss": 0.0615,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.020003672689199448,
"step": 4290,
"valid_targets_mean": 8025.3,
"valid_targets_min": 2380
},
{
"epoch": 4.12192,
"grad_norm": 0.1268561459483808,
"learning_rate": 3.649690277141598e-06,
"loss": 0.0592,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.020146148279309273,
"step": 4295,
"valid_targets_mean": 8866.0,
"valid_targets_min": 1757
},
{
"epoch": 4.12672,
"grad_norm": 0.1203324885785926,
"learning_rate": 3.6111968081636507e-06,
"loss": 0.0616,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.021221231669187546,
"step": 4300,
"valid_targets_mean": 8719.1,
"valid_targets_min": 3671
},
{
"epoch": 4.13152,
"grad_norm": 0.12018186551080842,
"learning_rate": 3.572887257984743e-06,
"loss": 0.0603,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.01852181926369667,
"step": 4305,
"valid_targets_mean": 8375.8,
"valid_targets_min": 2431
},
{
"epoch": 4.1363199999999996,
"grad_norm": 0.11684594358500293,
"learning_rate": 3.5347620565231733e-06,
"loss": 0.0563,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.016558483242988586,
"step": 4310,
"valid_targets_mean": 8316.6,
"valid_targets_min": 3148
},
{
"epoch": 4.14112,
"grad_norm": 0.1145696786032025,
"learning_rate": 3.496821631628442e-06,
"loss": 0.0556,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.016824206337332726,
"step": 4315,
"valid_targets_mean": 9543.6,
"valid_targets_min": 5120
},
{
"epoch": 4.14592,
"grad_norm": 0.1329769792894044,
"learning_rate": 3.459066409076448e-06,
"loss": 0.0577,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.020469941198825836,
"step": 4320,
"valid_targets_mean": 9157.2,
"valid_targets_min": 4740
},
{
"epoch": 4.15072,
"grad_norm": 0.12076030631519495,
"learning_rate": 3.421496812564713e-06,
"loss": 0.058,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.019596287980675697,
"step": 4325,
"valid_targets_mean": 9119.2,
"valid_targets_min": 2239
},
{
"epoch": 4.15552,
"grad_norm": 0.12445424995710275,
"learning_rate": 3.384113263707609e-06,
"loss": 0.0579,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.018446721136569977,
"step": 4330,
"valid_targets_mean": 7905.8,
"valid_targets_min": 2773
},
{
"epoch": 4.16032,
"grad_norm": 0.11984162900794601,
"learning_rate": 3.34691618203165e-06,
"loss": 0.0606,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.018406976014375687,
"step": 4335,
"valid_targets_mean": 9256.8,
"valid_targets_min": 2197
},
{
"epoch": 4.16512,
"grad_norm": 0.12179081674701153,
"learning_rate": 3.309905984970765e-06,
"loss": 0.0585,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.017512843012809753,
"step": 4340,
"valid_targets_mean": 8542.8,
"valid_targets_min": 2767
},
{
"epoch": 4.16992,
"grad_norm": 0.11759843922722205,
"learning_rate": 3.2730830878616305e-06,
"loss": 0.0608,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02117135003209114,
"step": 4345,
"valid_targets_mean": 9212.2,
"valid_targets_min": 2958
},
{
"epoch": 4.17472,
"grad_norm": 0.11807834168622429,
"learning_rate": 3.2364479039389973e-06,
"loss": 0.0606,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.018724609166383743,
"step": 4350,
"valid_targets_mean": 8196.4,
"valid_targets_min": 1964
},
{
"epoch": 4.17952,
"grad_norm": 0.1243844477116557,
"learning_rate": 3.2000008443310505e-06,
"loss": 0.0598,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02250153385102749,
"step": 4355,
"valid_targets_mean": 9202.8,
"valid_targets_min": 1686
},
{
"epoch": 4.18432,
"grad_norm": 0.11956480020734431,
"learning_rate": 3.1637423180548232e-06,
"loss": 0.0579,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.022235415875911713,
"step": 4360,
"valid_targets_mean": 9636.3,
"valid_targets_min": 1629
},
{
"epoch": 4.18912,
"grad_norm": 0.1185081417491982,
"learning_rate": 3.127672732011564e-06,
"loss": 0.0619,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.022327009588479996,
"step": 4365,
"valid_targets_mean": 9096.0,
"valid_targets_min": 4447
},
{
"epoch": 4.19392,
"grad_norm": 0.12464353748951823,
"learning_rate": 3.0917924909821993e-06,
"loss": 0.0586,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.022116748616099358,
"step": 4370,
"valid_targets_mean": 8855.2,
"valid_targets_min": 2971
},
{
"epoch": 4.19872,
"grad_norm": 0.11711235388240054,
"learning_rate": 3.0561019976227867e-06,
"loss": 0.0579,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.01701711304485798,
"step": 4375,
"valid_targets_mean": 8770.3,
"valid_targets_min": 3883
},
{
"epoch": 4.20352,
"grad_norm": 0.12209386881284948,
"learning_rate": 3.020601652459989e-06,
"loss": 0.0607,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.018716298043727875,
"step": 4380,
"valid_targets_mean": 8453.9,
"valid_targets_min": 2471
},
{
"epoch": 4.20832,
"grad_norm": 0.1179732819427151,
"learning_rate": 2.9852918538865847e-06,
"loss": 0.0586,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.01898093894124031,
"step": 4385,
"valid_targets_mean": 8763.5,
"valid_targets_min": 1581
},
{
"epoch": 4.21312,
"grad_norm": 0.12433317521576756,
"learning_rate": 2.950172998156995e-06,
"loss": 0.0624,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.023141473531723022,
"step": 4390,
"valid_targets_mean": 9088.0,
"valid_targets_min": 3503
},
{
"epoch": 4.21792,
"grad_norm": 0.12187721181458719,
"learning_rate": 2.91524547938284e-06,
"loss": 0.057,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.019292142242193222,
"step": 4395,
"valid_targets_mean": 9112.7,
"valid_targets_min": 3780
},
{
"epoch": 4.22272,
"grad_norm": 0.1249249599539274,
"learning_rate": 2.880509689528519e-06,
"loss": 0.0589,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.020155327394604683,
"step": 4400,
"valid_targets_mean": 8781.4,
"valid_targets_min": 4800
},
{
"epoch": 4.22752,
"grad_norm": 0.12130990173874953,
"learning_rate": 2.845966018406796e-06,
"loss": 0.0602,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.01886666938662529,
"step": 4405,
"valid_targets_mean": 8720.8,
"valid_targets_min": 3689
},
{
"epoch": 4.23232,
"grad_norm": 0.12261482199844286,
"learning_rate": 2.8116148536744448e-06,
"loss": 0.0601,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02107727900147438,
"step": 4410,
"valid_targets_mean": 8796.9,
"valid_targets_min": 4312
},
{
"epoch": 4.23712,
"grad_norm": 0.12041082622457164,
"learning_rate": 2.777456580827882e-06,
"loss": 0.0591,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02132035419344902,
"step": 4415,
"valid_targets_mean": 8781.2,
"valid_targets_min": 2402
},
{
"epoch": 4.24192,
"grad_norm": 0.12018775604857752,
"learning_rate": 2.7434915831988517e-06,
"loss": 0.0603,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.022251714020967484,
"step": 4420,
"valid_targets_mean": 9274.4,
"valid_targets_min": 2195
},
{
"epoch": 4.24672,
"grad_norm": 0.12398684759078817,
"learning_rate": 2.7097202419501246e-06,
"loss": 0.0596,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.018055105581879616,
"step": 4425,
"valid_targets_mean": 7853.2,
"valid_targets_min": 2163
},
{
"epoch": 4.25152,
"grad_norm": 0.12381260153578,
"learning_rate": 2.6761429360712045e-06,
"loss": 0.0624,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.022460700944066048,
"step": 4430,
"valid_targets_mean": 7861.3,
"valid_targets_min": 2928
},
{
"epoch": 4.25632,
"grad_norm": 0.12825189987605026,
"learning_rate": 2.642760042374106e-06,
"loss": 0.0597,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.020237209275364876,
"step": 4435,
"valid_targets_mean": 8969.5,
"valid_targets_min": 3671
},
{
"epoch": 4.26112,
"grad_norm": 0.11707780055325222,
"learning_rate": 2.6095719354890903e-06,
"loss": 0.061,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02044464461505413,
"step": 4440,
"valid_targets_mean": 9385.6,
"valid_targets_min": 5255
},
{
"epoch": 4.26592,
"grad_norm": 0.12130109167017335,
"learning_rate": 2.5765789878604852e-06,
"loss": 0.06,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.021732307970523834,
"step": 4445,
"valid_targets_mean": 8074.7,
"valid_targets_min": 1889
},
{
"epoch": 4.27072,
"grad_norm": 0.12861534811780176,
"learning_rate": 2.543781569742496e-06,
"loss": 0.0607,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.021149098873138428,
"step": 4450,
"valid_targets_mean": 8897.9,
"valid_targets_min": 4566
},
{
"epoch": 4.27552,
"grad_norm": 0.12345473230408648,
"learning_rate": 2.5111800491950523e-06,
"loss": 0.0616,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.017032301053404808,
"step": 4455,
"valid_targets_mean": 8499.6,
"valid_targets_min": 4038
},
{
"epoch": 4.28032,
"grad_norm": 0.11892032327078929,
"learning_rate": 2.4787747920796723e-06,
"loss": 0.0583,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.021471751853823662,
"step": 4460,
"valid_targets_mean": 8411.4,
"valid_targets_min": 2210
},
{
"epoch": 4.28512,
"grad_norm": 0.12166979430091211,
"learning_rate": 2.446566162055377e-06,
"loss": 0.0563,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.017029765993356705,
"step": 4465,
"valid_targets_mean": 8300.8,
"valid_targets_min": 1868
},
{
"epoch": 4.28992,
"grad_norm": 0.11722138076862068,
"learning_rate": 2.414554520574579e-06,
"loss": 0.0603,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.01955687813460827,
"step": 4470,
"valid_targets_mean": 9353.0,
"valid_targets_min": 3294
},
{
"epoch": 4.29472,
"grad_norm": 0.124316488723136,
"learning_rate": 2.382740226879052e-06,
"loss": 0.0604,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.022426098585128784,
"step": 4475,
"valid_targets_mean": 9120.7,
"valid_targets_min": 1679
},
{
"epoch": 4.29952,
"grad_norm": 0.11579019842855867,
"learning_rate": 2.3511236379958824e-06,
"loss": 0.0602,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.018894197419285774,
"step": 4480,
"valid_targets_mean": 8811.9,
"valid_targets_min": 3885
},
{
"epoch": 4.30432,
"grad_norm": 0.1259214272811187,
"learning_rate": 2.31970510873347e-06,
"loss": 0.0584,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.024906959384679794,
"step": 4485,
"valid_targets_mean": 9129.3,
"valid_targets_min": 3544
},
{
"epoch": 4.30912,
"grad_norm": 0.12084376607932995,
"learning_rate": 2.2884849916775485e-06,
"loss": 0.0616,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.014221737161278725,
"step": 4490,
"valid_targets_mean": 8125.8,
"valid_targets_min": 2826
},
{
"epoch": 4.3139199999999995,
"grad_norm": 0.11679620075564591,
"learning_rate": 2.257463637187225e-06,
"loss": 0.0574,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.021385526284575462,
"step": 4495,
"valid_targets_mean": 8571.7,
"valid_targets_min": 4541
},
{
"epoch": 4.31872,
"grad_norm": 0.12458729359845118,
"learning_rate": 2.2266413933910426e-06,
"loss": 0.058,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02144310250878334,
"step": 4500,
"valid_targets_mean": 8770.7,
"valid_targets_min": 2390
},
{
"epoch": 4.32352,
"grad_norm": 0.1234814545306667,
"learning_rate": 2.196018606183088e-06,
"loss": 0.056,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.01575743779540062,
"step": 4505,
"valid_targets_mean": 8572.1,
"valid_targets_min": 2046
},
{
"epoch": 4.32832,
"grad_norm": 0.1203553321128352,
"learning_rate": 2.1655956192191007e-06,
"loss": 0.0588,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02352827787399292,
"step": 4510,
"valid_targets_mean": 9005.1,
"valid_targets_min": 3201
},
{
"epoch": 4.33312,
"grad_norm": 0.12717131209745855,
"learning_rate": 2.135372773912614e-06,
"loss": 0.0583,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.018232187256217003,
"step": 4515,
"valid_targets_mean": 8639.8,
"valid_targets_min": 4028
},
{
"epoch": 4.33792,
"grad_norm": 0.12297416080936355,
"learning_rate": 2.1053504094311285e-06,
"loss": 0.0611,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02066735178232193,
"step": 4520,
"valid_targets_mean": 8406.8,
"valid_targets_min": 2310
},
{
"epoch": 4.34272,
"grad_norm": 0.11408264364981706,
"learning_rate": 2.0755288626923022e-06,
"loss": 0.0609,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.016809195280075073,
"step": 4525,
"valid_targets_mean": 8664.7,
"valid_targets_min": 2680
},
{
"epoch": 4.34752,
"grad_norm": 0.11366877193389748,
"learning_rate": 2.0459084683601736e-06,
"loss": 0.0587,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.018915891647338867,
"step": 4530,
"valid_targets_mean": 9101.0,
"valid_targets_min": 4064
},
{
"epoch": 4.35232,
"grad_norm": 0.11780725593526946,
"learning_rate": 2.0164895588414037e-06,
"loss": 0.0573,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02268713340163231,
"step": 4535,
"valid_targets_mean": 9264.6,
"valid_targets_min": 2587
},
{
"epoch": 4.35712,
"grad_norm": 0.11864430396627579,
"learning_rate": 1.987272464281551e-06,
"loss": 0.0595,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.01781759038567543,
"step": 4540,
"valid_targets_mean": 8280.8,
"valid_targets_min": 2616
},
{
"epoch": 4.36192,
"grad_norm": 0.12342667279516402,
"learning_rate": 1.95825751256135e-06,
"loss": 0.0603,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.021349921822547913,
"step": 4545,
"valid_targets_mean": 7914.7,
"valid_targets_min": 4779
},
{
"epoch": 4.36672,
"grad_norm": 0.12657913615634134,
"learning_rate": 1.9294450292930576e-06,
"loss": 0.0614,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02445283532142639,
"step": 4550,
"valid_targets_mean": 8156.9,
"valid_targets_min": 3044
},
{
"epoch": 4.37152,
"grad_norm": 0.11859983603277927,
"learning_rate": 1.9008353378167755e-06,
"loss": 0.0589,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.022507328540086746,
"step": 4555,
"valid_targets_mean": 9130.3,
"valid_targets_min": 4855
},
{
"epoch": 4.37632,
"grad_norm": 0.11788766940094339,
"learning_rate": 1.8724287591968294e-06,
"loss": 0.0601,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.022499315440654755,
"step": 4560,
"valid_targets_mean": 8801.2,
"valid_targets_min": 4940
},
{
"epoch": 4.38112,
"grad_norm": 0.11786646314018358,
"learning_rate": 1.8442256122181735e-06,
"loss": 0.0597,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.027995608747005463,
"step": 4565,
"valid_targets_mean": 8043.8,
"valid_targets_min": 3907
},
{
"epoch": 4.38592,
"grad_norm": 0.11870348032090175,
"learning_rate": 1.8162262133828013e-06,
"loss": 0.0605,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.01562669314444065,
"step": 4570,
"valid_targets_mean": 8143.3,
"valid_targets_min": 2952
},
{
"epoch": 4.39072,
"grad_norm": 0.11550723988467981,
"learning_rate": 1.7884308769061974e-06,
"loss": 0.06,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.017535259947180748,
"step": 4575,
"valid_targets_mean": 8207.1,
"valid_targets_min": 1407
},
{
"epoch": 4.39552,
"grad_norm": 0.12858179033167436,
"learning_rate": 1.7608399147138278e-06,
"loss": 0.0606,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.021043431013822556,
"step": 4580,
"valid_targets_mean": 9255.1,
"valid_targets_min": 5243
},
{
"epoch": 4.40032,
"grad_norm": 0.12484115877372373,
"learning_rate": 1.7334536364376075e-06,
"loss": 0.0609,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.01975128799676895,
"step": 4585,
"valid_targets_mean": 8706.5,
"valid_targets_min": 3138
},
{
"epoch": 4.40512,
"grad_norm": 0.11517365050643107,
"learning_rate": 1.7062723494124545e-06,
"loss": 0.0573,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0198981910943985,
"step": 4590,
"valid_targets_mean": 8627.3,
"valid_targets_min": 2762
},
{
"epoch": 4.40992,
"grad_norm": 0.12275506403955044,
"learning_rate": 1.6792963586728195e-06,
"loss": 0.0585,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02215822972357273,
"step": 4595,
"valid_targets_mean": 8069.7,
"valid_targets_min": 2209
},
{
"epoch": 4.41472,
"grad_norm": 0.12581924286742757,
"learning_rate": 1.6525259669492832e-06,
"loss": 0.0615,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.014441033825278282,
"step": 4600,
"valid_targets_mean": 8204.5,
"valid_targets_min": 2901
},
{
"epoch": 4.41952,
"grad_norm": 0.11581290951072448,
"learning_rate": 1.6259614746651364e-06,
"loss": 0.059,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02150608040392399,
"step": 4605,
"valid_targets_mean": 9324.2,
"valid_targets_min": 2902
},
{
"epoch": 4.42432,
"grad_norm": 0.1170339216117605,
"learning_rate": 1.5996031799330315e-06,
"loss": 0.0594,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.020407576113939285,
"step": 4610,
"valid_targets_mean": 9710.2,
"valid_targets_min": 6487
},
{
"epoch": 4.42912,
"grad_norm": 0.12174555375272791,
"learning_rate": 1.5734513785516227e-06,
"loss": 0.0601,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.023040469735860825,
"step": 4615,
"valid_targets_mean": 8550.7,
"valid_targets_min": 3146
},
{
"epoch": 4.43392,
"grad_norm": 0.11719954446471759,
"learning_rate": 1.5475063640022425e-06,
"loss": 0.0565,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.021581973880529404,
"step": 4620,
"valid_targets_mean": 8845.3,
"valid_targets_min": 3193
},
{
"epoch": 4.43872,
"grad_norm": 0.12444180899873919,
"learning_rate": 1.5217684274456314e-06,
"loss": 0.0607,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02068684622645378,
"step": 4625,
"valid_targets_mean": 8613.9,
"valid_targets_min": 2223
},
{
"epoch": 4.44352,
"grad_norm": 0.11633434401162951,
"learning_rate": 1.496237857718641e-06,
"loss": 0.0557,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.020495615899562836,
"step": 4630,
"valid_targets_mean": 9103.2,
"valid_targets_min": 3690
},
{
"epoch": 4.44832,
"grad_norm": 0.11590364344133595,
"learning_rate": 1.4709149413310076e-06,
"loss": 0.0582,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.020342785865068436,
"step": 4635,
"valid_targets_mean": 8995.2,
"valid_targets_min": 3398
},
{
"epoch": 4.45312,
"grad_norm": 0.12329134950235973,
"learning_rate": 1.445799962462142e-06,
"loss": 0.0599,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.023403488099575043,
"step": 4640,
"valid_targets_mean": 9009.5,
"valid_targets_min": 2608
},
{
"epoch": 4.45792,
"grad_norm": 0.11404195513457407,
"learning_rate": 1.420893202957927e-06,
"loss": 0.0611,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0181783065199852,
"step": 4645,
"valid_targets_mean": 8686.3,
"valid_targets_min": 5259
},
{
"epoch": 4.46272,
"grad_norm": 0.11754587410173165,
"learning_rate": 1.3961949423275622e-06,
"loss": 0.0595,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.016123849898576736,
"step": 4650,
"valid_targets_mean": 9019.9,
"valid_targets_min": 4229
},
{
"epoch": 4.46752,
"grad_norm": 0.11564141223039769,
"learning_rate": 1.3717054577404331e-06,
"loss": 0.06,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.01637781225144863,
"step": 4655,
"valid_targets_mean": 8115.4,
"valid_targets_min": 2226
},
{
"epoch": 4.47232,
"grad_norm": 0.1198827197232521,
"learning_rate": 1.347425024022988e-06,
"loss": 0.0608,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0225857961922884,
"step": 4660,
"valid_targets_mean": 9256.1,
"valid_targets_min": 2916
},
{
"epoch": 4.47712,
"grad_norm": 0.12018530901808909,
"learning_rate": 1.3233539136556606e-06,
"loss": 0.0573,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.021104391664266586,
"step": 4665,
"valid_targets_mean": 8460.7,
"valid_targets_min": 4730
},
{
"epoch": 4.48192,
"grad_norm": 0.11519884136211274,
"learning_rate": 1.2994923967698125e-06,
"loss": 0.0586,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.018374186009168625,
"step": 4670,
"valid_targets_mean": 8961.7,
"valid_targets_min": 1893
},
{
"epoch": 4.48672,
"grad_norm": 0.11839023097383723,
"learning_rate": 1.2758407411446982e-06,
"loss": 0.0571,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.01913219690322876,
"step": 4675,
"valid_targets_mean": 8664.0,
"valid_targets_min": 3331
},
{
"epoch": 4.49152,
"grad_norm": 0.11419982429935628,
"learning_rate": 1.252399212204467e-06,
"loss": 0.0584,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0173068605363369,
"step": 4680,
"valid_targets_mean": 9348.1,
"valid_targets_min": 4816
},
{
"epoch": 4.49632,
"grad_norm": 0.11701309750429871,
"learning_rate": 1.22916807301517e-06,
"loss": 0.0579,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.01966226100921631,
"step": 4685,
"valid_targets_mean": 8759.7,
"valid_targets_min": 2106
},
{
"epoch": 4.50112,
"grad_norm": 0.12539881289660457,
"learning_rate": 1.2061475842818337e-06,
"loss": 0.0599,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.023415343835949898,
"step": 4690,
"valid_targets_mean": 8409.9,
"valid_targets_min": 3145
},
{
"epoch": 4.50592,
"grad_norm": 0.12883054072840242,
"learning_rate": 1.1833380043455e-06,
"loss": 0.0573,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.022276621311903,
"step": 4695,
"valid_targets_mean": 8735.2,
"valid_targets_min": 2713
},
{
"epoch": 4.51072,
"grad_norm": 0.11870029933701683,
"learning_rate": 1.1607395891803641e-06,
"loss": 0.0585,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.018026743084192276,
"step": 4700,
"valid_targets_mean": 8477.8,
"valid_targets_min": 2119
},
{
"epoch": 4.51552,
"grad_norm": 0.12926973339646206,
"learning_rate": 1.1383525923908678e-06,
"loss": 0.0588,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.021603520959615707,
"step": 4705,
"valid_targets_mean": 8258.6,
"valid_targets_min": 1976
},
{
"epoch": 4.52032,
"grad_norm": 0.1252253936787309,
"learning_rate": 1.1161772652088775e-06,
"loss": 0.0608,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.022924084216356277,
"step": 4710,
"valid_targets_mean": 9499.5,
"valid_targets_min": 5268
},
{
"epoch": 4.52512,
"grad_norm": 0.11418574330977625,
"learning_rate": 1.094213856490849e-06,
"loss": 0.0595,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.01998257264494896,
"step": 4715,
"valid_targets_mean": 8799.8,
"valid_targets_min": 2185
},
{
"epoch": 4.52992,
"grad_norm": 0.11970402415901457,
"learning_rate": 1.0724626127150462e-06,
"loss": 0.0592,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.021041162312030792,
"step": 4720,
"valid_targets_mean": 9400.4,
"valid_targets_min": 3753
},
{
"epoch": 4.53472,
"grad_norm": 0.12487355432604856,
"learning_rate": 1.0509237779787717e-06,
"loss": 0.0551,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.020584046840667725,
"step": 4725,
"valid_targets_mean": 8329.1,
"valid_targets_min": 2687
},
{
"epoch": 4.5395199999999996,
"grad_norm": 0.1162808601114574,
"learning_rate": 1.029597593995626e-06,
"loss": 0.0613,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.017470069229602814,
"step": 4730,
"valid_targets_mean": 8599.2,
"valid_targets_min": 2352
},
{
"epoch": 4.54432,
"grad_norm": 0.11243973717046013,
"learning_rate": 1.008484300092798e-06,
"loss": 0.0576,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.01999412477016449,
"step": 4735,
"valid_targets_mean": 10049.0,
"valid_targets_min": 3022
},
{
"epoch": 4.54912,
"grad_norm": 0.12376778314874719,
"learning_rate": 9.87584133208368e-07,
"loss": 0.0615,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02172812819480896,
"step": 4740,
"valid_targets_mean": 8882.0,
"valid_targets_min": 3163
},
{
"epoch": 4.55392,
"grad_norm": 0.11754286609015283,
"learning_rate": 9.66897327888665e-07,
"loss": 0.0582,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.01753995195031166,
"step": 4745,
"valid_targets_mean": 8957.7,
"valid_targets_min": 2101
},
{
"epoch": 4.55872,
"grad_norm": 0.12288692811727639,
"learning_rate": 9.464241162856269e-07,
"loss": 0.0598,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.022371970117092133,
"step": 4750,
"valid_targets_mean": 9342.5,
"valid_targets_min": 3010
},
{
"epoch": 4.5635200000000005,
"grad_norm": 0.12193809956698538,
"learning_rate": 9.261647281541908e-07,
"loss": 0.0605,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.019677281379699707,
"step": 4755,
"valid_targets_mean": 8768.8,
"valid_targets_min": 2073
},
{
"epoch": 4.56832,
"grad_norm": 0.1179844087692095,
"learning_rate": 9.061193908497201e-07,
"loss": 0.0588,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02046424336731434,
"step": 4760,
"valid_targets_mean": 8664.7,
"valid_targets_min": 2635
},
{
"epoch": 4.57312,
"grad_norm": 0.128157116339437,
"learning_rate": 8.862883293254598e-07,
"loss": 0.0578,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.022372746840119362,
"step": 4765,
"valid_targets_mean": 9003.5,
"valid_targets_min": 2891
},
{
"epoch": 4.57792,
"grad_norm": 0.11544338584988456,
"learning_rate": 8.666717661299917e-07,
"loss": 0.059,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.015689603984355927,
"step": 4770,
"valid_targets_mean": 7997.3,
"valid_targets_min": 1727
},
{
"epoch": 4.58272,
"grad_norm": 0.12217872408661101,
"learning_rate": 8.472699214047652e-07,
"loss": 0.0614,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.022685006260871887,
"step": 4775,
"valid_targets_mean": 8804.0,
"valid_targets_min": 4118
},
{
"epoch": 4.58752,
"grad_norm": 0.12274599705948007,
"learning_rate": 8.280830128815953e-07,
"loss": 0.0616,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.01906590908765793,
"step": 4780,
"valid_targets_mean": 9177.7,
"valid_targets_min": 3296
},
{
"epoch": 4.59232,
"grad_norm": 0.13080453191813954,
"learning_rate": 8.09111255880246e-07,
"loss": 0.0607,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.018022168427705765,
"step": 4785,
"valid_targets_mean": 8568.4,
"valid_targets_min": 3204
},
{
"epoch": 4.59712,
"grad_norm": 0.11609891660815055,
"learning_rate": 7.903548633059955e-07,
"loss": 0.0594,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.015199240297079086,
"step": 4790,
"valid_targets_mean": 9195.6,
"valid_targets_min": 4123
},
{
"epoch": 4.60192,
"grad_norm": 0.11296055178630578,
"learning_rate": 7.718140456472612e-07,
"loss": 0.0579,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.019392728805541992,
"step": 4795,
"valid_targets_mean": 10019.9,
"valid_targets_min": 2701
},
{
"epoch": 4.60672,
"grad_norm": 0.11439403685364499,
"learning_rate": 7.534890109732229e-07,
"loss": 0.0591,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.020609967410564423,
"step": 4800,
"valid_targets_mean": 9014.2,
"valid_targets_min": 1364
},
{
"epoch": 4.61152,
"grad_norm": 0.1327213756348675,
"learning_rate": 7.353799649315085e-07,
"loss": 0.0458,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.019029157236218452,
"step": 4805,
"valid_targets_mean": 9159.7,
"valid_targets_min": 3538
},
{
"epoch": 4.61632,
"grad_norm": 0.1306512860306434,
"learning_rate": 7.174871107458603e-07,
"loss": 0.0445,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.013268783688545227,
"step": 4810,
"valid_targets_mean": 8492.3,
"valid_targets_min": 2660
},
{
"epoch": 4.62112,
"grad_norm": 0.12316003257913177,
"learning_rate": 6.998106492138724e-07,
"loss": 0.0445,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.016152355819940567,
"step": 4815,
"valid_targets_mean": 9058.9,
"valid_targets_min": 4044
},
{
"epoch": 4.62592,
"grad_norm": 0.13208488394402484,
"learning_rate": 6.823507787047346e-07,
"loss": 0.0472,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.01765730045735836,
"step": 4820,
"valid_targets_mean": 9080.8,
"valid_targets_min": 1329
},
{
"epoch": 4.63072,
"grad_norm": 0.12845900831200494,
"learning_rate": 6.65107695156999e-07,
"loss": 0.0478,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.019706537947058678,
"step": 4825,
"valid_targets_mean": 8834.9,
"valid_targets_min": 2746
},
{
"epoch": 4.63552,
"grad_norm": 0.12699103671556508,
"learning_rate": 6.480815920763905e-07,
"loss": 0.0469,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.015223637223243713,
"step": 4830,
"valid_targets_mean": 8278.7,
"valid_targets_min": 2883
},
{
"epoch": 4.64032,
"grad_norm": 0.13082167598049418,
"learning_rate": 6.312726605336306e-07,
"loss": 0.0483,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.01759178563952446,
"step": 4835,
"valid_targets_mean": 8804.4,
"valid_targets_min": 1917
},
{
"epoch": 4.64512,
"grad_norm": 0.11954497001490652,
"learning_rate": 6.146810891622923e-07,
"loss": 0.0468,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.016691675409674644,
"step": 4840,
"valid_targets_mean": 9112.6,
"valid_targets_min": 2572
},
{
"epoch": 4.64992,
"grad_norm": 0.12299775936346398,
"learning_rate": 5.983070641566802e-07,
"loss": 0.0479,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.01542404480278492,
"step": 4845,
"valid_targets_mean": 9376.9,
"valid_targets_min": 4022
},
{
"epoch": 4.65472,
"grad_norm": 0.12357084213291525,
"learning_rate": 5.821507692697537e-07,
"loss": 0.0481,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.016300935298204422,
"step": 4850,
"valid_targets_mean": 8835.5,
"valid_targets_min": 2927
},
{
"epoch": 4.65952,
"grad_norm": 0.11639361498636804,
"learning_rate": 5.662123858110513e-07,
"loss": 0.0453,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.012974596582353115,
"step": 4855,
"valid_targets_mean": 9376.3,
"valid_targets_min": 4422
},
{
"epoch": 4.66432,
"grad_norm": 0.1973531314250708,
"learning_rate": 5.504920926446611e-07,
"loss": 0.0429,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.014859823510050774,
"step": 4860,
"valid_targets_mean": 9044.0,
"valid_targets_min": 2028
},
{
"epoch": 4.66912,
"grad_norm": 0.12053965390150939,
"learning_rate": 5.349900661872132e-07,
"loss": 0.0435,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.013551025651395321,
"step": 4865,
"valid_targets_mean": 8233.1,
"valid_targets_min": 2519
},
{
"epoch": 4.67392,
"grad_norm": 0.13237236041105185,
"learning_rate": 5.197064804058971e-07,
"loss": 0.0455,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.015264524146914482,
"step": 4870,
"valid_targets_mean": 8967.7,
"valid_targets_min": 4346
},
{
"epoch": 4.67872,
"grad_norm": 0.12851803325820077,
"learning_rate": 5.046415068165234e-07,
"loss": 0.0435,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.01638580672442913,
"step": 4875,
"valid_targets_mean": 8687.0,
"valid_targets_min": 1807
},
{
"epoch": 4.68352,
"grad_norm": 0.12984651854096851,
"learning_rate": 4.897953144815759e-07,
"loss": 0.0443,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.013979455456137657,
"step": 4880,
"valid_targets_mean": 8094.6,
"valid_targets_min": 3964
},
{
"epoch": 4.68832,
"grad_norm": 0.12218670654596375,
"learning_rate": 4.7516807000833165e-07,
"loss": 0.0473,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.014194248244166374,
"step": 4885,
"valid_targets_mean": 8910.1,
"valid_targets_min": 4014
},
{
"epoch": 4.69312,
"grad_norm": 0.13244930235944974,
"learning_rate": 4.6075993754698623e-07,
"loss": 0.0474,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.017760399729013443,
"step": 4890,
"valid_targets_mean": 8803.0,
"valid_targets_min": 2878
},
{
"epoch": 4.69792,
"grad_norm": 0.12159738107311469,
"learning_rate": 4.4657107878881113e-07,
"loss": 0.0457,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.01536801178008318,
"step": 4895,
"valid_targets_mean": 8669.1,
"valid_targets_min": 2293
},
{
"epoch": 4.70272,
"grad_norm": 0.13108853234312876,
"learning_rate": 4.326016529643351e-07,
"loss": 0.0448,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.015306061133742332,
"step": 4900,
"valid_targets_mean": 8503.5,
"valid_targets_min": 1683
},
{
"epoch": 4.70752,
"grad_norm": 0.128634595478892,
"learning_rate": 4.1885181684157005e-07,
"loss": 0.0475,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.018076792359352112,
"step": 4905,
"valid_targets_mean": 8681.2,
"valid_targets_min": 3721
},
{
"epoch": 4.71232,
"grad_norm": 0.12249409189586784,
"learning_rate": 4.053217247242369e-07,
"loss": 0.0446,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.015645861625671387,
"step": 4910,
"valid_targets_mean": 9035.6,
"valid_targets_min": 2773
},
{
"epoch": 4.7171199999999995,
"grad_norm": 0.13008375294057498,
"learning_rate": 3.9201152845004476e-07,
"loss": 0.0444,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.014394369907677174,
"step": 4915,
"valid_targets_mean": 8486.8,
"valid_targets_min": 2407
},
{
"epoch": 4.72192,
"grad_norm": 0.12484127400367312,
"learning_rate": 3.789213773889744e-07,
"loss": 0.0435,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.016258973628282547,
"step": 4920,
"valid_targets_mean": 9018.9,
"valid_targets_min": 1964
},
{
"epoch": 4.72672,
"grad_norm": 0.12298816364049474,
"learning_rate": 3.6605141844162417e-07,
"loss": 0.0416,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.01498118694871664,
"step": 4925,
"valid_targets_mean": 8734.2,
"valid_targets_min": 2137
},
{
"epoch": 4.73152,
"grad_norm": 0.12495538982194321,
"learning_rate": 3.5340179603753354e-07,
"loss": 0.0456,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.01642123982310295,
"step": 4930,
"valid_targets_mean": 8728.7,
"valid_targets_min": 1857
},
{
"epoch": 4.73632,
"grad_norm": 0.12397318336703354,
"learning_rate": 3.4097265213358435e-07,
"loss": 0.043,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.013172818347811699,
"step": 4935,
"valid_targets_mean": 8926.8,
"valid_targets_min": 3677
},
{
"epoch": 4.7411200000000004,
"grad_norm": 0.13443930370760981,
"learning_rate": 3.287641262123975e-07,
"loss": 0.0459,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.016371993348002434,
"step": 4940,
"valid_targets_mean": 8540.3,
"valid_targets_min": 1162
},
{
"epoch": 4.74592,
"grad_norm": 0.12803940564558636,
"learning_rate": 3.1677635528076566e-07,
"loss": 0.0445,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.011617720127105713,
"step": 4945,
"valid_targets_mean": 9372.5,
"valid_targets_min": 1983
},
{
"epoch": 4.75072,
"grad_norm": 0.1306802799160656,
"learning_rate": 3.0500947386812973e-07,
"loss": 0.0465,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.014903305098414421,
"step": 4950,
"valid_targets_mean": 8770.1,
"valid_targets_min": 2285
},
{
"epoch": 4.75552,
"grad_norm": 0.12387300110011946,
"learning_rate": 2.934636140250513e-07,
"loss": 0.0436,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.012026086449623108,
"step": 4955,
"valid_targets_mean": 8344.1,
"valid_targets_min": 2375
},
{
"epoch": 4.76032,
"grad_norm": 0.20661769231404678,
"learning_rate": 2.821389053217383e-07,
"loss": 0.0432,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.014603785239160061,
"step": 4960,
"valid_targets_mean": 8906.2,
"valid_targets_min": 2707
},
{
"epoch": 4.76512,
"grad_norm": 0.12591591545112674,
"learning_rate": 2.710354748465949e-07,
"loss": 0.0467,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.014467072673141956,
"step": 4965,
"valid_targets_mean": 8309.1,
"valid_targets_min": 1618
},
{
"epoch": 4.76992,
"grad_norm": 0.12713363799656874,
"learning_rate": 2.6015344720479395e-07,
"loss": 0.0455,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.01415165513753891,
"step": 4970,
"valid_targets_mean": 8002.9,
"valid_targets_min": 2313
},
{
"epoch": 4.77472,
"grad_norm": 0.12508628958334017,
"learning_rate": 2.49492944516867e-07,
"loss": 0.0476,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.013956809416413307,
"step": 4975,
"valid_targets_mean": 7795.5,
"valid_targets_min": 2816
},
{
"epoch": 4.77952,
"grad_norm": 0.1226101397357892,
"learning_rate": 2.3905408641735183e-07,
"loss": 0.0444,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0149923637509346,
"step": 4980,
"valid_targets_mean": 8852.8,
"valid_targets_min": 3019
},
{
"epoch": 4.78432,
"grad_norm": 0.12517540140245537,
"learning_rate": 2.288369900534404e-07,
"loss": 0.0452,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.011800020933151245,
"step": 4985,
"valid_targets_mean": 7697.3,
"valid_targets_min": 3225
},
{
"epoch": 4.7891200000000005,
"grad_norm": 0.12617181013082826,
"learning_rate": 2.1884177008366203e-07,
"loss": 0.0448,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.01531097013503313,
"step": 4990,
"valid_targets_mean": 9043.1,
"valid_targets_min": 2615
},
{
"epoch": 4.79392,
"grad_norm": 0.13162859126890672,
"learning_rate": 2.0906853867660004e-07,
"loss": 0.0423,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.015335047617554665,
"step": 4995,
"valid_targets_mean": 8755.2,
"valid_targets_min": 2833
},
{
"epoch": 4.79872,
"grad_norm": 0.12921873760362335,
"learning_rate": 1.9951740550963493e-07,
"loss": 0.0443,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.013373359106481075,
"step": 5000,
"valid_targets_mean": 8286.6,
"valid_targets_min": 3311
},
{
"epoch": 4.80352,
"grad_norm": 0.1332690682878744,
"learning_rate": 1.9018847776770987e-07,
"loss": 0.0453,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.015984494239091873,
"step": 5005,
"valid_targets_mean": 8718.6,
"valid_targets_min": 2313
},
{
"epoch": 4.80832,
"grad_norm": 0.119227169078396,
"learning_rate": 1.8108186014212935e-07,
"loss": 0.0439,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.01700938306748867,
"step": 5010,
"valid_targets_mean": 10023.7,
"valid_targets_min": 5935
},
{
"epoch": 4.81312,
"grad_norm": 0.12005952635161173,
"learning_rate": 1.7219765482938465e-07,
"loss": 0.044,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.011994611471891403,
"step": 5015,
"valid_targets_mean": 8354.2,
"valid_targets_min": 1889
},
{
"epoch": 4.81792,
"grad_norm": 0.1257252009191287,
"learning_rate": 1.635359615300036e-07,
"loss": 0.0476,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.013933985494077206,
"step": 5020,
"valid_targets_mean": 9395.4,
"valid_targets_min": 2543
},
{
"epoch": 4.82272,
"grad_norm": 0.13135638987722986,
"learning_rate": 1.5509687744744262e-07,
"loss": 0.0456,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.018428293988108635,
"step": 5025,
"valid_targets_mean": 9299.7,
"valid_targets_min": 3480
},
{
"epoch": 4.82752,
"grad_norm": 0.11986507904934081,
"learning_rate": 1.468804972869786e-07,
"loss": 0.0464,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.013786360621452332,
"step": 5030,
"valid_targets_mean": 8602.0,
"valid_targets_min": 4552
},
{
"epoch": 4.83232,
"grad_norm": 0.12665116588140998,
"learning_rate": 1.3888691325465886e-07,
"loss": 0.0463,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.017422419041395187,
"step": 5035,
"valid_targets_mean": 8720.6,
"valid_targets_min": 3791
},
{
"epoch": 4.83712,
"grad_norm": 0.13342700487132997,
"learning_rate": 1.3111621505626616e-07,
"loss": 0.0466,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.016414277255535126,
"step": 5040,
"valid_targets_mean": 9144.7,
"valid_targets_min": 1516
},
{
"epoch": 4.84192,
"grad_norm": 0.12412199123426582,
"learning_rate": 1.235684898963041e-07,
"loss": 0.0428,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.015540607273578644,
"step": 5045,
"valid_targets_mean": 8555.7,
"valid_targets_min": 2332
},
{
"epoch": 4.84672,
"grad_norm": 0.12302925116599557,
"learning_rate": 1.1624382247702681e-07,
"loss": 0.0467,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.014546379446983337,
"step": 5050,
"valid_targets_mean": 9193.9,
"valid_targets_min": 2994
},
{
"epoch": 4.85152,
"grad_norm": 0.12049454142383617,
"learning_rate": 1.0914229499748186e-07,
"loss": 0.0461,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.01593470387160778,
"step": 5055,
"valid_targets_mean": 7931.0,
"valid_targets_min": 2226
},
{
"epoch": 4.85632,
"grad_norm": 0.12255879374376923,
"learning_rate": 1.0226398715259322e-07,
"loss": 0.0431,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.014736687764525414,
"step": 5060,
"valid_targets_mean": 9324.5,
"valid_targets_min": 2369
},
{
"epoch": 4.86112,
"grad_norm": 0.11765425870521874,
"learning_rate": 9.560897613226205e-08,
"loss": 0.0467,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.013002576306462288,
"step": 5065,
"valid_targets_mean": 8633.2,
"valid_targets_min": 3927
},
{
"epoch": 4.86592,
"grad_norm": 0.1274053457419819,
"learning_rate": 8.917733662050287e-08,
"loss": 0.0451,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.016446460038423538,
"step": 5070,
"valid_targets_mean": 9135.6,
"valid_targets_min": 4543
},
{
"epoch": 4.87072,
"grad_norm": 0.1278704051137457,
"learning_rate": 8.296914079461094e-08,
"loss": 0.0453,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.018057048320770264,
"step": 5075,
"valid_targets_mean": 8849.5,
"valid_targets_min": 2853
},
{
"epoch": 4.87552,
"grad_norm": 0.129798463098386,
"learning_rate": 7.698445832433843e-08,
"loss": 0.0475,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.01605452410876751,
"step": 5080,
"valid_targets_mean": 9165.0,
"valid_targets_min": 4097
},
{
"epoch": 4.88032,
"grad_norm": 0.12709516254412107,
"learning_rate": 7.122335637112621e-08,
"loss": 0.0465,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.017007878050208092,
"step": 5085,
"valid_targets_mean": 8871.7,
"valid_targets_min": 4935
},
{
"epoch": 4.88512,
"grad_norm": 0.12614752472781804,
"learning_rate": 6.568589958734218e-08,
"loss": 0.0467,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.015092524699866772,
"step": 5090,
"valid_targets_mean": 8470.4,
"valid_targets_min": 3363
},
{
"epoch": 4.88992,
"grad_norm": 0.1923253876332768,
"learning_rate": 6.037215011556185e-08,
"loss": 0.0454,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.017001967877149582,
"step": 5095,
"valid_targets_mean": 8674.8,
"valid_targets_min": 2585
},
{
"epoch": 4.8947199999999995,
"grad_norm": 0.11983896174408,
"learning_rate": 5.5282167587862314e-08,
"loss": 0.0454,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.01640951633453369,
"step": 5100,
"valid_targets_mean": 8320.3,
"valid_targets_min": 802
},
{
"epoch": 4.89952,
"grad_norm": 0.1245498830155723,
"learning_rate": 5.041600912516264e-08,
"loss": 0.0499,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.016499202698469162,
"step": 5105,
"valid_targets_mean": 8774.8,
"valid_targets_min": 1804
},
{
"epoch": 4.90432,
"grad_norm": 0.12071257658116219,
"learning_rate": 4.5773729336577865e-08,
"loss": 0.0464,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.01530368346720934,
"step": 5110,
"valid_targets_mean": 8999.9,
"valid_targets_min": 3408
},
{
"epoch": 4.90912,
"grad_norm": 0.12289113526900305,
"learning_rate": 4.1355380318803816e-08,
"loss": 0.0473,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.014382155612111092,
"step": 5115,
"valid_targets_mean": 7970.6,
"valid_targets_min": 1619
},
{
"epoch": 4.91392,
"grad_norm": 0.12271587443432708,
"learning_rate": 3.7161011655535425e-08,
"loss": 0.0489,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.01587647944688797,
"step": 5120,
"valid_targets_mean": 8968.0,
"valid_targets_min": 1910
},
{
"epoch": 4.91872,
"grad_norm": 0.11789556004029846,
"learning_rate": 3.319067041691604e-08,
"loss": 0.0458,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.014570049941539764,
"step": 5125,
"valid_targets_mean": 8545.9,
"valid_targets_min": 1723
},
{
"epoch": 4.92352,
"grad_norm": 0.11863148816376579,
"learning_rate": 2.9444401158995606e-08,
"loss": 0.046,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.014068776741623878,
"step": 5130,
"valid_targets_mean": 9208.9,
"valid_targets_min": 2341
},
{
"epoch": 4.92832,
"grad_norm": 0.1393289097006946,
"learning_rate": 2.5922245923244436e-08,
"loss": 0.0451,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.01812027022242546,
"step": 5135,
"valid_targets_mean": 8554.4,
"valid_targets_min": 2437
},
{
"epoch": 4.93312,
"grad_norm": 0.12652127402167426,
"learning_rate": 2.2624244236071348e-08,
"loss": 0.045,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.01672193594276905,
"step": 5140,
"valid_targets_mean": 8582.4,
"valid_targets_min": 2277
},
{
"epoch": 4.93792,
"grad_norm": 0.12288190891498557,
"learning_rate": 1.9550433108384005e-08,
"loss": 0.0462,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.014536580070853233,
"step": 5145,
"valid_targets_mean": 8607.1,
"valid_targets_min": 2724
},
{
"epoch": 4.94272,
"grad_norm": 0.12214205725983128,
"learning_rate": 1.6700847035180378e-08,
"loss": 0.0455,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.014544010162353516,
"step": 5150,
"valid_targets_mean": 8026.7,
"valid_targets_min": 3201
},
{
"epoch": 4.94752,
"grad_norm": 0.12608336933895256,
"learning_rate": 1.4075517995146837e-08,
"loss": 0.0441,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.015675101429224014,
"step": 5155,
"valid_targets_mean": 8635.8,
"valid_targets_min": 3217
},
{
"epoch": 4.95232,
"grad_norm": 0.1225680672115912,
"learning_rate": 1.167447545031175e-08,
"loss": 0.0451,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.016280420124530792,
"step": 5160,
"valid_targets_mean": 8837.4,
"valid_targets_min": 3252
},
{
"epoch": 4.95712,
"grad_norm": 0.12286400688787606,
"learning_rate": 9.497746345705772e-09,
"loss": 0.044,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.015019871294498444,
"step": 5165,
"valid_targets_mean": 9391.8,
"valid_targets_min": 4096
},
{
"epoch": 4.96192,
"grad_norm": 0.12859491123299127,
"learning_rate": 7.545355109073172e-09,
"loss": 0.0494,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.019673161208629608,
"step": 5170,
"valid_targets_mean": 9072.6,
"valid_targets_min": 3816
},
{
"epoch": 4.9667200000000005,
"grad_norm": 0.1244229546631015,
"learning_rate": 5.817323650578743e-09,
"loss": 0.0463,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.014512769877910614,
"step": 5175,
"valid_targets_mean": 8819.8,
"valid_targets_min": 2984
},
{
"epoch": 4.97152,
"grad_norm": 0.1281022316707428,
"learning_rate": 4.313671362576877e-09,
"loss": 0.0445,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.014761531725525856,
"step": 5180,
"valid_targets_mean": 7589.6,
"valid_targets_min": 2654
},
{
"epoch": 4.97632,
"grad_norm": 0.12672023643063166,
"learning_rate": 3.0344151193917316e-09,
"loss": 0.0466,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.017525404691696167,
"step": 5185,
"valid_targets_mean": 9014.8,
"valid_targets_min": 3080
},
{
"epoch": 4.98112,
"grad_norm": 0.12136843073730945,
"learning_rate": 1.979569277117399e-09,
"loss": 0.0457,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.014057071879506111,
"step": 5190,
"valid_targets_mean": 8457.4,
"valid_targets_min": 3076
},
{
"epoch": 4.98592,
"grad_norm": 0.12994809873959323,
"learning_rate": 1.1491456734713524e-09,
"loss": 0.0477,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.015671029686927795,
"step": 5195,
"valid_targets_mean": 7887.4,
"valid_targets_min": 3187
},
{
"epoch": 4.99072,
"grad_norm": 0.1298460048267671,
"learning_rate": 5.431536276523375e-10,
"loss": 0.0449,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.015169478952884674,
"step": 5200,
"valid_targets_mean": 8369.0,
"valid_targets_min": 2163
},
{
"epoch": 4.99552,
"grad_norm": 0.12910354490109707,
"learning_rate": 1.6159994023601245e-10,
"loss": 0.0467,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.016222694888710976,
"step": 5205,
"valid_targets_mean": 8800.3,
"valid_targets_min": 3409
},
{
"epoch": 5.0,
"grad_norm": 0.147008087077442,
"learning_rate": 4.488893106113779e-12,
"loss": 0.0436,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.018921401351690292,
"step": 5210,
"valid_targets_mean": 8871.3,
"valid_targets_min": 2185
},
{
"epoch": 5.0,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.018921401351690292,
"step": 5210,
"total_flos": 3.8872733453226344e+19,
"train_loss": 0.0035894543761941615,
"train_runtime": 12426.1828,
"train_samples_per_second": 40.238,
"train_steps_per_second": 0.419,
"valid_targets_mean": 8871.3,
"valid_targets_min": 2185
}
],
"logging_steps": 5,
"max_steps": 5210,
"num_input_tokens_seen": 0,
"num_train_epochs": 5,
"save_steps": 300,
"stateful_callbacks": {
"TrainerControl": {
"args": {
"should_epoch_stop": false,
"should_evaluate": false,
"should_log": false,
"should_save": true,
"should_training_stop": true
},
"attributes": {}
}
},
"total_flos": 3.8872733453226344e+19,
"train_batch_size": 1,
"trial_name": null,
"trial_params": null
}